-
Notifications
You must be signed in to change notification settings - Fork 2
/
Copy pathtokens.c
2598 lines (2463 loc) · 102 KB
/
tokens.c
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
714
715
716
717
718
719
720
721
722
723
724
725
726
727
728
729
730
731
732
733
734
735
736
737
738
739
740
741
742
743
744
745
746
747
748
749
750
751
752
753
754
755
756
757
758
759
760
761
762
763
764
765
766
767
768
769
770
771
772
773
774
775
776
777
778
779
780
781
782
783
784
785
786
787
788
789
790
791
792
793
794
795
796
797
798
799
800
801
802
803
804
805
806
807
808
809
810
811
812
813
814
815
816
817
818
819
820
821
822
823
824
825
826
827
828
829
830
831
832
833
834
835
836
837
838
839
840
841
842
843
844
845
846
847
848
849
850
851
852
853
854
855
856
857
858
859
860
861
862
863
864
865
866
867
868
869
870
871
872
873
874
875
876
877
878
879
880
881
882
883
884
885
886
887
888
889
890
891
892
893
894
895
896
897
898
899
900
901
902
903
904
905
906
907
908
909
910
911
912
913
914
915
916
917
918
919
920
921
922
923
924
925
926
927
928
929
930
931
932
933
934
935
936
937
938
939
940
941
942
943
944
945
946
947
948
949
950
951
952
953
954
955
956
957
958
959
960
961
962
963
964
965
966
967
968
969
970
971
972
973
974
975
976
977
978
979
980
981
982
983
984
985
986
987
988
989
990
991
992
993
994
995
996
997
998
999
1000
/*
** This file is part of the Matrix Brandy Basic VI Interpreter.
** Copyright (C) 2000-2014 David Daniels
** Copyright (C) 2018-2024 Michael McConnell and contributors
**
** Brandy is free software; you can redistribute it and/or modify
** it under the terms of the GNU General Public License as published by
** the Free Software Foundation; either version 2, or (at your option)
** any later version.
**
** Brandy is distributed in the hope that it will be useful,
** but WITHOUT ANY WARRANTY; without even the implied warranty of
** MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
** GNU General Public License for more details.
**
** You should have received a copy of the GNU General Public License
** along with Brandy; see the file COPYING. If not, write to
** the Free Software Foundation, 59 Temple Place - Suite 330,
** Boston, MA 02111-1307, USA.
**
**
** This module contains the tokenisation routines and functions for
** manipulating pointers and offsets found in the tokenised form of the
** Basic program.
*/
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <math.h>
#include <ctype.h>
#include "common.h"
#include "target.h"
#include "basicdefs.h"
#include "tokens.h"
#include "miscprocs.h"
#include "convert.h"
#include "errors.h"
/*
** The format of a tokenised line is as follows:
**
** <line number>
** <line length>
** <offset of first executable token>
** <copy of source>
** <NUL>
** <executable tokens>
** <NUL>
**
** The line number, line length and offset are all two bytes long.
** The line length is that of the whole line, from the first byte of
** line number to the NUL at the end of the line.
** The offset gives the byte offset from the first byte of the line
** number to the first executable token.
** The original source of the line is held in a slightly compressed
** form. Keywords are replaced by tokens and some extra tokens added
** as markers to note the position of variable names.
** The executable tokens are what the interpreter executes. The line
** is compressed as much as possible. Variables are represented by
** pointers. Initially these give the offset of the variable name in
** the source part of the line from the current location in the
** executable part of it but they are replaced with pointers to the
** variable's symbol entry when the program is running. Numbers are
** converted to their binary form. Offsets are added after tokens
** such as 'ELSE' where a branch occurs that give the offset of branch
** destination. These are filled in when the program runs. A similar
** idea is used to deal with line number references in, for example,
** GOTO statements. Initially the GOTO token is followed by the number
** of the destination line but this is changed to the address of that
** line when the program is run.
** When a program is edited or is run afresh, many or all of the
** offsets and pointers have to be restored to their original state.
** This is where the marker tokens in the source part of the line
** are used. The code scans through the executable tokens and when
** it comes across an entry that has to be changed it looks for the
** corresponding marker token and updates the executable token
** accordingly. References to line numbers in, for example, GOTO
** statements, are handled slightly differently in that the code uses
** the pointer to fetch the number of the line from the start of the
** referenced line and replaces the pointer with that. When a program
** is run afresh or the 'CLEAR' statement is encountered, all pointers
** to variables are reset as the symbol table is destroyed. Branch
** offsets and line number references are left alone. If the program
** is edited then everything is reset.
*/
#define INDENTSIZE 2
#define MAXKWLEN 10
#define NOKEYWORD 255
/*
** 'thisline' contains the tokenised version of the line
** read from the keyboard. The +8 is to allow the end marker
** to be added safely when the line is executed
*/
byte thisline[MAXSTATELEN + 8];
/*
** 'tokenbase' points at the start of the buffer in which
** the tokenised version of the line is stored. The 'store'
** functions in this file write into this buffer at index 'next'
*/
static byte *tokenbase;
/*
** 'token' describes one entry in the keyword table 'tokens'. The table
** is filled in with positional initialisers, so the order of the fields
** below must match the order of the values in each table entry
*/
typedef struct {
char *name; /* Name of token */
int length; /* Length of token's name */
int minlength; /* Minimum no. of chars for keyword to be recognised */
byte lhtype; /* Type of token if at start of statement */
byte lhvalue; /* Token's value if at start of statement */
byte type; /* Type of token if elsewhere in statement */
byte value; /* Token's value if elsewhere in statement */
boolean alone; /* TRUE if token is not a token if followed by letter */
boolean linefollow; /* TRUE if the token can be followed by a line number */
} token;
/*
** The token table is split into two parts, the first containing all the
** normal Basic keywords, function names and so forth and the second one
** the Basic commands. These appear separately as they can be entered in
** mixed case whereas the rest have to be in upper case.
**
** The numbers in the comments at the end of some entries give the index
** of that entry in the table. The tables 'start_letter' and
** 'command_start' hold indexes into this table, so they have to be
** updated if entries are added, removed or moved.
**
** Where one keyword is a prefix of another, the longer keyword is listed
** first, for example, BEATS comes before BEAT and ENDWHILE before END.
*/
static token tokens [] = {
{"ABS", 3, 2, TYPE_FUNCTION, BASTOKEN_ABS, TYPE_FUNCTION, BASTOKEN_ABS, FALSE, FALSE}, /* 0 */
{"ACS", 3, 2, TYPE_FUNCTION, BASTOKEN_ACS, TYPE_FUNCTION, BASTOKEN_ACS, FALSE, FALSE},
{"ADVAL", 5, 2, TYPE_FUNCTION, BASTOKEN_ADVAL, TYPE_FUNCTION, BASTOKEN_ADVAL, FALSE, FALSE},
{"AND", 3, 1, TYPE_ONEBYTE, BASTOKEN_AND, TYPE_ONEBYTE, BASTOKEN_AND, FALSE, FALSE},
{"ARGC", 4, 4, TYPE_FUNCTION, BASTOKEN_ARGC, TYPE_FUNCTION, BASTOKEN_ARGC, FALSE, FALSE},
{"ARGV$", 5, 5, TYPE_FUNCTION, BASTOKEN_ARGVDOL, TYPE_FUNCTION, BASTOKEN_ARGVDOL, FALSE, FALSE},
{"ASC", 3, 2, TYPE_FUNCTION, BASTOKEN_ASC, TYPE_FUNCTION, BASTOKEN_ASC, FALSE, FALSE},
{"ASN", 3, 3, TYPE_FUNCTION, BASTOKEN_ASN, TYPE_FUNCTION, BASTOKEN_ASN, FALSE, FALSE},
{"ATN", 3, 2, TYPE_FUNCTION, BASTOKEN_ATN, TYPE_FUNCTION, BASTOKEN_ATN, FALSE, FALSE},
{"BEATS", 5, 2, TYPE_ONEBYTE, BASTOKEN_BEATS, TYPE_ONEBYTE, BASTOKEN_BEATS, FALSE, FALSE}, /* 9 */
{"BEAT", 4, 4, TYPE_FUNCTION, BASTOKEN_BEAT, TYPE_FUNCTION, BASTOKEN_BEAT, FALSE, FALSE},
{"BGET", 4, 1, TYPE_FUNCTION, BASTOKEN_BGET, TYPE_FUNCTION, BASTOKEN_BGET, TRUE, FALSE},
{"BPUT", 4, 2, TYPE_ONEBYTE, BASTOKEN_BPUT, TYPE_ONEBYTE, BASTOKEN_BPUT, TRUE, FALSE},
{"BY", 2, 2, TYPE_ONEBYTE, BASTOKEN_BY, TYPE_ONEBYTE, BASTOKEN_BY, FALSE, FALSE},
{"CALL", 4, 2, TYPE_ONEBYTE, BASTOKEN_CALL, TYPE_ONEBYTE, BASTOKEN_CALL, FALSE, FALSE}, /* 14 */
{"CASE", 4, 3, TYPE_ONEBYTE, BASTOKEN_XCASE, TYPE_ONEBYTE, BASTOKEN_XCASE, FALSE, FALSE},
{"CHAIN", 5, 2, TYPE_ONEBYTE, BASTOKEN_CHAIN, TYPE_ONEBYTE, BASTOKEN_CHAIN, FALSE, FALSE},
{"CHR$", 4, 4, TYPE_FUNCTION, BASTOKEN_CHR, TYPE_FUNCTION, BASTOKEN_CHR, FALSE, FALSE},
{"CIRCLE", 6, 2, TYPE_ONEBYTE, BASTOKEN_CIRCLE, TYPE_ONEBYTE, BASTOKEN_CIRCLE, FALSE, FALSE},
{"CLEAR", 5, 2, TYPE_ONEBYTE, BASTOKEN_CLEAR, TYPE_ONEBYTE, BASTOKEN_CLEAR, TRUE, FALSE},
{"CLOSE", 5, 3, TYPE_ONEBYTE, BASTOKEN_CLOSE, TYPE_ONEBYTE, BASTOKEN_CLOSE, TRUE, FALSE},
{"CLG", 3, 3, TYPE_ONEBYTE, BASTOKEN_CLG, TYPE_ONEBYTE, BASTOKEN_CLG, TRUE, FALSE},
{"CLS", 3, 3, TYPE_ONEBYTE, BASTOKEN_CLS, TYPE_ONEBYTE, BASTOKEN_CLS, TRUE, FALSE},
{"COLOR", 5, 1, TYPE_ONEBYTE, BASTOKEN_COLOUR, TYPE_ONEBYTE, BASTOKEN_COLOUR, FALSE, FALSE}, /* 23 */
{"COLOUR", 6, 1, TYPE_ONEBYTE, BASTOKEN_COLOUR, TYPE_ONEBYTE, BASTOKEN_COLOUR, FALSE, FALSE},
{"COS", 3, 3, TYPE_FUNCTION, BASTOKEN_COS, TYPE_FUNCTION, BASTOKEN_COS, FALSE, FALSE},
{"COUNT", 5, 3, TYPE_FUNCTION, BASTOKEN_COUNT, TYPE_FUNCTION, BASTOKEN_COUNT, TRUE, FALSE},
{"DATA", 4, 1, TYPE_ONEBYTE, BASTOKEN_DATA, TYPE_ONEBYTE, BASTOKEN_DATA, FALSE, FALSE}, /* 27 */
{"DEF", 3, 3, TYPE_ONEBYTE, BASTOKEN_DEF, TYPE_ONEBYTE, BASTOKEN_DEF, FALSE, FALSE},
{"DEG", 3, 2, TYPE_FUNCTION, BASTOKEN_DEG, TYPE_FUNCTION, BASTOKEN_DEG, FALSE, FALSE},
{"DIM", 3, 3, TYPE_ONEBYTE, BASTOKEN_DIM, TYPE_ONEBYTE, BASTOKEN_DIM, FALSE, FALSE},
{"DIV", 3, 2, TYPE_ONEBYTE, BASTOKEN_DIV, TYPE_ONEBYTE, BASTOKEN_DIV, FALSE, FALSE},
{"DRAW", 4, 2, TYPE_ONEBYTE, BASTOKEN_DRAW, TYPE_ONEBYTE, BASTOKEN_DRAW, FALSE, FALSE},
{"ELLIPSE", 7, 3, TYPE_ONEBYTE, BASTOKEN_ELLIPSE, TYPE_ONEBYTE, BASTOKEN_ELLIPSE, FALSE, FALSE}, /* 33 */
{"ELSE", 4, 2, TYPE_ONEBYTE, BASTOKEN_XELSE, TYPE_ONEBYTE, BASTOKEN_XELSE, FALSE, TRUE},
{"ENDCASE", 7, 4, TYPE_ONEBYTE, BASTOKEN_ENDCASE, TYPE_ONEBYTE, BASTOKEN_ENDCASE, TRUE, FALSE},
{"ENDIF", 5, 4, TYPE_ONEBYTE, BASTOKEN_ENDIF, TYPE_ONEBYTE, BASTOKEN_ENDIF, TRUE, FALSE},
{"ENDPROC", 7, 1, TYPE_ONEBYTE, BASTOKEN_ENDPROC, TYPE_ONEBYTE, BASTOKEN_ENDPROC, TRUE, FALSE},
{"ENDWHILE", 8, 4, TYPE_ONEBYTE, BASTOKEN_ENDWHILE, TYPE_ONEBYTE, BASTOKEN_ENDWHILE, TRUE, FALSE}, /* 38 */
{"END", 3, 3, TYPE_ONEBYTE, BASTOKEN_END, TYPE_ONEBYTE, BASTOKEN_END, TRUE, FALSE},
{"ENVELOPE", 8, 3, TYPE_ONEBYTE, BASTOKEN_ENVELOPE, TYPE_ONEBYTE, BASTOKEN_ENVELOPE, FALSE, FALSE},
{"EOF", 3, 3, TYPE_FUNCTION, BASTOKEN_EOF, TYPE_FUNCTION, BASTOKEN_EOF, TRUE, FALSE},
{"EOR", 3, 3, TYPE_ONEBYTE, BASTOKEN_EOR, TYPE_ONEBYTE, BASTOKEN_EOR, FALSE, FALSE},
{"ERL", 3, 3, TYPE_FUNCTION, BASTOKEN_ERL, TYPE_FUNCTION, BASTOKEN_ERL, TRUE, FALSE}, /* 43 */
{"ERROR", 5, 3, TYPE_ONEBYTE, BASTOKEN_ERROR, TYPE_ONEBYTE, BASTOKEN_ERROR, FALSE, FALSE},
{"ERR", 3, 3, TYPE_FUNCTION, BASTOKEN_ERR, TYPE_FUNCTION, BASTOKEN_ERR, TRUE, FALSE},
{"EVAL", 4, 2, TYPE_FUNCTION, BASTOKEN_EVAL, TYPE_FUNCTION, BASTOKEN_EVAL, FALSE, FALSE},
{"EXIT", 4, 3, TYPE_ONEBYTE, BASTOKEN_EXIT, TYPE_ONEBYTE, BASTOKEN_EXIT, FALSE, FALSE}, /* 47 */
{"EXP", 3, 3, TYPE_FUNCTION, BASTOKEN_EXP, TYPE_FUNCTION, BASTOKEN_EXP, FALSE, FALSE},
{"EXT", 3, 3, TYPE_FUNCTION, BASTOKEN_EXT, TYPE_FUNCTION, BASTOKEN_EXT, TRUE, FALSE},
{"FALSE", 5, 2, TYPE_ONEBYTE, BASTOKEN_FALSE, TYPE_ONEBYTE, BASTOKEN_FALSE, TRUE, FALSE}, /* 50 */
{"FILEPATH$", 9, 4, TYPE_FUNCTION, BASTOKEN_FILEPATH, TYPE_FUNCTION, BASTOKEN_FILEPATH, FALSE, FALSE},
{"FILL", 4, 2, TYPE_ONEBYTE, BASTOKEN_FILL, TYPE_ONEBYTE, BASTOKEN_FILL, FALSE, FALSE},
{"FN", 2, 2, TYPE_ONEBYTE, BASTOKEN_FN, TYPE_ONEBYTE, BASTOKEN_FN, FALSE, FALSE},
{"FOR", 3, 1, TYPE_ONEBYTE, BASTOKEN_FOR, TYPE_ONEBYTE, BASTOKEN_FOR, FALSE, FALSE},
{"GCOL", 4, 2, TYPE_ONEBYTE, BASTOKEN_GCOL, TYPE_ONEBYTE, BASTOKEN_GCOL, FALSE, FALSE}, /* 55 */
{"GET$", 4, 2, TYPE_FUNCTION, BASTOKEN_GETDOL, TYPE_FUNCTION, BASTOKEN_GETDOL, FALSE, FALSE},
{"GET", 3, 3, TYPE_FUNCTION, BASTOKEN_GET, TYPE_FUNCTION, BASTOKEN_GET, FALSE, FALSE},
{"GOSUB", 5, 3, TYPE_ONEBYTE, BASTOKEN_GOSUB, TYPE_ONEBYTE, BASTOKEN_GOSUB, FALSE, TRUE},
{"GOTO", 4, 1, TYPE_ONEBYTE, BASTOKEN_GOTO, TYPE_ONEBYTE, BASTOKEN_GOTO, FALSE, TRUE},
{"HIMEM", 5, 1, TYPE_FUNCTION, BASTOKEN_HIMEM, TYPE_FUNCTION, BASTOKEN_HIMEM, TRUE, FALSE}, /* 60 */
{"IF", 2, 2, TYPE_ONEBYTE, BASTOKEN_XIF, TYPE_ONEBYTE, BASTOKEN_XIF, FALSE, FALSE}, /* 61 */
{"INKEY$", 6, 3, TYPE_FUNCTION, BASTOKEN_INKEYDOL, TYPE_FUNCTION, BASTOKEN_INKEYDOL, FALSE, FALSE},
{"INKEY", 5, 5, TYPE_FUNCTION, BASTOKEN_INKEY, TYPE_FUNCTION, BASTOKEN_INKEY, FALSE, FALSE},
{"INPUT", 5, 1, TYPE_ONEBYTE, BASTOKEN_INPUT, TYPE_ONEBYTE, BASTOKEN_INPUT, FALSE, FALSE},
{"INSTR(", 6, 3, TYPE_FUNCTION, BASTOKEN_INSTR, TYPE_FUNCTION, BASTOKEN_INSTR, FALSE, FALSE},
{"INT", 3, 3, TYPE_FUNCTION, BASTOKEN_INT, TYPE_FUNCTION, BASTOKEN_INT, FALSE, FALSE},
{"LEFT$(", 6, 2, TYPE_FUNCTION, BASTOKEN_LEFT, TYPE_FUNCTION, BASTOKEN_LEFT, FALSE, FALSE}, /* 67 */
{"LEN", 3, 3, TYPE_FUNCTION, BASTOKEN_LEN, TYPE_FUNCTION, BASTOKEN_LEN, FALSE, FALSE},
{"LET", 3, 3, TYPE_ONEBYTE, BASTOKEN_LET, TYPE_ONEBYTE, BASTOKEN_LET, FALSE, FALSE},
{"LIBRARY", 7, 3, TYPE_ONEBYTE, BASTOKEN_LIBRARY, TYPE_ONEBYTE, BASTOKEN_LIBRARY, FALSE, FALSE}, /* 70 */
{"LINE", 4, 3, TYPE_ONEBYTE, BASTOKEN_LINE, TYPE_ONEBYTE, BASTOKEN_LINE, FALSE, FALSE},
{"LN", 2, 2, TYPE_FUNCTION, BASTOKEN_LN, TYPE_FUNCTION, BASTOKEN_LN, FALSE, FALSE},
{"LOCAL", 5, 3, TYPE_ONEBYTE, BASTOKEN_LOCAL, TYPE_ONEBYTE, BASTOKEN_LOCAL, FALSE, FALSE},
{"LOG", 3, 3, TYPE_FUNCTION, BASTOKEN_LOG, TYPE_FUNCTION, BASTOKEN_LOG, FALSE, FALSE},
{"LOMEM", 5, 3, TYPE_FUNCTION, BASTOKEN_LOMEM, TYPE_FUNCTION, BASTOKEN_LOMEM, TRUE, FALSE},
{"MID$(", 5, 1, TYPE_FUNCTION, BASTOKEN_MID, TYPE_FUNCTION, BASTOKEN_MID, FALSE, FALSE}, /* 76 */
{"MODE", 4, 2, TYPE_ONEBYTE, BASTOKEN_MODE, TYPE_ONEBYTE, BASTOKEN_MODE, FALSE, FALSE},
{"MOD", 3, 3, TYPE_ONEBYTE, BASTOKEN_MOD, TYPE_ONEBYTE, BASTOKEN_MOD, FALSE, FALSE},
{"MOUSE", 5, 3, TYPE_ONEBYTE, BASTOKEN_MOUSE, TYPE_ONEBYTE, BASTOKEN_MOUSE, FALSE, FALSE},
{"MOVE", 4, 3, TYPE_ONEBYTE, BASTOKEN_MOVE, TYPE_ONEBYTE, BASTOKEN_MOVE, FALSE, FALSE},
{"NEXT", 4, 1, TYPE_ONEBYTE, BASTOKEN_NEXT, TYPE_ONEBYTE, BASTOKEN_NEXT, FALSE, FALSE}, /* 81 */
{"NOT", 3, 3, TYPE_ONEBYTE, BASTOKEN_NOT, TYPE_ONEBYTE, BASTOKEN_NOT, FALSE, FALSE},
{"OFF", 3, 3, TYPE_ONEBYTE, BASTOKEN_OFF, TYPE_ONEBYTE, BASTOKEN_OFF, FALSE, FALSE}, /* 83 */
{"OF", 2, 2, TYPE_ONEBYTE, BASTOKEN_OF, TYPE_ONEBYTE, BASTOKEN_OF, FALSE, FALSE},
{"ON", 2, 2, TYPE_ONEBYTE, BASTOKEN_ON, TYPE_ONEBYTE, BASTOKEN_ON, FALSE, FALSE}, /* 85 */
{"OPENIN", 6, 2, TYPE_FUNCTION, BASTOKEN_OPENIN, TYPE_FUNCTION, BASTOKEN_OPENIN, FALSE, FALSE},
{"OPENOUT", 7, 5, TYPE_FUNCTION, BASTOKEN_OPENOUT, TYPE_FUNCTION, BASTOKEN_OPENOUT, FALSE, FALSE},
{"OPENUP", 6, 5, TYPE_FUNCTION, BASTOKEN_OPENUP, TYPE_FUNCTION, BASTOKEN_OPENUP, FALSE, FALSE},
{"ORIGIN", 6, 2, TYPE_ONEBYTE, BASTOKEN_ORIGIN, TYPE_ONEBYTE, BASTOKEN_ORIGIN, FALSE, FALSE},
{"OR", 2, 2, TYPE_ONEBYTE, BASTOKEN_OR, TYPE_ONEBYTE, BASTOKEN_OR, FALSE, FALSE}, /* 90 */
{"OSCLI", 5, 2, TYPE_ONEBYTE, BASTOKEN_OSCLI, TYPE_ONEBYTE, BASTOKEN_OSCLI, FALSE, FALSE},
{"OTHERWISE", 9, 2, TYPE_ONEBYTE, BASTOKEN_XOTHERWISE, TYPE_ONEBYTE, BASTOKEN_XOTHERWISE, FALSE, FALSE},
{"OVERLAY", 7, 2, TYPE_ONEBYTE, BASTOKEN_OVERLAY, TYPE_ONEBYTE, BASTOKEN_OVERLAY, FALSE, FALSE},
{"PAGE", 4, 2, TYPE_FUNCTION, BASTOKEN_PAGE, TYPE_FUNCTION, BASTOKEN_PAGE, TRUE, FALSE}, /* 94 */
{"PI", 2, 2, TYPE_FUNCTION, BASTOKEN_PI, TYPE_FUNCTION, BASTOKEN_PI, TRUE, FALSE},
{"PLOT", 4, 2, TYPE_ONEBYTE, BASTOKEN_PLOT, TYPE_ONEBYTE, BASTOKEN_PLOT, FALSE, FALSE},
{"POINT(", 6, 2, TYPE_FUNCTION, BASTOKEN_POINTFN, TYPE_FUNCTION, BASTOKEN_POINTFN, FALSE, FALSE},
{"POINT", 5, 5, TYPE_ONEBYTE, BASTOKEN_POINT, TYPE_ONEBYTE, BASTOKEN_POINT, FALSE, FALSE},
{"POS", 3, 3, TYPE_FUNCTION, BASTOKEN_POS, TYPE_FUNCTION, BASTOKEN_POS, TRUE, FALSE},
{"PRINT", 5, 1, TYPE_ONEBYTE, BASTOKEN_PRINT, TYPE_ONEBYTE, BASTOKEN_PRINT, FALSE, FALSE}, /* 100 */
{"PROC", 4, 4, TYPE_ONEBYTE, BASTOKEN_PROC, TYPE_ONEBYTE, BASTOKEN_PROC, FALSE, FALSE},
{"PTR", 3, 3, TYPE_FUNCTION, BASTOKEN_PTR, TYPE_FUNCTION, BASTOKEN_PTR, TRUE, FALSE},
{"QUIT", 4, 1, TYPE_ONEBYTE, BASTOKEN_QUIT, TYPE_ONEBYTE, BASTOKEN_QUIT, TRUE, FALSE}, /* 103 */
{"RAD", 3, 2, TYPE_FUNCTION, BASTOKEN_RAD, TYPE_FUNCTION, BASTOKEN_RAD, FALSE, FALSE}, /* 104 */
{"READ", 4, 3, TYPE_ONEBYTE, BASTOKEN_READ, TYPE_ONEBYTE, BASTOKEN_READ, FALSE, FALSE},
{"RECTANGLE", 9, 3, TYPE_ONEBYTE, BASTOKEN_RECTANGLE, TYPE_ONEBYTE, BASTOKEN_RECTANGLE, FALSE, FALSE},
{"REM", 3, 3, TYPE_ONEBYTE, BASTOKEN_REM, TYPE_ONEBYTE, BASTOKEN_REM, FALSE, FALSE},
{"REPEAT", 6, 3, TYPE_ONEBYTE, BASTOKEN_REPEAT, TYPE_ONEBYTE, BASTOKEN_REPEAT, FALSE, FALSE},
{"REPORT$", 7, 7, TYPE_FUNCTION, BASTOKEN_REPORTDOL, TYPE_FUNCTION, BASTOKEN_REPORTDOL, FALSE, FALSE},
{"REPORT", 6, 4, TYPE_ONEBYTE, BASTOKEN_REPORT, TYPE_ONEBYTE, BASTOKEN_REPORT, TRUE, FALSE}, /* 110 */
{"RESTORE", 7, 3, TYPE_ONEBYTE, BASTOKEN_RESTORE, TYPE_ONEBYTE, BASTOKEN_RESTORE, FALSE, TRUE},
{"RETURN", 6, 1, TYPE_ONEBYTE, BASTOKEN_RETURN, TYPE_ONEBYTE, BASTOKEN_RETURN, TRUE, FALSE},
{"RIGHT$(", 7, 2, TYPE_FUNCTION, BASTOKEN_RIGHT, TYPE_FUNCTION, BASTOKEN_RIGHT, FALSE, FALSE},
{"RND(", 4, 4, TYPE_FUNCTION, BASTOKEN_RNDPAR, TYPE_FUNCTION, BASTOKEN_RNDPAR, FALSE, FALSE},
{"RND", 3, 2, TYPE_FUNCTION, BASTOKEN_RND, TYPE_FUNCTION, BASTOKEN_RND, TRUE, FALSE},
{"RUN", 3, 2, TYPE_ONEBYTE, BASTOKEN_RUN, TYPE_ONEBYTE, BASTOKEN_RUN, TRUE, FALSE},
{"SGN", 3, 2, TYPE_FUNCTION, BASTOKEN_SGN, TYPE_FUNCTION, BASTOKEN_SGN, FALSE, FALSE}, /* 117 */
{"SIN", 3, 2, TYPE_FUNCTION, BASTOKEN_SIN, TYPE_FUNCTION, BASTOKEN_SIN, FALSE, FALSE},
{"SOUND", 5, 2, TYPE_ONEBYTE, BASTOKEN_SOUND, TYPE_ONEBYTE, BASTOKEN_SOUND, FALSE, FALSE},
{"SPC", 3, 3, TYPE_PRINTFN, BASTOKEN_SPC, TYPE_PRINTFN, BASTOKEN_SPC, FALSE, FALSE},
{"SQR", 3, 3, TYPE_FUNCTION, BASTOKEN_SQR, TYPE_FUNCTION, BASTOKEN_SQR, FALSE, FALSE}, /* 121 */
{"STEP", 4, 1, TYPE_ONEBYTE, BASTOKEN_STEP, TYPE_ONEBYTE, BASTOKEN_STEP, FALSE, FALSE},
{"STEREO", 6, 4, TYPE_ONEBYTE, BASTOKEN_STEREO, TYPE_ONEBYTE, BASTOKEN_STEREO, FALSE, FALSE},
{"STOP", 4, 3, TYPE_ONEBYTE, BASTOKEN_STOP, TYPE_ONEBYTE, BASTOKEN_STOP, TRUE, FALSE},
{"STR$", 4, 3, TYPE_FUNCTION, BASTOKEN_STR, TYPE_FUNCTION, BASTOKEN_STR, FALSE, FALSE},
{"STRING$(", 8, 4, TYPE_FUNCTION, BASTOKEN_STRING, TYPE_FUNCTION, BASTOKEN_STRING, FALSE, FALSE}, /* 126 */
{"SUM", 3, 2, TYPE_FUNCTION, BASTOKEN_SUM, TYPE_FUNCTION, BASTOKEN_SUM, FALSE, FALSE},
{"SWAP", 4, 2, TYPE_ONEBYTE, BASTOKEN_SWAP, TYPE_ONEBYTE, BASTOKEN_SWAP, FALSE, FALSE},
{"SYS(", 4, 4, TYPE_FUNCTION, BASTOKEN_SYSFN, TYPE_FUNCTION, BASTOKEN_SYSFN, FALSE, FALSE},
{"SYS", 3, 3, TYPE_ONEBYTE, BASTOKEN_SYS, TYPE_ONEBYTE, BASTOKEN_SYS, FALSE, FALSE},
{"TAB(", 4, 4, TYPE_PRINTFN, BASTOKEN_TAB, TYPE_PRINTFN, BASTOKEN_TAB, FALSE, FALSE}, /* 131 */
{"TAN", 3, 1, TYPE_FUNCTION, BASTOKEN_TAN, TYPE_FUNCTION, BASTOKEN_TAN, FALSE, FALSE},
{"TEMPO", 5, 2, TYPE_ONEBYTE, BASTOKEN_TEMPO, TYPE_FUNCTION, BASTOKEN_TEMPOFN, FALSE, FALSE},
{"THEN", 4, 2, TYPE_ONEBYTE, BASTOKEN_THEN, TYPE_ONEBYTE, BASTOKEN_THEN, FALSE, TRUE},
{"TIME", 4, 2, TYPE_FUNCTION, BASTOKEN_TIME, TYPE_FUNCTION, BASTOKEN_TIME, TRUE, FALSE},
{"TINT", 4, 3, TYPE_ONEBYTE, BASTOKEN_TINT, TYPE_ONEBYTE, BASTOKEN_TINT, FALSE, FALSE}, /* 136 */
{"TO", 2, 3, TYPE_ONEBYTE, BASTOKEN_TO, TYPE_ONEBYTE, BASTOKEN_TO, FALSE, FALSE}, /* NOTE(review): minlength (3) is greater than length (2) - confirm this is intentional */
{"TRACE", 5, 2, TYPE_ONEBYTE, BASTOKEN_TRACE, TYPE_ONEBYTE, BASTOKEN_TRACE, FALSE, FALSE},
{"TRUE", 4, 3, TYPE_ONEBYTE, BASTOKEN_TRUE, TYPE_ONEBYTE, BASTOKEN_TRUE, TRUE, FALSE},
{"UNTIL", 5, 1, TYPE_ONEBYTE, BASTOKEN_UNTIL, TYPE_ONEBYTE, BASTOKEN_UNTIL, FALSE, FALSE}, /* 140 */
{"USR", 3, 2, TYPE_FUNCTION, BASTOKEN_USR, TYPE_FUNCTION, BASTOKEN_USR, FALSE, FALSE},
{"VAL", 3, 2, TYPE_FUNCTION, BASTOKEN_VAL, TYPE_FUNCTION, BASTOKEN_VAL, FALSE, FALSE}, /* 142 */
{"VDU", 3, 1, TYPE_ONEBYTE, BASTOKEN_VDU, TYPE_ONEBYTE, BASTOKEN_VDU, FALSE, FALSE},
{"VERIFY(", 7, 2, TYPE_FUNCTION, BASTOKEN_VERIFY, TYPE_FUNCTION, BASTOKEN_VERIFY, FALSE, FALSE},
{"VOICES", 6, 2, TYPE_ONEBYTE, BASTOKEN_VOICES, TYPE_ONEBYTE, BASTOKEN_VOICES, FALSE, FALSE},
{"VOICE", 5, 5, TYPE_ONEBYTE, BASTOKEN_VOICE, TYPE_ONEBYTE, BASTOKEN_VOICE, FALSE, FALSE},
{"VPOS", 4, 2, TYPE_FUNCTION, BASTOKEN_VPOS, TYPE_FUNCTION, BASTOKEN_VPOS, TRUE, FALSE},
{"WAIT", 4, 2, TYPE_ONEBYTE, BASTOKEN_WAIT, TYPE_ONEBYTE, BASTOKEN_WAIT, TRUE, FALSE}, /* 148 */
{"WHEN", 4, 3, TYPE_ONEBYTE, BASTOKEN_XWHEN, TYPE_ONEBYTE, BASTOKEN_XWHEN, FALSE, FALSE},
{"WHILE", 5, 1, TYPE_ONEBYTE, BASTOKEN_XWHILE, TYPE_ONEBYTE, BASTOKEN_XWHILE, FALSE, FALSE},
{"WIDTH", 5, 2, TYPE_ONEBYTE, BASTOKEN_WIDTH, TYPE_ONEBYTE, BASTOKEN_WIDTH, FALSE, FALSE},
{"XLATE$(", 7, 2, TYPE_FUNCTION, BASTOKEN_XLATEDOL, TYPE_FUNCTION, BASTOKEN_XLATEDOL, FALSE, FALSE}, /* 152 */
/*
** The following keywords are Basic commands. These can be entered in mixed case.
** Note that 'RUN' and 'QUIT' are also in here so that they can be entered in
** lower case too.
** Also note that in the case of commands where there is an 'O' version, the
** 'O' version must come first, for example, EDITO must precede EDIT
*/
{"APPEND", 6, 2, TYPE_COMMAND, BASTOKEN_APPEND, TYPE_COMMAND, BASTOKEN_APPEND, FALSE, FALSE}, /* 153 */
{"AUTO", 4, 2, TYPE_COMMAND, BASTOKEN_AUTO, TYPE_COMMAND, BASTOKEN_AUTO, FALSE, FALSE},
{"CRUNCH", 6, 2, TYPE_COMMAND, BASTOKEN_CRUNCH, TYPE_COMMAND, BASTOKEN_CRUNCH, FALSE, FALSE}, /* 155 */
{"DELETE", 6, 3, TYPE_COMMAND, BASTOKEN_DELETE, TYPE_COMMAND, BASTOKEN_DELETE, FALSE, FALSE}, /* 156 */
{"EDITO", 5, 5, TYPE_COMMAND, BASTOKEN_EDITO, TYPE_COMMAND, BASTOKEN_EDITO, FALSE, FALSE}, /* 157 */
{"EDIT", 4, 2, TYPE_COMMAND, BASTOKEN_EDIT, TYPE_COMMAND, BASTOKEN_EDIT, FALSE, FALSE},
{"HELP", 4, 2, TYPE_COMMAND, BASTOKEN_HELP, TYPE_COMMAND, BASTOKEN_HELP, TRUE, FALSE}, /* 159 */
{"INSTALL", 7, 5, TYPE_COMMAND, BASTOKEN_INSTALL, TYPE_COMMAND, BASTOKEN_INSTALL, FALSE, FALSE}, /* 160 */
{"LISTB", 5, 5, TYPE_COMMAND, BASTOKEN_LISTB, TYPE_COMMAND, BASTOKEN_LISTB, FALSE, FALSE}, /* 161 */
{"LISTIF", 6, 6, TYPE_COMMAND, BASTOKEN_LISTIF, TYPE_COMMAND, BASTOKEN_LISTIF, FALSE, FALSE},
{"LISTL", 5, 5, TYPE_COMMAND, BASTOKEN_LISTL, TYPE_COMMAND, BASTOKEN_LISTL, FALSE, FALSE},
{"LISTO", 5, 5, TYPE_COMMAND, BASTOKEN_LISTO, TYPE_FUNCTION, BASTOKEN_LISTOFN, FALSE, FALSE},
{"LISTW", 5, 5, TYPE_COMMAND, BASTOKEN_LISTW, TYPE_COMMAND, BASTOKEN_LISTW, FALSE, FALSE},
{"LIST", 4, 1, TYPE_COMMAND, BASTOKEN_LIST, TYPE_COMMAND, BASTOKEN_LIST, FALSE, FALSE},
{"LOAD", 4, 2, TYPE_COMMAND, BASTOKEN_LOAD, TYPE_COMMAND, BASTOKEN_LOAD, FALSE, FALSE},
{"LVAR", 4, 3, TYPE_COMMAND, BASTOKEN_LVAR, TYPE_COMMAND, BASTOKEN_LVAR, TRUE, FALSE},
{"NEW", 3, 3, TYPE_COMMAND, BASTOKEN_NEW, TYPE_COMMAND, BASTOKEN_NEW, TRUE, FALSE}, /* 169 */
{"OLD", 3, 1, TYPE_COMMAND, BASTOKEN_OLD, TYPE_COMMAND, BASTOKEN_OLD, TRUE, FALSE}, /* 170 */
{"QUIT", 4, 1, TYPE_ONEBYTE, BASTOKEN_QUIT, TYPE_ONEBYTE, BASTOKEN_QUIT, TRUE, FALSE}, /* 171 */
{"RENUMBER", 8, 3, TYPE_COMMAND, BASTOKEN_RENUMBER, TYPE_COMMAND, BASTOKEN_RENUMBER, FALSE, FALSE}, /* 172 */
{"RUN", 3, 2, TYPE_ONEBYTE, BASTOKEN_RUN, TYPE_ONEBYTE, BASTOKEN_RUN, TRUE, FALSE},
{"SAVEO", 5, 5, TYPE_COMMAND, BASTOKEN_SAVEO, TYPE_COMMAND, BASTOKEN_SAVEO, FALSE, FALSE}, /* 174 */
{"SAVE", 4, 2, TYPE_COMMAND, BASTOKEN_SAVE, TYPE_COMMAND, BASTOKEN_SAVE, FALSE, FALSE},
{"TEXTLOAD", 8, 3, TYPE_COMMAND, BASTOKEN_TEXTLOAD, TYPE_COMMAND, BASTOKEN_TEXTLOAD, FALSE, FALSE}, /* 176 */
{"TEXTSAVEO", 9, 9, TYPE_COMMAND, BASTOKEN_TEXTSAVEO, TYPE_COMMAND, BASTOKEN_TEXTSAVEO, FALSE, FALSE},
{"TEXTSAVE", 8, 5, TYPE_COMMAND, BASTOKEN_TEXTSAVE, TYPE_COMMAND, BASTOKEN_TEXTSAVE, FALSE, FALSE},
{"TWINO", 5, 2, TYPE_COMMAND, BASTOKEN_TWINO, TYPE_COMMAND, BASTOKEN_TWINO, TRUE, FALSE},
{"TWIN", 4, 4, TYPE_COMMAND, BASTOKEN_TWIN, TYPE_COMMAND, BASTOKEN_TWIN, TRUE, FALSE},
/* NOTE(review): looks like an end-of-table marker; its length is given as 1 although the name has two characters - confirm */
{"ZZ", 1, 1, 0, 0, 0, 0, FALSE, FALSE} /* 181 */
};
/* Number of entries in 'tokens', including the final "ZZ" entry */
#define TOKTABSIZE (sizeof(tokens)/sizeof(token))
/*
** 'start_letter' has one entry per letter, 'A' to 'Z'. Each entry is the
** index in 'tokens' of the first Basic keyword that starts with that
** letter or NOKEYWORD if there are no keywords starting with it
*/
static int start_letter [] = {
  0, 9, 14, 27,                   /* A B C D */
  33, 50, 55, 60,                 /* E F G H */
  61, NOKEYWORD, NOKEYWORD, 67,   /* I J K L */
  76, 81, 83, 94,                 /* M N O P */
  103, 104, 117, 131,             /* Q R S T */
  140, 142, 148, 152,             /* U V W X */
  NOKEYWORD, NOKEYWORD            /* Y Z */
};
/*
** 'command_start' has one entry per letter, 'A' to 'Z'. Each entry is the
** index in 'tokens' of the first Basic command that starts with that
** letter or NOKEYWORD if there are no commands starting with it
*/
static int command_start [] = {
  153, NOKEYWORD, 155, 156,               /* A B C D */
  157, NOKEYWORD, NOKEYWORD, 159,         /* E F G H */
  160, NOKEYWORD, NOKEYWORD, 161,         /* I J K L */
  NOKEYWORD, 169, 170, NOKEYWORD,         /* M N O P */
  171, 172, 174, 176,                     /* Q R S T */
  NOKEYWORD, NOKEYWORD, NOKEYWORD, NOKEYWORD,   /* U V W X */
  NOKEYWORD, NOKEYWORD                    /* Y Z */
};
/*
** Working state shared by the tokenisation functions in this file
*/
static char *lp;              /* Pointer to current position in untokenised Basic statement */
static int next;              /* Index of next free byte in tokenised line buffer */
static int source;            /* Index of next byte in source (used when compressing source) */
static int brackets;          /* Current bracket nesting depth */
static int indentation;       /* Current indentation when listing program */
static int lasterror;         /* Number of last error detected when tokenising a line */
static boolean linestart;     /* TRUE if at the start of a tokenised line */
static boolean firstitem;     /* TRUE if processing the start of an untokenised Basic statement */
static boolean numbered;      /* TRUE if line starts with a line number */
static boolean immediate;     /* TRUE if tokenising line in immediate mode */
/*
** 'isempty' checks whether a tokenised line has anything on it. 'line'
** points at the start of the tokenised line. The result is true if the
** byte at offset OFFSOURCE in the line is a NUL
*/
boolean isempty(byte line[]) {
  boolean blank;
  DEBUGFUNCMSGIN;
  blank = line[OFFSOURCE] == asc_NUL;
  DEBUGFUNCMSGOUT;
  return blank;
}
/*
** 'save_lineno' writes the line number 'number' to the two bytes
** starting at 'where'. The low-order byte is written first
*/
void save_lineno(byte *where, int32 number) {
  DEBUGFUNCMSGIN;
  where[0] = CAST(number, byte);
  where[1] = CAST(number>>BYTESHIFT, byte);
  DEBUGFUNCMSGOUT;
}
/*
** 'store_lineno' adds a line number to the tokenised line buffer at
** the current position, low byte first then high byte, and moves
** 'next' on by two. If there is no room left in the buffer, the
** error ERR_STATELEN is reported and nothing is stored
*/
static void store_lineno(int32 number) {
  DEBUGFUNCMSGIN;
  if (next+LINESIZE<MAXSTATELEN) {
    tokenbase[next++] = CAST(number, byte);
    tokenbase[next++] = CAST(number>>BYTESHIFT, byte);
    DEBUGFUNCMSGOUT;
  }
  else {
    error(ERR_STATELEN);
  }
}
/*
** 'store_linelen' fills in the two byte line length field at offset
** OFFLENGTH from the start of the tokenised line. The low byte of
** the length is stored first
*/
static void store_linelen(int32 length) {
  byte *field = tokenbase+OFFLENGTH;
  DEBUGFUNCMSGIN;
  field[0] = CAST(length, byte);
  field[1] = CAST(length>>BYTESHIFT, byte);
  DEBUGFUNCMSGOUT;
}
/*
** 'store_exec' fills in the two byte field at offset OFFEXEC from the
** start of the tokenised line with the offset of the first executable
** token in the line. The low byte of the offset is stored first
*/
static void store_exec(int32 offset) {
  byte *field = tokenbase+OFFEXEC;
  DEBUGFUNCMSGIN;
  field[0] = CAST(offset, byte);
  field[1] = CAST(offset>>BYTESHIFT, byte);
  DEBUGFUNCMSGOUT;
}
/*
** 'get_linelen' returns the length of a line. 'p' is assumed to point at the
** start of the line (that is, the line number)
*/
#if 0 /* Converted to macro in tokens.h */
/*
** The three functions in this section are not compiled. They are the
** original function versions of 'get_linelen', 'get_lineno' and
** 'get_srcaddr' and are kept for reference only.
*/
/*
** 'get_linelen' returns the two byte length held at offset OFFLENGTH
** from 'p', low byte first
*/
int32 get_linelen(byte *p) {
  DEBUGFUNCMSGIN;
  DEBUGFUNCMSGOUT;
  return *(p+OFFLENGTH) | *(p+OFFLENGTH+1)<<BYTESHIFT;
}
/*
** 'get_lineno' returns the line number of the line starting at 'p'
*/
int32 get_lineno(byte *p) {
  DEBUGFUNCMSGIN;
  DEBUGFUNCMSGOUT;
  return *(p+OFFLINE) | *(p+OFFLINE+1)<<BYTESHIFT;
}
/*
** 'get_srcaddr' returns the address of a byte in the source part
** of a line. This is given as an offset from the address of the
** token at 'p'. The offset is stored in the two bytes after the
** token, low byte first, and is subtracted from 'p'
*/
byte *get_srcaddr(byte *p) {
  DEBUGFUNCMSGIN;
  DEBUGFUNCMSGOUT;
  return p-(*(p+1)+(*(p+2)<<BYTESHIFT));
}
#endif /* 0 - macro conversion */
/*
** 'get_exec' returns the offset in the line of the first executable
** token. 'p' points at the start of the line. Normally a macro is
** used to do this for speed
*/
//static int32 get_exec(byte *p) {
// DEBUGFUNCMSGIN;
// DEBUGFUNCMSGOUT;
// return *(p+OFFEXEC) | *(p+OFFEXEC+1)<<BYTESHIFT;
//}
/*
** 'get_exec' gives the two byte value held at offset OFFEXEC from 'p',
** low byte first. The argument is enclosed in parentheses in the
** expansion so that any pointer expression can be passed safely. Note
** that 'p' is evaluated twice
*/
#define get_exec(p) (*((p)+OFFEXEC) | *((p)+OFFEXEC+1)<<BYTESHIFT)
/*
** 'PREVIOUS_TOKEN' is the last byte added to the tokenised line
** buffer. It can only be used when 'next' is greater than zero
*/
#define PREVIOUS_TOKEN (tokenbase[next-1])
/*
** 'store' adds the single byte 'token' to the tokenised line buffer
** and moves 'next' on by one. If there is no room left in the buffer,
** the error ERR_STATELEN is reported and nothing is stored
*/
static void store(byte token) {
  DEBUGFUNCMSGIN;
  if (next+1<MAXSTATELEN) {
    tokenbase[next++] = token;
    DEBUGFUNCMSGOUT;
  }
  else {
    error(ERR_STATELEN);
  }
}
/*
** 'store_size' adds a two-byte length to the tokenised line buffer,
** low byte first, and moves 'next' on by two. If there is no room
** left in the buffer, the error ERR_STATELEN is reported and nothing
** is stored
*/
static void store_size(int32 size) {
  byte *dest;
  DEBUGFUNCMSGIN;
  if (next+SIZESIZE>=MAXSTATELEN) {
    error(ERR_STATELEN);
    return;
  }
  dest = tokenbase+next;
  dest[0] = CAST(size, byte);
  dest[1] = CAST(size>>BYTESHIFT, byte);
  next = next+2;
  DEBUGFUNCMSGOUT;
}
/*
** 'store_longoffset' adds a long offset (offset from the start of the
** Basic workspace) to the tokenised line buffer. The value is stored
** as LOFFSIZE bytes, least significant byte first. If there is no room
** left in the buffer, the error ERR_STATELEN is reported and nothing
** is stored
*/
static void store_longoffset(int32 value) {
  int count;
  DEBUGFUNCMSGIN;
  if (next+LOFFSIZE>=MAXSTATELEN) {
    error(ERR_STATELEN);
    return;
  }
  for (count=0; count<LOFFSIZE; count++) {
    tokenbase[next++] = CAST(value, byte);
    value = value>>BYTESHIFT;
  }
  DEBUGFUNCMSGOUT;
}
/*
** 'store_shortoffset' adds a two byte offset to the tokenised line
** buffer, low byte first. These are used for references to lines from
** the current position in the Basic program. If there is no room left
** in the buffer, the error ERR_STATELEN is reported and nothing is
** stored
*/
static void store_shortoffset(int32 value) {
  DEBUGFUNCMSGIN;
  if (next+OFFSIZE<MAXSTATELEN) {
    tokenbase[next++] = CAST(value, byte);
    tokenbase[next++] = CAST(value>>BYTESHIFT, byte);
    DEBUGFUNCMSGOUT;
  }
  else {
    error(ERR_STATELEN);
  }
}
/*
** 'store_intconst' adds an integer constant to the tokenised line
** buffer. The value is stored as INTSIZE bytes, least significant
** byte first. If there is no room left in the buffer, the error
** ERR_STATELEN is reported and nothing is stored
*/
static void store_intconst(int32 value) {
  int count;
  DEBUGFUNCMSGIN;
  if (next+INTSIZE>=MAXSTATELEN) {
    error(ERR_STATELEN);
    return;
  }
  for (count=0; count<INTSIZE; count++) {
    tokenbase[next++] = CAST(value, byte);
    value = value>>8;
  }
  DEBUGFUNCMSGOUT;
}
/*
** 'store_int64const' adds a 64-bit integer constant to the tokenised
** line buffer. The value is stored as INT64SIZE bytes, least
** significant byte first. If there is no room left in the buffer, the
** error ERR_STATELEN is reported and nothing is stored
*/
static void store_int64const(int64 value) {
  int count;
  DEBUGFUNCMSGIN;
  if (next+INT64SIZE>=MAXSTATELEN) {
    error(ERR_STATELEN);
    return;
  }
  for (count=0; count<INT64SIZE; count++) {
    tokenbase[next++] = CAST(value, byte);
    value = value>>8;
  }
  DEBUGFUNCMSGOUT;
}
/*
** 'store_fpvalue' adds a floating point value to the tokenised line
** buffer. The bytes of the value are copied in the order in which
** they are held in memory. If there is no room left in the buffer,
** the error ERR_STATELEN is reported and nothing is stored
*/
static void store_fpvalue(float64 fpvalue) {
  DEBUGFUNCMSGIN;
  if (next+FLOATSIZE>=MAXSTATELEN) {
    error(ERR_STATELEN);
    return;
  }
  memcpy(&tokenbase[next], &fpvalue, sizeof(float64));
  next += (int)sizeof(float64);
  DEBUGFUNCMSGOUT;
}
/*
** 'convert_lineno' is called when a line number is found to convert
** it to binary. If the line number is too large the error is flagged
** but tokenisation continues
*/
static int32 convert_lineno(void) {
int32 line = 0;
DEBUGFUNCMSGIN;
while (*lp>='0' && *lp<='9' && line<=MAXLINENO) {
line = line*10+(*lp-'0');
lp++;
}
if (line>MAXLINENO) {
lasterror = ERR_LINENO;
error(WARN_LINENO); /* Line number is too large */
line = 0;
while (*lp>='0' && *lp<='9') lp++; /* Skip any remaining digits in line number */
}
DEBUGFUNCMSGOUT;
return line;
}
/*
** 'copy_line' copies everything from 'lp' up to (but not including)
** the terminating NUL to the tokenised line buffer. It returns a
** pointer to that NUL
*/
static char *copy_line(char *lp) {
  char *src;
  DEBUGFUNCMSGIN;
  for (src=lp; *src != asc_NUL; src++) store(*src);
  DEBUGFUNCMSGOUT;
  return src;
}
#if 0
// Disabled - no longer used as DRAW BY etc are now two tokens
/*
** 'nextis' checks whether the next non-blank characters on the line
** match the text given by 'string', returning 'true' if they do. It
** was used when checking for statement types such as 'DRAW BY' at the
** time when 'DRAW BY' and its ilk were represented by single tokens.
** The function is excluded from compilation by the '#if 0' above
*/
static boolean nextis(char *string) {
char *cp;
DEBUGFUNCMSGIN;
cp = skip_blanks(lp);
DEBUGFUNCMSGOUT;
/* An end of line straight after the blanks can never match */
return *cp != asc_NUL && strncmp(cp, string, strlen(string)) == 0;
}
#endif
/*
** 'kwsearch' checks to see if the text at 'lp' is a keyword or a
** command, returning the index of its entry in the 'tokens' table or
** 'NOKEYWORD' if there is no match. As a side effect, it moves 'lp'
** past the keyword (and past the '.' that ends an abbreviation) if a
** keyword is found; 'lp' is left untouched otherwise.
**
** Note that there are cases of strings that are tokens unless
** followed by another alphanumeric character, for example, COUNT is a
** token unless followed by a letter, so "COUNT" is a token, but
** "COUNTER" is not. Keywords start with a letter in the range A..W,
** excluding J and K.
**
** Matching is case-sensitive: keywords and commands are only
** recognised in upper case, so that mixed-case names such as 'Total'
** or 'Print' and lower-case names such as 'save%' remain usable as
** variables. The exception is when 'matrixflags.lowercasekeywords' is
** set, in which case the text is folded to upper case before the
** tables are searched.
*/
static int kwsearch(void) {
  int n, count, kwlength;
  char first, *cp;
  boolean nomatch, abbreviated;
  char keyword[MAXKWLEN+1];
  DEBUGFUNCMSGIN;
/* Collect the candidate text. '$' and '(' can be part of a keyword, e.g. 'TAB(' */
  cp = lp;
  for (n=0; n<MAXKWLEN && (isalpha((unsigned char)*cp) || *cp == '$' || *cp == '('); n++) {
    keyword[n] = *cp;
    cp++;
  }
  abbreviated = n < MAXKWLEN && *cp == '.';
  if (!abbreviated && n == 1) { /* Text is only one character long - Cannot be a keyword */
    DEBUGFUNCMSGOUT;
    return NOKEYWORD;
  }
  keyword[n] = asc_NUL;
  kwlength = n;
  count = 0;
  if (matrixflags.lowercasekeywords) {
    for (n=0; keyword[n] != asc_NUL; n++) keyword[n] = toupper((unsigned char)keyword[n]);
  }
  first = keyword[0];
/*
** The start-of-letter tables are indexed by 'first'-'A', so anything
** that is not a letter (no text at all, or text starting with '$' or
** '(') has to be rejected here. Text that still starts with a lower
** case letter at this point cannot match either table
*/
  if (first < 'A' || first > 'Z') {
    DEBUGFUNCMSGOUT;
    return NOKEYWORD;
  }
  n = start_letter[first-'A'];
  if (n == NOKEYWORD) { /* No keyword starts with this letter */
    DEBUGFUNCMSGOUT;
    return NOKEYWORD;
  }
  do {
    count = tokens[n].length;   /* Decide on number of characters to compare */
    if (abbreviated && kwlength < count) {
      count = kwlength;
      if (kwlength < tokens[n].minlength) count = tokens[n].minlength;
    }
/* Case-sensitive on purpose: see the note on matching in the header comment */
    if (strncmp(keyword, tokens[n].name, count) == 0) break;
    n++;
  } while (*(tokens[n].name) == first);
  nomatch = *(tokens[n].name) != first;
/*
** Any '.' immediately after a keyword is taken to say that the
** keyword has been abbreviated but this is not true in the case
** where we get an exact match between the word read and a keyword,
** that is, the number of characters in the word read and the
** keyword are the same. Weed out that case here.
*/
  if (!nomatch && abbreviated) abbreviated = kwlength < tokens[n].length;
  if (nomatch) {        /* Keyword not found. Check if it is a command */
    n = command_start[first-'A'];
    if (n == NOKEYWORD) {       /* Text is not a keyword or a command */
      DEBUGFUNCMSGOUT;
      return NOKEYWORD;
    }
    do {
      count = tokens[n].length; /* Decide on number of characters to compare */
      if (abbreviated && kwlength < count) {
        count = kwlength;
        if (kwlength < tokens[n].minlength) count = tokens[n].minlength;
      }
      if (strncmp(keyword, tokens[n].name, count) == 0) break;
      n++;
    } while (*(tokens[n].name) == first);
    nomatch = *(tokens[n].name) != first;
    if (!nomatch && abbreviated) abbreviated = kwlength < tokens[n].length;
  }
/*
** A keyword flagged as 'alone' is not a keyword if the text carries
** on with another identifier character, e.g. 'COUNTER'
*/
  if (nomatch || (!abbreviated && tokens[n].alone && ISIDCHAR(keyword[count]))) {       /* Not a keyword */
    DEBUGFUNCMSGOUT;
    return NOKEYWORD;
  }
  lp += count;          /* Found a keyword */
  if (abbreviated && *lp == '.') lp++;  /* Skip '.' after abbreviated keyword */
  DEBUGFUNCMSGOUT;
  return n;
}
/*
** 'copy_keyword' is called when a keyword is found. 'token' is the
** index of the keyword's entry in the 'tokens' table. The function
** stores the equivalent token value and carries out any processing
** peculiar to that keyword, in particular taking care of the
** 'firstitem' flag. The keywords 'THEN', 'ELSE', 'REPEAT' and
** 'OTHERWISE' can be followed by statements, so the flag is set to
** 'true' after these. Every other keyword sets it to 'false'
*/
static void copy_keyword(int token) {
  byte kind, value;
  DEBUGFUNCMSGIN;
  if (!firstitem) {
    kind = tokens[token].type;
    value = tokens[token].value;
  }
  else {        /* Keyword is the first item in the statement */
    kind = tokens[token].lhtype;
    value = tokens[token].lhvalue;
    if (linestart && kind == TYPE_ONEBYTE && value == BASTOKEN_XELSE) value = BASTOKEN_XLHELSE;
  }
  firstitem = FALSE;
  if (kind != TYPE_ONEBYTE) store(kind);        /* Tokens of any other type are preceded by their type byte */
  store(value);
  if (tokens[token].name[tokens[token].length-1] == '(') brackets++;    /* Allow for '(' in things like 'TAB(' */
  if (kind == TYPE_ONEBYTE) {   /* Check for special cases */
    if (value == BASTOKEN_REM || value == BASTOKEN_DATA) {      /* Copy rest of line */
      lp = copy_line(lp);
    }
    else if (value == BASTOKEN_THEN || value == BASTOKEN_REPEAT
     || value == BASTOKEN_XELSE || value == BASTOKEN_XOTHERWISE) {
      firstitem = TRUE;         /* Next token must use the 'first in statement' token */
    }
    else if (value == BASTOKEN_FN || value == BASTOKEN_PROC) {  /* Copy proc/function name */
      for (; ISIDCHAR(*lp); lp++) store(*lp);
    }
  }
  else if (kind == TYPE_COMMAND && (value == BASTOKEN_LISTIF || value == BASTOKEN_LVAR)) {
    lp = copy_line(lp);         /* Copy rest of line untranslated */
  }
  DEBUGFUNCMSGOUT;
}
/*
** 'copy_token' deals with token values directly entered from the
** keyboard. It ensures that the token value is legal by looking it up
** in the 'tokens' table: a token that is found is passed on to
** 'copy_keyword', otherwise a 'bad token' warning is issued and
** 'lasterror' is set to ERR_SYNTAX
*/
static void copy_token(void) {
  int entry;
  byte kind, value;
  DEBUGFUNCMSGIN;
  kind = TYPE_ONEBYTE;
  value = *lp++;        /* Fetch the token */
  if (value>=TYPE_COMMAND) {    /* Byte is a token type: the actual token follows it */
    kind = value;
    value = *lp++;
  }
/*
** Which pair of table fields has to match depends on whether the
** token is the first item in the statement
*/
  for (entry=0; entry<TOKTABSIZE; entry++) {
    if (firstitem) {
      if (kind == tokens[entry].lhtype && value == tokens[entry].lhvalue) break;
    }
    else {
      if (kind == tokens[entry].type && value == tokens[entry].value) break;
    }
  }
  if (entry>=TOKTABSIZE) {      /* Cannot find token value */
    lasterror = ERR_SYNTAX;
    error(WARN_BADTOKEN);
  }
  else {        /* Found token - Copy it to buffer and do token-specific processing */
    copy_keyword(entry);
  }
  DEBUGFUNCMSGOUT;
}
/*
** 'copy_variable' deals with variables. It copies the name to the
** token buffer. The name of a dynamic variable is preceded by a 'XVAR'
** token so that the name can be found easily when trying to replace
** pointers to variables' symbol table entries with references to
** their names (see function clear_varaddrs() below). The static
** integer variables ('@%' to 'Z%') are stored without the 'XVAR'
** token. Any '%', '%%', '&' or '$' suffix is copied after the name
*/
static void copy_variable(void) {
  DEBUGFUNCMSGIN;
/*
** A single character in the range '@' to 'Z' followed by exactly one
** '%' is a static integer variable unless it is an array reference
*/
  if (*lp<'@' || *lp>'Z' || lp[1] != '%' || lp[2] == '%' || lp[2] == '(' || lp[2] == '[') {     /* Dynamic variable */
    store(BASTOKEN_XVAR);
    for (; ISIDCHAR(*lp); lp++) store(*lp);
  }
  else {        /* Static integer variable */
    store(*lp);
    lp++;
  }
  if (*lp == '%') {     /* Integer variable */
    store('%');
    lp++;
    if (*lp == '%') {   /* %% for 64-bit int */
      store('%');
      lp++;
    }
  }
  if (*lp == '&') {     /* Unsigned 8-bit int variable */
    store('&');
    lp++;
  }
  if (*lp == '$') {     /* String variable */
    store('$');
    lp++;
  }
  DEBUGFUNCMSGOUT;
}
/*
** 'copy_lineno' copies a line number into the source part of the
** tokenised line. The number is converted to binary to make it
** easier to renumber lines
*/
static void copy_lineno(void) {
DEBUGFUNCMSGIN;
store(BASTOKEN_XLINENUM);
store_lineno(convert_lineno());
DEBUGFUNCMSGOUT;
}
/*
** 'copy_number' copies hex, binary, integer and floating point
** constants to the token buffer as text. The character at 'lp' is
** always copied and decides the sort of number: '&' introduces a hex
** number, '%' a binary one and anything else is taken to be the start
** of a decimal number. A hex or binary prefix with no digits after it
** is flagged as an error but tokenisation continues
*/
static void copy_number(void) {
  char lead;
  int found;
  DEBUGFUNCMSGIN;
  lead = *lp;
  lp++;
  store(lead);
  found = 0;
  if (lead == '&') {    /* Hex number */
    for (; isxdigit(*lp); lp++) {
      store(*lp);
      found++;
    }
    if (found == 0) {   /* Number contains no digits */
      lasterror = ERR_SYNTAX;
      error(WARN_BADHEX);
    }
  }
  else if (lead == '%') {       /* Binary number */
    for (; *lp == '0' || *lp == '1'; lp++) {
      store(*lp);
      found++;
    }
    if (found == 0) {   /* Number contains no digits */
      lasterror = ERR_SYNTAX;
      error(WARN_BADBIN);
    }
  }
  else {        /* Integer or floating point number */
    for (; *lp>='0' && *lp<='9'; lp++) store(*lp);
    if (*lp == '.') {   /* Got digits after a decimal point */
      store('.');
      lp++;
      for (; *lp>='0' && *lp<='9'; lp++) store(*lp);
    }
/*
** Check for an exponent. The code also looks at the character after
** the 'E' and if it is another letter it assumes that the 'E' is part
** of a word that follows the number and does not mark the start of
** an exponent
*/
    if ((*lp == 'e' || *lp == 'E') && !isalpha(*(lp+1))) {
      store(*lp);
      lp++;
      if (*lp == '+' || *lp == '-') {   /* Deal with 'E+<exponent>' or 'E-<exponent>' */
        store(*lp);
        lp++;
      }
      for (; *lp>='0' && *lp<='9'; lp++) store(*lp);
    }
  }
  DEBUGFUNCMSGOUT;
}
/*
** 'copy_string' copies a character string to the tokenised
** line buffer
*/
static void copy_string(void) {
DEBUGFUNCMSGIN;
store('"'); /* Store the quote at the start of the string */
lp++;
while (TRUE) {
if (*lp == asc_NUL) break; /* Error - Reached end of line without finding a '"' */
store(*lp);
if (*lp == '"') { /* Found a '"' */
if (*(lp+1) != '"') break; /* '"' is not followed by '"' so end of string found */
store('"'); /* Got '""' */
lp+=2;
}
else { /* Any other character */
lp++;
}
}
if (*lp == '"') /* End of string was a '"' */
lp++; /* Skip to character after the '"' */
else {
lasterror = ERR_QUOTEMISS;
error(WARN_QUOTEMISS); /* No terminating '"' found */
store('"');
}
DEBUGFUNCMSGOUT;
}
/*
** 'copy_other' deals with any other characters and special tokens
*/
static void copy_other(void) {
byte tclass, token;
DEBUGFUNCMSGIN;
tclass = TYPE_ONEBYTE;
token = *lp;
switch (token) { /* Deal with special tokens */
case '(':
brackets++;
break;
case ')':
brackets--;
if (brackets < 0) { /* More ')' than '(' */
lasterror = ERR_LPMISS;
error(WARN_PARNEST);
}
break;
case 172: /* This is a hi-bit char and causes a compiler warning if used directly */
tclass = TYPE_FUNCTION;
token = BASTOKEN_NOT;
break;
case '+':
if (*(lp+1) == '=') { /* Found '+=' */
token = BASTOKEN_PLUSAB;
lp++;
}
break;
case '-':
if (*(lp+1) == '=') { /* Found '-=' */
token = BASTOKEN_MINUSAB;
lp++;
}
break;
case '>':
switch (*(lp+1)) {
case '=': /* Found '>=' */
token = BASTOKEN_GE;
lp++;
break;
case '>':