Artifact
3a1a1e4786f1370d3c5d9c262d6daf2a7882395e9785305a8fbd256bf033328e :
File
runtime-c/gate.h
— part of check-in
[b0d7fa6f75]
at
2018-03-20 05:45:35
on branch trunk
— rtC's mixed use of both `char` and `unsigned char` in various APIs and
code, plus interaction with `int` breaks lexing when attempting to go
beyond ASCII, even when restricted to the BMP, due to bytes > 127
showing up as negative.
Fixed by changing all uses of `char` to `unsigned char`.
Further changed extraction of semantic values.
- Lexeme length is now counted in characters, not bytes.
- Similarly, lexeme end is now characters from start.
- Input is now byte- and character counted, for proper lexeme start.
Character counting in C strings pulled from tclUtf.c
Error messages now use the new char offsets, plus byte offsets for
partially read characters.
(user:
aku
size: 2014)
[more...]
0000: 2f 2a 20 52 75 6e 74 69 6d 65 20 66 6f 72 20 43 /* Runtime for C
0010: 2d 65 6e 67 69 6e 65 20 28 52 54 43 29 2e 20 44 -engine (RTC). D
0020: 65 63 6c 61 72 61 74 69 6f 6e 73 2e 20 28 45 6e eclarations. (En
0030: 67 69 6e 65 3a 20 4c 65 78 65 72 20 67 61 74 69 gine: Lexer gati
0040: 6e 67 29 0a 20 2a 20 2d 20 2d 20 2d 2d 20 2d 2d ng). * - - -- --
0050: 2d 20 2d 2d 2d 2d 2d 20 2d 2d 2d 2d 2d 2d 2d 2d - ----- --------
0060: 20 2d 2d 2d 2d 2d 2d 2d 2d 2d 2d 2d 2d 2d 20 2d ------------- -
0070: 2d 2d 2d 2d 2d 2d 2d 2d 2d 2d 2d 2d 2d 2d 2d 2d ----------------
0080: 2d 2d 2d 2d 0a 20 2a 20 28 63 29 20 32 30 31 37 ----. * (c) 2017
0090: 2d 32 30 31 38 20 41 6e 64 72 65 61 73 20 4b 75 -2018 Andreas Ku
00a0: 70 72 69 65 73 0a 20 2a 2f 0a 0a 23 69 66 6e 64 pries. */..#ifnd
00b0: 65 66 20 4d 41 52 50 41 54 43 4c 5f 52 54 43 5f ef MARPATCL_RTC_
00c0: 47 41 54 45 5f 48 0a 23 64 65 66 69 6e 65 20 4d GATE_H.#define M
00d0: 41 52 50 41 54 43 4c 5f 52 54 43 5f 47 41 54 45 ARPATCL_RTC_GATE
00e0: 5f 48 0a 0a 2f 2a 0a 20 2a 20 2d 20 2d 20 2d 2d _H../*. * - - --
00f0: 20 2d 2d 2d 20 2d 2d 2d 2d 2d 20 2d 2d 2d 2d 2d --- ----- -----
0100: 2d 2d 2d 20 2d 2d 2d 2d 2d 2d 2d 2d 2d 2d 2d 2d --- ------------
0110: 2d 20 2d 2d 2d 2d 2d 2d 2d 2d 2d 2d 2d 2d 2d 2d - --------------
0120: 2d 2d 2d 2d 2d 2d 2d 0a 20 2a 20 52 65 71 75 69 -------. * Requi
0130: 72 65 6d 65 6e 74 73 0a 20 2a 2f 0a 0a 23 69 6e rements. */..#in
0140: 63 6c 75 64 65 20 3c 62 79 74 65 73 65 74 2e 68 clude <byteset.h
0150: 3e 0a 23 69 6e 63 6c 75 64 65 20 3c 73 74 61 63 >.#include <stac
0160: 6b 2e 68 3e 0a 23 69 6e 63 6c 75 64 65 20 3c 72 k.h>.#include <r
0170: 74 63 2e 68 3e 0a 0a 2f 2a 0a 20 2a 20 2d 20 2d tc.h>../*. * - -
0180: 20 2d 2d 20 2d 2d 2d 20 2d 2d 2d 2d 2d 20 2d 2d -- --- ----- --
0190: 2d 2d 2d 2d 2d 2d 20 2d 2d 2d 2d 2d 2d 2d 2d 2d ------ ---------
01a0: 2d 2d 2d 2d 20 2d 2d 2d 2d 2d 2d 2d 2d 2d 2d 2d ---- -----------
01b0: 2d 2d 2d 2d 2d 2d 2d 2d 2d 2d 0a 20 2a 20 53 74 ----------. * St
01c0: 72 75 63 74 75 72 65 73 0a 20 2a 2f 0a 0a 74 79 ructures. */..ty
01d0: 70 65 64 65 66 20 73 74 72 75 63 74 20 6d 61 72 pedef struct mar
01e0: 70 61 74 63 6c 5f 72 74 63 5f 67 61 74 65 20 7b patcl_rtc_gate {
01f0: 0a 20 20 20 20 69 6e 74 20 20 20 20 20 20 20 20 . int
0200: 20 20 20 20 20 20 20 20 20 20 6c 61 73 74 63 68 lastch
0210: 61 72 3b 20 20 20 2f 2a 20 6c 61 73 74 20 63 68 ar; /* last ch
0220: 61 72 61 63 74 65 72 20 65 6e 74 65 72 65 64 20 aracter entered
0230: 69 6e 74 6f 20 74 68 65 20 67 61 74 65 20 2a 2f into the gate */
0240: 0a 20 20 20 20 69 6e 74 20 20 20 20 20 20 20 20 . int
0250: 20 20 20 20 20 20 20 20 20 20 6c 61 73 74 6c 6f lastlo
0260: 63 3b 20 20 20 20 2f 2a 20 4c 6f 63 61 74 69 6f c; /* Locatio
0270: 6e 20 6f 66 20 74 68 65 20 60 6c 61 73 74 63 68 n of the `lastch
0280: 61 72 60 20 28 62 79 74 65 20 6f 66 66 73 65 74 ar` (byte offset
0290: 29 20 2a 2f 0a 20 20 20 20 69 6e 74 20 20 20 20 ) */. int
02a0: 20 20 20 20 20 20 20 20 20 20 20 20 20 20 6c 61 la
02b0: 73 74 63 6c 6f 63 3b 20 20 20 2f 2a 20 53 61 6d stcloc; /* Sam
02c0: 65 2c 20 61 73 20 63 68 61 72 20 6f 66 66 73 65 e, as char offse
02d0: 74 20 2a 2f 0a 20 20 20 20 69 6e 74 20 20 20 20 t */. int
02e0: 20 20 20 20 20 20 20 20 20 20 20 20 20 20 66 6c fl
02f0: 75 73 68 65 64 3b 20 20 20 20 2f 2a 20 46 6c 75 ushed; /* Flu
0300: 73 68 69 6e 67 20 73 74 61 74 65 20 2a 2f 0a 20 shing state */.
0310: 20 20 20 6d 61 72 70 61 74 63 6c 5f 72 74 63 5f marpatcl_rtc_
0320: 73 74 61 63 6b 5f 70 20 68 69 73 74 6f 72 79 3b stack_p history;
0330: 20 20 20 20 2f 2a 20 48 69 73 74 6f 72 79 20 6f /* History o
0340: 66 20 74 68 65 20 63 75 72 72 65 6e 74 20 6d 61 f the current ma
0350: 74 63 68 20 61 74 74 65 6d 70 74 20 2a 2f 0a 20 tch attempt */.
0360: 20 20 20 6d 61 72 70 61 74 63 6c 5f 72 74 63 5f marpatcl_rtc_
0370: 73 74 61 63 6b 5f 70 20 70 65 6e 64 69 6e 67 3b stack_p pending;
0380: 20 20 20 20 2f 2a 20 53 63 72 61 74 63 68 20 73 /* Scratch s
0390: 74 61 63 6b 20 66 6f 72 20 68 69 73 74 6f 72 79 tack for history
03a0: 20 72 65 70 6c 61 79 20 2a 2f 0a 20 20 20 20 6d replay */. m
03b0: 61 72 70 61 74 63 6c 5f 72 74 63 5f 62 79 74 65 arpatcl_rtc_byte
03c0: 73 65 74 20 61 63 63 65 70 74 61 62 6c 65 3b 20 set acceptable;
03d0: 2f 2a 20 53 65 74 20 6f 66 20 61 63 63 65 70 74 /* Set of accept
03e0: 61 62 6c 65 20 62 79 74 65 20 28 73 79 6d 62 6f able byte (symbo
03f0: 6c 73 29 20 2a 2f 0a 7d 20 6d 61 72 70 61 74 63 ls) */.} marpatc
0400: 6c 5f 72 74 63 5f 67 61 74 65 3b 0a 0a 2f 2a 0a l_rtc_gate;../*.
0410: 20 2a 20 2d 20 2d 20 2d 2d 20 2d 2d 2d 20 2d 2d * - - -- --- --
0420: 2d 2d 2d 20 2d 2d 2d 2d 2d 2d 2d 2d 20 2d 2d 2d --- -------- ---
0430: 2d 2d 2d 2d 2d 2d 2d 2d 2d 2d 20 2d 2d 2d 2d 2d ---------- -----
0440: 2d 2d 2d 2d 2d 2d 2d 2d 2d 2d 2d 2d 2d 2d 2d 2d ----------------
0450: 0a 20 2a 20 41 50 49 20 2d 20 6c 69 66 65 63 79 . * API - lifecy
0460: 63 6c 65 2c 20 61 63 63 65 73 73 6f 72 73 2c 20 cle, accessors,
0470: 6d 75 74 61 74 6f 72 73 0a 20 2a 0a 20 2a 20 69 mutators. *. * i
0480: 6e 69 74 20 20 20 20 20 20 20 2d 20 69 6e 69 74 nit - init
0490: 69 61 6c 69 7a 65 20 61 20 67 61 74 65 0a 20 2a ialize a gate. *
04a0: 20 66 72 65 65 20 20 20 20 20 20 20 2d 20 72 65 free - re
04b0: 6c 65 61 73 65 20 67 61 74 65 20 73 74 61 74 65 lease gate state
04c0: 0a 20 2a 20 65 6e 74 65 72 20 20 20 20 20 20 2d . * enter -
04d0: 20 70 75 73 68 20 61 20 73 69 6e 67 6c 65 20 62 push a single b
04e0: 79 74 65 20 6f 66 20 69 6e 70 75 74 0a 20 2a 20 yte of input. *
04f0: 65 6f 66 20 20 20 20 20 20 20 20 2d 20 73 69 67 eof - sig
0500: 6e 61 6c 20 74 68 65 20 65 6e 64 20 6f 66 20 74 nal the end of t
0510: 68 65 20 69 6e 70 75 74 0a 20 2a 20 61 63 63 65 he input. * acce
0520: 70 74 61 62 6c 65 20 2d 20 69 6e 66 6f 72 6d 61 ptable - informa
0530: 74 69 6f 6e 20 66 72 6f 6d 20 6c 65 78 65 72 20 tion from lexer
0540: 61 62 6f 75 74 20 61 63 63 65 70 74 61 62 6c 65 about acceptable
0550: 20 62 79 74 65 73 0a 20 2a 20 72 65 64 6f 20 20 bytes. * redo
0560: 20 20 20 20 20 2d 20 72 65 73 65 74 20 74 6f 20 - reset to
0570: 61 6e 64 20 72 65 70 6c 61 79 20 74 68 65 20 6c and replay the l
0580: 61 73 74 20 6e 20 62 79 74 65 73 20 65 6e 74 65 ast n bytes ente
0590: 72 65 64 0a 20 2a 2f 0a 0a 76 6f 69 64 20 6d 61 red. */..void ma
05a0: 72 70 61 74 63 6c 5f 72 74 63 5f 67 61 74 65 5f rpatcl_rtc_gate_
05b0: 69 6e 69 74 20 20 20 20 20 20 20 28 6d 61 72 70 init (marp
05c0: 61 74 63 6c 5f 72 74 63 5f 70 20 70 29 3b 0a 76 atcl_rtc_p p);.v
05d0: 6f 69 64 20 6d 61 72 70 61 74 63 6c 5f 72 74 63 oid marpatcl_rtc
05e0: 5f 67 61 74 65 5f 66 72 65 65 20 20 20 20 20 20 _gate_free
05f0: 20 28 6d 61 72 70 61 74 63 6c 5f 72 74 63 5f 70 (marpatcl_rtc_p
0600: 20 70 29 3b 0a 76 6f 69 64 20 6d 61 72 70 61 74 p);.void marpat
0610: 63 6c 5f 72 74 63 5f 67 61 74 65 5f 65 6e 74 65 cl_rtc_gate_ente
0620: 72 20 20 20 20 20 20 28 6d 61 72 70 61 74 63 6c r (marpatcl
0630: 5f 72 74 63 5f 70 20 70 2c 20 75 6e 73 69 67 6e _rtc_p p, unsign
0640: 65 64 20 63 68 61 72 20 63 68 29 3b 20 2f 2a 20 ed char ch); /*
0650: 6c 6f 63 61 74 69 6f 6e 20 69 6d 70 6c 69 65 64 location implied
0660: 20 2a 2f 0a 76 6f 69 64 20 6d 61 72 70 61 74 63 */.void marpatc
0670: 6c 5f 72 74 63 5f 67 61 74 65 5f 65 6f 66 20 20 l_rtc_gate_eof
0680: 20 20 20 20 20 20 28 6d 61 72 70 61 74 63 6c 5f (marpatcl_
0690: 72 74 63 5f 70 20 70 29 3b 0a 76 6f 69 64 20 6d rtc_p p);.void m
06a0: 61 72 70 61 74 63 6c 5f 72 74 63 5f 67 61 74 65 arpatcl_rtc_gate
06b0: 5f 61 63 63 65 70 74 61 62 6c 65 20 28 6d 61 72 _acceptable (mar
06c0: 70 61 74 63 6c 5f 72 74 63 5f 70 20 70 29 3b 0a patcl_rtc_p p);.
06d0: 76 6f 69 64 20 6d 61 72 70 61 74 63 6c 5f 72 74 void marpatcl_rt
06e0: 63 5f 67 61 74 65 5f 72 65 64 6f 20 20 20 20 20 c_gate_redo
06f0: 20 20 28 6d 61 72 70 61 74 63 6c 5f 72 74 63 5f (marpatcl_rtc_
0700: 70 20 70 2c 20 69 6e 74 20 6e 29 3b 0a 2f 2a 20 p p, int n);./*
0710: 54 4f 44 4f 3a 20 67 65 74 2d 63 6f 6e 74 65 78 TODO: get-contex
0720: 74 2c 20 65 78 74 65 6e 64 2d 63 6f 6e 74 65 78 t, extend-contex
0730: 74 20 2a 2f 0a 0a 23 65 6e 64 69 66 0a 0a 2f 2a t */..#endif../*
0740: 0a 20 2a 20 2d 20 2d 20 2d 2d 20 2d 2d 2d 20 2d . * - - -- --- -
0750: 2d 2d 2d 2d 20 2d 2d 2d 2d 2d 2d 2d 2d 20 2d 2d ---- -------- --
0760: 2d 2d 2d 2d 2d 2d 2d 2d 2d 2d 2d 20 2d 2d 2d 2d ----------- ----
0770: 2d 2d 2d 2d 2d 2d 2d 2d 2d 2d 2d 2d 2d 2d 2d 2d ----------------
0780: 2d 0a 20 2a 2f 0a 0c 0a 2f 2a 0a 20 2a 20 4c 6f -. */.../*. * Lo
0790: 63 61 6c 20 56 61 72 69 61 62 6c 65 73 3a 0a 20 cal Variables:.
07a0: 2a 20 6d 6f 64 65 3a 20 63 0a 20 2a 20 63 2d 62 * mode: c. * c-b
07b0: 61 73 69 63 2d 6f 66 66 73 65 74 3a 20 34 0a 20 asic-offset: 4.
07c0: 2a 20 66 69 6c 6c 2d 63 6f 6c 75 6d 6e 3a 20 37 * fill-column: 7
07d0: 38 0a 20 2a 20 45 6e 64 3a 0a 20 2a 2f 0a 8. * End:. */.