1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125
|
# Generated by re2py
# re2py $INPUT -o $OUTPUT
# expect a null-terminated string
def lex(yyinput):
yycursor = 0
yylimit = len(yyinput) - 1 # terminating null not included
count = 0
while True:
yystate = 0
while True:
match yystate:
case 0:
yych = yyinput[yycursor]
if yych <= 0x20:
if yych <= 0x00:
if yylimit <= yycursor:
yystate = 9
continue
yycursor += 1
yystate = 1
continue
if yych >= 0x20:
yycursor += 1
yystate = 3
continue
yycursor += 1
yystate = 1
continue
else:
if yych == 0x27:
yycursor += 1
yystate = 5
continue
yycursor += 1
yystate = 1
continue
case 1:
yystate = 2
continue
case 2:
return -1
case 3:
yych = yyinput[yycursor]
if yych <= 0x00:
yystate = 4
continue
if yych == 0x20:
yycursor += 1
yystate = 3
continue
yystate = 4
continue
case 4:
break
case 5:
yymarker = yycursor
yych = yyinput[yycursor]
if yych >= 0x01:
yystate = 7
continue
if yylimit <= yycursor:
yystate = 2
continue
yycursor += 1
yystate = 6
continue
case 6:
yych = yyinput[yycursor]
yystate = 7
continue
case 7:
if yych <= 0x27:
if yych <= 0x00:
if yylimit <= yycursor:
yystate = 10
continue
yycursor += 1
yystate = 6
continue
if yych <= 0x26:
yycursor += 1
yystate = 6
continue
yycursor += 1
else:
if yych == 0x5C:
yycursor += 1
yystate = 8
continue
yycursor += 1
yystate = 6
continue
count += 1
break
case 8:
yych = yyinput[yycursor]
if yych <= 0x00:
if yylimit <= yycursor:
yystate = 10
continue
yycursor += 1
yystate = 6
continue
yycursor += 1
yystate = 6
continue
case 9:
return count
case 10:
yycursor = yymarker
yystate = 2
continue
case _:
raise "internal lexer error"
def test(str, count):
# termunating null not included in `lim`
assert count == lex(str)
test(b"\0", 0);
test(b"'qu\0tes' 'are' 'fine: \\'' \0", 3);
test(b"'unterminated\\'\0", -1)
|