File: reuse.re

package info (click to toggle)
re2c 4.4-1
  • links: PTS, VCS
  • area: main
  • in suites: forky, sid
  • size: 51,512 kB
  • sloc: cpp: 34,160; ml: 8,494; sh: 5,311; makefile: 1,014; haskell: 611; python: 431; ansic: 234; javascript: 113
file content (43 lines) | stat: -rw-r--r-- 1,260 bytes parent folder | download
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
// re2java $INPUT -o $OUTPUT --input-encoding utf8

// This example supports multiple input encodings: UTF-8 and UTF-32.
// Both lexers are generated from the same rules block, and the use
// blocks add only encoding-specific configurations.

/*!rules:re2c
    re2c:yyfill:enable = 0;
    re2c:YYPEEK = "yyinput[yycursor]";
    re2c:indent:top = 1;

    "∀x ∃y" { return true; }
    *       { return false; }
*/

class Main {
    static boolean lex_utf8(int[] yyinput) {
        int yycursor = 0;
        int yymarker = 0;
        /*!use:re2c
            re2c:YYCTYPE = "int"; // Java lacks unsigned 8-bit integer type
            re2c:encoding:utf8 = 1;
        */
    }

    static boolean lex_utf32(int[] yyinput) {
        int yycursor = 0;
        int yymarker = 0;
        /*!use:re2c
            re2c:YYCTYPE = "int";
            re2c:encoding:utf32 = 1;
        */
    }

    public static void main(String []args) {
        // we have to use `int`, because `byte`in Java cannot represent values greater than 127
        int[] s_utf8 = new int[]{0xe2, 0x88, 0x80, 0x78, 0x20, 0xe2, 0x88, 0x83, 0x79};
        assert lex_utf8(s_utf8);

        int[] s_utf32 = new int[]{0x2200, 0x78, 0x20, 0x2203, 0x79};
        assert lex_utf32(s_utf32);
    }
};