File: gen-blocks.py

package info (click to toggle)
gnome-characters 43.1-1%2Bdeb12u1
  • links: PTS, VCS
  • area: main
  • in suites: bookworm
  • size: 5,640 kB
  • sloc: ansic: 49,655; javascript: 1,164; python: 555; ruby: 62; xml: 59; sh: 25; makefile: 4
file content (54 lines) | stat: -rwxr-xr-x 1,374 bytes parent folder | download | duplicates (2)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
#!/usr/bin/python3

# Input: https://www.unicode.org/Public/UNIDATA/Blocks.txt

import io
import re

class Builder(object):
    def __init__(self):
        pass

    def read(self, infile):
        names = []
        for line in infile:
            if line.startswith('#'):
                continue
            line = line.strip()
            if len(line) == 0:
                continue
            range, name = line.split(';', 2)
            start, end = range.split('..')
            name = name.lstrip()

            names.append((start, end, name))

        return names

    def write(self, data):
        print('''\
struct Block
{
  gunichar start;
  gunichar end;
  const char *name;
};''')
        print('static const struct Block all_blocks[] =\n  {')
        s = ''
        offset = 0
        for start, end, name in data:
            print('    {{ 0x{0}, 0x{1}, "{2}" }},'.format(start, end, name))
        print('  };')

if __name__ == '__main__':
    import argparse

    parser = argparse.ArgumentParser(description='build')
    parser.add_argument('infile', type=argparse.FileType('r'),
                        help='input file')
    args = parser.parse_args()

    builder = Builder()
    # FIXME: argparse.FileType(encoding=...) is available since Python 3.4
    data = builder.read(io.open(args.infile.name, encoding='utf_8_sig'))
    builder.write(data)