File: glyphdump.py

package info (click to toggle)
mupdf 1.27.0%2Bds1-3
  • links: PTS, VCS
  • area: main
  • in suites: sid
  • size: 29,260 kB
  • sloc: ansic: 335,322; python: 20,906; java: 7,520; javascript: 2,213; makefile: 1,152; xml: 675; cpp: 639; sh: 513; cs: 307; awk: 10; sed: 7; lisp: 3
file content (111 lines) | stat: -rwxr-xr-x 2,592 bytes parent folder | download | duplicates (4)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
#!/usr/bin/env python3

import sys

agl = []
aglseen = {}
single_from_name = []
multi_from_name = []
name_from_single = {}
code_from_multi = {}

print("/* This file was generated by scripts/glyphdump.py. Do not edit. */")
print()

def readlist(filename):
	f = open(filename, "r")
	for line in f.readlines():
		if line[0] == '#':
			continue
		line = line[:-1]
		name, alts = line.split(';')
		for list in alts.split(','):
			list = [int(x, 16) for x in list.split(' ')]
			okay = True
			for ucs in list:
				if ucs > 0xffff:
					okay = False
				#if ucs >= 0xe000 and ucs <= 0xf8ff:
				#	okay = False
			if okay and name not in aglseen:
				agl.append((name, list))
				aglseen[name] = True

readlist("scripts/glyphlist.txt")
readlist("scripts/texglyphlist.txt")

for name, ucslist in agl:
	num = len(ucslist)
	if num == 1:
		ucs = ucslist[0]
		single_from_name.append((name, ucs))
		if ucs not in name_from_single:
			name_from_single[ucs] = []
		name_from_single[ucs].append(name)
	else:
		multi_from_name.append((name, ucslist))

def dumplist(list):
	for item in list:
		sys.stdout.write(item)

single_from_name.sort()
singlenames = []
singlecodes = []
for name, ucs in single_from_name:
	singlenames.append("\"%s\",\n" % name)
	singlecodes.append("0x%04x,\n" % ucs)

multi_from_name.sort()
multinames = []
multioffsets = []
multicodes = []
for name, ucslist in multi_from_name:
	multinames.append("\"%s\",\n" % name)
	multioffsets.append("%d,\n" % len(multicodes))
	multicodes.append("%d," % len(ucslist))
	for ucs in ucslist:
		multicodes.append(" 0x%04x," % ucs)
	multicodes.append("\n");

keys = list(name_from_single.keys())
keys.sort()
dupoffsets = []
dupnames = []
for ucs in keys:
	list = name_from_single[ucs]
	if len(list) > 1:
		ofs = len(dupnames)
		dupoffsets.append("0x%04x, %d,\n" % (ucs, ofs))
		for name in list:
			dupnames.append("\"%s\", " % name)
		dupnames.append("0,\n")

print("static const char *single_name_list[] = {")
dumplist(singlenames)
print("};")
print()
print("static const unsigned short single_code_list[] = {")
dumplist(singlecodes)
print("};")
print()
if False:
	print("static const char *multi_name_list[] = {")
	dumplist(multinames)
	print("};")
	print()
	print("static const unsigned short multi_offset_list[] = {")
	dumplist(multioffsets)
	print("};")
	print()
	print("static const unsigned short multi_code_list[] = {")
	dumplist(multicodes)
	print("};")
	print()
print("static const unsigned short agl_dup_offsets[] = {")
dumplist(dupoffsets)
print("};")
print()
print("static const char *agl_dup_names[] = {")
dumplist(dupnames)
print("};")