File: gencharset.pl

package info (click to toggle)
0ad 0.0.17-1
  • links: PTS, VCS
  • area: main
  • in suites: jessie, jessie-kfreebsd
  • size: 51,248 kB
  • ctags: 46,933
  • sloc: cpp: 223,208; ansic: 31,240; python: 16,343; perl: 4,083; sh: 1,011; makefile: 915; xml: 733; java: 621; ruby: 229; erlang: 53; sql: 40
file content (34 lines) | stat: -rw-r--r-- 866 bytes parent folder | download | duplicates (8)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
use strict;
use warnings;

use Unicode::UCD;
use Data::Dumper;

# Emit characters as UTF-8; the listing contains non-ASCII code points.
binmode STDOUT, ':utf8';

# Unicode blocks whose characters are listed, in output order.
# (these are probably more than we really need)
my @block_names = (
    'Basic Latin',
    'Latin-1 Supplement',
    'Latin Extended-A',
    'Latin Extended-B',
    'Latin Extended Additional',
    'Spacing Modifier Letters',
    'General Punctuation',
    'Combining Diacritical Marks',
    'Mathematical Operators',
);

# Individual code points listed after the blocks, outside any block section.
my @extra_code_points = (0xFE33, 0xFFFD);

for my $block_name (@block_names) {
    # charblock() returns undef for a name it does not recognise; fail with
    # a clear message before printing anything for this block, rather than
    # dying on an undefined array dereference.
    my $ranges = Unicode::UCD::charblock($block_name)
        or die "Unknown Unicode block name: '$block_name'\n";

    print "# $block_name\n";
    for my $range (@{$ranges}) {
        my ($first, $last) = @{$range}[0, 1];
        for my $code_point ($first .. $last) {
            # Skip the control ranges 0x00-0x1F and 0x7F-0x9F.
            next if $code_point < 0x20;
            next if $code_point >= 0x7f and $code_point < 0xa0;
            print_char_line($code_point);
        }
    }
    print "\n";
}

print_char_line($_) for @extra_code_points;

# Build the listing line "XXXX: <char>  <NAME>\n" for one code point.
#   $code_point - numeric Unicode code point.
# Returns the formatted line, or nothing (undef in scalar context) when
# charinfo() has no entry for the code point.
sub format_char_line {
    my ($code_point) = @_;

    # Look the code point up once and reuse the result for the name.
    my $info = Unicode::UCD::charinfo($code_point) or return;

    return sprintf "%04X: %s  %s\n",
        $code_point, chr($code_point), $info->{name};
}

# Print the listing line for one code point to STDOUT; code points that
# charinfo() has no entry for are silently skipped.
sub print_char_line {
    my ($code_point) = @_;

    my $line = format_char_line($code_point);
    print $line if defined $line;

    return;
}