File: gencharset.pl

package info (click to toggle)
0ad 0.0.23.1-2
  • links: PTS, VCS
  • area: main
  • in suites: buster
  • size: 78,292 kB
  • sloc: cpp: 245,166; ansic: 200,249; python: 13,754; sh: 6,104; perl: 4,620; makefile: 977; xml: 810; java: 533; ruby: 229; erlang: 46; pascal: 30; sql: 21; tcl: 4
file content (34 lines) | stat: -rw-r--r-- 866 bytes parent folder | download | duplicates (10)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
use strict;
use warnings;

use Unicode::UCD;
use Data::Dumper;

# Generates a human-readable listing of the characters in a fixed set of
# Unicode blocks, one line per assigned code point:
#
#     XXXX: <character>  <UNICODE NAME>
#
# Each block is introduced by a "# <block name>" header line and followed by
# a blank line. A couple of extra individual code points are listed at the end.

# The listing contains the literal characters, so STDOUT must encode them as
# UTF-8.
binmode STDOUT, ':utf8';

# Unicode blocks to list, in output order.
# (these are probably more than we really need)
my @block_names = (
    'Basic Latin',
    'Latin-1 Supplement',
    'Latin Extended-A',
    'Latin Extended-B',
    'Latin Extended Additional',
    'Spacing Modifier Letters',
    'General Punctuation',
    'Combining Diacritical Marks',
    'Mathematical Operators',
);

# Individual code points listed after the blocks, outside any of them.
my @extra_code_points = (0xFE33, 0xFFFD);

# format_char_line($code_point)
#
# Returns the listing line "XXXX: <char>  <NAME>\n" for $code_point, or
# nothing (undef in scalar context) when Unicode::UCD::charinfo() has no
# entry for it, so that code point is simply left out of the listing.
sub format_char_line {
    my ($code_point) = @_;

    # Look the code point up once and reuse the result for both the
    # "is it known?" check and the name.
    my $info = Unicode::UCD::charinfo($code_point);
    return unless $info;

    return sprintf "%04X: %s  %s\n", $code_point, chr($code_point), $info->{name};
}

for my $block_name (@block_names) {
    print "# $block_name\n";

    # charblock() returns undef for a block name it does not know; fall back
    # to an empty range list so the run continues instead of dying on the
    # dereference under 'use strict'.
    my $ranges = Unicode::UCD::charblock($block_name) || [];

    for my $range (@{$ranges}) {
        # Each range starts with [first code point, last code point, ...].
        my ($first, $last) = @{$range}[0, 1];

        for my $c ($first .. $last) {
            # Skip the C0 controls, DEL and the C1 controls: they have no
            # printable form.
            next if $c < 0x20 or ($c >= 0x7f and $c < 0xa0);

            my $line = format_char_line($c);
            print $line if defined $line;
        }
    }
    print "\n";
}

for my $c (@extra_code_points) {
    my $line = format_char_line($c);
    print $line if defined $line;
}