File: gencharset.pl

package info (click to toggle)

0ad 0.0.26-3

links: PTS, VCS
area: main
in suites: bookworm
size: 130,460 kB
sloc: cpp: 261,824; ansic: 198,392; javascript: 19,067; python: 14,557; sh: 7,629; perl: 4,072; xml: 849; makefile: 741; java: 533; ruby: 229; php: 190; pascal: 30; sql: 21; tcl: 4

file content (34 lines) | stat: -rw-r--r-- 866 bytes

parent folder | download | duplicates (8)

use strict;
use warnings;

use Unicode::UCD;
use Data::Dumper;

# The lines printed below contain the literal characters themselves, so
# STDOUT needs a UTF-8 output layer.
binmode STDOUT, ':utf8';

# Names of the Unicode blocks to list, in output order.
# (these are probably more than we really need)
my @block_names = (
    'Basic Latin',
    'Latin-1 Supplement',
    'Latin Extended-A',
    'Latin Extended-B',
    'Latin Extended Additional',
    'Spacing Modifier Letters',
    'General Punctuation',
    'Combining Diacritical Marks',
    'Mathematical Operators',
);

# For every block: print a "# <block name>" header, then one line per listed
# code point in the form "XXXX: <char>  <NAME>", then a blank separator line.
for my $block_name (@block_names) {
    print "# $block_name\n";

    # charblock() turns a block name into a reference to a list of ranges,
    # each range being an array whose first two elements are the first and
    # last code point. Complain on STDERR if the name is not recognised so
    # that a typo in the list above does not go unnoticed; STDOUT output for
    # valid names is unaffected.
    my $ranges = Unicode::UCD::charblock($block_name);
    warn "Unknown Unicode block '$block_name'\n" unless $ranges;

    for my $range (@{ $ranges || [] }) {
        for my $code_point ($range->[0] .. $range->[1]) {
            # Leave out U+0000..U+001F and U+007F..U+009F (control characters).
            next if $code_point < 0x20
                or ($code_point >= 0x7f and $code_point < 0xa0);

            # Look the code point up only once and reuse the result; code
            # points for which charinfo() returns nothing are skipped.
            my $info = Unicode::UCD::charinfo($code_point) or next;

            printf "%04X: %s  %s\n",
                $code_point, chr($code_point), $info->{name};
        }
    }
    print "\n";
}

# Print two individual code points (U+FE33 and U+FFFD) in the same
# "XXXX: <char>  <NAME>" line format used for the block listing.
for my $code_point (0xFE33, 0xFFFD) {
    # Look the code point up only once and reuse the result; nothing is
    # printed when charinfo() returns no data for it.
    my $info = Unicode::UCD::charinfo($code_point) or next;

    printf "%04X: %s  %s\n", $code_point, chr($code_point), $info->{name};
}