1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62
|
# Unicode data generation rules. Except for the test data files, most
# users will not use these Makefile rules, which are primarily to re-generate
# unicode_data.c when we get a new Unicode version or charwidth data; they
# require julia to be installed.
# programs
CURL=curl
PERL=perl
MAKE=make
JULIA=julia
CURLFLAGS = --retry 5 --location
.PHONY: clean
.DELETE_ON_ERROR:
RAWDATA = UnicodeData.txt GraphemeBreakProperty.txt DerivedCoreProperties.txt CompositionExclusions.txt CaseFolding.txt EastAsianWidth.txt emoji-data.txt
utf8proc_data.c.new: data_generator.jl $(RAWDATA)
$(JULIA) --project=. -e 'using Pkg; Pkg.instantiate()'
$(JULIA) --project=. data_generator.jl > $@
# Unicode data version (must also update utf8proc_unicode_version function)
UNICODE_VERSION=17.0.0
UnicodeData.txt:
cp /usr/share/unicode/UnicodeData.txt $@
EastAsianWidth.txt:
cp /usr/share/unicode/extracted/DerivedEastAsianWidth.txt $@
GraphemeBreakProperty.txt:
cp /usr/share/unicode/auxiliary/GraphemeBreakProperty.txt $@
DerivedCoreProperties.txt:
cp /usr/share/unicode/DerivedCoreProperties.txt $@
CompositionExclusions.txt:
cp /usr/share/unicode/CompositionExclusions.txt $@
CaseFolding.txt:
cp /usr/share/unicode/CaseFolding.txt $@
NormalizationTest.txt:
bzip2 -d < /usr/share/unicode/NormalizationTest.txt.bz2 > $@
GraphemeBreakTest.txt:
cp /usr/share/unicode/auxiliary/GraphemeBreakTest.txt $@
emoji-data.txt:
cp /usr/share/unicode/emoji/emoji-data.txt $@
Uppercase.txt: DerivedCoreProperties.txt
grep -zoP '(?s)# Derived Property: Uppercase.*?# Total code points:' DerivedCoreProperties.txt > $@
Lowercase.txt: DerivedCoreProperties.txt
grep -zoP '(?s)# Derived Property: Lowercase.*?# Total code points:' DerivedCoreProperties.txt > $@
clean:
rm -f $(RAWDATA) NormalizationTest.txt GraphemeBreakTest.txt
rm -f Uppercase.txt Lowercase.txt
rm -f utf8proc_data.c.new
|