File: testdata

package info (click to toggle)
libmdn-perl 2.4-2
  • links: PTS
  • area: main
  • in suites: sarge
  • size: 240 kB
  • ctags: 73
  • sloc: perl: 780; makefile: 87; ansic: 60
file content (98 lines) | stat: -rw-r--r-- 3,854 bytes parent folder | download
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
#
# Test data for MDN::API and MDN::ResConf.
#
# Format:
#   <title>:<actions>:<in-encoding>:<in-name>:<exp-encoding>:<exp-name>
#
#   <title>
#       title of the test
#   <actions>
#       conversion actions.
#       same as $actions argument of MDN::ResConf::nameconv().
#   <in-encoding>
#       encoding of input domain name.
#   <in-name>
#       input domain name.
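#   <exp-encoding>
#       encoding of expected output, or `-' when the conversion is
#       expected to fail.
#   <exp-name>
#       expected output.  when <exp-encoding> is `-', this is the
#       expected error message (e.g. "invalid encoding").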
#

# U+78BA U+8A8D:  CJK Ideographs
# U+AC00: Hangul Syllable (EUC-JP doesn't have this character)
action l[1]: l: EUC-JP:ǧ         : UTF-8:U+78BA U+8A8D
action l[2]: l: UTF-8:U+008E        : -:invalid encoding
action L[1]: L: UTF-8:U+78BA U+8A8D : EUC-JP:ǧ
action L[2]: L: UTF-8:U+AC00        : US-ASCII:bq--vqaa

# U+5A18: CJK Ideograph
# U+3002: IDEOGRAPHIC FULL STOP (local delimiter)
action d: d: UTF-8:U+5A18 U+3002 j p : UTF-8:U+5A18 . j p

# U+304B: HIRAGANA LETTER KA
# U+309B: KATAKANA-HIRAGANA VOICED SOUND MARK
# U+3099: COMBINING KATAKANA-HIRAGANA VOICED SOUND MARK
# U+304C: HIRAGANA LETTER GA
action M[1]: M: UTF-8:U+304B U+309B . j p : UTF-8:U+304B U+3099 . j p
action M[2]: M: UTF-8:U+304B U+309B . t w : UTF-8:U+304B U+309B . t w

# U+FF21: FULLWIDTH LATIN CAPITAL LETTER A
# U+FF41: FULLWIDTH LATIN SMALL LETTER A
action m[1]: m: UTF-8:U+FF21 . c o m : UTF-8:U+FF41 . c o m
action m[2]: m: UTF-8:A . c o m      : UTF-8:A . c o m

# U+304B: HIRAGANA LETTER KA
# U+3099: COMBINING KATAKANA-HIRAGANA VOICED SOUND MARK
# U+304C: HIRAGANA LETTER GA
action n: n: UTF-8:U+304B U+3099 . j p : UTF-8:U+304C . j p

# U+3002: (prohibited character)
# U+3042: HIRAGANA LETTER A
action p[1]: p: UTF-8:U+3002 . c o m      : -:prohibited codepoint
action p[2]: p: UTF-8:U+3042 . c o m : UTF-8:U+3042 . c o m

# U+304B: HIRAGANA LETTER KA
# U+3099: COMBINING KATAKANA-HIRAGANA VOICED SOUND MARK
# U+FF21: FULLWIDTH LATIN CAPITAL LETTER A
# U+3002: (prohibited character)
# U+304C: HIRAGANA LETTER GA
action N[1]: N: UTF-8:U+304B U+3099 U+FF21 : UTF-8:U+304C a
action N[2]: N: UTF-8:A . c o m            : UTF-8:A . c o m
action N[3]: N: UTF-8:U+3002 . c o m       : -:prohibited codepoint
action N[4]: N: UTF-8:U+3042 . c o m       : UTF-8:U+3042 . c o m

# U+0220: unassigned codepoint
action u[1]: u: UTF-8:U+0220 . c o m : -:prohibited codepoint
action u[2]: u: UTF-8:U+3042 . c o m : UTF-8:U+3042 . c o m

# U+78BA U+8A8D: CJK Ideographs
action I[1]: I: UTF-8:U+78BA U+8A8D   : US-ASCII:bq--3b4lvcun
action I[2]: I: UTF-8:A . c o m       : US-ASCII:A.com
action i[1]: i: US-ASCII:bq--3b4lvcun : UTF-8:U+78BA U+8A8D
action i[2]: i: US-ASCII:bq--abaue    : -:invalid encoding
action i[3]: i: US-ASCII:A.com        : UTF-8:A . c o m

# U+3002: (prohibited character)
# U+3042: HIRAGANA LETTER A
# U+304B: HIRAGANA LETTER KA
# U+0220: unassigned codepoint
action !N[1]: !N: UTF-8:A U+3042      : US-ASCII:bq--gd7ucqq
action !N[2]: !N: UTF-8:U+3042        : UTF-8:U+3042
action !m[1]: !m: UTF-8:A U+3042      : US-ASCII:bq--gd7ucqq
action !m[2]: !m: UTF-8:U+3042        : UTF-8:U+3042
action !n[1]: !n: UTF-8:U+304B U+3099 : US-ASCII:bq--gbfzs
action !n[2]: !n: UTF-8:U+3042        : UTF-8:U+3042
action !p[1]: !p: UTF-8:U+3002        : US-ASCII:bq--gaba
action !p[2]: !p: UTF-8:U+3042        : UTF-8:U+3042
action !u[1]: !u: UTF-8:U+0220        : US-ASCII:bq--aiqa
action !u[2]: !u: UTF-8:U+3042        : UTF-8:U+3042

# U+304B: HIRAGANA LETTER KA
# U+3099: COMBINING KATAKANA-HIRAGANA VOICED SOUND MARK
# U+309B: KATAKANA-HIRAGANA VOICED SOUND MARK
# U+FF21: FULLWIDTH LATIN CAPITAL LETTER A
# U+3002: IDEOGRAPHIC FULL STOP (local delimiter)
action local-to-idn[1]: ldMNI: EUC-JP:jp : US-ASCII:bq--gbgp6yi.jp
action idn-to-local[1]: i!NL:  US-ASCII:bq--gbgp6yi.jp : EUC-JP:a.jp
action local-to-idn[2]: ldMNI: US-ASCII:bq--gbpx4va : US-ASCII:bq--gbpx4va
action idn-to-local[2]: i!NL:  US-ASCII:bq--gbpx4va : EUC-JP:ޤ