1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98
|
#
# Test data for MDN::API and MDN::ResConf.
#
# Format:
# <title>:<actions>:<in-encoding>:<in-name>:<exp-encoding>:<exp-name>
#
# <title>
# title of the test
# <actions>
# conversion actions.
# same as $actions argument of MDN::ResConf::nameconv().
# <in-encoding>
# encoding of input domain name.
# <in-name>
# input domain name.
# <exp-encoding>
# encoding of expected output.
# <exp-name>
# expected output.
#
# U+78BA U+8A8D: CJK Ideographs
# U+AC00: Hangul Syllable (EUC-JP doesn't have this character)
action l[1]: l: EUC-JP:ǧ : UTF-8:U+78BA U+8A8D
action l[2]: l: UTF-8:U+008E : -:invalid encoding
action L[1]: L: UTF-8:U+78BA U+8A8D : EUC-JP:ǧ
action L[2]: L: UTF-8:U+AC00 : US-ASCII:bq--vqaa
# U+5A18: CJK Ideographs
# U+3002: IDEOGRAPHIC FULL STOP (local delimiter)
action d: d: UTF-8:U+5A18 U+3002 j p : UTF-8:U+5A18 . j p
# U+304B: HIRAGANA LETTER KA
# U+309B: HIRAGANA-KATAKANA VOICED SOUND MARK
# U+304C: HIRAGANA LETTER GA
action M[1]: M: UTF-8:U+304B U+309B . j p : UTF-8:U+304B U+3099 . j p
action M[2]: M: UTF-8:U+304B U+309B . t w : UTF-8:U+304B U+309B . t w
# U+FF21: FULLWIDTH LATIN CAPITAL LETTER A
# U+FF41: FULLWIDTH LATIN SMALL LETTER A
action m[1]: m: UTF-8:U+FF21 . c o m : UTF-8:U+FF41 . c o m
action m[2]: m: UTF-8:A . c o m : UTF-8:A . c o m
# U+304B: HIRAGANA LETTER KA
# U+3099: COMBINING HIRAGANA-KATAKANA VOICED SOUND MARK
# U+304C: HIRAGANA LETTER GA
action n: n: UTF-8:U+304B U+3099 . j p : UTF-8:U+304C . j p
# U+3002: IDEOGRAPHIC FULL STOP (prohibited character)
# U+3042: HIRAGANA LETTER A
action p[1]: p: UTF-8:U+3002 . c o m : -:prohibited codepoint
action p[2]: p: UTF-8:U+3042 . c o m : UTF-8:U+3042 . c o m
# U+304B: HIRAGANA LETTER KA
# U+3099: COMBINING HIRAGANA-KATAKANA VOICED SOUND MARK
# U+FF21: FULLWIDTH LATIN CAPITAL LETTER A
# U+3002: (prohibited character)
# U+304C: HIRAGANA LETTER GA
action N[1]: N: UTF-8:U+304B U+3099 U+FF21 : UTF-8:U+304C a
action N[2]: N: UTF-8:A . c o m : UTF-8:A . c o m
action N[3]: N: UTF-8:U+3002 . c o m : -:prohibited codepoint
action N[4]: N: UTF-8:U+3042 . c o m : UTF-8:U+3042 . c o m
# U+0220: unassigned codepoint
action u[1]: u: UTF-8:U+0220 . c o m : -:prohibited codepoint
action u[2]: u: UTF-8:U+3042 . c o m : UTF-8:U+3042 . c o m
# U+78BA U+8A8D: CJK Ideographs
action I[1]: I: UTF-8:U+78BA U+8A8D : US-ASCII:bq--3b4lvcun
action I[2]: I: UTF-8:A . c o m : US-ASCII:A.com
action i[1]: i: US-ASCII:bq--3b4lvcun : UTF-8:U+78BA U+8A8D
action i[2]: i: US-ASCII:bq--abaue : -:invalid encoding
action i[3]: i: US-ASCII:A.com : UTF-8:A . c o m
# U+3002: (prohibited character)
# U+3042: HIRAGANA LETTER A
# U+304B: HIRAGANA LETTER KA
# U+0220: unassigned codepoint
action !N[1]: !N: UTF-8:A U+3042 : US-ASCII:bq--gd7ucqq
action !N[2]: !N: UTF-8:U+3042 : UTF-8:U+3042
action !m[1]: !m: UTF-8:A U+3042 : US-ASCII:bq--gd7ucqq
action !m[2]: !m: UTF-8:U+3042 : UTF-8:U+3042
action !n[1]: !n: UTF-8:U+304B U+3099 : US-ASCII:bq--gbfzs
action !n[2]: !n: UTF-8:U+3042 : UTF-8:U+3042
action !p[1]: !p: UTF-8:U+3002 : US-ASCII:bq--gaba
action !p[2]: !p: UTF-8:U+3042 : UTF-8:U+3042
action !u[1]: !u: UTF-8:U+0220 : US-ASCII:bq--aiqa
action !u[2]: !u: UTF-8:U+3042 : UTF-8:U+3042
# U+304B: HIRAGANA LETTER KA
# U+3099: COMBINING HIRAGANA-KATAKANA VOICED SOUND MARK
# U+309B: HIRAGANA-KATAKANA VOICED SOUND MARK
# U+FF21: FULLWIDTH LATIN CAPITAL LETTER A
# U+3002: IDEOGRAPHIC FULL STOP (local delimiter)
action local-to-idn[1]: ldMNI: EUC-JP:jp : US-ASCII:bq--gbgp6yi.jp
action idn-to-local[1]: i!NL: US-ASCII:bq--gbgp6yi.jp : EUC-JP:a.jp
action local-to-idn[2]: ldMNI: US-ASCII:bq--gbpx4va : US-ASCII:bq--gbpx4va
action idn-to-local[2]: i!NL: US-ASCII:bq--gbpx4va : EUC-JP:ޤ
|