File: Hebrew-Latin-BGN.xml

package info (click to toggle)
unicode-cldr-core 32.0.1-1
  • links: PTS
  • area: main
  • in suites: buster
  • size: 161,808 kB
  • sloc: xml: 1,825,337; sh: 10; makefile: 2
file content (140 lines) | stat: -rw-r--r-- 4,448 bytes parent folder | download | duplicates (2)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
<?xml version="1.0" encoding="UTF-8" ?>
<!DOCTYPE supplementalData SYSTEM "../../common/dtd/ldmlSupplemental.dtd">
<!--
Copyright © 1991-2013 Unicode, Inc.
CLDR data files are interpreted according to the LDML specification (http://unicode.org/reports/tr35/)
For terms of use, see http://www.unicode.org/copyright.html
-->
<supplementalData>
	<version number="$Revision: 13796 $"/>
	<transforms>
		<transform source="he" target="he_Latn" variant="BGN" direction="forward" draft="contributed" alias="Hebrew-Latin/BGN he-Latn-t-he-m0-bgn">
			<tRule><![CDATA[
#
########################################################################
# BGN/PCGN 1962 System
#
# The BGN/PCGN system for Hebrew was designed for use in romanizing
# names written in the Hebrew alphabet. The Roman letters and letter
# combinations shown as equivalents to the Hebrew characters reflect
# the modern pronunciation of Hebrew, i.e., the language spoken in
# the State of Israel.
#
# The Hebrew Alphabet as defined by the BGN (Page 33-35):
#
# אבגדהוזחטיכךלמםנןסעפףצץקרששת
#
# Originally prepared by Michael Everson <everson@evertype.com>
########################################################################
#
# MINIMAL FILTER: Hebrew-Latin
#

# Global filter: the transform only touches characters in this set
# (Hebrew points, dagesh, shin/sin dots, the consonants including their
# final forms, and geresh).
:: [ ְֱֲֳִֵֶַָֹֻּׁׂאבגדהוזחטיךכלםמןנסעףפץצקרשת׳] ;
# Normalize to NFD before the forward rules run, so that letter + point
# sequences are seen in decomposed form; NFC is the setting given for the
# reverse direction.
:: NFD (NFC) ;
#
#
########################################################################


#
########################################################################
#
# Define All Transformation Variables
#
########################################################################
#

# Output characters for ALEF and AYIN, used by the `א → $alef` and
# `ע → $ayin` rules. The two marks look alike; the code points are
# spelled out so they are not swapped by accident.
$alef = ’; # U+2019 RIGHT SINGLE QUOTATION MARK
$ayin = ‘; # U+2018 LEFT SINGLE QUOTATION MARK
#
#
# Use this $wordBoundary until bug 2034 is fixed in ICU:
# http://bugs.icu-project.org/cgi-bin/icu-bugs/transliterate?id=2034;expression=boundary;user=guest
#

# Matches any character that is not a letter (L), mark (M) or number (N).
# NOTE(review): no rule in this file references $wordBoundary; it appears
# to be kept only as the documented workaround mentioned above.
$wordBoundary = [^[:L:][:M:][:N:]] ;
#
#
########################################################################


#
########################################################################
#
# Rules moved to front to avoid masking
#
########################################################################
#

# Multi-character sequences (letter + dagesh, geresh, sheva or holam).
# They are listed ahead of the single-letter rules because rules are tried
# in order: if the bare-letter rule came first it would consume the letter
# and the combined form would never match.
# All outputs are lowercase; PE + DAGESH previously produced an uppercase
# "P", which was inconsistent with every other rule in this file.
בּ → b ; # HEBREW LETTER BET + DAGESH
פּ → p ; # HEBREW LETTER PE + DAGESH
גּ → g ; # HEBREW LETTER GIMEL + DAGESH
ג׳ → ǧ ; # HEBREW LETTER GIMEL + GERESH
וּ → u ; # HEBREW LETTER VAV + POINT DAGESH
וֹ → o ; # HEBREW LETTER VAV + POINT HOLAM
צ׳ → č ; # HEBREW LETTER TSADI + GERESH
ז׳ → ž ; # HEBREW LETTER ZAYIN + GERESH
דּ → d ; # HEBREW LETTER DALET + DAGESH
הּ → h ; # HEBREW LETTER HE + DAGESH
ךּ → k ; # HEBREW LETTER FINAL KAF + DAGESH
כּ → k ; # HEBREW LETTER KAF + DAGESH
ךְ → kh ; # HEBREW LETTER FINAL KAF + SHEVA
תּ → t ; # HEBREW LETTER TAV + DAGESH
#
#
########################################################################


#
########################################################################
#
# Start of Alphabetic Transformations
#
########################################################################
#

# Single-consonant rules. These apply to letters that were not already
# consumed by the letter + dagesh/geresh rules listed earlier in the file.
# Final forms share a rule with their regular form via a [set].
א → $alef ; # HEBREW LETTER ALEF
ב → v ; # HEBREW LETTER BET
ג → g ; # HEBREW LETTER GIMEL
ד → d ; # HEBREW LETTER DALET
ה → h ; # HEBREW LETTER HE
ח → ẖ ; # HEBREW LETTER HET
ו → w ; # HEBREW LETTER VAV
ז → z ; # HEBREW LETTER ZAYIN
[טת] → t ; # HEBREW LETTER TET and TAV
י → y ; # HEBREW LETTER YOD
[כך] → kh ; # HEBREW LETTER KAF and FINAL KAF
ל → l ; # HEBREW LETTER LAMED
[מם] → m ; # HEBREW LETTER MEM and FINAL MEM
[נן] → n ; # HEBREW LETTER NUN and FINAL NUN
ס → s ; # HEBREW LETTER SAMEKH
ע → $ayin ; # HEBREW LETTER AYIN
[פף] → f ; # HEBREW LETTER PE and FINAL PE
[צץ] → ẕ ; # HEBREW LETTER TSADI and FINAL TSADI
ק → q ; # HEBREW LETTER QOF
ר → r ; # HEBREW LETTER RESH
# NOTE(review): only the dotted forms of SHIN have rules; a bare ש with
# neither dot is not matched by any rule here — confirm this is intended.
שׁ → sh ; # HEBREW LETTER SHIN + POINT SHIN DOT
שׂ → s ; # HEBREW LETTER SHIN + POINT SIN DOT

# Vowel point rules, grouped by romanized vowel (a, e, i, o, u).
# QAMATS is romanized "a"; it previously produced "o", which made it
# indistinguishable from HOLAM / HATAF QAMATS.
# The point + YOD rules must stay ahead of the bare-point rules so the
# two-character sequence is matched before the point alone.
ַ → a ; # HEBREW POINT PATAH
ֲ → a ; # HEBREW POINT HATAF PATAH
ָ → a ; # HEBREW POINT QAMATS
ֶ → e ; # HEBREW POINT SEGOL
ֱ → e ; # HEBREW POINT HATAF SEGOL
ֵי → e ; # HEBREW POINT TSERE + LETTER YOD
ֵ → e ; # HEBREW POINT TSERE
ְ → e ; # HEBREW POINT SHEVA
ִי → i ; # HEBREW POINT HIRIQ + LETTER YOD
ִ → i ; # HEBREW POINT HIRIQ
ֳ → o ; # HEBREW POINT HATAF QAMATS
ֹ → o ; # HEBREW POINT HOLAM
ֻ → u ; # HEBREW POINT QUBUTS
#
#
########################################################################

			]]></tRule>
		</transform>
	</transforms>
</supplementalData>