xref: /aosp_15_r20/external/cldr/common/transforms/Hebrew-Latin.xml (revision 912701f9769bb47905792267661f0baf2b85bed5)
1<?xml version="1.0" encoding="UTF-8" ?>
2<!DOCTYPE supplementalData SYSTEM "../../common/dtd/ldmlSupplemental.dtd">
3<!--
4Copyright © 1991-2013 Unicode, Inc.
5CLDR data files are interpreted according to the LDML specification (http://unicode.org/reports/tr35/)
6For terms of use, see http://www.unicode.org/copyright.html
7-->
8<supplementalData>
9	<version number="$Revision$"/>
10	<transforms>
11		<transform source="Hebr" target="Latn" direction="both" alias="Hebrew-Latin und-Latn-t-und-hebr" backwardAlias="Latin-Hebrew und-Hebr-t-und-latn">
12			<tRule><![CDATA[
13# Transliteration table for Hebrew
14# Based on the UNGEGN table at:
15#   http://www.eki.ee/wgrs/rom1_he.pdf
16#
17# Exceptions:
18# - Accents are added to disambiguate letters
19# - Combinations of a letter with a dagesh or a shin/sin dot that produce
20#   a different sound are not yet handled; each mark is mapped on its own.
21#
22# To test, open the ICU transform demo:
23#   https://icu4c-demos.unicode.org/icu-bin/translit
24# Click Edit, paste in this file, and Save As hebrew-latin/XXX
25# (where XXX is a username).
26# Then go back to the main window and try it out:
27# use hebrew-latin/XXX for Output 1 and (Inverse) for Output 2,
28# paste Hebrew text into Input, and hit Transliterate.
29#
30# For more information, see the ICU User Guide chapter on transforms:
31#   https://unicode-org.github.io/icu/userguide/transforms/
32:: [[־׳״][:Hebrew:] [:^ccc=0:] [ְ-ֹֻ-ּׁ-ׂℵ-ℸֿ̄] - [ֽ]] ;
33:: nfkd (nfc) ;
34
35׳ ↔ '′';
36״ ↔ '″';
37־ ↔ '-';
38
39$letterAfter = [:M:]* [:L:] ;
40# Rules whose Latin side is a letter plus a diacritic come first, so that the plain-letter rules further down do not mask them.
41ח ↔ ẖ ;
42צ ↔ ẕ } $letterAfter;
43ץ ↔ ẕ ;
44ש ↔ ş ;
45ת ↔ ţ ;
46א ↔ ʼ ;
47ב ↔ b ;
48ג ↔ g ;
49ד ↔ d ;
50ה ↔ h ;
51ו ↔ w ;
52ז ↔ z ;
53ט ↔ t ;
54י ↔ y ;
55כ ↔ k } $letterAfter;
56ך ↔ k ;
57ל ↔ l ;
58מ ↔ m } $letterAfter;
59ם ↔ m ;
60נ ↔ n  } $letterAfter;
61ן ↔ n ;
62ס ↔ s ;
63ע ↔ ʻ ;
64פ ↔ p } $letterAfter;
65ף ↔ p ;
66ק ↔ q ;
67ר ↔ r ;
68װ → |  וו; # HEBREW LIGATURE YIDDISH DOUBLE VAV
69ױ → | וי; # HEBREW LIGATURE YIDDISH VAV YOD
70ײ → | יי ; # HEBREW LIGATURE YIDDISH DOUBLE YOD
71ּ ↔ ̇ ; # dagesh just goes to overdot for now
72ׁ ↔ ̌ ; # shin dot -→ sh
73ׂ ↔ ̂ ; # sin dot -→ s
74# points
75$above = [^[:ccc=0:][:ccc=230:]]*;
76‎ֲ‎ → à ;
77‎ֲ‎ $1← a ($above)  ̀;
78‎ָ‎ → á ;
79‎ָ‎  $1 ← a ($above)  ́;
80‎ֱ‎ → è ;
81‎ֱ‎  $1 ← e ($above)  ̀;
82‎ֵ‎ → é ;
83‎ֵ‎  $1 ← e ($above)   ́;
84‎ְ‎ → e ̆ ;
85‎ְ‎  $1 ← e ($above)   ̆;
86‎ֹ‎ → ò ;
87‎ֹ‎  $1 ← o ($above)   ̀;
88ִ ↔ i ;
89ֻ ↔ u ;
90ַ ↔ a ;
91ֶ ↔ e ;
92ֳ ↔ o ;
93ֿ ↔   ̄ ;
94# Fallbacks: Latin letters without a rule above; applied only in the Latin-to-Hebrew direction.
95ק ← c ;
96פ ← f } $letterAfter;
97ף ← f ;
98ז ← j ;
99ו ← v ;
100כס ← x ;
101:: (lower);
102:: nfc (nfd) ;
103:: ([[-′″][:Latin:] [:^ccc=0:] [ʻ-ʼ̀-̧̱̂̇̌̀-́    ̄ ]]);
104			]]></tRule>
105		</transform>
106	</transforms>
107</supplementalData>
108