• Home
  • Line#
  • Scopes#
  • Navigate#
  • Raw
  • Download
1# © 2016 and later: Unicode, Inc. and others.
2# License & terms of use: http://www.unicode.org/copyright.html
3# Generated using tools/cldr/cldr-to-icu/build-icu-data.xml
4#
5# File: Hebr_Latn.txt
6# Generated from CLDR
7#
8
9# Transliteration table for Hebrew
10# Based on the UNGEGN table at:
11#   http://www.eki.ee/wgrs/rom1_he.pdf
12#
13# Exceptions:
14# - Accents are added to disambiguate letters
15# - Combinations of dagesh, shin/sin dot that produce different
16#   letters are not yet encoded.
17#
18# To test, open:
19#   http://www.ibm.com/software/globalization/icu/demo/transform
20# Click Edit, paste in this file, Save As hebrew-latin/XXX
21# (where XXX is a username)
22# Now go back to the main window, and try it out.
23# Use hebrew-latin/XXX for Output 1, and (Inverse) for Output 2
24# Paste Hebrew text into Input, and hit Transliterate.
25#
26# For more information, see:
27#   http://icu.sourceforge.net/userguide/Transform.html
# Forward (Hebrew → Latin) global filter: only characters in this set are
# touched. The set is the union of Hebrew-script characters, characters with a
# non-zero canonical combining class, and the explicitly listed points
# (U+05B0-05B9, U+05BB-05BC, U+05C1-05C2, U+05BF), letterlike symbols ℵ-ℸ and
# U+0304 COMBINING MACRON, minus U+05BD (HEBREW POINT METEG).
28:: [[:Hebrew:] [:^ccc=0:] [\u05B0-\u05B9\u05BB-\u05BC\u05C1-\u05C2ℵ-ℸ\u0304\u05BF] - [\u05BD]] ;
# Normalization step: NFKD when running forward; the parenthesized NFC is the
# step used when the rule set is run in reverse.
29:: nfkd (nfc) ;
# Reusable context pattern: zero or more marks followed by a letter, i.e.
# "another letter follows". The rules that reference it use it to tell
# non-final letter forms from final forms.
30$letterAfter = [:M:]* [:L:] ;
# Consonant rules.
# "↔" rules apply in both directions; "→" rules apply Hebrew → Latin only.
# Rules are tried in order, so the Latin sequences that carry a combining mark
# (h/z + U+0331 MACRON BELOW, s/t + U+0327 CEDILLA) are listed before the rules
# for bare h, z, s and t, which would otherwise match first in reverse.
# "} $letterAfter" on the Latin side is an after-context, so it only constrains
# the Latin → Hebrew direction: the Latin text becomes the non-final letter when
# more letters follow, and the next rule (no context) yields the final form.
31# move longer items here to avoid masking
32ח ↔ h\u0331 ;
33צ ↔ z\u0331 } $letterAfter;
34ץ ↔ z\u0331 ;
35ש ↔ s\u0327 ;
36ת ↔ t\u0327 ;
37א ↔ ʼ ;
38ב ↔ b ;
39ג ↔ g ;
40ד ↔ d ;
41ה ↔ h ;
42ו ↔ w ;
43ז ↔ z ;
44ט ↔ t ;
45י ↔ y ;
46כ ↔ k } $letterAfter;
47ך ↔ k ;
48ל ↔ l ;
49מ ↔ m } $letterAfter;
50ם ↔ m ;
51נ ↔ n  } $letterAfter;
52ן ↔ n ;
53ס ↔ s ;
54ע ↔ ʻ ;
55פ ↔ p } $letterAfter;
56ף ↔ p ;
57ק ↔ q ;
58ר ↔ r ;
# Yiddish ligatures (forward only): expand to the two component letters and
# place the cursor ("|") before them so the letter rules above process the
# expansion.
59װ → |  וו; # HEBREW LIGATURE YIDDISH DOUBLE VAV
60ױ → | וי; # HEBREW LIGATURE YIDDISH VAV YOD
61ײ → | יי ; # HEBREW LIGATURE YIDDISH DOUBLE YOD
# Consonant-modifying points map one-to-one onto Latin combining marks:
# U+05BC DAGESH ↔ U+0307 DOT ABOVE, U+05C1 SHIN DOT ↔ U+030C CARON,
# U+05C2 SIN DOT ↔ U+0302 CIRCUMFLEX ACCENT.
62\u05BC ↔ \u0307 ; # dagesh just goes to overdot for now
63\u05C1 ↔ \u030C ; # shin dot -→ sh
64\u05C2 ↔ \u0302 ; # sin dot -→ s
# Vowel points.
# The accented vowels are written as a pair of one-directional rules:
#   forward:  point → accented Latin vowel
#   reverse:  base vowel, optional intervening marks, accent → point + marks
# The reverse patterns are spelled in decomposed form (base letter + combining
# accent) because the reverse pass starts with NFD (see ":: nfc (nfd)" below).
65# points
# $above matches a run of characters whose combining class is neither 0 nor
# 230. In the reverse rules it is captured as $1 and re-emitted after the
# Hebrew point, so marks sitting between the vowel letter and its accent are
# kept. NOTE(review): despite the name, it excludes ccc=230 ("above") marks.
66$above = [^[:ccc=0:][:ccc=230:]]*;
# U+05B2 HATAF PATAH ↔ a + grave
67‎\u05B2‎ → à ;
68‎\u05B2‎ $1← a ($above)  \u0300;
# U+05B8 QAMATS ↔ a + acute
69‎\u05B8‎ → á ;
70‎\u05B8‎  $1 ← a ($above)  \u0301;
# U+05B1 HATAF SEGOL ↔ e + grave
71‎\u05B1‎ → è ;
72‎\u05B1‎  $1 ← e ($above)  \u0300;
# U+05B5 TSERE ↔ e + acute
73‎\u05B5‎ → é ;
74‎\u05B5‎  $1 ← e ($above)   \u0301;
# U+05B0 SHEVA ↔ e + breve
75‎\u05B0‎ → e \u0306 ;
76‎\u05B0‎  $1 ← e ($above)   \u0306;
# U+05B9 HOLAM ↔ o + grave
77‎\u05B9‎ → ò ;
78‎\u05B9‎  $1 ← o ($above)   \u0300;
# Plain bidirectional mappings: HIRIQ ↔ i, QUBUTS ↔ u, PATAH ↔ a, SEGOL ↔ e,
# HATAF QAMATS ↔ o, and U+05BF RAFE ↔ U+0304 COMBINING MACRON. They come after
# the accented-vowel rules so that in reverse a bare vowel only matches here
# when no accent rule above applied.
79\u05B4 ↔ i ;
80\u05BB ↔ u ;
81\u05B7 ↔ a ;
82\u05B6 ↔ e ;
83\u05B3 ↔ o ;
84\u05BF ↔   \u0304 ;
# Reverse-only ("←") fallbacks for Latin letters that no forward rule produces
# (c, f, j, v, x), so Latin → Hebrew still yields Hebrew letters for them.
# f follows the same pattern as p above: non-final פ when a letter follows,
# final ף otherwise.
85# fallbacks
86ק ← c ;
87פ ← f } $letterAfter;
88ף ← f ;
89ז ← j ;
90ו ← v ;
91כס ← x ;
# Reverse-only step (nothing outside the parentheses): lowercase the Latin
# input. All Latin-side rule text above is written in lowercase.
92:: (lower);
# Forward: recompose the output to NFC. Reverse: decompose the Latin input to
# NFD so that accented vowels match the base + combining-accent patterns.
93:: nfc (nfd) ;
# Reverse (Latin → Hebrew) global filter: Latin-script characters, characters
# with a non-zero combining class, the modifier letters ʻ-ʼ, and the listed
# combining marks.
94:: ([[:Latin:] [:^ccc=0:] [ʻ-ʼ\u0300-\u0302\u0307\u030C\u0327\u0331\u0340-\u0341    \u0304 ]]);
95
96