• Home
  • Line#
  • Scopes#
  • Navigate#
  • Raw
  • Download
1<?xml version="1.0" encoding="UTF-8" ?>
2<!DOCTYPE supplementalData SYSTEM "../../common/dtd/ldmlSupplemental.dtd">
3<!--
4Copyright © 1991-2013 Unicode, Inc.
5CLDR data files are interpreted according to the LDML specification (http://unicode.org/reports/tr35/)
6For terms of use, see http://www.unicode.org/copyright.html
7-->
8<supplementalData>
9	<version number="$Revision: 12263 $"/>
10	<transforms>
11		<transform source="Hebr" target="Latn" direction="both" alias="Hebrew-Latin und-Latn-t-und-hebr" backwardAlias="Latin-Hebrew und-Hebr-t-und-latn">
12			<tRule><![CDATA[
13# Transliteration table for Hebrew
14# Based on the UNGEGN table at:
15#   http://www.eki.ee/wgrs/rom1_he.pdf
16#
17# Exceptions:
18# - Accents are added to disambiguate letters
19# - Combinations of dagesh, shin/sin dot that produce different
20#   letters are not yet encoded.
21#
22# To test, open:
23#   http://www.ibm.com/software/globalization/icu/demo/transform
24# Click Edit, paste in this file, Save As hebrew-latin/XXX
25# (where XXX is a username)
26# Now go back to the main window, and try it out.
27# Use hebrew-latin/XXX for Output 1, and (Inverse) for Output 2
28# Paste in Hebrew text in Input, and hit Transliterate.
29#
30# For more information, see:
31#   http://icu.sourceforge.net/userguide/Transform.html
32:: [[:Hebrew:] [:^ccc=0:] [ְ-ֹֻ-ּׁ-ׂℵ-ℸֿ̄] - [ֽ]] ;
33:: nfkd (nfc) ;
34$letterAfter = [:M:]* [:L:] ;
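35# Rules whose Latin side is a longer sequence (letter + diacritic) are listed first so that the shorter single-letter rules below do not mask them.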
36ח ↔ ẖ ;
37צ ↔ ẕ } $letterAfter;
38ץ ↔ ẕ ;
39ש ↔ ş ;
40ת ↔ ţ ;
41א ↔ ʼ ;
42ב ↔ b ;
43ג ↔ g ;
44ד ↔ d ;
45ה ↔ h ;
46ו ↔ w ;
47ז ↔ z ;
48ט ↔ t ;
49י ↔ y ;
50כ ↔ k } $letterAfter;
51ך ↔ k ;
52ל ↔ l ;
53מ ↔ m } $letterAfter;
54ם ↔ m ;
55נ ↔ n  } $letterAfter;
56ן ↔ n ;
57ס ↔ s ;
58ע ↔ ʻ ;
59פ ↔ p } $letterAfter;
60ף ↔ p ;
61ק ↔ q ;
62ר ↔ r ;
63װ → |  וו; # HEBREW LIGATURE YIDDISH DOUBLE VAV
64ױ → | וי; # HEBREW LIGATURE YIDDISH VAV YOD
65ײ → | יי ; # HEBREW LIGATURE YIDDISH DOUBLE YOD
66ּ ↔ ̇ ; # dagesh just goes to overdot for now
67ׁ ↔ ̌ ; # shin dot -→ sh
68ׂ ↔ ̂ ; # sin dot -→ s
69# points
70$above = [^[:ccc=0:][:ccc=230:]]*;
71‎ֲ‎ → à ;
72‎ֲ‎ $1← a ($above)  ̀;
73‎ָ‎ → á ;
74‎ָ‎  $1 ← a ($above)  ́;
75‎ֱ‎ → è ;
76‎ֱ‎  $1 ← e ($above)  ̀;
77‎ֵ‎ → é ;
78‎ֵ‎  $1 ← e ($above)   ́;
79‎ְ‎ → e ̆ ;
80‎ְ‎  $1 ← e ($above)   ̆;
81‎ֹ‎ → ò ;
82‎ֹ‎  $1 ← o ($above)   ̀;
83ִ ↔ i ;
84ֻ ↔ u ;
85ַ ↔ a ;
86ֶ ↔ e ;
87ֳ ↔ o ;
88ֿ ↔   ̄ ;
89# Fallbacks: Latin letters that the forward rules never produce, mapped in the Latin → Hebrew direction only.
90ק ← c ;
91פ ← f } $letterAfter;
92ף ← f ;
93ז ← j ;
94ו ← v ;
95כס ← x ;
96:: (lower);
97:: nfc (nfd) ;
98:: ([[:Latin:] [:^ccc=0:] [ʻ-ʼ̀-̧̱̂̇̌̀-́    ̄ ]]);
99			]]></tRule>
100		</transform>
101	</transforms>
102</supplementalData>
103