• Home
  • Line#
  • Scopes#
  • Navigate#
  • Raw
  • Download
1<?xml version="1.0" encoding="UTF-8" ?>
2<!DOCTYPE supplementalData SYSTEM "../../common/dtd/ldmlSupplemental.dtd">
3<!--
4Copyright © 1991-2013 Unicode, Inc.
5CLDR data files are interpreted according to the LDML specification (http://unicode.org/reports/tr35/)
6For terms of use, see http://www.unicode.org/copyright.html
7-->
8<supplementalData>
9	<version number="$Revision$"/>
10	<transforms>
11		<transform source="Latin" target="InterIndic" direction="forward" visibility="internal">
12			<tRule>
13# Latin-InterIndic
14#:: NFD;
15#\uE000 reserved
16#signs and independent vowels first; consonants begin at $ka
17$chandrabindu=\uE001;
18$anusvara=\uE002;
19$visarga=\uE003;
20#\uE004 reserved
21# w←vowel→ represents the stand-alone form
22$wa=\uE005;
23$waa=\uE006;
24$wi=\uE007;
25$wii=\uE008;
26$wu=\uE009;
27$wuu=\uE00A;
28$wr=\uE00B;
29$wl=\uE00C;
30$wce=\uE00D; # LETTER CANDRA E
31$wse=\uE00E; # LETTER SHORT E
32$we=\uE00F;  # ए LETTER E
33$wai=\uE010;
34$wco=\uE011; # LETTER CANDRA O
35$wso=\uE012; # LETTER SHORT O
36$wo=\uE013;  # ओ LETTER O
37$wau=\uE014;
38$ka=\uE015;
39$kha=\uE016;
40$ga=\uE017;
41$gha=\uE018;
42$nga=\uE019;
43$ca=\uE01A;
44$cha=\uE01B;
45$ja=\uE01C;
46$jha=\uE01D;
47$nya=\uE01E;
48$tta=\uE01F;
49$ttha=\uE020;
50$dda=\uE021;
51$ddha=\uE022;
52$nna=\uE023;
53$ta=\uE024;
54$tha=\uE025;
55$da=\uE026;
56$dha=\uE027;
57$na=\uE028;
58$ena=\uE029; #compatibility
59$pa=\uE02A;
60$pha=\uE02B;
61$ba=\uE02C;
62$bha=\uE02D;
63$ma=\uE02E;
64$ya=\uE02F;
65$ra=\uE030;
66$rra=\uE031;
67$la=\uE032;
68$lla=\uE033;
69$ela=\uE034; #compatibility
70$va=\uE035;
71$vva=\uE081;
72$sha=\uE036;
73$ssa=\uE037;
74$sa=\uE038;
75$ha=\uE039;
76#\uE03A Reserved (Devanagari \u093A)
77#\uE03B Reserved (Devanagari \u093B)
78$nukta=\uE03C;
79$avagraha=\uE03D; # SIGN AVAGRAHA
80# ←vowel→ represents the dependent form
81$aa=\uE03E;
82$i=\uE03F;
83$ii=\uE040;
84$u=\uE041;
85$uu=\uE042;
86$rh=\uE043;
87$rrh=\uE044;
88$ce=\uE045; #VOWEL SIGN CANDRA E
89$se=\uE046; #VOWEL SIGN SHORT E
90$e=\uE047;
91$ai=\uE048;
92$co=\uE049; # VOWEL SIGN CANDRA O
93$so=\uE04A; # VOWEL SIGN SHORT O
94$o=\uE04B;  # ो
95$au=\uE04C;
96$virama=\uE04D;
97# \uE04E Reserved (Devanagari \u094E)
98# \uE04F Reserved (Devanagari \u094F)
99$om = \uE050; # OM
100# ॑→;        # UNMAPPED STRESS SIGN UDATTA
101# ॒→;        # UNMAPPED STRESS SIGN ANUDATTA
102# ॓→;        # UNMAPPED GRAVE ACCENT
103# ॔→;        # UNMAPPED ACUTE ACCENT
104$lm = \uE055;#  Telugu Length Mark
105$ailm=\uE056;#  AI Length Mark
106$aulm=\uE057;#  AU Length Mark
107#urdu compatibility forms
108$uka=\uE058;
109$ukha=\uE059;
110$ugha=\uE05A;
111$ujha=\uE05B;
112$uddha=\uE05C;
113$udha=\uE05D;
114$ufa=\uE05E;
115$uya=\uE05F;
116$wrr=\uE060;
117$wll=\uE061;
118$lh=\uE062;
119$llh=\uE063;
120$danda=\uE064;
121$doubleDanda=\uE065;
122$zero=\uE066;     # DIGIT ZERO
123$one=\uE067;      # DIGIT ONE
124$two=\uE068;      # DIGIT TWO
125$three=\uE069;    # DIGIT THREE
126$four=\uE06A;     # DIGIT FOUR
127$five=\uE06B;     # DIGIT FIVE
128$six=\uE06C;      # DIGIT SIX
129$seven=\uE06D;    # DIGIT SEVEN
130$eight=\uE06E;    # DIGIT EIGHT
131$nine=\uE06F;     # DIGIT NINE
132$dgs=\uE082;
133# For all other scripts
134$ecp0=\uE070;
135$ecp1=\uE071;
136$ecp2=\uE072;
137$ecp3=\uE073;
138$ecp4=\uE074;
139$ecp5=\uE075;
140$ecp6=\uE076;
141$ecp7=\uE077;
142$ecp8=\uE078;
143$ecp9=\uE079;
144$ecpA=\uE07A;
145$ecpB=\uE07B;
146$ecpC=\uE07C;
147$ecpD=\uE07D;
148$ecpE=\uE07E;
149$ecpF=\uE07F;
150# Khanda-ta
151$kta=\uE083;
152# ॰→; # nothing in Latin maps to InterIndic ABBREVIATION SIGN
153$depVowelAbove=[\uE03E-\uE040\uE045-\uE04C]; # dependent vowel signs $aa-$ii and $ce-$au; context for the '~' → $anusvara rule
154$depVowelBelow=[\uE041-\uE044]; # dependent vowel signs $u, $uu, $rh, $rrh; context for the '~' → $chandrabindu rule
155$endThing=[$danda$doubleDanda]; # danda and double danda; a $virama directly before either one is deleted
156# $x was originally called '§'; $z was '%'
157$x=[$virama$aa$ai$au$ii$i$uu$u$rrh$rh$lh$e$o$se$ce$so$co]; # virama plus dependent vowel signs; NOTE(review): no rule visible in this file references $x
158$z=[bcdfghjklmnpqrstvwxyz]; # lowercase ASCII Latin consonant letters
159$consonants=[[$ka-$ha]$z[क-ह][ক-হ][ਕ-ਹ][ક-હ][କ-ହ][க-ஹ][క-హ][ಕ-ಹ][ക-ഹ]]; # InterIndic $ka-$ha, the Latin letters in $z, and the ka-ha ranges of nine Indic scripts
160̕ → $avagraha;
161̃→$chandrabindu$anusvara;
162m̐→$chandrabindu;
163ḥ→$visarga;
164x→$ka$virama$sa;
165# convert to independent forms at start of word or syllable:
166# dependent forms for roundtrip
167̔ā→$aa;
168̔ai→$ai;
169̔au→$au;
170̔ii→$ii;
171̔ī→$ii;
172̔i→$i;
173̔ū→$uu;
174̔u→$u;
175̔r̥̄→$rrh;
176̔r̥→$rh;
177̔l̥̄→$llh;
178̔lh→$lh;
179̔l̥→$lh;
180̔ē→$e;
181̔ō→$o;
182̔a→;
183̔ĕ→$ce;
184̔ŏ→$co;
185̔e→$se;
186̔o→$so;
187# preceded by consonants
188$consonants{ ā→$aa;
189$consonants{ ai→$ai;
190$consonants{ au→$au;
191$consonants{ ii→$ii;
192$consonants{ ī→$ii;
193$consonants{ i→$i;
194$consonants{ ū→$uu;
195$consonants{ u→$u;
196$consonants{ r̥̄→$rrh;
197$consonants{ r̥a→$rh;
198$consonants{ r̥→$rh;
199$consonants{ l̥̄→$llh;
200$consonants{ lh→$lh;
201$consonants{ l̥→$lh;
202$consonants{ ē→$e;
203$consonants{ ō→$o;
204$consonants{ ĕ→$ce;
205$consonants{ ŏ→$co;
206$consonants{ e→$se;
207$consonants{ o→$so;
208# e.g. keai -→ {ka}{e}{wai}; k'ai -→ {ka}{wai}; (ai) -→ ({wai})
209ā→$waa;
210ai→$wai;
211au→$wau;
212ī→$wii;
213i→$wi;
214ū→$wuu;
215u→$wu;
216r̥̄→$wrr;
217r̥→$wr;
218l̥̄→$wll;
219lh→$wl;
220l̥→$wl;
221ē→$we;
222ō→$wo;
223a→$wa;
224ĕ→$wce;
225ŏ→$wco;
226e→$wse;
227''om→$om;
228o→$wso;
229# rules for anusvara
230n}r̥           → $na|$virama;
231n}l̥           → $na|$virama;
232n}na                → $na|$virama;
233ṅ}[kg]        → $anusvara;
234ṅ}ṅ     → $anusvara;
235n̄}[cj]        → $anusvara;
236n̄}ñ     → $anusvara;
237ṇ}[tdn]̣ → $anusvara;
238n}[tdn]             → $anusvara;
239m}[pbm]             → $anusvara;
240n}[ylvshr]          → $anusvara;
241ṁ             → $anusvara;
242#urdu compatibility
243q→$uka|$virama;
244ḵẖ→$ukha |$virama;
245ġ→ $ugha | $virama;
246z → $ujha |$virama;
247f → $ufa|$virama;
248ṯ→$kta;
249# dev
250ẏ→$uya|$virama;
251ḻ→$ela|$virama;
252ṉ→$ena|$virama;
253ṅ→$nga|$virama;
254ñ→$nya|$virama;
255ṇ→$nna|$virama;
256ṭh→$ttha|$virama;
257ṭ→$tta|$virama;
258ṛh→$udha|$virama;
259ṛ→$uddha|$virama;
260ḍh→$ddha|$virama;
261ḍ→$dda|$virama;
262kh→$kha|$virama;
263k→$ka|$virama;
264gh→$gha|$virama;
265g→$ga|$virama;
266ch→$cha|$virama;
267c→$ca|$virama;
268jh→$jha|$virama;
269j→$ja|$virama;
270ny→$nya|$virama;
271tth→$ttha|$virama;
272ddh→$ddha|$virama;
273th→$tha|$virama;
274t→$ta|$virama;
275dh→$dha|$virama;
276d→$da|$virama;
277n→$na|$virama;
278ph→$pha|$virama;
279p→$pa|$virama;
280bh→$bha|$virama;
281b→$ba|$virama;
282m→$ma|$virama;
283y→$ya|$virama;
284ṟ→$rra|$virama;
285r→$ra|$virama;
286ḷ→$lla|$virama;
287l→$la|$virama;
288v→$va|$virama;
289ẇ→$vva|$virama;
290w→$va|$virama;
291sh→$sha|$virama;
292ss→$ssa|$virama;
293ṣ→$ssa|$virama;
294ś→$sha|$virama;
295s→$sa|$virama;
296h→$ha|$virama;
297'.'→$danda; # a period becomes a danda
298$danda'.'→$doubleDanda; # a danda followed by a period becomes a double danda; NOTE(review): the rule above leaves the cursor after the danda it emits, so confirm this rule can fire on '..' input
299$depVowelAbove{'~'→$anusvara; # '~' preceded by a vowel sign in $depVowelAbove becomes anusvara
300$depVowelBelow{'~'→$chandrabindu; # '~' preceded by a vowel sign in $depVowelBelow becomes chandrabindu
301# convert to dependent forms after consonant with no vowel:
302# e.g. kai -→ {ka}{virama}ai -→ {ka}{ai}
303#$virama aa→$aa;
304$virama ā→$aa;
305$virama ai→$ai;
306$virama au→$au;
307$virama ii→$ii;
308$virama ī→$ii;
309$virama i→$i;
310#$virama uu→$uu;
311$virama ū→$uu;
312$virama u→$u;
313#$virama rrh→$rrh;
314$virama r̥̄→$rrh;
315#$virama rh→$rh;
316$virama r̥a→$rh;
317$virama r̥→$rh;
318$virama l̥̄→$llh;
319$virama lh→$lh;
320$virama l̥→$lh;
321$virama ē→$e;
322$virama ō→$o;
323$virama a→;
324$virama ĕ→$ce;
325$virama ŏ→$co;
326$virama e→$se;
327$virama o→$so;
328# otherwise convert independent forms when separated by ': k'ai -→ {ka}{virama}{wai}
329#$virama''aa→$waa;
330$virama''ā→$waa;
331$virama''ai→$wai;
332$virama''au→$wau;
333#$virama''ii→$wii;
334$virama''ī→$wii;
335$virama''i→$wi;
336#$virama''uu→$wuu;
337$virama''ū→$wuu;
338$virama''u→$wu;
339#$virama''rrh→$wrr;
340$virama''r̥̄→$wrr;
341#$virama''rh→$wr;
342$virama''r̥→$wr;
343$virama''l̥̄→$wll;
344#$virama''lh→$wl;
345$virama''l̥→$wl;
346$virama''ē→$we;
347$virama''ō→$wo;
348$virama''a→$wa;
349$virama''ĕ→$wce;
350$virama''ŏ→$wco;
351$virama''e→$wse;
352$virama''o→$wso;
353# no virama
354''ā→$waa;
355''ai→$wai;
356''au→$wau;
357''ī→$wii;
358''i→$wi;
359''ū→$wuu;
360''u→$wu;
361''r̥̄→$wrr;
362''r̥→$wr;
363''l̥̄→$wll;
364''l̥→$wl;
365''ē→$we;
366''ō→$wo;
367''a→$wa;
368''ĕ→$wce;
369''ŏ→$wco;
370''e→$wse;
371''o→$wso;
372$virama } [$z] → $virama; # a virama followed by a Latin consonant letter ($z) is kept unchanged
373$virama } ' ' → $virama ; # a virama followed by a space is kept unchanged
374$virama}$endThing→; # a virama followed by a danda or double danda is deleted
375ʔ→$dgs; # Glottal Stop
3760→$zero; # ASCII digits 0-9 map one-to-one onto the InterIndic digit variables $zero-$nine
3771→$one;
3782→$two;
3793→$three;
3804→$four;
3815→$five;
3826→$six;
3837→$seven;
3848→$eight;
3859→$nine;
386''→; # '' is the escaped form of one apostrophe: delete any apostrophe not consumed by an earlier rule
387#:: NFC (NFD) ;
388			</tRule>
389		</transform>
390	</transforms>
391</supplementalData>
392