• Home
  • Line#
  • Scopes#
  • Navigate#
  • Raw
  • Download
1# © 2016 and later: Unicode, Inc. and others.
2# License & terms of use: http://www.unicode.org/copyright.html
3# Generated using tools/cldr/cldr-to-icu/build-icu-data.xml
4#
5# File: InterIndic_Arabic.txt
6# Generated from CLDR
7#
8
# Character sets used as rule context.
# $nonword is the complement of the private-use range \uE000-\uE0FF that the
# rules below key on. It is used as after-context ("} $nonword"): the text
# after "}" must match but is not consumed or replaced.
# NOTE(review): a negated set may not match the end-of-text boundary in ICU;
# if so, the "} $nonword" rules do not fire on the very last character of the
# input. Confirm against the ICU rule documentation.
9$nonword = [^\uE000-\uE0FF];
# $wordBoundary is any character that is not a letter, mark, or number.
10$wordBoundary = [^[:L:][:M:][:N:]];
# Multi-character special cases. Rules are tried in order and the first match
# wins, so these must stay ahead of the single-character rules further down,
# which would otherwise transliterate each code point separately.
11\uE015\uE03F\uE02F\uE03E } $nonword→كيا; # किया
12\uE026\uE03F\uE02F\uE03E } $nonword→ديا; # दिया
13\uE015\uE03F } $nonword→كي; # कि at word end
14\uE039\uE048→هي; # ह\u0948
# Nasal signs. The contextual and plain rule of each pair produce the same
# replacement (noon), so the output does not depend on position.
15\uE001 } $nonword→ن; # chandrabindu at end to noon
16\uE001→ن; # chandrabindu not at end to noon
17\uE002 } $nonword→ن; # anusvara to noon at end
18\uE002→ن; # anusvara to noon \u0902
# Unquoted whitespace in a rule is not part of the output: the target below is
# the two letters ha + alif with no space between them.
19\uE003→ه ا; # visarga to ha + alif  ः
# Independent vowels.
# Syntax reminder: in "before {key} → target" only the text inside the braces
# is replaced; the part before "{" is context that must match but is left
# untouched. "key } after" likewise leaves the after-context untouched.
# Rule order matters: a contextual rule must come before the unconditional
# fallback for the same code point, because the first matching rule wins.
20\uE004→ا; # short a to alif ऄ
21\uE005→ا; # अ
22\uE006→ا \u0653; # alif with mad आ
23[[:L:][:M:]] {\uE007}→ي; # इ after another letter or mark
24\uE007→إ; # इ at beginning of word
25[[:L:][:M:]] {\uE008}→ي; # ई after another letter or mark
26\uE008→إ; # ई at beginning of word
27\uE009→و; # उ
28\uE00A→و; # ऊ
29\uE00B→ر; # ऋ
30\uE00C→ل; # ऌ
31\uE00D→ا ي; # ऍ
32\uE00E→ي; # ऎ
# \uE00F: the word-initial form needs a preceding $wordBoundary character
# (defined earlier in this file as anything that is not a letter, mark or
# number). The "at end" and "not at end" rules that follow yield the same
# replacement, so the contextual one is redundant as written.
33$wordBoundary {\uE00F} → إي; # word-initial ए
34\uE00F  } $nonword→ي; # ए use ي when at end
35\uE00F→ي; # ए use ي when not at end
# \uE010: as above, both rules yield the same replacement.
36\uE010  } $nonword→ا ي; # ऐ use ي when at end
37\uE010→ا ي; # ऐ use ي when not at end
# The four o/au vowels all collapse to alif + waw.
38\uE011→ا و; # ऑ
39\uE012→ا و; # ऒ
40\uE013→ا و; # ओ
41\uE014→ا و; # औ
# Consonants: one unconditional rule per InterIndic code point.
# The mapping is lossy. Several distinct source letters share one Arabic
# target (for example \uE017 and \uE01C both become ج, and \uE01E, \uE023,
# \uE028 and \uE029 all become ن), so the result cannot be mapped back
# unambiguously.
# The letters shown as aspirates in the trailing comments (ख, घ, छ, ...) are
# written as the plain letter followed by ه.
42\uE015→ك; # क
43\uE016→كه; # ख
44\uE017→ج; # ग
45\uE018→جه; # घ
46\uE019→نج; # ङ
47\uE01A→تش; # च
48\uE01B→تشه; # छ
49\uE01C→ج; # ज
50\uE01D→جه; # झ
51\uE01E→ن; # ञ
52\uE01F→ط; # ट
53\uE020→طه; # ठ
54\uE021→د; # ड
55\uE022→ده; # ढ
56\uE023→ن; # ण
57\uE024→ت; # त
58\uE025→ته; # थ
59\uE026→د; # द
60\uE027→ده; # ध
61\uE028→ن; # न
62\uE029→ن; # ऩ
63\uE02A→ب; # प
64\uE02B→به; # फ
65\uE02C→ب; # ब
66\uE02D→به; # भ
67\uE02E→م; # म
68\uE02F→ي; # य
69\uE030→ر; # र
70\uE031→ر; # ऱ
71\uE032→ل; # ल
72\uE033→ر; # ळ
73\uE034→ر; # ऴ
74\uE035→و; # व
75\uE036→ش; # श
76\uE037→ش; # ष
77\uE038→س; # स
78\uE039→ه; # ह
# Combining signs and dependent vowel signs.
# A rule with an empty target ("→;") deletes the matched character.
79\uE03C→; # \u093C
80\uE03D→; # ऽ
81\uE03E→ا; # ा
82\uE03F→ي; # ि
83\uE040→ي; # ी
84\uE041→و; # \u0941
85\uE042→و; # \u0942
86\uE043→ر; # \u0943
87\uE044→ر; # \u0944
# NOTE(review): \u0945 is a vowel sign (candra E), yet it maps to noon like the
# nasal signs rather than to a vowel letter. Confirm this is intended upstream.
88\uE045→ن; # \u0945
89\uE046→ي; # \u0946
# For \uE047 and \uE048 the "at end" rule and the fallback produce the same
# replacement, so the contextual rule is redundant as written.
90\uE047 } $nonword→ي; # \u0947 use ي when at end
91\uE047→ي; # \u0947 use ي when not at end
92\uE048 } $nonword→ا ي; # \u0948 use ي when at end
93\uE048→ا ي; # \u0948 use ي when not at end
94\uE049→و; # ॉ
95\uE04A→ا و; # ॊ
96\uE04B→و; # ो
97\uE04C→ا و; # ौ
# \u094D is deleted, so a consonant cluster is written as adjacent letters.
98\uE04D→; # \u094D
99\uE050→ا و; # ॐ
# \u0951-\u0954 are deleted without replacement.
100\uE051→; # \u0951
101\uE052→; # \u0952
102\uE053→; # \u0953
103\uE054→; # \u0954
# Precomposed nukta consonants (\uE058-\uE05F) followed by the additional
# vocalic letters and signs (\uE060-\uE063). Each rule is unconditional.
# Unlike the plain consonants, most of the nukta forms have a dedicated
# Arabic letter (ق, خ, غ, ز, ف).
104\uE058→ق; # क़
105\uE059→خ; # ख़
106\uE05A→غ; # ग़
107\uE05B→ز; # ज़
108\uE05C→ر; # ड़
109\uE05D→ره; # ढ़
110\uE05E→ف; # फ़
111\uE05F→ي; # य़
112\uE060→ر; # ॠ
113\uE061→ل; # ॡ
114\uE062→ل; # \u0962
115\uE063→ل; # \u0963
# Punctuation and digits.
# Both the single and the double danda become the Arabic full stop ۔.
116\uE064→۔; # ।
117\uE065→۔; # ॥
# NOTE(review): digit zero maps to an escaped ASCII full stop, while digits
# 1-9 below map to the Arabic-Indic digits ١-٩. Confirm against the CLDR
# source whether the Arabic-Indic zero (U+0660) was intended here.
118\uE066→\.; # ०
119\uE067→١; # १
120\uE068→٢; # २
121\uE069→٣; # ३
122\uE06A→٤; # ४
123\uE06B→٥; # ५
124\uE06C→٦; # ६
125\uE06D→٧; # ७
126\uE06E→٨; # ८
127\uE06F→٩; # ९
# The abbreviation sign becomes an ASCII full stop; "\." escapes the dot so it
# is taken as a literal character.
128\uE070→\.; # ॰
# Empty target: the character is deleted.
129\uE082→; # ॽ
130# Remove sequences of alif characters.
131# For example, transform पाओला → بااولا → باولا.
# "::null;" ends the rule set above and starts a new pass, so the rule below
# runs over the Arabic text produced by the preceding rules rather than over
# the InterIndic input.
132::null;
# One alif unit: any of the four alif letters, followed by zero or more
# combining marks.
133$alif = [أإآا] [:M:]*;
# Keep the first alif unit (captured as $1) and drop every unit that
# immediately follows it.
134($alif) $alif+ → $1;
135
136