• Home
  • Line#
  • Scopes#
  • Navigate#
  • Raw
  • Download
1# © 2016 and later: Unicode, Inc. and others.
2# License & terms of use: http://www.unicode.org/copyright.html#License
3#
4# File: fa_fa_Latn_BGN.txt
5# Generated from CLDR
6#
7
8#
9########################################################################
10# BGN/PCGN 1958 System
11#
12# This system was adopted by the BGN in 1946 and by the PCGN in 1958.
13# It is used for the romanization of geographic names in Iran and
14# for Persian-language names in Afghanistan.
15#
16# Originally prepared by Michael Everson <everson@evertype.com>
17########################################################################
18#
19# MINIMAL FILTER: Persian-Latin
20#
21:: [[:arabic:][:block=ARABIC:][ءآابةتثجحخدذرزسشصضطظعغفقكلمنهویي\u064E\u064F\u0650\u0651\u0652٠١٢٣٤٥٦٧٨٩پچژگی]] ; # global filter: only characters in this set are handed to the rules below
22:: NFKD (NFC) ; # normalize the input to NFKD; the parenthesized NFC applies in the reverse direction
23#
24#
25########################################################################
26#
27########################################################################
28#
29# Define All Transformation Variables
30#
31########################################################################
32#
33$alef = ’; # mark emitted for HAMZA, and before ā for ALEF WITH MADDA ABOVE
34$ayin = ‘; # mark emitted for AIN (doubled for AIN + SHADDA)
35$disambig =  \u0331 ; # combining mark appended in two-way rules so that a Latin output shared by two source characters stays distinguishable
36#
37#
38# Use this $wordBoundary until bug 2034 is fixed in ICU:
39# http://bugs.icu-project.org/cgi-bin/icu-bugs/transliterate?id=2034;expression=boundary;user=guest
40#
41$wordBoundary =  [^[:L:][:M:][:N:]] ; # any character that is not a letter, mark, or number
42#
43#
44########################################################################
45# non-letters
46[:Nd:]{٫}[:Nd:] ↔ [:Nd:]{','}[:Nd:] ; # ARABIC DECIMAL SEPARATOR between two decimal digits
47[:Nd:]{٬}[:Nd:] ↔ [:Nd:]{'.'}[:Nd:] ; # ARABIC THOUSANDS SEPARATOR between two decimal digits
48٫ ↔ ',' $disambig ; # ARABIC DECIMAL SEPARATOR elsewhere; $disambig keeps it distinct from ARABIC COMMA
49٬ ↔ '.' $disambig ; # ARABIC THOUSANDS SEPARATOR elsewhere; marked with $disambig
50#  ٭ ↔ ; # ARABIC FIVE POINTED STAR // no need to transliterate
51، ↔ ',' ; # ARABIC COMMA
52؛ ↔ ';' ; # ARABIC SEMICOLON
53؟ ↔ '?' ; # ARABIC QUESTION MARK
54٪ ↔ '%' ; # ARABIC PERCENT SIGN
55٠ ↔ 0 $disambig ; # ARABIC-INDIC DIGIT ZERO ($disambig keeps these digits distinct from the EXTENDED ARABIC-INDIC digits)
56١ ↔ 1 $disambig ; # ARABIC-INDIC DIGIT ONE
57٢ ↔ 2 $disambig ; # ARABIC-INDIC DIGIT TWO
58٣ ↔ 3 $disambig ; # ARABIC-INDIC DIGIT THREE
59٤ ↔ 4 $disambig ; # ARABIC-INDIC DIGIT FOUR
60٥ ↔ 5 $disambig ; # ARABIC-INDIC DIGIT FIVE
61٦ ↔ 6 $disambig ; # ARABIC-INDIC DIGIT SIX
62٧ ↔ 7 $disambig ; # ARABIC-INDIC DIGIT SEVEN
63٨ ↔ 8 $disambig ; # ARABIC-INDIC DIGIT EIGHT
64٩ ↔ 9 $disambig ; # ARABIC-INDIC DIGIT NINE
65۰ ↔ 0 ; # EXTENDED ARABIC-INDIC DIGIT ZERO (plain Latin digits map back to this series)
66۱ ↔ 1 ; # EXTENDED ARABIC-INDIC DIGIT ONE
67۲ ↔ 2 ; # EXTENDED ARABIC-INDIC DIGIT TWO
68۳ ↔ 3 ; # EXTENDED ARABIC-INDIC DIGIT THREE
69۴ ↔ 4 ; # EXTENDED ARABIC-INDIC DIGIT FOUR
70۵ ↔ 5 ; # EXTENDED ARABIC-INDIC DIGIT FIVE
71۶ ↔ 6 ; # EXTENDED ARABIC-INDIC DIGIT SIX
72۷ ↔ 7 ; # EXTENDED ARABIC-INDIC DIGIT SEVEN
73۸ ↔ 8 ; # EXTENDED ARABIC-INDIC DIGIT EIGHT
74۹ ↔ 9 ; # EXTENDED ARABIC-INDIC DIGIT NINE
75#
76########################################################################
77#
78# Rules moved to front to avoid masking
79#
80########################################################################
81#
82########################################################################
83#
84# BGN Page 89 Rule 4
85#
86# The character sequences كه , زه , سه , and گه may be romanized k·h, z·h,
87# s·h, and g·h in order to differentiate those romanizations from the
88# digraphs kh, zh, sh, and gh.
89#
90########################################################################
91#
92كه → k·h ; # ARABIC LETTER KAF + HEH; NOTE(review): only KAF is matched here, KEHEH + HEH has no rule in this group — confirm this is intended
93زه → z·h ; # ARABIC LETTER ZAIN + HEH; the middle dot keeps the output distinct from the digraph zh
94سه → s·h ; # ARABIC LETTER SEEN + HEH; the middle dot keeps the output distinct from the digraph sh
95گه → g·h ; # ARABIC LETTER GAF + HEH; the middle dot keeps the output distinct from the digraph gh
96#
97#
98########################################################################
99#
100# End Rule 4
101#
102########################################################################
103#
104########################################################################
105#
106# BGN Page 91 Rule 7
107#
108# Doubled consonant sounds are represented in Arabic script by
109# placing a shaddah ( \u0651 ) over a consonant character. In romanization
110# the letter should be doubled. [The remainder of this rule deals with
111# the definite article and is lexical.]
112#
113########################################################################
114#
115ب\u0651 → bb ; # ARABIC LETTER BEH + SHADDA
116پ\u0651 → pp ; # ARABIC LETTER PEH + SHADDA
117ت\u0651 → tt ; # ARABIC LETTER TEH + SHADDA
118ث\u0651 → s\u0304s\u0304 ; # ARABIC LETTER THEH + SHADDA
119ج\u0651 → jj ; # ARABIC LETTER JEEM + SHADDA
120چ\u0651 → chch ; # ARABIC LETTER TCHEH + SHADDA (the whole digraph is doubled)
121ح\u0651 → ḥḥ ; # ARABIC LETTER HAH + SHADDA
122خ\u0651 → khkh ; # ARABIC LETTER KHAH + SHADDA (the whole digraph is doubled)
123د\u0651 → dd ; # ARABIC LETTER DAL + SHADDA
124ذ\u0651 → z\u0304z\u0304 ; # ARABIC LETTER THAL + SHADDA
125ر\u0651 → rr ; # ARABIC LETTER REH + SHADDA
126ز\u0651 → zz ; # ARABIC LETTER ZAIN + SHADDA
127ژ\u0651 → zhzh ; # ARABIC LETTER JEH + SHADDA (the whole digraph is doubled)
128س\u0651 → ss ; # ARABIC LETTER SEEN + SHADDA
129ش\u0651 → shsh ; # ARABIC LETTER SHEEN + SHADDA (the whole digraph is doubled)
130ص\u0651 → ṣṣ ; # ARABIC LETTER SAD + SHADDA
131ض\u0651 → ẕẕ ; # ARABIC LETTER DAD + SHADDA (doubles ẕ, the same letter the single-letter DAD rule emits)
132ط\u0651 → ṭṭ ; # ARABIC LETTER TAH + SHADDA
133ظ\u0651 → ẓẓ ; # ARABIC LETTER ZAH + SHADDA
134ع\u0651 → $ayin $ayin ; # ARABIC LETTER AIN + SHADDA
135غ\u0651 → ghgh ; # ARABIC LETTER GHAIN + SHADDA (the whole digraph is doubled)
136ف\u0651 → ff ; # ARABIC LETTER FEH + SHADDA
137ق\u0651 → qq ; # ARABIC LETTER QAF + SHADDA
138ك\u0651 → kk ; # ARABIC LETTER KAF + SHADDA
139ل\u0651 → ll ; # ARABIC LETTER LAM + SHADDA
140م\u0651 → mm ; # ARABIC LETTER MEEM + SHADDA
141ن\u0651 → nn ; # ARABIC LETTER NOON + SHADDA
142ه\u0651 → hh ; # ARABIC LETTER HEH + SHADDA
143و\u0651 → ww ; # ARABIC LETTER WAW + SHADDA
144ی\u0651 → yy ; # ARABIC LETTER FARSI YEH + SHADDA
145#
146#
147########################################################################
148#
149# End Rule 7
150#
151########################################################################
152#
153########################################################################
154#
155# Start of Transformations
156#
157########################################################################
158#
159$wordBoundary{ء →  ; # ARABIC LETTER HAMZA: dropped when the preceding character is in $wordBoundary
160ء → $alef ; # ARABIC LETTER HAMZA in any other position
161$wordBoundary{ا →  ; # ARABIC LETTER ALEF: dropped when the preceding character is in $wordBoundary
162آ → $alef ā ; # ARABIC LETTER ALEF WITH MADDA ABOVE
163ب → b ; # ARABIC LETTER BEH
164پ → p ; # ARABIC LETTER PEH
165ت → t ; # ARABIC LETTER TEH
166ة → h ; # ARABIC LETTER TEH MARBUTA
167ث → s\u0304 ; # ARABIC LETTER THEH
168ج → j ; # ARABIC LETTER JEEM
169چ → ch ; # ARABIC LETTER TCHEH
170ح → ḥ ; # ARABIC LETTER HAH
171خ → kh ; # ARABIC LETTER KHAH
172د → d ; # ARABIC LETTER DAL
173ذ → z\u0304 ; # ARABIC LETTER THAL
174ر → r ; # ARABIC LETTER REH
175ز → z ; # ARABIC LETTER ZAIN
176ژ → zh ; # ARABIC LETTER JEH
177س → s ; # ARABIC LETTER SEEN
178ش → sh ; # ARABIC LETTER SHEEN
179ص → ṣ ; # ARABIC LETTER SAD
180ض → ẕ ; # ARABIC LETTER DAD
181ط → ṭ ; # ARABIC LETTER TAH
182ظ → ẓ ; # ARABIC LETTER ZAH
183ع → $ayin ; # ARABIC LETTER AIN
184غ → gh ; # ARABIC LETTER GHAIN
185ف → f ; # ARABIC LETTER FEH
186ق → q ; # ARABIC LETTER QAF
187ک ↔ k ; # ARABIC LETTER KEHEH (two-way rule: plain k maps back to KEHEH)
188ك ↔ k $disambig ; # ARABIC LETTER KAF (two-way rule: k followed by $disambig maps back to KAF)
189گ → g ; # ARABIC LETTER GAF
190ل → l ; # ARABIC LETTER LAM
191م → m ; # ARABIC LETTER MEEM
192ن → n ; # ARABIC LETTER NOON
193ه → h ; # ARABIC LETTER HEH
194و → v ; # ARABIC LETTER WAW
195ی → y ; # ARABIC LETTER FARSI YEH
196\u064Eا → ā ; # ARABIC FATHA + ALEF
197\u064Eی → á ; # ARABIC FATHA + FARSI YEH
198\u064Eو\u0652 → ow ; # ARABIC FATHA + WAW + SUKUN
199\u064E → a ; # ARABIC FATHA (listed after the longer FATHA sequences above)
200\u0650ي → ī ; # ARABIC KASRA + YEH
201\u0650 → e ; # ARABIC KASRA (listed after the longer KASRA sequence above)
202\u064Fو → ū ; # ARABIC DAMMA + WAW
203\u064F → o ; # ARABIC DAMMA (listed after the longer DAMMA sequence above)
204\u0652 →  ; # ARABIC SUKUN: produces no output
205::NFC (NFD) ; # compose the result to NFC; the parenthesized NFD applies in the reverse direction
206#
207#
208########################################################################
209
210