• Home
  • Line#
  • Scopes#
  • Navigate#
  • Raw
  • Download
1<?xml version="1.0" encoding="UTF-8" ?>
2<!DOCTYPE supplementalData SYSTEM "../../common/dtd/ldmlSupplemental.dtd">
3<!--
4Copyright © 1991-2013 Unicode, Inc.
5CLDR data files are interpreted according to the LDML specification (http://unicode.org/reports/tr35/)
6For terms of use, see http://www.unicode.org/copyright.html
7-->
8<supplementalData>
9	<version number="$Revision: 13787 $"/>
10	<transforms>
11		<transform source="bg" target="bg_Latn" variant="BGN" direction="forward" draft="contributed" alias="Bulgarian-Latin/BGN bg-Latn-t-bg-m0-bgn">
12			<tRule><![CDATA[
13#
14########################################################################
15# BGN/PCGN 1952 System
16#
17# This system was adopted by the BGN in 1949 and by the PCGN in 1952.
18# It reflects the much simplified Bulgarian orthography as officially
19# revised in February 1945. The Bulgarian alphabet contains all of
20# the characters present in the Russian alphabet with the exception
21# of Ёё, Ыы, and Ээ. Two obsolete letters Ѫѫ and Ѣѣ are also given.
22#
23# The Bulgarian Alphabet as defined by the BGN (Page 15):
24#
25#   АБВГДЕЖЗИЙКЛМНОПРСТУФХЦЧШЩЪЬЮЯѪѢ
26#   абвгдежзийклмнопрстуфхцчшщъьюяѫѣ
27#
28# Originally prepared by Michael Everson <everson@evertype.com>
29########################################################################
30#
31# MINIMAL FILTER: Bulgarian-Latin
32#
33
34:: [АБВГДЕЖЗИЙКЛМНОПРСТУФХЦЧШЩЪЬЮЯѪѢабвгдежзийклмнопрстуфхцчшщъьюяѫѣ] ;
35:: NFD (NFC) ;
36#
37#
38########################################################################
39
40
41#
42########################################################################
43#
44# Define All Transformation Variables
45#
46########################################################################
47#
48
49$upperConsonants = [БВГДЖЗЙКЛМНПРСТФХЦЧШЩЬ] ;
50$lowerConsonants = [бвгджзйклмнпрстфхцчшщь] ;
51$consonants = [$upperConsonants $lowerConsonants] ;
52
53$upperVowels = [АЕИОУЪЮЯѪѢ] ;
54$lowerVowels = [аеиоуъюяѫѣ] ;
55$vowels = [$upperVowels $lowerVowels] ;
56
57$lower = [$lowerConsonants $lowerVowels] ;
58
59$bulgarian = [ $lower $upperConsonants $upperVowels ] ;
60#
61#
62# Use this $wordBoundary until bug 2034 is fixed in ICU:
63# http://bugs.icu-project.org/cgi-bin/icu-bugs/transliterate?id=2034;expression=boundary;user=guest
64#
65
66$wordBoundary =  [^[:L:][:M:][:N:]] ;
67#
68#
69########################################################################
70
71
72#
73########################################################################
74#
75# Start of Alphabetic Transformations
76#
77########################################################################
78#
79
80А → A ; # CYRILLIC CAPITAL LETTER A
81а → a ; # CYRILLIC SMALL LETTER A
82Б → B ; # CYRILLIC CAPITAL LETTER BE
83б → b ; # CYRILLIC SMALL LETTER BE
84В → V ; # CYRILLIC CAPITAL LETTER VE
85в → v ; # CYRILLIC SMALL LETTER VE
86Г → G ; # CYRILLIC CAPITAL LETTER GHE
87г → g ; # CYRILLIC SMALL LETTER GHE
88Д → D ; # CYRILLIC CAPITAL LETTER DE
89д → d ; # CYRILLIC SMALL LETTER DE
90Е → E ; # CYRILLIC CAPITAL LETTER DE
91е → e ; # CYRILLIC SMALL LETTER DE
92Ж} $lower → Zh ; # CYRILLIC CAPITAL LETTER ZHE
93Ж → ZH ; # CYRILLIC CAPITAL LETTER ZHE
94ж → zh ; # CYRILLIC SMALL LETTER ZHE
95З → Z ; # CYRILLIC CAPITAL LETTER ZE
96з → z ; # CYRILLIC SMALL LETTER ZE
97И → I ; # CYRILLIC CAPITAL LETTER I
98и → i ; # CYRILLIC SMALL LETTER I
99Й → Y ; # CYRILLIC CAPITAL LETTER I
100й → y ; # CYRILLIC SMALL LETTER I
101К → K ; # CYRILLIC CAPITAL LETTER KA
102к → k ; # CYRILLIC SMALL LETTER KA
103Л → L ; # CYRILLIC CAPITAL LETTER EL
104л → l ; # CYRILLIC SMALL LETTER EL
105М → M ; # CYRILLIC CAPITAL LETTER EM
106м → m ; # CYRILLIC SMALL LETTER EM
107Н → N ; # CYRILLIC CAPITAL LETTER EN
108н → n ; # CYRILLIC SMALL LETTER EN
109О → O ; # CYRILLIC CAPITAL LETTER O
110о → o ; # CYRILLIC SMALL LETTER O
111П → P ; # CYRILLIC CAPITAL LETTER PE
112п → p ; # CYRILLIC SMALL LETTER PE
113Р → R ; # CYRILLIC CAPITAL LETTER ER
114р → r ; # CYRILLIC SMALL LETTER ER
115С → S ; # CYRILLIC CAPITAL LETTER ES
116с → s ; # CYRILLIC SMALL LETTER ES
117#
118#
119########################################################################
120#
121# BGN Page 16 Note 4
122#
123# тс becomes t·s
124#
125########################################################################
126#
127
128ТС → T·S ; # CYRILLIC CAPITAL LETTER TE
129Тс → T·s ; # CYRILLIC CAPITAL LETTER TE
130тс → t·s ; # CYRILLIC SMALL LETTER TE
131Т → T ; # CYRILLIC CAPITAL LETTER TE
132т → t ; # CYRILLIC SMALL LETTER TE
133#
134#
135########################################################################
136#
137# End Note 4
138#
139########################################################################
140
141
142У → U ; # CYRILLIC CAPITAL LETTER U
143у → u ; # CYRILLIC SMALL LETTER U
144Ф → F ; # CYRILLIC CAPITAL LETTER EF
145ф → f ; # CYRILLIC SMALL LETTER EF
146Х} $lower → Kh ; # CYRILLIC CAPITAL LETTER HA
147Х → KH ; # CYRILLIC CAPITAL LETTER HA
148х → kh ; # CYRILLIC SMALL LETTER HA
149Ц} $lower → Ts ; # CYRILLIC CAPITAL LETTER TSE
150Ц → TS ; # CYRILLIC CAPITAL LETTER TSE
151ц → ts ; # CYRILLIC SMALL LETTER TSE
152Ч} $lower → Ch ; # CYRILLIC CAPITAL LETTER CHE
153Ч → CH ; # CYRILLIC CAPITAL LETTER CHE
154ч → ch ; # CYRILLIC SMALL LETTER CHE
155
156#
157########################################################################
158#
159# Implied rule from BGN Russian-Latin transliteration (Page 94 Note 3.6).
160#
161# шт becomes sh·t
162#
163########################################################################
164#
165
166ШТ → SH·T ; # CYRILLIC CAPITAL LETTER SHA
167Шт → Sh·t ; # CYRILLIC CAPITAL LETTER SHA
168шт → sh·t ; # CYRILLIC SMALL LETTER SHA
169Ш} $lower → Sh ; # CYRILLIC CAPITAL LETTER SHA
170Ш → SH ; # CYRILLIC CAPITAL LETTER SHA
171ш → sh ; # CYRILLIC SMALL LETTER SHA
172Щ} $lower → Sht ; # CYRILLIC CAPITAL LETTER SHCHA
173Щ → SHT ; # CYRILLIC CAPITAL LETTER SHCHA
174щ → sht ; # CYRILLIC SMALL LETTER SHCHA
175#
176#
177########################################################################
178#
179# End Implied rule
180#
181########################################################################
182
183
184Ъ → Ŭ ; # CYRILLIC CAPITAL LETTER HARD SIGN
185ъ → ŭ ; # CYRILLIC SMALL LETTER HARD SIGN
186
187#
188########################################################################
189#
190# BGN Page 16 Note 1
191#
192# In modern Bulgarian orthography, the character ъ does not occur in
193# word-final position.  It should be omitted in romanization when found
194# on older sources.
195#
196# The following rule removes all Ъъ at the end of a word. It is assumed
197# that when the condition is met, the text must be from an older source.
198# Comment out with a '#' at the start of a line to disable.
199#
200#
201########################################################################
202#
203
204$bulgarian { [Ъъ]  } $wordBoundary > ;
205#
206#
207########################################################################
208#
209# End BGN Page 16 Note 1
210#
211########################################################################
212
213
214Ь → ’ ; # CYRILLIC CAPITAL LETTER SOFT SIGN
215ь → ’ ; # CYRILLIC SMALL LETTER SOFT SIGN
216Ю} $lower → Yu ; # CYRILLIC CAPITAL LETTER YU
217Ю → YU ; # CYRILLIC CAPITAL LETTER YU
218ю → yu ; # CYRILLIC SMALL LETTER YU
219Я} $lower → Ya ; # CYRILLIC CAPITAL LETTER YA
220Я → YA ; # CYRILLIC CAPITAL LETTER YA
221я → ya ; # CYRILLIC SMALL LETTER YA
222
223#
224########################################################################
225#
226# BGN Page 16 Note 2
227#
228# The obsolete character Ѫ, which was replaced by Ъ in 1945, should be
229# romanized Ŭ.
230#
231########################################################################
232#
233
234Ѫ → Ŭ ; # CYRILLIC CAPITAL LETTER BIG YUS
235ѫ → ŭ ; # CYRILLIC SMALL LETTER BIG YUS
236#
237#
238########################################################################
239#
240# End BGN Page 16 Note 2
241#
242########################################################################
243
244
245#
246########################################################################
247#
248# BGN Page 16 Note 3
249#
250# The obsolete character Ѣ, replaced in 1945 by Я or Е according to local
251# pronunciation, should be romanized as e or ya, accordingly, if the
252# pronunciation is known; otherwise as ye.
253#
254########################################################################
255#
256
257Ѣ} $lower → Ye ; # CYRILLIC CAPITAL LETTER YAT
258Ѣ → YE ; # CYRILLIC CAPITAL LETTER YAT
259ѣ → ye ; # CYRILLIC SMALL LETTER YAT
260#
261#
262# Alternative rule where appropriate for local pronounciation. To apply
263# uncomment the following by removing the '#' mark at the start of the
264# line and insert before the three rule lines above.
265#
266# Ѣ} $lower → e ; # CYRILLIC CAPITAL LETTER YAT
267# Ѣ → E ; # CYRILLIC CAPITAL LETTER YAT
268# ѣ → e ; # CYRILLIC SMALL LETTER YAT
269#
270########################################################################
271#
272# End BGN Page 16 Note 3
273#
274########################################################################
275
276			]]></tRule>
277		</transform>
278	</transforms>
279</supplementalData>
280