• Home
  • Line#
  • Scopes#
  • Navigate#
  • Raw
  • Download
1# © 2016 and later: Unicode, Inc. and others.
2# License & terms of use: http://www.unicode.org/copyright.html#License
3#
4# File: bg_bg_Latn_BGN.txt
5# Generated from CLDR
6#
7
8#
9########################################################################
10# BGN/PCGN 1952 System
11#
12# This system was adopted by the BGN in 1949 and by the PCGN in 1952.
13# It reflects the much simplified Bulgarian orthography as officially
14# revised in February 1945. The Bulgarian alphabet contains all of
15# the characters present in the Russian alphabet with the exception
16# of Ёё, Ыы, and Ээ. Two obsolete letters Ѫѫ and Ѣѣ are also given.
17#
18# The Bulgarian Alphabet as defined by the BGN (Page 15):
19#
20#   АБВГДЕЖЗИЙКЛМНОПРСТУФХЦЧШЩЪЬЮЯѪѢ
21#   абвгдежзийклмнопрстуфхцчшщъьюяѫѣ
22#
23# Originally prepared by Michael Everson <everson@evertype.com>
24########################################################################
25#
26# MINIMAL FILTER: Bulgarian-Latin
27#
# Global filter: only the characters listed in this set are handed to the
# transforms and rules that follow; everything else passes through unchanged.
28:: [АБВГДЕЖЗИЙКЛМНОПРСТУФХЦЧШЩЪЬЮЯѪѢабвгдежзийклмнопрстуфхцчшщъьюяѫѣ] ;
# Normalize to NFD in the forward direction (NFC, in parentheses, is the
# transform used for the inverse direction).
# NOTE(review): NFD canonically decomposes Й/й into И/и + U+0306 COMBINING
# BREVE; verify that the Й/й rules further down still match after this step.
29:: NFD (NFC) ;
30#
31#
32########################################################################
33#
34########################################################################
35#
36# Define All Transformation Variables
37#
38########################################################################
39#
# Character classes used as rule context. Note that the soft sign Ь/ь is
# grouped with the consonants and the hard sign Ъ/ъ (plus the obsolete Ѫ/ѫ and
# Ѣ/ѣ) with the vowels.
40$upperConsonants = [БВГДЖЗЙКЛМНПРСТФХЦЧШЩЬ] ;
41$lowerConsonants = [бвгджзйклмнпрстфхцчшщь] ;
# $consonants and $vowels are not referenced by any rule visible in this file.
42$consonants = [$upperConsonants $lowerConsonants] ;
43$upperVowels = [АЕИОУЪЮЯѪѢ] ;
44$lowerVowels = [аеиоуъюяѫѣ] ;
45$vowels = [$upperVowels $lowerVowels] ;
# $lower: every lower-case Bulgarian letter; used as right-hand context to
# choose title-case (e.g. Zh) over upper-case (e.g. ZH) digraph output.
46$lower = [$lowerConsonants $lowerVowels] ;
# $bulgarian: every Bulgarian letter, upper and lower case.
47$bulgarian = [ $lower $upperConsonants $upperVowels ] ;
48#
49#
50# Use this $wordBoundary until bug 2034 is fixed in ICU:
51# http://bugs.icu-project.org/cgi-bin/icu-bugs/transliterate?id=2034;expression=boundary;user=guest
52#
# Any single character that is not a letter, mark or number. Being a character
# set, it needs an actual character to match, so it does not match at the very
# end of the text.
53$wordBoundary =  [^[:L:][:M:][:N:]] ;
54#
55#
56########################################################################
57#
58########################################################################
59#
60# Start of Alphabetic Transformations
61#
62########################################################################
63#
# One-to-one letter mappings for А through С.
# A capital letter that romanizes to a digraph (here Ж) is written in title
# case (Zh) when the next character is in $lower, and fully upper-cased (ZH)
# otherwise; the context rule must therefore precede the plain rule.
64А → A ; # CYRILLIC CAPITAL LETTER A
65а → a ; # CYRILLIC SMALL LETTER A
66Б → B ; # CYRILLIC CAPITAL LETTER BE
67б → b ; # CYRILLIC SMALL LETTER BE
68В → V ; # CYRILLIC CAPITAL LETTER VE
69в → v ; # CYRILLIC SMALL LETTER VE
70Г → G ; # CYRILLIC CAPITAL LETTER GHE
71г → g ; # CYRILLIC SMALL LETTER GHE
72Д → D ; # CYRILLIC CAPITAL LETTER DE
73д → d ; # CYRILLIC SMALL LETTER DE
74Е → E ; # CYRILLIC CAPITAL LETTER IE
75е → e ; # CYRILLIC SMALL LETTER IE
76Ж} $lower → Zh ; # CYRILLIC CAPITAL LETTER ZHE (before a lower-case letter)
77Ж → ZH ; # CYRILLIC CAPITAL LETTER ZHE
78ж → zh ; # CYRILLIC SMALL LETTER ZHE
79З → Z ; # CYRILLIC CAPITAL LETTER ZE
80з → z ; # CYRILLIC SMALL LETTER ZE
81И → I ; # CYRILLIC CAPITAL LETTER I
82и → i ; # CYRILLIC SMALL LETTER I
83Й → Y ; # CYRILLIC CAPITAL LETTER SHORT I
84й → y ; # CYRILLIC SMALL LETTER SHORT I
85К → K ; # CYRILLIC CAPITAL LETTER KA
86к → k ; # CYRILLIC SMALL LETTER KA
87Л → L ; # CYRILLIC CAPITAL LETTER EL
88л → l ; # CYRILLIC SMALL LETTER EL
89М → M ; # CYRILLIC CAPITAL LETTER EM
90м → m ; # CYRILLIC SMALL LETTER EM
91Н → N ; # CYRILLIC CAPITAL LETTER EN
92н → n ; # CYRILLIC SMALL LETTER EN
93О → O ; # CYRILLIC CAPITAL LETTER O
94о → o ; # CYRILLIC SMALL LETTER O
95П → P ; # CYRILLIC CAPITAL LETTER PE
96п → p ; # CYRILLIC SMALL LETTER PE
97Р → R ; # CYRILLIC CAPITAL LETTER ER
98р → r ; # CYRILLIC SMALL LETTER ER
99С → S ; # CYRILLIC CAPITAL LETTER ES
100с → s ; # CYRILLIC SMALL LETTER ES
101#
102#
103########################################################################
104#
105# BGN Page 16 Note 4
106#
107# тс becomes t·s
108#
109########################################################################
110#
# The two-letter sequences are listed before the single-letter Т/т rules. They
# insert a middle dot (·) so that тс (t·s) stays distinct from ц (ts).
# The mixed-case sequence тС has no rule of its own and is handled by the
# single-letter rules.
111ТС → T·S ; # CYRILLIC CAPITAL LETTER TE + CAPITAL LETTER ES
112Тс → T·s ; # CYRILLIC CAPITAL LETTER TE + SMALL LETTER ES
113тс → t·s ; # CYRILLIC SMALL LETTER TE + SMALL LETTER ES
114Т → T ; # CYRILLIC CAPITAL LETTER TE
115т → t ; # CYRILLIC SMALL LETTER TE
116#
117#
118########################################################################
119#
120# End Note 4
121#
122########################################################################
# Letter mappings for У through Ч. Capitals that romanize to a digraph
# (Х, Ц, Ч) use title case before a character in $lower and upper case
# otherwise; each context rule precedes its plain counterpart.
123У → U ; # CYRILLIC CAPITAL LETTER U
124у → u ; # CYRILLIC SMALL LETTER U
125Ф → F ; # CYRILLIC CAPITAL LETTER EF
126ф → f ; # CYRILLIC SMALL LETTER EF
127Х} $lower → Kh ; # CYRILLIC CAPITAL LETTER HA (before a lower-case letter)
128Х → KH ; # CYRILLIC CAPITAL LETTER HA
129х → kh ; # CYRILLIC SMALL LETTER HA
130Ц} $lower → Ts ; # CYRILLIC CAPITAL LETTER TSE (before a lower-case letter)
131Ц → TS ; # CYRILLIC CAPITAL LETTER TSE
132ц → ts ; # CYRILLIC SMALL LETTER TSE
133Ч} $lower → Ch ; # CYRILLIC CAPITAL LETTER CHE (before a lower-case letter)
134Ч → CH ; # CYRILLIC CAPITAL LETTER CHE
135ч → ch ; # CYRILLIC SMALL LETTER CHE
136#
137########################################################################
138#
139# Implied rule from BGN Russian-Latin transliteration (Page 94 Note 3.6).
140#
141# шт becomes sh·t
142#
143########################################################################
144#
# The sequence шт gets a middle dot (sh·t) so that it stays distinct from the
# single letter щ, which is romanized sht. The two-letter rules are listed
# before the single-letter Ш/ш rules.
145ШТ → SH·T ; # CYRILLIC CAPITAL LETTER SHA + CAPITAL LETTER TE
146Шт → Sh·t ; # CYRILLIC CAPITAL LETTER SHA + SMALL LETTER TE
147шт → sh·t ; # CYRILLIC SMALL LETTER SHA + SMALL LETTER TE
148Ш} $lower → Sh ; # CYRILLIC CAPITAL LETTER SHA (before a lower-case letter)
149Ш → SH ; # CYRILLIC CAPITAL LETTER SHA
150ш → sh ; # CYRILLIC SMALL LETTER SHA
151Щ} $lower → Sht ; # CYRILLIC CAPITAL LETTER SHCHA (before a lower-case letter)
152Щ → SHT ; # CYRILLIC CAPITAL LETTER SHCHA
153щ → sht ; # CYRILLIC SMALL LETTER SHCHA
154#
155#
156########################################################################
157#
158# End Implied rule
159#
160########################################################################
# Hard sign: Ъ/ъ are romanized unconditionally as Ŭ/ŭ.
161Ъ → Ŭ ; # CYRILLIC CAPITAL LETTER HARD SIGN
162ъ → ŭ ; # CYRILLIC SMALL LETTER HARD SIGN
163#
164########################################################################
165#
166# BGN Page 16 Note 1
167#
168# In modern Bulgarian orthography, the character ъ does not occur in
169# word-final position.  It should be omitted in romanization when found
170# on older sources.
171#
172# The following rule removes all Ъъ at the end of a word. It is assumed
173# that when the condition is met, the text must be from an older source.
174# Comment out with a '#' at the start of a line to disable.
175#
176#
177########################################################################
178#
# Deletes Ъ/ъ when it is preceded by a character in $bulgarian and followed
# by a character in $wordBoundary (the empty right-hand side means "replace
# with nothing").
# NOTE(review): the unconditional Ъ/ъ rules above come earlier in the file and
# also match a word-final Ъ/ъ. If the rule engine applies the first matching
# rule, this deletion rule may never fire. In addition, $bulgarian contains
# only Cyrillic letters, while the preceding letter may already have been
# romanized by an earlier rule at the time this context is tested.
# TODO confirm both points against the engine's matching semantics.
179$bulgarian { [Ъъ]  } $wordBoundary > ;
180#
181#
182########################################################################
183#
184# End BGN Page 16 Note 1
185#
186########################################################################
# Soft sign: both cases map to the same character, U+2019 RIGHT SINGLE
# QUOTATION MARK.
187Ь → ’ ; # CYRILLIC CAPITAL LETTER SOFT SIGN
188ь → ’ ; # CYRILLIC SMALL LETTER SOFT SIGN
# Ю and Я romanize to digraphs: title case before a character in $lower,
# upper case otherwise. Each context rule precedes its plain counterpart.
189Ю} $lower → Yu ; # CYRILLIC CAPITAL LETTER YU (before a lower-case letter)
190Ю → YU ; # CYRILLIC CAPITAL LETTER YU
191ю → yu ; # CYRILLIC SMALL LETTER YU
192Я} $lower → Ya ; # CYRILLIC CAPITAL LETTER YA (before a lower-case letter)
193Я → YA ; # CYRILLIC CAPITAL LETTER YA
194я → ya ; # CYRILLIC SMALL LETTER YA
195#
196########################################################################
197#
198# BGN Page 16 Note 2
199#
200# The obsolete character Ѫ, which was replaced by Ъ in 1945, should be
201# romanized Ŭ.
202#
203########################################################################
204#
# Obsolete big yus: romanized with the same output as the hard sign Ъ/ъ (Ŭ/ŭ).
205Ѫ → Ŭ ; # CYRILLIC CAPITAL LETTER BIG YUS
206ѫ → ŭ ; # CYRILLIC SMALL LETTER BIG YUS
207#
208#
209########################################################################
210#
211# End BGN Page 16 Note 2
212#
213########################################################################
214#
215########################################################################
216#
217# BGN Page 16 Note 3
218#
219# The obsolete character Ѣ, replaced in 1945 by Я or Е according to local
220# pronunciation, should be romanized as e or ya, accordingly, if the
221# pronunciation is known; otherwise as ye.
222#
223########################################################################
224#
# Obsolete yat, default romanization "ye": title case (Ye) before a character
# in $lower, upper case (YE) otherwise. The context rule precedes the plain
# capital rule.
225Ѣ} $lower → Ye ; # CYRILLIC CAPITAL LETTER YAT (before a lower-case letter)
226Ѣ → YE ; # CYRILLIC CAPITAL LETTER YAT
227ѣ → ye ; # CYRILLIC SMALL LETTER YAT
228#
229#
230# Alternative rule where appropriate for local pronunciation. To apply,
231# uncomment the following lines by removing the '#' mark at the start of
232# each line, and insert them before the three rule lines above.
233#
234# Ѣ} $lower → E ; # CYRILLIC CAPITAL LETTER YAT
235# Ѣ → E ; # CYRILLIC CAPITAL LETTER YAT
236# ѣ → e ; # CYRILLIC SMALL LETTER YAT
237#
238########################################################################
239#
240# End BGN Page 16 Note 3
241#
242########################################################################
243
244