# © 2016 and later: Unicode, Inc. and others.
# License & terms of use: http://www.unicode.org/copyright.html#License
#
# File: ru_ru_Latn_BGN.txt
# Generated from CLDR
#

# BGN/PCGN 1947 System
#
# The BGN/PCGN system for Russian was adopted by the BGN in 1944 and
# by the PCGN in 1947 for use in romanizing names written in the
# Russian Cyrillic alphabet.
#
# The Russian Alphabet as defined by the BGN (Page 93):
# АБВГДЕЁЖЗИЙКЛМНОПРСТУФХЦЧШЩЪЫЬЭЮЯ
# абвгдеёжзийклмнопрстуфхцчшщъыьэюя
#
# Originally prepared by Michael Everson everson@evertype.com
# Fixed by Frank Yung-Fong Tang ftang@google.com
#
# Test Data from http://en.wikipedia.org/wiki/BGN/PCGN_romanization_of_Russian
#
# Structure of this file:
#   1. A filter restricting the transform to the 66 Russian letters, then NFC.
#   2. Variable definitions.
#   3. A first pass holding the rules whose BEFORE-context must still be
#      Cyrillic when they are evaluated (ы after a vowel, э after a
#      consonant, е/ё after a vowel or й/ъ/ь).
#   4. ::Null; to close the first pass.
#   5. A second pass with the letter-by-letter transformations.
########################################################################
# MINIMAL FILTER: Russian-Latin
::[АБВГДЕЁЖЗИЙКЛМНОПРСТУФХЦЧШЩЪЫЬЭЮЯабвгдеёжзийклмнопрстуфхцчшщъыьэюя];
::NFC;
########################################################################
# Define All Transformation Variables
########################################################################
# Romanizations of the soft sign and the hard sign.
$prime = ʹ ;
$doublePrime = ʺ ;
# Any character that is not a letter, a mark or a number.
$wordBoundary = [^[:L:][:M:][:N:]] ;
$upperVowels = [АЕЁЭИОУЫЮЯ] ;
$lowerVowels = [аеёэиоуыюя] ;
$vowels = [$upperVowels $lowerVowels] ;
# NOTE: these two sets are "every cased character that is not a Russian
# vowel"; they are not limited to Cyrillic letters and they include Ъ/ъ
# and Ь/ь.
$upperConsonants = [[:Uppercase:]-$vowels] ;
$lowerConsonants = [[:Lowercase:]-$vowels] ;
$consonants = [$upperConsonants $lowerConsonants] ;
$upper = [:Uppercase:];
$lower = [:Lowercase:];
########################################################################
# Rules moved to front to avoid masking
########################################################################
# Rule 3.3: ы after a vowel becomes ·y
$lowerVowels { ы → ·y ;
$upperVowels { [Ыы] } $lower → ·y ;
$upperVowels { [Ыы] } → ·Y ;
# Rule 3.4: э after any consonant except й becomes ·e
[$consonants - [Йй]]{Э → ·E ;
[$consonants - [Йй]]{э → ·e ;
# Rules 1 and 2: е/ё after a vowel or after й, ъ, ь become ye/yë
[$upperVowels [ЙЪЬ]] { Е } $upper → YE ; # CYRILLIC CAPITAL LETTER IE
[$upperVowels [ЙЪЬ]] { Е → Ye ; # CYRILLIC CAPITAL LETTER IE
[$upperVowels $lowerVowels [ЙйЪъЬь]] { е → ye ; # CYRILLIC SMALL LETTER IE
[$upperVowels [ЙЪЬ]] { Ё } $upper → YË ; # CYRILLIC CAPITAL LETTER IO
[$upperVowels [ЙЪЬ]] { Ё → Yë ; # CYRILLIC CAPITAL LETTER IO
[$upperVowels $lowerVowels [ЙйЪъЬь]] { ё → yë ; # CYRILLIC SMALL LETTER IO
# Since in the above rules we look at the Cyrillic context before the Е/Ё/ё,
# we have to transform these in a separate pass before we change the vowels.
# The ::Null forces a separate pass.
::Null;
########################################################################
# Start of Alphabetic Transformations
########################################################################
А → A ; # CYRILLIC CAPITAL LETTER A
а → a ; # CYRILLIC SMALL LETTER A
Б → B ; # CYRILLIC CAPITAL LETTER BE
б → b ; # CYRILLIC SMALL LETTER BE
В → V ; # CYRILLIC CAPITAL LETTER VE
в → v ; # CYRILLIC SMALL LETTER VE
Г → G ; # CYRILLIC CAPITAL LETTER GHE
г → g ; # CYRILLIC SMALL LETTER GHE
Д → D ; # CYRILLIC CAPITAL LETTER DE
д → d ; # CYRILLIC SMALL LETTER DE
########################################################################
# BGN Page 94 Rule 1:
#
# The character е should be romanized ye initially, after the vowel
# characters а, е, ё, и, о, у, ы, э, ю, and я, and after й, ъ, and ь.
# In all other instances, it should be romanized e.
#
# Only the word-initial case is handled here; the "after a vowel or
# й/ъ/ь" cases are handled in the first pass above.
########################################################################
# BUG(ftang)- the following two lines said BEFORE the vowels, instead of AFTER
# Е}[$upperVowels [ЙЪЬ]] → YE ; # CYRILLIC CAPITAL LETTER IE
# Е}[$lowerVowels [йъь]] → Ye ; # CYRILLIC CAPITAL LETTER IE
$wordBoundary{Е} $upper → YE ; # CYRILLIC CAPITAL LETTER IE
$wordBoundary{Е → Ye ; # CYRILLIC CAPITAL LETTER IE
Е → E ; # CYRILLIC CAPITAL LETTER IE
#
# BUG(ftang)- the following line said BEFORE the vowels, instead of AFTER
# е}[$upperVowels $lowerVowels [ЙйЪъЬь]] → ye ; # CYRILLIC SMALL LETTER IE
$wordBoundary{е → ye ; # CYRILLIC SMALL LETTER IE
е → e ; # CYRILLIC SMALL LETTER IE
########################################################################
# End of Rule 1
########################################################################
########################################################################
# BGN Page 94 Rule 2:
#
# The character ё is not considered a separate character of the
# Russian alphabet and the dieresis is generally not shown. When the
# dieresis is shown, the character should be romanized yë initially,
# after the vowel characters а, е, ё, и, о, у, ы, э, ю, and я, and
# after й, ъ, and ь. In all other instances, it should be romanized
# ë. When the dieresis is not shown, the character may still be
# romanized in the preceding manner or, alternatively, in accordance
# with note 1.
#
# Only the word-initial case is handled here; the "after a vowel or
# й/ъ/ь" cases are handled in the first pass above.
########################################################################
# BUG(ftang)- the following two lines said BEFORE the vowels, instead of AFTER
# Ё}[$upperVowels [ЙЪЬ]] → YË ; # CYRILLIC CAPITAL LETTER IO
# Ё}[$lowerVowels [йъь]] → Yë ; # CYRILLIC CAPITAL LETTER IO
# The optional · allows for a following ы that the first pass has
# already turned into ·y / ·Y.
$wordBoundary {Ё} [·]? $upper → YË ; # CYRILLIC CAPITAL LETTER IO
# Fallback for every other word-initial Ё (followed by a lowercase
# letter, by a non-letter, or by nothing). This rule used to require a
# following lowercase letter, so a stand-alone Ё fell through to the
# plain "Ё → Ë" rule below and lost its initial Y, unlike the
# corresponding Е rule in Rule 1.
$wordBoundary {Ё → Yë ; # CYRILLIC CAPITAL LETTER IO
Ё → Ë ; # CYRILLIC CAPITAL LETTER IO
# BUG(ftang)- the following line said BEFORE the vowels, instead of AFTER
# ё}[$upperVowels $lowerVowels [ЙйЪъЬь]] → yë ; # CYRILLIC SMALL LETTER IO
$wordBoundary{ё → yë ; # CYRILLIC SMALL LETTER IO
ё → ë ; # CYRILLIC SMALL LETTER IO
########################################################################
# End of Rule 2
########################################################################
# For letters romanized as digraphs, a capital followed by a lowercase
# letter gives title case (Zh); otherwise both letters are capitalized (ZH).
Ж} $lower → Zh ; # CYRILLIC CAPITAL LETTER ZHE
Ж → ZH ; # CYRILLIC CAPITAL LETTER ZHE
ж → zh ; # CYRILLIC SMALL LETTER ZHE
########################################################################
# BGN Page 94 Rule 3.4
# э after any consonant character except
# й becomes ·e
#
# The live rules for 3.4 are in the first pass above; only the old,
# disabled rules remain here for reference.
########################################################################
З → Z ; # CYRILLIC CAPITAL LETTER ZE
з → z ; # CYRILLIC SMALL LETTER ZE
# BUG(ftang) The following two lines said those consonant becomes ·е
# [$consonants - [Йй]]}Э → ·Е ;
# [$consonants - [Йй]]}э → ·е ;
########################################################################
# End of Rule 3.4
########################################################################
И → I ; # CYRILLIC CAPITAL LETTER I
и → i ; # CYRILLIC SMALL LETTER I
########################################################################
# BGN Page 94 Rule 3:
#
# Unusual Russian character sequences occurring primarily in
# non-Russian-language names may be romanized as shown below in order
# to provide differentiation from regularly-occurring digraphs and
# character sequences.
#
# BGN Page 94 Rule 3.1
# й before а, у, ы, or э becomes y·
########################################################################
Й}[АаУуЫыЭэ] → Y· ; # CYRILLIC CAPITAL LETTER SHORT I
й}[АаУуЫыЭэ] → y· ; # CYRILLIC SMALL LETTER SHORT I
Й → Y ; # CYRILLIC CAPITAL LETTER SHORT I
й → y ; # CYRILLIC SMALL LETTER SHORT I
########################################################################
# End Rule 3.1
########################################################################
К → K ; # CYRILLIC CAPITAL LETTER KA
к → k ; # CYRILLIC SMALL LETTER KA
Л → L ; # CYRILLIC CAPITAL LETTER EL
л → l ; # CYRILLIC SMALL LETTER EL
М → M ; # CYRILLIC CAPITAL LETTER EM
м → m ; # CYRILLIC SMALL LETTER EM
Н → N ; # CYRILLIC CAPITAL LETTER EN
н → n ; # CYRILLIC SMALL LETTER EN
О → O ; # CYRILLIC CAPITAL LETTER O
о → o ; # CYRILLIC SMALL LETTER O
П → P ; # CYRILLIC CAPITAL LETTER PE
п → p ; # CYRILLIC SMALL LETTER PE
Р → R ; # CYRILLIC CAPITAL LETTER ER
р → r ; # CYRILLIC SMALL LETTER ER
С → S ; # CYRILLIC CAPITAL LETTER ES
с → s ; # CYRILLIC SMALL LETTER ES
########################################################################
# BGN Page 94 Rule 3.5
# тс becomes t·s
########################################################################
ТС → T·S ; # CYRILLIC CAPITAL LETTER TE
Тс → T·s ; # CYRILLIC CAPITAL LETTER TE
тс → t·s ; # CYRILLIC SMALL LETTER TE
Т → T ; # CYRILLIC CAPITAL LETTER TE
т → t ; # CYRILLIC SMALL LETTER TE
########################################################################
# End Rule 3.5
########################################################################
У → U ; # CYRILLIC CAPITAL LETTER U
у → u ; # CYRILLIC SMALL LETTER U
Ф → F ; # CYRILLIC CAPITAL LETTER EF
ф → f ; # CYRILLIC SMALL LETTER EF
Х} $lower → Kh ; # CYRILLIC CAPITAL LETTER HA
Х → KH ; # CYRILLIC CAPITAL LETTER HA
х → kh ; # CYRILLIC SMALL LETTER HA
Ц} $lower → Ts ; # CYRILLIC CAPITAL LETTER TSE
Ц → TS ; # CYRILLIC CAPITAL LETTER TSE
ц → ts ; # CYRILLIC SMALL LETTER TSE
Ч} $lower → Ch ; # CYRILLIC CAPITAL LETTER CHE
Ч → CH ; # CYRILLIC CAPITAL LETTER CHE
ч → ch ; # CYRILLIC SMALL LETTER CHE
########################################################################
# BGN Page 94 Rule 3.6
# шч becomes sh·ch
########################################################################
ШЧ → SH·CH ; # CYRILLIC CAPITAL LETTER SHA
Шч → Sh·ch ; # CYRILLIC CAPITAL LETTER SHA
шч → sh·ch ; # CYRILLIC SMALL LETTER SHA
Ш} $lower → Sh ; # CYRILLIC CAPITAL LETTER SHA
Ш → SH ; # CYRILLIC CAPITAL LETTER SHA
ш → sh ; # CYRILLIC SMALL LETTER SHA
Щ} $lower → Shch ; # CYRILLIC CAPITAL LETTER SHCHA
Щ → SHCH ; # CYRILLIC CAPITAL LETTER SHCHA
щ → shch ; # CYRILLIC SMALL LETTER SHCHA
########################################################################
# End Rule 3.6
########################################################################
Ъ → $doublePrime ; # CYRILLIC CAPITAL LETTER HARD SIGN
ъ → $doublePrime ; # CYRILLIC SMALL LETTER HARD SIGN
########################################################################
# BGN Page 94 Rule 3.2
# ы before а, у, ы, or э becomes y·
#
# BGN Page 94 Rule 3.3
# ы after any vowel character becomes ·y
#
# Rule 3.2 is implemented here; the live rules for 3.3 are in the
# first pass above.
########################################################################
#
# BUG(ftang) the following line said the vowels will change
# $vowels}Ы → ·Y ; # CYRILLIC CAPITAL LETTER I
# $vowels}ы → ·y ; # CYRILLIC CAPITAL LETTER I
Ы}[АаУуЫыЭэ] → Y· ; # CYRILLIC CAPITAL LETTER YERU
ы}[ауыэ] → y· ; # CYRILLIC SMALL LETTER YERU
Ы → Y ; # CYRILLIC CAPITAL LETTER YERU
ы → y ; # CYRILLIC SMALL LETTER YERU
########################################################################
# End Rule 3.2 and 3.3
########################################################################
Ь → $prime ; # CYRILLIC CAPITAL LETTER SOFT SIGN
ь → $prime ; # CYRILLIC SMALL LETTER SOFT SIGN
Э → E ; # CYRILLIC CAPITAL LETTER E
э → e ; # CYRILLIC SMALL LETTER E
Ю} $lower → Yu ; # CYRILLIC CAPITAL LETTER YU
Ю → YU ; # CYRILLIC CAPITAL LETTER YU
ю → yu ; # CYRILLIC SMALL LETTER YU
Я} $lower → Ya ; # CYRILLIC CAPITAL LETTER YA
Я → YA ; # CYRILLIC CAPITAL LETTER YA
я → ya ; # CYRILLIC SMALL LETTER YA