|
|||
CLDR Version 28 | Index |
This chart lists the data fields that differ from the previous version. Inherited differences in locales are suppressed, except where the source locales are different. The collations and metadata are still shown in a raw format. The RBNF, segmentation, and annotation data are not yet included.
Path | Old | New |
---|---|---|
…/transforms/transform[@source="Russian"][@target="Latin"][@variant="BGN"][@direction="forward"]/tRule | ::[АБВГДЕЁЖЗИЙКЛМНОПРСТУФХЦЧШЩЪЫЬЭЮЯабвгдеёжзийклмнопрстуфхцчшщъыьэюя]; $prime = ʹ ; $doublePrime = ʺ ; $wordBoundary = [^[:L:][:M:][:N:]] ; $upperConsonants = [БВГДЖЙКЛМНПРСТФХЦЧШЩЭ] ; $lowerConsonants = [бвгджйклмнпрстфхцчшщэ] ; $consonants = [$upperConsonants $lowerConsonants] ; $upperVowels = [АЕЁЭИОУЫЮЯ] ; $lowerVowels = [аеёэиоуыюя] ; $vowels = [$upperVowels $lowerVowels] ; $lower = [$lowerConsonants $lowerVowels] ; $upper = [$upperConsonants $upperVowels] ; [$upperVowels [ЙЪЬ]] { Е } $upper → YE ; # CYRILLIC CAPITAL LETTER IE [$upperVowels [ЙЪЬ]] { Е → Ye ; # CYRILLIC CAPITAL LETTER IE [$upperVowels $lowerVowels [ЙйЪъЬь]] { е → ye ; # CYRILLIC SMALL LETTER IE [$upperVowels [ЙЪЬ]] { Ё } $upper → YË ; # CYRILLIC CAPITAL LETTER IO [$upperVowels [ЙЪЬ]] { Ё → Yë ; # CYRILLIC CAPITAL LETTER IO [$upperVowels $lowerVowels [ЙйЪъЬь]] { ё → yë ; # CYRILLIC SMALL LETTER IO ::Null; А → A ; # CYRILLIC CAPITAL LETTER A а → a ; # CYRILLIC SMALL LETTER A Б → B ; # CYRILLIC CAPITAL LETTER BE б → b ; # CYRILLIC SMALL LETTER BE В → V ; # CYRILLIC CAPITAL LETTER VE в → v ; # CYRILLIC SMALL LETTER VE Г → G ; # CYRILLIC CAPITAL LETTER GHE г → g ; # CYRILLIC SMALL LETTER GHE Д → D ; # CYRILLIC CAPITAL LETTER DE д → d ; # CYRILLIC SMALL LETTER DE $wordBoundary{Е} $upper → YE ; # CYRILLIC CAPITAL LETTER IE $wordBoundary{Е → Ye ; # CYRILLIC CAPITAL LETTER IE Е → E ; # CYRILLIC CAPITAL LETTER IE $wordBoundary{е → ye ; # CYRILLIC SMALL LETTER IE е → e ; # CYRILLIC SMALL LETTER IE $wordBoundary {Ё} $upper → YË ; # CYRILLIC CAPITAL LETTER IO $wordBoundary {Ё} $lower → Yë ; # CYRILLIC CAPITAL LETTER IO Ё → Ë ; # CYRILLIC CAPITAL LETTER IO $wordBoundary{ё → yë ; # CYRILLIC SMALL LETTER IO ё → ë ; # CYRILLIC SMALL LETTER IO Ж} $lower → Zh ; # CYRILLIC CAPITAL LETTER ZHE Ж → ZH ; # CYRILLIC CAPITAL LETTER ZHE ж → zh ; # CYRILLIC SMALL LETTER ZHE З → Z ; # CYRILLIC CAPITAL LETTER ZE з → z ; 
# CYRILLIC SMALL LETTER ZE И → I ; # CYRILLIC CAPITAL LETTER I и → i ; # CYRILLIC SMALL LETTER I Й → Y ; # CYRILLIC CAPITAL LETTER I й → y ; # CYRILLIC SMALL LETTER I К → K ; # CYRILLIC CAPITAL LETTER KA к → k ; # CYRILLIC SMALL LETTER KA Л → L ; # CYRILLIC CAPITAL LETTER EL л → l ; # CYRILLIC SMALL LETTER EL М → M ; # CYRILLIC CAPITAL LETTER EM м → m ; # CYRILLIC SMALL LETTER EM Н → N ; # CYRILLIC CAPITAL LETTER EN н → n ; # CYRILLIC SMALL LETTER EN О → O ; # CYRILLIC CAPITAL LETTER O о → o ; # CYRILLIC SMALL LETTER O П → P ; # CYRILLIC CAPITAL LETTER PE п → p ; # CYRILLIC SMALL LETTER PE Р → R ; # CYRILLIC CAPITAL LETTER ER р → r ; # CYRILLIC SMALL LETTER ER С → S ; # CYRILLIC CAPITAL LETTER ES с → s ; # CYRILLIC SMALL LETTER ES ТС → TS ; # CYRILLIC CAPITAL LETTER TE Тс → Ts ; # CYRILLIC CAPITAL LETTER TE тс → ts ; # CYRILLIC SMALL LETTER TE Т → T ; # CYRILLIC CAPITAL LETTER TE т → t ; # CYRILLIC SMALL LETTER TE У → U ; # CYRILLIC CAPITAL LETTER U у → u ; # CYRILLIC SMALL LETTER U Ф → F ; # CYRILLIC CAPITAL LETTER EF ф → f ; # CYRILLIC SMALL LETTER EF Х} $lower → Kh ; # CYRILLIC CAPITAL LETTER HA Х → KH ; # CYRILLIC CAPITAL LETTER HA х → kh ; # CYRILLIC SMALL LETTER HA Ц} $lower → Ts ; # CYRILLIC CAPITAL LETTER TSE Ц → TS ; # CYRILLIC CAPITAL LETTER TSE ц → ts ; # CYRILLIC SMALL LETTER TSE Ч} $lower → Ch ; # CYRILLIC CAPITAL LETTER CHE Ч → CH ; # CYRILLIC CAPITAL LETTER CHE ч → ch ; # CYRILLIC SMALL LETTER CHE ШЧ → SHCH ; # CYRILLIC CAPITAL LETTER SHA Шч → Shch ; # CYRILLIC CAPITAL LETTER SHA шч → shch ; # CYRILLIC SMALL LETTER SHA Ш} $lower → Sh ; # CYRILLIC CAPITAL LETTER SHA Ш → SH ; # CYRILLIC CAPITAL LETTER SHA ш → sh ; # CYRILLIC SMALL LETTER SHA Щ} $lower → Shch ; # CYRILLIC CAPITAL LETTER SHCHA Щ → SHCH ; # CYRILLIC CAPITAL LETTER SHCHA щ → shch ; # CYRILLIC SMALL LETTER SHCHA Ъ → $doublePrime ; # CYRILLIC CAPITAL LETTER HARD SIGN ъ → $doublePrime ; # CYRILLIC SMALL LETTER HARD SIGN Ы → Y ; # CYRILLIC CAPITAL LETTER YERU ы → y ; # CYRILLIC SMALL LETTER 
YERU Ь → $prime ; # CYRILLIC CAPITAL LETTER SOFT SIGN ь → $prime ; # CYRILLIC SMALL LETTER SOFT SIGN Э → E ; # CYRILLIC CAPITAL LETTER E э → e ; # CYRILLIC SMALL LETTER E Ю} $lower → Yu ; # CYRILLIC CAPITAL LETTER YU Ю → YU ; # CYRILLIC CAPITAL LETTER YU ю → yu ; # CYRILLIC SMALL LETTER YU Я} $lower → Ya ; # CYRILLIC CAPITAL LETTER YA Я → YA ; # CYRILLIC CAPITAL LETTER YA я → ya ; # CYRILLIC SMALL LETTER YA | # ######################################################################## # BGN/PCGN 1947 System # # The BGN/PCGN system for Russian was # adopted by the BGN in 1944 and by # the PCGN in 1947 for use in # romanizing names written in the Russian # Cyrillic alphabet. # # # The Russian Alphabet as defined by the BGN (Page 93): # # # АБВГДЕЁЖЗИЙКЛМНОПРСТУФХЦЧШЩЪЫЬЭЮЯ # # абвгдеёжзийклмнопрстуфхцчшщъыьэюя # # Originally prepared by # Michael Everson everson@evertype.com # Fixed by Frank Yung-Fong Tang ftang@google.com # # Test Data from http://en.wikipedia.org/wiki/BGN/PCGN_romanization_of_Russian # Since the use of · is optional, we do NOT implement here. 
# Азов Azov # Тамбов Tambov # Барнаул Barnaul # Кубань Kubanʹ # Владимир Vladimir # Ульяновск Ulʹyanovsk # Грозный Groznyy # Волгодонск Volgodonsk # Дзержинский Dzerzhinskiy # Нелидово Nelidovo # Елизово Yelizovo # Чапаевск Chapayevsk # Майер Mayyer # Юрьев Yurʹyev # Съезд Sʺyezd # Белкин Belkin # Ёлкин Yëlkin # Остриё Ostriyë ## Йёнчёпинг Y·ënchëping # Йёнчёпинг Yënchëping # Громадьё Gromadʹyë # Подъёмный Podʺyëmnyy # Жуков Zhukov # Лужники Luzhniki # Звенигород Zvenigorod # Вязьма Vyazʹma # Иркутск Irkutsk # Апатиты Apatity ## Кайафа Kay·afa # Кайафа Kayafa # Йошкар-Ола Yoshkar-Ola # Бийск Biysk # Киров Kirov # Енисейск Yeniseysk # Ломоносов Lomonosov # Нелидово Nelidovo # Менделеев Mendeleyev # Каменка Kamenka # Новосибирск Novosibirsk # Кандалакша Kandalaksha # Омск Omsk # Красноярск Krasnoyarsk # Петрозаводск Petrozavodsk # Серпухов Serpukhov # Ростов Rostov # Северобайкальск Severobaykalʹsk # Сковородино Skovorodino # Чайковский Chaykovskiy # Тамбов Tambov # Мытищи Mytishchi # Углич Uglich # Дудинка Dudinka # Фурманов Furmanov # Уфа Ufa # Хабаровск Khabarovsk # Прохладный Prokhladnyy # Цимлянск Tsimlyansk # Ельцин Yelʹtsin # Чебоксары Cheboksary # Печора Pechora # Шахтёрск Shakhtërsk # Мышкин Myshkin # Щёлково Shchëlkovo # Ртищево Rtishchevo # Подъездной Podʺyezdnoy ## Выудить Vy·uditʹ # Выудить Vyuditʹ ## Суык-Су Su·yk-Su # Суык-Су Suyk-Su # Ыттык-Кёль Yttyk-Këlʹ # Тында Tynda # Тюмень Tyumenʹ ## Двухэлементный Dvukh·elementnyy # Двухэлементный Dvukhelementnyy # Электрогорск Elektrogorsk # Радиоэлектроника Radioelektronika # Юбилейный Yubileynyy # Ключевская Klyuchevskaya # Якутск Yakutsk # Брянск Bryansk ## Соответствие Sootvet·stviye # Соответствие Sootvetstviye ## Веснушчатый Vesnush·chatyy # Веснушчатый Vesnushchatyy # ######################################################################## # # MINIMAL FILTER: Russian-Latin # ::[АБВГДЕЁЖЗИЙКЛМНОПРСТУФХЦЧШЩЪЫЬЭЮЯабвгдеёжзийклмнопрстуфхцчшщъыьэюя]; # # BUG(ftang) remove the following line. 
Otherwise the rule for # Й й Ё ё will break since the rule is written in NFC but # the line decomposes the text. # :: NFD (NFC) ; # ######################################################################## # ######################################################################## # Define All Transformation Variables # ######################################################################## # $prime = ʹ ; $doublePrime = ʺ ; $wordBoundary = [^[:L:][:M:][:N:]] ; $upperConsonants = [БВГДЖЙКЛМНПРСТФХЦЧШЩЭ] ; $lowerConsonants = [бвгджйклмнпрстфхцчшщэ] ; $consonants = [$upperConsonants $lowerConsonants] ; $upperVowels = [АЕЁЭИОУЫЮЯ] ; $lowerVowels = [аеёэиоуыюя] ; $vowels = [$upperVowels $lowerVowels] ; $lower = [$lowerConsonants $lowerVowels] ; $upper = [$upperConsonants $upperVowels] ; # # ######################################################################## # ######################################################################## # Rules moved to front to avoid masking # ######################################################################## # # REMOVEOPTIONAL(ftang) The following two rules for · option is commented out. #$lowerVowels { ы → ·y ; #$upperVowels { [Ыы] → ·Y ; ######################################################################## # # # REMOVEOPTIONAL(ftang) The following two rules for · option is commented out. 
#[$consonants - [Йй]]{Э → ·E ; #[$consonants - [Йй]]{э → ·e ; [$upperVowels [ЙЪЬ]] { Е } $upper → YE ; # CYRILLIC CAPITAL LETTER IE [$upperVowels [ЙЪЬ]] { Е → Ye ; # CYRILLIC CAPITAL LETTER IE [$upperVowels $lowerVowels [ЙйЪъЬь]] { е → ye ; # CYRILLIC SMALL LETTER IE [$upperVowels [ЙЪЬ]] { Ё } $upper → YË ; # CYRILLIC CAPITAL LETTER IO [$upperVowels [ЙЪЬ]] { Ё → Yë ; # CYRILLIC CAPITAL LETTER IO [$upperVowels $lowerVowels [ЙйЪъЬь]] { ё → yë ; # CYRILLIC SMALL LETTER IO # # Since in the above rule we look use the context before the characters, # we have to perform them in a separate pass before we change the vowels # the ::Null forces a separate pass. ::Null; # # ######################################################################## # Start of Alphabetic Transformations # ######################################################################## # А → A ; # CYRILLIC CAPITAL LETTER A а → a ; # CYRILLIC SMALL LETTER A Б → B ; # CYRILLIC CAPITAL LETTER BE б → b ; # CYRILLIC SMALL LETTER BE В → V ; # CYRILLIC CAPITAL LETTER VE в → v ; # CYRILLIC SMALL LETTER VE Г → G ; # CYRILLIC CAPITAL LETTER GHE г → g ; # CYRILLIC SMALL LETTER GHE Д → D ; # CYRILLIC CAPITAL LETTER DE д → d ; # CYRILLIC SMALL LETTER DE # # ######################################################################## # BGN Page 94 Rule 1: # # The character e should be romanized ye # initially, after the vowel # characters a, e, ё, и, о, у, ы, э, ю, # and я, and after й, ъ, and ь. # In all other instances, it should # be romanized e. 
######################################################################## # # BUG(ftang)- the following two lines said BEFORE the vowels, instead of AFTER # Е}[$upperVowels [ЙЪЬ]] → YE ; # CYRILLIC CAPITAL LETTER IE # Е}[$lowerVowels [йъь]] → Ye ; # CYRILLIC CAPITAL LETTER IE $wordBoundary{Е} $upper → YE ; # CYRILLIC CAPITAL LETTER IE $wordBoundary{Е → Ye ; # CYRILLIC CAPITAL LETTER IE Е → E ; # CYRILLIC CAPITAL LETTER IE # # BUG(ftang)- the following line said BEFORE the vowels, instead of AFTER # е}[$upperVowels $lowerVowels [ЙйЪъЬь]] → ye ; # CYRILLIC SMALL LETTER IE $wordBoundary{е → ye ; # CYRILLIC SMALL LETTER IE е → e ; # CYRILLIC SMALL LETTER IE # # ######################################################################## # End of Rule 1 ######################################################################## ######################################################################## # BGN Page 94 Rule 2: # # The character ё is not considered a # separate character of the Russian # alphabet and the dieresis is # generally not shown. When the dieresis is # shown, the character # should be romanized yë initially, after the vowel # characters a, # e, ё, и, о, у, ы, э, ю, and я, and after й, ъ, and ь, In # all # other instances, it should be romanized ё. When the dieresis is not # shown, the character may still be romanized in the preceding # manner or, # alternatively, in accordance with note 1. 
# ######################################################################## # BUG(ftang)- the following two lines said BEFORE the vowels, instead of AFTER # Ё}[$upperVowels [ЙЪЬ]] → YË ; # CYRILLIC CAPITAL LETTER IO # Ё}[$lowerVowels [йъь]] → Yë ; # CYRILLIC CAPITAL LETTER IO $wordBoundary {Ё} $upper → YË ; # CYRILLIC CAPITAL LETTER IO $wordBoundary {Ё} $lower → Yë ; # CYRILLIC CAPITAL LETTER IO Ё → Ë ; # CYRILLIC CAPITAL LETTER IO # # BUG(ftang)- the following line said BEFORE the vowels, instead of AFTER # ё}[$upperVowels $lowerVowels [ЙйЪъЬь]] → yë ; # CYRILLIC SMALL LETTER IO $wordBoundary{ё → yë ; # CYRILLIC SMALL LETTER IO ё → ë ; # CYRILLIC SMALL LETTER IO # # ######################################################################## # End of Rule 2 # ######################################################################## # Ж} $lower → Zh ; # CYRILLIC CAPITAL LETTER ZHE Ж → ZH ; # CYRILLIC CAPITAL LETTER ZHE ж → zh ; # CYRILLIC SMALL LETTER ZHE # # ######################################################################## # BGN Page 94 Rule 3.4 # э after any consonant character except # й becomes ·е ######################################################################## # З → Z ; # CYRILLIC CAPITAL LETTER ZE з → z ; # CYRILLIC SMALL LETTER ZE # # BUG(ftang) The following two lines said those consonant becomes ·е # [$consonants - [Йй]]}Э → ·Е ; # [$consonants - [Йй]]}э → ·е ; # ######################################################################## # End of Rule 3.4 # ######################################################################## # И → I ; # CYRILLIC CAPITAL LETTER I и → i ; # CYRILLIC SMALL LETTER I # # ######################################################################## # BGN Page 94 Rule 3: # Unusual Russian character sequences # occurring primarily in non-Russian-language names may be # romanized as shown below in order to provide differentiation from # regularly-occurring digraphs and # character sequences. 
# BGN Page 94 Rule 3.1 # й before а, у, ы, or э becomes у· # ######################################################################## # # REMOVEOPTIONAL(ftang) The following two rules for · option is commented out. # Й}[АаУуЫыЭэ] → Y· ; # CYRILLIC CAPITAL LETTER I # й}[АаУуЫыЭэ] → y· ; # CYRILLIC SMALL LETTER I Й → Y ; # CYRILLIC CAPITAL LETTER I й → y ; # CYRILLIC SMALL LETTER I # # ######################################################################## # End Rule 3.1 # ######################################################################## # К → K ; # CYRILLIC CAPITAL LETTER KA к → k ; # CYRILLIC SMALL LETTER KA Л → L ; # CYRILLIC CAPITAL LETTER EL л → l ; # CYRILLIC SMALL LETTER EL М → M ; # CYRILLIC CAPITAL LETTER EM м → m ; # CYRILLIC SMALL LETTER EM Н → N ; # CYRILLIC CAPITAL LETTER EN н → n ; # CYRILLIC SMALL LETTER EN О → O ; # CYRILLIC CAPITAL LETTER O о → o ; # CYRILLIC SMALL LETTER O П → P ; # CYRILLIC CAPITAL LETTER PE п → p ; # CYRILLIC SMALL LETTER PE Р → R ; # CYRILLIC CAPITAL LETTER ER р → r ; # CYRILLIC SMALL LETTER ER С → S ; # CYRILLIC CAPITAL LETTER ES с → s ; # CYRILLIC SMALL LETTER ES # # ######################################################################## # BGN Page 94 Rule 3.5 # # тс becomes t·s # ######################################################################## # # REMOVEOPTIONAL(ftang) The following three rules for · option is commented out # and change to the version without · # ТС → T·S ; # CYRILLIC CAPITAL LETTER TE # Тс → T·s ; # CYRILLIC CAPITAL LETTER TE # тс → t·s ; # CYRILLIC SMALL LETTER TE ТС → TS ; # CYRILLIC CAPITAL LETTER TE Тс → Ts ; # CYRILLIC CAPITAL LETTER TE тс → ts ; # CYRILLIC SMALL LETTER TE Т → T ; # CYRILLIC CAPITAL LETTER TE т → t ; # CYRILLIC SMALL LETTER TE # # ######################################################################## # End Rule 3.5 # ######################################################################## # У → U ; # CYRILLIC CAPITAL LETTER U у → u ; # CYRILLIC SMALL LETTER U Ф → F ; # 
CYRILLIC CAPITAL LETTER EF ф → f ; # CYRILLIC SMALL LETTER EF Х} $lower → Kh ; # CYRILLIC CAPITAL LETTER HA Х → KH ; # CYRILLIC CAPITAL LETTER HA х → kh ; # CYRILLIC SMALL LETTER HA Ц} $lower → Ts ; # CYRILLIC CAPITAL LETTER TSE Ц → TS ; # CYRILLIC CAPITAL LETTER TSE ц → ts ; # CYRILLIC SMALL LETTER TSE Ч} $lower → Ch ; # CYRILLIC CAPITAL LETTER CHE Ч → CH ; # CYRILLIC CAPITAL LETTER CHE ч → ch ; # CYRILLIC SMALL LETTER CHE # # ######################################################################## # BGN Page 94 Rule 3.6 # # шч becomes sh·ch # ######################################################################## # # REMOVEOPTIONAL(ftang) The following three rules for · option is commented out # and change to the version without · # ШЧ → SH·CH ; # CYRILLIC CAPITAL LETTER SHA # Шч → Sh·ch ; # CYRILLIC CAPITAL LETTER SHA # шч → sh·ch ; # CYRILLIC SMALL LETTER SHA ШЧ → SHCH ; # CYRILLIC CAPITAL LETTER SHA Шч → Shch ; # CYRILLIC CAPITAL LETTER SHA шч → shch ; # CYRILLIC SMALL LETTER SHA Ш} $lower → Sh ; # CYRILLIC CAPITAL LETTER SHA Ш → SH ; # CYRILLIC CAPITAL LETTER SHA ш → sh ; # CYRILLIC SMALL LETTER SHA Щ} $lower → Shch ; # CYRILLIC CAPITAL LETTER SHCHA Щ → SHCH ; # CYRILLIC CAPITAL LETTER SHCHA щ → shch ; # CYRILLIC SMALL LETTER SHCHA # # ######################################################################## # End Rule 3.6 # ######################################################################## # Ъ → $doublePrime ; # CYRILLIC CAPITAL LETTER HARD SIGN ъ → $doublePrime ; # CYRILLIC SMALL LETTER HARD SIGN # # ######################################################################## # BGN Page 94 Rule 3.2 # # ы before а, у, ы, or э becomes у· # BGN Page 94 Rule 3.3 # # ы after any vowel character becomes ·у ######################################################################## # # BUG(ftang) the following line said the vowels will change # $vowels}Ы → ·Y ; # CYRILLIC CAPITAL LETTER I # $vowels}ы → ·y ; # CYRILLIC CAPITAL LETTER I # REMOVEOPTIONAL(ftang) The 
following two rules for · option is commented out. #Ы}[АаУуЫыЭэ] → Y· ; # CYRILLIC CAPITAL LETTER YERU #ы}[ауыэ] → y· ; # CYRILLIC SMALL LETTER YERU Ы → Y ; # CYRILLIC CAPITAL LETTER YERU ы → y ; # CYRILLIC SMALL LETTER YERU # # ######################################################################## # End Rule 3.2 and 3.3 # ######################################################################## # Ь → $prime ; # CYRILLIC CAPITAL LETTER SOFT SIGN ь → $prime ; # CYRILLIC SMALL LETTER SOFT SIGN Э → E ; # CYRILLIC CAPITAL LETTER E э → e ; # CYRILLIC SMALL LETTER E Ю} $lower → Yu ; # CYRILLIC CAPITAL LETTER YU Ю → YU ; # CYRILLIC CAPITAL LETTER YU ю → yu ; # CYRILLIC SMALL LETTER YU Я} $lower → Ya ; # CYRILLIC CAPITAL LETTER YA Я → YA ; # CYRILLIC CAPITAL LETTER YA я → ya ; # CYRILLIC SMALL LETTER YA |