Index: source/data/translit/bg_bg_Latn_BGN.txt |
diff --git a/source/data/translit/bg_bg_Latn_BGN.txt b/source/data/translit/bg_bg_Latn_BGN.txt |
new file mode 100644 |
index 0000000000000000000000000000000000000000..d8351ce9bb4166fd24e3f8ae21c57e493992f756 |
--- /dev/null |
+++ b/source/data/translit/bg_bg_Latn_BGN.txt |
@@ -0,0 +1,243 @@ |
+# © 2016 and later: Unicode, Inc. and others. |
+# License & terms of use: http://www.unicode.org/copyright.html#License |
+# |
+# File: bg_bg_Latn_BGN.txt |
+# Generated from CLDR |
+# |
+ |
+# |
+######################################################################## |
+# BGN/PCGN 1952 System |
+# |
+# This system was adopted by the BGN in 1949 and by the PCGN in 1952. |
+# It reflects the much simplified Bulgarian orthography as officially |
+# revised in February 1945. The Bulgarian alphabet contains all of |
+# the characters present in the Russian alphabet with the exception |
+# of Ёё, Ыы, and Ээ. Two obsolete letters Ѫѫ and Ѣѣ are also given. |
+# |
+# The Bulgarian Alphabet as defined by the BGN (Page 15): |
+# |
+# АБВГДЕЖЗИЙКЛМНОПРСТУФХЦЧШЩЪЬЮЯѪѢ |
+# абвгдежзийклмнопрстуфхцчшщъьюяѫѣ |
+# |
+# Originally prepared by Michael Everson <everson@evertype.com> |
+######################################################################## |
+# |
+# MINIMAL FILTER: Bulgarian-Latin |
+# |
+:: [АБВГДЕЖЗИЙКЛМНОПРСТУФХЦЧШЩЪЬЮЯѪѢабвгдежзийклмнопрстуфхцчшщъьюяѫѣ] ; |
+:: NFD (NFC) ; |
+# |
+# |
+######################################################################## |
+# |
+######################################################################## |
+# |
+# Define All Transformation Variables |
+# |
+######################################################################## |
+# |
+$upperConsonants = [БВГДЖЗЙКЛМНПРСТФХЦЧШЩЬ] ; |
+$lowerConsonants = [бвгджзйклмнпрстфхцчшщь] ; |
+$consonants = [$upperConsonants $lowerConsonants] ; |
+$upperVowels = [АЕИОУЪЮЯѪѢ] ; |
+$lowerVowels = [аеиоуъюяѫѣ] ; |
+$vowels = [$upperVowels $lowerVowels] ; |
+$lower = [$lowerConsonants $lowerVowels] ; |
+$bulgarian = [ $lower $upperConsonants $upperVowels ] ; |
+# |
+# |
+# Use this $wordBoundary until bug 2034 is fixed in ICU: |
+# http://bugs.icu-project.org/cgi-bin/icu-bugs/transliterate?id=2034;expression=boundary;user=guest |
+# |
+$wordBoundary = [^[:L:][:M:][:N:]] ; |
+# |
+# |
+######################################################################## |
+# |
+######################################################################## |
+# |
+# Start of Alphabetic Transformations |
+# |
+######################################################################## |
+# |
+А → A ; # CYRILLIC CAPITAL LETTER A |
+а → a ; # CYRILLIC SMALL LETTER A |
+Б → B ; # CYRILLIC CAPITAL LETTER BE |
+б → b ; # CYRILLIC SMALL LETTER BE |
+В → V ; # CYRILLIC CAPITAL LETTER VE |
+в → v ; # CYRILLIC SMALL LETTER VE |
+Г → G ; # CYRILLIC CAPITAL LETTER GHE |
+г → g ; # CYRILLIC SMALL LETTER GHE |
+Д → D ; # CYRILLIC CAPITAL LETTER DE |
+д → d ; # CYRILLIC SMALL LETTER DE |
+Е → E ; # CYRILLIC CAPITAL LETTER DE |
+е → e ; # CYRILLIC SMALL LETTER DE |
+Ж} $lower → Zh ; # CYRILLIC CAPITAL LETTER ZHE |
+Ж → ZH ; # CYRILLIC CAPITAL LETTER ZHE |
+ж → zh ; # CYRILLIC SMALL LETTER ZHE |
+З → Z ; # CYRILLIC CAPITAL LETTER ZE |
+з → z ; # CYRILLIC SMALL LETTER ZE |
+И → I ; # CYRILLIC CAPITAL LETTER I |
+и → i ; # CYRILLIC SMALL LETTER I |
+Й → Y ; # CYRILLIC CAPITAL LETTER I |
+й → y ; # CYRILLIC SMALL LETTER I |
+К → K ; # CYRILLIC CAPITAL LETTER KA |
+к → k ; # CYRILLIC SMALL LETTER KA |
+Л → L ; # CYRILLIC CAPITAL LETTER EL |
+л → l ; # CYRILLIC SMALL LETTER EL |
+М → M ; # CYRILLIC CAPITAL LETTER EM |
+м → m ; # CYRILLIC SMALL LETTER EM |
+Н → N ; # CYRILLIC CAPITAL LETTER EN |
+н → n ; # CYRILLIC SMALL LETTER EN |
+О → O ; # CYRILLIC CAPITAL LETTER O |
+о → o ; # CYRILLIC SMALL LETTER O |
+П → P ; # CYRILLIC CAPITAL LETTER PE |
+п → p ; # CYRILLIC SMALL LETTER PE |
+Р → R ; # CYRILLIC CAPITAL LETTER ER |
+р → r ; # CYRILLIC SMALL LETTER ER |
+С → S ; # CYRILLIC CAPITAL LETTER ES |
+с → s ; # CYRILLIC SMALL LETTER ES |
+# |
+# |
+######################################################################## |
+# |
+# BGN Page 16 Note 4 |
+# |
+# тс becomes t·s |
+# |
+######################################################################## |
+# |
+ТС → T·S ; # CYRILLIC CAPITAL LETTER TE |
+Тс → T·s ; # CYRILLIC CAPITAL LETTER TE |
+тс → t·s ; # CYRILLIC SMALL LETTER TE |
+Т → T ; # CYRILLIC CAPITAL LETTER TE |
+т → t ; # CYRILLIC SMALL LETTER TE |
+# |
+# |
+######################################################################## |
+# |
+# End Note 4 |
+# |
+######################################################################## |
+У → U ; # CYRILLIC CAPITAL LETTER U |
+у → u ; # CYRILLIC SMALL LETTER U |
+Ф → F ; # CYRILLIC CAPITAL LETTER EF |
+ф → f ; # CYRILLIC SMALL LETTER EF |
+Х} $lower → Kh ; # CYRILLIC CAPITAL LETTER HA |
+Х → KH ; # CYRILLIC CAPITAL LETTER HA |
+х → kh ; # CYRILLIC SMALL LETTER HA |
+Ц} $lower → Ts ; # CYRILLIC CAPITAL LETTER TSE |
+Ц → TS ; # CYRILLIC CAPITAL LETTER TSE |
+ц → ts ; # CYRILLIC SMALL LETTER TSE |
+Ч} $lower → Ch ; # CYRILLIC CAPITAL LETTER CHE |
+Ч → CH ; # CYRILLIC CAPITAL LETTER CHE |
+ч → ch ; # CYRILLIC SMALL LETTER CHE |
+# |
+######################################################################## |
+# |
+# Implied rule from BGN Russian-Latin transliteration (Page 94 Note 3.6). |
+# |
+# шт becomes sh·t |
+# |
+######################################################################## |
+# |
+ШТ → SH·T ; # CYRILLIC CAPITAL LETTER SHA |
+Шт → Sh·t ; # CYRILLIC CAPITAL LETTER SHA |
+шт → sh·t ; # CYRILLIC SMALL LETTER SHA |
+Ш} $lower → Sh ; # CYRILLIC CAPITAL LETTER SHA |
+Ш → SH ; # CYRILLIC CAPITAL LETTER SHA |
+ш → sh ; # CYRILLIC SMALL LETTER SHA |
+Щ} $lower → Sht ; # CYRILLIC CAPITAL LETTER SHCHA |
+Щ → SHT ; # CYRILLIC CAPITAL LETTER SHCHA |
+щ → sht ; # CYRILLIC SMALL LETTER SHCHA |
+# |
+# |
+######################################################################## |
+# |
+# End Implied rule |
+# |
+######################################################################## |
+Ъ → Ŭ ; # CYRILLIC CAPITAL LETTER HARD SIGN |
+ъ → ŭ ; # CYRILLIC SMALL LETTER HARD SIGN |
+# |
+######################################################################## |
+# |
+# BGN Page 16 Note 1 |
+# |
+# In modern Bulgarian orthography, the character ъ does not occur in |
+# word-final position. It should be omitted in romanization when found |
+# on older sources. |
+# |
+# The following rule removes all Ъъ at the end of a word. It is assumed |
+# that when the condition is met, the text must be from an older source. |
+# Comment out with a '#' at the start of a line to disable. |
+# |
+# |
+######################################################################## |
+# |
+$bulgarian { [Ъъ] } $wordBoundary > ; |
+# |
+# |
+######################################################################## |
+# |
+# End BGN Page 16 Note 1 |
+# |
+######################################################################## |
+Ь → ’ ; # CYRILLIC CAPITAL LETTER SOFT SIGN |
+ь → ’ ; # CYRILLIC SMALL LETTER SOFT SIGN |
+Ю} $lower → Yu ; # CYRILLIC CAPITAL LETTER YU |
+Ю → YU ; # CYRILLIC CAPITAL LETTER YU |
+ю → yu ; # CYRILLIC SMALL LETTER YU |
+Я} $lower → Ya ; # CYRILLIC CAPITAL LETTER YA |
+Я → YA ; # CYRILLIC CAPITAL LETTER YA |
+я → ya ; # CYRILLIC SMALL LETTER YA |
+# |
+######################################################################## |
+# |
+# BGN Page 16 Note 2 |
+# |
+# The obsolete character Ѫ, which was replaced by Ъ in 1945, should be |
+# romanized Ŭ. |
+# |
+######################################################################## |
+# |
+Ѫ → Ŭ ; # CYRILLIC CAPITAL LETTER BIG YUS |
+ѫ → ŭ ; # CYRILLIC SMALL LETTER BIG YUS |
+# |
+# |
+######################################################################## |
+# |
+# End BGN Page 16 Note 2 |
+# |
+######################################################################## |
+# |
+######################################################################## |
+# |
+# BGN Page 16 Note 3 |
+# |
+# The obsolete character Ѣ, replaced in 1945 by Я or Е according to local |
+# pronunciation, should be romanized as e or ya, accordingly, if the |
+# pronunciation is known; otherwise as ye. |
+# |
+######################################################################## |
+# |
+Ѣ} $lower → Ye ; # CYRILLIC CAPITAL LETTER YAT |
+Ѣ → YE ; # CYRILLIC CAPITAL LETTER YAT |
+ѣ → ye ; # CYRILLIC SMALL LETTER YAT |
+# |
+# |
+# Alternative rule where appropriate for local pronounciation. To apply |
+# uncomment the following by removing the '#' mark at the start of the |
+# line and insert before the three rule lines above. |
+# |
+# Ѣ} $lower → e ; # CYRILLIC CAPITAL LETTER YAT |
+# Ѣ → E ; # CYRILLIC CAPITAL LETTER YAT |
+# ѣ → e ; # CYRILLIC SMALL LETTER YAT |
+# |
+######################################################################## |
+# |
+# End BGN Page 16 Note 3 |
+# |
+######################################################################## |
+ |