Index: source/data/translit/tk_Cyrl_tk_BGN.txt |
diff --git a/source/data/translit/tk_Cyrl_tk_BGN.txt b/source/data/translit/tk_Cyrl_tk_BGN.txt |
new file mode 100644 |
index 0000000000000000000000000000000000000000..da7785433acd9d1568158430d0d4cc9e1cf54f26 |
--- /dev/null |
+++ b/source/data/translit/tk_Cyrl_tk_BGN.txt |
@@ -0,0 +1,308 @@ |
+# © 2016 and later: Unicode, Inc. and others. |
+# License & terms of use: http://www.unicode.org/copyright.html#License |
+# |
+# File: tk_Cyrl_tk_BGN.txt |
+# Generated from CLDR |
+# |
+ |
+# |
+######################################################################## |
+# BGN/PCGN 1979 System |
+# |
+# The BGN/PCGN system for Turkmen was designed for use in |
+# romanizing names written in the Turkmen alphabet. |
+# The Turkmen alphabet contains five letters not present |
+# in the Russian alphabet: Җҗ, Ңң, Өө, Үү, and Әә. |
+# |
+# The Turkmen Cyrillic Alphabet as defined by the BGN (Page 103): |
+# |
+# АБВГДЕЁЖҖЗИЙКЛМНҢОӨПРСТУҮФХЦЧШЩЪЫЬЭӘЮЯ |
+# абвгдеёжзҗийклмнңоөпрстуүфхцчшщъыьэәюя |
+# |
+# Originally prepared by Michael Everson <everson@evertype.com> |
+######################################################################## |
+# |
+# MINIMAL FILTER: Turkmen-Latin |
+# |
+# :: [АБВГДЕЁЖҖЗИЙКЛМНҢОӨПРСТУҮФХЦЧШЩЪЫЬЭӘЮЯабвгдеёжзҗийклмнңоөпрстуүфхцчшщъыьэәюя] ; |
+:: NFD (NFC) ; |
+# |
+# |
+######################################################################## |
+# |
+######################################################################## |
+# |
+# Define All Transformation Variables |
+# |
+######################################################################## |
+# |
+$prime = ʹ ; |
+$doublePrime = ʺ ; |
+$upperConsonants = [БВГДЖҖЗЙКЛМНҢПРСТФХЦЧШЩЪЬ] ; |
+$lowerConsonants = [бвгджҗзйклмнңпрстфхцчшщъь] ; |
+$consonants = [$upperConsonants $lowerConsonants] ; |
+$upperVowels = [АЕЁИОӨУҮЫЭӘЮЯ] ; |
+$lowerVowels = [аеёиоөуүыэәюя] ; |
+$vowels = [$upperVowels $lowerVowels] ; |
+$lower = [$lowerConsonants $lowerVowels] ; |
+# |
+# |
+# Use this $wordBoundary until bug 2034 is fixed in ICU: |
+# http://bugs.icu-project.org/cgi-bin/icu-bugs/transliterate?id=2034;expression=boundary;user=guest |
+# |
+$wordBoundary = [^[:L:][:M:][:N:]] ; |
+# |
+# |
+######################################################################## |
+# |
+######################################################################## |
+# |
+# Start of Alphabetic Transformations |
+# |
+######################################################################## |
+# |
+А → A ; # CYRILLIC CAPITAL LETTER A |
+а → a ; # CYRILLIC SMALL LETTER A |
+Б → B ; # CYRILLIC CAPITAL LETTER BE |
+б → b ; # CYRILLIC SMALL LETTER BE |
+В → W ; # CYRILLIC CAPITAL LETTER VE |
+в → w ; # CYRILLIC SMALL LETTER VE |
+Г → G ; # CYRILLIC CAPITAL LETTER GHE |
+г → g ; # CYRILLIC SMALL LETTER GHE |
+Д → D ; # CYRILLIC CAPITAL LETTER DE |
+д → d ; # CYRILLIC SMALL LETTER DE |
+# |
+# |
+######################################################################## |
+# |
+# BGN Page 104 Rule 1: |
+# |
+# The character e should be romanized ye initially, after the vowel |
+# characters a, e, ё, и, о, ө, у, ү, ы, э, ю, and я, and after й, ъ, and ь. |
+# In all other instances, it should be romanized e. |
+# |
+######################################################################## |
+# |
+Е}[[$upperVowels - [Ә]] [ЙЪЬ]] → YE ; # CYRILLIC CAPITAL LETTER IE |
+Е}[[$lowerVowels - [ә]] [йъь]] → Ye ; # CYRILLIC CAPITAL LETTER IE |
+$wordBoundary{Е → Ye ; # CYRILLIC CAPITAL LETTER IE |
+Е → E ; # CYRILLIC CAPITAL LETTER IE |
+е}[[$upperVowels - [Ә]] [$lowerVowels - [ә]] [ЙйЪъЬь]] → ye ; # CYRILLIC SMALL LETTER IE |
+$wordBoundary{е → ye ; # CYRILLIC SMALL LETTER IE |
+е → e ; # CYRILLIC SMALL LETTER IE |
+# |
+# |
+######################################################################## |
+# |
+# End of Rule 1 |
+# |
+######################################################################## |
+# |
+Ё} $lower → Yo ; # CYRILLIC CAPITAL LETTER IO |
+Ё → YO ; # CYRILLIC CAPITAL LETTER IO |
+ё → yo ; # CYRILLIC SMALL LETTER IO |
+Ж} $lower → Zh ; # CYRILLIC CAPITAL LETTER ZHE |
+Ж → ZH ; # CYRILLIC CAPITAL LETTER ZHE |
+ж → zh ; # CYRILLIC SMALL LETTER ZHE |
+# |
+# |
+######################################################################## |
+# |
+# BGN Page 104 Rule 2 |
+# |
+# The character sequences зх, нг, сх, and цх may be romanized z·h, |
+# n·g, s·h, and ts·h in order to differentiate those romanizations form |
+# the digraphs zh, ng, sh, and the letter sequence tsh, which are used |
+# to render the characters ж, ң, ш, and the character sequence тш. |
+# |
+######################################################################## |
+# |
+ЗХ → Z·H ; # CYRILLIC CAPITAL LETTER ZE |
+Зх → Z·h ; # CYRILLIC CAPITAL LETTER ZE |
+зх → z·h ; # CYRILLIC SMALL LETTER ZE |
+З → Z ; # CYRILLIC CAPITAL LETTER ZE |
+з → z ; # CYRILLIC SMALL LETTER ZE |
+# |
+# |
+######################################################################## |
+# |
+# End Rule 2 |
+# |
+######################################################################## |
+# |
+И → И ; # CYRILLIC CAPITAL LETTER I |
+и → и ; # CYRILLIC SMALL LETTER I |
+Й → Y ; # CYRILLIC CAPITAL LETTER I |
+й → y ; # CYRILLIC SMALL LETTER I |
+К → K ; # CYRILLIC CAPITAL LETTER KA |
+к → k ; # CYRILLIC SMALL LETTER KA |
+Л → L ; # CYRILLIC CAPITAL LETTER EL |
+л → l ; # CYRILLIC SMALL LETTER EL |
+М → M ; # CYRILLIC CAPITAL LETTER EM |
+м → m ; # CYRILLIC SMALL LETTER EM |
+# |
+# |
+######################################################################## |
+# |
+# BGN Page 104 Rule 2 |
+# |
+# нг becomes n·g |
+# |
+######################################################################## |
+# |
+НГ → N·G ; # CYRILLIC CAPITAL LETTER EN |
+Нг → N·g ; # CYRILLIC CAPITAL LETTER EN |
+нг → n·g ; # CYRILLIC SMALL LETTER EN |
+Н → N ; # CYRILLIC CAPITAL LETTER EN |
+н → n ; # CYRILLIC SMALL LETTER EN |
+# |
+# |
+######################################################################## |
+# |
+# End Rule 2 |
+# |
+######################################################################## |
+# |
+Ң} $lower → Ng ; # CYRILLIC CAPITAL LETTER EN WITH DESCENDER |
+Ң → NG ; # CYRILLIC CAPITAL LETTER EN WITH DESCENDER |
+ң → ng ; # CYRILLIC SMALL LETTER EN WITH DESCENDER |
+О → O ; # CYRILLIC CAPITAL LETTER O |
+о → o ; # CYRILLIC SMALL LETTER O |
+Ө → Ö ; # CYRILLIC CAPITAL LETTER BARRED O |
+ө → ö ; # CYRILLIC SMALL LETTER BARRED O |
+П → P ; # CYRILLIC CAPITAL LETTER PE |
+п → p ; # CYRILLIC SMALL LETTER PE |
+Р → R ; # CYRILLIC CAPITAL LETTER ER |
+р → r ; # CYRILLIC SMALL LETTER ER |
+# |
+# |
+######################################################################## |
+# |
+# BGN Page 104 Rule 2 |
+# |
+# сх becomes s·h |
+# |
+######################################################################## |
+# |
+СХ → S·H ; # CYRILLIC CAPITAL LETTER ES |
+Сх → S·h ; # CYRILLIC CAPITAL LETTER ES |
+сх → s·h ; # CYRILLIC SMALL LETTER ES |
+С → S ; # CYRILLIC CAPITAL LETTER ES |
+с → s ; # CYRILLIC SMALL LETTER ES |
+# |
+# |
+######################################################################## |
+# |
+# End Rule 2 |
+# |
+######################################################################## |
+# |
+Т → T ; # CYRILLIC CAPITAL LETTER TE |
+т → t ; # CYRILLIC SMALL LETTER TE |
+У → U ; # CYRILLIC CAPITAL LETTER U |
+у → u ; # CYRILLIC SMALL LETTER U |
+Ү → Ü ; # CYRILLIC CAPITAL LETTER STRAIGHT U |
+ү → ü ; # CYRILLIC SMALL LETTER STRAIGHT U |
+Ф → F ; # CYRILLIC CAPITAL LETTER EF |
+ф → f ; # CYRILLIC SMALL LETTER EF |
+Х → H ; # CYRILLIC CAPITAL LETTER HA |
+х → h ; # CYRILLIC SMALL LETTER HA |
+# |
+# |
+######################################################################## |
+# |
+# BGN Page 104 Rule 2 |
+# |
+# цх becomes ts·h |
+# |
+######################################################################## |
+# |
+ЦХ → TS·H ; # CYRILLIC CAPITAL LETTER GHE |
+Цх → Ts·h ; # CYRILLIC CAPITAL LETTER GHE |
+цх → ts·h ; # CYRILLIC SMALL LETTER GHE |
+Ц} $lower → Ts ; # CYRILLIC CAPITAL LETTER TSE |
+Ц → TS ; # CYRILLIC CAPITAL LETTER TSE |
+ц → ts ; # CYRILLIC SMALL LETTER TSE |
+# |
+# |
+######################################################################## |
+# |
+# End Rule 2 |
+# |
+######################################################################## |
+# |
+Ч} $lower → Ch ; # CYRILLIC CAPITAL LETTER CHE |
+Ч → CH ; # CYRILLIC CAPITAL LETTER CHE |
+ч → ch ; # CYRILLIC SMALL LETTER CHE |
+# |
+# |
+######################################################################## |
+# |
+# Implied rule from BGN Russian-Latin transliteration (Page 94 Note 3.6). |
+# |
+# шч becomes sh·ch |
+# |
+######################################################################## |
+# |
+ШЧ → SH·CH ; # CYRILLIC CAPITAL LETTER SHA |
+Шч → Sh·ch ; # CYRILLIC CAPITAL LETTER SHA |
+шч → sh·ch ; # CYRILLIC SMALL LETTER SHA |
+Ш} $lower → Sh ; # CYRILLIC CAPITAL LETTER SHA |
+Ш → SH ; # CYRILLIC CAPITAL LETTER SHA |
+ш → sh ; # CYRILLIC SMALL LETTER SHA |
+Щ} $lower → Shch ; # CYRILLIC CAPITAL LETTER SHCHA |
+Щ → SHCH ; # CYRILLIC CAPITAL LETTER SHCHA |
+щ → shch ; # CYRILLIC SMALL LETTER SHCHA |
+# |
+# |
+######################################################################## |
+# |
+# End Implied rule |
+# |
+######################################################################## |
+# |
+Ъ → $doublePrime ; # CYRILLIC CAPITAL LETTER HARD SIGN |
+ъ → $doublePrime ; # CYRILLIC SMALL LETTER HARD SIGN |
+# |
+# |
+######################################################################## |
+# |
+# BGN Page 104 Note 3 |
+# |
+# The character Ыы may be romanized Ɨɨ instead of Yy, if so desired. |
+# |
+######################################################################## |
+# |
+Ы → Y ; # CYRILLIC CAPITAL LETTER YERU |
+ы → y ; # CYRILLIC SMALL LETTER YERU |
+# |
+# |
+# Alternative rule to implement the option described here. To apply |
+# uncomment the following by removing the '#' mark at the start of the |
+# line and insert before the two rule lines above. |
+# |
+#Ы → Ɨ ; # CYRILLIC CAPITAL LETTER YERU |
+#ы → ɨ ; # CYRILLIC SMALL LETTER YERU |
+# |
+######################################################################## |
+# |
+# End BGN Page 104 Note 2 |
+# |
+######################################################################## |
+# |
+Ь → $prime ; # CYRILLIC CAPITAL LETTER SOFT SIGN |
+ь → $prime ; # CYRILLIC SMALL LETTER SOFT SIGN |
+Э → E ; # CYRILLIC CAPITAL LETTER E |
+э → e ; # CYRILLIC SMALL LETTER E |
+Ә → Ä ; # CYRILLIC CAPITAL LETTER SCHWA |
+ә → ä ; # CYRILLIC SMALL LETTER SCHWA |
+Ю} $lower → Yu ; # CYRILLIC CAPITAL LETTER YU |
+Ю → YU ; # CYRILLIC CAPITAL LETTER YU |
+ю → yu ; # CYRILLIC SMALL LETTER YU |
+Я} $lower → Ya ; # CYRILLIC CAPITAL LETTER YA |
+Я → YA ; # CYRILLIC CAPITAL LETTER YA |
+я → ya ; # CYRILLIC SMALL LETTER YA |
+# |
+# |
+######################################################################## |
+ |