| Index: source/data/translit/tk_Cyrl_tk_BGN.txt
|
| diff --git a/source/data/translit/tk_Cyrl_tk_BGN.txt b/source/data/translit/tk_Cyrl_tk_BGN.txt
|
| new file mode 100644
|
| index 0000000000000000000000000000000000000000..da7785433acd9d1568158430d0d4cc9e1cf54f26
|
| --- /dev/null
|
| +++ b/source/data/translit/tk_Cyrl_tk_BGN.txt
|
| @@ -0,0 +1,308 @@
|
| +# © 2016 and later: Unicode, Inc. and others.
|
| +# License & terms of use: http://www.unicode.org/copyright.html#License
|
| +#
|
| +# File: tk_Cyrl_tk_BGN.txt
|
| +# Generated from CLDR
|
| +#
|
| +
|
| +#
|
| +########################################################################
|
| +# BGN/PCGN 1979 System
|
| +#
|
| +# The BGN/PCGN system for Turkmen was designed for use in
|
| +# romanizing names written in the Turkmen alphabet.
|
| +# The Turkmen alphabet contains five letters not present
|
| +# in the Russian alphabet: Җҗ, Ңң, Өө, Үү, and Әә.
|
| +#
|
| +# The Turkmen Cyrillic Alphabet as defined by the BGN (Page 103):
|
| +#
|
| +# АБВГДЕЁЖҖЗИЙКЛМНҢОӨПРСТУҮФХЦЧШЩЪЫЬЭӘЮЯ
|
| +# абвгдеёжҗзийклмнңоөпрстуүфхцчшщъыьэәюя
|
| +#
|
| +# Originally prepared by Michael Everson <everson@evertype.com>
|
| +########################################################################
|
| +#
|
| +# MINIMAL FILTER: Turkmen-Latin
|
| +#
|
| +# :: [АБВГДЕЁЖҖЗИЙКЛМНҢОӨПРСТУҮФХЦЧШЩЪЫЬЭӘЮЯабвгдеёжзҗийклмнңоөпрстуүфхцчшщъыьэәюя] ;
|
| +:: NFD (NFC) ;
|
| +# NOTE(review): NFD decomposes Ё/ё and Й/й into base letter + combining mark; confirm the rules for those letters below still match.
|
| +#
|
| +########################################################################
|
| +#
|
| +########################################################################
|
| +#
|
| +# Define All Transformation Variables
|
| +#
|
| +########################################################################
|
| +# Character classes used as rule context. $lower is the after-context that selects title-case output (e.g. Yo rather than YO).
|
| +$prime = ʹ ;
|
| +$doublePrime = ʺ ;
|
| +$upperConsonants = [БВГДЖҖЗЙКЛМНҢПРСТФХЦЧШЩЪЬ] ;
|
| +$lowerConsonants = [бвгджҗзйклмнңпрстфхцчшщъь] ;
|
| +$consonants = [$upperConsonants $lowerConsonants] ;
|
| +$upperVowels = [АЕЁИОӨУҮЫЭӘЮЯ] ;
|
| +$lowerVowels = [аеёиоөуүыэәюя] ;
|
| +$vowels = [$upperVowels $lowerVowels] ;
|
| +$lower = [$lowerConsonants $lowerVowels] ;
|
| +# NOTE(review): $consonants and $vowels are not referenced by any rule visible in this file.
|
| +#
|
| +# Use this $wordBoundary until bug 2034 is fixed in ICU:
|
| +# http://bugs.icu-project.org/cgi-bin/icu-bugs/transliterate?id=2034;expression=boundary;user=guest
|
| +#
|
| +$wordBoundary = [^[:L:][:M:][:N:]] ;
|
| +#
|
| +#
|
| +########################################################################
|
| +#
|
| +########################################################################
|
| +#
|
| +# Start of Alphabetic Transformations
|
| +#
|
| +########################################################################
|
| +# Unconditional one-to-one mappings (no context needed).
|
| +А → A ; # CYRILLIC CAPITAL LETTER A
|
| +а → a ; # CYRILLIC SMALL LETTER A
|
| +Б → B ; # CYRILLIC CAPITAL LETTER BE
|
| +б → b ; # CYRILLIC SMALL LETTER BE
|
| +В → W ; # CYRILLIC CAPITAL LETTER VE
|
| +в → w ; # CYRILLIC SMALL LETTER VE
|
| +Г → G ; # CYRILLIC CAPITAL LETTER GHE
|
| +г → g ; # CYRILLIC SMALL LETTER GHE
|
| +Д → D ; # CYRILLIC CAPITAL LETTER DE
|
| +д → d ; # CYRILLIC SMALL LETTER DE
|
| +#
|
| +#
|
| +########################################################################
|
| +#
|
| +# BGN Page 104 Rule 1:
|
| +#
|
| +# The character e should be romanized ye initially, after the vowel
|
| +# characters a, e, ё, и, о, ө, у, ү, ы, э, ю, and я, and after й, ъ, and ь.
|
| +# In all other instances, it should be romanized e.
|
| +#
|
| +########################################################################
|
| +# NOTE(review): "X } set" is after-context, so the rules written with } test the letter FOLLOWING Е/е, while Rule 1 above describes the PRECEDING letter - confirm intent.
|
| +Е}[[$upperVowels - [Ә]] [ЙЪЬ]] → YE ; # CYRILLIC CAPITAL LETTER IE
|
| +Е}[[$lowerVowels - [ә]] [йъь]] → Ye ; # CYRILLIC CAPITAL LETTER IE
|
| +$wordBoundary{Е → Ye ; # CYRILLIC CAPITAL LETTER IE
|
| +Е → E ; # CYRILLIC CAPITAL LETTER IE
|
| +е}[[$upperVowels - [Ә]] [$lowerVowels - [ә]] [ЙйЪъЬь]] → ye ; # CYRILLIC SMALL LETTER IE
|
| +$wordBoundary{е → ye ; # CYRILLIC SMALL LETTER IE
|
| +е → e ; # CYRILLIC SMALL LETTER IE
|
| +#
|
| +#
|
| +########################################################################
|
| +#
|
| +# End of Rule 1
|
| +#
|
| +########################################################################
|
| +# Digraph capitals are title-cased before a lowercase letter; Җ/җ (listed in the alphabet above) map to J/j.
|
| +Ё} $lower → Yo ; # CYRILLIC CAPITAL LETTER IO
|
| +Ё → YO ; # CYRILLIC CAPITAL LETTER IO
|
| +ё → yo ; # CYRILLIC SMALL LETTER IO
|
| +Ж} $lower → Zh ; # CYRILLIC CAPITAL LETTER ZHE
|
| +Ж → ZH ; # CYRILLIC CAPITAL LETTER ZHE
|
| +ж → zh ; # CYRILLIC SMALL LETTER ZHE
|
| +Җ → J ; # CYRILLIC CAPITAL LETTER ZHE WITH DESCENDER
|
| +җ → j ; # CYRILLIC SMALL LETTER ZHE WITH DESCENDER
|
| +########################################################################
|
| +#
|
| +# BGN Page 104 Rule 2
|
| +#
|
| +# The character sequences зх, нг, сх, and цх may be romanized z·h,
|
| +# n·g, s·h, and ts·h in order to differentiate those romanizations from
|
| +# the digraphs zh, ng, sh, and the letter sequence tsh, which are used
|
| +# to render the characters ж, ң, ш, and the character sequence тш.
|
| +#
|
| +########################################################################
|
| +# The two-letter зх rules are listed ahead of the single-letter З/з rules.
|
| +ЗХ → Z·H ; # CYRILLIC CAPITAL LETTER ZE
|
| +Зх → Z·h ; # CYRILLIC CAPITAL LETTER ZE
|
| +зх → z·h ; # CYRILLIC SMALL LETTER ZE
|
| +З → Z ; # CYRILLIC CAPITAL LETTER ZE
|
| +з → z ; # CYRILLIC SMALL LETTER ZE
|
| +#
|
| +#
|
| +########################################################################
|
| +#
|
| +# End Rule 2
|
| +#
|
| +########################################################################
|
| +# Unconditional one-to-one mappings; И/и romanize to Latin I/i.
|
| +И → I ; # CYRILLIC CAPITAL LETTER I
|
| +и → i ; # CYRILLIC SMALL LETTER I
|
| +Й → Y ; # CYRILLIC CAPITAL LETTER SHORT I
|
| +й → y ; # CYRILLIC SMALL LETTER SHORT I
|
| +К → K ; # CYRILLIC CAPITAL LETTER KA
|
| +к → k ; # CYRILLIC SMALL LETTER KA
|
| +Л → L ; # CYRILLIC CAPITAL LETTER EL
|
| +л → l ; # CYRILLIC SMALL LETTER EL
|
| +М → M ; # CYRILLIC CAPITAL LETTER EM
|
| +м → m ; # CYRILLIC SMALL LETTER EM
|
| +#
|
| +#
|
| +########################################################################
|
| +#
|
| +# BGN Page 104 Rule 2
|
| +#
|
| +# нг becomes n·g
|
| +#
|
| +########################################################################
|
| +# The middle dot keeps нг distinct from the ng produced for ң; the two-letter rules precede the plain Н/н rules.
|
| +НГ → N·G ; # CYRILLIC CAPITAL LETTER EN
|
| +Нг → N·g ; # CYRILLIC CAPITAL LETTER EN
|
| +нг → n·g ; # CYRILLIC SMALL LETTER EN
|
| +Н → N ; # CYRILLIC CAPITAL LETTER EN
|
| +н → n ; # CYRILLIC SMALL LETTER EN
|
| +#
|
| +#
|
| +########################################################################
|
| +#
|
| +# End Rule 2
|
| +#
|
| +########################################################################
|
| +# Ң is title-cased (Ng) before a lowercase letter; the remaining letters map one-to-one.
|
| +Ң} $lower → Ng ; # CYRILLIC CAPITAL LETTER EN WITH DESCENDER
|
| +Ң → NG ; # CYRILLIC CAPITAL LETTER EN WITH DESCENDER
|
| +ң → ng ; # CYRILLIC SMALL LETTER EN WITH DESCENDER
|
| +О → O ; # CYRILLIC CAPITAL LETTER O
|
| +о → o ; # CYRILLIC SMALL LETTER O
|
| +Ө → Ö ; # CYRILLIC CAPITAL LETTER BARRED O
|
| +ө → ö ; # CYRILLIC SMALL LETTER BARRED O
|
| +П → P ; # CYRILLIC CAPITAL LETTER PE
|
| +п → p ; # CYRILLIC SMALL LETTER PE
|
| +Р → R ; # CYRILLIC CAPITAL LETTER ER
|
| +р → r ; # CYRILLIC SMALL LETTER ER
|
| +#
|
| +#
|
| +########################################################################
|
| +#
|
| +# BGN Page 104 Rule 2
|
| +#
|
| +# сх becomes s·h
|
| +#
|
| +########################################################################
|
| +# The middle dot keeps сх distinct from the sh produced for ш; the two-letter rules precede the plain С/с rules.
|
| +СХ → S·H ; # CYRILLIC CAPITAL LETTER ES
|
| +Сх → S·h ; # CYRILLIC CAPITAL LETTER ES
|
| +сх → s·h ; # CYRILLIC SMALL LETTER ES
|
| +С → S ; # CYRILLIC CAPITAL LETTER ES
|
| +с → s ; # CYRILLIC SMALL LETTER ES
|
| +#
|
| +#
|
| +########################################################################
|
| +#
|
| +# End Rule 2
|
| +#
|
| +########################################################################
|
| +# Unconditional one-to-one mappings (no context needed).
|
| +Т → T ; # CYRILLIC CAPITAL LETTER TE
|
| +т → t ; # CYRILLIC SMALL LETTER TE
|
| +У → U ; # CYRILLIC CAPITAL LETTER U
|
| +у → u ; # CYRILLIC SMALL LETTER U
|
| +Ү → Ü ; # CYRILLIC CAPITAL LETTER STRAIGHT U
|
| +ү → ü ; # CYRILLIC SMALL LETTER STRAIGHT U
|
| +Ф → F ; # CYRILLIC CAPITAL LETTER EF
|
| +ф → f ; # CYRILLIC SMALL LETTER EF
|
| +Х → H ; # CYRILLIC CAPITAL LETTER HA
|
| +х → h ; # CYRILLIC SMALL LETTER HA
|
| +#
|
| +#
|
| +########################################################################
|
| +#
|
| +# BGN Page 104 Rule 2
|
| +#
|
| +# цх becomes ts·h
|
| +#
|
| +########################################################################
|
| +# The two-letter цх rules precede the plain Ц/ц rules; Ц alone is title-cased (Ts) before a lowercase letter.
|
| +ЦХ → TS·H ; # CYRILLIC CAPITAL LETTER TSE
|
| +Цх → Ts·h ; # CYRILLIC CAPITAL LETTER TSE
|
| +цх → ts·h ; # CYRILLIC SMALL LETTER TSE
|
| +Ц} $lower → Ts ; # CYRILLIC CAPITAL LETTER TSE
|
| +Ц → TS ; # CYRILLIC CAPITAL LETTER TSE
|
| +ц → ts ; # CYRILLIC SMALL LETTER TSE
|
| +#
|
| +#
|
| +########################################################################
|
| +#
|
| +# End Rule 2
|
| +#
|
| +########################################################################
|
| +# Ч is title-cased (Ch) before a lowercase letter, otherwise fully capitalized (CH).
|
| +Ч} $lower → Ch ; # CYRILLIC CAPITAL LETTER CHE
|
| +Ч → CH ; # CYRILLIC CAPITAL LETTER CHE
|
| +ч → ch ; # CYRILLIC SMALL LETTER CHE
|
| +#
|
| +#
|
| +########################################################################
|
| +#
|
| +# Implied rule from BGN Russian-Latin transliteration (Page 94 Note 3.6).
|
| +#
|
| +# шч becomes sh·ch
|
| +#
|
| +########################################################################
|
| +# The middle dot keeps шч distinct from the shch produced for щ; the two-letter rules precede the plain Ш/ш rules.
|
| +ШЧ → SH·CH ; # CYRILLIC CAPITAL LETTER SHA
|
| +Шч → Sh·ch ; # CYRILLIC CAPITAL LETTER SHA
|
| +шч → sh·ch ; # CYRILLIC SMALL LETTER SHA
|
| +Ш} $lower → Sh ; # CYRILLIC CAPITAL LETTER SHA
|
| +Ш → SH ; # CYRILLIC CAPITAL LETTER SHA
|
| +ш → sh ; # CYRILLIC SMALL LETTER SHA
|
| +Щ} $lower → Shch ; # CYRILLIC CAPITAL LETTER SHCHA
|
| +Щ → SHCH ; # CYRILLIC CAPITAL LETTER SHCHA
|
| +щ → shch ; # CYRILLIC SMALL LETTER SHCHA
|
| +#
|
| +#
|
| +########################################################################
|
| +#
|
| +# End Implied rule
|
| +#
|
| +########################################################################
|
| +# Both cases of the hard sign romanize to the double prime.
|
| +[Ъъ] → $doublePrime ; # CYRILLIC CAPITAL/SMALL LETTER HARD SIGN
|
| +#
|
| +#
|
| +#
|
| +########################################################################
|
| +#
|
| +# BGN Page 104 Note 3
|
| +#
|
| +# The character Ыы may be romanized Ɨɨ instead of Yy, if so desired.
|
| +#
|
| +########################################################################
|
| +# Default romanization of Ыы as Yy; the Ɨɨ alternative is kept commented out below.
|
| +Ы → Y ; # CYRILLIC CAPITAL LETTER YERU
|
| +ы → y ; # CYRILLIC SMALL LETTER YERU
|
| +#
|
| +#
|
| +# Alternative rule to implement the option described here. To apply
|
| +# uncomment the following by removing the '#' mark at the start of the
|
| +# line and insert before the two rule lines above.
|
| +#
|
| +#Ы → Ɨ ; # CYRILLIC CAPITAL LETTER YERU
|
| +#ы → ɨ ; # CYRILLIC SMALL LETTER YERU
|
| +#
|
| +########################################################################
|
| +#
|
| +# End BGN Page 104 Note 3
|
| +#
|
| +########################################################################
|
| +# Both cases of the soft sign map to the prime; Ю and Я are title-cased (Yu, Ya) before a lowercase letter.
|
| +Ь → $prime ; # CYRILLIC CAPITAL LETTER SOFT SIGN
|
| +ь → $prime ; # CYRILLIC SMALL LETTER SOFT SIGN
|
| +Э → E ; # CYRILLIC CAPITAL LETTER E
|
| +э → e ; # CYRILLIC SMALL LETTER E
|
| +Ә → Ä ; # CYRILLIC CAPITAL LETTER SCHWA
|
| +ә → ä ; # CYRILLIC SMALL LETTER SCHWA
|
| +Ю} $lower → Yu ; # CYRILLIC CAPITAL LETTER YU
|
| +Ю → YU ; # CYRILLIC CAPITAL LETTER YU
|
| +ю → yu ; # CYRILLIC SMALL LETTER YU
|
| +Я} $lower → Ya ; # CYRILLIC CAPITAL LETTER YA
|
| +Я → YA ; # CYRILLIC CAPITAL LETTER YA
|
| +я → ya ; # CYRILLIC SMALL LETTER YA
|
| +#
|
| +#
|
| +########################################################################
|
| +
|
|
|