| Index: source/data/translit/uz_Cyrl_uz_BGN.txt
|
| diff --git a/source/data/translit/Uzbek_Latin_BGN.txt b/source/data/translit/uz_Cyrl_uz_BGN.txt
|
| similarity index 53%
|
| rename from source/data/translit/Uzbek_Latin_BGN.txt
|
| rename to source/data/translit/uz_Cyrl_uz_BGN.txt
|
| index d6e947c4f7d3a2124a951e02435a353c7f013304..84898e65e108ef06644cc42e44c4a4846db56a05 100644
|
| --- a/source/data/translit/Uzbek_Latin_BGN.txt
|
| +++ b/source/data/translit/uz_Cyrl_uz_BGN.txt
|
| @@ -1,14 +1,41 @@
|
| -# ***************************************************************************
|
| -# *
|
| -# * Copyright (C) 2004-2015, International Business Machines
|
| -# * Corporation; Unicode, Inc.; and others. All Rights Reserved.
|
| -# *
|
| -# ***************************************************************************
|
| -# File: Uzbek_Latin_BGN.txt
|
| -# Generated from CLDR
|
| +# © 2016 and later: Unicode, Inc. and others.
|
| +# License & terms of use: http://www.unicode.org/copyright.html#License
|
| +#
|
| +# File: uz_Cyrl_uz_BGN.txt
|
| +# Generated from CLDR
|
| +#
|
| +
|
| +#
|
| +########################################################################
|
| +# BGN/PCGN 1979 System
|
| +#
|
| +# The BGN/PCGN system for Uzbek was designed for use in
|
| +# romanizing names written in the Uzbek alphabet.
|
| +# The Uzbek alphabet contains four letters not present
|
| +# in the Russian alphabet: Ўў, Ққ, Ғғ, and Ҳҳ.
|
| +#
|
| +# The Uzbek Alphabet as defined by the BGN (Page 107):
|
| +#
|
| +# АБВГДЕЁЖЗИЙКЛМНОПРСТУФХЦЧШЪЬЭЮЯЎҚҒҲ
|
| +# абвгдеёжзийклмнопрстуфхцчшъьэюяўқғҳ
|
| +#
|
| +# Originally prepared by Michael Everson <everson@evertype.com>
|
| +########################################################################
|
| +#
|
| +# MINIMAL FILTER: Uzbek-Latin
|
| #
|
| :: [АБВГДЕЁЖЗИЙКЛМНОПРСТУФХЦЧШЪЬЭЮЯЎҚҒҲабвгдеёжзийклмнопрстуфхцчшъьэюяўқғҳ] ;
|
| :: NFD (NFC) ;
|
| +#
|
| +#
|
| +########################################################################
|
| +#
|
| +########################################################################
|
| +#
|
| +# Define All Transformation Variables
|
| +#
|
| +########################################################################
|
| +#
|
| $prime = ʹ ;
|
| $doublePrime = ʺ ;
|
| $upperConsonants = [БВГДЖЗЙКЛМНПРСТФХЦЧШЪЬҚҒҲ] ;
|
| @@ -18,22 +45,78 @@ $upperVowels = [АЕЁИОУЭЮЯЎ] ;
|
| $lowerVowels = [аеёиоуэюяў] ;
|
| $vowels = [$upperVowels $lowerVowels] ;
|
| $lower = [$lowerConsonants $lowerVowels] ;
|
| +#
|
| +#
|
| +# Use this $wordBoundary until bug 2034 is fixed in ICU:
|
| +# http://bugs.icu-project.org/cgi-bin/icu-bugs/transliterate?id=2034;expression=boundary;user=guest
|
| +#
|
| $wordBoundary = [^[:L:][:M:][:N:]] ;
|
| +#
|
| +#
|
| +########################################################################
|
| +#
|
| +########################################################################
|
| +#
|
| +# Rules moved to front to avoid masking
|
| +#
|
| +########################################################################
|
| +#
|
| $lowerVowels ы → y ;
|
| $upperVowels[Ыы] → Y ;
|
| +#
|
| +#
|
| +########################################################################
|
| +#
|
| +# Start of Alphabetic Transformations
|
| +#
|
| +########################################################################
|
| +#
|
| А → A ; # CYRILLIC CAPITAL LETTER A
|
| а → a ; # CYRILLIC SMALL LETTER A
|
| Б → B ; # CYRILLIC CAPITAL LETTER BE
|
| б → b ; # CYRILLIC SMALL LETTER BE
|
| В → W ; # CYRILLIC CAPITAL LETTER VE
|
| в → w ; # CYRILLIC SMALL LETTER VE
|
| +#
|
| +#
|
| +########################################################################
|
| +#
|
| +# BGN Page 108 Rule 2
|
| +#
|
| +# The character sequences гҳ, кҳ, сҳ, and цҳ may be romanized g·h,
|
| +# k·h, s·h, and ts·h in order to differentiate those romanizations from
|
| +# the digraphs gh, kh, sh, and the letter sequence tsh, which are used
|
| +# to render the characters ғ, х, ш, and the character sequence тш.
|
| +#
|
| +########################################################################
|
| +#
|
| ГҲ → G·H ; # CYRILLIC CAPITAL LETTER GHE
|
| Гҳ → G·h ; # CYRILLIC CAPITAL LETTER GHE
|
| гҳ → g·h ; # CYRILLIC SMALL LETTER GHE
|
| Г → G ; # CYRILLIC CAPITAL LETTER GHE
|
| г → g ; # CYRILLIC SMALL LETTER GHE
|
| +#
|
| +#
|
| +########################################################################
|
| +#
|
| +# End Rule 2
|
| +#
|
| +########################################################################
|
| +#
|
| Д → D ; # CYRILLIC CAPITAL LETTER DE
|
| д → d ; # CYRILLIC SMALL LETTER DE
|
| +#
|
| +#
|
| +########################################################################
|
| +#
|
| +# BGN Page 108 Rule 1:
|
| +#
|
| +# The character е (Cyrillic IE) should be romanized ye initially, after the vowel
|
| +# characters а, е, ё, и, о, у, э, ю, я, and ў, and after й and ь.
|
| +# In all other instances, it should be romanized e.
|
| +#
|
| +########################################################################
|
| +#
|
| Е}[$upperVowels [ЙЬ]] → YE ; # CYRILLIC CAPITAL LETTER IE -- NOTE(review): "}" makes the set an after-context (Е followed by it), whereas Rule 1 describes Е occurring after these letters; confirm intent
|
| Е}[$lowerVowels [йь]] → Ye ; # CYRILLIC CAPITAL LETTER IE -- NOTE(review): same after-context question as the rule above
|
| $wordBoundary{Е → Ye ; # CYRILLIC CAPITAL LETTER IE (word-initial: "{" makes $wordBoundary a before-context)
|
| @@ -41,6 +124,14 @@ $wordBoundary{Е → Ye ; # CYRILLIC CAPITAL LETTER IE
|
| е}[$upperVowels $lowerVowels [ЙйЬь]] → ye ; # CYRILLIC SMALL LETTER IE
|
| $wordBoundary{е → ye ; # CYRILLIC SMALL LETTER IE
|
| е → e ; # CYRILLIC SMALL LETTER IE
|
| +#
|
| +#
|
| +########################################################################
|
| +#
|
| +# End of Rule 1
|
| +#
|
| +########################################################################
|
| +#
|
| Ё} $lower → Yo ; # CYRILLIC CAPITAL LETTER IO
|
| Ё → YO ; # CYRILLIC CAPITAL LETTER IO
|
| ё → yo ; # CYRILLIC SMALL LETTER IO
|
| @@ -52,11 +143,29 @@ $wordBoundary{е → ye ; # CYRILLIC SMALL LETTER IE
|
| и → i ; # CYRILLIC SMALL LETTER I
|
| Й → Y ; # CYRILLIC CAPITAL LETTER SHORT I
|
| й → y ; # CYRILLIC SMALL LETTER SHORT I
|
| +#
|
| +#
|
| +########################################################################
|
| +#
|
| +# BGN Page 108 Rule 2
|
| +#
|
| +# кҳ becomes k·h
|
| +#
|
| +########################################################################
|
| +#
|
| КҲ → K·H ; # CYRILLIC CAPITAL LETTER KA
|
| Кҳ → K·h ; # CYRILLIC CAPITAL LETTER KA
|
| кҳ → k·h ; # CYRILLIC SMALL LETTER KA
|
| К → K ; # CYRILLIC CAPITAL LETTER KA
|
| к → k ; # CYRILLIC SMALL LETTER KA
|
| +#
|
| +#
|
| +########################################################################
|
| +#
|
| +# End Rule 2
|
| +#
|
| +########################################################################
|
| +#
|
| Л → L ; # CYRILLIC CAPITAL LETTER EL
|
| л → l ; # CYRILLIC SMALL LETTER EL
|
| М → M ; # CYRILLIC CAPITAL LETTER EM
|
| @@ -69,11 +178,29 @@ $wordBoundary{е → ye ; # CYRILLIC SMALL LETTER IE
|
| п → p ; # CYRILLIC SMALL LETTER PE
|
| Р → R ; # CYRILLIC CAPITAL LETTER ER
|
| р → r ; # CYRILLIC SMALL LETTER ER
|
| +#
|
| +#
|
| +########################################################################
|
| +#
|
| +# BGN Page 108 Rule 2
|
| +#
|
| +# сҳ becomes s·h
|
| +#
|
| +########################################################################
|
| +#
|
| СҲ → S·H ; # CYRILLIC CAPITAL LETTER ES
|
| Сҳ → S·h ; # CYRILLIC CAPITAL LETTER ES
|
| сҳ → s·h ; # CYRILLIC SMALL LETTER ES
|
| С → S ; # CYRILLIC CAPITAL LETTER ES
|
| с → s ; # CYRILLIC SMALL LETTER ES
|
| +#
|
| +#
|
| +########################################################################
|
| +#
|
| +# End Rule 2
|
| +#
|
| +########################################################################
|
| +#
|
| Т → T ; # CYRILLIC CAPITAL LETTER TE
|
| т → t ; # CYRILLIC SMALL LETTER TE
|
| У → Ū ; # CYRILLIC CAPITAL LETTER U
|
| @@ -83,12 +210,30 @@ $wordBoundary{е → ye ; # CYRILLIC SMALL LETTER IE
|
| Х} $lower → Kh ; # CYRILLIC CAPITAL LETTER HA
|
| Х → KH ; # CYRILLIC CAPITAL LETTER HA
|
| х → kh ; # CYRILLIC SMALL LETTER HA
|
| +#
|
| +#
|
| +########################################################################
|
| +#
|
| +# BGN Page 108 Rule 2
|
| +#
|
| +# цҳ becomes ts·h
|
| +#
|
| +########################################################################
|
| +#
|
| ЦҲ → TS·H ; # CYRILLIC CAPITAL LETTER TSE
|
| Цҳ → Ts·h ; # CYRILLIC CAPITAL LETTER TSE
|
| цҳ → ts·h ; # CYRILLIC SMALL LETTER TSE
|
| Ц} $lower → Ts ; # CYRILLIC CAPITAL LETTER TSE
|
| Ц → TS ; # CYRILLIC CAPITAL LETTER TSE
|
| ц → ts ; # CYRILLIC SMALL LETTER TSE
|
| +#
|
| +#
|
| +########################################################################
|
| +#
|
| +# End Rule 2
|
| +#
|
| +########################################################################
|
| +#
|
| Ч} $lower → Ch ; # CYRILLIC CAPITAL LETTER CHE
|
| Ч → CH ; # CYRILLIC CAPITAL LETTER CHE
|
| ч → ch ; # CYRILLIC SMALL LETTER CHE
|
| @@ -116,3 +261,7 @@ $wordBoundary{е → ye ; # CYRILLIC SMALL LETTER IE
|
| ғ → gh ; # CYRILLIC SMALL LETTER GHE WITH STROKE
|
| Ҳ → H ; # CYRILLIC CAPITAL LETTER HA WITH DESCENDER
|
| ҳ → h ; # CYRILLIC SMALL LETTER HA WITH DESCENDER
|
| +#
|
| +#
|
| +########################################################################
|
| +
|
|
|