Index: source/data/translit/dv_dv_Latn_BGN.txt |
diff --git a/source/data/translit/dv_dv_Latn_BGN.txt b/source/data/translit/dv_dv_Latn_BGN.txt |
new file mode 100644 |
index 0000000000000000000000000000000000000000..45f0d12bae666a550f482bd401fe1e252f6950b2 |
--- /dev/null |
+++ b/source/data/translit/dv_dv_Latn_BGN.txt |
@@ -0,0 +1,177 @@ |
+# © 2016 and later: Unicode, Inc. and others. |
+# License & terms of use: http://www.unicode.org/copyright.html#License |
+# |
+# File: dv_dv_Latn_BGN.txt |
+# Generated from CLDR |
+# |
+ |
+# BGN/PCGN 1988 Agreement, with modifications 2009 |
+# |
+# This romanization system supersedes the one which was approved by |
+# the BGN and the PCGN in 1972. This official system was submitted |
+# to the PCGN by the Maldivian government in 1987 and approved by BGN |
+# and PCGN in 1988. The system presented here reflects the 1988 Agreement |
+# with minor modifications introduced by the government of the Maldives |
+# in 2009. |
+# |
+# In our rules, we also convert Arabic punctuation characters to Latin. |
+# These appear to be used in Maldivian text, for example in the Universal |
+# Declaration of Human Rights. |
+::[[:block=thaana:][،؛؟٪٫٬]\uFDF2] ; |
+::NFD; |
+$wordBoundary = [^[:L:][:M:][:N:]] ; |
+$vowel = [\u07A6-\u07AF] ; |
+$sukun = \u07B0 ; |
+$sign = [$sukun $vowel] ; |
+$rule4 = [އށ] $sukun ; # alifu or shaviyani carrying sukun, which alters the romanization of the following consonant (see note 4) |
+### Consonants (for each letter, the form following $rule4 is listed before the plain form) |
+# HAA |
+$rule4 ހ → hh ; |
+ހ → h ; |
+# NOONU |
+# See note 5: "romanized n’ when appearing without any vowel or auxiliary sign" |
+$rule4 ނ } $sign → nn ; |
+$rule4 ނ → nn\' ; |
+ނ } $sign → n ; |
+ނ → n\' ; |
+# RAA |
+$rule4 ރ → rr ; |
+ރ → r ; |
+# BAA |
+$rule4 ބ → bb ; |
+ބ → b ; |
+# LHAVIYANI |
+$rule4 ޅ → hlh ; |
+ޅ → lh; |
+# KAAFU |
+$rule4 ކ → kk ; |
+ކ → k ; |
+# VAAVU |
+$rule4 ވ → vv ; |
+ވ → v ; |
+# MEEMU |
+$rule4 މ → mm ; |
+މ → m ; |
+# FAAFU |
+$rule4 ފ → ff ; |
+ފ → f; |
+# DHAALU |
+$rule4 ދ → hdh ; |
+ދ → dh; |
+# THAA |
+# See note 6: "romanized iy when appearing in combination with a supercircle" (matched here as $sukun) |
+$rule4 ތ $sukun → hiy ; |
+$rule4 ތ → hth ; |
+\u07A8 ތ $sukun → iy ; |
+ތ $sukun → iy ; |
+ތ → th ; |
+# LAAMU |
+$rule4 ލ → ll ; |
+ލ → l ; |
+# GAAFU |
+$rule4 ގ → gg ; |
+ގ → g ; |
+# GNAVIYANI |
+$rule4 ޏ → hgn ; |
+ޏ → gn ; |
+# SEENU |
+$rule4 ސ → ss ; |
+ސ → s ; |
+# DAVIYANI |
+$rule4 ޑ → dd ; |
+ޑ → d ; |
+# ZAVIYANI |
+$rule4 ޒ → zz ; |
+ޒ → z ; |
+# TAVIYANI |
+$rule4 ޓ → tt ; |
+ޓ → t ; |
+# YAA |
+$rule4 ޔ → yy ; |
+ޔ → y ; |
+# PAVIYANI |
+$rule4 ޕ → pp ; |
+ޕ → p ; |
+# JAVIYANI |
+$rule4 ޖ → jj ; |
+ޖ → j ; |
+# CHAVIYANI |
+$rule4 ޗ → hch ; |
+ޗ → ch ; |
+### Borrowed Consonants (See Rule 7) |
+# SAADHU |
+$rule4 ޞ → şş ; |
+ޞ → ş ; |
+# SHEENU |
+$rule4 ޝ → hsh ; |
+ޝ → sh ; |
+# ZAA |
+$rule4 ޜ → zz ; |
+ޜ → z; |
+# KHAA |
+$rule4 ޚ → hkh ; |
+ޚ → kh; |
+# HHAA |
+$rule4 ޙ → ḩḩ ; |
+ޙ → ḩ ; |
+# THAALU |
+$rule4 ޛ → hdh ; |
+ޛ → dh ; |
+# TTAA |
+$rule4 ޘ → hth ; |
+ޘ → th ; |
+# WAAVU |
+$rule4 ޥ → ww ; |
+ޥ → w ; |
+# QAAFU |
+$rule4 ޤ → qq ; |
+ޤ → q ; |
+# GHAINU |
+$rule4 ޣ → hgh ; |
+ޣ → gh ; |
+# AINU |
+$rule4 ޢ → \'\' ; |
+ޢ → \' ; |
+# ZO |
+$rule4 ޡ → z\u0327z\u0327 ; |
+ޡ → z\u0327 ; |
+# TO |
+$rule4 ޠ → ţţ ; |
+ޠ → ţ ; |
+# DAADHU |
+$rule4 ޟ → ḑḑ ; |
+ޟ → ḑ ; |
+# NOTE: not in the Maldivian BGN system, but included for completeness of the Thaana block |
+# NAA |
+$rule4 ޱ → n\u0332n\u0332 ; |
+ޱ → n\u0332 ; |
+# Rule 4 in word-final position: $rule4 is romanized h when followed by $wordBoundary (anything that is not a letter, mark, or number) |
+$rule4 } $wordBoundary → h; |
+# SHAVIYANI (placed after the other letters' $rule4 rules, since $rule4 itself can begin with this letter) |
+$rule4 ށ → hsh; |
+ށ → sh; |
+# In any other position, these signs are not romanized |
+$rule4 → ; |
+\u07B0 → ; |
+އ → ; |
+# NOTE: U+FDF2 (Allah ligature) is not in the Maldivian BGN system, but is common in names (e.g. Abdullah) |
+($vowel) \uFDF2 → | $1 llāh ; |
+\uFDF2 → allāh; |
+### Vowels (the signs in $vowel, U+07A6..U+07AF) |
+\u07A6 → a; # ABAFILI |
+\u07A7 → aa; # AABAAFILI |
+\u07AC → e; # EBEFILI |
+\u07AD → ey; # EYBEYFILI |
+\u07A8 → i; # IBIFILI |
+\u07A9 → ee; # EEBEEFILI |
+\u07AE → o; # OBOFILI |
+\u07AF → oa; # OABOAFILI |
+\u07AA → u; # UBUFILI |
+\u07AB → oo; # OOBOOFILI |
+، → ','; # U+060C ARABIC COMMA |
+؛ → ';'; # U+061B ARABIC SEMICOLON |
+؟ → '?'; # U+061F ARABIC QUESTION MARK |
+٪ → '%'; # U+066A ARABIC PERCENT SIGN |
+٫ → '.'; # U+066B ARABIC DECIMAL SEPARATOR |
+٬ → ','; # U+066C ARABIC THOUSANDS SEPARATOR |
+ |