Index: source/data/translit/ko_ko_Latn_BGN.txt |
diff --git a/source/data/translit/Korean_Latin_BGN.txt b/source/data/translit/ko_ko_Latn_BGN.txt |
similarity index 86% |
rename from source/data/translit/Korean_Latin_BGN.txt |
rename to source/data/translit/ko_ko_Latn_BGN.txt |
index 682493d99de1d1befddbceb2621362b9274adeb7..ff54254be1b2832bcdcb673a0828ab1432d34ac8 100644 |
--- a/source/data/translit/Korean_Latin_BGN.txt |
+++ b/source/data/translit/ko_ko_Latn_BGN.txt |
@@ -1,18 +1,69 @@ |
-# *************************************************************************** |
-# * |
-# * Copyright (C) 2004-2015, International Business Machines |
-# * Corporation; Unicode, Inc.; and others. All Rights Reserved. |
-# * |
-# *************************************************************************** |
-# File: Korean_Latin_BGN.txt |
-# Generated from CLDR |
+# © 2016 and later: Unicode, Inc. and others. |
+# License & terms of use: http://www.unicode.org/copyright.html#License |
+# |
+# File: ko_ko_Latn_BGN.txt |
+# Generated from CLDR |
+# |
+ |
+# |
+######################################################################## |
+# BGN/PCGN Agreement |
+# |
+# This system was devised by G. M. McCune and E. O. Reischauer, and |
+# was originally published in the Transactions of the Korea Branch of |
+# the Royal Asiatic Society, Volume XXIX, 1939. It has been used by |
+# the BGN since 1943, and was later adopted for use by the PCGN. A |
+# main characteristic of this system is the attempt to represent |
+# approximate Korean pronunciation, while systematically converting |
+# the Hangul characters to corresponding Roman-script letters. Since |
+# Korean pronunciation is often inconsistently represented in Hangul, |
+# the McCune-Reischauer conversion tables are rather elaborate, and |
+# reverse conversion (from Roman script back to Hangul) is not possible. |
+# |
+# Originally prepared by Michael Everson <everson@evertype.com> |
+######################################################################## |
+# |
+# MINIMAL FILTER: Korean-Latin |
# |
:: [ᄀᄁᄂᄃᄄᄅᄆᄇᄈᄉᄊᄋᄌᄍᄎᄏᄐᄑᄒᄭᄯᄲᄶᅡᅢᅣᅤᅥᅦᅧᅨᅩᅪᅫᅬᅭᅮᅯᅰᅱᅲᅳᅴᅵᆨᆫᆮᆯᆰᆱᆲᆷᆸᆺᆼᆽᆾᆿᇀᇁ] ; |
:: NFD (NFC) ; |
+# |
+# |
+######################################################################## |
+# |
+######################################################################## |
+# |
+# Define All Transformation Variables |
+# |
+######################################################################## |
+# |
$aspirate = ’; |
$apostrophe = ’; |
$vowels = [ᅡᅢᅣᅤᅥᅦᅧᅨᅩᅪᅫᅬᅭᅮᅯᅰᅱᅲᅳᅴᅵ] ; |
+# |
+# |
+# Use this $wordBoundary until bug 2034 is fixed in ICU: |
+# http://bugs.icu-project.org/cgi-bin/icu-bugs/transliterate?id=2034;expression=boundary;user=guest |
+# |
$wordBoundary = [^[:L:][:M:][:N:]] ; |
+# |
+# |
+######################################################################## |
+# |
+######################################################################## |
+# |
+# Rules moved to front to avoid masking |
+# |
+######################################################################## |
+# |
+######################################################################## |
+# |
+# BGN Page 60 Rule 1: |
+# |
+# Romanization of Hangul consonants and consonant clusters within words. |
+# |
+######################################################################## |
+# |
ᆨᄀ → kk ; # HANGUL JONGSEONG KIYEOK + CHOSEONG KIYEOK |
ᆨᄂ → ngn ; # HANGUL JONGSEONG KIYEOK + CHOSEONG NIEUN |
ᆨᄃ → kt ; # HANGUL JONGSEONG KIYEOK + CHOSEONG TIKEUT |
@@ -222,6 +273,19 @@ $wordBoundary = [^[:L:][:M:][:N:]] ; |
ᆲᄈ → lpp ; # HANGUL JONGSEONG RIEUL-PIEUP + CHOSEONG SSANGPIEUP |
ᆲᄊ → pss ; # HANGUL JONGSEONG RIEUL-PIEUP + CHOSEONG SSANGSIOS |
ᆲᄍ → ptch ; # HANGUL JONGSEONG RIEUL-PIEUP + CHOSEONG SSANGCIEUC |
+# |
+# |
+######################################################################## |
+# |
+# End of Rule 1 |
+# |
+######################################################################## |
+# |
+######################################################################## |
+# |
+# Start of Transformations |
+# |
+######################################################################## |
$wordBoundary{ᄀ → k ; # HANGUL CHOSEONG KIYEOK |
$wordBoundary{ᄂ → n ; # HANGUL CHOSEONG NIEUN |
$wordBoundary{ᄃ → t ; # HANGUL CHOSEONG TIKEUT |
@@ -281,3 +345,7 @@ $wordBoundary{ᄶ → tch ; # HANGUL CHOSEONG SIOS-CIEUC |
ᇁ}$wordBoundary → p ; # HANGUL JONGSEONG PHIEUPH |
ᆰ}$wordBoundary → k ; # HANGUL JONGSEONG RIEUL-KIYEOK |
ᆲ}$wordBoundary → p ; # HANGUL JONGSEONG RIEUL-PIEUP |
+# |
+# |
+######################################################################## |
+ |