Index: source/data/translit/it_ja.txt |
diff --git a/source/data/translit/it_ja.txt b/source/data/translit/it_ja.txt |
index 27ec5e898206cc32915d880f695cf8888651c021..78e3a9bc0691f483b10189d58bf59475fa904b3b 100644 |
--- a/source/data/translit/it_ja.txt |
+++ b/source/data/translit/it_ja.txt |
@@ -1,19 +1,29 @@ |
-# *************************************************************************** |
-# * |
-# * Copyright (C) 2004-2015, International Business Machines |
-# * Corporation; Unicode, Inc.; and others. All Rights Reserved. |
-# * |
-# *************************************************************************** |
+# © 2016 and later: Unicode, Inc. and others. |
+# License & terms of use: http://www.unicode.org/copyright.html#License |
+# |
# File: it_ja.txt |
-# Generated from CLDR |
+# Generated from CLDR |
# |
+ |
+# Italian to Katakana Transliteration Table for ICU |
+# Based on: |
+# "現代イタリア語入門" (大学書林, 1974. ISBN:978-4475017176) |
+# http://ja.wikipedia.org/wiki/%E3%82%A4%E3%82%BF%E3%83%AA%E3%82%A2%E8%AA%9E |
::NFD(NFC); |
::Lower(); |
::[:Latin:] fullwidth-halfwidth(); |
+# |
+# |
+# Variables. |
$vowel = [aeiou]; |
$consonant = [bcdfghjklmnpqrstvwxyz]; |
+# |
+# |
+# Ignore apostrophe. |
($consonant) \' → | $1; |
\' → ; |
+# |
+# |
cqu → ック; |
cc → ッ | c; |
ca → カ; |
@@ -23,11 +33,15 @@ ci → チ; |
cu → ク; |
ce → チェ; |
co → コ; |
+# |
+# |
cha → シャ; |
chi → キ; |
chu → チュ; |
che → ケ; |
cho → チョ; |
+# |
+# |
gg → ッ | g; |
ghi → ギ; |
ghe → ゲ; |
@@ -38,6 +52,8 @@ gni → ニ; |
gnu → ヌ; |
gne → ニェ; |
gno → ニョ; |
+# |
+# |
ga → ガ; |
gia → ジャ; |
giu → ジュ; |
@@ -46,18 +62,24 @@ gi → ジ; |
gu → グ; |
ge → ジェ; |
go → ゴ; |
+# |
+# |
rr → ッ | r; |
ra → ラ; |
ri → リ; |
ru → ル; |
re → レ; |
ro → ロ; |
+# |
+# |
ll → ッ | l; |
la → ラ; |
li → リ; |
lu → ル; |
le → レ; |
lo → ロ; |
+# |
+# |
tt → ッ | t; |
ta → タ; |
ti → ティ; |
@@ -70,49 +92,68 @@ to → ト; |
tho → ト; |
tzu → | ッツ; |
tz → | zz; |
+# |
+# |
dd → ッ | d; |
da → ダ; |
di → ディ; |
du → ドゥ; |
de → デ; |
do → ド; |
+# |
+# |
ma → マ; |
mi → ミ; |
mu → ム; |
me → メ; |
mo → モ; |
m } $consonant → ン; |
+# |
+# |
na → ナ; |
ni → ニ; |
nu → ヌ; |
ne → ネ; |
no → ノ; |
+# |
+# |
ff → ッ | f; |
fa → ファ; |
fi → フィ; |
fu → フ; |
fe → フェ; |
fo → フォ; |
+# |
+# |
bb → ッ | b; |
ba → バ; |
bi → ビ; |
bu → ブ; |
be → ベ; |
bo → ボ; |
+# |
+# |
pp → ッ | p; |
pa → パ; |
pi → ピ; |
pu → プ; |
pe → ペ; |
po → ポ; |
+# |
+# |
vv → ッ | v; |
va → ヴァ; |
vi → ヴィ; |
vu → ヴ; |
ve → ヴェ; |
vo → ヴォ; |
+# |
+# |
sa } nt[ao] → サ; |
ss → ッ | \~s; |
+# |
+# |
+# 's' is voiced before [bdglmnrv]. |
sb → ズ | b; |
sd → ズ | d; |
sg → ズ | g; |
@@ -121,46 +162,71 @@ sm → ズ | m; |
sn → ズ | n; |
sr → ズ | r; |
sv → ズ | v; |
+# |
+# |
+# Force 's' after a consonat to be unvoiced. |
($consonant) s } $vowel → | $1 \~ s; |
\~sa → サ; |
\~si → シ; |
\~su → ス; |
\~se → セ; |
\~so → ソ; |
+# |
+# |
+# 's' at the beginning is usually unvoiced. |
[:^Letter:] { sa → サ; |
[:^Letter:] { si → シ; |
[:^Letter:] { su → ス; |
[:^Letter:] { se → セ; |
[:^Letter:] { so → ソ; |
+# |
+# |
+# Otherwise voiced 's' are common. |
sa → ザ; |
si → ジ; |
su → ズ; |
se → ゼ; |
so → ゾ; |
+# |
+# |
scia → シャ; |
sci → シ; |
sce → シェ; |
+# |
+# |
zz → ッ | \~z; |
+# |
+# Force 'z' after a consonat to be unvoiced. |
($consonant) z → | $1 \~z; |
\~za → ツァ; |
\~zi → ツィ; |
\~zu → ツ; |
\~ze → ツェ; |
\~zo → ツォ; |
+# |
+# |
+# Otherwise voiced 'z' are common except for 'zi'. |
za → ザ; |
[:^Letter:] { zi → ジ; |
zi → ツィ; |
zu → ズ; |
ze → ゼ; |
zo → ゾ; |
+# |
+# |
ja → ヤ; |
je → イェ; |
j → | i; |
+# |
+# |
+# Standalone vowels and consonants. |
a → ア; |
i → イ; |
u → ウ; |
e → エ; |
o → オ; |
+# |
+# |
b → ブ; |
c → ク; |
d → ド; |
@@ -180,7 +246,20 @@ v → ヴ; |
x → | cs; |
y → | i; |
z → ツ; |
+# |
+# |
+# word delimiter of transliterated foreign phrase is '・'. |
' ' → ・; |
+# |
+# |
+# Latin hyphen should be transliterated to U+30A0 (KATAKANA-HIRAGANA |
+# DOUBLE HYPHEN), ideally. But since the character isn't supported by |
+# many fonts or softwares, we use U+FF1D (FULLWIDTH EQUALS SIGN), |
+# which is widely used as "double hyphen". |
+# |
\- → =; |
+# |
+# |
[:nonspacing mark:] → ; |
::NFC(NFD); |
+ |