| Index: source/data/translit/it_ja.txt
|
| diff --git a/source/data/translit/it_ja.txt b/source/data/translit/it_ja.txt
|
| index 27ec5e898206cc32915d880f695cf8888651c021..78e3a9bc0691f483b10189d58bf59475fa904b3b 100644
|
| --- a/source/data/translit/it_ja.txt
|
| +++ b/source/data/translit/it_ja.txt
|
| @@ -1,19 +1,29 @@
|
| -# ***************************************************************************
|
| -# *
|
| -# * Copyright (C) 2004-2015, International Business Machines
|
| -# * Corporation; Unicode, Inc.; and others. All Rights Reserved.
|
| -# *
|
| -# ***************************************************************************
|
| +# © 2016 and later: Unicode, Inc. and others.
|
| +# License & terms of use: http://www.unicode.org/copyright.html#License
|
| +#
|
| # File: it_ja.txt
|
| -# Generated from CLDR
|
| +# Generated from CLDR
|
| #
|
| +
|
| +# Italian to Katakana Transliteration Table for ICU
|
| +# Based on:
|
| +# "現代イタリア語入門" (大学書林, 1974. ISBN:978-4475017176)
|
| +# http://ja.wikipedia.org/wiki/%E3%82%A4%E3%82%BF%E3%83%AA%E3%82%A2%E8%AA%9E
|
| ::NFD(NFC);
|
| ::Lower();
|
| ::[:Latin:] fullwidth-halfwidth();
|
| +#
|
| +#
|
| +# Variables.
|
| $vowel = [aeiou];
|
| $consonant = [bcdfghjklmnpqrstvwxyz];
|
| +#
|
| +#
|
| +# Ignore apostrophe.
|
| ($consonant) \' → | $1;
|
| \' → ;
|
| +#
|
| +#
|
| cqu → ック;
|
| cc → ッ | c;
|
| ca → カ;
|
| @@ -23,11 +33,15 @@ ci → チ;
|
| cu → ク;
|
| ce → チェ;
|
| co → コ;
|
| +#
|
| +#
|
| cha → シャ;
|
| chi → キ;
|
| chu → チュ;
|
| che → ケ;
|
| cho → チョ;
|
| +#
|
| +#
|
| gg → ッ | g;
|
| ghi → ギ;
|
| ghe → ゲ;
|
| @@ -38,6 +52,8 @@ gni → ニ;
|
| gnu → ヌ;
|
| gne → ニェ;
|
| gno → ニョ;
|
| +#
|
| +#
|
| ga → ガ;
|
| gia → ジャ;
|
| giu → ジュ;
|
| @@ -46,18 +62,24 @@ gi → ジ;
|
| gu → グ;
|
| ge → ジェ;
|
| go → ゴ;
|
| +#
|
| +#
|
| rr → ッ | r;
|
| ra → ラ;
|
| ri → リ;
|
| ru → ル;
|
| re → レ;
|
| ro → ロ;
|
| +#
|
| +#
|
| ll → ッ | l;
|
| la → ラ;
|
| li → リ;
|
| lu → ル;
|
| le → レ;
|
| lo → ロ;
|
| +#
|
| +#
|
| tt → ッ | t;
|
| ta → タ;
|
| ti → ティ;
|
| @@ -70,49 +92,68 @@ to → ト;
|
| tho → ト;
|
| tzu → | ッツ;
|
| tz → | zz;
|
| +#
|
| +#
|
| dd → ッ | d;
|
| da → ダ;
|
| di → ディ;
|
| du → ドゥ;
|
| de → デ;
|
| do → ド;
|
| +#
|
| +#
|
| ma → マ;
|
| mi → ミ;
|
| mu → ム;
|
| me → メ;
|
| mo → モ;
|
| m } $consonant → ン;
|
| +#
|
| +#
|
| na → ナ;
|
| ni → ニ;
|
| nu → ヌ;
|
| ne → ネ;
|
| no → ノ;
|
| +#
|
| +#
|
| ff → ッ | f;
|
| fa → ファ;
|
| fi → フィ;
|
| fu → フ;
|
| fe → フェ;
|
| fo → フォ;
|
| +#
|
| +#
|
| bb → ッ | b;
|
| ba → バ;
|
| bi → ビ;
|
| bu → ブ;
|
| be → ベ;
|
| bo → ボ;
|
| +#
|
| +#
|
| pp → ッ | p;
|
| pa → パ;
|
| pi → ピ;
|
| pu → プ;
|
| pe → ペ;
|
| po → ポ;
|
| +#
|
| +#
|
| vv → ッ | v;
|
| va → ヴァ;
|
| vi → ヴィ;
|
| vu → ヴ;
|
| ve → ヴェ;
|
| vo → ヴォ;
|
| +#
|
| +#
|
| sa } nt[ao] → サ;
|
| ss → ッ | \~s;
|
| +#
|
| +#
|
| +# 's' is voiced before [bdglmnrv].
|
| sb → ズ | b;
|
| sd → ズ | d;
|
| sg → ズ | g;
|
| @@ -121,46 +162,71 @@ sm → ズ | m;
|
| sn → ズ | n;
|
| sr → ズ | r;
|
| sv → ズ | v;
|
| +#
|
| +#
|
| +# Force 's' after a consonant to be unvoiced.
|
| ($consonant) s } $vowel → | $1 \~ s;
|
| \~sa → サ;
|
| \~si → シ;
|
| \~su → ス;
|
| \~se → セ;
|
| \~so → ソ;
|
| +#
|
| +#
|
| +# 's' at the beginning is usually unvoiced.
|
| [:^Letter:] { sa → サ;
|
| [:^Letter:] { si → シ;
|
| [:^Letter:] { su → ス;
|
| [:^Letter:] { se → セ;
|
| [:^Letter:] { so → ソ;
|
| +#
|
| +#
|
| +# Otherwise, 's' is usually voiced.
|
| sa → ザ;
|
| si → ジ;
|
| su → ズ;
|
| se → ゼ;
|
| so → ゾ;
|
| +#
|
| +#
|
| scia → シャ;
|
| sci → シ;
|
| sce → シェ;
|
| +#
|
| +#
|
| zz → ッ | \~z;
|
| +#
|
| +# Force 'z' after a consonant to be unvoiced.
|
| ($consonant) z → | $1 \~z;
|
| \~za → ツァ;
|
| \~zi → ツィ;
|
| \~zu → ツ;
|
| \~ze → ツェ;
|
| \~zo → ツォ;
|
| +#
|
| +#
|
| +# Otherwise, 'z' is usually voiced, except for 'zi'.
|
| za → ザ;
|
| [:^Letter:] { zi → ジ;
|
| zi → ツィ;
|
| zu → ズ;
|
| ze → ゼ;
|
| zo → ゾ;
|
| +#
|
| +#
|
| ja → ヤ;
|
| je → イェ;
|
| j → | i;
|
| +#
|
| +#
|
| +# Standalone vowels and consonants.
|
| a → ア;
|
| i → イ;
|
| u → ウ;
|
| e → エ;
|
| o → オ;
|
| +#
|
| +#
|
| b → ブ;
|
| c → ク;
|
| d → ド;
|
| @@ -180,7 +246,20 @@ v → ヴ;
|
| x → | cs;
|
| y → | i;
|
| z → ツ;
|
| +#
|
| +#
|
| +# The word delimiter in a transliterated foreign phrase is '・'.
|
| ' ' → ・;
|
| +#
|
| +#
|
| +# Latin hyphen should be transliterated to U+30A0 (KATAKANA-HIRAGANA
|
| +# DOUBLE HYPHEN), ideally. But since the character isn't supported by
|
| +# many fonts or software, we use U+FF1D (FULLWIDTH EQUALS SIGN),
|
| +# which is widely used as "double hyphen".
|
| +#
|
| \- → ＝;
|
| +#
|
| +#
|
| [:nonspacing mark:] → ;
|
| ::NFC(NFD);
|
| +
|
|
|