summaryrefslogtreecommitdiffstats
path: root/intl/icu/source/data/translit/it_ja.txt
diff options
context:
space:
mode:
authorDaniel Baumann <daniel.baumann@progress-linux.org>2024-04-07 19:33:14 +0000
committerDaniel Baumann <daniel.baumann@progress-linux.org>2024-04-07 19:33:14 +0000
commit36d22d82aa202bb199967e9512281e9a53db42c9 (patch)
tree105e8c98ddea1c1e4784a60a5a6410fa416be2de /intl/icu/source/data/translit/it_ja.txt
parentInitial commit. (diff)
downloadfirefox-esr-36d22d82aa202bb199967e9512281e9a53db42c9.tar.xz
firefox-esr-36d22d82aa202bb199967e9512281e9a53db42c9.zip
Adding upstream version 115.7.0esr.upstream/115.7.0esrupstream
Signed-off-by: Daniel Baumann <daniel.baumann@progress-linux.org>
Diffstat (limited to 'intl/icu/source/data/translit/it_ja.txt')
-rw-r--r--intl/icu/source/data/translit/it_ja.txt266
1 files changed, 266 insertions, 0 deletions
diff --git a/intl/icu/source/data/translit/it_ja.txt b/intl/icu/source/data/translit/it_ja.txt
new file mode 100644
index 0000000000..017bdebb58
--- /dev/null
+++ b/intl/icu/source/data/translit/it_ja.txt
@@ -0,0 +1,266 @@
+# © 2016 and later: Unicode, Inc. and others.
+# License & terms of use: http://www.unicode.org/copyright.html
+# Generated using tools/cldr/cldr-to-icu/build-icu-data.xml
+#
+# File: it_ja.txt
+# Generated from CLDR
+#
+
+# Italian to Katakana Transliteration Table for ICU
+# Based on:
+# "現代イタリア語入門" (大学書林, 1974. ISBN:978-4475017176)
+# http://ja.wikipedia.org/wiki/%E3%82%A4%E3%82%BF%E3%83%AA%E3%82%A2%E8%AA%9E
+::NFD(NFC);
+::Lower();
+::[:Latin:] fullwidth-halfwidth();
+#
+#
+# Variables.
+$vowel = [aeiou];
+$consonant = [bcdfghjklmnpqrstvwxyz];
+#
+#
+# Ignore apostrophe.
+($consonant) \' → | $1;
+\' → ;
+#
+#
+cqu → ック;
+cc → ッ | c;
+ca → カ;
+ッ { cia → チャ;
+cio → チョ;
+ci → チ;
+cu → ク;
+ce → チェ;
+co → コ;
+#
+#
+cha → シャ;
+chi → キ;
+chu → チュ;
+che → ケ;
+cho → チョ;
+#
+#
+gg → ッ | g;
+ghi → ギ;
+ghe → ゲ;
+ghu → グ;
+gli → | li;
+gna → ニャ;
+gni → ニ;
+gnu → ヌ;
+gne → ニェ;
+gno → ニョ;
+#
+#
+ga → ガ;
+gia → ジャ;
+giu → ジュ;
+gio → ジョ;
+gi → ジ;
+gu → グ;
+ge → ジェ;
+go → ゴ;
+#
+#
+rr → ッ | r;
+ra → ラ;
+ri → リ;
+ru → ル;
+re → レ;
+ro → ロ;
+#
+#
+ll → ッ | l;
+la → ラ;
+li → リ;
+lu → ル;
+le → レ;
+lo → ロ;
+#
+#
+tt → ッ | t;
+ta → タ;
+ti → ティ;
+thi → ティ;
+tu → トゥ;
+thu → トゥ;
+te → テ;
+the → テ;
+to → ト;
+tho → ト;
+tzu → | ッツ;
+tz → | zz;
+#
+#
+dd → ッ | d;
+da → ダ;
+di → ディ;
+du → ドゥ;
+de → デ;
+do → ド;
+#
+#
+ma → マ;
+mi → ミ;
+mu → ム;
+me → メ;
+mo → モ;
+m } $consonant → ン;
+#
+#
+na → ナ;
+ni → ニ;
+nu → ヌ;
+ne → ネ;
+no → ノ;
+#
+#
+ff → ッ | f;
+fa → ファ;
+fi → フィ;
+fu → フ;
+fe → フェ;
+fo → フォ;
+#
+#
+bb → ッ | b;
+ba → バ;
+bi → ビ;
+bu → ブ;
+be → ベ;
+bo → ボ;
+#
+#
+pp → ッ | p;
+pa → パ;
+pi → ピ;
+pu → プ;
+pe → ペ;
+po → ポ;
+#
+#
+vv → ッ | v;
+va → ヴァ;
+vi → ヴィ;
+vu → ヴ;
+ve → ヴェ;
+vo → ヴォ;
+#
+#
+sa } nt[ao] → サ;
+ss → ッ | \~s;
+#
+#
+# 's' is voiced before [bdglmnrv].
+sb → ズ | b;
+sd → ズ | d;
+sg → ズ | g;
+sl → ズ | l;
+sm → ズ | m;
+sn → ズ | n;
+sr → ズ | r;
+sv → ズ | v;
+#
+#
+# Force 's' after a consonat to be unvoiced.
+($consonant) s } $vowel → | $1 \~ s;
+\~sa → サ;
+\~si → シ;
+\~su → ス;
+\~se → セ;
+\~so → ソ;
+#
+#
+# 's' at the beginning is usually unvoiced.
+[:^Letter:] { sa → サ;
+[:^Letter:] { si → シ;
+[:^Letter:] { su → ス;
+[:^Letter:] { se → セ;
+[:^Letter:] { so → ソ;
+#
+#
+# Otherwise voiced 's' are common.
+sa → ザ;
+si → ジ;
+su → ズ;
+se → ゼ;
+so → ゾ;
+#
+#
+scia → シャ;
+sci → シ;
+sce → シェ;
+#
+#
+zz → ッ | \~z;
+#
+# Force 'z' after a consonat to be unvoiced.
+($consonant) z → | $1 \~z;
+\~za → ツァ;
+\~zi → ツィ;
+\~zu → ツ;
+\~ze → ツェ;
+\~zo → ツォ;
+#
+#
+# Otherwise voiced 'z' are common except for 'zi'.
+za → ザ;
+[:^Letter:] { zi → ジ;
+zi → ツィ;
+zu → ズ;
+ze → ゼ;
+zo → ゾ;
+#
+#
+ja → ヤ;
+je → イェ;
+j → | i;
+#
+#
+# Standalone vowels and consonants.
+a → ア;
+i → イ;
+u → ウ;
+e → エ;
+o → オ;
+#
+#
+b → ブ;
+c → ク;
+d → ド;
+f → フ;
+g → グ;
+h → ;
+k → | c;
+l → ル;
+m → ム;
+n → ン;
+p → プ;
+q → | c;
+r → ル;
+s → ス;
+t → ト;
+v → ヴ;
+x → | cs;
+y → | i;
+z → ツ;
+#
+#
+# word delimiter of transliterated foreign phrase is '・'.
+' ' → ・;
+#
+#
+# Latin hyphen should be transliterated to U+30A0 (KATAKANA-HIRAGANA
+# DOUBLE HYPHEN), ideally. But since the character isn't supported by
+# many fonts or software, we use U+FF1D (FULLWIDTH EQUALS SIGN),
+# which is widely used as "double hyphen".
+#
+\- → =;
+#
+#
+[:nonspacing mark:] → ;
+::NFC(NFD);
+