summaryrefslogtreecommitdiffstats
path: root/intl/icu/source/data/translit/ja_Latn_ru.txt
diff options
context:
space:
mode:
authorDaniel Baumann <daniel.baumann@progress-linux.org>2024-04-07 19:33:14 +0000
committerDaniel Baumann <daniel.baumann@progress-linux.org>2024-04-07 19:33:14 +0000
commit36d22d82aa202bb199967e9512281e9a53db42c9 (patch)
tree105e8c98ddea1c1e4784a60a5a6410fa416be2de /intl/icu/source/data/translit/ja_Latn_ru.txt
parentInitial commit. (diff)
downloadfirefox-esr-36d22d82aa202bb199967e9512281e9a53db42c9.tar.xz
firefox-esr-36d22d82aa202bb199967e9512281e9a53db42c9.zip
Adding upstream version 115.7.0esr.upstream/115.7.0esr
Signed-off-by: Daniel Baumann <daniel.baumann@progress-linux.org>
Diffstat (limited to 'intl/icu/source/data/translit/ja_Latn_ru.txt')
-rw-r--r--intl/icu/source/data/translit/ja_Latn_ru.txt130
1 files changed, 130 insertions, 0 deletions
diff --git a/intl/icu/source/data/translit/ja_Latn_ru.txt b/intl/icu/source/data/translit/ja_Latn_ru.txt
new file mode 100644
index 0000000000..9d7ec6a240
--- /dev/null
+++ b/intl/icu/source/data/translit/ja_Latn_ru.txt
@@ -0,0 +1,130 @@
+# © 2016 and later: Unicode, Inc. and others.
+# License & terms of use: http://www.unicode.org/copyright.html
+# Generated using tools/cldr/cldr-to-icu/build-icu-data.xml
+#
+# File: ja_Latn_ru.txt
+# Generated from CLDR
+#
+
+# Japanese (Rōmaji) to Russian (Cyrillic) Polivanov transliteration for ICU.
+# Can be run in sequence after e.g. Katakana-Latin.
+#
+# These rules cannot be used to target Bulgarian, Serbian, Tajik, or Ukrainian.
+#
+# TODO: Cyrillization needs to respect morpheme/Kanji boundaries.
+# 中井 becomes Накаи, but 北海道 becomes Хоккайдо. We need boundary
+# markup in the input in order to do that properly.
+#
+::NFD(NFC); # Decompose first so a vowel's accent becomes a separate combining mark (NFC when run in reverse).
+::[:Latin:] Lower(); # Lowercase Latin letters; every pattern below is written in lowercase.
+#
+# Combining circumflex (U+0302) and combining macron (U+0304), treated as vowel-length marks.
+$lengthMarker = [\u0302\u0304];
+#
+# Delete apostrophes. An apostrophe right after "n" never reaches this rule:
+# the match starts at the "n", where the "n\'" rule below consumes both characters.
+\' → ;
+#
+#
+# Turn long /e:/ (e followed by a length mark) into the diphthong /ei/, written эй.
+# Note that /ei/ across a morpheme boundary (e.g. 武井 Takei) becomes эи.
+e $lengthMarker → эй ;
+#
+# Turn long /i:/ into two vowels /ii/. The "|" leaves the cursor before the
+# replacement, so the plain "i" rule then converts each of the two letters to и.
+i $lengthMarker → | i i ;
+#
+#
+# Ignore vowel length everywhere else: any remaining length mark is deleted.
+$lengthMarker → ;
+#
+#
+# Vowels.
+# Longer patterns are listed before the bare vowel because the first matching rule wins.
+# TODO(mjansche): Enable diphthongs once we have Kanji boundaries.
+## ai → ай ;
+a → а ;
+i\~e → | ye ; # Rewritten to "ye" and re-scanned, so the "ye" rule below produces е.
+i → и ;
+u\~ → в ; # ウィ etc.
+# NOTE(review): "\~" looks like the small-kana marker left by a preceding Kana-Latin step; confirm.
+## ui → уй ;
+u → у ;
+e → э ;
+o → о ;
+#
+#
+# Consonants.
+#
+k → к ;
+#
+# "sh" is rewritten to "sy" and re-scanned, e.g. sha → sya → ся, shi → syi → си.
+sh → | sy ;
+s → с ;
+#
+#
+ch → | ty ; # Rewritten to "ty" and re-scanned, e.g. cha → tya → тя.
+c } ch → | t ; # Geminate "cch", e.g. ccha → tcha → ття; "|" re-scans the new "t" so it does not stay Latin.
+te\~ → | t ; # テュ
+to\~ → | t ; # トゥ
+tsu\~ → | ts ; # ツァ, ツィ, etc.
+ts → ц ;
+t → т ;
+#
+#
+\~tsu → | tsu ; # Drops the "~" and re-scans "tsu". NOTE(review): presumably a stand-alone small ッ; confirm.
+#
+# Order matters for "n": assimilation to м before b/p/m, then "n'" → нъ, then plain н.
+n } [bpm] → м ; # 群馬 → Гумма
+n\' → нъ ;
+n → н ;
+#
+#
+h → х ;
+fu\~ → | f ; # フュ (drops "u~" and re-scans the "f")
+f → ф ;
+#
+#
+m → м ;
+# "y" + vowel becomes one Cyrillic letter. These rules also complete the
+# "sy", "ty" and "zy" sequences produced by the sh, ch and j rewrites.
+ya → я ;
+yi → и ; # Added for convenience, after sh, ch, j.
+yu → ю ;
+ye → е ; # ?? unobserved
+yo → ё ;
+#
+#
+r → р ;
+#
+# "wa" keeps its consonant as в; any other "w" is deleted, e.g. wo → о.
+wa → ва ;
+w → ;
+#
+#
+g → г ;
+#
+# "j" is rewritten to "zy" and re-scanned, e.g. ja → zya → дзя.
+j → | zy ;
+z → дз ;
+#
+# Every multi-letter "d…" pattern is rewritten to d, z or j and re-scanned ("|"); the rule for that letter finishes it.
+de\~ → | d ; # デュ
+dji\~ → | z ; # ヂャ, ヂュ, etc.
+dj → | j ; # ヂ
+do\~ → | d ; # ドゥ
+dzu\~ → | z ; # ヅァ, ヅィ, etc.
+dz → | z ; # ヅ
+d → д ;
+#
+#
+b → б ;
+vu\~ → | v ; # ヴァ, etc.
+v → в ; # ?? unobserved
+#
+#
+p → п ;
+#
+# Recompose the output to NFC; when the transform is run in reverse this step is NFD.
+::NFC(NFD);
+