diff options
author | Daniel Baumann <daniel.baumann@progress-linux.org> | 2024-04-28 14:29:10 +0000 |
---|---|---|
committer | Daniel Baumann <daniel.baumann@progress-linux.org> | 2024-04-28 14:29:10 +0000 |
commit | 2aa4a82499d4becd2284cdb482213d541b8804dd (patch) | |
tree | b80bf8bf13c3766139fbacc530efd0dd9d54394c /intl/icu/source/data/translit/ja_Latn_ru.txt | |
parent | Initial commit. (diff) | |
download | firefox-upstream.tar.xz firefox-upstream.zip |
Adding upstream version 86.0.1. (refs: upstream/86.0.1, upstream)
Signed-off-by: Daniel Baumann <daniel.baumann@progress-linux.org>
Diffstat (limited to 'intl/icu/source/data/translit/ja_Latn_ru.txt')
-rw-r--r-- | intl/icu/source/data/translit/ja_Latn_ru.txt | 129 |
1 files changed, 129 insertions, 0 deletions
diff --git a/intl/icu/source/data/translit/ja_Latn_ru.txt b/intl/icu/source/data/translit/ja_Latn_ru.txt
new file mode 100644
index 0000000000..fc2bf525a2
--- /dev/null
+++ b/intl/icu/source/data/translit/ja_Latn_ru.txt
@@ -0,0 +1,129 @@
+# © 2016 and later: Unicode, Inc. and others.
+# License & terms of use: http://www.unicode.org/copyright.html#License
+#
+# File: ja_Latn_ru.txt
+# Generated from CLDR
+#
+
+# Japanese (Rōmaji) to Russian (Cyrillic) Polivanov transliteration for ICU.
+# Can be run in sequence after e.g. Katakana-Latin.
+#
+# These rules cannot be used to target Bulgarian, Serbian, Tajik, or Ukrainian.
+#
+# TODO: Cyrillization needs to respect morpheme/Kanji boundaries.
+# 中井 becomes Накаи, but 北海道 becomes Хоккайдо. We need boundary
+# markup in the input in order to do that properly.
+#
+::NFD(NFC); # decompose first so vowel-length marks are separate combining characters
+::[:Latin:] Lower(); # every rule below matches lowercase Latin only
+#
+#
+$lengthMarker = [\u0302\u0304]; # U+0302 combining circumflex, U+0304 combining macron
+#
+#
+# Delete apostrophes. Apostrophes after "n" are consumed below.
+\' → ;
+#
+#
+# Turn long /e:/ into diphthong /ei/.
+# Note that /ei/ across a morpheme boundary (e.g. 武井 Takei) becomes эи.
+e $lengthMarker → эй ;
+#
+#
+# Turn long /i:/ into two vowels /ii/.
+i $lengthMarker → | i i ;
+#
+#
+# Ignore vowel length everywhere else.
+$lengthMarker → ;
+#
+#
+# Vowels.
+#
+# TODO(mjansche): Enable diphthongs once we have Kanji boundaries.
+## ai → ай ;
+a → а ;
+i\~e → | ye ;
+i → и ;
+u\~ → в ; # ウィ etc.
+#
+## ui → уй ;
+u → у ;
+e → э ;
+o → о ;
+#
+#
+# Consonants.
+#
+k → к ;
+#
+#
+sh → | sy ; # "|" leaves the cursor before "sy", so the s and y* rules rewrite it (shi → си)
+s → с ;
+#
+#
+ch → | ty ; # likewise re-read as t + y* (chi → ти)
+c } ch → t ; # NOTE(review): emits Latin "t" with no "|" cursor reset — confirm it is not left un-cyrillized
+te\~ → | t ; # テュ
+to\~ → | t ; # トゥ
+tsu\~ → | ts ; # ツァ, ツィ, etc.
+ts → ц ;
+t → т ;
+#
+#
+\~tsu → | tsu ;
+#
+#
+n } [bpm] → м ; # 群馬 → Гумма
+n\' → нъ ;
+n → н ;
+#
+#
+h → х ;
+fu\~ → | f ; # フュ
+f → ф ;
+#
+#
+m → м ;
+#
+#
+ya → я ;
+yi → и ; # Added for convenience, after sh, ch, j.
+yu → ю ;
+ye → е ; # ?? unobserved
+yo → ё ;
+#
+#
+r → р ;
+#
+#
+wa → ва ;
+w → ; # any w not followed by "a" is dropped
+#
+#
+g → г ;
+#
+#
+j → | zy ; # re-read as z + y* (ji → дзи)
+z → дз ;
+#
+#
+de\~ → | d ; # デュ
+dji\~ → | z ; # ヂャ, ヂュ, etc.
+dj → | j ; # ヂ
+do\~ → | d ; # ドゥ
+dzu\~ → | z ; # ヅァ, ヅィ, etc.
+dz → | z ; # ヅ
+d → д ;
+#
+#
+b → б ;
+vu\~ → | v ; # ヴァ, etc.
+v → в ; # ?? unobserved
+#
+#
+p → п ;
+#
+#
+::NFC(NFD); # recompose the output after the rules have run
+
|