summary | refs | log | tree | commit | diff | stats
path: root/intl/icu/source/data/translit/blt_blt_FONIPA.txt
diff options
context:
space:
mode:
author: Daniel Baumann <daniel.baumann@progress-linux.org>, 2024-04-07 19:33:14 +0000
committer: Daniel Baumann <daniel.baumann@progress-linux.org>, 2024-04-07 19:33:14 +0000
commit: 36d22d82aa202bb199967e9512281e9a53db42c9 (patch)
tree: 105e8c98ddea1c1e4784a60a5a6410fa416be2de /intl/icu/source/data/translit/blt_blt_FONIPA.txt
parent: Initial commit. (diff)
download: firefox-esr-36d22d82aa202bb199967e9512281e9a53db42c9.tar.xz
          firefox-esr-36d22d82aa202bb199967e9512281e9a53db42c9.zip
Adding upstream version 115.7.0esr. [upstream/115.7.0esr] [upstream]
Signed-off-by: Daniel Baumann <daniel.baumann@progress-linux.org>
Diffstat (limited to 'intl/icu/source/data/translit/blt_blt_FONIPA.txt')
-rw-r--r-- intl/icu/source/data/translit/blt_blt_FONIPA.txt 139
1 files changed, 139 insertions, 0 deletions
diff --git a/intl/icu/source/data/translit/blt_blt_FONIPA.txt b/intl/icu/source/data/translit/blt_blt_FONIPA.txt
new file mode 100644
index 0000000000..dbe1c710c4
--- /dev/null
+++ b/intl/icu/source/data/translit/blt_blt_FONIPA.txt
@@ -0,0 +1,139 @@
+# © 2016 and later: Unicode, Inc. and others.
+# License & terms of use: http://www.unicode.org/copyright.html
+# Generated using tools/cldr/cldr-to-icu/build-icu-data.xml
+#
+# File: blt_blt_FONIPA.txt
+# Generated from CLDR
+#
+
+# Output phonemes
+# ---------------
+# Nasals: m mʷ n nʷ ɲ ɲʷ ŋ ŋʷ
+# Plosives: p pʰ pʰʷ pʷ b t tʷ tʰ d dʷ k kʰ kʰʷ kʷ ɡ ɡʷ ʔ
+# Fricatives: f fʷ v s sʷ h hʷ x xʷ
+# Other consonants: w j l r (r only in loanwords)
+# Affricates: t\u0361ɕ t\u0361ɕʷ t\u0361ɕʰ t\u0361ɕʰʷ
+# Vowels: i ɨ u ɛ e ə ɔ o a aː
+# Diphthongs: iə\u032F ɨə\u032F uə\u032F ai\u032F
+# Tones: ˨ ˧˥ ˨˩ ˥ ˦ ˧˩
+#
+#
+# Limitations
+# -----------
+# Currently, these rules only support the tone marks (U+AABF, U+AAC1), but not the tone letters (U+AAC0, U+AAC2).
+#
+#
+# References
+# ----------
+# [1] Jim Brase, SIL International: Proposal to encode the Tai Viet script
+# in the UCS. ISO/IEC JTC1/SC2/WG2 N3220. March 20, 2007.
+# http://std.dkuug.dk/jtc1/sc2/wg2/docs/n3220.pdf
+#
+# [2] ScriptSource: Tai Viet Vowels.
+# http://scriptsource.org/entry/eusd5ehysa
+#
+# [3] ScriptSource: Tai Viet Consonants.
+# http://scriptsource.org/entry/lbwpkrqk7b
+#
+# [4] http://www.seasite.niu.edu/tai/TaiDam/tones.htm
+$LO = [ꪀ ꪂ ꪄ ꪆ ꪈ ꪊ ꪌ ꪎ ꪐ ꪒ ꪔ ꪖ ꪘ ꪚ ꪜ ꪞ ꪠ ꪢ ꪤ ꪦ ꪨ ꪪ ꪬ ꪮ]; # consonants whose syllables get tone classes 1-3 in the tone rules
+$HI = [ꪁ ꪃ ꪅ ꪇ ꪉ ꪋ ꪍ ꪏ ꪑ ꪓ ꪕ ꪗ ꪙ ꪛ ꪝ ꪟ ꪡ ꪣ ꪥ ꪧ ꪩ ꪫ ꪭ ꪯ]; # consonants whose syllables get tone classes 4-6 in the tone rules
+$C = [$LO $HI]; # any consonant letter
+$V1 = [ꪵ ꪶ ꪹ ꪻ ꪼ]; # vowels written before consonant
+$V2 = [ \uAAB0 \uAAB2 \uAAB3 \uAAB4 \uAAB7 \uAAB8 \uAABE]; # vowels written above or below consonant
+$V3 = [ꪱ ꪮ ꪺ ꪽ]; # vowels written after consonant
+$DIGRAPHS = [{ꪹ \uAAB8} {ꪹ \uAAB7} {ꪹ ꪱ}]; # two-character vowel spellings that start with ꪹ
+$V12 = [$V1 $V2 $DIGRAPHS]; # $V1 and $V2 vowels plus the digraphs
+$V123 = [$V12 $V3]; # any vowel spelling
+$W = [ꪫ]; # labialization marker
+$F = [$C]; # syllable-final consonant (any consonant letter is accepted)
+$IPA_TONE = [˥ ˦ ˧ ˨ ˩]; # the IPA tone letters that the tone rules emit
+$NOT_IPA_TONE = [^$IPA_TONE]; # complement of $IPA_TONE
+$BOUNDARY = [^[:L:][:M:][:N:]]; # anything that is not a letter, mark or number
+# Consonants at the end of “checked” syllables: the letters later mapped to p, pʰ, t, tʰ, k, kʰ and ʔ.
+$CHK = [ꪜ ꪝ ꪞ ꪟ ꪔ ꪕ ꪖ ꪗ ꪀ ꪁ ꪂ ꪃ ꪮ ꪯ];
+# The Tai Viet script uses visual ordering. Convert to logical order by moving a leading $V1 vowel behind its consonant (and ꪫ, if present).
+($V1) ($C $W?) → $2 $1;
+::null; # pass boundary: the rules below run on the reordered text
+# Special handling for stand-alone ꪽ ‘that’: only when a $BOUNDARY character sits on both sides.
+$BOUNDARY {ꪽ} $BOUNDARY → nan˧˩;
+# Convert tones for checked syllables (those ending in /p/, /t/, /k/, /ʔ/). The IPA tone is inserted after the final consonant.
+$LO $W? $V12 {($CHK)} → $1 ˧˥; # Tone class 2: High-rising tone
+$LO $W? {($V3 $CHK)} → $1 ˧˥; # Tone class 2: High-rising tone
+$HI $W? $V12 {($CHK)} → $1 ˦; # Tone class 5: High-mid tone
+$HI $W? {($V3 $CHK)} → $1 ˦; # Tone class 5: High-mid tone
+# Convert tones for unchecked syllables with vowels that are written
+# after the consonant (V3). Here the tone mark precedes the vowel; it is dropped and the IPA tone is appended after the vowel and optional final.
+# TODO: Also support tone letters, not just tone marks.
+$LO $W? { \uAABF ($V3 $F?)} → $1 ˧˥; # Tone class 2: High-rising tone
+$LO $W? { \uAAC1 ($V3 $F?)} → $1 ˨˩; # Tone class 3: Low-falling tone
+$HI $W? { \uAABF ($V3 $F?)} → $1 ˦; # Tone class 5: High-mid tone
+$HI $W? { \uAAC1 ($V3 $F?)} → $1 ˧˩; # Tone class 6: Mid-falling tone
+# Convert tones for unchecked syllables with vowels that are either written
+# before the consonant (V1) or vowels that are written above or below it (V2). Here the tone mark follows the vowel; the IPA tone replaces it after the optional final.
+# TODO: Also support tone letters, not just tone marks.
+$LO $W? $V12 { \uAABF ($F?)} → $1 ˧˥; # Tone class 2: High-rising tone
+$LO $W? $V12 { \uAAC1 ($F?)} → $1 ˨˩; # Tone class 3: Low-falling tone
+$HI $W? $V12 { \uAABF ($F?)} → $1 ˦; # Tone class 5: High-mid tone
+$HI $W? $V12 { \uAAC1 ($F?)} → $1 ˧˩; # Tone class 6: Mid-falling tone
+::null; # pass boundary: tones assigned above are visible to the default-tone rules
+{($LO $W? $V123 $F?)} $NOT_IPA_TONE → $1 ˨; # Tone class 1: Low-mid tone. Default when no IPA tone follows the syllable.
+{($HI $W? $V123 $F?)} $NOT_IPA_TONE → $1 ˥; # Tone class 4: High tone. Default when no IPA tone follows the syllable.
+::null;
+# Harden syllable-final consonants. NOTE(review): this runs after tone assignment and ꪒ is not in $CHK, so such syllables get the default tone; confirm this is intended.
+$C $W? $V123 {ꪒ} → ꪔ; # /d/ → /t/
+::null;
+# Convert labialization marker.
+$C {$W} $V123 → ʷ; # only ꪫ between a consonant and a vowel; other ꪫ/ꪪ are handled by the w/v rules
+::null;
+[ꪀ ꪁ] → k; # Consonants: each $LO/$HI letter pair maps to the same IPA consonant
+[ꪂ ꪃ] → kʰ; # Tai Dón; not used in Tai Dam according to [3]
+[ꪄ ꪅ] → x;
+[ꪆ ꪇ] → ɡ; # only in loanwords, according to [3]
+[ꪈ ꪉ] → ŋ;
+[ꪊ ꪋ] → t\u0361ɕ; # Tai Dón; not used in Tai Dam according to [3]
+[ꪌ ꪍ] → t\u0361ɕʰ; # Tai Dón; not used in Tai Dam according to [3]
+[ꪎ ꪏ] → s;
+[ꪐ ꪑ] → ɲ;
+[ꪒ ꪓ] → d;
+[ꪔ ꪕ] → t;
+[ꪖ ꪗ] → tʰ;
+[ꪘ ꪙ] → n;
+[ꪚ ꪛ] → b;
+[ꪜ ꪝ] → p;
+[ꪞ ꪟ] → pʰ; # Tai Dón; not used in Tai Dam according to [3]
+[ꪠ ꪡ] → f;
+[ꪢ ꪣ] → m;
+[ꪤ ꪥ] → j;
+[ꪦ ꪧ] → r; # only in loanwords, according to [3]
+[ꪨ ꪩ] → l;
+{[ꪪ ꪫ]} $IPA_TONE → w; # at the end of a syllable (directly before the IPA tone letters inserted by the tone rules)
+[ꪪ ꪫ] → v; # not at the end of a syllable
+[ꪬ ꪭ] → h;
+ʔ {[ꪮ ꪯ]} → ɔ; # e.g. ꪮꪮꪀ: a ꪮ/ꪯ right after an already-converted ʔ is read as the vowel
+[ꪮ ꪯ] → ʔ; # any other ꪮ/ꪯ is the glottal stop
+# Digraphs. Listed before the single-vowel rules so that ꪹ plus a second vowel sign is consumed as one unit.
+ꪹ \uAAB8 → e;
+ꪹ \uAAB7 → ə;
+ꪹ ꪱ → aːw;
+# Vowels. Each remaining vowel sign maps on its own.
+\uAAB0 → a;
+ꪱ → aː;
+\uAAB2 → i;
+\uAAB3 → ɨ;
+\uAAB4 → u;
+ꪵ → ɛ;
+ꪶ → o;
+\uAAB7 → ɔ;
+ꪮ → ɔ; # NOTE(review): appears unreachable, since the earlier context-free [ꪮ ꪯ] → ʔ rule in this pass already consumes every ꪮ; confirm
+ꪺ → uə\u032F;
+ꪽ → an;
+ꪹ → ɨə\u032F;
+\uAAB8 → iə\u032F;
+ꪻ → əw;
+ꪼ → ai\u032F;
+\uAABE → am;
+# Word ligature symbols. Each expands to a whole syllable including its IPA tone.
+ꫛ → kon˥;
+ꫜ → nɨŋ˦;
+