summaryrefslogtreecommitdiffstats
path: root/intl/icu/source/data/translit/InterIndic_Arabic.txt
diff options
context:
space:
mode:
authorDaniel Baumann <daniel.baumann@progress-linux.org>2024-04-19 01:47:29 +0000
committerDaniel Baumann <daniel.baumann@progress-linux.org>2024-04-19 01:47:29 +0000
commit0ebf5bdf043a27fd3dfb7f92e0cb63d88954c44d (patch)
treea31f07c9bcca9d56ce61e9a1ffd30ef350d513aa /intl/icu/source/data/translit/InterIndic_Arabic.txt
parentInitial commit. (diff)
downloadfirefox-esr-0ebf5bdf043a27fd3dfb7f92e0cb63d88954c44d.tar.xz
firefox-esr-0ebf5bdf043a27fd3dfb7f92e0cb63d88954c44d.zip
Adding upstream version 115.8.0esr.upstream/115.8.0esr
Signed-off-by: Daniel Baumann <daniel.baumann@progress-linux.org>
Diffstat (limited to 'intl/icu/source/data/translit/InterIndic_Arabic.txt')
-rw-r--r--intl/icu/source/data/translit/InterIndic_Arabic.txt135
1 files changed, 135 insertions, 0 deletions
diff --git a/intl/icu/source/data/translit/InterIndic_Arabic.txt b/intl/icu/source/data/translit/InterIndic_Arabic.txt
new file mode 100644
index 0000000000..8f31e05bdf
--- /dev/null
+++ b/intl/icu/source/data/translit/InterIndic_Arabic.txt
@@ -0,0 +1,135 @@
+# © 2016 and later: Unicode, Inc. and others.
+# License & terms of use: http://www.unicode.org/copyright.html
+# Generated using tools/cldr/cldr-to-icu/build-icu-data.xml
+#
+# File: InterIndic_Arabic.txt
+# Generated from CLDR
+#
+
+$nonword = [^\uE000-\uE0FF]; # any character outside U+E000-U+E0FF, the range in which every source code point of these rules lies
+$wordBoundary = [^[:L:][:M:][:N:]]; # any character that is not a letter, mark, or number
+\uE015\uE03F\uE02F\uE03E } $nonword→كيا; # किया when followed by $nonword
+\uE026\uE03F\uE02F\uE03E } $nonword→ديا; # दिया when followed by $nonword
+\uE015\uE03F } $nonword→كي; # कि at word end
+\uE039\uE048→هي; # ह\u0948
+\uE001 } $nonword→ن; # chandrabindu at end to noon
+\uE001→ن; # chandrabindu not at end to noon
+\uE002 } $nonword→ن; # anusvara to noon at end
+\uE002→ن; # anusvara to noon \u0902
+\uE003→ه ا; # visarga to ha + alif ः
+\uE004→ا; # short a to alif ऄ
+\uE005→ا; # अ
+\uE006→ا \u0653; # alif with madda (\u0653) आ
+[[:L:][:M:]] {\uE007}→ي; # इ after another letter or mark
+\uE007→إ; # इ at beginning of word
+[[:L:][:M:]] {\uE008}→ي; # ई after another letter or mark
+\uE008→إ; # ई at beginning of word
+\uE009→و; # उ
+\uE00A→و; # ऊ
+\uE00B→ر; # ऋ
+\uE00C→ل; # ऌ
+\uE00D→ا ي; # ऍ
+\uE00E→ي; # ऎ
+$wordBoundary {\uE00F} → إي; # word-initial ए
+\uE00F } $nonword→ي; # ए use ي when at end
+\uE00F→ي; # ए use ي when not at end
+\uE010 } $nonword→ا ي; # ऐ use alif + ي when at end
+\uE010→ا ي; # ऐ use alif + ي when not at end
+\uE011→ا و; # ऑ
+\uE012→ا و; # ऒ
+\uE013→ا و; # ओ
+\uE014→ا و; # औ
+\uE015→ك; # क
+\uE016→كه; # ख
+\uE017→ج; # ग
+\uE018→جه; # घ
+\uE019→نج; # ङ
+\uE01A→تش; # च
+\uE01B→تشه; # छ
+\uE01C→ج; # ज
+\uE01D→جه; # झ
+\uE01E→ن; # ञ
+\uE01F→ط; # ट
+\uE020→طه; # ठ
+\uE021→د; # ड
+\uE022→ده; # ढ
+\uE023→ن; # ण
+\uE024→ت; # त
+\uE025→ته; # थ
+\uE026→د; # द
+\uE027→ده; # ध
+\uE028→ن; # न
+\uE029→ن; # ऩ
+\uE02A→ب; # प
+\uE02B→به; # फ
+\uE02C→ب; # ब
+\uE02D→به; # भ
+\uE02E→م; # म
+\uE02F→ي; # य
+\uE030→ر; # र
+\uE031→ر; # ऱ
+\uE032→ل; # ल
+\uE033→ر; # ळ
+\uE034→ر; # ऴ
+\uE035→و; # व
+\uE036→ش; # श
+\uE037→ش; # ष
+\uE038→س; # स
+\uE039→ه; # ह
+\uE03C→; # \u093C (nukta) is dropped
+\uE03D→; # ऽ (avagraha) is dropped
+\uE03E→ا; # ा
+\uE03F→ي; # ि
+\uE040→ي; # ी
+\uE041→و; # \u0941
+\uE042→و; # \u0942
+\uE043→ر; # \u0943
+\uE044→ر; # \u0944
+\uE045→ن; # \u0945
+\uE046→ي; # \u0946
+\uE047 } $nonword→ي; # \u0947 use ي when at end
+\uE047→ي; # \u0947 use ي when not at end
+\uE048 } $nonword→ا ي; # \u0948 use alif + ي when at end
+\uE048→ا ي; # \u0948 use alif + ي when not at end
+\uE049→و; # ॉ
+\uE04A→ا و; # ॊ
+\uE04B→و; # ो
+\uE04C→ا و; # ौ
+\uE04D→; # \u094D (virama) is dropped
+\uE050→ا و; # ॐ
+\uE051→; # \u0951
+\uE052→; # \u0952
+\uE053→; # \u0953
+\uE054→; # \u0954
+\uE058→ق; # क़
+\uE059→خ; # ख़
+\uE05A→غ; # ग़
+\uE05B→ز; # ज़
+\uE05C→ر; # ड़
+\uE05D→ره; # ढ़
+\uE05E→ف; # फ़
+\uE05F→ي; # य़
+\uE060→ر; # ॠ
+\uE061→ل; # ॡ
+\uE062→ل; # \u0962
+\uE063→ل; # \u0963
+\uE064→۔; # ।
+\uE065→۔; # ॥
+\uE066→\.; # ० NOTE(review): emits a literal period, whereas १-९ below map to Arabic-Indic digits; confirm this is intended
+\uE067→١; # १
+\uE068→٢; # २
+\uE069→٣; # ३
+\uE06A→٤; # ४
+\uE06B→٥; # ५
+\uE06C→٦; # ६
+\uE06D→٧; # ७
+\uE06E→٨; # ८
+\uE06F→٩; # ९
+\uE070→\.; # ॰
+\uE082→; # ॽ
+# Collapse runs of consecutive alif characters (each with any trailing marks) into the first one.
+# For example, transform पाओला → بااولا → باولا.
+::null;
+$alif = [أإآا] [:M:]*;
+($alif) $alif+ → $1;
+