diff options
author | Daniel Baumann <daniel.baumann@progress-linux.org> | 2024-04-19 01:47:29 +0000 |
---|---|---|
committer | Daniel Baumann <daniel.baumann@progress-linux.org> | 2024-04-19 01:47:29 +0000 |
commit | 0ebf5bdf043a27fd3dfb7f92e0cb63d88954c44d (patch) | |
tree | a31f07c9bcca9d56ce61e9a1ffd30ef350d513aa /intl/icu/source/data/translit/InterIndic_Latin.txt | |
parent | Initial commit. (diff) | |
download | firefox-esr-0ebf5bdf043a27fd3dfb7f92e0cb63d88954c44d.tar.xz firefox-esr-0ebf5bdf043a27fd3dfb7f92e0cb63d88954c44d.zip |
Adding upstream version 115.8.0esr.upstream/115.8.0esr
Signed-off-by: Daniel Baumann <daniel.baumann@progress-linux.org>
Diffstat (limited to 'intl/icu/source/data/translit/InterIndic_Latin.txt')
-rw-r--r-- | intl/icu/source/data/translit/InterIndic_Latin.txt | 499 |
1 files changed, 499 insertions, 0 deletions
diff --git a/intl/icu/source/data/translit/InterIndic_Latin.txt b/intl/icu/source/data/translit/InterIndic_Latin.txt new file mode 100644 index 0000000000..44d1ea1733 --- /dev/null +++ b/intl/icu/source/data/translit/InterIndic_Latin.txt @@ -0,0 +1,499 @@ +# © 2016 and later: Unicode, Inc. and others. +# License & terms of use: http://www.unicode.org/copyright.html +# Generated using tools/cldr/cldr-to-icu/build-icu-data.xml +# +# File: InterIndic_Latin.txt +# Generated from CLDR +# + +# InterIndic-Latin +#\u0E00 reserved +#consonants +$chandrabindu=\uE001; +$anusvara=\uE002; +$visarga=\uE003; +#\u0E004 reserved +# w←vowel→ represents the stand-alone form +$wa=\uE005; +$waa=\uE006; +$wi=\uE007; +$wii=\uE008; +$wu=\uE009; +$wuu=\uE00A; +$wr=\uE00B; +$wl=\uE00C; +$wce=\uE00D; # LETTER CANDRA E +$wse=\uE00E; # LETTER SHORT E +$we=\uE00F; # ए LETTER E +$wai=\uE010; +$wco=\uE011; # LETTER CANDRA O +$wso=\uE012; # LETTER SHORT O +$wo=\uE013; # ओ LETTER O +$wau=\uE014; +$ka=\uE015; +$kha=\uE016; +$ga=\uE017; +$gha=\uE018; +$nga=\uE019; +$ca=\uE01A; +$cha=\uE01B; +$ja=\uE01C; +$jha=\uE01D; +$nya=\uE01E; +$tta=\uE01F; +$ttha=\uE020; +$dda=\uE021; +$ddha=\uE022; +$nna=\uE023; +$ta=\uE024; +$tha=\uE025; +$da=\uE026; +$dha=\uE027; +$na=\uE028; +$ena=\uE029; #compatibility +$pa=\uE02A; +$pha=\uE02B; +$ba=\uE02C; +$bha=\uE02D; +$ma=\uE02E; +$ya=\uE02F; +$ra=\uE030; +$vva=\uE081; +$rra=\uE031; +$la=\uE032; +$lla=\uE033; +$ela=\uE034; #compatibility +$va=\uE035; +$sha=\uE036; +$ssa=\uE037; +$sa=\uE038; +$ha=\uE039; +#\u093A Reserved +#\u093B Reserved +$nukta=\uE03C; +$avagraha=\uE03D; # SIGN AVAGRAHA +# ←vowel→ represents the dependent form +$aa=\uE03E; +$i=\uE03F; +$ii=\uE040; +$u=\uE041; +$uu=\uE042; +$rh=\uE043; +$rrh=\uE044; +$ce=\uE045; #VOWEL SIGN CANDRA E +$se=\uE046; #VOWEL SIGN SHORT E +$e=\uE047; +$ai=\uE048; +$co=\uE049; # VOWEL SIGN CANDRA O +$so=\uE04A; # VOWEL SIGN SHORT O +$o=\uE04B; # ो +$au=\uE04C; +$virama=\uE04D; +# \u094E Reserved +# \u094F Reserved +$om=\uE050; # OM +\uE051→; # UNMAPPED STRESS SIGN UDATTA +\uE052→; # UNMAPPED STRESS SIGN ANUDATTA +\uE053→; # UNMAPPED GRAVE ACCENT +\uE054→; # UNMAPPED ACUTE ACCENT +$lm = \uE055;# Telugu Length Mark +$ailm=\uE056;# AI Length Mark +$aulm=\uE057;# AU Length Mark +#urdu compatibility forms +$uka=\uE058; +$ukha=\uE059; +$ugha=\uE05A; +$ujha=\uE05B; +$uddha=\uE05C; +$udha=\uE05D; +$ufa=\uE05E; +$uya=\uE05F; +$wrr=\uE060; +$wll=\uE061; +$lh=\uE062; +$llh=\uE063; +$danda=\uE064; +$doubleDanda=\uE065; +$zero=\uE066; # DIGIT ZERO +$one=\uE067; # DIGIT ONE +$two=\uE068; # DIGIT TWO +$three=\uE069; # DIGIT THREE +$four=\uE06A; # DIGIT FOUR +$five=\uE06B; # DIGIT FIVE +$six=\uE06C; # DIGIT SIX +$seven=\uE06D; # DIGIT SEVEN +$eight=\uE06E; # DIGIT EIGHT +$nine=\uE06F; # DIGIT NINE +# Glottal stop +$dgs=\uE082; +#Khanda-ta +$kta=\uE083; +$depVowelAbove=[\uE03E-\uE040\uE045-\uE04C]; +$depVowelBelow=[\uE041-\uE044]; +# $x was originally called '§'; $z was '%' +$x=[$aa$ai$au$ii$i$uu$u$rrh$rh$lh$llh$e$o$se$ce$so$co]; +$z=[bcdfghjklmnpqrstvwxyz]; +$vowels=[aeiour\u0304\u0325\u0306]; +$forceIndependentMatra = [^[[:L:][\u0300-\u034C]]]; +###################################################################### +# convert from Native letters to Latin letters +###################################################################### +#transliterations for anusvara +$anusvara} [$ka$kha$ga$gha$nga] → n\u0307; +$anusvara} [$ca$cha$ja$jha$nya] → n\u0304; +$anusvara} [$tta$ttha$dda$ddha$nna] → n\u0323; +$anusvara} [$ta$tha$da$dha$na] → n; +$anusvara} [$pa$pha$ba$bha$ma] → m; +$anusvara} [$ya$ra$lla$la$va$ssa$sha$sa$ha] → n; +$anusvara→ m\u0307; +# Urdu compatibility +$ya$nukta}$x → y\u0307; +$ya$nukta$virama → y\u0307; +$ya$nukta → y\u0307a; +$la$nukta }$x → l\u0331; +$la$nukta$virama → l\u0331; +$la$nukta → l\u0331a; +$na$nukta }$x → n\u0331; +$na$nukta$virama → n\u0331; +$na$nukta → n\u0331a; +$ena }$x → n\u0331; +$ena$virama → n\u0331; +$ena → n\u0331a; +$uka → qa; +$ka$nukta }$x → q; +$ka$nukta$virama → q; +$ka$nukta → qa; +$kha$nukta }$x → k\u0331h\u0331; +$kha$nukta$virama → k\u0331h\u0331; +$kha$nukta → k\u0331h\u0331a; +$ukha$virama → k\u0331h\u0331; +$ukha → k\u0331h\u0331a; +$ugha → g\u0307a; +$ga$nukta }$x → g\u0307; +$ga$nukta$virama → g\u0307; +$ga$nukta → g\u0307a; +$ujha → za; +$ja$nukta }$x → z; +$ja$nukta$virama → z; +$ja$nukta → za; +$ddha$nukta}$x → r\u0323h; +$ddha$nukta$virama → r\u0323h; +$ddha$nukta → r\u0323ha; +$uddha}$x → r\u0323; +$uddha$virama → r\u0323; +$uddha → r\u0323a; +$udha → r\u0323a; +$dda$nukta}$x → r\u0323; +$dda$nukta$virama → r\u0323; +$dda$nukta → r\u0323a; +$pha$nukta }$x → f; +$pha$nukta$virama → f; +$pha$nukta → fa; +$ufa }$x → f; +$ufa$virama → f; +$ufa → fa; +$ra$nukta}$x → r\u0331; +$ra$nukta$virama → r\u0331; +$ra$nukta → r\u0331a; +$lla$nukta}$x → l\u0331; +$lla$nukta$virama → l\u0331; +$lla$nukta → l\u0331a; +$ela}$x → l\u0331; +$ela$virama → l\u0331; +$ela → l\u0331a; +$uya}$x → y\u0307; +$uya$virama → y\u0307; +$uya → y\u0307a; +# normal consonants +$ka$virama}$ha→k''; +$ka}$x→k; +$ka$virama→k; +$ka→ka; +$kha}$x→kh; +$kha$virama→kh; +$kha→kha; +$ga$virama}$ha→g''; +$ga}$x→g; +$ga$virama→g; +$ga→ga; +$gha}$x→gh; +$gha$virama→gh; +$gha→gha; +$nga}$x→n\u0307; +$nga$virama→n\u0307; +$nga→n\u0307a; +$ca$virama}$ha→c''; +$ca}$x→c; +$ca$virama→c; +$ca→ca; +$cha}$x→ch; +$cha$virama→ch; +$cha→cha; +$ja$virama}$ha→j''; +$ja}$x→j; +$ja$virama→j; +$ja→ja; +$jha}$x→jh; +$jha$virama→jh; +$jha→jha; +$nya }$x→n\u0303; +$nya$virama→n\u0303; +$nya → n\u0303a; +$tta$virama}$ha→t\u0323''; +$tta}$x→t\u0323; +$tta$virama→t\u0323; +$tta→t\u0323a; +$ttha}$x→t\u0323h; +$ttha$virama→t\u0323h; +$ttha→t\u0323ha; +$dda}$x$ha→d\u0323''; +$dda}$x→d\u0323; +$dda$virama→d\u0323; +$dda→d\u0323a; +$ddha}$x→d\u0323h; +$ddha$virama→d\u0323h; +$ddha→d\u0323ha; +$nna}$x→n\u0323; +$nna$virama→n\u0323; +$nna→n\u0323a; +$ta$virama}$ha→t''; +$ta$virama}$ttha→t''; +$ta$virama}$tta→t''; +$ta$virama}$tha→t''; +$ta}$x→t; +$ta$virama→t; +$ta→ta; +$tha}$x→th; +$tha$virama→th; +$tha→tha; +$da$virama}$ha→d''; +$da$virama}$ddha→d''; +$da$virama}$dda→d''; +$da$virama}$dha→d''; +$da}$x→d; +$da$virama→d; +$da→da; +$dha}$x→dh; +$dha$virama→dh; +$dha→dha; +$na$virama}$ga→n''; +$na$virama}$ya→n''; +$na}$x→n; +$na$virama→n; +$na→na; +$pa$virama}$ha→p''; +$pa}$x→p; +$pa$virama→p; +$pa→pa; +$pha}$x→ph; +$pha$virama→ph; +$pha→pha; +$ba$virama}$ha→b''; +$ba}$x→b; +$ba$virama→b; +$ba→ba; +$bha}$x→bh; +$bha$virama→bh; +$bha→bha; +$ma$virama}$ma→m''; +$ma}$x→m; +$ma$virama→m; +$ma→ma; +$ya}$x→y; +$ya$virama→y; +$ya→ya; +$ra$virama}$ha→r''; +$ra}$x→r; +$ra$virama→r; +$ra→ra; +$vva$virama}$ha→w\u0307''; +$vva}$x→w\u0307; +$vva$virama→w\u0307; +$vva→w\u0307a; +$rra$virama}$ha→r\u0331''; +$rra}$x→r\u0331; +$rra$virama→r\u0331; +$rra→r\u0331a; +$la$virama}$ha→l''; +$la}$x→l; +$la$virama→l; +$la→la; +$lla$virama}$ha→l\u0323''; +$lla}$x→l\u0323; +$lla$virama→l\u0323; +$lla→l\u0323a; +$va}$x→v; +$va$virama→v; +$va→va; +$sa$virama}$ha→s''; +$sa$virama}$sha→s''; +$sa$virama}$ssa→s''; +$sa$virama}$sa→s''; +$sa}$x→s; +$sa$virama→s; +#for gurmukhi +$sa$nukta}$x→s\u0301; +$sa$nukta$virama→s\u0301; +$sa$nukta→s\u0301a; +$sa→sa; +$sha}$x→s\u0301; +$sha$virama→s\u0301; +$sha→s\u0301a; +$ssa}$x→s\u0323; +$ssa$virama→s\u0323; +$ssa→s\u0323a; +$ha}$x→h; +$ha$virama→h; +$ha→ha; +# dependent vowels (should never occur except following consonants) +$forceIndependentMatra{$aa → \u0314a\u0304; +$forceIndependentMatra{$ai → \u0314ai; +$forceIndependentMatra{$au → \u0314au; +$forceIndependentMatra{$ii → \u0314i\u0304; +$forceIndependentMatra{$i → \u0314i; +$forceIndependentMatra{$uu → \u0314u\u0304; +$forceIndependentMatra{$u → \u0314u; +$forceIndependentMatra{$rrh → \u0314r\u0325\u0304; +$forceIndependentMatra{$rh → \u0314r\u0325; +$forceIndependentMatra{$llh → \u0314l\u0325\u0304; +$forceIndependentMatra{$lh → \u0314l\u0325; +$forceIndependentMatra{$e → \u0314e\u0304; +$forceIndependentMatra{$o → \u0314o\u0304; +#extra vowels +$forceIndependentMatra{$ce → \u0314e\u0306; +$forceIndependentMatra{$co → \u0314o\u0306; +$forceIndependentMatra{$se → \u0314e; +$forceIndependentMatra{$so → \u0314o; +$forceIndependentMatra{$nukta →; # Nukta cannot appear independently or as first character +$forceIndependentMatra{$virama →; # Virama cannot appear independently or as first character +$aa → a\u0304; +$ai → ai; +$au → au; +$ii → i\u0304; +$i → i; +$uu → u\u0304; +$u → u; +$rrh → r\u0325\u0304; +$rh → r\u0325; +$llh → l\u0325\u0304; +$lh → l\u0325; +$e → e\u0304; +$o → o\u0304; +#extra vowels +$ce → e\u0306; +$co → o\u0306; +$se → e; +$so → o; +#dependent vowels when following independent vowels. Generally Illegal only for roundtripping +$waa} $x → a\u0304\u0314; +$wai} $x → ai\u0314; +$wau} $x → au\u0314; +$wii} $x → i\u0304\u0314; +$wi } $x → i\u0314; +$wuu} $x → u\u0304\u0314; +$wu } $x → u\u0314; +$wrr} $x → r\u0325\u0304\u0314; +$wr } $x → r\u0325\u0314; +$wll} $x → l\u0325\u0304\u0314; +$wl } $x → l\u0325\u0314; +$we } $x → e\u0304\u0314; +$wo } $x → o\u0304\u0314; +$wa } $x → a\u0314; +#extra vowels +$wce} $x → e\u0306\u0314; +$wco} $x → o\u0306\u0314; +$wse} $x → e\u0314; +$wso} $x → o\u0314; +$om} $x → ''om\u0314; +# independent vowels when preceded by vowels +$vowels{$waa → ''a\u0304; +$vowels{$wai → ''ai; +$vowels{$wau → ''au; +$vowels{$wii → ''i\u0304; +$vowels{$wi → ''i; +$vowels{$wuu → ''u\u0304; +$vowels{$wu → ''u; +$vowels{$wrr → ''r\u0325\u0304; +$vowels{$wr → ''r\u0325; +$vowels{$wll → ''l\u0325\u0304; +$vowels{$wl → ''l\u0325; +$vowels{$we → ''e\u0304; +$vowels{$wo → ''o\u0304; +$vowels{$wa → ''a; +#extra vowels +$vowels{$wce → ''e\u0306; +$vowels{$wco → ''o\u0306; +$vowels{$wse → ''e; +$vowels{$wso → ''o; +# independent vowels (otherwise) +$waa → a\u0304; +$wai → ai; +$wau → au; +$wii → i\u0304; +$wi → i; +$wuu → u\u0304; +$wu → u; +$wrr → r\u0325\u0304; +$wr → r\u0325; +$wll → l\u0325\u0304; +$wl → l\u0325; +$we → e\u0304; +$wo → o\u0304; +$wa → a; +#extra vowels +$wce → e\u0306; +$wco → o\u0306; +$wse → e; +$wso → o; +$om → ''om; +#stress marks +$avagraha → \u0315; +$chandrabindu$anusvara→\u0303; +$chandrabindu → m\u0310; +$visarga→h\u0323; +#numbers +$zero → 0; +$one → 1; +$two → 2; +$three → 3; +$four → 4; +$five → 5; +$six → 6; +$seven → 7; +$eight → 8; +$nine → 9; +$lm →; +$ailm →; +$aulm →; +$dgs→ʔ; +$kta→t\u0331; +$danda→'.'; +$doubleDanda→'.'; +\uE070→'.'; # ABBREVIATION SIGN +# LETTER RA WITH MIDDLE DIAGONAL +\uE071}$x→ra; +\uE071$virama→r; +\uE071→ra; +# LETTER RA WITH LOWER DIAGONAL +\uE072}$x→ra; +\uE072$virama→r; +\uE072→ra; +\uE073→; # RUPEE MARK +\uE074→; # RUPEE SIGN +\uE075→; # CURRENCY NUMERATOR ONE +\uE076→; # CURRENCY NUMERATOR TWO +\uE077→; # CURRENCY NUMERATOR THREE +\uE078→; # CURRENCY NUMERATOR FOUR +\uE079→; # CURRENCY NUMERATOR ONE LESS THAN THE DENOMINATOR +\uE07A→; # CURRENCY DENOMINATOR SIXTEEN +\uE07B→; # ISSHAR +\uE07C→; # TIPPI +\uE07D→; # ADDAK +\uE07E→; # IRI +\uE07F→; # URA +\uE080→; # EK ONKAR +\uE004→; # DEVANAGARI VOWEL SIGN SHORT A +$virama→; # remove remaining viramas +$nukta→\u0323 ; # combining dot below +\uE084→æ; # DEVANAGARI VOWEL SIGN SHORT A + |