blob: 68aaacf6415c8880a5d0c87262c533871fd79acd (
plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
|
# © 2016 and later: Unicode, Inc. and others.
# License & terms of use: http://www.unicode.org/copyright.html
# Generated using tools/cldr/cldr-to-icu/build-icu-data.xml
#
# File: ro_ro_FONIPA.txt
# Generated from CLDR
#
# Romanian orthography to phonemic transcription.
# http://en.wikipedia.org/wiki/Romanian_phonology
#
# TODO: Currently this transform does not palatalize consonants.
# Character sets referenced by the context-sensitive rules below.
# $VowelEI and $VowelAOU together make up $Vowel, the set of vowel letters.
$VowelEI = [e i î];
$VowelAOU = [a â ă o u];
$Vowel = [$VowelEI $VowelAOU];
# Any code point that is not a letter (L), a mark (M) or a number (N).
$Boundary = [^[:L:][:M:][:N:]];
# Normalize the input to NFC and lowercase it before the conversion rules
# run; the conversion rules in this file list lowercase letters only.
# The empty parentheses leave the reverse direction of each step empty.
:: NFC () ;
:: Lower () ;
# Special cases.
# Rules are tried in order and the first one that matches is applied, so this
# four-letter sequence has to be listed before the shorter "eoa" and "oai" rules.
eoai → eo\u032Faj ; # e.g. leoaică → /leo\u032Fajkə/, not /le\u032Fo\u032Faikə/
# Triphthongs.
# \u032F is COMBINING INVERTED BREVE BELOW, the IPA mark for a non-syllabic vowel.
# "\-" is an escaped literal hyphen, so rules such as "i\-ai" match hyphenated spellings.
eai → e\u032Faj ;
eau → e\u032Faw ;
eoa → e\u032Fo\u032Fa ;
i\-ai → jaj ;
ia\-i → jaj ;
iau → jaw ;
iei → jej ;
ieu → jew ;
# Only the text inside { } is replaced; $Boundary in front of it is context.
# This rule therefore rewrites "eu" only when it directly follows a $Boundary character.
$Boundary {eu} → jew ;
ioa → jo\u032Fa ;
ioi → joj ;
i\-oi → joj ;
iou → jow ;
oai → o\u032Faj ;
uai → waj ;
uau → waw ;
uăi → wəj ;
# Diphthongs.
# Two-letter vowel sequences. Where two rules share the same letters, the one
# with extra context is listed first so that it is tried before the general rule.
ai → aj ;
âi → ɨj ;
ăi → əj ;
# Text after "}" is trailing context: it must match but is not replaced.
# Before "r", "au" is kept as the two vowels a + u instead of a + w.
au} r → au ;
au → aw ;
âu → ɨw ;
ău → əw ;
ea → e\u032Fa ;
ei → ej ;
eo → e\u032Fo ;
e\-o → e\u032Fo ;
eu → ew ;
e\-u → e\u032Fu ;
ia → ja ;
i\-a → ja ;
ie → je ;
ii → ij ;
io → jo ;
# "iu" followed by a vowel letter or a $Boundary character becomes i + w;
# in every other position the next rule applies and it becomes j + u.
iu} [$Vowel $Boundary] → iw ;
iu → ju ;
oa → o\u032Fa ;
oi → oj ;
ou → ow ;
ua → wa ;
uâ → wɨ ;
uă → wə ;
ue → we ;
ui → uj ;
uu → uw ;
# Single letters and consonant digraphs, in alphabetical order.
a → a ;
â → ɨ ;
ă → ə ;
b → b ;
# The digraph "ch" is listed before the single-letter "c" rules so it is tried first.
ch → k ;
# "c" directly before e or i (the vowel is context only and is not consumed).
# \u0361 is COMBINING DOUBLE INVERTED BREVE, the IPA tie bar joining the affricate.
{c} [ei] → t\u0361ʃ ;
c → k ;
d → d ;
e → e ;
f → f ;
# Same pattern as for "c": digraph first, then the e/i context rule, then the default.
gh → ɡ ;
{g} [ei] → d\u0361ʒ ;
g → ɡ ;
h → h ;
i → i ;
î → ɨ ;
j → ʒ ;
k → k ;
l → l ;
m → m ;
# "ng" is listed before plain "n" so the two-letter sequence is tried first.
ng → ŋ ;
n → n ;
o → o ;
p → p ;
q → k ;
r → r ;
s → s ;
# Both the cedilla and the comma-below spellings of s and t are accepted.
ş → ʃ ;
ș → ʃ ;
t → t ;
ţ → t\u0361s ;
ț → t\u0361s ;
u → u ;
v → v ;
x → ks ;
y → i ;
z → z ;
# Any run of one or more punctuation characters becomes a single space.
[:P:]+ → ' ';
# Romanian does not have any gemination.
# https://en.wikipedia.org/wiki/Gemination#Latin_and_Romance_languages
# "::null" ends the preceding rule set, so the rules below run as a separate
# pass over the IPA text produced by the rules above. Each pattern "xx+"
# matches two or more consecutive copies of a symbol and replaces the whole
# run with a single copy.
::null;
pp+ → p;
bb+ → b;
tt+ → t;
dd+ → d;
kk+ → k;
ɡɡ+ → ɡ;
ff+ → f;
vv+ → v;
hh+ → h;
ss+ → s;
zz+ → z;
ʃʃ+ → ʃ;
ʒʒ+ → ʒ;
rr+ → r;
ll+ → l;
jj+ → j;
ww+ → w;
|