blob: 45f0d12bae666a550f482bd401fe1e252f6950b2 (
plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
|
# © 2016 and later: Unicode, Inc. and others.
# License & terms of use: http://www.unicode.org/copyright.html#License
#
# File: dv_dv_Latn_BGN.txt
# Generated from CLDR
#
# BGN/PCGN 1988 Agreement, with modifications 2009
#
# This romanization system supersedes the one which was approved by
# the BGN and the PCGN in 1972. This official system was submitted
# to the PCGN by the Maldivian government in 1987 and approved by BGN
# and PCGN in 1988. The system presented here reflects the 1988 Agreement
# with minor modifications introduced by the government of the Maldives
# in 2009.
#
# In our rules, we also convert Arabic punctuation characters to Latin.
# These appear to be used in Maldivian text, for example in the Universal
# Declaration of Human Rights.
# Global filter: only characters in this set are touched by the rules in this
# file: the Thaana block, the six Arabic punctuation marks converted at the
# end of the file, and U+FDF2 (the "Allah" ligature handled near the end of
# the consonant rules).
::[[:block=thaana:][،؛؟٪٫٬]\uFDF2] ;
# Normalize the input to NFD before the conversion rules run.
::NFD;
# Any character that is not a letter, mark, or number counts as a word boundary.
$wordBoundary = [^[:L:][:M:][:N:]] ;
# U+07A6..U+07AF: the ten vowel signs romanized in the Vowels section.
$vowel = [\u07A6-\u07AF] ;
# U+07B0 THAANA SUKUN.
$sukun = \u07B0 ;
# Any sign that may follow a consonant: sukun or one of the vowel signs.
$sign = [$sukun $vowel] ;
# ALIFU (U+0787) or SHAVIYANI (U+0781) followed by sukun. The consonant rules
# use this pair as a prefix and consume it together with the consonant.
$rule4 = [އށ] $sukun ; # see note 4
### Consonants
# Every letter below has a rule for the letter preceded by $rule4
# (ALIFU/SHAVIYANI + sukun), which is consumed together with the letter, and a
# rule for the letter on its own. In the $rule4 form a single-letter
# romanization is doubled (k → kk), while a digraph is prefixed with "h"
# instead (dh → hdh).
# HAA
$rule4 ހ → hh ;
ހ → h ;
# NOONU
# See note 5: "romanized n’ when appearing without any vowel or auxiliary sign"
# "} $sign" is trailing context: a vowel sign or sukun must follow, but it is
# not consumed by the rule. The rules without that context are the fallback
# that appends the apostrophe, so they have to stay after the contextual ones.
$rule4 ނ } $sign → nn ;
$rule4 ނ → nn\' ;
ނ } $sign → n ;
ނ → n\' ;
# RAA
$rule4 ރ → rr ;
ރ → r ;
# BAA
$rule4 ބ → bb ;
ބ → b ;
# LHAVIYANI
$rule4 ޅ → hlh ;
ޅ → lh;
# KAAFU
$rule4 ކ → kk ;
ކ → k ;
# VAAVU
$rule4 ވ → vv ;
ވ → v ;
# MEEMU
$rule4 މ → mm ;
މ → m ;
# FAAFU
$rule4 ފ → ff ;
ފ → f;
# DHAALU
$rule4 ދ → hdh ;
ދ → dh;
# THAA
# See note 6: "romanized iy when appearing in combination with a supercircle"
# The forms that include the trailing sukun are listed before the plain forms,
# which would otherwise match first and leave the sukun behind.
$rule4 ތ $sukun → hiy ;
$rule4 ތ → hth ;
# A preceding IBIFILI (\u07A8, romanized "i") is consumed as well, so the
# result is "iy" rather than "iiy".
\u07A8 ތ $sukun → iy ;
ތ $sukun → iy ;
ތ → th ;
# LAAMU
$rule4 ލ → ll ;
ލ → l ;
# GAAFU
$rule4 ގ → gg ;
ގ → g ;
# GNAVIYANI
$rule4 ޏ → hgn ;
ޏ → gn ;
# SEENU
$rule4 ސ → ss ;
ސ → s ;
# DAVIYANI
$rule4 ޑ → dd ;
ޑ → d ;
# ZAVIYANI
$rule4 ޒ → zz ;
ޒ → z ;
# TAVIYANI
$rule4 ޓ → tt ;
ޓ → t ;
# YAA
$rule4 ޔ → yy ;
ޔ → y ;
# PAVIYANI
$rule4 ޕ → pp ;
ޕ → p ;
# JAVIYANI
$rule4 ޖ → jj ;
ޖ → j ;
# CHAVIYANI
$rule4 ޗ → hch ;
ޗ → ch ;
### Borrowed Consonants (See Rule 7)
# Same two-rule pattern as the native consonants: the first rule of each pair
# consumes a preceding $rule4 (ALIFU/SHAVIYANI + sukun) together with the
# letter, the second handles the letter on its own. Single-letter
# romanizations are doubled; digraphs get an "h" prefix instead.
# SAADHU
$rule4 ޞ → şş ;
ޞ → ş ;
# SHEENU
$rule4 ޝ → hsh ;
ޝ → sh ;
# ZAA
# Same output as ZAVIYANI ("z"), so the two letters are not distinguished
# in the romanized text.
$rule4 ޜ → zz ;
ޜ → z;
# KHAA
$rule4 ޚ → hkh ;
ޚ → kh;
# HHAA
$rule4 ޙ → ḩḩ ;
ޙ → ḩ ;
# THAALU
# Same output as DHAALU ("dh").
$rule4 ޛ → hdh ;
ޛ → dh ;
# TTAA
# Same output as THAA ("th").
$rule4 ޘ → hth ;
ޘ → th ;
# WAAVU
$rule4 ޥ → ww ;
ޥ → w ;
# QAAFU
$rule4 ޤ → qq ;
ޤ → q ;
# GHAINU
$rule4 ޣ → hgh ;
ޣ → gh ;
# AINU
# The apostrophe is escaped so it is emitted literally.
$rule4 ޢ → \'\' ;
ޢ → \' ;
# ZO
# \u0327 is COMBINING CEDILLA, written as an escape after the base letter "z".
$rule4 ޡ → z\u0327z\u0327 ;
ޡ → z\u0327 ;
# TO
$rule4 ޠ → ţţ ;
ޠ → ţ ;
# DAADHU
$rule4 ޟ → ḑḑ ;
ޟ → ḑ ;
# NOTE: not in Maldivian BGN system, but for completeness of Thaana block
# NAA
# \u0332 is COMBINING LOW LINE, written as an escape after the base letter "n".
$rule4 ޱ → n\u0332n\u0332 ;
ޱ → n\u0332 ;
# Rule 4 in word-final position
# ALIFU/SHAVIYANI + sukun directly before a word boundary becomes "h". The
# boundary after "}" is trailing context only and is left in place.
$rule4 } $wordBoundary → h;
# SHAVIYANI (placed last to avoid masking)
# These rules come after every "$rule4 <consonant>" rule and after the
# word-final rule, which also start with SHAVIYANI and must get the first
# chance to match.
$rule4 ށ → hsh;
ށ → sh;
# Otherwise, these signs are not romanized elsewhere
# Whatever reaches this point unmatched is deleted: a leftover
# ALIFU/SHAVIYANI + sukun pair, a lone sukun, and a bare ALIFU.
$rule4 → ;
\u07B0 → ;
އ → ;
# NOTE: not in Maldivian BGN system, but common in names (e.g. Abdullah)
# When a vowel sign precedes the ligature U+FDF2, the output is the captured
# vowel sign followed by "llāh", without the initial "a" of "allāh". The "|"
# places the cursor before the replacement, so the vowel sign is then
# romanized by the vowel rules that follow.
($vowel) \uFDF2 → | $1 llāh ;
\uFDF2 → allāh;
### Vowels
# Each vowel sign maps to a fixed Latin string, independent of context.
\u07A6 → a; # ABAFILI
\u07A7 → aa; # AABAAFILI
\u07AC → e; # EBEFILI
\u07AD → ey; # EYBEYFILI
\u07A8 → i; # IBIFILI
\u07A9 → ee; # EEBEEFILI
\u07AE → o; # OBOFILI
\u07AF → oa; # OABOAFILI
\u07AA → u; # UBUFILI
\u07AB → oo; # OOBOOFILI
### Arabic punctuation
# Converted to the Latin equivalents. The replacements are quoted so that they
# are taken literally rather than as rule syntax. Note that both the Arabic
# comma and the Arabic thousands separator become ','.
، → ','; # U+060C ARABIC COMMA
؛ → ';'; # U+061B ARABIC SEMICOLON
؟ → '?'; # U+061F ARABIC QUESTION MARK
٪ → '%'; # U+066A ARABIC PERCENT SIGN
٫ → '.'; # U+066B ARABIC DECIMAL SEPARATOR
٬ → ','; # U+066C ARABIC THOUSANDS SEPARATOR
|