148 lines
2.4 KiB
XML
148 lines
2.4 KiB
XML
<?xml version="1.0" encoding="UTF-8" ?>
<!DOCTYPE supplementalData SYSTEM "../../common/dtd/ldmlSupplemental.dtd">
<!--
Copyright © 1991-2013 Unicode, Inc.
CLDR data files are interpreted according to the LDML specification (http://unicode.org/reports/tr35/)
For terms of use, see http://www.unicode.org/copyright.html
-->
<supplementalData>
  <version number="$Revision$"/>
  <transforms>
    <transform source="ro" target="ro_FONIPA" direction="forward" alias="ro-fonipa-t-ro">
      <tRule><![CDATA[
# Romanian orthography to phonemic transcription.
# http://en.wikipedia.org/wiki/Romanian_phonology
#
# Rules are tried in the order written and the first one that matches at the
# current position is applied, so longer letter sequences are listed before
# the shorter sequences they contain (triphthongs, then diphthongs, then
# single letters).
#
# TODO: Currently this transform does not palatalize consonants.

# Vowel letters, kept as two sets and then combined.
$VowelEI = [e i î];
$VowelAOU = [a â ă o u];
$Vowel = [$VowelEI $VowelAOU];
# Any character that is not a letter, a mark, or a number.
$Boundary = [^[:L:][:M:][:N:]];

# Pre-processing: compose to NFC and lowercase, so the rules below only have
# to list lowercase letters. The empty () declares no inverse step.
:: NFC () ;
:: Lower () ;

# Special cases.
eoai → eo̯aj ; # e.g. leoaică → /leo̯ajkə/, not /le̯o̯aikə/

# Triphthongs.
# A literal hyphen (\-) inside a sequence is dropped from the output.
eai → e̯aj ;
eau → e̯aw ;
eoa → e̯o̯a ;
i\-ai → jaj ;
ia\-i → jaj ;
iau → jaw ;
iei → jej ;
ieu → jew ;
# "eu" directly after a $Boundary character gains a leading j.
$Boundary {eu} → jew ;
ioa → jo̯a ;
ioi → joj ;
i\-oi → joj ;
iou → jow ;
oai → o̯aj ;
uai → waj ;
uau → waw ;
uăi → wəj ;

# Diphthongs.
ai → aj ;
âi → ɨj ;
ăi → əj ;
# "au" followed by r keeps both full vowels; every other "au" becomes aw.
au} r → au ;
au → aw ;
âu → ɨw ;
ău → əw ;
ea → e̯a ;
ei → ej ;
eo → e̯o ;
e\-o → e̯o ;
eu → ew ;
e\-u → e̯u ;
ia → ja ;
i\-a → ja ;
ie → je ;
ii → ij ;
io → jo ;
# "iu" followed by a $Vowel or $Boundary character becomes iw; elsewhere ju.
iu} [$Vowel $Boundary] → iw ;
iu → ju ;
oa → o̯a ;
oi → oj ;
ou → ow ;
ua → wa ;
uâ → wɨ ;
uă → wə ;
ue → we ;
ui → uj ;
uu → uw ;

# Single letters and consonant digraphs.
a → a ;
â → ɨ ;
ă → ə ;
b → b ;
# ch is always k; a bare c is t͡ʃ when the next letter is e or i, otherwise k.
ch → k ;
{c} [ei] → t͡ʃ ;
c → k ;
d → d ;
e → e ;
f → f ;
# gh is always ɡ; a bare g is d͡ʒ when the next letter is e or i, otherwise ɡ.
gh → ɡ ;
{g} [ei] → d͡ʒ ;
g → ɡ ;
h → h ;
i → i ;
î → ɨ ;
j → ʒ ;
k → k ;
l → l ;
m → m ;
# NOTE(review): this consumes both letters, so no ɡ is emitted after ŋ and the
# {g} [ei] rule never sees the g of an "nge"/"ngi" sequence — confirm intended.
ng → ŋ ;
n → n ;
o → o ;
p → p ;
q → k ;
r → r ;
s → s ;
# ş/ș and ţ/ț: the cedilla and comma-below spellings map to the same sound.
ş → ʃ ;
ș → ʃ ;
t → t ;
ţ → t͡s ;
ț → t͡s ;
u → u ;
v → v ;
x → ks ;
y → i ;
z → z ;
# Any run of punctuation collapses to a single space.
[:P:]+ → ' ';

# Romanian does not have any gemination.
# https://en.wikipedia.org/wiki/Gemination#Latin_and_Romance_languages
# ::null closes the pass above, so the rules below run over its finished
# output and collapse each run of a repeated sound to a single one.
::null;
pp+ → p;
bb+ → b;
tt+ → t;
dd+ → d;
kk+ → k;
ɡɡ+ → ɡ;

ff+ → f;
vv+ → v;
hh+ → h;

ss+ → s;
zz+ → z;
ʃʃ+ → ʃ;
ʒʒ+ → ʒ;

rr+ → r;
ll+ → l;

jj+ → j;
ww+ → w;

]]></tRule>
    </transform>
  </transforms>
</supplementalData>