148 lines
		
	
	
		
			2.4 KiB
		
	
	
	
		
			XML
		
	
	
	
			
		
		
	
	
			148 lines
		
	
	
		
			2.4 KiB
		
	
	
	
		
			XML
		
	
	
	
| <?xml version="1.0" encoding="UTF-8" ?>
 | ||
| <!DOCTYPE supplementalData SYSTEM "../../common/dtd/ldmlSupplemental.dtd">
 | ||
| <!--
 | ||
| Copyright © 1991-2013 Unicode, Inc.
 | ||
| CLDR data files are interpreted according to the LDML specification (http://unicode.org/reports/tr35/)
 | ||
| For terms of use, see http://www.unicode.org/copyright.html
 | ||
| -->
 | ||
| <supplementalData>
 | ||
| 	<version number="$Revision$"/>
 | ||
| 	<transforms>
 | ||
| 		<transform source="ro" target="ro_FONIPA" direction="forward" alias="ro-fonipa-t-ro">
 | ||
| 			<tRule><![CDATA[
 | ||
| # Romanian orthography to phonemic transcription.
 | ||
| # https://en.wikipedia.org/wiki/Romanian_phonology
 | ||
| #
 | ||
| # TODO: Currently this transform does not palatalize consonants.
 | ||
| 
 | ||
| # Character classes used as rule context below.
 | ||
| # $VowelEI and $VowelAOU are only used to build $Vowel in this rule set.
 | ||
| $VowelEI = [e i î];
 | ||
| $VowelAOU = [a â ă o u];
 | ||
| $Vowel = [$VowelEI $VowelAOU];
 | ||
| # $Boundary: any character that is not a letter, mark, or number.
 | ||
| $Boundary =  [^[:L:][:M:][:N:]];
 | ||
| 
 | ||
| # Normalize to NFC and lowercase first; the rules below are written against
 | ||
| # precomposed, lowercase letters only.
 | ||
| :: NFC () ;
 | ||
| :: Lower () ;
 | ||
| 
 | ||
| # Special cases.
 | ||
| # Placed before the triphthong rules so that "eoai" is not split as "eoa" + "i".
 | ||
| eoai → eo̯aj ;  # e.g. leoaică → /leo̯ajkə/, not /le̯o̯aikə/
 | ||
| 
 | ||
| # Triphthongs.
 | ||
| # Listed before the diphthong rules so that the longer vowel sequence is matched first.
 | ||
| # \- matches a literal hyphen in the spelling (e.g. "i-ai"); the hyphen is dropped in the output.
 | ||
| eai → e̯aj ;
 | ||
| eau → e̯aw ;
 | ||
| eoa → e̯o̯a ;
 | ||
| i\-ai → jaj ;
 | ||
| ia\-i → jaj ;
 | ||
| iau → jaw ;
 | ||
| iei → jej ;
 | ||
| ieu → jew ;
 | ||
| # "eu" directly after a $Boundary character gets an initial glide (jew);
 | ||
| # elsewhere the diphthong rule eu → ew applies.
 | ||
| # NOTE(review): confirm this also fires at the very start of the input text.
 | ||
| $Boundary {eu} → jew ;
 | ||
| ioa → jo̯a ;
 | ||
| ioi → joj ;
 | ||
| i\-oi → joj ;
 | ||
| iou → jow ;
 | ||
| oai → o̯aj ;
 | ||
| uai → waj ;
 | ||
| uau → waw ;
 | ||
| uăi → wəj ;
 | ||
| 
 | ||
| # Diphthongs.
 | ||
| # Two-letter vowel sequences; rules with a look-ahead context (text after "}")
 | ||
| # are listed before the unconditional rule for the same letters.
 | ||
| ai → aj ;
 | ||
| âi → ɨj ;
 | ||
| ăi → əj ;
 | ||
| # Before "r", "au" stays as two full vowels instead of becoming aw.
 | ||
| au} r → au ;
 | ||
| au → aw ;
 | ||
| âu → ɨw ;
 | ||
| ău → əw ;
 | ||
| ea → e̯a ;
 | ||
| ei → ej ;
 | ||
| eo → e̯o ;
 | ||
| e\-o → e̯o ;
 | ||
| eu → ew ;
 | ||
| e\-u → e̯u ;
 | ||
| ia → ja ;
 | ||
| i\-a → ja ;
 | ||
| ie → je ;
 | ||
| ii → ij ;
 | ||
| io → jo ;
 | ||
| # "iu" followed by a vowel or a boundary character → iw; any other "iu" → ju.
 | ||
| iu} [$Vowel $Boundary] → iw ;
 | ||
| iu → ju ;
 | ||
| oa → o̯a ;
 | ||
| oi → oj ;
 | ||
| ou → ow ;
 | ||
| ua → wa ;
 | ||
| uâ → wɨ ;
 | ||
| uă → wə ;
 | ||
| ue → we ;
 | ||
| ui → uj ;
 | ||
| uu → uw ;
 | ||
| 
 | ||
| # Single letters and consonant digraphs, in alphabetical order.
 | ||
| # Vowels reach these rules only when no triphthong/diphthong rule above matched.
 | ||
| a → a ;
 | ||
| â → ɨ ;
 | ||
| ă → ə ;
 | ||
| b → b ;
 | ||
| # "ch" → k; "c" followed by e or i → t͡ʃ; every other "c" → k.
 | ||
| ch → k ;
 | ||
| {c} [ei] → t͡ʃ ;
 | ||
| c → k ;
 | ||
| d → d ;
 | ||
| e → e ;
 | ||
| f → f ;
 | ||
| # "gh" → ɡ; "g" followed by e or i → d͡ʒ; every other "g" → ɡ.
 | ||
| gh → ɡ ;
 | ||
| {g} [ei] → d͡ʒ ;
 | ||
| g → ɡ ;
 | ||
| h → h ;
 | ||
| i → i ;
 | ||
| î → ɨ ;
 | ||
| j → ʒ ;
 | ||
| k → k ;
 | ||
| l → l ;
 | ||
| m → m ;
 | ||
| # NOTE(review): "ng" becomes a single ŋ with no following ɡ — confirm this is intended.
 | ||
| ng → ŋ ;
 | ||
| n → n ;
 | ||
| o → o ;
 | ||
| p → p ;
 | ||
| q → k ;
 | ||
| r → r ;
 | ||
| s → s ;
 | ||
| # Both the cedilla (ş, ţ) and the comma-below (ș, ț) encodings are handled.
 | ||
| ş → ʃ ;
 | ||
| ș → ʃ ;
 | ||
| t → t ;
 | ||
| ţ → t͡s ;
 | ||
| ț → t͡s ;
 | ||
| u → u ;
 | ||
| v → v ;
 | ||
| x → ks ;
 | ||
| y → i ;
 | ||
| z → z ;
 | ||
| # Any run of punctuation characters is replaced by a single space.
 | ||
| [:P:]+ → ' ';
 | ||
| 
 | ||
| # Romanian does not have any gemination.
 | ||
| # https://en.wikipedia.org/wiki/Gemination#Latin_and_Romance_languages
 | ||
| # "::null;" starts a new pass: the rules below run on the IPA output of the
 | ||
| # rules above, collapsing any run of the same consonant into a single one.
 | ||
| ::null;
 | ||
| # Plosives.
 | ||
| pp+ → p;
 | ||
| bb+ → b;
 | ||
| tt+ → t;
 | ||
| dd+ → d;
 | ||
| kk+ → k;
 | ||
| ɡɡ+ → ɡ;
 | ||
| 
 | ||
| # Fricatives.
 | ||
| ff+ → f;
 | ||
| vv+ → v;
 | ||
| hh+ → h;
 | ||
| 
 | ||
| ss+ → s;
 | ||
| zz+ → z;
 | ||
| ʃʃ+ → ʃ;
 | ||
| ʒʒ+ → ʒ;
 | ||
| 
 | ||
| # Liquids.
 | ||
| rr+ → r;
 | ||
| ll+ → l;
 | ||
| 
 | ||
| # Glides.
 | ||
| jj+ → j;
 | ||
| ww+ → w;
 | ||
| 
 | ||
| 			]]></tRule>
 | ||
| 		</transform>
 | ||
| 	</transforms>
 | ||
| </supplementalData>
 |