135 lines
		
	
	
		
			2.3 KiB
		
	
	
	
		
			XML
		
	
	
	
			
		
		
	
	
			135 lines
		
	
	
		
			2.3 KiB
		
	
	
	
		
			XML
		
	
	
	
| <?xml version="1.0" encoding="UTF-8" ?>
 | ||
| <!DOCTYPE supplementalData SYSTEM "../../common/dtd/ldmlSupplemental.dtd">
 | ||
| <!--
 | ||
| Copyright © 1991-2013 Unicode, Inc.
 | ||
| CLDR data files are interpreted according to the LDML specification (http://unicode.org/reports/tr35/)
 | ||
| For terms of use, see http://www.unicode.org/copyright.html
 | ||
| -->
 | ||
| <supplementalData>
 | ||
| 	<version number="$Revision$"/>
 | ||
| 	<transforms>
 | ||
| 		<transform source="pl" target="pl_FONIPA" direction="forward" alias="pl-fonipa-t-pl">
 | ||
| 			<tRule>
 | ||
| # Polish orthography to phonemic transcription (IPA).
 | ||
| # http://en.wikipedia.org/wiki/Polish_phonology
 | ||
| #
 | ||
| # Transform input to normalized form NFC, and to lowercase, so the rules below only need to list lowercase precomposed letters.
 | ||
| 
 | ||
| :: NFC () ;
 | ||
| :: Lower () ;
 | ||
| #
 | ||
| #
 | ||
| # Definitions. Both sets contain orthographic letters and are used as context in the rules that follow.
 | ||
| 
 | ||
| $voiceless = [cfhkpst];  # letters next to which a voiced consonant is written as its voiceless counterpart
 | ||
| $vowel = [ aąeęioóuy ];  # vowel letters; before one of these, "i" in ci/dzi/ni/si/zi is not output as a vowel
 | ||
| #
 | ||
| #
 | ||
| # Digraphs and Trigraphs.
 | ||
| # Listed before the single-letter rules so the longer spellings match first. "\u0361" is the tie bar joining the two halves of an affricate.
 | ||
| 
 | ||
| ch } i → ç ;  # before "i"; the "i" is lookahead context only and is not consumed
 | ||
| ch → x ;
 | ||
| ci } $vowel → t \u0361 ɕ ;  # before a vowel the "i" is dropped from the output
 | ||
| ci → t \u0361 ɕ i ;  # otherwise the "i" is kept
 | ||
| cz → t \u0361 ʂ ;
 | ||
| dzi } $vowel → d \u0361 ʑ ;  # before a vowel the "i" is dropped from the output
 | ||
| dzi → d \u0361 ʑ i ;  # otherwise the "i" is kept
 | ||
| dz } $voiceless → t \u0361 s ;  # devoiced before a voiceless letter
 | ||
| dz → d \u0361 z ;
 | ||
| dź } $voiceless → t \u0361 ɕ ;  # devoiced before a voiceless letter
 | ||
| dź → d \u0361 ʑ ;
 | ||
| dż } $voiceless → t \u0361 ʂ ;  # devoiced before a voiceless letter
 | ||
| dż → d \u0361 ʐ ;
 | ||
| kw → kf ;  # "w" is output as f after "k"
 | ||
| krw → krf ;  # same, with "r" in between
 | ||
| ni } $vowel → ɲ ;  # before a vowel the "i" is dropped from the output
 | ||
| ni → ɲ i ;  # otherwise the "i" is kept
 | ||
| $voiceless { rz → ʂ ;  # "rz" preceded by a voiceless sound (preceding context, not consumed)
 | ||
| rz } $voiceless → ʂ ;  # "rz" followed by a voiceless letter
 | ||
| rz → ʐ ;
 | ||
| sz → ʂ ;
 | ||
| trw → trf ;  # "w" is output as f after "tr"
 | ||
| tw → tf ;  # "w" is output as f after "t"
 | ||
| zi } $vowel → ʑ ;  # before a vowel the "i" is dropped from the output
 | ||
| zi → ʑ i ;  # otherwise the "i" is kept
 | ||
| #
 | ||
| # Single letters (and "si", which is handled here rather than with the digraphs above).
 | ||
| 
 | ||
| a → a ;
 | ||
| ą } [bp] → ɔm ;  # before these letters the nasal vowel is output as oral vowel + nasal consonant
 | ||
| ą } [kg] → ɔŋ ;
 | ||
| ą } [cdt] → ɔn ;
 | ||
| ą → ɔ̃ ;  # elsewhere: nasalized vowel
 | ||
| b } $voiceless → p ;  # devoiced before a voiceless letter
 | ||
| b → b ;
 | ||
| c → t \u0361 s ;
 | ||
| ć → t \u0361 ɕ ;
 | ||
| d } $voiceless → t ;  # devoiced before a voiceless letter
 | ||
| d → d ;
 | ||
| e → ɛ ;
 | ||
| ę } [bp] → ɛm ;  # before these letters the nasal vowel is output as oral vowel + nasal consonant
 | ||
| ę } [dt] → ɛn ;  # NOTE(review): the corresponding ą rule uses [cdt] — confirm that "c" is omitted here on purpose
 | ||
| ę } [gk] → ɛŋ ;
 | ||
| ę → ɛ̃;  # elsewhere: nasalized vowel
 | ||
| f → f ;
 | ||
| g } $voiceless → k ;  # devoiced before a voiceless letter
 | ||
| g → ɡ ;
 | ||
| h } i → ç ;  # same output as "ch" before "i"
 | ||
| h → x ;
 | ||
| i } $vowel → ʲ ;  # "i" before a vowel becomes a palatalization mark instead of a vowel
 | ||
| i → i ;
 | ||
| j → j ;
 | ||
| k } [bdzż] → ɡ ;  # voiced before these letters
 | ||
| k → k ;
 | ||
| l } i → ʎ ;  # before "i"; the "i" is lookahead context only and is not consumed
 | ||
| l → l ;
 | ||
| ł → w ;
 | ||
| m → m ;
 | ||
| n → n ;
 | ||
| ń → ɲ ;
 | ||
| o → ɔ ;
 | ||
| ó → u ;
 | ||
| r → r ;
 | ||
| si } $vowel → ɕ ;  # before a vowel the "i" is dropped from the output
 | ||
| si → ɕi ;  # otherwise the "i" is kept
 | ||
| s → s ;
 | ||
| ś → ɕ ;
 | ||
| t → t ;
 | ||
| u → u ;
 | ||
| w } $voiceless → f ;  # devoiced before a voiceless letter
 | ||
| w → v ;
 | ||
| y → ɨ ;
 | ||
| ź } $voiceless → ɕ ;  # devoiced before a voiceless letter
 | ||
| ź → ʑ ;
 | ||
| ż } $voiceless → ʂ ;  # devoiced before a voiceless letter
 | ||
| ż → ʐ ;
 | ||
| #
 | ||
| #
 | ||
| # Second pass: Phoneme-to-phone rules.
 | ||
| 
 | ||
| :: Null ;
 | ||
| # The ":: Null ;" statement above ends the first pass; the rules below operate on IPA output, not on Polish spelling.
 | ||
| # ʐ is devoiced to ʂ after t, p and x, and before the affricate t͡ʂ.
 | ||
| 
 | ||
| tʐ → tʂ ;
 | ||
| pʐ → pʂ ;
 | ||
| xʐ → xʂ ;
 | ||
| ʐt͡ʂ → ʂt͡ʂ ;
 | ||
| #
 | ||
| #
 | ||
| # Final de-voicing.
 | ||
| # A voiced obstruent directly before the end anchor [$] is replaced by its voiceless counterpart.
 | ||
| # Affricates are matched as a whole (base + tie bar U+0361 + base) so both halves are devoiced together;
 | ||
| # otherwise only the second half would match the single-sound rules, leaving a mixed d͡s / d͡ɕ / d͡ʂ.
 | ||
| # NOTE(review): [$] presumably matches only the very end of the text, so words followed by a space or
 | ||
| # punctuation are not devoiced by these rules — confirm whether that is intended.
 | ||
| 
 | ||
| b } [$] → p ;
 | ||
| d \u0361 z } [$] → t \u0361 s ;  # rydz → rɨt͡s
 | ||
| d \u0361 ʑ } [$] → t \u0361 ɕ ;  # łódź → wut͡ɕ
 | ||
| d \u0361 ʐ } [$] → t \u0361 ʂ ;  # brydż → brɨt͡ʂ
 | ||
| d } [$] → t ;
 | ||
| ɡ } [$] → k ;
 | ||
| v } [$] → f ;
 | ||
| ʐ } [$] → ʂ ;
 | ||
| ʑ } [$] → ɕ ;
 | ||
| z } [$] → s ;
 | ||
| 			</tRule>
 | ||
| 		</transform>
 | ||
| 	</transforms>
 | ||
| </supplementalData>
 |