271 lines
		
	
	
		
			9.2 KiB
		
	
	
	
		
			XML
		
	
	
	
			
		
		
	
	
			271 lines
		
	
	
		
			9.2 KiB
		
	
	
	
		
			XML
		
	
	
	
| <?xml version="1.0" encoding="UTF-8" ?>
 | ||
| <!DOCTYPE supplementalData SYSTEM "../../common/dtd/ldmlSupplemental.dtd">
 | ||
| <!--
 | ||
| Copyright © 1991-2013 Unicode, Inc.
 | ||
| CLDR data files are interpreted according to the LDML specification (http://unicode.org/reports/tr35/)
 | ||
| For terms of use, see http://www.unicode.org/copyright.html
 | ||
| -->
 | ||
| <supplementalData>
 | ||
| 	<version number="$Revision$"/>
 | ||
| 	<transforms>
 | ||
| 		<transform source="ps" target="ps_Latn" variant="BGN" direction="forward" draft="contributed" alias="Pashto-Latin/BGN ps-Latn-t-ps-m0-bgn">
 | ||
| 			<tRule><![CDATA[
 | ||
| #
 | ||
| ########################################################################
 | ||
| # BGN/PCGN 1968 System
 | ||
| #
 | ||
| # This system was adopted in 1968 for the romanization of Pashto
 | ||
| # geographic names in Afghanistan. Persian names in Afghanistan are
 | ||
| # romanized in accordance with the Romanization System for Persian
 | ||
| # (BGN/PCGN 1958 System), shown on pages 87-92).
 | ||
| #
 | ||
| # Originally prepared by Michael Everson <everson@evertype.com>
 | ||
| ########################################################################
 | ||
| #
 | ||
| # MINIMAL FILTER: Pashto-Latin
 | ||
| #
 | ||
| 
 | ||
| :: [ءآابةتثجحخدذرزسشصضطظعغفقكلمنهوىئَُِّْ٠١٢٣٤٥٦٧٨٩ټپځڅچډړږژښگڰڼیۍې] ;
 | ||
| :: NFD (NFC) ;
 | ||
| #
 | ||
| #
 | ||
| ########################################################################
 | ||
| 
 | ||
| 
 | ||
| #
 | ||
| ########################################################################
 | ||
| #
 | ||
| # Define All Transformation Variables
 | ||
| #
 | ||
| ########################################################################
 | ||
| #
 | ||
| 
 | ||
| $alef = ’;
 | ||
| $ayin = ‘;
 | ||
| $disambig =  ̱ ;
 | ||
| #
 | ||
| #
 | ||
| # Use this $wordBoundary until bug 2034 is fixed in ICU:
 | ||
| # http://bugs.icu-project.org/cgi-bin/icu-bugs/transliterate?id=2034;expression=boundary;user=guest
 | ||
| #
 | ||
| 
 | ||
| $wordBoundary =  [^[:L:][:M:][:N:]] ;
 | ||
| #
 | ||
| #
 | ||
| ########################################################################
 | ||
| 
 | ||
| [:Nd:]{٫}[:Nd:] ↔ [:Nd:]{','}[:Nd:] ; # ARABIC DECIMAL SEPARATOR
 | ||
| [:Nd:]{٬}[:Nd:] ↔ [:Nd:]{'.'}[:Nd:] ; # ARABIC THOUSANDS SEPARATOR
 | ||
| ٫ ↔ ',' $disambig ; # ARABIC DECIMAL SEPARATOR
 | ||
| ٬ ↔ '.' $disambig ; # ARABIC THOUSANDS SEPARATOR
 | ||
| #  ٭ ↔ ; # ARABIC FIVE POINTED STAR // no need to transliterate
 | ||
| ، ↔ ',' ; # ARABIC COMMA
 | ||
| ؛ ↔ ';' ; # ARABIC SEMICOLON
 | ||
| ؟ ↔ '?' ; # ARABIC QUESTION MARK
 | ||
| ٪ ↔ '%' ; # ARABIC PERCENT SIGN
 | ||
| ٠ ↔ 0 $disambig ; # ARABIC-INDIC DIGIT ZERO
 | ||
| ١ ↔ 1 $disambig ; # ARABIC-INDIC DIGIT ONE
 | ||
| ٢ ↔ 2 $disambig ; # ARABIC-INDIC DIGIT TWO
 | ||
| ٣ ↔ 3 $disambig ; # ARABIC-INDIC DIGIT THREE
 | ||
| ٤ ↔ 4 $disambig ; # ARABIC-INDIC DIGIT FOUR
 | ||
| ٥ ↔ 5 $disambig ; # ARABIC-INDIC DIGIT FIVE
 | ||
| ٦ ↔ 6 $disambig ; # ARABIC-INDIC DIGIT SIX
 | ||
| ٧ ↔ 7 $disambig ; # ARABIC-INDIC DIGIT SEVEN
 | ||
| ٨ ↔ 8 $disambig ; # ARABIC-INDIC DIGIT EIGHT
 | ||
| ٩ ↔ 9 $disambig ; # ARABIC-INDIC DIGIT NINE
 | ||
| ۰ ↔ 0 ; # EXTENDED ARABIC-INDIC DIGIT ZERO
 | ||
| ۱ ↔ 1 ; # EXTENDED ARABIC-INDIC DIGIT ONE
 | ||
| ۲ ↔ 2 ; # EXTENDED ARABIC-INDIC DIGIT TWO
 | ||
| ۳ ↔ 3 ; # EXTENDED ARABIC-INDIC DIGIT THREE
 | ||
| ۴ ↔ 4 ; # EXTENDED ARABIC-INDIC DIGIT FOUR
 | ||
| ۵ ↔ 5 ; # EXTENDED ARABIC-INDIC DIGIT FIVE
 | ||
| ۶ ↔ 6 ; # EXTENDED ARABIC-INDIC DIGIT SIX
 | ||
| ۷ ↔ 7 ; # EXTENDED ARABIC-INDIC DIGIT SEVEN
 | ||
| ۸ ↔ 8 ; # EXTENDED ARABIC-INDIC DIGIT EIGHT
 | ||
| ۹ ↔ 9 ; # EXTENDED ARABIC-INDIC DIGIT NINE
 | ||
| 
 | ||
| #
 | ||
| ########################################################################
 | ||
| #
 | ||
| # Rules moved to front to avoid masking
 | ||
| #
 | ||
| ########################################################################
 | ||
| 
 | ||
| 
 | ||
| #
 | ||
| ########################################################################
 | ||
| #
 | ||
| # BGN Page 89 Rule 4
 | ||
| #
 | ||
| # The character sequences كه , زه , سه , and گه may be romanized k·h, z·h,
 | ||
| # s·h, and g·h in order to differentiate those romanizations from the
 | ||
| # digraphs kh, zh, sh, and gh.
 | ||
| #
 | ||
| ########################################################################
 | ||
| #
 | ||
| 
 | ||
| كه → k·h ; # ARABIC LETTER KAF + HEH
 | ||
| زه → z·h ; # ARABIC LETTER ZAIN + HEH
 | ||
| سه → s·h ; # ARABIC LETTER SEEN + HEH
 | ||
| گه → g·h ; # ARABIC LETTER GAF + HEH
 | ||
| #
 | ||
| #
 | ||
| ########################################################################
 | ||
| #
 | ||
| # End Rule 4
 | ||
| #
 | ||
| ########################################################################
 | ||
| 
 | ||
| 
 | ||
| 
 | ||
| #
 | ||
| ########################################################################
 | ||
| #
 | ||
| # BGN Page 91 Rule 7
 | ||
| #
 | ||
| # Doubles consonant sounds are represented in Arabic script by
 | ||
| # placing a shaddah ( ّ ) over a consonant character. In romanization
 | ||
| # the letter should be doubled. [The remainder of this rule deals with
 | ||
| # the definite article and is lexical.]
 | ||
| #
 | ||
| ########################################################################
 | ||
| #
 | ||
| 
 | ||
| بّ → bb ; # ARABIC LETTER BEH + SHADDA
 | ||
| پّ → pp ; # ARABIC LETTER PEH + SHADDA
 | ||
| تّ → tt ; # ARABIC LETTER TEH + SHADDA
 | ||
| ټّ → ṯṯ ; # ARABIC LETTER TEH WITH RING + SHADDA
 | ||
| ثّ → s̄s̄ ; # ARABIC LETTER THEH + SHADDA
 | ||
| جّ → jj ; # ARABIC LETTER JEEM + SHADDA
 | ||
| چّ → chch ; # ARABIC LETTER TCHEH + SHADDA
 | ||
| ّڅ → tsts ; # ARABIC LETTER HAH WITH THREE DOTS ABOVE + SHADDA
 | ||
| ّځ → dz ; # ARABIC LETTER HAH WITH HAMZA ABOVE + SHADDA
 | ||
| حّ → ḥḥ ; # ARABIC LETTER HAH + SHADDA
 | ||
| خّ → khkh ; # ARABIC LETTER KHAH + SHADDA
 | ||
| دّ → dd ; # ARABIC LETTER DAL + SHADDA
 | ||
| ّډ → ḏḏ ; # ARABIC LETTER DAL WITH RING + SHADDA
 | ||
| ذّ → z̄z̄ ; # ARABIC LETTER THAL + SHADDA
 | ||
| رّ → rr ; # ARABIC LETTER REH + SHADDA
 | ||
| ّړ → ṟṟ ; # ARABIC LETTER REH WITH RING + SHADDA
 | ||
| زّ → zz ; # ARABIC LETTER ZAIN + SHADDA
 | ||
| ژّ → zhzh ; # ARABIC LETTER JEH + SHADDA
 | ||
| ّژ → z͟hz͟h ; # ARABIC LETTER REH WITH DOT BELOW AND DOT ABOVE + SHADDA
 | ||
| سّ → ss ; # ARABIC LETTER SEEN + SHADDA
 | ||
| شّ → shsh ; # ARABIC LETTER SHEEN + SHADDA
 | ||
| ّښ → s͟hs͟h ; # ARABIC LETTER SEEN WITH DOT BELOW AND DOT ABOVE
 | ||
| صّ → ṣṣ ; # ARABIC LETTER SAD + SHADDA
 | ||
| ضّ → ḍḍ ; # ARABIC LETTER DAD + SHADDA
 | ||
| طّ → ṭṭ ; # ARABIC LETTER TAH + SHADDA
 | ||
| ظّ → ẓẓ ; # ARABIC LETTER ZAH + SHADDA
 | ||
| عّ → $ayin $ayin ; # ARABIC LETTER AIN + SHADDA
 | ||
| غّ → ghgh ; # ARABIC LETTER GHAIN + SHADDA
 | ||
| فّ → ff ; # ARABIC LETTER FEH + SHADDA
 | ||
| قّ → qq ; # ARABIC LETTER QAF + SHADDA
 | ||
| كّ → kk ; # ARABIC LETTER KAF + SHADDA
 | ||
| ّگ → gg ; # ARABIC LETTER GAF + SHADDA
 | ||
| ّڰ → gg ; # ARABIC LETTER GAF WITH RING + SHADDA
 | ||
| لّ → ll ; # ARABIC LETTER LAM + SHADDA
 | ||
| مّ → mm ; # ARABIC LETTER MEEM + SHADDA
 | ||
| نّ → nn ; # ARABIC LETTER NOON + SHADDA
 | ||
| ّڼ → ṉṉ ; # ARABIC LETTER NOON WITH RING + SHADDA
 | ||
| هّ → hh ; # ARABIC LETTER HEH + SHADDA
 | ||
| وّ → ww ; # ARABIC LETTER WAW + SHADDA
 | ||
| ّی → yy ; # ARABIC LETTER FARSI YEH + SHADDA
 | ||
| ىّ → yy ; # ARABIC LETTER YEH + SHADDA
 | ||
| #
 | ||
| #
 | ||
| ########################################################################
 | ||
| #
 | ||
| # End Rule 7
 | ||
| #
 | ||
| ########################################################################
 | ||
| 
 | ||
| 
 | ||
| 
 | ||
| #
 | ||
| ########################################################################
 | ||
| #
 | ||
| # Start of Transformations
 | ||
| #
 | ||
| ########################################################################
 | ||
| #
 | ||
| 
 | ||
| $wordBoundary{ء →  ; # ARABIC LETTER HAMZA
 | ||
| ء → $alef ; # ARABIC LETTER HAMZA
 | ||
| $wordBoundary{ا →  ; # ARABIC LETTER ALEF
 | ||
| آ → $alef ā ; # ARABIC LETTER ALEF WITH MADDA ABOVE
 | ||
| ب → b ; # ARABIC LETTER BEH
 | ||
| پ → p ; # ARABIC LETTER PEH
 | ||
| ت → t ; # ARABIC LETTER TEH
 | ||
| ټ → ṯ ; # ARABIC LETTER TEH WITH RING
 | ||
| ة → h ; # ARABIC LETTER TEH MARBUTA
 | ||
| ث → s̄ ; # ARABIC LETTER THEH
 | ||
| ج → j ; # ARABIC LETTER JEEM
 | ||
| چ → ch ; # ARABIC LETTER TCHEH
 | ||
| څ → ts ; # ARABIC LETTER HAH WITH THREE DOTS ABOVE
 | ||
| ځ → dz ; # ARABIC LETTER HAH WITH HAMZA ABOVE
 | ||
| ح → ḥ ; # ARABIC LETTER HAH
 | ||
| خ → kh ; # ARABIC LETTER KHAH
 | ||
| د → d ; # ARABIC LETTER DAL
 | ||
| ډ → ḏ ; # ARABIC LETTER DAL WITH RING
 | ||
| ذ → z̄ ; # ARABIC LETTER THAL
 | ||
| ر → r ; # ARABIC LETTER REH
 | ||
| ړ → ṟ ; # ARABIC LETTER REH WITH RING
 | ||
| ز → z ; # ARABIC LETTER ZAIN
 | ||
| ژ → zh ; # ARABIC LETTER JEH
 | ||
| ږ → z͟h ; # ARABIC LETTER REH WITH DOT BELOW AND DOT ABOVE
 | ||
| س → s ; # ARABIC LETTER SEEN
 | ||
| ش → sh ; # ARABIC LETTER SHEEN
 | ||
| ښ → s͟h ; # ARABIC LETTER SEEN WITH DOT BELOW AND DOT ABOVE
 | ||
| ص → ṣ ; # ARABIC LETTER SAD
 | ||
| ض → ẕ ; # ARABIC LETTER DAD
 | ||
| ط → ṭ ; # ARABIC LETTER TAH
 | ||
| ظ → ẓ ; # ARABIC LETTER ZAH
 | ||
| ع → $ayin ; # ARABIC LETTER AIN
 | ||
| غ → gh ; # ARABIC LETTER GHAIN
 | ||
| ف → f ; # ARABIC LETTER FEH
 | ||
| ق → q ; # ARABIC LETTER QAF
 | ||
| ك → k ; # ARABIC LETTER KAF
 | ||
| گ → g ; # ARABIC LETTER GAF
 | ||
| ڰ → g ; # ARABIC LETTER GAF WITH RING
 | ||
| ل → l ; # ARABIC LETTER LAM
 | ||
| م → m ; # ARABIC LETTER MEEM
 | ||
| ن → n ; # ARABIC LETTER NOON
 | ||
| ڼ → ṉ ; # ARABIC LETTER NOON WITH RING
 | ||
| و → w ; # ARABIC LETTER WAW
 | ||
| ه → h ; # ARABIC LETTER HEH
 | ||
| ٔی → ey ; # ARABIC LETTER FARSI YEH + HAMZA ABOVE
 | ||
| ی → y ; # ARABIC LETTER FARSI YEH
 | ||
| ى → y ; # ARABIC LETTER YEH
 | ||
| ې → e ; # ARABIC LETTER E
 | ||
| 
 | ||
| َا → ā ; # ARABIC FATHA + ALEF
 | ||
| َىْ → ay ; # ARABIC FATHA + FARSI YEH + SUKUN
 | ||
| َى → á ; # ARABIC FATHA + ALEF MAKSURA
 | ||
| َْۍ → êy ; # ARABIC FATHA + SUKUN + YEH WITH TAIL
 | ||
| َْ → ê ; # ARABIC FATHA + SUKUN
 | ||
| َ → a ; # ARABIC FATHA
 | ||
| 
 | ||
| ِْي → ey ; # ARABIC KASRA + FARSI YEH + SUKUN
 | ||
| ِي → ī ; # ARABIC KASRA + FARSI YEH
 | ||
| ِى → ī ; # ARABIC KASRA + YEH
 | ||
| ِو → ew ; # ARABIC KASRA + WAW
 | ||
| ِ → i ; # ARABIC KASRA
 | ||
| 
 | ||
| ُوْ → ow ; # ARABIC DAMMA + WAW + SUKUN
 | ||
| ُوی → ūy ; # ARABIC DAMMA + WAW + FARSI YEH
 | ||
| ُو → ū ; # ARABIC DAMMA + WAW
 | ||
| ُ → u ; # ARABIC DAMMA
 | ||
| 
 | ||
| ْ →  ; # ARABIC SUKUN
 | ||
| 
 | ||
| 
 | ||
| #
 | ||
| #
 | ||
| ########################################################################
 | ||
| 
 | ||
| 			]]></tRule>
 | ||
| 		</transform>
 | ||
| 	</transforms>
 | ||
| </supplementalData>
 |