Home | History | Annotate | Download | only in transforms
      1 <?xml version="1.0" encoding="UTF-8" ?>
      2 <!DOCTYPE supplementalData SYSTEM "../../common/dtd/ldmlSupplemental.dtd">
      3 <!--
      4 Copyright © 1991-2013 Unicode, Inc.
      5 CLDR data files are interpreted according to the LDML specification (http://unicode.org/reports/tr35/)
      6 For terms of use, see http://www.unicode.org/copyright.html
      7 -->
      8 <supplementalData>
      9 	<version number="$Revision: 13787 $"/>
     10 	<transforms>
     11 		<transform source="fa" target="fa_Latn" variant="BGN" direction="forward" draft="contributed" alias="Persian-Latin/BGN fa-Latn-t-fa-m0-bgn">
     12 			<tRule><![CDATA[
     13 #
     14 ########################################################################
     15 # BGN/PCGN 1958 System
     16 #
     17 # This system was adopted by the BGN in 1946 and by the PCGN in 1958.
     18 # It is used for the romanization of geographic names in Iran and
     19 # for Persian-language names in Afghanistan.
     20 #
     21 # Originally prepared by Michael Everson <everson (a] evertype.com>
     22 ########################################################################
     23 #
     24 # MINIMAL FILTER: Persian-Latin
     25 #
     26 
     27 :: [[:arabic:][:block=ARABIC:][]] ;
     28 :: NFKD (NFC) ;
     29 #
     30 #
     31 ########################################################################
     32 
     33 
     34 #
     35 ########################################################################
     36 #
     37 # Define All Transformation Variables
     38 #
     39 ########################################################################
     40 #
     41 
     42 $alef = ;
     43 $ayin = ;
     44 $disambig =   ;
     45 #
     46 #
     47 # Use this $wordBoundary until bug 2034 is fixed in ICU:
     48 # http://bugs.icu-project.org/cgi-bin/icu-bugs/transliterate?id=2034;expression=boundary;user=guest
     49 #
     50 
     51 $wordBoundary =  [^[:L:][:M:][:N:]] ;
     52 #
     53 #
     54 ########################################################################
     55 
     56 # non-letters
     57 [:Nd:]{}[:Nd:]  [:Nd:]{','}[:Nd:] ; # ARABIC DECIMAL SEPARATOR
     58 [:Nd:]{}[:Nd:]  [:Nd:]{'.'}[:Nd:] ; # ARABIC THOUSANDS SEPARATOR
     59   ',' $disambig ; # ARABIC DECIMAL SEPARATOR
     60   '.' $disambig ; # ARABIC THOUSANDS SEPARATOR
     61 #    ; # ARABIC FIVE POINTED STAR // no need to transliterate
     62   ',' ; # ARABIC COMMA
     63   ';' ; # ARABIC SEMICOLON
     64   '?' ; # ARABIC QUESTION MARK
     65   '%' ; # ARABIC PERCENT SIGN
     66   0 $disambig ; # ARABIC-INDIC DIGIT ZERO
     67   1 $disambig ; # ARABIC-INDIC DIGIT ONE
     68   2 $disambig ; # ARABIC-INDIC DIGIT TWO
     69   3 $disambig ; # ARABIC-INDIC DIGIT THREE
     70   4 $disambig ; # ARABIC-INDIC DIGIT FOUR
     71   5 $disambig ; # ARABIC-INDIC DIGIT FIVE
     72   6 $disambig ; # ARABIC-INDIC DIGIT SIX
     73   7 $disambig ; # ARABIC-INDIC DIGIT SEVEN
     74   8 $disambig ; # ARABIC-INDIC DIGIT EIGHT
     75   9 $disambig ; # ARABIC-INDIC DIGIT NINE
     76   0 ; # EXTENDED ARABIC-INDIC DIGIT ZERO
     77   1 ; # EXTENDED ARABIC-INDIC DIGIT ONE
     78   2 ; # EXTENDED ARABIC-INDIC DIGIT TWO
     79   3 ; # EXTENDED ARABIC-INDIC DIGIT THREE
     80   4 ; # EXTENDED ARABIC-INDIC DIGIT FOUR
     81   5 ; # EXTENDED ARABIC-INDIC DIGIT FIVE
     82   6 ; # EXTENDED ARABIC-INDIC DIGIT SIX
     83   7 ; # EXTENDED ARABIC-INDIC DIGIT SEVEN
     84   8 ; # EXTENDED ARABIC-INDIC DIGIT EIGHT
     85   9 ; # EXTENDED ARABIC-INDIC DIGIT NINE
     86 
     87 #
     88 ########################################################################
     89 #
     90 # Rules moved to front to avoid masking
     91 #
     92 ########################################################################
     93 
     94 
     95 #
     96 ########################################################################
     97 #
     98 # BGN Page 89 Rule 4
     99 #
    100 # The character sequences كه , زه , سه , and گه may be romanized k·h, z·h,
    101 # s·h, and g·h in order to differentiate those romanizations from the
    102 # digraphs kh, zh, sh, and gh.
    103 #
    104 ########################################################################
    105 #
    106 
    107   kh ; # ARABIC LETTER KAF + HEH
    108   zh ; # ARABIC LETTER ZAIN + HEH
    109   sh ; # ARABIC LETTER SEEN + HEH
    110   gh ; # ARABIC LETTER GAF + HEH
    111 #
    112 #
    113 ########################################################################
    114 #
    115 # End Rule 4
    116 #
    117 ########################################################################
    118 
    119 
    120 
    121 #
    122 ########################################################################
    123 #
    124 # BGN Page 91 Rule 7
    125 #
    126 # Doubled consonant sounds are represented in Arabic script by
    127 # placing a shaddah ( ّ ) over a consonant character. In romanization
    128 # the letter should be doubled. [The remainder of this rule deals with
    129 # the definite article and is lexical.]
    130 #
    131 ########################################################################
    132 #
    133 
    134   bb ; # ARABIC LETTER BEH + SHADDA
    135   pp ; # ARABIC LETTER PEH + SHADDA
    136   tt ; # ARABIC LETTER TEH + SHADDA
    137   ss ; # ARABIC LETTER THEH + SHADDA
    138   jj ; # ARABIC LETTER JEEM + SHADDA
    139   chch ; # ARABIC LETTER TCHEH + SHADDA
    140    ; # ARABIC LETTER HAH + SHADDA
    141   khkh ; # ARABIC LETTER KHAH + SHADDA
    142   dd ; # ARABIC LETTER DAL + SHADDA
    143   zz ; # ARABIC LETTER THAL + SHADDA
    144   rr ; # ARABIC LETTER REH + SHADDA
    145   zz ; # ARABIC LETTER ZAIN + SHADDA
    146   zhzh ; # ARABIC LETTER JEH + SHADDA
    147   ss ; # ARABIC LETTER SEEN + SHADDA
    148   shsh ; # ARABIC LETTER SHEEN + SHADDA
    149    ; # ARABIC LETTER SAD + SHADDA
    150    ; # ARABIC LETTER DAD + SHADDA
    151    ; # ARABIC LETTER TAH + SHADDA
    152    ; # ARABIC LETTER ZAH + SHADDA
    153   $ayin $ayin ; # ARABIC LETTER AIN + SHADDA
    154   ghgh ; # ARABIC LETTER GHAIN + SHADDA
    155   ff ; # ARABIC LETTER FEH + SHADDA
    156   qq ; # ARABIC LETTER QAF + SHADDA
    157   kk ; # ARABIC LETTER KAF + SHADDA
    158   ll ; # ARABIC LETTER LAM + SHADDA
    159   mm ; # ARABIC LETTER MEEM + SHADDA
    160   nn ; # ARABIC LETTER NOON + SHADDA
    161   hh ; # ARABIC LETTER HEH + SHADDA
    162   ww ; # ARABIC LETTER WAW + SHADDA
    163   yy ; # ARABIC LETTER FARSI YEH + SHADDA
    164 #
    165 #
    166 ########################################################################
    167 #
    168 # End Rule 7
    169 #
    170 ########################################################################
    171 
    172 
    173 
    174 #
    175 ########################################################################
    176 #
    177 # Start of Transformations
    178 #
    179 ########################################################################
    180 #
    181 
    182 $wordBoundary{   ; # ARABIC LETTER HAMZA
    183   $alef ; # ARABIC LETTER HAMZA
    184 $wordBoundary{   ; # ARABIC LETTER ALEF
    185   $alef  ; # ARABIC FATHA ALEF WITH MADDA ABOVE
    186   b ; # ARABIC LETTER BEH
    187   p ; # ARABIC LETTER PEH
    188   t ; # ARABIC LETTER TEH
    189   h ; # ARABIC LETTER TEH MARBUTA
    190   s ; # ARABIC LETTER THEH
    191   j ; # ARABIC LETTER JEEM
    192   ch ; # ARABIC LETTER TCHEH
    193    ; # ARABIC LETTER HAH
    194   kh ; # ARABIC LETTER KHAH
    195   d ; # ARABIC LETTER DAL
    196   z ; # ARABIC LETTER THAL
    197   r ; # ARABIC LETTER REH
    198   z ; # ARABIC LETTER ZAIN
    199   zh ; # ARABIC LETTER JEH
    200   s ; # ARABIC LETTER SEEN
    201   sh ; # ARABIC LETTER SHEEN
    202    ; # ARABIC LETTER SAD
    203    ; # ARABIC LETTER DAD
    204    ; # ARABIC LETTER TAH
    205    ; # ARABIC LETTER ZAH
    206   $ayin ; # ARABIC LETTER AIN
    207   gh ; # ARABIC LETTER GHAIN
    208   f ; # ARABIC LETTER FEH
    209   q ; # ARABIC LETTER QAF
    210   k ; # ARABIC LETTER KEHEH
    211   k $disambig ; # ARABIC LETTER KAF
    212   g ; # ARABIC LETTER GAF
    213   l ; # ARABIC LETTER LAM
    214   m ; # ARABIC LETTER MEEM
    215   n ; # ARABIC LETTER NOON
    216   h ; # ARABIC LETTER HEH
    217   v ; # ARABIC LETTER WAW
    218   y ; # ARABIC LETTER FARSI YEH
    219 
    220    ; # ARABIC FATHA + ALEF
    221    ; # ARABIC FATHA + FARSI YEH
    222   ow ; # ARABIC FATHA + WAW + SUKUN
    223   a ; # ARABIC FATHA
    224 
    225    ; # ARABIC KASRA + YEH
    226   e ; # ARABIC KASRA
    227 
    228    ; # ARABIC DAMMA + WAW
    229   o ; # ARABIC DAMMA
    230 
    231    ; # ARABIC SUKUN
    232 ::NFC (NFD) ;
    233 
    234 #
    235 #
    236 ########################################################################
    237 
    238 			]]></tRule>
    239 		</transform>
    240 	</transforms>
    241 </supplementalData>
    242