Home | History | Annotate | Download | only in transforms
      1 <?xml version="1.0" encoding="UTF-8" ?>
      2 <!DOCTYPE supplementalData SYSTEM "../../common/dtd/ldmlSupplemental.dtd">
      3 <!--
      4 Copyright © 1991-2013 Unicode, Inc.
      5 CLDR data files are interpreted according to the LDML specification (http://unicode.org/reports/tr35/)
      6 For terms of use, see http://www.unicode.org/copyright.html
      7 -->
      8 <supplementalData>
      9 	<version number="$Revision: 12137 $"/>
     10 	<transforms>
     11 		<transform source="Latin" target="InterIndic" direction="forward" visibility="internal">
     12 			<tRule>
     13 # Latin-InterIndic
     14 #:: NFD;
     15 #\uE000 reserved
     16 #signs (chandrabindu, anusvara, visarga)
     17 $chandrabindu=\uE001;
     18 $anusvara=\uE002;
     19 $visarga=\uE003;
     20 #\uE004 reserved
     21 # wvowel represents the stand-alone form
     22 $wa=\uE005;
     23 $waa=\uE006;
     24 $wi=\uE007;
     25 $wii=\uE008;
     26 $wu=\uE009;
     27 $wuu=\uE00A;
     28 $wr=\uE00B;
     29 $wl=\uE00C;
     30 $wce=\uE00D; # LETTER CANDRA E
     31 $wse=\uE00E; # LETTER SHORT E
     32 $we=\uE00F;  #  LETTER E
     33 $wai=\uE010;
     34 $wco=\uE011; # LETTER CANDRA O
     35 $wso=\uE012; # LETTER SHORT O
     36 $wo=\uE013;  #  LETTER O
     37 $wau=\uE014;
     38 $ka=\uE015;
     39 $kha=\uE016;
     40 $ga=\uE017;
     41 $gha=\uE018;
     42 $nga=\uE019;
     43 $ca=\uE01A;
     44 $cha=\uE01B;
     45 $ja=\uE01C;
     46 $jha=\uE01D;
     47 $nya=\uE01E;
     48 $tta=\uE01F;
     49 $ttha=\uE020;
     50 $dda=\uE021;
     51 $ddha=\uE022;
     52 $nna=\uE023;
     53 $ta=\uE024;
     54 $tha=\uE025;
     55 $da=\uE026;
     56 $dha=\uE027;
     57 $na=\uE028;
     58 $ena=\uE029; #compatibility
     59 $pa=\uE02A;
     60 $pha=\uE02B;
     61 $ba=\uE02C;
     62 $bha=\uE02D;
     63 $ma=\uE02E;
     64 $ya=\uE02F;
     65 $ra=\uE030;
     66 $rra=\uE031;
     67 $la=\uE032;
     68 $lla=\uE033;
     69 $ela=\uE034; #compatibility
     70 $va=\uE035;
     71 $vva=\uE081;
     72 $sha=\uE036;
     73 $ssa=\uE037;
     74 $sa=\uE038;
     75 $ha=\uE039;
     76 #\u093A Reserved
     77 #\u093B Reserved
     78 $nukta=\uE03C;
     79 $avagraha=\uE03D; # SIGN AVAGRAHA
     80 # vowel represents the dependent form
     81 $aa=\uE03E;
     82 $i=\uE03F;
     83 $ii=\uE040;
     84 $u=\uE041;
     85 $uu=\uE042;
     86 $rh=\uE043;
     87 $rrh=\uE044;
     88 $ce=\uE045; #VOWEL SIGN CANDRA E
     89 $se=\uE046; #VOWEL SIGN SHORT E
     90 $e=\uE047;
     91 $ai=\uE048;
     92 $co=\uE049; # VOWEL SIGN CANDRA O
     93 $so=\uE04A; # VOWEL SIGN SHORT O
     94 $o=\uE04B;  # 
     95 $au=\uE04C;
     96 $virama=\uE04D;
     97 # \u094E Reserved
     98 # \u094F Reserved
     99 $om = \uE050; # OM
    100 # ;        # UNMAPPED STRESS SIGN UDATTA
    101 # ;        # UNMAPPED STRESS SIGN ANUDATTA
    102 # ;        # UNMAPPED GRAVE ACCENT
    103 # ;        # UNMAPPED ACUTE ACCENT
    104 $lm = \uE055;#  Telugu Length Mark
    105 $ailm=\uE056;#  AI Length Mark
    106 $aulm=\uE057;#  AU Length Mark
    107 #urdu compatibility forms
    108 $uka=\uE058;
    109 $ukha=\uE059;
    110 $ugha=\uE05A;
    111 $ujha=\uE05B;
    112 $uddha=\uE05C;
    113 $udha=\uE05D;
    114 $ufa=\uE05E;
    115 $uya=\uE05F;
    116 $wrr=\uE060;
    117 $wll=\uE061;
    118 $lh=\uE062;
    119 $llh=\uE063;
    120 $danda=\uE064;
    121 $doubleDanda=\uE065;
    122 $zero=\uE066;     # DIGIT ZERO
    123 $one=\uE067;      # DIGIT ONE
    124 $two=\uE068;      # DIGIT TWO
    125 $three=\uE069;    # DIGIT THREE
    126 $four=\uE06A;     # DIGIT FOUR
    127 $five=\uE06B;     # DIGIT FIVE
    128 $six=\uE06C;      # DIGIT SIX
    129 $seven=\uE06D;    # DIGIT SEVEN
    130 $eight=\uE06E;    # DIGIT EIGHT
    131 $nine=\uE06F;     # DIGIT NINE
    132 $dgs=\uE082;
    133 # For all other scripts
    134 $ecp0=\uE070;
    135 $ecp1=\uE071;
    136 $ecp2=\uE072;
    137 $ecp3=\uE073;
    138 $ecp4=\uE074;
    139 $ecp5=\uE075;
    140 $ecp6=\uE076;
    141 $ecp7=\uE077;
    142 $ecp8=\uE078;
    143 $ecp9=\uE079;
    144 $ecpA=\uE07A;
    145 $ecpB=\uE07B;
    146 $ecpC=\uE07C;
    147 $ecpD=\uE07D;
    148 $ecpE=\uE07E;
    149 $ecpF=\uE07F;
    150 # Khanda-ta
    151 $kta=\uE083;
    152 # ; # nothing in Latin maps to InterIndic ABBREVIATION SIGN
    153 $depVowelAbove=[\uE03E-\uE040\uE045-\uE04C];
    154 $depVowelBelow=[\uE041-\uE044];
    155 $endThing=[$danda$doubleDanda];
    156 # $x was originally called '§'; $z was '%'
    157 $x=[$virama$aa$ai$au$ii$i$uu$u$rrh$rh$lh$e$o$se$ce$so$co];
    158 $z=[bcdfghjklmnpqrstvwxyz];
    159 $consonants=[[$ka-$ha]$z[-][-][-][-][-][-][-][-][-]];
    160   $avagraha;
    161 $chandrabindu$anusvara;
    162 m$chandrabindu;
    163 h$visarga;
    164 x$ka$virama$sa;
    165 # convert to independent forms at start of word or syllable:
    166 # dependent forms for roundtrip
    167 a$aa;
    168 ai$ai;
    169 au$au;
    170 ii$ii;
    171 i$ii;
    172 i$i;
    173 u$uu;
    174 u$u;
    175 r$rrh;
    176 r$rh;
    177 l$llh;
    178 lh$lh;
    179 l$lh;
    180 e$e;
    181 o$o;
    182 a;
    183 e$ce;
    184 o$co;
    185 e$se;
    186 o$so;
    187 # preceded by consonants
    188 $consonants{ a$aa;
    189 $consonants{ ai$ai;
    190 $consonants{ au$au;
    191 $consonants{ ii$ii;
    192 $consonants{ i$ii;
    193 $consonants{ i$i;
    194 $consonants{ u$uu;
    195 $consonants{ u$u;
    196 $consonants{ r$rrh;
    197 $consonants{ ra$rh;
    198 $consonants{ r$rh;
    199 $consonants{ l$llh;
    200 $consonants{ lh$lh;
    201 $consonants{ l$lh;
    202 $consonants{ e$e;
    203 $consonants{ o$o;
    204 $consonants{ e$ce;
    205 $consonants{ o$co;
    206 $consonants{ e$se;
    207 $consonants{ o$so;
    208 # e.g. keai -> {ka}{e}{wai}; k'ai -> {ka}{wai}; (ai) -> ({wai})
    209 a$waa;
    210 ai$wai;
    211 au$wau;
    212 i$wii;
    213 i$wi;
    214 u$wuu;
    215 u$wu;
    216 r$wrr;
    217 r$wr;
    218 l$wll;
    219 lh$wl;
    220 l$wl;
    221 e$we;
    222 o$wo;
    223 a$wa;
    224 e$wce;
    225 o$wco;
    226 e$wse;
    227 ''om$om;
    228 o$wso;
    229 # rules for anusvara
    230 n}r            $na|$virama;
    231 n}l            $na|$virama;
    232 n}na                 $na|$virama;
    233 n}[kg]         $anusvara;
    234 n}n      $anusvara;
    235 n}[cj]         $anusvara;
    236 n}n      $anusvara;
    237 n}[tdn]  $anusvara;
    238 n}[tdn]              $anusvara;
    239 m}[pbm]              $anusvara;
    240 n}[ylvshr]           $anusvara;
    241 m              $anusvara;
    242 #urdu compatibility
    243 q$uka|$virama;
    244 kh$ukha |$virama;
    245 g $ugha | $virama;
    246 z  $ujha |$virama;
    247 f  $ufa|$virama;
    248 t$kta;
    249 # dev
    250 y$uya|$virama;
    251 l$ela|$virama;
    252 n$ena|$virama;
    253 n$nga|$virama;
    254 n$nya|$virama;
    255 n$nna|$virama;
    256 th$ttha|$virama;
    257 t$tta|$virama;
    258 rh$udha|$virama;
    259 r$uddha|$virama;
    260 dh$ddha|$virama;
    261 d$dda|$virama;
    262 kh$kha|$virama;
    263 k$ka|$virama;
    264 gh$gha|$virama;
    265 g$ga|$virama;
    266 ch$cha|$virama;
    267 c$ca|$virama;
    268 jh$jha|$virama;
    269 j$ja|$virama;
    270 ny$nya|$virama;
    271 tth$ttha|$virama;
    272 ddh$ddha|$virama;
    273 th$tha|$virama;
    274 t$ta|$virama;
    275 dh$dha|$virama;
    276 d$da|$virama;
    277 n$na|$virama;
    278 ph$pha|$virama;
    279 p$pa|$virama;
    280 bh$bha|$virama;
    281 b$ba|$virama;
    282 m$ma|$virama;
    283 y$ya|$virama;
    284 r$rra|$virama;
    285 r$ra|$virama;
    286 l$lla|$virama;
    287 l$la|$virama;
    288 v$va|$virama;
    289 w$vva|$virama;
    290 w$va|$virama;
    291 sh$sha|$virama;
    292 ss$ssa|$virama;
    293 s$ssa|$virama;
    294 s$sha|$virama;
    295 s$sa|$virama;
    296 h$ha|$virama;
    297 '.'$danda;
    298 $danda'.'$doubleDanda;
    299 $depVowelAbove{'~'$anusvara;
    300 $depVowelBelow{'~'$chandrabindu;
    301 # convert to dependent forms after consonant with no vowel:
    302 # e.g. kai -> {ka}{virama}ai -> {ka}{ai}
    303 #$virama aa$aa;
    304 $virama a$aa;
    305 $virama ai$ai;
    306 $virama au$au;
    307 $virama ii$ii;
    308 $virama i$ii;
    309 $virama i$i;
    310 #$virama uu$uu;
    311 $virama u$uu;
    312 $virama u$u;
    313 #$virama rrh$rrh;
    314 $virama r$rrh;
    315 #$virama rh$rh;
    316 $virama ra$rh;
    317 $virama r$rh;
    318 $virama l$llh;
    319 $virama lh$lh;
    320 $virama l$lh;
    321 $virama e$e;
    322 $virama o$o;
    323 $virama a;
    324 $virama e$ce;
    325 $virama o$co;
    326 $virama e$se;
    327 $virama o$so;
    328 # otherwise convert independent forms when separated by ': k'ai -> {ka}{virama}{wai}
    329 #$virama''aa$waa;
    330 $virama''a$waa;
    331 $virama''ai$wai;
    332 $virama''au$wau;
    333 #$virama''ii$wii;
    334 $virama''i$wii;
    335 $virama''i$wi;
    336 #$virama''uu$wuu;
    337 $virama''u$wuu;
    338 $virama''u$wu;
    339 #$virama''rrh$wrr;
    340 $virama''r$wrr;
    341 #$virama''rh$wr;
    342 $virama''r$wr;
    343 $virama''l$wll;
    344 #$virama''lh$wl;
    345 $virama''l$wl;
    346 $virama''e$we;
    347 $virama''o$wo;
    348 $virama''a$wa;
    349 $virama''e$wce;
    350 $virama''o$wco;
    351 $virama''e$wse;
    352 $virama''o$wso;
    353 # no virama
    354 ''a$waa;
    355 ''ai$wai;
    356 ''au$wau;
    357 ''i$wii;
    358 ''i$wi;
    359 ''u$wuu;
    360 ''u$wu;
    361 ''r$wrr;
    362 ''r$wr;
    363 ''l$wll;
    364 ''l$wl;
    365 ''e$we;
    366 ''o$wo;
    367 ''a$wa;
    368 ''e$wce;
    369 ''o$wco;
    370 ''e$wse;
    371 ''o$wso;
    372 $virama } [$z]  $virama;
    373 $virama } ' '  $virama ;
    374 $virama}$endThing;
    375 $dgs; # Glottal Stop
    376 0$zero;
    377 1$one;
    378 2$two;
    379 3$three;
    380 4$four;
    381 5$five;
    382 6$six;
    383 7$seven;
    384 8$eight;
    385 9$nine;
    386 '';
    387 #:: NFC (NFD) ;
    388 			</tRule>
    389 		</transform>
    390 	</transforms>
    391 </supplementalData>
    392