Home | History | Annotate | Download | only in transforms
      1 <?xml version="1.0" encoding="UTF-8" ?>
      2 <!DOCTYPE supplementalData SYSTEM "../../common/dtd/ldmlSupplemental.dtd">
      3 <!--
      4 Copyright © 1991-2013 Unicode, Inc.
      5 CLDR data files are interpreted according to the LDML specification (http://unicode.org/reports/tr35/)
      6 For terms of use, see http://www.unicode.org/copyright.html
      7 -->
      8 <supplementalData>
      9 	<version number="$Revision: 12813 $"/>
     10 	<transforms>
     11 		<transform source="ro" target="ro_FONIPA" direction="forward" alias="ro-fonipa-t-ro">
     12 			<tRule><![CDATA[
     13 # Romanian orthography to phonemic (IPA) transcription.
     14 # http://en.wikipedia.org/wiki/Romanian_phonology
     15 # NOTE(review): non-ASCII characters (rule arrows, Romanian letters, IPA symbols) were restored by hand from rule order and the reference above; diff against upstream CLDR before shipping.
     16 # TODO: Currently this transform does not palatalize consonants.
     17 
     18 $VowelEI = [e i î];  # NOTE(review): third member restored as î; confirm
     19 $VowelAOU = [a ă â o u];
     20 $Vowel = [$VowelEI $VowelAOU];
     21 $Boundary =  [^[:L:][:M:][:N:]];  # anything that is not a letter, mark or number
     22 
     23 :: NFC () ;
     24 :: Lower () ;
     25 
     26 # Special cases. Rules are tried in order, so these must precede the triphthongs.
     27 eoai → e̯o̯aj ;  # eg. leoaică → /le̯o̯ajkə/, not /le̯o̯aikə/
     28 
     29 # Triphthongs. Listed before the diphthongs so that the longer sequence wins.
     30 eai → e̯aj ;
     31 eau → e̯aw ;
     32 eoa → e̯o̯a ;
     33 i\-ai → jaj ;
     34 ia\-i → jaj ;
     35 iau → jaw ;
     36 iei → jej ;
     37 ieu → jew ;
     38 $Boundary {eu} → jew ;  # word-initial "eu"
     39 ioa → jo̯a ;
     40 ioi → joj ;
     41 i\-oi → joj ;
     42 iou → jow ;
     43 oai → o̯aj ;
     44 uai → waj ;
     45 uau → waw ;
     46 uăi → wəj ;
     47 
     48 # Diphthongs. Listed before the single letters for the same reason.
     49 ai → aj ;
     50 ăi → əj ;
     51 âi → ɨj ;
     52 au} r → au ;  # "au" directly before r stays two full vowels
     53 au → aw ;
     54 ău → əw ;
     55 âu → ɨw ;
     56 ea → e̯a ;
     57 ei → ej ;
     58 eo → e̯o ;
     59 e\-o → e̯o ;
     60 eu → ew ;
     61 e\-u → e̯u ;  # NOTE(review): non-syllabic mark on e assumed; confirm
     62 ia → ja ;
     63 i\-a → ja ;
     64 ie → je ;
     65 ii → ij ;
     66 io → jo ;
     67 iu} [$Vowel $Boundary] → iw ;  # "iu" before a vowel or at a word end
     68 iu → ju ;
     69 oa → o̯a ;
     70 oi → oj ;
     71 ou → ow ;
     72 ua → wa ;
     73 uă → wə ;
     74 uâ → wɨ ;
     75 ue → we ;
     76 ui → uj ;
     77 uu → uw ;
     78 # Single letters and digraphs, in Romanian alphabetical order.
     79 a → a ;
     80 ă → ə ;
     81 â → ɨ ;
     82 b → b ;
     83 ch → k ;
     84 {c} [ei] → t͡ʃ ;  # NOTE(review): tie bar assumed; confirm
     85 c → k ;
     86 d → d ;
     87 e → e ;
     88 f → f ;
     89 gh → ɡ ;
     90 {g} [ei] → d͡ʒ ;  # NOTE(review): tie bar assumed; confirm
     91 g → ɡ ;
     92 h → h ;
     93 i → i ;
     94 î → ɨ ;
     95 j → ʒ ;
     96 k → k ;
     97 l → l ;
     98 m → m ;
     99 ng → ŋɡ ;  # NOTE(review): target was fully lost; ŋɡ assumed (could be ŋ), confirm
    100 n → n ;
    101 o → o ;
    102 p → p ;
    103 q → k ;
    104 r → r ;
    105 s → s ;
    106 ş → ʃ ;  # s with cedilla (legacy encoding)
    107 ș → ʃ ;  # s with comma below
    108 t → t ;
    109 ţ → t͡s ;  # t with cedilla (legacy encoding); NOTE(review): tie bar assumed
    110 ț → t͡s ;  # t with comma below; NOTE(review): tie bar assumed
    111 u → u ;
    112 v → v ;
    113 x → ks ;
    114 y → i ;
    115 z → z ;
    116 [:P:]+ → ' ';  # any run of punctuation becomes one space
    117 
    118 # Romanian does not have any gemination.
    119 # https://en.wikipedia.org/wiki/Gemination#Latin_and_Romance_languages
    120 ::null;  # start a second pass so the rules below see the IPA output
    121 pp+ → p;
    122 bb+ → b;
    123 tt+ → t;
    124 dd+ → d;
    125 kk+ → k;
    126 dd+ → d;  # NOTE(review): repeats the dd rule above as found; may have been an affricate rule, confirm
    127 ɡɡ+ → ɡ;
    128 
    129 ff+ → f;
    130 vv+ → v;
    131 hh+ → h;
    132 
    133 ss+ → s;
    134 zz+ → z;
    135 ʃʃ+ → ʃ;
    136 ʒʒ+ → ʒ;
    137 
    138 rr+ → r;
    139 ll+ → l;
    140 
    141 jj+ → j;
    142 ww+ → w;
    143 
    144 			]]></tRule>
    145 		</transform>
    146 	</transforms>
    147 </supplementalData>
    148