Home | History | Annotate | Download | only in transforms
      1 <?xml version="1.0" encoding="UTF-8" ?>
      2 <!DOCTYPE supplementalData SYSTEM "../../common/dtd/ldmlSupplemental.dtd">
      3 <!--
      4 Copyright © 1991-2013 Unicode, Inc.
      5 CLDR data files are interpreted according to the LDML specification (http://unicode.org/reports/tr35/)
      6 For terms of use, see http://www.unicode.org/copyright.html
      7 -->
      8 <supplementalData>
      9 	<version number="$Revision: 12243 $"/>
     10 	<transforms>
     11 		<transform source="it" target="ja" direction="forward" alias="ja-t-it">
     12 			<tRule>
     13 # Italian to Katakana Transliteration Table for ICU
     14 # Based on:
     15 #   "" (, 1974. ISBN:978-4475017176)
     16 #   http://ja.wikipedia.org/wiki/%E3%82%A4%E3%82%BF%E3%83%AA%E3%82%A2%E8%AA%9E
     17 
     18 ::NFD(NFC);
     19 ::Lower();
     20 ::[:Latin:] fullwidth-halfwidth();
     21 #
     22 #
     23 # Variables.
     24 
     25 $vowel = [aeiou];
     26 $consonant = [bcdfghjklmnpqrstvwxyz];
     27 #
     28 #
     29 # Ignore apostrophe.
     30 
     31 ($consonant) \'  | $1;
     32 \'  ;
     33 #
     34 #
     35 
     36 cqu  ;
     37 cc   | c;
     38 ca  ;
     39  { cia  ;
     40 cio  ;
     41 ci  ;
     42 cu  ;
     43 ce  ;
     44 co  ;
     45 #
     46 #
     47 
     48 cha  ;
     49 chi  ;
     50 chu  ;
     51 che  ;
     52 cho  ;
     53 #
     54 #
     55 
     56 gg   | g;
     57 ghi  ;
     58 ghe  ;
     59 ghu  ;
     60 gli  | li;
     61 gna  ;
     62 gni  ;
     63 gnu  ;
     64 gne  ;
     65 gno  ;
     66 #
     67 #
     68 
     69 ga  ;
     70 gia  ;
     71 giu  ;
     72 gio  ;
     73 gi  ;
     74 gu  ;
     75 ge  ;
     76 go  ;
     77 #
     78 #
     79 
     80 rr   | r;
     81 ra  ;
     82 ri  ;
     83 ru  ;
     84 re  ;
     85 ro  ;
     86 #
     87 #
     88 
     89 ll   | l;
     90 la  ;
     91 li  ;
     92 lu  ;
     93 le  ;
     94 lo  ;
     95 #
     96 #
     97 
     98 tt   | t;
     99 ta  ;
    100 ti  ;
    101 thi  ;
    102 tu  ;
    103 thu  ;
    104 te  ;
    105 the  ;
    106 to  ;
    107 tho  ;
    108 tzu  | ;
    109 tz  | zz;
    110 #
    111 #
    112 
    113 dd   | d;
    114 da  ;
    115 di  ;
    116 du  ;
    117 de  ;
    118 do  ;
    119 #
    120 #
    121 
    122 ma  ;
    123 mi  ;
    124 mu  ;
    125 me  ;
    126 mo  ;
    127 m } $consonant  ;
    128 #
    129 #
    130 
    131 na  ;
    132 ni  ;
    133 nu  ;
    134 ne  ;
    135 no  ;
    136 #
    137 #
    138 
    139 ff   | f;
    140 fa  ;
    141 fi  ;
    142 fu  ;
    143 fe  ;
    144 fo  ;
    145 #
    146 #
    147 
    148 bb   | b;
    149 ba  ;
    150 bi  ;
    151 bu  ;
    152 be  ;
    153 bo  ;
    154 #
    155 #
    156 
    157 pp   | p;
    158 pa  ;
    159 pi  ;
    160 pu  ;
    161 pe  ;
    162 po  ;
    163 #
    164 #
    165 
    166 vv   | v;
    167 va  ;
    168 vi  ;
    169 vu  ;
    170 ve  ;
    171 vo  ;
    172 #
    173 #
    174 
    175 sa } nt[ao]  ;
    176 ss   | \~s;
    177 #
    178 #
    179 # 's' is voiced before [bdglmnrv].
    180 
    181 sb   | b;
    182 sd   | d;
    183 sg   | g;
    184 sl   | l;
    185 sm   | m;
    186 sn   | n;
    187 sr   | r;
    188 sv   | v;
    189 #
    190 #
    191 # Force 's' after a consonant to be unvoiced.
    192 
    193 ($consonant) s } $vowel  | $1 \~ s;
    194 \~sa  ;
    195 \~si  ;
    196 \~su  ;
    197 \~se  ;
    198 \~so  ;
    199 #
    200 #
    201 # 's' at the beginning is usually unvoiced.
    202 
    203 [:^Letter:] { sa  ;
    204 [:^Letter:] { si  ;
    205 [:^Letter:] { su  ;
    206 [:^Letter:] { se  ;
    207 [:^Letter:] { so  ;
    208 #
    209 #
    210 # Otherwise, a voiced 's' is the common case.
    211 
    212 sa  ;
    213 si  ;
    214 su  ;
    215 se  ;
    216 so  ;
    217 #
    218 #
    219 
    220 scia  ;
    221 sci  ;
    222 sce  ;
    223 #
    224 #
    225 
    226 zz   | \~z;
    227 #
    228 # Force 'z' after a consonant to be unvoiced.
    229 
    230 ($consonant) z  | $1 \~z;
    231 \~za  ;
    232 \~zi  ;
    233 \~zu  ;
    234 \~ze  ;
    235 \~zo  ;
    236 #
    237 #
    238 # Otherwise, a voiced 'z' is the common case, except for 'zi'.
    239 
    240 za  ;
    241 [:^Letter:] { zi  ;
    242 zi  ;
    243 zu  ;
    244 ze  ;
    245 zo  ;
    246 #
    247 #
    248 
    249 ja  ;
    250 je  ;
    251 j  | i;
    252 #
    253 #
    254 # Standalone vowels and consonants.
    255 
    256 a  ;
    257 i  ;
    258 u  ;
    259 e  ;
    260 o  ;
    261 #
    262 #
    263 
    264 b  ;
    265 c  ;
    266 d  ;
    267 f  ;
    268 g  ;
    269 h  ;
    270 k  | c;
    271 l  ;
    272 m  ;
    273 n  ;
    274 p  ;
    275 q  | c;
    276 r  ;
    277 s  ;
    278 t  ;
    279 v  ;
    280 x  | cs;
    281 y  | i;
    282 z  ;
    283 #
    284 #
    285 # The word delimiter of a transliterated foreign phrase is '・' (U+30FB KATAKANA MIDDLE DOT).
    286 
    287 ' '  ;
    288 #
    289 #
    290 # Latin hyphen should be transliterated to U+30A0 (KATAKANA-HIRAGANA
    291 # DOUBLE HYPHEN), ideally. But since the character isn't supported by
    292 # many fonts or software, we use U+FF1D (FULLWIDTH EQUALS SIGN),
    293 # which is widely used as "double hyphen".
    294 #
    295 
    296 \-  ;
    297 #
    298 #
    299 
    300 [:nonspacing mark:]  ;
    301 ::NFC(NFD);
    302 			</tRule>
    303 		</transform>
    304 	</transforms>
    305 </supplementalData>
    306