Home | History | Annotate | Download | only in testdata
      1 # Copyright (C) 2016 and later: Unicode, Inc. and others.
      2 # License & terms of use: http://www.unicode.org/copyright.html
      3 # *******************************************************************************
      4 # * Copyright (C) 2012, International Business Machines
      5 # * Corporation and others.  All Rights Reserved.
      6 # *******************************************************************************
      7 #
      8 # test2.ucm
      9 #
     10 # Test file for MBCS conversion with two-byte (DBCS) codepage data.
     11 # Also contains extension mappings (m:n).
     12 
     13 <code_set_name>     "test2"
     14 <mb_cur_max>        2
     15 <mb_cur_min>        1
     16 <uconv_class>       "MBCS"
     17 <subchar>           \x1A
     18 <icu:state>         0, 1:1, 5-9, 1a, ff
     19 <icu:state>         a-f.p
     20 
     21 CHARMAP
     22 
     23 # fromUnicode result is a zero byte for a code point other than U+0000
     24 <U0040>     \x00 |0
     25 
     26 # nothing special
     27 <U0065>     \x05 |0
     28 
     29 # extensions
     30 <U00c0>     \x05+\x01\x0d |0
     31 <U00c0>     \x05+\x01\x0e |3
     32 <U00c0>     \x05+\xff |3
     33 
     34 # toUnicode result is fallback direct
     35 <U0066>     \x06 |3
     36 
     37 # toUnicode result is direct non-BMP code point
     38 <U101234>   \x07 |0
     39 <Ufebcd>    \x08 |3
     40 
     41 # extensions
     42 <U101234>+<U50005>+<U60006> \x07+\x00+\x01\x0f+\x09 |0
     43 <U101234>+<U50005>          \x07+\x00+\x01\x0e+\x05 |0
     44 <U101234>+<U60006>          \x07+\x00+\x01\x0f+\x06 |0
     45 <U101234>+<U70007>          \x07+\x00+\x01\x0f |1
     46 
     47 #unassigned \x09
     48 
     49 # extensions where the first code point is unassigned, for replay testing
     50 #<U00c4><U0300> \x09+\x09 |0
     51 <U00c4><U00c4><U101234><U0005> \x05+\x01\x0c |0
     52 
     53 # toUnicode result is surrogate pair: test real pair, single unit, unassigned
     54 <U23456>    \x01\x0a |0
     55 <U000b>     \x01\x0b |0
     56 #unassigned \x01\x0c
     57 <U34567>    \x01\x0d |3
     58 <U000e>     \x01\x0e |3
     59 #unassigned \x01\x0f
     60 
     61 END CHARMAP
     62