/* Wide-character case conversion: towupper() and towlower(). */
      1 #include <wchar.h>
      2 #include <wctype.h>
      3 #include <stdio.h>
      4 
      5 #define CASEMAP(u1,u2,l) { (u1), (l)-(u1), (u2)-(u1)+1 }
      6 #define CASELACE(u1,u2) CASEMAP((u1),(u2),(u1)+1)
      7 
      8 static const struct {
      9 	unsigned short upper;
     10 	signed char lower;
     11 	unsigned char len;
     12 } casemaps[] = {
     13 	CASEMAP('A','Z','a'),
     14 	CASEMAP(0xc0,0xde,0xe0),
     15 
     16 	CASELACE(0x0100,0x012e),
     17 	CASELACE(0x0132,0x0136),
     18 	CASELACE(0x0139,0x0147),
     19 	CASELACE(0x014a,0x0176),
     20 	CASELACE(0x0179,0x017d),
     21 
     22 	CASELACE(0x370,0x372),
     23 	CASEMAP(0x391,0x3a1,0x3b1),
     24 	CASEMAP(0x3a3,0x3ab,0x3c3),
     25 	CASEMAP(0x400,0x40f,0x450),
     26 	CASEMAP(0x410,0x42f,0x430),
     27 
     28 	CASELACE(0x460,0x480),
     29 	CASELACE(0x48a,0x4be),
     30 	CASELACE(0x4c1,0x4cd),
     31 	CASELACE(0x4d0,0x50e),
     32 
     33 	CASELACE(0x514,0x526),
     34 	CASEMAP(0x531,0x556,0x561),
     35 
     36 	CASELACE(0x01a0,0x01a4),
     37 	CASELACE(0x01b3,0x01b5),
     38 	CASELACE(0x01cd,0x01db),
     39 	CASELACE(0x01de,0x01ee),
     40 	CASELACE(0x01f8,0x021e),
     41 	CASELACE(0x0222,0x0232),
     42 	CASELACE(0x03d8,0x03ee),
     43 
     44 	CASELACE(0x1e00,0x1e94),
     45 	CASELACE(0x1ea0,0x1efe),
     46 
     47 	CASEMAP(0x1f08,0x1f0f,0x1f00),
     48 	CASEMAP(0x1f18,0x1f1d,0x1f10),
     49 	CASEMAP(0x1f28,0x1f2f,0x1f20),
     50 	CASEMAP(0x1f38,0x1f3f,0x1f30),
     51 	CASEMAP(0x1f48,0x1f4d,0x1f40),
     52 
     53 	CASEMAP(0x1f68,0x1f6f,0x1f60),
     54 	CASEMAP(0x1f88,0x1f8f,0x1f80),
     55 	CASEMAP(0x1f98,0x1f9f,0x1f90),
     56 	CASEMAP(0x1fa8,0x1faf,0x1fa0),
     57 	CASEMAP(0x1fb8,0x1fb9,0x1fb0),
     58 	CASEMAP(0x1fba,0x1fbb,0x1f70),
     59 	CASEMAP(0x1fc8,0x1fcb,0x1f72),
     60 	CASEMAP(0x1fd8,0x1fd9,0x1fd0),
     61 	CASEMAP(0x1fda,0x1fdb,0x1f76),
     62 	CASEMAP(0x1fe8,0x1fe9,0x1fe0),
     63 	CASEMAP(0x1fea,0x1feb,0x1f7a),
     64 	CASEMAP(0x1ff8,0x1ff9,0x1f78),
     65 	CASEMAP(0x1ffa,0x1ffb,0x1f7c),
     66 
     67 	CASELACE(0x246,0x24e),
     68 	CASELACE(0x510,0x512),
     69 	CASEMAP(0x2160,0x216f,0x2170),
     70 	CASEMAP(0x2c00,0x2c2e,0x2c30),
     71 	CASELACE(0x2c67,0x2c6b),
     72 	CASELACE(0x2c80,0x2ce2),
     73 	CASELACE(0x2ceb,0x2ced),
     74 
     75 	CASELACE(0xa640,0xa66c),
     76 	CASELACE(0xa680,0xa696),
     77 
     78 	CASELACE(0xa722,0xa72e),
     79 	CASELACE(0xa732,0xa76e),
     80 	CASELACE(0xa779,0xa77b),
     81 	CASELACE(0xa77e,0xa786),
     82 
     83 	CASELACE(0xa790,0xa792),
     84 	CASELACE(0xa7a0,0xa7a8),
     85 
     86 	CASEMAP(0xff21,0xff3a,0xff41),
     87 	{ 0,0,0 }
     88 };
     89 
     90 static const unsigned short pairs[][2] = {
     91 	{ 'I',    0x0131 },
     92 	{ 'S',    0x017f },
     93 	{ 0x0130, 'i'    },
     94 	{ 0x0178, 0x00ff },
     95 	{ 0x0181, 0x0253 },
     96 	{ 0x0182, 0x0183 },
     97 	{ 0x0184, 0x0185 },
     98 	{ 0x0186, 0x0254 },
     99 	{ 0x0187, 0x0188 },
    100 	{ 0x0189, 0x0256 },
    101 	{ 0x018a, 0x0257 },
    102 	{ 0x018b, 0x018c },
    103 	{ 0x018e, 0x01dd },
    104 	{ 0x018f, 0x0259 },
    105 	{ 0x0190, 0x025b },
    106 	{ 0x0191, 0x0192 },
    107 	{ 0x0193, 0x0260 },
    108 	{ 0x0194, 0x0263 },
    109 	{ 0x0196, 0x0269 },
    110 	{ 0x0197, 0x0268 },
    111 	{ 0x0198, 0x0199 },
    112 	{ 0x019c, 0x026f },
    113 	{ 0x019d, 0x0272 },
    114 	{ 0x019f, 0x0275 },
    115 	{ 0x01a6, 0x0280 },
    116 	{ 0x01a7, 0x01a8 },
    117 	{ 0x01a9, 0x0283 },
    118 	{ 0x01ac, 0x01ad },
    119 	{ 0x01ae, 0x0288 },
    120 	{ 0x01af, 0x01b0 },
    121 	{ 0x01b1, 0x028a },
    122 	{ 0x01b2, 0x028b },
    123 	{ 0x01b7, 0x0292 },
    124 	{ 0x01b8, 0x01b9 },
    125 	{ 0x01bc, 0x01bd },
    126 	{ 0x01c4, 0x01c6 },
    127 	{ 0x01c4, 0x01c5 },
    128 	{ 0x01c5, 0x01c6 },
    129 	{ 0x01c7, 0x01c9 },
    130 	{ 0x01c7, 0x01c8 },
    131 	{ 0x01c8, 0x01c9 },
    132 	{ 0x01ca, 0x01cc },
    133 	{ 0x01ca, 0x01cb },
    134 	{ 0x01cb, 0x01cc },
    135 	{ 0x01f1, 0x01f3 },
    136 	{ 0x01f1, 0x01f2 },
    137 	{ 0x01f2, 0x01f3 },
    138 	{ 0x01f4, 0x01f5 },
    139 	{ 0x01f6, 0x0195 },
    140 	{ 0x01f7, 0x01bf },
    141 	{ 0x0220, 0x019e },
    142 	{ 0x0386, 0x03ac },
    143 	{ 0x0388, 0x03ad },
    144 	{ 0x0389, 0x03ae },
    145 	{ 0x038a, 0x03af },
    146 	{ 0x038c, 0x03cc },
    147 	{ 0x038e, 0x03cd },
    148 	{ 0x038f, 0x03ce },
    149 	{ 0x0399, 0x0345 },
    150 	{ 0x0399, 0x1fbe },
    151 	{ 0x03a3, 0x03c2 },
    152 	{ 0x03f7, 0x03f8 },
    153 	{ 0x03fa, 0x03fb },
    154 	{ 0x1e60, 0x1e9b },
    155 	{ 0xdf, 0xdf },
    156 	{ 0x1e9e, 0xdf },
    157 
    158 	{ 0x1f59, 0x1f51 },
    159 	{ 0x1f5b, 0x1f53 },
    160 	{ 0x1f5d, 0x1f55 },
    161 	{ 0x1f5f, 0x1f57 },
    162 	{ 0x1fbc, 0x1fb3 },
    163 	{ 0x1fcc, 0x1fc3 },
    164 	{ 0x1fec, 0x1fe5 },
    165 	{ 0x1ffc, 0x1ff3 },
    166 
    167 	{ 0x23a, 0x2c65 },
    168 	{ 0x23b, 0x23c },
    169 	{ 0x23d, 0x19a },
    170 	{ 0x23e, 0x2c66 },
    171 	{ 0x241, 0x242 },
    172 	{ 0x243, 0x180 },
    173 	{ 0x244, 0x289 },
    174 	{ 0x245, 0x28c },
    175 	{ 0x3f4, 0x3b8 },
    176 	{ 0x3f9, 0x3f2 },
    177 	{ 0x3fd, 0x37b },
    178 	{ 0x3fe, 0x37c },
    179 	{ 0x3ff, 0x37d },
    180 	{ 0x4c0, 0x4cf },
    181 
    182 	{ 0x2126, 0x3c9 },
    183 	{ 0x212a, 'k' },
    184 	{ 0x212b, 0xe5 },
    185 	{ 0x2132, 0x214e },
    186 	{ 0x2183, 0x2184 },
    187 	{ 0x2c60, 0x2c61 },
    188 	{ 0x2c62, 0x26b },
    189 	{ 0x2c63, 0x1d7d },
    190 	{ 0x2c64, 0x27d },
    191 	{ 0x2c6d, 0x251 },
    192 	{ 0x2c6e, 0x271 },
    193 	{ 0x2c6f, 0x250 },
    194 	{ 0x2c70, 0x252 },
    195 	{ 0x2c72, 0x2c73 },
    196 	{ 0x2c75, 0x2c76 },
    197 	{ 0x2c7e, 0x23f },
    198 	{ 0x2c7f, 0x240 },
    199 	{ 0x2cf2, 0x2cf3 },
    200 
    201 	{ 0xa77d, 0x1d79 },
    202 	{ 0xa78b, 0xa78c },
    203 	{ 0xa78d, 0x265 },
    204 	{ 0xa7aa, 0x266 },
    205 
    206 	{ 0x10c7, 0x2d27 },
    207 	{ 0x10cd, 0x2d2d },
    208 
    209 	/* bogus greek 'symbol' letters */
    210 	{ 0x376, 0x377 },
    211 	{ 0x39c, 0xb5 },
    212 	{ 0x392, 0x3d0 },
    213 	{ 0x398, 0x3d1 },
    214 	{ 0x3a6, 0x3d5 },
    215 	{ 0x3a0, 0x3d6 },
    216 	{ 0x39a, 0x3f0 },
    217 	{ 0x3a1, 0x3f1 },
    218 	{ 0x395, 0x3f5 },
    219 	{ 0x3cf, 0x3d7 },
    220 
    221 	{ 0,0 }
    222 };
    223 
    224 
    225 static wchar_t __towcase(wchar_t wc, int lower)
    226 {
    227 	int i;
    228 	int lmul = 2*lower-1;
    229 	int lmask = lower-1;
    230 	/* no letters with case in these large ranges */
    231 	if (!iswalpha(wc)
    232 	 || (unsigned)wc - 0x0600 <= 0x0fff-0x0600
    233 	 || (unsigned)wc - 0x2e00 <= 0xa63f-0x2e00
    234 	 || (unsigned)wc - 0xa800 <= 0xfeff-0xa800)
    235 		return wc;
    236 	/* special case because the diff between upper/lower is too big */
    237 	if (lower && (unsigned)wc - 0x10a0 < 0x2e)
    238 		if (wc>0x10c5 && wc != 0x10c7 && wc != 0x10cd) return wc;
    239 		else return wc + 0x2d00 - 0x10a0;
    240 	if (!lower && (unsigned)wc - 0x2d00 < 0x26)
    241 		if (wc>0x2d25 && wc != 0x2d27 && wc != 0x2d2d) return wc;
    242 		else return wc + 0x10a0 - 0x2d00;
    243 	for (i=0; casemaps[i].len; i++) {
    244 		int base = casemaps[i].upper + (lmask & casemaps[i].lower);
    245 		if ((unsigned)wc-base < casemaps[i].len) {
    246 			if (casemaps[i].lower == 1)
    247 				return wc + lower - ((wc-casemaps[i].upper)&1);
    248 			return wc + lmul*casemaps[i].lower;
    249 		}
    250 	}
    251 	for (i=0; pairs[i][1-lower]; i++) {
    252 		if (pairs[i][1-lower] == wc)
    253 			return pairs[i][lower];
    254 	}
    255 	if ((unsigned)wc - (0x10428 - 0x28*lower) < 0x28)
    256 		return wc - 0x28 + 0x50*lower;
    257 	return wc;
    258 }
    259 
    260 wint_t towupper(wint_t wc)
    261 {
    262 	return __towcase(wc, 0);
    263 }
    264 
    265 wint_t towlower(wint_t wc)
    266 {
    267 	return __towcase(wc, 1);
    268 }
    269