1 /* The table and comments below along with the function xkb_keysym_to_ucs4 2 * are under the public domain and are derived as described below. 3 */ 4 /* This module converts keysym values into the corresponding ISO 10646 5 * (UCS, Unicode) values. 6 * 7 * The array keysymtab[] contains pairs of X11 keysym values for graphical 8 * characters and the corresponding Unicode value. The function 9 * keysym2ucs() maps a keysym onto a Unicode value using a binary search, 10 * therefore keysymtab[] must remain SORTED by keysym value. 11 * 12 * The keysym -> UTF-8 conversion will hopefully one day be provided 13 * by Xlib via XmbLookupString() and should ideally not have to be 14 * done in X applications. But we are not there yet. 15 * 16 * We allow to represent any UCS character in the range U-00000000 to 17 * U-00FFFFFF by a keysym value in the range 0x01000000 to 0x01ffffff. 18 * This admittedly does not cover the entire 31-bit space of UCS, but 19 * it does cover all of the characters up to U-10FFFF, which can be 20 * represented by UTF-16, and more, and it is very unlikely that higher 21 * UCS codes will ever be assigned by ISO. So to get Unicode character 22 * U+ABCD you can directly use keysym 0x0100abcd. 23 * 24 * NOTE: The comments in the table below contain the actual character 25 * encoded in UTF-8, so for viewing and editing best use an editor in 26 * UTF-8 mode. 27 * 28 * Author: Markus G. Kuhn <http://www.cl.cam.ac.uk/~mgk25/>, 29 * University of Cambridge, April 2001 30 * 31 * Special thanks to Richard Verhoeven <river (at) win.tue.nl> for preparing 32 * an initial draft of the mapping table. 33 * 34 * This software is in the public domain. Share and enjoy! 35 * 36 */ 37 38 #include "xkbcommon/xkbcommon.h" 39 #include "utils.h" 40 #include "utf8.h" 41 42 /* We don't use the uint32_t types here, to save some space. */ 43 struct codepair { 44 uint16_t keysym; 45 uint16_t ucs; 46 }; 47 48 static const struct codepair keysymtab[] = { 49 { 0x01a1, 0x0104 }, /* Aogonek LATIN CAPITAL LETTER A WITH OGONEK */ 50 { 0x01a2, 0x02d8 }, /* breve BREVE */ 51 { 0x01a3, 0x0141 }, /* Lstroke LATIN CAPITAL LETTER L WITH STROKE */ 52 { 0x01a5, 0x013d }, /* Lcaron LATIN CAPITAL LETTER L WITH CARON */ 53 { 0x01a6, 0x015a }, /* Sacute LATIN CAPITAL LETTER S WITH ACUTE */ 54 { 0x01a9, 0x0160 }, /* Scaron LATIN CAPITAL LETTER S WITH CARON */ 55 { 0x01aa, 0x015e }, /* Scedilla LATIN CAPITAL LETTER S WITH CEDILLA */ 56 { 0x01ab, 0x0164 }, /* Tcaron LATIN CAPITAL LETTER T WITH CARON */ 57 { 0x01ac, 0x0179 }, /* Zacute LATIN CAPITAL LETTER Z WITH ACUTE */ 58 { 0x01ae, 0x017d }, /* Zcaron LATIN CAPITAL LETTER Z WITH CARON */ 59 { 0x01af, 0x017b }, /* Zabovedot LATIN CAPITAL LETTER Z WITH DOT ABOVE */ 60 { 0x01b1, 0x0105 }, /* aogonek LATIN SMALL LETTER A WITH OGONEK */ 61 { 0x01b2, 0x02db }, /* ogonek OGONEK */ 62 { 0x01b3, 0x0142 }, /* lstroke LATIN SMALL LETTER L WITH STROKE */ 63 { 0x01b5, 0x013e }, /* lcaron LATIN SMALL LETTER L WITH CARON */ 64 { 0x01b6, 0x015b }, /* sacute LATIN SMALL LETTER S WITH ACUTE */ 65 { 0x01b7, 0x02c7 }, /* caron CARON */ 66 { 0x01b9, 0x0161 }, /* scaron LATIN SMALL LETTER S WITH CARON */ 67 { 0x01ba, 0x015f }, /* scedilla LATIN SMALL LETTER S WITH CEDILLA */ 68 { 0x01bb, 0x0165 }, /* tcaron LATIN SMALL LETTER T WITH CARON */ 69 { 0x01bc, 0x017a }, /* zacute LATIN SMALL LETTER Z WITH ACUTE */ 70 { 0x01bd, 0x02dd }, /* doubleacute DOUBLE ACUTE ACCENT */ 71 { 0x01be, 0x017e }, /* zcaron LATIN SMALL LETTER Z WITH CARON */ 72 { 0x01bf, 0x017c }, /* zabovedot LATIN SMALL LETTER Z WITH DOT ABOVE */ 73 { 0x01c0, 0x0154 }, /* Racute LATIN CAPITAL LETTER R WITH ACUTE */ 74 { 0x01c3, 0x0102 }, /* Abreve LATIN CAPITAL LETTER A WITH BREVE */ 75 { 0x01c5, 0x0139 }, /* Lacute LATIN CAPITAL LETTER L WITH ACUTE */ 76 { 0x01c6, 0x0106 }, /* Cacute LATIN CAPITAL LETTER C WITH ACUTE */ 77 { 0x01c8, 0x010c }, /* Ccaron LATIN CAPITAL LETTER C WITH CARON */ 78 { 0x01ca, 0x0118 }, /* Eogonek LATIN CAPITAL LETTER E WITH OGONEK */ 79 { 0x01cc, 0x011a }, /* Ecaron LATIN CAPITAL LETTER E WITH CARON */ 80 { 0x01cf, 0x010e }, /* Dcaron LATIN CAPITAL LETTER D WITH CARON */ 81 { 0x01d0, 0x0110 }, /* Dstroke LATIN CAPITAL LETTER D WITH STROKE */ 82 { 0x01d1, 0x0143 }, /* Nacute LATIN CAPITAL LETTER N WITH ACUTE */ 83 { 0x01d2, 0x0147 }, /* Ncaron LATIN CAPITAL LETTER N WITH CARON */ 84 { 0x01d5, 0x0150 }, /* Odoubleacute LATIN CAPITAL LETTER O WITH DOUBLE ACUTE */ 85 { 0x01d8, 0x0158 }, /* Rcaron LATIN CAPITAL LETTER R WITH CARON */ 86 { 0x01d9, 0x016e }, /* Uring LATIN CAPITAL LETTER U WITH RING ABOVE */ 87 { 0x01db, 0x0170 }, /* Udoubleacute LATIN CAPITAL LETTER U WITH DOUBLE ACUTE */ 88 { 0x01de, 0x0162 }, /* Tcedilla LATIN CAPITAL LETTER T WITH CEDILLA */ 89 { 0x01e0, 0x0155 }, /* racute LATIN SMALL LETTER R WITH ACUTE */ 90 { 0x01e3, 0x0103 }, /* abreve LATIN SMALL LETTER A WITH BREVE */ 91 { 0x01e5, 0x013a }, /* lacute LATIN SMALL LETTER L WITH ACUTE */ 92 { 0x01e6, 0x0107 }, /* cacute LATIN SMALL LETTER C WITH ACUTE */ 93 { 0x01e8, 0x010d }, /* ccaron LATIN SMALL LETTER C WITH CARON */ 94 { 0x01ea, 0x0119 }, /* eogonek LATIN SMALL LETTER E WITH OGONEK */ 95 { 0x01ec, 0x011b }, /* ecaron LATIN SMALL LETTER E WITH CARON */ 96 { 0x01ef, 0x010f }, /* dcaron LATIN SMALL LETTER D WITH CARON */ 97 { 0x01f0, 0x0111 }, /* dstroke LATIN SMALL LETTER D WITH STROKE */ 98 { 0x01f1, 0x0144 }, /* nacute LATIN SMALL LETTER N WITH ACUTE */ 99 { 0x01f2, 0x0148 }, /* ncaron LATIN SMALL LETTER N WITH CARON */ 100 { 0x01f5, 0x0151 }, /* odoubleacute LATIN SMALL LETTER O WITH DOUBLE ACUTE */ 101 { 0x01f8, 0x0159 }, /* rcaron LATIN SMALL LETTER R WITH CARON */ 102 { 0x01f9, 0x016f }, /* uring LATIN SMALL LETTER U WITH RING ABOVE */ 103 { 0x01fb, 0x0171 }, /* udoubleacute LATIN SMALL LETTER U WITH DOUBLE ACUTE */ 104 { 0x01fe, 0x0163 }, /* tcedilla LATIN SMALL LETTER T WITH CEDILLA */ 105 { 0x01ff, 0x02d9 }, /* abovedot DOT ABOVE */ 106 { 0x02a1, 0x0126 }, /* Hstroke LATIN CAPITAL LETTER H WITH STROKE */ 107 { 0x02a6, 0x0124 }, /* Hcircumflex LATIN CAPITAL LETTER H WITH CIRCUMFLEX */ 108 { 0x02a9, 0x0130 }, /* Iabovedot LATIN CAPITAL LETTER I WITH DOT ABOVE */ 109 { 0x02ab, 0x011e }, /* Gbreve LATIN CAPITAL LETTER G WITH BREVE */ 110 { 0x02ac, 0x0134 }, /* Jcircumflex LATIN CAPITAL LETTER J WITH CIRCUMFLEX */ 111 { 0x02b1, 0x0127 }, /* hstroke LATIN SMALL LETTER H WITH STROKE */ 112 { 0x02b6, 0x0125 }, /* hcircumflex LATIN SMALL LETTER H WITH CIRCUMFLEX */ 113 { 0x02b9, 0x0131 }, /* idotless LATIN SMALL LETTER DOTLESS I */ 114 { 0x02bb, 0x011f }, /* gbreve LATIN SMALL LETTER G WITH BREVE */ 115 { 0x02bc, 0x0135 }, /* jcircumflex LATIN SMALL LETTER J WITH CIRCUMFLEX */ 116 { 0x02c5, 0x010a }, /* Cabovedot LATIN CAPITAL LETTER C WITH DOT ABOVE */ 117 { 0x02c6, 0x0108 }, /* Ccircumflex LATIN CAPITAL LETTER C WITH CIRCUMFLEX */ 118 { 0x02d5, 0x0120 }, /* Gabovedot LATIN CAPITAL LETTER G WITH DOT ABOVE */ 119 { 0x02d8, 0x011c }, /* Gcircumflex LATIN CAPITAL LETTER G WITH CIRCUMFLEX */ 120 { 0x02dd, 0x016c }, /* Ubreve LATIN CAPITAL LETTER U WITH BREVE */ 121 { 0x02de, 0x015c }, /* Scircumflex LATIN CAPITAL LETTER S WITH CIRCUMFLEX */ 122 { 0x02e5, 0x010b }, /* cabovedot LATIN SMALL LETTER C WITH DOT ABOVE */ 123 { 0x02e6, 0x0109 }, /* ccircumflex LATIN SMALL LETTER C WITH CIRCUMFLEX */ 124 { 0x02f5, 0x0121 }, /* gabovedot LATIN SMALL LETTER G WITH DOT ABOVE */ 125 { 0x02f8, 0x011d }, /* gcircumflex LATIN SMALL LETTER G WITH CIRCUMFLEX */ 126 { 0x02fd, 0x016d }, /* ubreve LATIN SMALL LETTER U WITH BREVE */ 127 { 0x02fe, 0x015d }, /* scircumflex LATIN SMALL LETTER S WITH CIRCUMFLEX */ 128 { 0x03a2, 0x0138 }, /* kra LATIN SMALL LETTER KRA */ 129 { 0x03a3, 0x0156 }, /* Rcedilla LATIN CAPITAL LETTER R WITH CEDILLA */ 130 { 0x03a5, 0x0128 }, /* Itilde LATIN CAPITAL LETTER I WITH TILDE */ 131 { 0x03a6, 0x013b }, /* Lcedilla LATIN CAPITAL LETTER L WITH CEDILLA */ 132 { 0x03aa, 0x0112 }, /* Emacron LATIN CAPITAL LETTER E WITH MACRON */ 133 { 0x03ab, 0x0122 }, /* Gcedilla LATIN CAPITAL LETTER G WITH CEDILLA */ 134 { 0x03ac, 0x0166 }, /* Tslash LATIN CAPITAL LETTER T WITH STROKE */ 135 { 0x03b3, 0x0157 }, /* rcedilla LATIN SMALL LETTER R WITH CEDILLA */ 136 { 0x03b5, 0x0129 }, /* itilde LATIN SMALL LETTER I WITH TILDE */ 137 { 0x03b6, 0x013c }, /* lcedilla LATIN SMALL LETTER L WITH CEDILLA */ 138 { 0x03ba, 0x0113 }, /* emacron LATIN SMALL LETTER E WITH MACRON */ 139 { 0x03bb, 0x0123 }, /* gcedilla LATIN SMALL LETTER G WITH CEDILLA */ 140 { 0x03bc, 0x0167 }, /* tslash LATIN SMALL LETTER T WITH STROKE */ 141 { 0x03bd, 0x014a }, /* ENG LATIN CAPITAL LETTER ENG */ 142 { 0x03bf, 0x014b }, /* eng LATIN SMALL LETTER ENG */ 143 { 0x03c0, 0x0100 }, /* Amacron LATIN CAPITAL LETTER A WITH MACRON */ 144 { 0x03c7, 0x012e }, /* Iogonek LATIN CAPITAL LETTER I WITH OGONEK */ 145 { 0x03cc, 0x0116 }, /* Eabovedot LATIN CAPITAL LETTER E WITH DOT ABOVE */ 146 { 0x03cf, 0x012a }, /* Imacron LATIN CAPITAL LETTER I WITH MACRON */ 147 { 0x03d1, 0x0145 }, /* Ncedilla LATIN CAPITAL LETTER N WITH CEDILLA */ 148 { 0x03d2, 0x014c }, /* Omacron LATIN CAPITAL LETTER O WITH MACRON */ 149 { 0x03d3, 0x0136 }, /* Kcedilla LATIN CAPITAL LETTER K WITH CEDILLA */ 150 { 0x03d9, 0x0172 }, /* Uogonek LATIN CAPITAL LETTER U WITH OGONEK */ 151 { 0x03dd, 0x0168 }, /* Utilde LATIN CAPITAL LETTER U WITH TILDE */ 152 { 0x03de, 0x016a }, /* Umacron LATIN CAPITAL LETTER U WITH MACRON */ 153 { 0x03e0, 0x0101 }, /* amacron LATIN SMALL LETTER A WITH MACRON */ 154 { 0x03e7, 0x012f }, /* iogonek LATIN SMALL LETTER I WITH OGONEK */ 155 { 0x03ec, 0x0117 }, /* eabovedot LATIN SMALL LETTER E WITH DOT ABOVE */ 156 { 0x03ef, 0x012b }, /* imacron LATIN SMALL LETTER I WITH MACRON */ 157 { 0x03f1, 0x0146 }, /* ncedilla LATIN SMALL LETTER N WITH CEDILLA */ 158 { 0x03f2, 0x014d }, /* omacron LATIN SMALL LETTER O WITH MACRON */ 159 { 0x03f3, 0x0137 }, /* kcedilla LATIN SMALL LETTER K WITH CEDILLA */ 160 { 0x03f9, 0x0173 }, /* uogonek LATIN SMALL LETTER U WITH OGONEK */ 161 { 0x03fd, 0x0169 }, /* utilde LATIN SMALL LETTER U WITH TILDE */ 162 { 0x03fe, 0x016b }, /* umacron LATIN SMALL LETTER U WITH MACRON */ 163 { 0x047e, 0x203e }, /* overline OVERLINE */ 164 { 0x04a1, 0x3002 }, /* kana_fullstop IDEOGRAPHIC FULL STOP */ 165 { 0x04a2, 0x300c }, /* kana_openingbracket LEFT CORNER BRACKET */ 166 { 0x04a3, 0x300d }, /* kana_closingbracket RIGHT CORNER BRACKET */ 167 { 0x04a4, 0x3001 }, /* kana_comma IDEOGRAPHIC COMMA */ 168 { 0x04a5, 0x30fb }, /* kana_conjunctive KATAKANA MIDDLE DOT */ 169 { 0x04a6, 0x30f2 }, /* kana_WO KATAKANA LETTER WO */ 170 { 0x04a7, 0x30a1 }, /* kana_a KATAKANA LETTER SMALL A */ 171 { 0x04a8, 0x30a3 }, /* kana_i KATAKANA LETTER SMALL I */ 172 { 0x04a9, 0x30a5 }, /* kana_u KATAKANA LETTER SMALL U */ 173 { 0x04aa, 0x30a7 }, /* kana_e KATAKANA LETTER SMALL E */ 174 { 0x04ab, 0x30a9 }, /* kana_o KATAKANA LETTER SMALL O */ 175 { 0x04ac, 0x30e3 }, /* kana_ya KATAKANA LETTER SMALL YA */ 176 { 0x04ad, 0x30e5 }, /* kana_yu KATAKANA LETTER SMALL YU */ 177 { 0x04ae, 0x30e7 }, /* kana_yo KATAKANA LETTER SMALL YO */ 178 { 0x04af, 0x30c3 }, /* kana_tsu KATAKANA LETTER SMALL TU */ 179 { 0x04b0, 0x30fc }, /* prolongedsound KATAKANA-HIRAGANA PROLONGED SOUND MARK */ 180 { 0x04b1, 0x30a2 }, /* kana_A KATAKANA LETTER A */ 181 { 0x04b2, 0x30a4 }, /* kana_I KATAKANA LETTER I */ 182 { 0x04b3, 0x30a6 }, /* kana_U KATAKANA LETTER U */ 183 { 0x04b4, 0x30a8 }, /* kana_E KATAKANA LETTER E */ 184 { 0x04b5, 0x30aa }, /* kana_O KATAKANA LETTER O */ 185 { 0x04b6, 0x30ab }, /* kana_KA KATAKANA LETTER KA */ 186 { 0x04b7, 0x30ad }, /* kana_KI KATAKANA LETTER KI */ 187 { 0x04b8, 0x30af }, /* kana_KU KATAKANA LETTER KU */ 188 { 0x04b9, 0x30b1 }, /* kana_KE KATAKANA LETTER KE */ 189 { 0x04ba, 0x30b3 }, /* kana_KO KATAKANA LETTER KO */ 190 { 0x04bb, 0x30b5 }, /* kana_SA KATAKANA LETTER SA */ 191 { 0x04bc, 0x30b7 }, /* kana_SHI KATAKANA LETTER SI */ 192 { 0x04bd, 0x30b9 }, /* kana_SU KATAKANA LETTER SU */ 193 { 0x04be, 0x30bb }, /* kana_SE KATAKANA LETTER SE */ 194 { 0x04bf, 0x30bd }, /* kana_SO KATAKANA LETTER SO */ 195 { 0x04c0, 0x30bf }, /* kana_TA KATAKANA LETTER TA */ 196 { 0x04c1, 0x30c1 }, /* kana_CHI KATAKANA LETTER TI */ 197 { 0x04c2, 0x30c4 }, /* kana_TSU KATAKANA LETTER TU */ 198 { 0x04c3, 0x30c6 }, /* kana_TE KATAKANA LETTER TE */ 199 { 0x04c4, 0x30c8 }, /* kana_TO KATAKANA LETTER TO */ 200 { 0x04c5, 0x30ca }, /* kana_NA KATAKANA LETTER NA */ 201 { 0x04c6, 0x30cb }, /* kana_NI KATAKANA LETTER NI */ 202 { 0x04c7, 0x30cc }, /* kana_NU KATAKANA LETTER NU */ 203 { 0x04c8, 0x30cd }, /* kana_NE KATAKANA LETTER NE */ 204 { 0x04c9, 0x30ce }, /* kana_NO KATAKANA LETTER NO */ 205 { 0x04ca, 0x30cf }, /* kana_HA KATAKANA LETTER HA */ 206 { 0x04cb, 0x30d2 }, /* kana_HI KATAKANA LETTER HI */ 207 { 0x04cc, 0x30d5 }, /* kana_FU KATAKANA LETTER HU */ 208 { 0x04cd, 0x30d8 }, /* kana_HE KATAKANA LETTER HE */ 209 { 0x04ce, 0x30db }, /* kana_HO KATAKANA LETTER HO */ 210 { 0x04cf, 0x30de }, /* kana_MA KATAKANA LETTER MA */ 211 { 0x04d0, 0x30df }, /* kana_MI KATAKANA LETTER MI */ 212 { 0x04d1, 0x30e0 }, /* kana_MU KATAKANA LETTER MU */ 213 { 0x04d2, 0x30e1 }, /* kana_ME KATAKANA LETTER ME */ 214 { 0x04d3, 0x30e2 }, /* kana_MO KATAKANA LETTER MO */ 215 { 0x04d4, 0x30e4 }, /* kana_YA KATAKANA LETTER YA */ 216 { 0x04d5, 0x30e6 }, /* kana_YU KATAKANA LETTER YU */ 217 { 0x04d6, 0x30e8 }, /* kana_YO KATAKANA LETTER YO */ 218 { 0x04d7, 0x30e9 }, /* kana_RA KATAKANA LETTER RA */ 219 { 0x04d8, 0x30ea }, /* kana_RI KATAKANA LETTER RI */ 220 { 0x04d9, 0x30eb }, /* kana_RU KATAKANA LETTER RU */ 221 { 0x04da, 0x30ec }, /* kana_RE KATAKANA LETTER RE */ 222 { 0x04db, 0x30ed }, /* kana_RO KATAKANA LETTER RO */ 223 { 0x04dc, 0x30ef }, /* kana_WA KATAKANA LETTER WA */ 224 { 0x04dd, 0x30f3 }, /* kana_N KATAKANA LETTER N */ 225 { 0x04de, 0x309b }, /* voicedsound KATAKANA-HIRAGANA VOICED SOUND MARK */ 226 { 0x04df, 0x309c }, /* semivoicedsound KATAKANA-HIRAGANA SEMI-VOICED SOUND MARK */ 227 { 0x05ac, 0x060c }, /* Arabic_comma ARABIC COMMA */ 228 { 0x05bb, 0x061b }, /* Arabic_semicolon ARABIC SEMICOLON */ 229 { 0x05bf, 0x061f }, /* Arabic_question_mark ARABIC QUESTION MARK */ 230 { 0x05c1, 0x0621 }, /* Arabic_hamza ARABIC LETTER HAMZA */ 231 { 0x05c2, 0x0622 }, /* Arabic_maddaonalef ARABIC LETTER ALEF WITH MADDA ABOVE */ 232 { 0x05c3, 0x0623 }, /* Arabic_hamzaonalef ARABIC LETTER ALEF WITH HAMZA ABOVE */ 233 { 0x05c4, 0x0624 }, /* Arabic_hamzaonwaw ARABIC LETTER WAW WITH HAMZA ABOVE */ 234 { 0x05c5, 0x0625 }, /* Arabic_hamzaunderalef ARABIC LETTER ALEF WITH HAMZA BELOW */ 235 { 0x05c6, 0x0626 }, /* Arabic_hamzaonyeh ARABIC LETTER YEH WITH HAMZA ABOVE */ 236 { 0x05c7, 0x0627 }, /* Arabic_alef ARABIC LETTER ALEF */ 237 { 0x05c8, 0x0628 }, /* Arabic_beh ARABIC LETTER BEH */ 238 { 0x05c9, 0x0629 }, /* Arabic_tehmarbuta ARABIC LETTER TEH MARBUTA */ 239 { 0x05ca, 0x062a }, /* Arabic_teh ARABIC LETTER TEH */ 240 { 0x05cb, 0x062b }, /* Arabic_theh ARABIC LETTER THEH */ 241 { 0x05cc, 0x062c }, /* Arabic_jeem ARABIC LETTER JEEM */ 242 { 0x05cd, 0x062d }, /* Arabic_hah ARABIC LETTER HAH */ 243 { 0x05ce, 0x062e }, /* Arabic_khah ARABIC LETTER KHAH */ 244 { 0x05cf, 0x062f }, /* Arabic_dal ARABIC LETTER DAL */ 245 { 0x05d0, 0x0630 }, /* Arabic_thal ARABIC LETTER THAL */ 246 { 0x05d1, 0x0631 }, /* Arabic_ra ARABIC LETTER REH */ 247 { 0x05d2, 0x0632 }, /* Arabic_zain ARABIC LETTER ZAIN */ 248 { 0x05d3, 0x0633 }, /* Arabic_seen ARABIC LETTER SEEN */ 249 { 0x05d4, 0x0634 }, /* Arabic_sheen ARABIC LETTER SHEEN */ 250 { 0x05d5, 0x0635 }, /* Arabic_sad ARABIC LETTER SAD */ 251 { 0x05d6, 0x0636 }, /* Arabic_dad ARABIC LETTER DAD */ 252 { 0x05d7, 0x0637 }, /* Arabic_tah ARABIC LETTER TAH */ 253 { 0x05d8, 0x0638 }, /* Arabic_zah ARABIC LETTER ZAH */ 254 { 0x05d9, 0x0639 }, /* Arabic_ain ARABIC LETTER AIN */ 255 { 0x05da, 0x063a }, /* Arabic_ghain ARABIC LETTER GHAIN */ 256 { 0x05e0, 0x0640 }, /* Arabic_tatweel ARABIC TATWEEL */ 257 { 0x05e1, 0x0641 }, /* Arabic_feh ARABIC LETTER FEH */ 258 { 0x05e2, 0x0642 }, /* Arabic_qaf ARABIC LETTER QAF */ 259 { 0x05e3, 0x0643 }, /* Arabic_kaf ARABIC LETTER KAF */ 260 { 0x05e4, 0x0644 }, /* Arabic_lam ARABIC LETTER LAM */ 261 { 0x05e5, 0x0645 }, /* Arabic_meem ARABIC LETTER MEEM */ 262 { 0x05e6, 0x0646 }, /* Arabic_noon ARABIC LETTER NOON */ 263 { 0x05e7, 0x0647 }, /* Arabic_ha ARABIC LETTER HEH */ 264 { 0x05e8, 0x0648 }, /* Arabic_waw ARABIC LETTER WAW */ 265 { 0x05e9, 0x0649 }, /* Arabic_alefmaksura ARABIC LETTER ALEF MAKSURA */ 266 { 0x05ea, 0x064a }, /* Arabic_yeh ARABIC LETTER YEH */ 267 { 0x05eb, 0x064b }, /* Arabic_fathatan ARABIC FATHATAN */ 268 { 0x05ec, 0x064c }, /* Arabic_dammatan ARABIC DAMMATAN */ 269 { 0x05ed, 0x064d }, /* Arabic_kasratan ARABIC KASRATAN */ 270 { 0x05ee, 0x064e }, /* Arabic_fatha ARABIC FATHA */ 271 { 0x05ef, 0x064f }, /* Arabic_damma ARABIC DAMMA */ 272 { 0x05f0, 0x0650 }, /* Arabic_kasra ARABIC KASRA */ 273 { 0x05f1, 0x0651 }, /* Arabic_shadda ARABIC SHADDA */ 274 { 0x05f2, 0x0652 }, /* Arabic_sukun ARABIC SUKUN */ 275 { 0x06a1, 0x0452 }, /* Serbian_dje CYRILLIC SMALL LETTER DJE */ 276 { 0x06a2, 0x0453 }, /* Macedonia_gje CYRILLIC SMALL LETTER GJE */ 277 { 0x06a3, 0x0451 }, /* Cyrillic_io CYRILLIC SMALL LETTER IO */ 278 { 0x06a4, 0x0454 }, /* Ukrainian_ie CYRILLIC SMALL LETTER UKRAINIAN IE */ 279 { 0x06a5, 0x0455 }, /* Macedonia_dse CYRILLIC SMALL LETTER DZE */ 280 { 0x06a6, 0x0456 }, /* Ukrainian_i CYRILLIC SMALL LETTER BYELORUSSIAN-UKRAINIAN I */ 281 { 0x06a7, 0x0457 }, /* Ukrainian_yi CYRILLIC SMALL LETTER YI */ 282 { 0x06a8, 0x0458 }, /* Cyrillic_je CYRILLIC SMALL LETTER JE */ 283 { 0x06a9, 0x0459 }, /* Cyrillic_lje CYRILLIC SMALL LETTER LJE */ 284 { 0x06aa, 0x045a }, /* Cyrillic_nje CYRILLIC SMALL LETTER NJE */ 285 { 0x06ab, 0x045b }, /* Serbian_tshe CYRILLIC SMALL LETTER TSHE */ 286 { 0x06ac, 0x045c }, /* Macedonia_kje CYRILLIC SMALL LETTER KJE */ 287 { 0x06ad, 0x0491 }, /* Ukrainian_ghe_with_upturn CYRILLIC SMALL LETTER GHE WITH UPTURN */ 288 { 0x06ae, 0x045e }, /* Byelorussian_shortu CYRILLIC SMALL LETTER SHORT U */ 289 { 0x06af, 0x045f }, /* Cyrillic_dzhe CYRILLIC SMALL LETTER DZHE */ 290 { 0x06b0, 0x2116 }, /* numerosign NUMERO SIGN */ 291 { 0x06b1, 0x0402 }, /* Serbian_DJE CYRILLIC CAPITAL LETTER DJE */ 292 { 0x06b2, 0x0403 }, /* Macedonia_GJE CYRILLIC CAPITAL LETTER GJE */ 293 { 0x06b3, 0x0401 }, /* Cyrillic_IO CYRILLIC CAPITAL LETTER IO */ 294 { 0x06b4, 0x0404 }, /* Ukrainian_IE CYRILLIC CAPITAL LETTER UKRAINIAN IE */ 295 { 0x06b5, 0x0405 }, /* Macedonia_DSE CYRILLIC CAPITAL LETTER DZE */ 296 { 0x06b6, 0x0406 }, /* Ukrainian_I CYRILLIC CAPITAL LETTER BYELORUSSIAN-UKRAINIAN I */ 297 { 0x06b7, 0x0407 }, /* Ukrainian_YI CYRILLIC CAPITAL LETTER YI */ 298 { 0x06b8, 0x0408 }, /* Cyrillic_JE CYRILLIC CAPITAL LETTER JE */ 299 { 0x06b9, 0x0409 }, /* Cyrillic_LJE CYRILLIC CAPITAL LETTER LJE */ 300 { 0x06ba, 0x040a }, /* Cyrillic_NJE CYRILLIC CAPITAL LETTER NJE */ 301 { 0x06bb, 0x040b }, /* Serbian_TSHE CYRILLIC CAPITAL LETTER TSHE */ 302 { 0x06bc, 0x040c }, /* Macedonia_KJE CYRILLIC CAPITAL LETTER KJE */ 303 { 0x06bd, 0x0490 }, /* Ukrainian_GHE_WITH_UPTURN CYRILLIC CAPITAL LETTER GHE WITH UPTURN */ 304 { 0x06be, 0x040e }, /* Byelorussian_SHORTU CYRILLIC CAPITAL LETTER SHORT U */ 305 { 0x06bf, 0x040f }, /* Cyrillic_DZHE CYRILLIC CAPITAL LETTER DZHE */ 306 { 0x06c0, 0x044e }, /* Cyrillic_yu CYRILLIC SMALL LETTER YU */ 307 { 0x06c1, 0x0430 }, /* Cyrillic_a CYRILLIC SMALL LETTER A */ 308 { 0x06c2, 0x0431 }, /* Cyrillic_be CYRILLIC SMALL LETTER BE */ 309 { 0x06c3, 0x0446 }, /* Cyrillic_tse CYRILLIC SMALL LETTER TSE */ 310 { 0x06c4, 0x0434 }, /* Cyrillic_de CYRILLIC SMALL LETTER DE */ 311 { 0x06c5, 0x0435 }, /* Cyrillic_ie CYRILLIC SMALL LETTER IE */ 312 { 0x06c6, 0x0444 }, /* Cyrillic_ef CYRILLIC SMALL LETTER EF */ 313 { 0x06c7, 0x0433 }, /* Cyrillic_ghe CYRILLIC SMALL LETTER GHE */ 314 { 0x06c8, 0x0445 }, /* Cyrillic_ha CYRILLIC SMALL LETTER HA */ 315 { 0x06c9, 0x0438 }, /* Cyrillic_i CYRILLIC SMALL LETTER I */ 316 { 0x06ca, 0x0439 }, /* Cyrillic_shorti CYRILLIC SMALL LETTER SHORT I */ 317 { 0x06cb, 0x043a }, /* Cyrillic_ka CYRILLIC SMALL LETTER KA */ 318 { 0x06cc, 0x043b }, /* Cyrillic_el CYRILLIC SMALL LETTER EL */ 319 { 0x06cd, 0x043c }, /* Cyrillic_em CYRILLIC SMALL LETTER EM */ 320 { 0x06ce, 0x043d }, /* Cyrillic_en CYRILLIC SMALL LETTER EN */ 321 { 0x06cf, 0x043e }, /* Cyrillic_o CYRILLIC SMALL LETTER O */ 322 { 0x06d0, 0x043f }, /* Cyrillic_pe CYRILLIC SMALL LETTER PE */ 323 { 0x06d1, 0x044f }, /* Cyrillic_ya CYRILLIC SMALL LETTER YA */ 324 { 0x06d2, 0x0440 }, /* Cyrillic_er CYRILLIC SMALL LETTER ER */ 325 { 0x06d3, 0x0441 }, /* Cyrillic_es CYRILLIC SMALL LETTER ES */ 326 { 0x06d4, 0x0442 }, /* Cyrillic_te CYRILLIC SMALL LETTER TE */ 327 { 0x06d5, 0x0443 }, /* Cyrillic_u CYRILLIC SMALL LETTER U */ 328 { 0x06d6, 0x0436 }, /* Cyrillic_zhe CYRILLIC SMALL LETTER ZHE */ 329 { 0x06d7, 0x0432 }, /* Cyrillic_ve CYRILLIC SMALL LETTER VE */ 330 { 0x06d8, 0x044c }, /* Cyrillic_softsign CYRILLIC SMALL LETTER SOFT SIGN */ 331 { 0x06d9, 0x044b }, /* Cyrillic_yeru CYRILLIC SMALL LETTER YERU */ 332 { 0x06da, 0x0437 }, /* Cyrillic_ze CYRILLIC SMALL LETTER ZE */ 333 { 0x06db, 0x0448 }, /* Cyrillic_sha CYRILLIC SMALL LETTER SHA */ 334 { 0x06dc, 0x044d }, /* Cyrillic_e CYRILLIC SMALL LETTER E */ 335 { 0x06dd, 0x0449 }, /* Cyrillic_shcha CYRILLIC SMALL LETTER SHCHA */ 336 { 0x06de, 0x0447 }, /* Cyrillic_che CYRILLIC SMALL LETTER CHE */ 337 { 0x06df, 0x044a }, /* Cyrillic_hardsign CYRILLIC SMALL LETTER HARD SIGN */ 338 { 0x06e0, 0x042e }, /* Cyrillic_YU CYRILLIC CAPITAL LETTER YU */ 339 { 0x06e1, 0x0410 }, /* Cyrillic_A CYRILLIC CAPITAL LETTER A */ 340 { 0x06e2, 0x0411 }, /* Cyrillic_BE CYRILLIC CAPITAL LETTER BE */ 341 { 0x06e3, 0x0426 }, /* Cyrillic_TSE CYRILLIC CAPITAL LETTER TSE */ 342 { 0x06e4, 0x0414 }, /* Cyrillic_DE CYRILLIC CAPITAL LETTER DE */ 343 { 0x06e5, 0x0415 }, /* Cyrillic_IE CYRILLIC CAPITAL LETTER IE */ 344 { 0x06e6, 0x0424 }, /* Cyrillic_EF CYRILLIC CAPITAL LETTER EF */ 345 { 0x06e7, 0x0413 }, /* Cyrillic_GHE CYRILLIC CAPITAL LETTER GHE */ 346 { 0x06e8, 0x0425 }, /* Cyrillic_HA CYRILLIC CAPITAL LETTER HA */ 347 { 0x06e9, 0x0418 }, /* Cyrillic_I CYRILLIC CAPITAL LETTER I */ 348 { 0x06ea, 0x0419 }, /* Cyrillic_SHORTI CYRILLIC CAPITAL LETTER SHORT I */ 349 { 0x06eb, 0x041a }, /* Cyrillic_KA CYRILLIC CAPITAL LETTER KA */ 350 { 0x06ec, 0x041b }, /* Cyrillic_EL CYRILLIC CAPITAL LETTER EL */ 351 { 0x06ed, 0x041c }, /* Cyrillic_EM CYRILLIC CAPITAL LETTER EM */ 352 { 0x06ee, 0x041d }, /* Cyrillic_EN CYRILLIC CAPITAL LETTER EN */ 353 { 0x06ef, 0x041e }, /* Cyrillic_O CYRILLIC CAPITAL LETTER O */ 354 { 0x06f0, 0x041f }, /* Cyrillic_PE CYRILLIC CAPITAL LETTER PE */ 355 { 0x06f1, 0x042f }, /* Cyrillic_YA CYRILLIC CAPITAL LETTER YA */ 356 { 0x06f2, 0x0420 }, /* Cyrillic_ER CYRILLIC CAPITAL LETTER ER */ 357 { 0x06f3, 0x0421 }, /* Cyrillic_ES CYRILLIC CAPITAL LETTER ES */ 358 { 0x06f4, 0x0422 }, /* Cyrillic_TE CYRILLIC CAPITAL LETTER TE */ 359 { 0x06f5, 0x0423 }, /* Cyrillic_U CYRILLIC CAPITAL LETTER U */ 360 { 0x06f6, 0x0416 }, /* Cyrillic_ZHE CYRILLIC CAPITAL LETTER ZHE */ 361 { 0x06f7, 0x0412 }, /* Cyrillic_VE CYRILLIC CAPITAL LETTER VE */ 362 { 0x06f8, 0x042c }, /* Cyrillic_SOFTSIGN CYRILLIC CAPITAL LETTER SOFT SIGN */ 363 { 0x06f9, 0x042b }, /* Cyrillic_YERU CYRILLIC CAPITAL LETTER YERU */ 364 { 0x06fa, 0x0417 }, /* Cyrillic_ZE CYRILLIC CAPITAL LETTER ZE */ 365 { 0x06fb, 0x0428 }, /* Cyrillic_SHA CYRILLIC CAPITAL LETTER SHA */ 366 { 0x06fc, 0x042d }, /* Cyrillic_E CYRILLIC CAPITAL LETTER E */ 367 { 0x06fd, 0x0429 }, /* Cyrillic_SHCHA CYRILLIC CAPITAL LETTER SHCHA */ 368 { 0x06fe, 0x0427 }, /* Cyrillic_CHE CYRILLIC CAPITAL LETTER CHE */ 369 { 0x06ff, 0x042a }, /* Cyrillic_HARDSIGN CYRILLIC CAPITAL LETTER HARD SIGN */ 370 { 0x07a1, 0x0386 }, /* Greek_ALPHAaccent GREEK CAPITAL LETTER ALPHA WITH TONOS */ 371 { 0x07a2, 0x0388 }, /* Greek_EPSILONaccent GREEK CAPITAL LETTER EPSILON WITH TONOS */ 372 { 0x07a3, 0x0389 }, /* Greek_ETAaccent GREEK CAPITAL LETTER ETA WITH TONOS */ 373 { 0x07a4, 0x038a }, /* Greek_IOTAaccent GREEK CAPITAL LETTER IOTA WITH TONOS */ 374 { 0x07a5, 0x03aa }, /* Greek_IOTAdiaeresis GREEK CAPITAL LETTER IOTA WITH DIALYTIKA */ 375 { 0x07a7, 0x038c }, /* Greek_OMICRONaccent GREEK CAPITAL LETTER OMICRON WITH TONOS */ 376 { 0x07a8, 0x038e }, /* Greek_UPSILONaccent GREEK CAPITAL LETTER UPSILON WITH TONOS */ 377 { 0x07a9, 0x03ab }, /* Greek_UPSILONdieresis GREEK CAPITAL LETTER UPSILON WITH DIALYTIKA */ 378 { 0x07ab, 0x038f }, /* Greek_OMEGAaccent GREEK CAPITAL LETTER OMEGA WITH TONOS */ 379 { 0x07ae, 0x0385 }, /* Greek_accentdieresis GREEK DIALYTIKA TONOS */ 380 { 0x07af, 0x2015 }, /* Greek_horizbar HORIZONTAL BAR */ 381 { 0x07b1, 0x03ac }, /* Greek_alphaaccent GREEK SMALL LETTER ALPHA WITH TONOS */ 382 { 0x07b2, 0x03ad }, /* Greek_epsilonaccent GREEK SMALL LETTER EPSILON WITH TONOS */ 383 { 0x07b3, 0x03ae }, /* Greek_etaaccent GREEK SMALL LETTER ETA WITH TONOS */ 384 { 0x07b4, 0x03af }, /* Greek_iotaaccent GREEK SMALL LETTER IOTA WITH TONOS */ 385 { 0x07b5, 0x03ca }, /* Greek_iotadieresis GREEK SMALL LETTER IOTA WITH DIALYTIKA */ 386 { 0x07b6, 0x0390 }, /* Greek_iotaaccentdieresis GREEK SMALL LETTER IOTA WITH DIALYTIKA AND TONOS */ 387 { 0x07b7, 0x03cc }, /* Greek_omicronaccent GREEK SMALL LETTER OMICRON WITH TONOS */ 388 { 0x07b8, 0x03cd }, /* Greek_upsilonaccent GREEK SMALL LETTER UPSILON WITH TONOS */ 389 { 0x07b9, 0x03cb }, /* Greek_upsilondieresis GREEK SMALL LETTER UPSILON WITH DIALYTIKA */ 390 { 0x07ba, 0x03b0 }, /* Greek_upsilonaccentdieresis GREEK SMALL LETTER UPSILON WITH DIALYTIKA AND TONOS */ 391 { 0x07bb, 0x03ce }, /* Greek_omegaaccent GREEK SMALL LETTER OMEGA WITH TONOS */ 392 { 0x07c1, 0x0391 }, /* Greek_ALPHA GREEK CAPITAL LETTER ALPHA */ 393 { 0x07c2, 0x0392 }, /* Greek_BETA GREEK CAPITAL LETTER BETA */ 394 { 0x07c3, 0x0393 }, /* Greek_GAMMA GREEK CAPITAL LETTER GAMMA */ 395 { 0x07c4, 0x0394 }, /* Greek_DELTA GREEK CAPITAL LETTER DELTA */ 396 { 0x07c5, 0x0395 }, /* Greek_EPSILON GREEK CAPITAL LETTER EPSILON */ 397 { 0x07c6, 0x0396 }, /* Greek_ZETA GREEK CAPITAL LETTER ZETA */ 398 { 0x07c7, 0x0397 }, /* Greek_ETA GREEK CAPITAL LETTER ETA */ 399 { 0x07c8, 0x0398 }, /* Greek_THETA GREEK CAPITAL LETTER THETA */ 400 { 0x07c9, 0x0399 }, /* Greek_IOTA GREEK CAPITAL LETTER IOTA */ 401 { 0x07ca, 0x039a }, /* Greek_KAPPA GREEK CAPITAL LETTER KAPPA */ 402 { 0x07cb, 0x039b }, /* Greek_LAMBDA GREEK CAPITAL LETTER LAMDA */ 403 { 0x07cc, 0x039c }, /* Greek_MU GREEK CAPITAL LETTER MU */ 404 { 0x07cd, 0x039d }, /* Greek_NU GREEK CAPITAL LETTER NU */ 405 { 0x07ce, 0x039e }, /* Greek_XI GREEK CAPITAL LETTER XI */ 406 { 0x07cf, 0x039f }, /* Greek_OMICRON GREEK CAPITAL LETTER OMICRON */ 407 { 0x07d0, 0x03a0 }, /* Greek_PI GREEK CAPITAL LETTER PI */ 408 { 0x07d1, 0x03a1 }, /* Greek_RHO GREEK CAPITAL LETTER RHO */ 409 { 0x07d2, 0x03a3 }, /* Greek_SIGMA GREEK CAPITAL LETTER SIGMA */ 410 { 0x07d4, 0x03a4 }, /* Greek_TAU GREEK CAPITAL LETTER TAU */ 411 { 0x07d5, 0x03a5 }, /* Greek_UPSILON GREEK CAPITAL LETTER UPSILON */ 412 { 0x07d6, 0x03a6 }, /* Greek_PHI GREEK CAPITAL LETTER PHI */ 413 { 0x07d7, 0x03a7 }, /* Greek_CHI GREEK CAPITAL LETTER CHI */ 414 { 0x07d8, 0x03a8 }, /* Greek_PSI GREEK CAPITAL LETTER PSI */ 415 { 0x07d9, 0x03a9 }, /* Greek_OMEGA GREEK CAPITAL LETTER OMEGA */ 416 { 0x07e1, 0x03b1 }, /* Greek_alpha GREEK SMALL LETTER ALPHA */ 417 { 0x07e2, 0x03b2 }, /* Greek_beta GREEK SMALL LETTER BETA */ 418 { 0x07e3, 0x03b3 }, /* Greek_gamma GREEK SMALL LETTER GAMMA */ 419 { 0x07e4, 0x03b4 }, /* Greek_delta GREEK SMALL LETTER DELTA */ 420 { 0x07e5, 0x03b5 }, /* Greek_epsilon GREEK SMALL LETTER EPSILON */ 421 { 0x07e6, 0x03b6 }, /* Greek_zeta GREEK SMALL LETTER ZETA */ 422 { 0x07e7, 0x03b7 }, /* Greek_eta GREEK SMALL LETTER ETA */ 423 { 0x07e8, 0x03b8 }, /* Greek_theta GREEK SMALL LETTER THETA */ 424 { 0x07e9, 0x03b9 }, /* Greek_iota GREEK SMALL LETTER IOTA */ 425 { 0x07ea, 0x03ba }, /* Greek_kappa GREEK SMALL LETTER KAPPA */ 426 { 0x07eb, 0x03bb }, /* Greek_lambda GREEK SMALL LETTER LAMDA */ 427 { 0x07ec, 0x03bc }, /* Greek_mu GREEK SMALL LETTER MU */ 428 { 0x07ed, 0x03bd }, /* Greek_nu GREEK SMALL LETTER NU */ 429 { 0x07ee, 0x03be }, /* Greek_xi GREEK SMALL LETTER XI */ 430 { 0x07ef, 0x03bf }, /* Greek_omicron GREEK SMALL LETTER OMICRON */ 431 { 0x07f0, 0x03c0 }, /* Greek_pi GREEK SMALL LETTER PI */ 432 { 0x07f1, 0x03c1 }, /* Greek_rho GREEK SMALL LETTER RHO */ 433 { 0x07f2, 0x03c3 }, /* Greek_sigma GREEK SMALL LETTER SIGMA */ 434 { 0x07f3, 0x03c2 }, /* Greek_finalsmallsigma GREEK SMALL LETTER FINAL SIGMA */ 435 { 0x07f4, 0x03c4 }, /* Greek_tau GREEK SMALL LETTER TAU */ 436 { 0x07f5, 0x03c5 }, /* Greek_upsilon GREEK SMALL LETTER UPSILON */ 437 { 0x07f6, 0x03c6 }, /* Greek_phi GREEK SMALL LETTER PHI */ 438 { 0x07f7, 0x03c7 }, /* Greek_chi GREEK SMALL LETTER CHI */ 439 { 0x07f8, 0x03c8 }, /* Greek_psi GREEK SMALL LETTER PSI */ 440 { 0x07f9, 0x03c9 }, /* Greek_omega GREEK SMALL LETTER OMEGA */ 441 { 0x08a1, 0x23b7 }, /* leftradical ??? */ 442 { 0x08a2, 0x250c }, /* topleftradical BOX DRAWINGS LIGHT DOWN AND RIGHT */ 443 { 0x08a3, 0x2500 }, /* horizconnector BOX DRAWINGS LIGHT HORIZONTAL */ 444 { 0x08a4, 0x2320 }, /* topintegral TOP HALF INTEGRAL */ 445 { 0x08a5, 0x2321 }, /* botintegral BOTTOM HALF INTEGRAL */ 446 { 0x08a6, 0x2502 }, /* vertconnector BOX DRAWINGS LIGHT VERTICAL */ 447 { 0x08a7, 0x23a1 }, /* topleftsqbracket ??? */ 448 { 0x08a8, 0x23a3 }, /* botleftsqbracket ??? */ 449 { 0x08a9, 0x23a4 }, /* toprightsqbracket ??? */ 450 { 0x08aa, 0x23a6 }, /* botrightsqbracket ??? */ 451 { 0x08ab, 0x239b }, /* topleftparens ??? */ 452 { 0x08ac, 0x239d }, /* botleftparens ??? */ 453 { 0x08ad, 0x239e }, /* toprightparens ??? */ 454 { 0x08ae, 0x23a0 }, /* botrightparens ??? */ 455 { 0x08af, 0x23a8 }, /* leftmiddlecurlybrace ??? */ 456 { 0x08b0, 0x23ac }, /* rightmiddlecurlybrace ??? */ 457 /* 0x08b1 topleftsummation ? ??? */ 458 /* 0x08b2 botleftsummation ? ??? */ 459 /* 0x08b3 topvertsummationconnector ? ??? */ 460 /* 0x08b4 botvertsummationconnector ? ??? */ 461 /* 0x08b5 toprightsummation ? ??? */ 462 /* 0x08b6 botrightsummation ? ??? */ 463 /* 0x08b7 rightmiddlesummation ? ??? */ 464 { 0x08bc, 0x2264 }, /* lessthanequal LESS-THAN OR EQUAL TO */ 465 { 0x08bd, 0x2260 }, /* notequal NOT EQUAL TO */ 466 { 0x08be, 0x2265 }, /* greaterthanequal GREATER-THAN OR EQUAL TO */ 467 { 0x08bf, 0x222b }, /* integral INTEGRAL */ 468 { 0x08c0, 0x2234 }, /* therefore THEREFORE */ 469 { 0x08c1, 0x221d }, /* variation PROPORTIONAL TO */ 470 { 0x08c2, 0x221e }, /* infinity INFINITY */ 471 { 0x08c5, 0x2207 }, /* nabla NABLA */ 472 { 0x08c8, 0x223c }, /* approximate TILDE OPERATOR */ 473 { 0x08c9, 0x2243 }, /* similarequal ASYMPTOTICALLY EQUAL TO */ 474 { 0x08cd, 0x21d4 }, /* ifonlyif LEFT RIGHT DOUBLE ARROW */ 475 { 0x08ce, 0x21d2 }, /* implies RIGHTWARDS DOUBLE ARROW */ 476 { 0x08cf, 0x2261 }, /* identical IDENTICAL TO */ 477 { 0x08d6, 0x221a }, /* radical SQUARE ROOT */ 478 { 0x08da, 0x2282 }, /* includedin SUBSET OF */ 479 { 0x08db, 0x2283 }, /* includes SUPERSET OF */ 480 { 0x08dc, 0x2229 }, /* intersection INTERSECTION */ 481 { 0x08dd, 0x222a }, /* union UNION */ 482 { 0x08de, 0x2227 }, /* logicaland LOGICAL AND */ 483 { 0x08df, 0x2228 }, /* logicalor LOGICAL OR */ 484 { 0x08ef, 0x2202 }, /* partialderivative PARTIAL DIFFERENTIAL */ 485 { 0x08f6, 0x0192 }, /* function LATIN SMALL LETTER F WITH HOOK */ 486 { 0x08fb, 0x2190 }, /* leftarrow LEFTWARDS ARROW */ 487 { 0x08fc, 0x2191 }, /* uparrow UPWARDS ARROW */ 488 { 0x08fd, 0x2192 }, /* rightarrow RIGHTWARDS ARROW */ 489 { 0x08fe, 0x2193 }, /* downarrow DOWNWARDS ARROW */ 490 /* 0x09df blank ? ??? */ 491 { 0x09e0, 0x25c6 }, /* soliddiamond BLACK DIAMOND */ 492 { 0x09e1, 0x2592 }, /* checkerboard MEDIUM SHADE */ 493 { 0x09e2, 0x2409 }, /* ht SYMBOL FOR HORIZONTAL TABULATION */ 494 { 0x09e3, 0x240c }, /* ff SYMBOL FOR FORM FEED */ 495 { 0x09e4, 0x240d }, /* cr SYMBOL FOR CARRIAGE RETURN */ 496 { 0x09e5, 0x240a }, /* lf SYMBOL FOR LINE FEED */ 497 { 0x09e8, 0x2424 }, /* nl SYMBOL FOR NEWLINE */ 498 { 0x09e9, 0x240b }, /* vt SYMBOL FOR VERTICAL TABULATION */ 499 { 0x09ea, 0x2518 }, /* lowrightcorner BOX DRAWINGS LIGHT UP AND LEFT */ 500 { 0x09eb, 0x2510 }, /* uprightcorner BOX DRAWINGS LIGHT DOWN AND LEFT */ 501 { 0x09ec, 0x250c }, /* upleftcorner BOX DRAWINGS LIGHT DOWN AND RIGHT */ 502 { 0x09ed, 0x2514 }, /* lowleftcorner BOX DRAWINGS LIGHT UP AND RIGHT */ 503 { 0x09ee, 0x253c }, /* crossinglines BOX DRAWINGS LIGHT VERTICAL AND HORIZONTAL */ 504 { 0x09ef, 0x23ba }, /* horizlinescan1 HORIZONTAL SCAN LINE-1 (Unicode 3.2 draft) */ 505 { 0x09f0, 0x23bb }, /* horizlinescan3 HORIZONTAL SCAN LINE-3 (Unicode 3.2 draft) */ 506 { 0x09f1, 0x2500 }, /* horizlinescan5 BOX DRAWINGS LIGHT HORIZONTAL */ 507 { 0x09f2, 0x23bc }, /* horizlinescan7 HORIZONTAL SCAN LINE-7 (Unicode 3.2 draft) */ 508 { 0x09f3, 0x23bd }, /* horizlinescan9 HORIZONTAL SCAN LINE-9 (Unicode 3.2 draft) */ 509 { 0x09f4, 0x251c }, /* leftt BOX DRAWINGS LIGHT VERTICAL AND RIGHT */ 510 { 0x09f5, 0x2524 }, /* rightt BOX DRAWINGS LIGHT VERTICAL AND LEFT */ 511 { 0x09f6, 0x2534 }, /* bott BOX DRAWINGS LIGHT UP AND HORIZONTAL */ 512 { 0x09f7, 0x252c }, /* topt BOX DRAWINGS LIGHT DOWN AND HORIZONTAL */ 513 { 0x09f8, 0x2502 }, /* vertbar BOX DRAWINGS LIGHT VERTICAL */ 514 { 0x0aa1, 0x2003 }, /* emspace EM SPACE */ 515 { 0x0aa2, 0x2002 }, /* enspace EN SPACE */ 516 { 0x0aa3, 0x2004 }, /* em3space THREE-PER-EM SPACE */ 517 { 0x0aa4, 0x2005 }, /* em4space FOUR-PER-EM SPACE */ 518 { 0x0aa5, 0x2007 }, /* digitspace FIGURE SPACE */ 519 { 0x0aa6, 0x2008 }, /* punctspace PUNCTUATION SPACE */ 520 { 0x0aa7, 0x2009 }, /* thinspace THIN SPACE */ 521 { 0x0aa8, 0x200a }, /* hairspace HAIR SPACE */ 522 { 0x0aa9, 0x2014 }, /* emdash EM DASH */ 523 { 0x0aaa, 0x2013 }, /* endash EN DASH */ 524 /* 0x0aac signifblank ? ??? */ 525 { 0x0aae, 0x2026 }, /* ellipsis HORIZONTAL ELLIPSIS */ 526 { 0x0aaf, 0x2025 }, /* doubbaselinedot TWO DOT LEADER */ 527 { 0x0ab0, 0x2153 }, /* onethird VULGAR FRACTION ONE THIRD */ 528 { 0x0ab1, 0x2154 }, /* twothirds VULGAR FRACTION TWO THIRDS */ 529 { 0x0ab2, 0x2155 }, /* onefifth VULGAR FRACTION ONE FIFTH */ 530 { 0x0ab3, 0x2156 }, /* twofifths VULGAR FRACTION TWO FIFTHS */ 531 { 0x0ab4, 0x2157 }, /* threefifths VULGAR FRACTION THREE FIFTHS */ 532 { 0x0ab5, 0x2158 }, /* fourfifths VULGAR FRACTION FOUR FIFTHS */ 533 { 0x0ab6, 0x2159 }, /* onesixth VULGAR FRACTION ONE SIXTH */ 534 { 0x0ab7, 0x215a }, /* fivesixths VULGAR FRACTION FIVE SIXTHS */ 535 { 0x0ab8, 0x2105 }, /* careof CARE OF */ 536 { 0x0abb, 0x2012 }, /* figdash FIGURE DASH */ 537 { 0x0abc, 0x2329 }, /* leftanglebracket LEFT-POINTING ANGLE BRACKET */ 538 { 0x0abd, 0x002e }, /* decimalpoint . FULL STOP */ 539 { 0x0abe, 0x232a }, /* rightanglebracket RIGHT-POINTING ANGLE BRACKET */ 540 /* 0x0abf marker ? ??? */ 541 { 0x0ac3, 0x215b }, /* oneeighth VULGAR FRACTION ONE EIGHTH */ 542 { 0x0ac4, 0x215c }, /* threeeighths VULGAR FRACTION THREE EIGHTHS */ 543 { 0x0ac5, 0x215d }, /* fiveeighths VULGAR FRACTION FIVE EIGHTHS */ 544 { 0x0ac6, 0x215e }, /* seveneighths VULGAR FRACTION SEVEN EIGHTHS */ 545 { 0x0ac9, 0x2122 }, /* trademark TRADE MARK SIGN */ 546 { 0x0aca, 0x2613 }, /* signaturemark SALTIRE */ 547 /* 0x0acb trademarkincircle ? ??? */ 548 { 0x0acc, 0x25c1 }, /* leftopentriangle WHITE LEFT-POINTING TRIANGLE */ 549 { 0x0acd, 0x25b7 }, /* rightopentriangle WHITE RIGHT-POINTING TRIANGLE */ 550 { 0x0ace, 0x25cb }, /* emopencircle WHITE CIRCLE */ 551 { 0x0acf, 0x25af }, /* emopenrectangle WHITE VERTICAL RECTANGLE */ 552 { 0x0ad0, 0x2018 }, /* leftsinglequotemark LEFT SINGLE QUOTATION MARK */ 553 { 0x0ad1, 0x2019 }, /* rightsinglequotemark RIGHT SINGLE QUOTATION MARK */ 554 { 0x0ad2, 0x201c }, /* leftdoublequotemark LEFT DOUBLE QUOTATION MARK */ 555 { 0x0ad3, 0x201d }, /* rightdoublequotemark RIGHT DOUBLE QUOTATION MARK */ 556 { 0x0ad4, 0x211e }, /* prescription PRESCRIPTION TAKE */ 557 { 0x0ad6, 0x2032 }, /* minutes PRIME */ 558 { 0x0ad7, 0x2033 }, /* seconds DOUBLE PRIME */ 559 { 0x0ad9, 0x271d }, /* latincross LATIN CROSS */ 560 /* 0x0ada hexagram ? ??? */ 561 { 0x0adb, 0x25ac }, /* filledrectbullet BLACK RECTANGLE */ 562 { 0x0adc, 0x25c0 }, /* filledlefttribullet BLACK LEFT-POINTING TRIANGLE */ 563 { 0x0add, 0x25b6 }, /* filledrighttribullet BLACK RIGHT-POINTING TRIANGLE */ 564 { 0x0ade, 0x25cf }, /* emfilledcircle BLACK CIRCLE */ 565 { 0x0adf, 0x25ae }, /* emfilledrect BLACK VERTICAL RECTANGLE */ 566 { 0x0ae0, 0x25e6 }, /* enopencircbullet WHITE BULLET */ 567 { 0x0ae1, 0x25ab }, /* enopensquarebullet WHITE SMALL SQUARE */ 568 { 0x0ae2, 0x25ad }, /* openrectbullet WHITE RECTANGLE */ 569 { 0x0ae3, 0x25b3 }, /* opentribulletup WHITE UP-POINTING TRIANGLE */ 570 { 0x0ae4, 0x25bd }, /* opentribulletdown WHITE DOWN-POINTING TRIANGLE */ 571 { 0x0ae5, 0x2606 }, /* openstar WHITE STAR */ 572 { 0x0ae6, 0x2022 }, /* enfilledcircbullet BULLET */ 573 { 0x0ae7, 0x25aa }, /* enfilledsqbullet BLACK SMALL SQUARE */ 574 { 0x0ae8, 0x25b2 }, /* filledtribulletup BLACK UP-POINTING TRIANGLE */ 575 { 0x0ae9, 0x25bc }, /* filledtribulletdown BLACK DOWN-POINTING TRIANGLE */ 576 { 0x0aea, 0x261c }, /* leftpointer WHITE LEFT POINTING INDEX */ 577 { 0x0aeb, 0x261e }, /* rightpointer WHITE RIGHT POINTING INDEX */ 578 { 0x0aec, 0x2663 }, /* club BLACK CLUB SUIT */ 579 { 0x0aed, 0x2666 }, /* diamond BLACK DIAMOND SUIT */ 580 { 0x0aee, 0x2665 }, /* heart BLACK HEART SUIT */ 581 { 0x0af0, 0x2720 }, /* maltesecross MALTESE CROSS */ 582 { 0x0af1, 0x2020 }, /* dagger DAGGER */ 583 { 0x0af2, 0x2021 }, /* doubledagger DOUBLE DAGGER */ 584 { 0x0af3, 0x2713 }, /* checkmark CHECK MARK */ 585 { 0x0af4, 0x2717 }, /* ballotcross BALLOT X */ 586 { 0x0af5, 0x266f }, /* musicalsharp MUSIC SHARP SIGN */ 587 { 0x0af6, 0x266d }, /* musicalflat MUSIC FLAT SIGN */ 588 { 0x0af7, 0x2642 }, /* malesymbol MALE SIGN */ 589 { 0x0af8, 0x2640 }, /* femalesymbol FEMALE SIGN */ 590 { 0x0af9, 0x260e }, /* telephone BLACK TELEPHONE */ 591 { 0x0afa, 0x2315 }, /* telephonerecorder TELEPHONE RECORDER */ 592 { 0x0afb, 0x2117 }, /* phonographcopyright SOUND RECORDING COPYRIGHT */ 593 { 0x0afc, 0x2038 }, /* caret CARET */ 594 { 0x0afd, 0x201a }, /* singlelowquotemark SINGLE LOW-9 QUOTATION MARK */ 595 { 0x0afe, 0x201e }, /* doublelowquotemark DOUBLE LOW-9 QUOTATION MARK */ 596 /* 0x0aff cursor ? ??? */ 597 { 0x0ba3, 0x003c }, /* leftcaret < LESS-THAN SIGN */ 598 { 0x0ba6, 0x003e }, /* rightcaret > GREATER-THAN SIGN */ 599 { 0x0ba8, 0x2228 }, /* downcaret LOGICAL OR */ 600 { 0x0ba9, 0x2227 }, /* upcaret LOGICAL AND */ 601 { 0x0bc0, 0x00af }, /* overbar MACRON */ 602 { 0x0bc2, 0x22a4 }, /* downtack DOWN TACK */ 603 { 0x0bc3, 0x2229 }, /* upshoe INTERSECTION */ 604 { 0x0bc4, 0x230a }, /* downstile LEFT FLOOR */ 605 { 0x0bc6, 0x005f }, /* underbar _ LOW LINE */ 606 { 0x0bca, 0x2218 }, /* jot RING OPERATOR */ 607 { 0x0bcc, 0x2395 }, /* quad APL FUNCTIONAL SYMBOL QUAD (Unicode 3.0) */ 608 { 0x0bce, 0x22a5 }, /* uptack UP TACK */ 609 { 0x0bcf, 0x25cb }, /* circle WHITE CIRCLE */ 610 { 0x0bd3, 0x2308 }, /* upstile LEFT CEILING */ 611 { 0x0bd6, 0x222a }, /* downshoe UNION */ 612 { 0x0bd8, 0x2283 }, /* rightshoe SUPERSET OF */ 613 { 0x0bda, 0x2282 }, /* leftshoe SUBSET OF */ 614 { 0x0bdc, 0x22a2 }, /* lefttack RIGHT TACK */ 615 { 0x0bfc, 0x22a3 }, /* righttack LEFT TACK */ 616 { 0x0cdf, 0x2017 }, /* hebrew_doublelowline DOUBLE LOW LINE */ 617 { 0x0ce0, 0x05d0 }, /* hebrew_aleph HEBREW LETTER ALEF */ 618 { 0x0ce1, 0x05d1 }, /* hebrew_bet HEBREW LETTER BET */ 619 { 0x0ce2, 0x05d2 }, /* hebrew_gimel HEBREW LETTER GIMEL */ 620 { 0x0ce3, 0x05d3 }, /* hebrew_dalet HEBREW LETTER DALET */ 621 { 0x0ce4, 0x05d4 }, /* hebrew_he HEBREW LETTER HE */ 622 { 0x0ce5, 0x05d5 }, /* hebrew_waw HEBREW LETTER VAV */ 623 { 0x0ce6, 0x05d6 }, /* hebrew_zain HEBREW LETTER ZAYIN */ 624 { 0x0ce7, 0x05d7 }, /* hebrew_chet HEBREW LETTER HET */ 625 { 0x0ce8, 0x05d8 }, /* hebrew_tet HEBREW LETTER TET */ 626 { 0x0ce9, 0x05d9 }, /* hebrew_yod HEBREW LETTER YOD */ 627 { 0x0cea, 0x05da }, /* hebrew_finalkaph HEBREW LETTER FINAL KAF */ 628 { 0x0ceb, 0x05db }, /* hebrew_kaph HEBREW LETTER KAF */ 629 { 0x0cec, 0x05dc }, /* hebrew_lamed HEBREW LETTER LAMED */ 630 { 0x0ced, 0x05dd }, /* hebrew_finalmem HEBREW LETTER FINAL MEM */ 631 { 0x0cee, 0x05de }, /* hebrew_mem HEBREW LETTER MEM */ 632 { 0x0cef, 0x05df }, /* hebrew_finalnun HEBREW LETTER FINAL NUN */ 633 { 0x0cf0, 0x05e0 }, /* hebrew_nun HEBREW LETTER NUN */ 634 { 0x0cf1, 0x05e1 }, /* hebrew_samech HEBREW LETTER SAMEKH */ 635 { 0x0cf2, 0x05e2 }, /* hebrew_ayin HEBREW LETTER AYIN */ 636 { 0x0cf3, 0x05e3 }, /* hebrew_finalpe HEBREW LETTER FINAL PE */ 637 { 0x0cf4, 0x05e4 }, /* hebrew_pe HEBREW LETTER PE */ 638 { 0x0cf5, 0x05e5 }, /* hebrew_finalzade HEBREW LETTER FINAL TSADI */ 639 { 0x0cf6, 0x05e6 }, /* hebrew_zade HEBREW LETTER TSADI */ 640 { 0x0cf7, 0x05e7 }, /* hebrew_qoph HEBREW LETTER QOF */ 641 { 0x0cf8, 0x05e8 }, /* hebrew_resh HEBREW LETTER RESH */ 642 { 0x0cf9, 0x05e9 }, /* hebrew_shin HEBREW LETTER SHIN */ 643 { 0x0cfa, 0x05ea }, /* hebrew_taw HEBREW LETTER TAV */ 644 { 0x0da1, 0x0e01 }, /* Thai_kokai THAI CHARACTER KO KAI */ 645 { 0x0da2, 0x0e02 }, /* Thai_khokhai THAI CHARACTER KHO KHAI */ 646 { 0x0da3, 0x0e03 }, /* Thai_khokhuat THAI CHARACTER KHO KHUAT */ 647 { 0x0da4, 0x0e04 }, /* Thai_khokhwai THAI CHARACTER KHO KHWAI */ 648 { 0x0da5, 0x0e05 }, /* Thai_khokhon THAI CHARACTER KHO KHON */ 649 { 0x0da6, 0x0e06 }, /* Thai_khorakhang THAI CHARACTER KHO RAKHANG */ 650 { 0x0da7, 0x0e07 }, /* Thai_ngongu THAI CHARACTER NGO NGU */ 651 { 0x0da8, 0x0e08 }, /* Thai_chochan THAI CHARACTER CHO CHAN */ 652 { 0x0da9, 0x0e09 }, /* Thai_choching THAI CHARACTER CHO CHING */ 653 { 0x0daa, 0x0e0a }, /* Thai_chochang THAI CHARACTER CHO CHANG */ 654 { 0x0dab, 0x0e0b }, /* Thai_soso THAI CHARACTER SO SO */ 655 { 0x0dac, 0x0e0c }, /* Thai_chochoe THAI CHARACTER CHO CHOE */ 656 { 0x0dad, 0x0e0d }, /* Thai_yoying THAI CHARACTER YO YING */ 657 { 0x0dae, 0x0e0e }, /* Thai_dochada THAI CHARACTER DO CHADA */ 658 { 0x0daf, 0x0e0f }, /* Thai_topatak THAI CHARACTER TO PATAK */ 659 { 0x0db0, 0x0e10 }, /* Thai_thothan THAI CHARACTER THO THAN */ 660 { 0x0db1, 0x0e11 }, /* Thai_thonangmontho THAI CHARACTER THO NANGMONTHO */ 661 { 0x0db2, 0x0e12 }, /* Thai_thophuthao THAI CHARACTER THO PHUTHAO */ 662 { 0x0db3, 0x0e13 }, /* Thai_nonen THAI CHARACTER NO NEN */ 663 { 0x0db4, 0x0e14 }, /* Thai_dodek THAI CHARACTER DO DEK */ 664 { 0x0db5, 0x0e15 }, /* Thai_totao THAI CHARACTER TO TAO */ 665 { 0x0db6, 0x0e16 }, /* Thai_thothung THAI CHARACTER THO THUNG */ 666 { 0x0db7, 0x0e17 }, /* Thai_thothahan THAI CHARACTER THO THAHAN */ 667 { 0x0db8, 0x0e18 }, /* Thai_thothong THAI CHARACTER THO THONG */ 668 { 0x0db9, 0x0e19 }, /* Thai_nonu THAI CHARACTER NO NU */ 669 { 0x0dba, 0x0e1a }, /* Thai_bobaimai THAI CHARACTER BO BAIMAI */ 670 { 0x0dbb, 0x0e1b }, /* Thai_popla THAI CHARACTER PO PLA */ 671 { 0x0dbc, 0x0e1c }, /* Thai_phophung THAI CHARACTER PHO PHUNG */ 672 { 0x0dbd, 0x0e1d }, /* Thai_fofa THAI CHARACTER FO FA */ 673 { 0x0dbe, 0x0e1e }, /* Thai_phophan THAI CHARACTER PHO PHAN */ 674 { 0x0dbf, 0x0e1f }, /* Thai_fofan THAI CHARACTER FO FAN */ 675 { 0x0dc0, 0x0e20 }, /* Thai_phosamphao THAI CHARACTER PHO SAMPHAO */ 676 { 0x0dc1, 0x0e21 }, /* Thai_moma THAI CHARACTER MO MA */ 677 { 0x0dc2, 0x0e22 }, /* Thai_yoyak THAI CHARACTER YO YAK */ 678 { 0x0dc3, 0x0e23 }, /* Thai_rorua THAI CHARACTER RO RUA */ 679 { 0x0dc4, 0x0e24 }, /* Thai_ru THAI CHARACTER RU */ 680 { 0x0dc5, 0x0e25 }, /* Thai_loling THAI CHARACTER LO LING */ 681 { 0x0dc6, 0x0e26 }, /* Thai_lu THAI CHARACTER LU */ 682 { 0x0dc7, 0x0e27 }, /* Thai_wowaen THAI CHARACTER WO WAEN */ 683 { 0x0dc8, 0x0e28 }, /* Thai_sosala THAI CHARACTER SO SALA */ 684 { 0x0dc9, 0x0e29 }, /* Thai_sorusi THAI CHARACTER SO RUSI */ 685 { 0x0dca, 0x0e2a }, /* Thai_sosua THAI CHARACTER SO SUA */ 686 { 0x0dcb, 0x0e2b }, /* Thai_hohip THAI CHARACTER HO HIP */ 687 { 0x0dcc, 0x0e2c }, /* Thai_lochula THAI CHARACTER LO CHULA */ 688 { 0x0dcd, 0x0e2d }, /* Thai_oang THAI CHARACTER O ANG */ 689 { 0x0dce, 0x0e2e }, /* Thai_honokhuk THAI CHARACTER HO NOKHUK */ 690 { 0x0dcf, 0x0e2f }, /* Thai_paiyannoi THAI CHARACTER PAIYANNOI */ 691 { 0x0dd0, 0x0e30 }, /* Thai_saraa THAI CHARACTER SARA A */ 692 { 0x0dd1, 0x0e31 }, /* Thai_maihanakat THAI CHARACTER MAI HAN-AKAT */ 693 { 0x0dd2, 0x0e32 }, /* Thai_saraaa THAI CHARACTER SARA AA */ 694 { 0x0dd3, 0x0e33 }, /* Thai_saraam THAI CHARACTER SARA AM */ 695 { 0x0dd4, 0x0e34 }, /* Thai_sarai THAI CHARACTER SARA I */ 696 { 0x0dd5, 0x0e35 }, /* Thai_saraii THAI CHARACTER SARA II */ 697 { 0x0dd6, 0x0e36 }, /* Thai_saraue THAI CHARACTER SARA UE */ 698 { 0x0dd7, 0x0e37 }, /* Thai_sarauee THAI CHARACTER SARA UEE */ 699 { 0x0dd8, 0x0e38 }, /* Thai_sarau THAI CHARACTER SARA U */ 700 { 0x0dd9, 0x0e39 }, /* Thai_sarauu THAI CHARACTER SARA UU */ 701 { 0x0dda, 0x0e3a }, /* Thai_phinthu THAI CHARACTER PHINTHU */ 702 { 0x0dde, 0x0e3e }, /* Thai_maihanakat_maitho ??? */ 703 { 0x0ddf, 0x0e3f }, /* Thai_baht THAI CURRENCY SYMBOL BAHT */ 704 { 0x0de0, 0x0e40 }, /* Thai_sarae THAI CHARACTER SARA E */ 705 { 0x0de1, 0x0e41 }, /* Thai_saraae THAI CHARACTER SARA AE */ 706 { 0x0de2, 0x0e42 }, /* Thai_sarao THAI CHARACTER SARA O */ 707 { 0x0de3, 0x0e43 }, /* Thai_saraaimaimuan THAI CHARACTER SARA AI MAIMUAN */ 708 { 0x0de4, 0x0e44 }, /* Thai_saraaimaimalai THAI CHARACTER SARA AI MAIMALAI */ 709 { 0x0de5, 0x0e45 }, /* Thai_lakkhangyao THAI CHARACTER LAKKHANGYAO */ 710 { 0x0de6, 0x0e46 }, /* Thai_maiyamok THAI CHARACTER MAIYAMOK */ 711 { 0x0de7, 0x0e47 }, /* Thai_maitaikhu THAI CHARACTER MAITAIKHU */ 712 { 0x0de8, 0x0e48 }, /* Thai_maiek THAI CHARACTER MAI EK */ 713 { 0x0de9, 0x0e49 }, /* Thai_maitho THAI CHARACTER MAI THO */ 714 { 0x0dea, 0x0e4a }, /* Thai_maitri THAI CHARACTER MAI TRI */ 715 { 0x0deb, 0x0e4b }, /* Thai_maichattawa THAI CHARACTER MAI CHATTAWA */ 716 { 0x0dec, 0x0e4c }, /* Thai_thanthakhat THAI CHARACTER THANTHAKHAT */ 717 { 0x0ded, 0x0e4d }, /* Thai_nikhahit THAI CHARACTER NIKHAHIT */ 718 { 0x0df0, 0x0e50 }, /* Thai_leksun THAI DIGIT ZERO */ 719 { 0x0df1, 0x0e51 }, /* Thai_leknung THAI DIGIT ONE */ 720 { 0x0df2, 0x0e52 }, /* Thai_leksong THAI DIGIT TWO */ 721 { 0x0df3, 0x0e53 }, /* Thai_leksam THAI DIGIT THREE */ 722 { 0x0df4, 0x0e54 }, /* Thai_leksi THAI DIGIT FOUR */ 723 { 0x0df5, 0x0e55 }, /* Thai_lekha THAI DIGIT FIVE */ 724 { 0x0df6, 0x0e56 }, /* Thai_lekhok THAI DIGIT SIX */ 725 { 0x0df7, 0x0e57 }, /* Thai_lekchet THAI DIGIT SEVEN */ 726 { 0x0df8, 0x0e58 }, /* Thai_lekpaet THAI DIGIT EIGHT */ 727 { 0x0df9, 0x0e59 }, /* Thai_lekkao THAI DIGIT NINE */ 728 { 0x0ea1, 0x3131 }, /* Hangul_Kiyeog HANGUL LETTER KIYEOK */ 729 { 0x0ea2, 0x3132 }, /* Hangul_SsangKiyeog HANGUL LETTER SSANGKIYEOK */ 730 { 0x0ea3, 0x3133 }, /* Hangul_KiyeogSios HANGUL LETTER KIYEOK-SIOS */ 731 { 0x0ea4, 0x3134 }, /* Hangul_Nieun HANGUL LETTER NIEUN */ 732 { 0x0ea5, 0x3135 }, /* Hangul_NieunJieuj HANGUL LETTER NIEUN-CIEUC */ 733 { 0x0ea6, 0x3136 }, /* Hangul_NieunHieuh HANGUL LETTER NIEUN-HIEUH */ 734 { 0x0ea7, 0x3137 }, /* Hangul_Dikeud HANGUL LETTER TIKEUT */ 735 { 0x0ea8, 0x3138 }, /* Hangul_SsangDikeud HANGUL LETTER SSANGTIKEUT */ 736 { 0x0ea9, 0x3139 }, /* Hangul_Rieul HANGUL LETTER RIEUL */ 737 { 0x0eaa, 0x313a }, /* Hangul_RieulKiyeog HANGUL LETTER RIEUL-KIYEOK */ 738 { 0x0eab, 0x313b }, /* Hangul_RieulMieum HANGUL LETTER RIEUL-MIEUM */ 739 { 0x0eac, 0x313c }, /* Hangul_RieulPieub HANGUL LETTER RIEUL-PIEUP */ 740 { 0x0ead, 0x313d }, /* Hangul_RieulSios HANGUL LETTER RIEUL-SIOS */ 741 { 0x0eae, 0x313e }, /* Hangul_RieulTieut HANGUL LETTER RIEUL-THIEUTH */ 742 { 0x0eaf, 0x313f }, /* Hangul_RieulPhieuf HANGUL LETTER RIEUL-PHIEUPH */ 743 { 0x0eb0, 0x3140 }, /* Hangul_RieulHieuh HANGUL LETTER RIEUL-HIEUH */ 744 { 0x0eb1, 0x3141 }, /* Hangul_Mieum HANGUL LETTER MIEUM */ 745 { 0x0eb2, 0x3142 }, /* Hangul_Pieub HANGUL LETTER PIEUP */ 746 { 0x0eb3, 0x3143 }, /* Hangul_SsangPieub HANGUL LETTER SSANGPIEUP */ 747 { 0x0eb4, 0x3144 }, /* Hangul_PieubSios HANGUL LETTER PIEUP-SIOS */ 748 { 0x0eb5, 0x3145 }, /* Hangul_Sios HANGUL LETTER SIOS */ 749 { 0x0eb6, 0x3146 }, /* Hangul_SsangSios HANGUL LETTER SSANGSIOS */ 750 { 0x0eb7, 0x3147 }, /* Hangul_Ieung HANGUL LETTER IEUNG */ 751 { 0x0eb8, 0x3148 }, /* Hangul_Jieuj HANGUL LETTER CIEUC */ 752 { 0x0eb9, 0x3149 }, /* Hangul_SsangJieuj HANGUL LETTER SSANGCIEUC */ 753 { 0x0eba, 0x314a }, /* Hangul_Cieuc HANGUL LETTER CHIEUCH */ 754 { 0x0ebb, 0x314b }, /* Hangul_Khieuq HANGUL LETTER KHIEUKH */ 755 { 0x0ebc, 0x314c }, /* Hangul_Tieut HANGUL LETTER THIEUTH */ 756 { 0x0ebd, 0x314d }, /* Hangul_Phieuf HANGUL LETTER PHIEUPH */ 757 { 0x0ebe, 0x314e }, /* Hangul_Hieuh HANGUL LETTER HIEUH */ 758 { 0x0ebf, 0x314f }, /* Hangul_A HANGUL LETTER A */ 759 { 0x0ec0, 0x3150 }, /* Hangul_AE HANGUL LETTER AE */ 760 { 0x0ec1, 0x3151 }, /* Hangul_YA HANGUL LETTER YA */ 761 { 0x0ec2, 0x3152 }, /* Hangul_YAE HANGUL LETTER YAE */ 762 { 0x0ec3, 0x3153 }, /* Hangul_EO HANGUL LETTER EO */ 763 { 0x0ec4, 0x3154 }, /* Hangul_E HANGUL LETTER E */ 764 { 0x0ec5, 0x3155 }, /* Hangul_YEO HANGUL LETTER YEO */ 765 { 0x0ec6, 0x3156 }, /* Hangul_YE HANGUL LETTER YE */ 766 { 0x0ec7, 0x3157 }, /* Hangul_O HANGUL LETTER O */ 767 { 0x0ec8, 0x3158 }, /* Hangul_WA HANGUL LETTER WA */ 768 { 0x0ec9, 0x3159 }, /* Hangul_WAE HANGUL LETTER WAE */ 769 { 0x0eca, 0x315a }, /* Hangul_OE HANGUL LETTER OE */ 770 { 0x0ecb, 0x315b }, /* Hangul_YO HANGUL LETTER YO */ 771 { 0x0ecc, 0x315c }, /* Hangul_U HANGUL LETTER U */ 772 { 0x0ecd, 0x315d }, /* Hangul_WEO HANGUL LETTER WEO */ 773 { 0x0ece, 0x315e }, /* Hangul_WE HANGUL LETTER WE */ 774 { 0x0ecf, 0x315f }, /* Hangul_WI HANGUL LETTER WI */ 775 { 0x0ed0, 0x3160 }, /* Hangul_YU HANGUL LETTER YU */ 776 { 0x0ed1, 0x3161 }, /* Hangul_EU HANGUL LETTER EU */ 777 { 0x0ed2, 0x3162 }, /* Hangul_YI HANGUL LETTER YI */ 778 { 0x0ed3, 0x3163 }, /* Hangul_I HANGUL LETTER I */ 779 { 0x0ed4, 0x11a8 }, /* Hangul_J_Kiyeog HANGUL JONGSEONG KIYEOK */ 780 { 0x0ed5, 0x11a9 }, /* Hangul_J_SsangKiyeog HANGUL JONGSEONG SSANGKIYEOK */ 781 { 0x0ed6, 0x11aa }, /* Hangul_J_KiyeogSios HANGUL JONGSEONG KIYEOK-SIOS */ 782 { 0x0ed7, 0x11ab }, /* Hangul_J_Nieun HANGUL JONGSEONG NIEUN */ 783 { 0x0ed8, 0x11ac }, /* Hangul_J_NieunJieuj HANGUL JONGSEONG NIEUN-CIEUC */ 784 { 0x0ed9, 0x11ad }, /* Hangul_J_NieunHieuh HANGUL JONGSEONG NIEUN-HIEUH */ 785 { 0x0eda, 0x11ae }, /* Hangul_J_Dikeud HANGUL JONGSEONG TIKEUT */ 786 { 0x0edb, 0x11af }, /* Hangul_J_Rieul HANGUL JONGSEONG RIEUL */ 787 { 0x0edc, 0x11b0 }, /* Hangul_J_RieulKiyeog HANGUL JONGSEONG RIEUL-KIYEOK */ 788 { 0x0edd, 0x11b1 }, /* Hangul_J_RieulMieum HANGUL JONGSEONG RIEUL-MIEUM */ 789 { 0x0ede, 0x11b2 }, /* Hangul_J_RieulPieub HANGUL JONGSEONG RIEUL-PIEUP */ 790 { 0x0edf, 0x11b3 }, /* Hangul_J_RieulSios HANGUL JONGSEONG RIEUL-SIOS */ 791 { 0x0ee0, 0x11b4 }, /* Hangul_J_RieulTieut HANGUL JONGSEONG RIEUL-THIEUTH */ 792 { 0x0ee1, 0x11b5 }, /* Hangul_J_RieulPhieuf HANGUL JONGSEONG RIEUL-PHIEUPH */ 793 { 0x0ee2, 0x11b6 }, /* Hangul_J_RieulHieuh HANGUL JONGSEONG RIEUL-HIEUH */ 794 { 0x0ee3, 0x11b7 }, /* Hangul_J_Mieum HANGUL JONGSEONG MIEUM */ 795 { 0x0ee4, 0x11b8 }, /* Hangul_J_Pieub HANGUL JONGSEONG PIEUP */ 796 { 0x0ee5, 0x11b9 }, /* Hangul_J_PieubSios HANGUL JONGSEONG PIEUP-SIOS */ 797 { 0x0ee6, 0x11ba }, /* Hangul_J_Sios HANGUL JONGSEONG SIOS */ 798 { 0x0ee7, 0x11bb }, /* Hangul_J_SsangSios HANGUL JONGSEONG SSANGSIOS */ 799 { 0x0ee8, 0x11bc }, /* Hangul_J_Ieung HANGUL JONGSEONG IEUNG */ 800 { 0x0ee9, 0x11bd }, /* Hangul_J_Jieuj HANGUL JONGSEONG CIEUC */ 801 { 0x0eea, 0x11be }, /* Hangul_J_Cieuc HANGUL JONGSEONG CHIEUCH */ 802 { 0x0eeb, 0x11bf }, /* Hangul_J_Khieuq HANGUL JONGSEONG KHIEUKH */ 803 { 0x0eec, 0x11c0 }, /* Hangul_J_Tieut HANGUL JONGSEONG THIEUTH */ 804 { 0x0eed, 0x11c1 }, /* Hangul_J_Phieuf HANGUL JONGSEONG PHIEUPH */ 805 { 0x0eee, 0x11c2 }, /* Hangul_J_Hieuh HANGUL JONGSEONG HIEUH */ 806 { 0x0eef, 0x316d }, /* Hangul_RieulYeorinHieuh HANGUL LETTER RIEUL-YEORINHIEUH */ 807 { 0x0ef0, 0x3171 }, /* Hangul_SunkyeongeumMieum HANGUL LETTER KAPYEOUNMIEUM */ 808 { 0x0ef1, 0x3178 }, /* Hangul_SunkyeongeumPieub HANGUL LETTER KAPYEOUNPIEUP */ 809 { 0x0ef2, 0x317f }, /* Hangul_PanSios HANGUL LETTER PANSIOS */ 810 /* 0x0ef3 Hangul_KkogjiDalrinIeung ? ??? */ 811 { 0x0ef4, 0x3184 }, /* Hangul_SunkyeongeumPhieuf HANGUL LETTER KAPYEOUNPHIEUPH */ 812 { 0x0ef5, 0x3186 }, /* Hangul_YeorinHieuh HANGUL LETTER YEORINHIEUH */ 813 { 0x0ef6, 0x318d }, /* Hangul_AraeA HANGUL LETTER ARAEA */ 814 { 0x0ef7, 0x318e }, /* Hangul_AraeAE HANGUL LETTER ARAEAE */ 815 { 0x0ef8, 0x11eb }, /* Hangul_J_PanSios HANGUL JONGSEONG PANSIOS */ 816 { 0x0ef9, 0x11f0 }, /* Hangul_J_KkogjiDalrinIeung HANGUL JONGSEONG YESIEUNG */ 817 { 0x0efa, 0x11f9 }, /* Hangul_J_YeorinHieuh HANGUL JONGSEONG YEORINHIEUH */ 818 { 0x0eff, 0x20a9 }, /* Korean_Won WON SIGN */ 819 { 0x13a4, 0x20ac }, /* Euro EURO SIGN */ 820 { 0x13bc, 0x0152 }, /* OE LATIN CAPITAL LIGATURE OE */ 821 { 0x13bd, 0x0153 }, /* oe LATIN SMALL LIGATURE OE */ 822 { 0x13be, 0x0178 }, /* Ydiaeresis LATIN CAPITAL LETTER Y WITH DIAERESIS */ 823 { 0x20a0, 0x20a0 }, /* EcuSign EURO-CURRENCY SIGN */ 824 { 0x20a1, 0x20a1 }, /* ColonSign COLON SIGN */ 825 { 0x20a2, 0x20a2 }, /* CruzeiroSign CRUZEIRO SIGN */ 826 { 0x20a3, 0x20a3 }, /* FFrancSign FRENCH FRANC SIGN */ 827 { 0x20a4, 0x20a4 }, /* LiraSign LIRA SIGN */ 828 { 0x20a5, 0x20a5 }, /* MillSign MILL SIGN */ 829 { 0x20a6, 0x20a6 }, /* NairaSign NAIRA SIGN */ 830 { 0x20a7, 0x20a7 }, /* PesetaSign PESETA SIGN */ 831 { 0x20a8, 0x20a8 }, /* RupeeSign RUPEE SIGN */ 832 { 0x20a9, 0x20a9 }, /* WonSign WON SIGN */ 833 { 0x20aa, 0x20aa }, /* NewSheqelSign NEW SHEQEL SIGN */ 834 { 0x20ab, 0x20ab }, /* DongSign DONG SIGN */ 835 { 0x20ac, 0x20ac }, /* EuroSign EURO SIGN */ 836 }; 837 838 /* binary search with range check */ 839 static uint32_t 840 bin_search(const struct codepair *table, size_t length, xkb_keysym_t keysym) 841 { 842 size_t first = 0; 843 size_t last = length; 844 845 if (keysym < table[0].keysym || keysym > table[length].keysym) 846 return 0; 847 848 /* binary search in table */ 849 while (last >= first) { 850 size_t mid = (first + last) / 2; 851 if (table[mid].keysym < keysym) 852 first = mid + 1; 853 else if (table[mid].keysym > keysym) 854 last = mid - 1; 855 else /* found it */ 856 return table[mid].ucs; 857 } 858 859 /* no matching Unicode value found in table */ 860 return 0; 861 } 862 863 XKB_EXPORT uint32_t 864 xkb_keysym_to_utf32(xkb_keysym_t keysym) 865 { 866 /* first check for Latin-1 characters (1:1 mapping) */ 867 if ((keysym >= 0x0020 && keysym <= 0x007e) || 868 (keysym >= 0x00a0 && keysym <= 0x00ff)) 869 return keysym; 870 871 /* patch encoding botch */ 872 if (keysym == XKB_KEY_KP_Space) 873 return XKB_KEY_space & 0x7f; 874 875 /* special keysyms */ 876 if ((keysym >= XKB_KEY_BackSpace && keysym <= XKB_KEY_Clear) || 877 (keysym >= XKB_KEY_KP_Multiply && keysym <= XKB_KEY_KP_9) || 878 keysym == XKB_KEY_Return || keysym == XKB_KEY_Escape || 879 keysym == XKB_KEY_Delete || keysym == XKB_KEY_KP_Tab || 880 keysym == XKB_KEY_KP_Enter || keysym == XKB_KEY_KP_Equal) 881 return keysym & 0x7f; 882 883 /* also check for directly encoded 24-bit UCS characters */ 884 if ((keysym & 0xff000000) == 0x01000000) 885 return keysym & 0x00ffffff; 886 887 /* search main table */ 888 return bin_search(keysymtab, ARRAY_SIZE(keysymtab) - 1, keysym); 889 } 890 891 /* 892 * Copyright 2012 Intel Corporation 893 * 894 * Permission is hereby granted, free of charge, to any person obtaining a 895 * copy of this software and associated documentation files (the "Software"), 896 * to deal in the Software without restriction, including without limitation 897 * the rights to use, copy, modify, merge, publish, distribute, sublicense, 898 * and/or sell copies of the Software, and to permit persons to whom the 899 * Software is furnished to do so, subject to the following conditions: 900 * 901 * The above copyright notice and this permission notice (including the next 902 * paragraph) shall be included in all copies or substantial portions of the 903 * Software. 904 * 905 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 906 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 907 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL 908 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER 909 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING 910 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER 911 * DEALINGS IN THE SOFTWARE. 912 * 913 * Author: Rob Bradford <rob (at) linux.intel.com> 914 */ 915 916 XKB_EXPORT int 917 xkb_keysym_to_utf8(xkb_keysym_t keysym, char *buffer, size_t size) 918 { 919 uint32_t codepoint; 920 921 if (size < 7) 922 return -1; 923 924 codepoint = xkb_keysym_to_utf32(keysym); 925 926 if (codepoint == 0) 927 return 0; 928 929 return utf32_to_utf8(codepoint, buffer); 930 } 931