1 /* 2 * Copyright 2009 Red Hat, Inc. 3 * Copyright 2011 Codethink Limited 4 * Copyright 2010,2011,2012 Google, Inc. 5 * 6 * This is part of HarfBuzz, a text shaping library. 7 * 8 * Permission is hereby granted, without written agreement and without 9 * license or royalty fees, to use, copy, modify, and distribute this 10 * software and its documentation for any purpose, provided that the 11 * above copyright notice and the following two paragraphs appear in 12 * all copies of this software. 13 * 14 * IN NO EVENT SHALL THE COPYRIGHT HOLDER BE LIABLE TO ANY PARTY FOR 15 * DIRECT, INDIRECT, SPECIAL, INCIDENTAL, OR CONSEQUENTIAL DAMAGES 16 * ARISING OUT OF THE USE OF THIS SOFTWARE AND ITS DOCUMENTATION, EVEN 17 * IF THE COPYRIGHT HOLDER HAS BEEN ADVISED OF THE POSSIBILITY OF SUCH 18 * DAMAGE. 19 * 20 * THE COPYRIGHT HOLDER SPECIFICALLY DISCLAIMS ANY WARRANTIES, INCLUDING, 21 * BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND 22 * FITNESS FOR A PARTICULAR PURPOSE. THE SOFTWARE PROVIDED HEREUNDER IS 23 * ON AN "AS IS" BASIS, AND THE COPYRIGHT HOLDER HAS NO OBLIGATION TO 24 * PROVIDE MAINTENANCE, SUPPORT, UPDATES, ENHANCEMENTS, OR MODIFICATIONS. 25 * 26 * Red Hat Author(s): Behdad Esfahbod 27 * Codethink Author(s): Ryan Lortie 28 * Google Author(s): Behdad Esfahbod 29 */ 30 31 #include "hb-private.hh" 32 33 #include "hb-unicode-private.hh" 34 35 36 37 /* 38 * hb_unicode_funcs_t 39 */ 40 41 static hb_unicode_combining_class_t 42 hb_unicode_combining_class_nil (hb_unicode_funcs_t *ufuncs HB_UNUSED, 43 hb_codepoint_t unicode HB_UNUSED, 44 void *user_data HB_UNUSED) 45 { 46 return HB_UNICODE_COMBINING_CLASS_NOT_REORDERED; 47 } 48 49 static unsigned int 50 hb_unicode_eastasian_width_nil (hb_unicode_funcs_t *ufuncs HB_UNUSED, 51 hb_codepoint_t unicode HB_UNUSED, 52 void *user_data HB_UNUSED) 53 { 54 return 1; 55 } 56 57 static hb_unicode_general_category_t 58 hb_unicode_general_category_nil (hb_unicode_funcs_t *ufuncs HB_UNUSED, 59 hb_codepoint_t unicode HB_UNUSED, 60 void *user_data HB_UNUSED) 61 { 62 return HB_UNICODE_GENERAL_CATEGORY_OTHER_LETTER; 63 } 64 65 static hb_codepoint_t 66 hb_unicode_mirroring_nil (hb_unicode_funcs_t *ufuncs HB_UNUSED, 67 hb_codepoint_t unicode HB_UNUSED, 68 void *user_data HB_UNUSED) 69 { 70 return unicode; 71 } 72 73 static hb_script_t 74 hb_unicode_script_nil (hb_unicode_funcs_t *ufuncs HB_UNUSED, 75 hb_codepoint_t unicode HB_UNUSED, 76 void *user_data HB_UNUSED) 77 { 78 return HB_SCRIPT_UNKNOWN; 79 } 80 81 static hb_bool_t 82 hb_unicode_compose_nil (hb_unicode_funcs_t *ufuncs HB_UNUSED, 83 hb_codepoint_t a HB_UNUSED, 84 hb_codepoint_t b HB_UNUSED, 85 hb_codepoint_t *ab HB_UNUSED, 86 void *user_data HB_UNUSED) 87 { 88 return false; 89 } 90 91 static hb_bool_t 92 hb_unicode_decompose_nil (hb_unicode_funcs_t *ufuncs HB_UNUSED, 93 hb_codepoint_t ab HB_UNUSED, 94 hb_codepoint_t *a HB_UNUSED, 95 hb_codepoint_t *b HB_UNUSED, 96 void *user_data HB_UNUSED) 97 { 98 return false; 99 } 100 101 102 static unsigned int 103 hb_unicode_decompose_compatibility_nil (hb_unicode_funcs_t *ufuncs HB_UNUSED, 104 hb_codepoint_t u HB_UNUSED, 105 hb_codepoint_t *decomposed HB_UNUSED, 106 void *user_data HB_UNUSED) 107 { 108 return 0; 109 } 110 111 112 #define HB_UNICODE_FUNCS_IMPLEMENT_SET \ 113 HB_UNICODE_FUNCS_IMPLEMENT (glib) \ 114 HB_UNICODE_FUNCS_IMPLEMENT (icu) \ 115 HB_UNICODE_FUNCS_IMPLEMENT (ucdn) \ 116 HB_UNICODE_FUNCS_IMPLEMENT (nil) \ 117 /* ^--- Add new callbacks before nil */ 118 119 #define hb_nil_get_unicode_funcs hb_unicode_funcs_get_empty 120 121 /* Prototype them all */ 122 #define HB_UNICODE_FUNCS_IMPLEMENT(set) \ 123 extern "C" hb_unicode_funcs_t *hb_##set##_get_unicode_funcs (void); 124 HB_UNICODE_FUNCS_IMPLEMENT_SET 125 #undef HB_UNICODE_FUNCS_IMPLEMENT 126 127 128 hb_unicode_funcs_t * 129 hb_unicode_funcs_get_default (void) 130 { 131 #define HB_UNICODE_FUNCS_IMPLEMENT(set) \ 132 return hb_##set##_get_unicode_funcs (); 133 134 #if defined(HAVE_UCDN) 135 HB_UNICODE_FUNCS_IMPLEMENT(ucdn) 136 #elif defined(HAVE_GLIB) 137 HB_UNICODE_FUNCS_IMPLEMENT(glib) 138 #elif defined(HAVE_ICU) && defined(HAVE_ICU_BUILTIN) 139 HB_UNICODE_FUNCS_IMPLEMENT(icu) 140 #else 141 #define HB_UNICODE_FUNCS_NIL 1 142 HB_UNICODE_FUNCS_IMPLEMENT(nil) 143 #endif 144 145 #undef HB_UNICODE_FUNCS_IMPLEMENT 146 } 147 148 #if !defined(HB_NO_UNICODE_FUNCS) && defined(HB_UNICODE_FUNCS_NIL) 149 #error "Could not find any Unicode functions implementation, you have to provide your own" 150 #error "Consider building hb-ucdn.c. If you absolutely want to build without any, check the code." 151 #endif 152 153 /** 154 * hb_unicode_funcs_create: (Xconstructor) 155 * @parent: (nullable): 156 * 157 * 158 * 159 * Return value: (transfer full): 160 * 161 * Since: 0.9.2 162 **/ 163 hb_unicode_funcs_t * 164 hb_unicode_funcs_create (hb_unicode_funcs_t *parent) 165 { 166 hb_unicode_funcs_t *ufuncs; 167 168 if (!(ufuncs = hb_object_create<hb_unicode_funcs_t> ())) 169 return hb_unicode_funcs_get_empty (); 170 171 if (!parent) 172 parent = hb_unicode_funcs_get_empty (); 173 174 hb_unicode_funcs_make_immutable (parent); 175 ufuncs->parent = hb_unicode_funcs_reference (parent); 176 177 ufuncs->func = parent->func; 178 179 /* We can safely copy user_data from parent since we hold a reference 180 * onto it and it's immutable. We should not copy the destroy notifiers 181 * though. */ 182 ufuncs->user_data = parent->user_data; 183 184 return ufuncs; 185 } 186 187 188 const hb_unicode_funcs_t _hb_unicode_funcs_nil = { 189 HB_OBJECT_HEADER_STATIC, 190 191 NULL, /* parent */ 192 true, /* immutable */ 193 { 194 #define HB_UNICODE_FUNC_IMPLEMENT(name) hb_unicode_##name##_nil, 195 HB_UNICODE_FUNCS_IMPLEMENT_CALLBACKS 196 #undef HB_UNICODE_FUNC_IMPLEMENT 197 } 198 }; 199 200 /** 201 * hb_unicode_funcs_get_empty: 202 * 203 * 204 * 205 * Return value: (transfer full): 206 * 207 * Since: 0.9.2 208 **/ 209 hb_unicode_funcs_t * 210 hb_unicode_funcs_get_empty (void) 211 { 212 return const_cast<hb_unicode_funcs_t *> (&_hb_unicode_funcs_nil); 213 } 214 215 /** 216 * hb_unicode_funcs_reference: (skip) 217 * @ufuncs: Unicode functions. 218 * 219 * 220 * 221 * Return value: (transfer full): 222 * 223 * Since: 0.9.2 224 **/ 225 hb_unicode_funcs_t * 226 hb_unicode_funcs_reference (hb_unicode_funcs_t *ufuncs) 227 { 228 return hb_object_reference (ufuncs); 229 } 230 231 /** 232 * hb_unicode_funcs_destroy: (skip) 233 * @ufuncs: Unicode functions. 234 * 235 * 236 * 237 * Since: 0.9.2 238 **/ 239 void 240 hb_unicode_funcs_destroy (hb_unicode_funcs_t *ufuncs) 241 { 242 if (!hb_object_destroy (ufuncs)) return; 243 244 #define HB_UNICODE_FUNC_IMPLEMENT(name) \ 245 if (ufuncs->destroy.name) ufuncs->destroy.name (ufuncs->user_data.name); 246 HB_UNICODE_FUNCS_IMPLEMENT_CALLBACKS 247 #undef HB_UNICODE_FUNC_IMPLEMENT 248 249 hb_unicode_funcs_destroy (ufuncs->parent); 250 251 free (ufuncs); 252 } 253 254 /** 255 * hb_unicode_funcs_set_user_data: (skip) 256 * @ufuncs: Unicode functions. 257 * @key: 258 * @data: 259 * @destroy: 260 * @replace: 261 * 262 * 263 * 264 * Return value: 265 * 266 * Since: 0.9.2 267 **/ 268 hb_bool_t 269 hb_unicode_funcs_set_user_data (hb_unicode_funcs_t *ufuncs, 270 hb_user_data_key_t *key, 271 void * data, 272 hb_destroy_func_t destroy, 273 hb_bool_t replace) 274 { 275 return hb_object_set_user_data (ufuncs, key, data, destroy, replace); 276 } 277 278 /** 279 * hb_unicode_funcs_get_user_data: (skip) 280 * @ufuncs: Unicode functions. 281 * @key: 282 * 283 * 284 * 285 * Return value: (transfer none): 286 * 287 * Since: 0.9.2 288 **/ 289 void * 290 hb_unicode_funcs_get_user_data (hb_unicode_funcs_t *ufuncs, 291 hb_user_data_key_t *key) 292 { 293 return hb_object_get_user_data (ufuncs, key); 294 } 295 296 297 /** 298 * hb_unicode_funcs_make_immutable: 299 * @ufuncs: Unicode functions. 300 * 301 * 302 * 303 * Since: 0.9.2 304 **/ 305 void 306 hb_unicode_funcs_make_immutable (hb_unicode_funcs_t *ufuncs) 307 { 308 if (unlikely (hb_object_is_inert (ufuncs))) 309 return; 310 311 ufuncs->immutable = true; 312 } 313 314 /** 315 * hb_unicode_funcs_is_immutable: 316 * @ufuncs: Unicode functions. 317 * 318 * 319 * 320 * Return value: 321 * 322 * Since: 0.9.2 323 **/ 324 hb_bool_t 325 hb_unicode_funcs_is_immutable (hb_unicode_funcs_t *ufuncs) 326 { 327 return ufuncs->immutable; 328 } 329 330 /** 331 * hb_unicode_funcs_get_parent: 332 * @ufuncs: Unicode functions. 333 * 334 * 335 * 336 * Return value: 337 * 338 * Since: 0.9.2 339 **/ 340 hb_unicode_funcs_t * 341 hb_unicode_funcs_get_parent (hb_unicode_funcs_t *ufuncs) 342 { 343 return ufuncs->parent ? ufuncs->parent : hb_unicode_funcs_get_empty (); 344 } 345 346 347 #define HB_UNICODE_FUNC_IMPLEMENT(name) \ 348 \ 349 void \ 350 hb_unicode_funcs_set_##name##_func (hb_unicode_funcs_t *ufuncs, \ 351 hb_unicode_##name##_func_t func, \ 352 void *user_data, \ 353 hb_destroy_func_t destroy) \ 354 { \ 355 if (ufuncs->immutable) \ 356 return; \ 357 \ 358 if (ufuncs->destroy.name) \ 359 ufuncs->destroy.name (ufuncs->user_data.name); \ 360 \ 361 if (func) { \ 362 ufuncs->func.name = func; \ 363 ufuncs->user_data.name = user_data; \ 364 ufuncs->destroy.name = destroy; \ 365 } else { \ 366 ufuncs->func.name = ufuncs->parent->func.name; \ 367 ufuncs->user_data.name = ufuncs->parent->user_data.name; \ 368 ufuncs->destroy.name = NULL; \ 369 } \ 370 } 371 372 HB_UNICODE_FUNCS_IMPLEMENT_CALLBACKS 373 #undef HB_UNICODE_FUNC_IMPLEMENT 374 375 376 #define HB_UNICODE_FUNC_IMPLEMENT(return_type, name) \ 377 \ 378 return_type \ 379 hb_unicode_##name (hb_unicode_funcs_t *ufuncs, \ 380 hb_codepoint_t unicode) \ 381 { \ 382 return ufuncs->name (unicode); \ 383 } 384 HB_UNICODE_FUNCS_IMPLEMENT_CALLBACKS_SIMPLE 385 #undef HB_UNICODE_FUNC_IMPLEMENT 386 387 /** 388 * hb_unicode_compose: 389 * @ufuncs: Unicode functions. 390 * @a: 391 * @b: 392 * @ab: (out): 393 * 394 * 395 * 396 * Return value: 397 * 398 * Since: 0.9.2 399 **/ 400 hb_bool_t 401 hb_unicode_compose (hb_unicode_funcs_t *ufuncs, 402 hb_codepoint_t a, 403 hb_codepoint_t b, 404 hb_codepoint_t *ab) 405 { 406 return ufuncs->compose (a, b, ab); 407 } 408 409 /** 410 * hb_unicode_decompose: 411 * @ufuncs: Unicode functions. 412 * @ab: 413 * @a: (out): 414 * @b: (out): 415 * 416 * 417 * 418 * Return value: 419 * 420 * Since: 0.9.2 421 **/ 422 hb_bool_t 423 hb_unicode_decompose (hb_unicode_funcs_t *ufuncs, 424 hb_codepoint_t ab, 425 hb_codepoint_t *a, 426 hb_codepoint_t *b) 427 { 428 return ufuncs->decompose (ab, a, b); 429 } 430 431 /** 432 * hb_unicode_decompose_compatibility: 433 * @ufuncs: Unicode functions. 434 * @u: 435 * @decomposed: (out): 436 * 437 * 438 * 439 * Return value: 440 * 441 * Since: 0.9.2 442 **/ 443 unsigned int 444 hb_unicode_decompose_compatibility (hb_unicode_funcs_t *ufuncs, 445 hb_codepoint_t u, 446 hb_codepoint_t *decomposed) 447 { 448 return ufuncs->decompose_compatibility (u, decomposed); 449 } 450 451 452 /* See hb-unicode-private.hh for details. */ 453 const uint8_t 454 _hb_modified_combining_class[256] = 455 { 456 0, /* HB_UNICODE_COMBINING_CLASS_NOT_REORDERED */ 457 1, /* HB_UNICODE_COMBINING_CLASS_OVERLAY */ 458 2, 3, 4, 5, 6, 459 7, /* HB_UNICODE_COMBINING_CLASS_NUKTA */ 460 8, /* HB_UNICODE_COMBINING_CLASS_KANA_VOICING */ 461 9, /* HB_UNICODE_COMBINING_CLASS_VIRAMA */ 462 463 /* Hebrew */ 464 HB_MODIFIED_COMBINING_CLASS_CCC10, 465 HB_MODIFIED_COMBINING_CLASS_CCC11, 466 HB_MODIFIED_COMBINING_CLASS_CCC12, 467 HB_MODIFIED_COMBINING_CLASS_CCC13, 468 HB_MODIFIED_COMBINING_CLASS_CCC14, 469 HB_MODIFIED_COMBINING_CLASS_CCC15, 470 HB_MODIFIED_COMBINING_CLASS_CCC16, 471 HB_MODIFIED_COMBINING_CLASS_CCC17, 472 HB_MODIFIED_COMBINING_CLASS_CCC18, 473 HB_MODIFIED_COMBINING_CLASS_CCC19, 474 HB_MODIFIED_COMBINING_CLASS_CCC20, 475 HB_MODIFIED_COMBINING_CLASS_CCC21, 476 HB_MODIFIED_COMBINING_CLASS_CCC22, 477 HB_MODIFIED_COMBINING_CLASS_CCC23, 478 HB_MODIFIED_COMBINING_CLASS_CCC24, 479 HB_MODIFIED_COMBINING_CLASS_CCC25, 480 HB_MODIFIED_COMBINING_CLASS_CCC26, 481 482 /* Arabic */ 483 HB_MODIFIED_COMBINING_CLASS_CCC27, 484 HB_MODIFIED_COMBINING_CLASS_CCC28, 485 HB_MODIFIED_COMBINING_CLASS_CCC29, 486 HB_MODIFIED_COMBINING_CLASS_CCC30, 487 HB_MODIFIED_COMBINING_CLASS_CCC31, 488 HB_MODIFIED_COMBINING_CLASS_CCC32, 489 HB_MODIFIED_COMBINING_CLASS_CCC33, 490 HB_MODIFIED_COMBINING_CLASS_CCC34, 491 HB_MODIFIED_COMBINING_CLASS_CCC35, 492 493 /* Syriac */ 494 HB_MODIFIED_COMBINING_CLASS_CCC36, 495 496 37, 38, 39, 497 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 498 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 499 80, 81, 82, 83, 500 501 /* Telugu */ 502 HB_MODIFIED_COMBINING_CLASS_CCC84, 503 85, 86, 87, 88, 89, 90, 504 HB_MODIFIED_COMBINING_CLASS_CCC91, 505 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 506 507 /* Thai */ 508 HB_MODIFIED_COMBINING_CLASS_CCC103, 509 104, 105, 106, 510 HB_MODIFIED_COMBINING_CLASS_CCC107, 511 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 512 513 /* Lao */ 514 HB_MODIFIED_COMBINING_CLASS_CCC118, 515 119, 120, 121, 516 HB_MODIFIED_COMBINING_CLASS_CCC122, 517 123, 124, 125, 126, 127, 128, 518 519 /* Tibetan */ 520 HB_MODIFIED_COMBINING_CLASS_CCC129, 521 HB_MODIFIED_COMBINING_CLASS_CCC130, 522 131, 523 HB_MODIFIED_COMBINING_CLASS_CCC132, 524 133, 134, 135, 136, 137, 138, 139, 525 526 527 140, 141, 142, 143, 144, 145, 146, 147, 148, 149, 528 150, 151, 152, 153, 154, 155, 156, 157, 158, 159, 529 160, 161, 162, 163, 164, 165, 166, 167, 168, 169, 530 170, 171, 172, 173, 174, 175, 176, 177, 178, 179, 531 180, 181, 182, 183, 184, 185, 186, 187, 188, 189, 532 190, 191, 192, 193, 194, 195, 196, 197, 198, 199, 533 534 200, /* HB_UNICODE_COMBINING_CLASS_ATTACHED_BELOW_LEFT */ 535 201, 536 202, /* HB_UNICODE_COMBINING_CLASS_ATTACHED_BELOW */ 537 203, 204, 205, 206, 207, 208, 209, 210, 211, 212, 213, 538 214, /* HB_UNICODE_COMBINING_CLASS_ATTACHED_ABOVE */ 539 215, 540 216, /* HB_UNICODE_COMBINING_CLASS_ATTACHED_ABOVE_RIGHT */ 541 217, 542 218, /* HB_UNICODE_COMBINING_CLASS_BELOW_LEFT */ 543 219, 544 220, /* HB_UNICODE_COMBINING_CLASS_BELOW */ 545 221, 546 222, /* HB_UNICODE_COMBINING_CLASS_BELOW_RIGHT */ 547 223, 548 224, /* HB_UNICODE_COMBINING_CLASS_LEFT */ 549 225, 550 226, /* HB_UNICODE_COMBINING_CLASS_RIGHT */ 551 227, 552 228, /* HB_UNICODE_COMBINING_CLASS_ABOVE_LEFT */ 553 229, 554 230, /* HB_UNICODE_COMBINING_CLASS_ABOVE */ 555 231, 556 232, /* HB_UNICODE_COMBINING_CLASS_ABOVE_RIGHT */ 557 233, /* HB_UNICODE_COMBINING_CLASS_DOUBLE_BELOW */ 558 234, /* HB_UNICODE_COMBINING_CLASS_DOUBLE_ABOVE */ 559 235, 236, 237, 238, 239, 560 240, /* HB_UNICODE_COMBINING_CLASS_IOTA_SUBSCRIPT */ 561 241, 242, 243, 244, 245, 246, 247, 248, 249, 250, 251, 252, 253, 254, 562 255, /* HB_UNICODE_COMBINING_CLASS_INVALID */ 563 }; 564