1 /* 2 * Copyright 2010,2011,2012 Google, Inc. 3 * 4 * This is part of HarfBuzz, a text shaping library. 5 * 6 * Permission is hereby granted, without written agreement and without 7 * license or royalty fees, to use, copy, modify, and distribute this 8 * software and its documentation for any purpose, provided that the 9 * above copyright notice and the following two paragraphs appear in 10 * all copies of this software. 11 * 12 * IN NO EVENT SHALL THE COPYRIGHT HOLDER BE LIABLE TO ANY PARTY FOR 13 * DIRECT, INDIRECT, SPECIAL, INCIDENTAL, OR CONSEQUENTIAL DAMAGES 14 * ARISING OUT OF THE USE OF THIS SOFTWARE AND ITS DOCUMENTATION, EVEN 15 * IF THE COPYRIGHT HOLDER HAS BEEN ADVISED OF THE POSSIBILITY OF SUCH 16 * DAMAGE. 17 * 18 * THE COPYRIGHT HOLDER SPECIFICALLY DISCLAIMS ANY WARRANTIES, INCLUDING, 19 * BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND 20 * FITNESS FOR A PARTICULAR PURPOSE. THE SOFTWARE PROVIDED HEREUNDER IS 21 * ON AN "AS IS" BASIS, AND THE COPYRIGHT HOLDER HAS NO OBLIGATION TO 22 * PROVIDE MAINTENANCE, SUPPORT, UPDATES, ENHANCEMENTS, OR MODIFICATIONS. 23 * 24 * Google Author(s): Behdad Esfahbod 25 */ 26 27 #ifndef HB_OT_SHAPE_COMPLEX_PRIVATE_HH 28 #define HB_OT_SHAPE_COMPLEX_PRIVATE_HH 29 30 #include "hb-private.hh" 31 32 #include "hb-ot-shape-private.hh" 33 #include "hb-ot-shape-normalize-private.hh" 34 35 36 37 /* buffer var allocations, used by complex shapers */ 38 #define complex_var_u8_0() var2.u8[2] 39 #define complex_var_u8_1() var2.u8[3] 40 41 42 enum hb_ot_shape_zero_width_marks_type_t { 43 HB_OT_SHAPE_ZERO_WIDTH_MARKS_NONE, 44 // HB_OT_SHAPE_ZERO_WIDTH_MARKS_BY_UNICODE_EARLY, 45 HB_OT_SHAPE_ZERO_WIDTH_MARKS_BY_UNICODE_LATE, 46 HB_OT_SHAPE_ZERO_WIDTH_MARKS_BY_GDEF_EARLY, 47 HB_OT_SHAPE_ZERO_WIDTH_MARKS_BY_GDEF_LATE, 48 49 HB_OT_SHAPE_ZERO_WIDTH_MARKS_DEFAULT = HB_OT_SHAPE_ZERO_WIDTH_MARKS_BY_UNICODE_LATE 50 }; 51 52 53 /* Master OT shaper list */ 54 #define HB_COMPLEX_SHAPERS_IMPLEMENT_SHAPERS \ 55 HB_COMPLEX_SHAPER_IMPLEMENT (default) /* should be first */ \ 56 HB_COMPLEX_SHAPER_IMPLEMENT (arabic) \ 57 HB_COMPLEX_SHAPER_IMPLEMENT (hangul) \ 58 HB_COMPLEX_SHAPER_IMPLEMENT (hebrew) \ 59 HB_COMPLEX_SHAPER_IMPLEMENT (myanmar_old) \ 60 HB_COMPLEX_SHAPER_IMPLEMENT (indic) \ 61 HB_COMPLEX_SHAPER_IMPLEMENT (myanmar) \ 62 HB_COMPLEX_SHAPER_IMPLEMENT (sea) \ 63 HB_COMPLEX_SHAPER_IMPLEMENT (thai) \ 64 HB_COMPLEX_SHAPER_IMPLEMENT (tibetan) \ 65 /* ^--- Add new shapers here */ 66 67 68 struct hb_ot_complex_shaper_t 69 { 70 char name[8]; 71 72 /* collect_features() 73 * Called during shape_plan(). 74 * Shapers should use plan->map to add their features and callbacks. 75 * May be NULL. 76 */ 77 void (*collect_features) (hb_ot_shape_planner_t *plan); 78 79 /* override_features() 80 * Called during shape_plan(). 81 * Shapers should use plan->map to override features and add callbacks after 82 * common features are added. 83 * May be NULL. 84 */ 85 void (*override_features) (hb_ot_shape_planner_t *plan); 86 87 88 /* data_create() 89 * Called at the end of shape_plan(). 90 * Whatever shapers return will be accessible through plan->data later. 91 * If NULL is returned, means a plan failure. 92 */ 93 void *(*data_create) (const hb_ot_shape_plan_t *plan); 94 95 /* data_destroy() 96 * Called when the shape_plan is being destroyed. 97 * plan->data is passed here for destruction. 98 * If NULL is returned, means a plan failure. 99 * May be NULL. 100 */ 101 void (*data_destroy) (void *data); 102 103 104 /* preprocess_text() 105 * Called during shape(). 106 * Shapers can use to modify text before shaping starts. 107 * May be NULL. 108 */ 109 void (*preprocess_text) (const hb_ot_shape_plan_t *plan, 110 hb_buffer_t *buffer, 111 hb_font_t *font); 112 113 114 hb_ot_shape_normalization_mode_t normalization_preference; 115 116 /* decompose() 117 * Called during shape()'s normalization. 118 * May be NULL. 119 */ 120 bool (*decompose) (const hb_ot_shape_normalize_context_t *c, 121 hb_codepoint_t ab, 122 hb_codepoint_t *a, 123 hb_codepoint_t *b); 124 125 /* compose() 126 * Called during shape()'s normalization. 127 * May be NULL. 128 */ 129 bool (*compose) (const hb_ot_shape_normalize_context_t *c, 130 hb_codepoint_t a, 131 hb_codepoint_t b, 132 hb_codepoint_t *ab); 133 134 /* setup_masks() 135 * Called during shape(). 136 * Shapers should use map to get feature masks and set on buffer. 137 * Shapers may NOT modify characters. 138 * May be NULL. 139 */ 140 void (*setup_masks) (const hb_ot_shape_plan_t *plan, 141 hb_buffer_t *buffer, 142 hb_font_t *font); 143 144 hb_ot_shape_zero_width_marks_type_t zero_width_marks; 145 146 bool fallback_position; 147 }; 148 149 #define HB_COMPLEX_SHAPER_IMPLEMENT(name) extern HB_INTERNAL const hb_ot_complex_shaper_t _hb_ot_complex_shaper_##name; 150 HB_COMPLEX_SHAPERS_IMPLEMENT_SHAPERS 151 #undef HB_COMPLEX_SHAPER_IMPLEMENT 152 153 154 static inline const hb_ot_complex_shaper_t * 155 hb_ot_shape_complex_categorize (const hb_ot_shape_planner_t *planner) 156 { 157 switch ((hb_tag_t) planner->props.script) 158 { 159 default: 160 return &_hb_ot_complex_shaper_default; 161 162 163 /* Unicode-1.1 additions */ 164 case HB_SCRIPT_ARABIC: 165 166 /* Unicode-3.0 additions */ 167 case HB_SCRIPT_MONGOLIAN: 168 case HB_SCRIPT_SYRIAC: 169 170 /* Unicode-5.0 additions */ 171 case HB_SCRIPT_NKO: 172 case HB_SCRIPT_PHAGS_PA: 173 174 /* Unicode-6.0 additions */ 175 case HB_SCRIPT_MANDAIC: 176 177 /* Unicode-7.0 additions */ 178 case HB_SCRIPT_MANICHAEAN: 179 case HB_SCRIPT_PSALTER_PAHLAVI: 180 181 /* For Arabic script, use the Arabic shaper even if no OT script tag was found. 182 * This is because we do fallback shaping for Arabic script (and not others). */ 183 if (planner->map.chosen_script[0] != HB_OT_TAG_DEFAULT_SCRIPT || 184 planner->props.script == HB_SCRIPT_ARABIC) 185 return &_hb_ot_complex_shaper_arabic; 186 else 187 return &_hb_ot_complex_shaper_default; 188 189 190 /* Unicode-1.1 additions */ 191 case HB_SCRIPT_THAI: 192 case HB_SCRIPT_LAO: 193 194 return &_hb_ot_complex_shaper_thai; 195 196 197 /* Unicode-1.1 additions */ 198 case HB_SCRIPT_HANGUL: 199 200 return &_hb_ot_complex_shaper_hangul; 201 202 203 /* Unicode-2.0 additions */ 204 case HB_SCRIPT_TIBETAN: 205 206 return &_hb_ot_complex_shaper_tibetan; 207 208 209 /* Unicode-1.1 additions */ 210 case HB_SCRIPT_HEBREW: 211 212 return &_hb_ot_complex_shaper_hebrew; 213 214 215 /* ^--- Add new shapers here */ 216 217 218 #if 0 219 /* Note: 220 * 221 * These disabled scripts are listed in ucd/IndicSyllabicCategory.txt, but according 222 * to Martin Hosken and Jonathan Kew do not require complex shaping. 223 * 224 * TODO We should automate figuring out which scripts do not need complex shaping 225 * 226 * TODO We currently keep data for these scripts in our indic table. Need to fix the 227 * generator to not do that. 228 */ 229 230 231 /* Simple? */ 232 233 /* Unicode-3.2 additions */ 234 case HB_SCRIPT_BUHID: 235 case HB_SCRIPT_HANUNOO: 236 237 /* Unicode-5.1 additions */ 238 case HB_SCRIPT_SAURASHTRA: 239 240 /* Unicode-6.0 additions */ 241 case HB_SCRIPT_BATAK: 242 case HB_SCRIPT_BRAHMI: 243 244 245 /* Simple */ 246 247 /* Unicode-1.1 additions */ 248 /* These have their own shaper now. */ 249 case HB_SCRIPT_LAO: 250 case HB_SCRIPT_THAI: 251 252 /* Unicode-3.2 additions */ 253 case HB_SCRIPT_TAGALOG: 254 case HB_SCRIPT_TAGBANWA: 255 256 /* Unicode-4.0 additions */ 257 case HB_SCRIPT_LIMBU: 258 case HB_SCRIPT_TAI_LE: 259 260 /* Unicode-4.1 additions */ 261 case HB_SCRIPT_KHAROSHTHI: 262 case HB_SCRIPT_NEW_TAI_LUE: 263 case HB_SCRIPT_SYLOTI_NAGRI: 264 265 /* Unicode-5.1 additions */ 266 case HB_SCRIPT_KAYAH_LI: 267 268 /* Unicode-5.2 additions */ 269 case HB_SCRIPT_TAI_VIET: 270 271 272 #endif 273 274 /* Unicode-1.1 additions */ 275 case HB_SCRIPT_BENGALI: 276 case HB_SCRIPT_DEVANAGARI: 277 case HB_SCRIPT_GUJARATI: 278 case HB_SCRIPT_GURMUKHI: 279 case HB_SCRIPT_KANNADA: 280 case HB_SCRIPT_MALAYALAM: 281 case HB_SCRIPT_ORIYA: 282 case HB_SCRIPT_TAMIL: 283 case HB_SCRIPT_TELUGU: 284 285 /* Unicode-3.0 additions */ 286 case HB_SCRIPT_SINHALA: 287 288 /* Unicode-5.0 additions */ 289 case HB_SCRIPT_BALINESE: 290 291 /* Unicode-5.1 additions */ 292 case HB_SCRIPT_LEPCHA: 293 case HB_SCRIPT_REJANG: 294 case HB_SCRIPT_SUNDANESE: 295 296 /* Unicode-5.2 additions */ 297 case HB_SCRIPT_JAVANESE: 298 case HB_SCRIPT_KAITHI: 299 case HB_SCRIPT_MEETEI_MAYEK: 300 301 /* Unicode-6.0 additions */ 302 303 /* Unicode-6.1 additions */ 304 case HB_SCRIPT_CHAKMA: 305 case HB_SCRIPT_SHARADA: 306 case HB_SCRIPT_TAKRI: 307 308 /* If the designer designed the font for the 'DFLT' script, 309 * use the default shaper. Otherwise, use the Indic shaper. 310 * Note that for some simple scripts, there may not be *any* 311 * GSUB/GPOS needed, so there may be no scripts found! */ 312 if (planner->map.chosen_script[0] == HB_TAG ('D','F','L','T')) 313 return &_hb_ot_complex_shaper_default; 314 else 315 return &_hb_ot_complex_shaper_indic; 316 317 case HB_SCRIPT_KHMER: 318 /* A number of Khmer fonts in the wild don't have a 'pref' feature, 319 * and as such won't shape properly via the Indic shaper; 320 * however, they typically have 'liga' / 'clig' features that implement 321 * the necessary "reordering" by means of ligature substitutions. 322 * So we send such pref-less fonts through the generic shaper instead. */ 323 if (planner->map.found_script[0] && 324 hb_ot_layout_language_find_feature (planner->face, HB_OT_TAG_GSUB, 325 planner->map.script_index[0], 326 planner->map.language_index[0], 327 HB_TAG ('p','r','e','f'), 328 NULL)) 329 return &_hb_ot_complex_shaper_indic; 330 else 331 return &_hb_ot_complex_shaper_default; 332 333 case HB_SCRIPT_MYANMAR: 334 if (planner->map.chosen_script[0] == HB_TAG ('m','y','m','2')) 335 return &_hb_ot_complex_shaper_myanmar; 336 else if (planner->map.chosen_script[0] == HB_TAG ('m','y','m','r')) 337 return &_hb_ot_complex_shaper_myanmar_old; 338 else 339 return &_hb_ot_complex_shaper_default; 340 341 /* Unicode-4.1 additions */ 342 case HB_SCRIPT_BUGINESE: 343 344 /* Unicode-5.1 additions */ 345 case HB_SCRIPT_CHAM: 346 347 /* Unicode-5.2 additions */ 348 case HB_SCRIPT_TAI_THAM: 349 350 /* If the designer designed the font for the 'DFLT' script, 351 * use the default shaper. Otherwise, use the Indic shaper. 352 * Note that for some simple scripts, there may not be *any* 353 * GSUB/GPOS needed, so there may be no scripts found! */ 354 if (planner->map.chosen_script[0] == HB_TAG ('D','F','L','T')) 355 return &_hb_ot_complex_shaper_default; 356 else 357 return &_hb_ot_complex_shaper_sea; 358 } 359 } 360 361 362 #endif /* HB_OT_SHAPE_COMPLEX_PRIVATE_HH */ 363