Home | History | Annotate | Download | only in src
      1 /*
 * Copyright © 2010,2011,2012  Google, Inc.
      3  *
      4  *  This is part of HarfBuzz, a text shaping library.
      5  *
      6  * Permission is hereby granted, without written agreement and without
      7  * license or royalty fees, to use, copy, modify, and distribute this
      8  * software and its documentation for any purpose, provided that the
      9  * above copyright notice and the following two paragraphs appear in
     10  * all copies of this software.
     11  *
     12  * IN NO EVENT SHALL THE COPYRIGHT HOLDER BE LIABLE TO ANY PARTY FOR
     13  * DIRECT, INDIRECT, SPECIAL, INCIDENTAL, OR CONSEQUENTIAL DAMAGES
     14  * ARISING OUT OF THE USE OF THIS SOFTWARE AND ITS DOCUMENTATION, EVEN
     15  * IF THE COPYRIGHT HOLDER HAS BEEN ADVISED OF THE POSSIBILITY OF SUCH
     16  * DAMAGE.
     17  *
     18  * THE COPYRIGHT HOLDER SPECIFICALLY DISCLAIMS ANY WARRANTIES, INCLUDING,
     19  * BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND
     20  * FITNESS FOR A PARTICULAR PURPOSE.  THE SOFTWARE PROVIDED HEREUNDER IS
     21  * ON AN "AS IS" BASIS, AND THE COPYRIGHT HOLDER HAS NO OBLIGATION TO
     22  * PROVIDE MAINTENANCE, SUPPORT, UPDATES, ENHANCEMENTS, OR MODIFICATIONS.
     23  *
     24  * Google Author(s): Behdad Esfahbod
     25  */
     26 
     27 #ifndef HB_OT_SHAPE_COMPLEX_HH
     28 #define HB_OT_SHAPE_COMPLEX_HH
     29 
     30 #include "hb.hh"
     31 
     32 #include "hb-ot-layout.hh"
     33 #include "hb-ot-shape.hh"
     34 #include "hb-ot-shape-normalize.hh"
     35 
     36 
/* Buffer var allocations, used by complex shapers.
 *
 * Each macro expands to a bare member-access suffix (var2.u8[2] and
 * var2.u8[3] respectively), so it has to be written after an object
 * expression and a '.' or '->'.
 * NOTE(review): presumably applied to the glyph-info entries of a buffer
 * (e.g. info.complex_var_u8_0()) -- confirm against the shaper sources. */
#define complex_var_u8_0()	var2.u8[2]
#define complex_var_u8_1()	var2.u8[3]
     40 
     41 
/* NOTE(review): going by the name, an upper bound on the number of combining
 * marks a complex shaper deals with at once; the use sites are not in this
 * header -- confirm there before changing the value. */
#define HB_OT_SHAPE_COMPLEX_MAX_COMBINING_MARKS 32
     43 
/* Zero-width-marks policy of a shaper; stored in the zero_width_marks
 * member of hb_ot_complex_shaper_t.
 * NOTE(review): going by the names, NONE leaves mark advances alone, while
 * the BY_GDEF_* values zero the advance of glyphs GDEF classifies as marks,
 * either early or late in positioning -- confirm the exact timing in the
 * shaping code. */
enum hb_ot_shape_zero_width_marks_type_t {
  HB_OT_SHAPE_ZERO_WIDTH_MARKS_NONE,
  HB_OT_SHAPE_ZERO_WIDTH_MARKS_BY_GDEF_EARLY,
  HB_OT_SHAPE_ZERO_WIDTH_MARKS_BY_GDEF_LATE
};
     49 
     50 
/* Master OT shaper list.
 *
 * This is an X-macro: define HB_COMPLEX_SHAPER_IMPLEMENT(name) to whatever
 * should be generated per shaper, expand this list, then #undef it again.
 * This header expands it once to declare a _hb_ot_complex_shaper_<name>
 * object for every entry.  Every line but the last must end in a
 * backslash, so new entries go above the trailing comment. */
#define HB_COMPLEX_SHAPERS_IMPLEMENT_SHAPERS \
  HB_COMPLEX_SHAPER_IMPLEMENT (default) /* should be first */ \
  HB_COMPLEX_SHAPER_IMPLEMENT (arabic) \
  HB_COMPLEX_SHAPER_IMPLEMENT (hangul) \
  HB_COMPLEX_SHAPER_IMPLEMENT (hebrew) \
  HB_COMPLEX_SHAPER_IMPLEMENT (indic) \
  HB_COMPLEX_SHAPER_IMPLEMENT (khmer) \
  HB_COMPLEX_SHAPER_IMPLEMENT (myanmar) \
  HB_COMPLEX_SHAPER_IMPLEMENT (myanmar_zawgyi) \
  HB_COMPLEX_SHAPER_IMPLEMENT (thai) \
  HB_COMPLEX_SHAPER_IMPLEMENT (use) \
  /* ^--- Add new shapers here */
     64 
     65 
/* hb_ot_complex_shaper_t
 * Description of one complex shaper: a set of optional callbacks plus a few
 * plain settings.  Callbacks documented as "May be NULL" can be left unset.
 * The member order is part of the interface; do not reorder.
 */
struct hb_ot_complex_shaper_t
{
  /* collect_features()
   * Called during shape_plan().
   * Shapers should use plan->map to add their features and callbacks.
   * May be NULL.
   */
  void (*collect_features) (hb_ot_shape_planner_t *plan);

  /* override_features()
   * Called during shape_plan().
   * Shapers should use plan->map to override features and add callbacks after
   * common features are added.
   * May be NULL.
   */
  void (*override_features) (hb_ot_shape_planner_t *plan);


  /* data_create()
   * Called at the end of shape_plan().
   * Whatever shapers return will be accessible through plan->data later.
   * If nullptr is returned, means a plan failure.
   */
  void *(*data_create) (const hb_ot_shape_plan_t *plan);

  /* data_destroy()
   * Called when the shape_plan is being destroyed.
   * plan->data is passed here for destruction.
   * Returns nothing, so it has no way to report a failure.
   * May be NULL.
   */
  void (*data_destroy) (void *data);


  /* preprocess_text()
   * Called during shape().
   * Shapers can use to modify text before shaping starts.
   * May be NULL.
   */
  void (*preprocess_text) (const hb_ot_shape_plan_t *plan,
			   hb_buffer_t              *buffer,
			   hb_font_t                *font);

  /* postprocess_glyphs()
   * Called during shape().
   * Shapers can use to modify glyphs after shaping ends.
   * May be NULL.
   */
  void (*postprocess_glyphs) (const hb_ot_shape_plan_t *plan,
			      hb_buffer_t              *buffer,
			      hb_font_t                *font);


  /* normalization_preference
   * The normalization mode this shaper asks for.
   */
  hb_ot_shape_normalization_mode_t normalization_preference;

  /* decompose()
   * Called during shape()'s normalization.
   * Takes a codepoint ab and has out-parameters a and b for its two parts;
   * NOTE(review): the bool presumably reports whether a decomposition was
   * produced -- confirm against the normalizer.
   * May be NULL.
   */
  bool (*decompose) (const hb_ot_shape_normalize_context_t *c,
		     hb_codepoint_t  ab,
		     hb_codepoint_t *a,
		     hb_codepoint_t *b);

  /* compose()
   * Called during shape()'s normalization.
   * Takes codepoints a and b and has out-parameter ab for the combined one;
   * NOTE(review): the bool presumably reports whether a composition was
   * produced -- confirm against the normalizer.
   * May be NULL.
   */
  bool (*compose) (const hb_ot_shape_normalize_context_t *c,
		   hb_codepoint_t  a,
		   hb_codepoint_t  b,
		   hb_codepoint_t *ab);

  /* setup_masks()
   * Called during shape().
   * Shapers should use map to get feature masks and set on buffer.
   * Shapers may NOT modify characters.
   * May be NULL.
   */
  void (*setup_masks) (const hb_ot_shape_plan_t *plan,
		       hb_buffer_t              *buffer,
		       hb_font_t                *font);

  /* gpos_tag
   * If not HB_TAG_NONE, then must match found GPOS script tag for
   * GPOS to be applied.  Otherwise, fallback positioning will be used.
   */
  hb_tag_t gpos_tag;

  /* reorder_marks()
   * Called during shape().
   * Shapers can use to modify ordering of combining marks.
   * start and end delimit the part of the buffer to work on.
   * NOTE(review): presumably a half-open [start, end) range -- confirm.
   * May be NULL.
   */
  void (*reorder_marks) (const hb_ot_shape_plan_t *plan,
			 hb_buffer_t              *buffer,
			 unsigned int              start,
			 unsigned int              end);

  /* zero_width_marks
   * Which hb_ot_shape_zero_width_marks_type_t policy this shaper wants.
   */
  hb_ot_shape_zero_width_marks_type_t zero_width_marks;

  /* fallback_position
   * NOTE(review): presumably whether fallback mark positioning may be used
   * for this shaper -- confirm at the use site.
   */
  bool fallback_position;
};
    169 
/* Declare the shaper objects.  HB_COMPLEX_SHAPER_IMPLEMENT is defined just
 * for the expansion below, which yields one
 *   extern HB_INTERNAL const hb_ot_complex_shaper_t _hb_ot_complex_shaper_<name>;
 * per entry of HB_COMPLEX_SHAPERS_IMPLEMENT_SHAPERS, and is undefined again
 * right after.  The objects themselves are defined outside this header. */
#define HB_COMPLEX_SHAPER_IMPLEMENT(name) extern HB_INTERNAL const hb_ot_complex_shaper_t _hb_ot_complex_shaper_##name;
HB_COMPLEX_SHAPERS_IMPLEMENT_SHAPERS
#undef HB_COMPLEX_SHAPER_IMPLEMENT
    173 
    174 
    175 static inline const hb_ot_complex_shaper_t *
    176 hb_ot_shape_complex_categorize (const hb_ot_shape_planner_t *planner)
    177 {
    178   switch ((hb_tag_t) planner->props.script)
    179   {
    180     default:
    181       return &_hb_ot_complex_shaper_default;
    182 
    183 
    184     /* Unicode-1.1 additions */
    185     case HB_SCRIPT_ARABIC:
    186 
    187     /* Unicode-3.0 additions */
    188     case HB_SCRIPT_MONGOLIAN:
    189     case HB_SCRIPT_SYRIAC:
    190 
    191     /* Unicode-5.0 additions */
    192     case HB_SCRIPT_NKO:
    193     case HB_SCRIPT_PHAGS_PA:
    194 
    195     /* Unicode-6.0 additions */
    196     case HB_SCRIPT_MANDAIC:
    197 
    198     /* Unicode-7.0 additions */
    199     case HB_SCRIPT_MANICHAEAN:
    200     case HB_SCRIPT_PSALTER_PAHLAVI:
    201 
    202     /* Unicode-9.0 additions */
    203     case HB_SCRIPT_ADLAM:
    204 
    205     /* Unicode-11.0 additions */
    206     case HB_SCRIPT_HANIFI_ROHINGYA:
    207     case HB_SCRIPT_SOGDIAN:
    208 
    209       /* For Arabic script, use the Arabic shaper even if no OT script tag was found.
    210        * This is because we do fallback shaping for Arabic script (and not others).
    211        * But note that Arabic shaping is applicable only to horizontal layout; for
    212        * vertical text, just use the generic shaper instead. */
    213       if ((planner->map.chosen_script[0] != HB_OT_TAG_DEFAULT_SCRIPT ||
    214 	   planner->props.script == HB_SCRIPT_ARABIC) &&
    215 	  HB_DIRECTION_IS_HORIZONTAL(planner->props.direction))
    216 	return &_hb_ot_complex_shaper_arabic;
    217       else
    218 	return &_hb_ot_complex_shaper_default;
    219 
    220 
    221     /* Unicode-1.1 additions */
    222     case HB_SCRIPT_THAI:
    223     case HB_SCRIPT_LAO:
    224 
    225       return &_hb_ot_complex_shaper_thai;
    226 
    227 
    228     /* Unicode-1.1 additions */
    229     case HB_SCRIPT_HANGUL:
    230 
    231       return &_hb_ot_complex_shaper_hangul;
    232 
    233 
    234     /* Unicode-1.1 additions */
    235     case HB_SCRIPT_HEBREW:
    236 
    237       return &_hb_ot_complex_shaper_hebrew;
    238 
    239 
    240     /* Unicode-1.1 additions */
    241     case HB_SCRIPT_BENGALI:
    242     case HB_SCRIPT_DEVANAGARI:
    243     case HB_SCRIPT_GUJARATI:
    244     case HB_SCRIPT_GURMUKHI:
    245     case HB_SCRIPT_KANNADA:
    246     case HB_SCRIPT_MALAYALAM:
    247     case HB_SCRIPT_ORIYA:
    248     case HB_SCRIPT_TAMIL:
    249     case HB_SCRIPT_TELUGU:
    250 
    251     /* Unicode-3.0 additions */
    252     case HB_SCRIPT_SINHALA:
    253 
    254       /* If the designer designed the font for the 'DFLT' script,
    255        * (or we ended up arbitrarily pick 'latn'), use the default shaper.
    256        * Otherwise, use the specific shaper.
    257        *
    258        * If it's indy3 tag, send to USE. */
    259       if (planner->map.chosen_script[0] == HB_TAG ('D','F','L','T') ||
    260 	  planner->map.chosen_script[0] == HB_TAG ('l','a','t','n'))
    261 	return &_hb_ot_complex_shaper_default;
    262       else if ((planner->map.chosen_script[0] & 0x000000FF) == '3')
    263 	return &_hb_ot_complex_shaper_use;
    264       else
    265 	return &_hb_ot_complex_shaper_indic;
    266 
    267     case HB_SCRIPT_KHMER:
    268 	return &_hb_ot_complex_shaper_khmer;
    269 
    270     case HB_SCRIPT_MYANMAR:
    271       /* If the designer designed the font for the 'DFLT' script,
    272        * (or we ended up arbitrarily pick 'latn'), use the default shaper.
    273        * Otherwise, use the specific shaper.
    274        *
    275        * If designer designed for 'mymr' tag, also send to default
    276        * shaper.  That's tag used from before Myanmar shaping spec
    277        * was developed.  The shaping spec uses 'mym2' tag. */
    278       if (planner->map.chosen_script[0] == HB_TAG ('D','F','L','T') ||
    279 	  planner->map.chosen_script[0] == HB_TAG ('l','a','t','n') ||
    280 	  planner->map.chosen_script[0] == HB_TAG ('m','y','m','r'))
    281 	return &_hb_ot_complex_shaper_default;
    282       else
    283 	return &_hb_ot_complex_shaper_myanmar;
    284 
    285 
    286     /* https://github.com/harfbuzz/harfbuzz/issues/1162 */
    287     case HB_SCRIPT_MYANMAR_ZAWGYI:
    288 
    289       return &_hb_ot_complex_shaper_myanmar_zawgyi;
    290 
    291 
    292     /* Unicode-2.0 additions */
    293     case HB_SCRIPT_TIBETAN:
    294 
    295     /* Unicode-3.0 additions */
    296     //case HB_SCRIPT_MONGOLIAN:
    297     //case HB_SCRIPT_SINHALA:
    298 
    299     /* Unicode-3.2 additions */
    300     case HB_SCRIPT_BUHID:
    301     case HB_SCRIPT_HANUNOO:
    302     case HB_SCRIPT_TAGALOG:
    303     case HB_SCRIPT_TAGBANWA:
    304 
    305     /* Unicode-4.0 additions */
    306     case HB_SCRIPT_LIMBU:
    307     case HB_SCRIPT_TAI_LE:
    308 
    309     /* Unicode-4.1 additions */
    310     case HB_SCRIPT_BUGINESE:
    311     case HB_SCRIPT_KHAROSHTHI:
    312     case HB_SCRIPT_SYLOTI_NAGRI:
    313     case HB_SCRIPT_TIFINAGH:
    314 
    315     /* Unicode-5.0 additions */
    316     case HB_SCRIPT_BALINESE:
    317     //case HB_SCRIPT_NKO:
    318     //case HB_SCRIPT_PHAGS_PA:
    319 
    320     /* Unicode-5.1 additions */
    321     case HB_SCRIPT_CHAM:
    322     case HB_SCRIPT_KAYAH_LI:
    323     case HB_SCRIPT_LEPCHA:
    324     case HB_SCRIPT_REJANG:
    325     case HB_SCRIPT_SAURASHTRA:
    326     case HB_SCRIPT_SUNDANESE:
    327 
    328     /* Unicode-5.2 additions */
    329     case HB_SCRIPT_EGYPTIAN_HIEROGLYPHS:
    330     case HB_SCRIPT_JAVANESE:
    331     case HB_SCRIPT_KAITHI:
    332     case HB_SCRIPT_MEETEI_MAYEK:
    333     case HB_SCRIPT_TAI_THAM:
    334     case HB_SCRIPT_TAI_VIET:
    335 
    336     /* Unicode-6.0 additions */
    337     case HB_SCRIPT_BATAK:
    338     case HB_SCRIPT_BRAHMI:
    339     //case HB_SCRIPT_MANDAIC:
    340 
    341     /* Unicode-6.1 additions */
    342     case HB_SCRIPT_CHAKMA:
    343     case HB_SCRIPT_SHARADA:
    344     case HB_SCRIPT_TAKRI:
    345 
    346     /* Unicode-7.0 additions */
    347     case HB_SCRIPT_DUPLOYAN:
    348     case HB_SCRIPT_GRANTHA:
    349     case HB_SCRIPT_KHOJKI:
    350     case HB_SCRIPT_KHUDAWADI:
    351     case HB_SCRIPT_MAHAJANI:
    352     //case HB_SCRIPT_MANICHAEAN:
    353     case HB_SCRIPT_MODI:
    354     case HB_SCRIPT_PAHAWH_HMONG:
    355     //case HB_SCRIPT_PSALTER_PAHLAVI:
    356     case HB_SCRIPT_SIDDHAM:
    357     case HB_SCRIPT_TIRHUTA:
    358 
    359     /* Unicode-8.0 additions */
    360     case HB_SCRIPT_AHOM:
    361 
    362     /* Unicode-9.0 additions */
    363     //case HB_SCRIPT_ADLAM:
    364     case HB_SCRIPT_BHAIKSUKI:
    365     case HB_SCRIPT_MARCHEN:
    366     case HB_SCRIPT_NEWA:
    367 
    368     /* Unicode-10.0 additions */
    369     case HB_SCRIPT_MASARAM_GONDI:
    370     case HB_SCRIPT_SOYOMBO:
    371     case HB_SCRIPT_ZANABAZAR_SQUARE:
    372 
    373     /* Unicode-11.0 additions */
    374     case HB_SCRIPT_DOGRA:
    375     case HB_SCRIPT_GUNJALA_GONDI:
    376     //case HB_SCRIPT_HANIFI_ROHINGYA:
    377     case HB_SCRIPT_MAKASAR:
    378     //case HB_SCRIPT_SOGDIAN:
    379 
    380       /* If the designer designed the font for the 'DFLT' script,
    381        * (or we ended up arbitrarily pick 'latn'), use the default shaper.
    382        * Otherwise, use the specific shaper.
    383        * Note that for some simple scripts, there may not be *any*
    384        * GSUB/GPOS needed, so there may be no scripts found! */
    385       if (planner->map.chosen_script[0] == HB_TAG ('D','F','L','T') ||
    386 	  planner->map.chosen_script[0] == HB_TAG ('l','a','t','n'))
    387 	return &_hb_ot_complex_shaper_default;
    388       else
    389 	return &_hb_ot_complex_shaper_use;
    390   }
    391 }
    392 
    393 
    394 #endif /* HB_OT_SHAPE_COMPLEX_HH */
    395