Home | History | Annotate | Download | only in src
      1 /*
      2  * Copyright  2009  Red Hat, Inc.
      3  * Copyright  2011  Codethink Limited
      4  * Copyright  2011,2012  Google, Inc.
      5  *
      6  *  This is part of HarfBuzz, a text shaping library.
      7  *
      8  * Permission is hereby granted, without written agreement and without
      9  * license or royalty fees, to use, copy, modify, and distribute this
     10  * software and its documentation for any purpose, provided that the
     11  * above copyright notice and the following two paragraphs appear in
     12  * all copies of this software.
     13  *
     14  * IN NO EVENT SHALL THE COPYRIGHT HOLDER BE LIABLE TO ANY PARTY FOR
     15  * DIRECT, INDIRECT, SPECIAL, INCIDENTAL, OR CONSEQUENTIAL DAMAGES
     16  * ARISING OUT OF THE USE OF THIS SOFTWARE AND ITS DOCUMENTATION, EVEN
     17  * IF THE COPYRIGHT HOLDER HAS BEEN ADVISED OF THE POSSIBILITY OF SUCH
     18  * DAMAGE.
     19  *
     20  * THE COPYRIGHT HOLDER SPECIFICALLY DISCLAIMS ANY WARRANTIES, INCLUDING,
     21  * BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND
     22  * FITNESS FOR A PARTICULAR PURPOSE.  THE SOFTWARE PROVIDED HEREUNDER IS
     23  * ON AN "AS IS" BASIS, AND THE COPYRIGHT HOLDER HAS NO OBLIGATION TO
     24  * PROVIDE MAINTENANCE, SUPPORT, UPDATES, ENHANCEMENTS, OR MODIFICATIONS.
     25  *
     26  * Red Hat Author(s): Behdad Esfahbod
     27  * Codethink Author(s): Ryan Lortie
     28  * Google Author(s): Behdad Esfahbod
     29  */
     30 
     31 #ifndef HB_H_IN
     32 #error "Include <hb.h> instead."
     33 #endif
     34 
     35 #ifndef HB_UNICODE_H
     36 #define HB_UNICODE_H
     37 
     38 #include "hb-common.h"
     39 
     40 HB_BEGIN_DECLS
     41 
     42 
     43 /**
     44  * HB_UNICODE_MAX
     45  *
     46  * Since: 1.9.0
     47  **/
     48 #define HB_UNICODE_MAX 0x10FFFFu
     49 
     50 
     51 /* hb_unicode_general_category_t */
     52 
     53 /* Unicode Character Database property: General_Category (gc) */
     54 typedef enum
     55 {
     56   HB_UNICODE_GENERAL_CATEGORY_CONTROL,			/* Cc */
     57   HB_UNICODE_GENERAL_CATEGORY_FORMAT,			/* Cf */
     58   HB_UNICODE_GENERAL_CATEGORY_UNASSIGNED,		/* Cn */
     59   HB_UNICODE_GENERAL_CATEGORY_PRIVATE_USE,		/* Co */
     60   HB_UNICODE_GENERAL_CATEGORY_SURROGATE,		/* Cs */
     61   HB_UNICODE_GENERAL_CATEGORY_LOWERCASE_LETTER,		/* Ll */
     62   HB_UNICODE_GENERAL_CATEGORY_MODIFIER_LETTER,		/* Lm */
     63   HB_UNICODE_GENERAL_CATEGORY_OTHER_LETTER,		/* Lo */
     64   HB_UNICODE_GENERAL_CATEGORY_TITLECASE_LETTER,		/* Lt */
     65   HB_UNICODE_GENERAL_CATEGORY_UPPERCASE_LETTER,		/* Lu */
     66   HB_UNICODE_GENERAL_CATEGORY_SPACING_MARK,		/* Mc */
     67   HB_UNICODE_GENERAL_CATEGORY_ENCLOSING_MARK,		/* Me */
     68   HB_UNICODE_GENERAL_CATEGORY_NON_SPACING_MARK,		/* Mn */
     69   HB_UNICODE_GENERAL_CATEGORY_DECIMAL_NUMBER,		/* Nd */
     70   HB_UNICODE_GENERAL_CATEGORY_LETTER_NUMBER,		/* Nl */
     71   HB_UNICODE_GENERAL_CATEGORY_OTHER_NUMBER,		/* No */
     72   HB_UNICODE_GENERAL_CATEGORY_CONNECT_PUNCTUATION,	/* Pc */
     73   HB_UNICODE_GENERAL_CATEGORY_DASH_PUNCTUATION,		/* Pd */
     74   HB_UNICODE_GENERAL_CATEGORY_CLOSE_PUNCTUATION,	/* Pe */
     75   HB_UNICODE_GENERAL_CATEGORY_FINAL_PUNCTUATION,	/* Pf */
     76   HB_UNICODE_GENERAL_CATEGORY_INITIAL_PUNCTUATION,	/* Pi */
     77   HB_UNICODE_GENERAL_CATEGORY_OTHER_PUNCTUATION,	/* Po */
     78   HB_UNICODE_GENERAL_CATEGORY_OPEN_PUNCTUATION,		/* Ps */
     79   HB_UNICODE_GENERAL_CATEGORY_CURRENCY_SYMBOL,		/* Sc */
     80   HB_UNICODE_GENERAL_CATEGORY_MODIFIER_SYMBOL,		/* Sk */
     81   HB_UNICODE_GENERAL_CATEGORY_MATH_SYMBOL,		/* Sm */
     82   HB_UNICODE_GENERAL_CATEGORY_OTHER_SYMBOL,		/* So */
     83   HB_UNICODE_GENERAL_CATEGORY_LINE_SEPARATOR,		/* Zl */
     84   HB_UNICODE_GENERAL_CATEGORY_PARAGRAPH_SEPARATOR,	/* Zp */
     85   HB_UNICODE_GENERAL_CATEGORY_SPACE_SEPARATOR		/* Zs */
     86 } hb_unicode_general_category_t;
     87 
     88 /* hb_unicode_combining_class_t */
     89 
     90 /* Note: newer versions of Unicode may add new values.  Clients should be ready to handle
     91  * any value in the 0..254 range being returned from hb_unicode_combining_class().
     92  */
     93 
     94 /* Unicode Character Database property: Canonical_Combining_Class (ccc) */
     95 typedef enum
     96 {
     97   HB_UNICODE_COMBINING_CLASS_NOT_REORDERED	= 0,
     98   HB_UNICODE_COMBINING_CLASS_OVERLAY		= 1,
     99   HB_UNICODE_COMBINING_CLASS_NUKTA		= 7,
    100   HB_UNICODE_COMBINING_CLASS_KANA_VOICING	= 8,
    101   HB_UNICODE_COMBINING_CLASS_VIRAMA		= 9,
    102 
    103   /* Hebrew */
    104   HB_UNICODE_COMBINING_CLASS_CCC10	=  10,
    105   HB_UNICODE_COMBINING_CLASS_CCC11	=  11,
    106   HB_UNICODE_COMBINING_CLASS_CCC12	=  12,
    107   HB_UNICODE_COMBINING_CLASS_CCC13	=  13,
    108   HB_UNICODE_COMBINING_CLASS_CCC14	=  14,
    109   HB_UNICODE_COMBINING_CLASS_CCC15	=  15,
    110   HB_UNICODE_COMBINING_CLASS_CCC16	=  16,
    111   HB_UNICODE_COMBINING_CLASS_CCC17	=  17,
    112   HB_UNICODE_COMBINING_CLASS_CCC18	=  18,
    113   HB_UNICODE_COMBINING_CLASS_CCC19	=  19,
    114   HB_UNICODE_COMBINING_CLASS_CCC20	=  20,
    115   HB_UNICODE_COMBINING_CLASS_CCC21	=  21,
    116   HB_UNICODE_COMBINING_CLASS_CCC22	=  22,
    117   HB_UNICODE_COMBINING_CLASS_CCC23	=  23,
    118   HB_UNICODE_COMBINING_CLASS_CCC24	=  24,
    119   HB_UNICODE_COMBINING_CLASS_CCC25	=  25,
    120   HB_UNICODE_COMBINING_CLASS_CCC26	=  26,
    121 
    122   /* Arabic */
    123   HB_UNICODE_COMBINING_CLASS_CCC27	=  27,
    124   HB_UNICODE_COMBINING_CLASS_CCC28	=  28,
    125   HB_UNICODE_COMBINING_CLASS_CCC29	=  29,
    126   HB_UNICODE_COMBINING_CLASS_CCC30	=  30,
    127   HB_UNICODE_COMBINING_CLASS_CCC31	=  31,
    128   HB_UNICODE_COMBINING_CLASS_CCC32	=  32,
    129   HB_UNICODE_COMBINING_CLASS_CCC33	=  33,
    130   HB_UNICODE_COMBINING_CLASS_CCC34	=  34,
    131   HB_UNICODE_COMBINING_CLASS_CCC35	=  35,
    132 
    133   /* Syriac */
    134   HB_UNICODE_COMBINING_CLASS_CCC36	=  36,
    135 
    136   /* Telugu */
    137   HB_UNICODE_COMBINING_CLASS_CCC84	=  84,
    138   HB_UNICODE_COMBINING_CLASS_CCC91	=  91,
    139 
    140   /* Thai */
    141   HB_UNICODE_COMBINING_CLASS_CCC103	= 103,
    142   HB_UNICODE_COMBINING_CLASS_CCC107	= 107,
    143 
    144   /* Lao */
    145   HB_UNICODE_COMBINING_CLASS_CCC118	= 118,
    146   HB_UNICODE_COMBINING_CLASS_CCC122	= 122,
    147 
    148   /* Tibetan */
    149   HB_UNICODE_COMBINING_CLASS_CCC129	= 129,
    150   HB_UNICODE_COMBINING_CLASS_CCC130	= 130,
    151   HB_UNICODE_COMBINING_CLASS_CCC133	= 132,
    152 
    153 
    154   HB_UNICODE_COMBINING_CLASS_ATTACHED_BELOW_LEFT	= 200,
    155   HB_UNICODE_COMBINING_CLASS_ATTACHED_BELOW		= 202,
    156   HB_UNICODE_COMBINING_CLASS_ATTACHED_ABOVE		= 214,
    157   HB_UNICODE_COMBINING_CLASS_ATTACHED_ABOVE_RIGHT	= 216,
    158   HB_UNICODE_COMBINING_CLASS_BELOW_LEFT			= 218,
    159   HB_UNICODE_COMBINING_CLASS_BELOW			= 220,
    160   HB_UNICODE_COMBINING_CLASS_BELOW_RIGHT		= 222,
    161   HB_UNICODE_COMBINING_CLASS_LEFT			= 224,
    162   HB_UNICODE_COMBINING_CLASS_RIGHT			= 226,
    163   HB_UNICODE_COMBINING_CLASS_ABOVE_LEFT			= 228,
    164   HB_UNICODE_COMBINING_CLASS_ABOVE			= 230,
    165   HB_UNICODE_COMBINING_CLASS_ABOVE_RIGHT		= 232,
    166   HB_UNICODE_COMBINING_CLASS_DOUBLE_BELOW		= 233,
    167   HB_UNICODE_COMBINING_CLASS_DOUBLE_ABOVE		= 234,
    168 
    169   HB_UNICODE_COMBINING_CLASS_IOTA_SUBSCRIPT		= 240,
    170 
    171   HB_UNICODE_COMBINING_CLASS_INVALID	= 255
    172 } hb_unicode_combining_class_t;
    173 
    174 
    175 /*
    176  * hb_unicode_funcs_t
    177  */
    178 
    179 typedef struct hb_unicode_funcs_t hb_unicode_funcs_t;
    180 
    181 
    182 /*
    183  * just give me the best implementation you've got there.
    184  */
    185 HB_EXTERN hb_unicode_funcs_t *
    186 hb_unicode_funcs_get_default (void);
    187 
    188 
    189 HB_EXTERN hb_unicode_funcs_t *
    190 hb_unicode_funcs_create (hb_unicode_funcs_t *parent);
    191 
    192 HB_EXTERN hb_unicode_funcs_t *
    193 hb_unicode_funcs_get_empty (void);
    194 
    195 HB_EXTERN hb_unicode_funcs_t *
    196 hb_unicode_funcs_reference (hb_unicode_funcs_t *ufuncs);
    197 
    198 HB_EXTERN void
    199 hb_unicode_funcs_destroy (hb_unicode_funcs_t *ufuncs);
    200 
    201 HB_EXTERN hb_bool_t
    202 hb_unicode_funcs_set_user_data (hb_unicode_funcs_t *ufuncs,
    203 			        hb_user_data_key_t *key,
    204 			        void *              data,
    205 			        hb_destroy_func_t   destroy,
    206 				hb_bool_t           replace);
    207 
    208 
    209 HB_EXTERN void *
    210 hb_unicode_funcs_get_user_data (hb_unicode_funcs_t *ufuncs,
    211 			        hb_user_data_key_t *key);
    212 
    213 
    214 HB_EXTERN void
    215 hb_unicode_funcs_make_immutable (hb_unicode_funcs_t *ufuncs);
    216 
    217 HB_EXTERN hb_bool_t
    218 hb_unicode_funcs_is_immutable (hb_unicode_funcs_t *ufuncs);
    219 
    220 HB_EXTERN hb_unicode_funcs_t *
    221 hb_unicode_funcs_get_parent (hb_unicode_funcs_t *ufuncs);
    222 
    223 
    224 /*
    225  * funcs
    226  */
    227 
    228 /* typedefs */
    229 
    230 typedef hb_unicode_combining_class_t	(*hb_unicode_combining_class_func_t)	(hb_unicode_funcs_t *ufuncs,
    231 										 hb_codepoint_t      unicode,
    232 										 void               *user_data);
    233 typedef hb_unicode_general_category_t	(*hb_unicode_general_category_func_t)	(hb_unicode_funcs_t *ufuncs,
    234 										 hb_codepoint_t      unicode,
    235 										 void               *user_data);
    236 typedef hb_codepoint_t			(*hb_unicode_mirroring_func_t)		(hb_unicode_funcs_t *ufuncs,
    237 										 hb_codepoint_t      unicode,
    238 										 void               *user_data);
    239 typedef hb_script_t			(*hb_unicode_script_func_t)		(hb_unicode_funcs_t *ufuncs,
    240 										 hb_codepoint_t      unicode,
    241 										 void               *user_data);
    242 
    243 typedef hb_bool_t			(*hb_unicode_compose_func_t)		(hb_unicode_funcs_t *ufuncs,
    244 										 hb_codepoint_t      a,
    245 										 hb_codepoint_t      b,
    246 										 hb_codepoint_t     *ab,
    247 										 void               *user_data);
    248 typedef hb_bool_t			(*hb_unicode_decompose_func_t)		(hb_unicode_funcs_t *ufuncs,
    249 										 hb_codepoint_t      ab,
    250 										 hb_codepoint_t     *a,
    251 										 hb_codepoint_t     *b,
    252 										 void               *user_data);
    253 
    254 /* setters */
    255 
    256 /**
    257  * hb_unicode_funcs_set_combining_class_func:
    258  * @ufuncs: a Unicode function structure
    259  * @func: (closure user_data) (destroy destroy) (scope notified):
    260  * @user_data:
    261  * @destroy:
    262  *
    263  *
    264  *
    265  * Since: 0.9.2
    266  **/
    267 HB_EXTERN void
    268 hb_unicode_funcs_set_combining_class_func (hb_unicode_funcs_t *ufuncs,
    269 					   hb_unicode_combining_class_func_t func,
    270 					   void *user_data, hb_destroy_func_t destroy);
    271 
    272 /**
    273  * hb_unicode_funcs_set_general_category_func:
    274  * @ufuncs: a Unicode function structure
    275  * @func: (closure user_data) (destroy destroy) (scope notified):
    276  * @user_data:
    277  * @destroy:
    278  *
    279  *
    280  *
    281  * Since: 0.9.2
    282  **/
    283 HB_EXTERN void
    284 hb_unicode_funcs_set_general_category_func (hb_unicode_funcs_t *ufuncs,
    285 					    hb_unicode_general_category_func_t func,
    286 					    void *user_data, hb_destroy_func_t destroy);
    287 
    288 /**
    289  * hb_unicode_funcs_set_mirroring_func:
    290  * @ufuncs: a Unicode function structure
    291  * @func: (closure user_data) (destroy destroy) (scope notified):
    292  * @user_data:
    293  * @destroy:
    294  *
    295  *
    296  *
    297  * Since: 0.9.2
    298  **/
    299 HB_EXTERN void
    300 hb_unicode_funcs_set_mirroring_func (hb_unicode_funcs_t *ufuncs,
    301 				     hb_unicode_mirroring_func_t func,
    302 				     void *user_data, hb_destroy_func_t destroy);
    303 
    304 /**
    305  * hb_unicode_funcs_set_script_func:
    306  * @ufuncs: a Unicode function structure
    307  * @func: (closure user_data) (destroy destroy) (scope notified):
    308  * @user_data:
    309  * @destroy:
    310  *
    311  *
    312  *
    313  * Since: 0.9.2
    314  **/
    315 HB_EXTERN void
    316 hb_unicode_funcs_set_script_func (hb_unicode_funcs_t *ufuncs,
    317 				  hb_unicode_script_func_t func,
    318 				  void *user_data, hb_destroy_func_t destroy);
    319 
    320 /**
    321  * hb_unicode_funcs_set_compose_func:
    322  * @ufuncs: a Unicode function structure
    323  * @func: (closure user_data) (destroy destroy) (scope notified):
    324  * @user_data:
    325  * @destroy:
    326  *
    327  *
    328  *
    329  * Since: 0.9.2
    330  **/
    331 HB_EXTERN void
    332 hb_unicode_funcs_set_compose_func (hb_unicode_funcs_t *ufuncs,
    333 				   hb_unicode_compose_func_t func,
    334 				   void *user_data, hb_destroy_func_t destroy);
    335 
    336 /**
    337  * hb_unicode_funcs_set_decompose_func:
    338  * @ufuncs: a Unicode function structure
    339  * @func: (closure user_data) (destroy destroy) (scope notified):
    340  * @user_data:
    341  * @destroy:
    342  *
    343  *
    344  *
    345  * Since: 0.9.2
    346  **/
    347 HB_EXTERN void
    348 hb_unicode_funcs_set_decompose_func (hb_unicode_funcs_t *ufuncs,
    349 				     hb_unicode_decompose_func_t func,
    350 				     void *user_data, hb_destroy_func_t destroy);
    351 
    352 /* accessors */
    353 
    354 /**
    355  * hb_unicode_combining_class:
    356  *
    357  * Since: 0.9.2
    358  **/
    359 HB_EXTERN hb_unicode_combining_class_t
    360 hb_unicode_combining_class (hb_unicode_funcs_t *ufuncs,
    361 			    hb_codepoint_t unicode);
    362 
    363 /**
    364  * hb_unicode_general_category:
    365  *
    366  * Since: 0.9.2
    367  **/
    368 HB_EXTERN hb_unicode_general_category_t
    369 hb_unicode_general_category (hb_unicode_funcs_t *ufuncs,
    370 			     hb_codepoint_t unicode);
    371 
    372 /**
    373  * hb_unicode_mirroring:
    374  *
    375  * Since: 0.9.2
    376  **/
    377 HB_EXTERN hb_codepoint_t
    378 hb_unicode_mirroring (hb_unicode_funcs_t *ufuncs,
    379 		      hb_codepoint_t unicode);
    380 
    381 /**
    382  * hb_unicode_script:
    383  *
    384  * Since: 0.9.2
    385  **/
    386 HB_EXTERN hb_script_t
    387 hb_unicode_script (hb_unicode_funcs_t *ufuncs,
    388 		   hb_codepoint_t unicode);
    389 
    390 HB_EXTERN hb_bool_t
    391 hb_unicode_compose (hb_unicode_funcs_t *ufuncs,
    392 		    hb_codepoint_t      a,
    393 		    hb_codepoint_t      b,
    394 		    hb_codepoint_t     *ab);
    395 
    396 HB_EXTERN hb_bool_t
    397 hb_unicode_decompose (hb_unicode_funcs_t *ufuncs,
    398 		      hb_codepoint_t      ab,
    399 		      hb_codepoint_t     *a,
    400 		      hb_codepoint_t     *b);
    401 
    402 HB_END_DECLS
    403 
    404 #endif /* HB_UNICODE_H */
    405