1 /* 2 * Copyright 1998-2004 David Turner and Werner Lemberg 3 * Copyright 2004,2007,2009,2010 Red Hat, Inc. 4 * Copyright 2011,2012 Google, Inc. 5 * 6 * This is part of HarfBuzz, a text shaping library. 7 * 8 * Permission is hereby granted, without written agreement and without 9 * license or royalty fees, to use, copy, modify, and distribute this 10 * software and its documentation for any purpose, provided that the 11 * above copyright notice and the following two paragraphs appear in 12 * all copies of this software. 13 * 14 * IN NO EVENT SHALL THE COPYRIGHT HOLDER BE LIABLE TO ANY PARTY FOR 15 * DIRECT, INDIRECT, SPECIAL, INCIDENTAL, OR CONSEQUENTIAL DAMAGES 16 * ARISING OUT OF THE USE OF THIS SOFTWARE AND ITS DOCUMENTATION, EVEN 17 * IF THE COPYRIGHT HOLDER HAS BEEN ADVISED OF THE POSSIBILITY OF SUCH 18 * DAMAGE. 19 * 20 * THE COPYRIGHT HOLDER SPECIFICALLY DISCLAIMS ANY WARRANTIES, INCLUDING, 21 * BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND 22 * FITNESS FOR A PARTICULAR PURPOSE. THE SOFTWARE PROVIDED HEREUNDER IS 23 * ON AN "AS IS" BASIS, AND THE COPYRIGHT HOLDER HAS NO OBLIGATION TO 24 * PROVIDE MAINTENANCE, SUPPORT, UPDATES, ENHANCEMENTS, OR MODIFICATIONS. 25 * 26 * Red Hat Author(s): Owen Taylor, Behdad Esfahbod 27 * Google Author(s): Behdad Esfahbod 28 */ 29 30 #ifndef HB_BUFFER_HH 31 #define HB_BUFFER_HH 32 33 #include "hb.hh" 34 #include "hb-unicode.hh" 35 36 37 #ifndef HB_BUFFER_MAX_LEN_FACTOR 38 #define HB_BUFFER_MAX_LEN_FACTOR 32 39 #endif 40 #ifndef HB_BUFFER_MAX_LEN_MIN 41 #define HB_BUFFER_MAX_LEN_MIN 8192 42 #endif 43 #ifndef HB_BUFFER_MAX_LEN_DEFAULT 44 #define HB_BUFFER_MAX_LEN_DEFAULT 0x3FFFFFFF /* Shaping more than a billion chars? Let us know! */ 45 #endif 46 47 #ifndef HB_BUFFER_MAX_OPS_FACTOR 48 #define HB_BUFFER_MAX_OPS_FACTOR 64 49 #endif 50 #ifndef HB_BUFFER_MAX_OPS_MIN 51 #define HB_BUFFER_MAX_OPS_MIN 1024 52 #endif 53 #ifndef HB_BUFFER_MAX_OPS_DEFAULT 54 #define HB_BUFFER_MAX_OPS_DEFAULT 0x1FFFFFFF /* Shaping more than a billion operations? Let us know! */ 55 #endif 56 57 static_assert ((sizeof (hb_glyph_info_t) == 20), ""); 58 static_assert ((sizeof (hb_glyph_info_t) == sizeof (hb_glyph_position_t)), ""); 59 60 HB_MARK_AS_FLAG_T (hb_buffer_flags_t); 61 HB_MARK_AS_FLAG_T (hb_buffer_serialize_flags_t); 62 HB_MARK_AS_FLAG_T (hb_buffer_diff_flags_t); 63 64 enum hb_buffer_scratch_flags_t { 65 HB_BUFFER_SCRATCH_FLAG_DEFAULT = 0x00000000u, 66 HB_BUFFER_SCRATCH_FLAG_HAS_NON_ASCII = 0x00000001u, 67 HB_BUFFER_SCRATCH_FLAG_HAS_DEFAULT_IGNORABLES = 0x00000002u, 68 HB_BUFFER_SCRATCH_FLAG_HAS_SPACE_FALLBACK = 0x00000004u, 69 HB_BUFFER_SCRATCH_FLAG_HAS_GPOS_ATTACHMENT = 0x00000008u, 70 HB_BUFFER_SCRATCH_FLAG_HAS_UNSAFE_TO_BREAK = 0x00000010u, 71 HB_BUFFER_SCRATCH_FLAG_HAS_CGJ = 0x00000020u, 72 73 /* Reserved for complex shapers' internal use. */ 74 HB_BUFFER_SCRATCH_FLAG_COMPLEX0 = 0x01000000u, 75 HB_BUFFER_SCRATCH_FLAG_COMPLEX1 = 0x02000000u, 76 HB_BUFFER_SCRATCH_FLAG_COMPLEX2 = 0x04000000u, 77 HB_BUFFER_SCRATCH_FLAG_COMPLEX3 = 0x08000000u, 78 }; 79 HB_MARK_AS_FLAG_T (hb_buffer_scratch_flags_t); 80 81 82 /* 83 * hb_buffer_t 84 */ 85 86 struct hb_buffer_t 87 { 88 hb_object_header_t header; 89 90 /* Information about how the text in the buffer should be treated */ 91 hb_unicode_funcs_t *unicode; /* Unicode functions */ 92 hb_buffer_flags_t flags; /* BOT / EOT / etc. */ 93 hb_buffer_cluster_level_t cluster_level; 94 hb_codepoint_t replacement; /* U+FFFD or something else. */ 95 hb_codepoint_t invisible; /* 0 or something else. */ 96 hb_buffer_scratch_flags_t scratch_flags; /* Have space-fallback, etc. */ 97 unsigned int max_len; /* Maximum allowed len. */ 98 int max_ops; /* Maximum allowed operations. */ 99 100 /* Buffer contents */ 101 hb_buffer_content_type_t content_type; 102 hb_segment_properties_t props; /* Script, language, direction */ 103 104 bool successful; /* Allocations successful */ 105 bool have_output; /* Whether we have an output buffer going on */ 106 bool have_positions; /* Whether we have positions */ 107 108 unsigned int idx; /* Cursor into ->info and ->pos arrays */ 109 unsigned int len; /* Length of ->info and ->pos arrays */ 110 unsigned int out_len; /* Length of ->out array if have_output */ 111 112 unsigned int allocated; /* Length of allocated arrays */ 113 hb_glyph_info_t *info; 114 hb_glyph_info_t *out_info; 115 hb_glyph_position_t *pos; 116 117 unsigned int serial; 118 119 /* Text before / after the main buffer contents. 120 * Always in Unicode, and ordered outward. 121 * Index 0 is for "pre-context", 1 for "post-context". */ 122 enum { CONTEXT_LENGTH = 5 }; 123 hb_codepoint_t context[2][CONTEXT_LENGTH]; 124 unsigned int context_len[2]; 125 126 /* Debugging API */ 127 hb_buffer_message_func_t message_func; 128 void *message_data; 129 hb_destroy_func_t message_destroy; 130 131 /* Internal debugging. */ 132 /* The bits here reflect current allocations of the bytes in glyph_info_t's var1 and var2. */ 133 #ifndef HB_NDEBUG 134 uint8_t allocated_var_bits; 135 #endif 136 137 138 /* Methods */ 139 140 bool in_error () const { return !successful; } 141 142 void allocate_var (unsigned int start, unsigned int count) 143 { 144 #ifndef HB_NDEBUG 145 unsigned int end = start + count; 146 assert (end <= 8); 147 unsigned int bits = (1u<<end) - (1u<<start); 148 assert (0 == (allocated_var_bits & bits)); 149 allocated_var_bits |= bits; 150 #endif 151 } 152 void deallocate_var (unsigned int start, unsigned int count) 153 { 154 #ifndef HB_NDEBUG 155 unsigned int end = start + count; 156 assert (end <= 8); 157 unsigned int bits = (1u<<end) - (1u<<start); 158 assert (bits == (allocated_var_bits & bits)); 159 allocated_var_bits &= ~bits; 160 #endif 161 } 162 void assert_var (unsigned int start, unsigned int count) 163 { 164 #ifndef HB_NDEBUG 165 unsigned int end = start + count; 166 assert (end <= 8); 167 unsigned int bits = (1u<<end) - (1u<<start); 168 assert (bits == (allocated_var_bits & bits)); 169 #endif 170 } 171 void deallocate_var_all () 172 { 173 #ifndef HB_NDEBUG 174 allocated_var_bits = 0; 175 #endif 176 } 177 178 hb_glyph_info_t &cur (unsigned int i = 0) { return info[idx + i]; } 179 hb_glyph_info_t cur (unsigned int i = 0) const { return info[idx + i]; } 180 181 hb_glyph_position_t &cur_pos (unsigned int i = 0) { return pos[idx + i]; } 182 hb_glyph_position_t cur_pos (unsigned int i = 0) const { return pos[idx + i]; } 183 184 hb_glyph_info_t &prev () { return out_info[out_len ? out_len - 1 : 0]; } 185 hb_glyph_info_t prev () const { return out_info[out_len ? out_len - 1 : 0]; } 186 187 bool has_separate_output () const { return info != out_info; } 188 189 190 HB_INTERNAL void reset (); 191 HB_INTERNAL void clear (); 192 193 unsigned int backtrack_len () const { return have_output? out_len : idx; } 194 unsigned int lookahead_len () const { return len - idx; } 195 unsigned int next_serial () { return serial++; } 196 197 HB_INTERNAL void add (hb_codepoint_t codepoint, 198 unsigned int cluster); 199 HB_INTERNAL void add_info (const hb_glyph_info_t &glyph_info); 200 201 HB_INTERNAL void reverse_range (unsigned int start, unsigned int end); 202 HB_INTERNAL void reverse (); 203 HB_INTERNAL void reverse_clusters (); 204 HB_INTERNAL void guess_segment_properties (); 205 206 HB_INTERNAL void swap_buffers (); 207 HB_INTERNAL void remove_output (); 208 HB_INTERNAL void clear_output (); 209 HB_INTERNAL void clear_positions (); 210 211 HB_INTERNAL void replace_glyphs (unsigned int num_in, 212 unsigned int num_out, 213 const hb_codepoint_t *glyph_data); 214 215 void replace_glyph (hb_codepoint_t glyph_index) 216 { 217 if (unlikely (out_info != info || out_len != idx)) { 218 if (unlikely (!make_room_for (1, 1))) return; 219 out_info[out_len] = info[idx]; 220 } 221 out_info[out_len].codepoint = glyph_index; 222 223 idx++; 224 out_len++; 225 } 226 /* Makes a copy of the glyph at idx to output and replace glyph_index */ 227 hb_glyph_info_t & output_glyph (hb_codepoint_t glyph_index) 228 { 229 if (unlikely (!make_room_for (0, 1))) return Crap(hb_glyph_info_t); 230 231 if (unlikely (idx == len && !out_len)) 232 return Crap(hb_glyph_info_t); 233 234 out_info[out_len] = idx < len ? info[idx] : out_info[out_len - 1]; 235 out_info[out_len].codepoint = glyph_index; 236 237 out_len++; 238 239 return out_info[out_len - 1]; 240 } 241 void output_info (const hb_glyph_info_t &glyph_info) 242 { 243 if (unlikely (!make_room_for (0, 1))) return; 244 245 out_info[out_len] = glyph_info; 246 247 out_len++; 248 } 249 /* Copies glyph at idx to output but doesn't advance idx */ 250 void copy_glyph () 251 { 252 if (unlikely (!make_room_for (0, 1))) return; 253 254 out_info[out_len] = info[idx]; 255 256 out_len++; 257 } 258 /* Copies glyph at idx to output and advance idx. 259 * If there's no output, just advance idx. */ 260 void 261 next_glyph () 262 { 263 if (have_output) 264 { 265 if (out_info != info || out_len != idx) 266 { 267 if (unlikely (!make_room_for (1, 1))) return; 268 out_info[out_len] = info[idx]; 269 } 270 out_len++; 271 } 272 273 idx++; 274 } 275 /* Copies n glyphs at idx to output and advance idx. 276 * If there's no output, just advance idx. */ 277 void 278 next_glyphs (unsigned int n) 279 { 280 if (have_output) 281 { 282 if (out_info != info || out_len != idx) 283 { 284 if (unlikely (!make_room_for (n, n))) return; 285 memmove (out_info + out_len, info + idx, n * sizeof (out_info[0])); 286 } 287 out_len += n; 288 } 289 290 idx += n; 291 } 292 /* Advance idx without copying to output. */ 293 void skip_glyph () { idx++; } 294 void reset_masks (hb_mask_t mask) 295 { 296 for (unsigned int j = 0; j < len; j++) 297 info[j].mask = mask; 298 } 299 void add_masks (hb_mask_t mask) 300 { 301 for (unsigned int j = 0; j < len; j++) 302 info[j].mask |= mask; 303 } 304 HB_INTERNAL void set_masks (hb_mask_t value, hb_mask_t mask, 305 unsigned int cluster_start, unsigned int cluster_end); 306 307 void merge_clusters (unsigned int start, unsigned int end) 308 { 309 if (end - start < 2) 310 return; 311 merge_clusters_impl (start, end); 312 } 313 HB_INTERNAL void merge_clusters_impl (unsigned int start, unsigned int end); 314 HB_INTERNAL void merge_out_clusters (unsigned int start, unsigned int end); 315 /* Merge clusters for deleting current glyph, and skip it. */ 316 HB_INTERNAL void delete_glyph (); 317 318 void unsafe_to_break (unsigned int start, 319 unsigned int end) 320 { 321 if (end - start < 2) 322 return; 323 unsafe_to_break_impl (start, end); 324 } 325 HB_INTERNAL void unsafe_to_break_impl (unsigned int start, unsigned int end); 326 HB_INTERNAL void unsafe_to_break_from_outbuffer (unsigned int start, unsigned int end); 327 328 329 /* Internal methods */ 330 HB_INTERNAL bool move_to (unsigned int i); /* i is output-buffer index. */ 331 332 HB_INTERNAL bool enlarge (unsigned int size); 333 334 bool ensure (unsigned int size) 335 { return likely (!size || size < allocated) ? true : enlarge (size); } 336 337 bool ensure_inplace (unsigned int size) 338 { return likely (!size || size < allocated); } 339 340 HB_INTERNAL bool make_room_for (unsigned int num_in, unsigned int num_out); 341 HB_INTERNAL bool shift_forward (unsigned int count); 342 343 typedef long scratch_buffer_t; 344 HB_INTERNAL scratch_buffer_t *get_scratch_buffer (unsigned int *size); 345 346 void clear_context (unsigned int side) { context_len[side] = 0; } 347 348 HB_INTERNAL void sort (unsigned int start, unsigned int end, int(*compar)(const hb_glyph_info_t *, const hb_glyph_info_t *)); 349 350 bool messaging () { return unlikely (message_func); } 351 bool message (hb_font_t *font, const char *fmt, ...) HB_PRINTF_FUNC(3, 4) 352 { 353 if (!messaging ()) 354 return true; 355 va_list ap; 356 va_start (ap, fmt); 357 bool ret = message_impl (font, fmt, ap); 358 va_end (ap); 359 return ret; 360 } 361 HB_INTERNAL bool message_impl (hb_font_t *font, const char *fmt, va_list ap) HB_PRINTF_FUNC(3, 0); 362 363 static void 364 set_cluster (hb_glyph_info_t &inf, unsigned int cluster, unsigned int mask = 0) 365 { 366 if (inf.cluster != cluster) 367 { 368 if (mask & HB_GLYPH_FLAG_UNSAFE_TO_BREAK) 369 inf.mask |= HB_GLYPH_FLAG_UNSAFE_TO_BREAK; 370 else 371 inf.mask &= ~HB_GLYPH_FLAG_UNSAFE_TO_BREAK; 372 } 373 inf.cluster = cluster; 374 } 375 376 int 377 _unsafe_to_break_find_min_cluster (const hb_glyph_info_t *infos, 378 unsigned int start, unsigned int end, 379 unsigned int cluster) const 380 { 381 for (unsigned int i = start; i < end; i++) 382 cluster = MIN<unsigned int> (cluster, infos[i].cluster); 383 return cluster; 384 } 385 void 386 _unsafe_to_break_set_mask (hb_glyph_info_t *infos, 387 unsigned int start, unsigned int end, 388 unsigned int cluster) 389 { 390 for (unsigned int i = start; i < end; i++) 391 if (cluster != infos[i].cluster) 392 { 393 scratch_flags |= HB_BUFFER_SCRATCH_FLAG_HAS_UNSAFE_TO_BREAK; 394 infos[i].mask |= HB_GLYPH_FLAG_UNSAFE_TO_BREAK; 395 } 396 } 397 398 void unsafe_to_break_all () 399 { unsafe_to_break_impl (0, len); } 400 void safe_to_break_all () 401 { 402 for (unsigned int i = 0; i < len; i++) 403 info[i].mask &= ~HB_GLYPH_FLAG_UNSAFE_TO_BREAK; 404 } 405 }; 406 DECLARE_NULL_INSTANCE (hb_buffer_t); 407 408 409 /* Loop over clusters. Duplicated in foreach_syllable(). */ 410 #define foreach_cluster(buffer, start, end) \ 411 for (unsigned int \ 412 _count = buffer->len, \ 413 start = 0, end = _count ? _next_cluster (buffer, 0) : 0; \ 414 start < _count; \ 415 start = end, end = _next_cluster (buffer, start)) 416 417 static inline unsigned int 418 _next_cluster (hb_buffer_t *buffer, unsigned int start) 419 { 420 hb_glyph_info_t *info = buffer->info; 421 unsigned int count = buffer->len; 422 423 unsigned int cluster = info[start].cluster; 424 while (++start < count && cluster == info[start].cluster) 425 ; 426 427 return start; 428 } 429 430 431 #define HB_BUFFER_XALLOCATE_VAR(b, func, var) \ 432 b->func (offsetof (hb_glyph_info_t, var) - offsetof(hb_glyph_info_t, var1), \ 433 sizeof (b->info[0].var)) 434 #define HB_BUFFER_ALLOCATE_VAR(b, var) HB_BUFFER_XALLOCATE_VAR (b, allocate_var, var ()) 435 #define HB_BUFFER_DEALLOCATE_VAR(b, var) HB_BUFFER_XALLOCATE_VAR (b, deallocate_var, var ()) 436 #define HB_BUFFER_ASSERT_VAR(b, var) HB_BUFFER_XALLOCATE_VAR (b, assert_var, var ()) 437 438 439 #endif /* HB_BUFFER_HH */ 440