| 1 | /* |
| 2 | * Copyright © 1998-2004 David Turner and Werner Lemberg |
| 3 | * Copyright © 2004,2007,2009,2010 Red Hat, Inc. |
| 4 | * Copyright © 2011,2012 Google, Inc. |
| 5 | * |
| 6 | * This is part of HarfBuzz, a text shaping library. |
| 7 | * |
| 8 | * Permission is hereby granted, without written agreement and without |
| 9 | * license or royalty fees, to use, copy, modify, and distribute this |
| 10 | * software and its documentation for any purpose, provided that the |
| 11 | * above copyright notice and the following two paragraphs appear in |
| 12 | * all copies of this software. |
| 13 | * |
| 14 | * IN NO EVENT SHALL THE COPYRIGHT HOLDER BE LIABLE TO ANY PARTY FOR |
| 15 | * DIRECT, INDIRECT, SPECIAL, INCIDENTAL, OR CONSEQUENTIAL DAMAGES |
| 16 | * ARISING OUT OF THE USE OF THIS SOFTWARE AND ITS DOCUMENTATION, EVEN |
| 17 | * IF THE COPYRIGHT HOLDER HAS BEEN ADVISED OF THE POSSIBILITY OF SUCH |
| 18 | * DAMAGE. |
| 19 | * |
| 20 | * THE COPYRIGHT HOLDER SPECIFICALLY DISCLAIMS ANY WARRANTIES, INCLUDING, |
| 21 | * BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND |
| 22 | * FITNESS FOR A PARTICULAR PURPOSE. THE SOFTWARE PROVIDED HEREUNDER IS |
| 23 | * ON AN "AS IS" BASIS, AND THE COPYRIGHT HOLDER HAS NO OBLIGATION TO |
| 24 | * PROVIDE MAINTENANCE, SUPPORT, UPDATES, ENHANCEMENTS, OR MODIFICATIONS. |
| 25 | * |
| 26 | * Red Hat Author(s): Owen Taylor, Behdad Esfahbod |
| 27 | * Google Author(s): Behdad Esfahbod |
| 28 | */ |
| 29 | |
| 30 | #ifndef HB_BUFFER_HH |
| 31 | #define HB_BUFFER_HH |
| 32 | |
| 33 | #include "hb.hh" |
| 34 | #include "hb-unicode.hh" |
| 35 | |
| 36 | |
/*
 * Tunable buffer limits.  Each macro is only defined here when the build
 * has not already supplied its own value.
 */

/* Limits on buffer length. */
#if !defined (HB_BUFFER_MAX_LEN_FACTOR)
#  define HB_BUFFER_MAX_LEN_FACTOR 32
#endif
#if !defined (HB_BUFFER_MAX_LEN_MIN)
#  define HB_BUFFER_MAX_LEN_MIN 8192
#endif
#if !defined (HB_BUFFER_MAX_LEN_DEFAULT)
#  define HB_BUFFER_MAX_LEN_DEFAULT 0x3FFFFFFF /* Shaping more than a billion chars? Let us know! */
#endif

/* Limits on the number of operations. */
#if !defined (HB_BUFFER_MAX_OPS_FACTOR)
#  define HB_BUFFER_MAX_OPS_FACTOR 64
#endif
#if !defined (HB_BUFFER_MAX_OPS_MIN)
#  define HB_BUFFER_MAX_OPS_MIN 1024
#endif
#if !defined (HB_BUFFER_MAX_OPS_DEFAULT)
#  define HB_BUFFER_MAX_OPS_DEFAULT 0x1FFFFFFF /* Shaping more than half a billion operations? Let us know! */
#endif
| 56 | |
| 57 | static_assert ((sizeof (hb_glyph_info_t) == 20), "" ); |
| 58 | static_assert ((sizeof (hb_glyph_info_t) == sizeof (hb_glyph_position_t)), "" ); |
| 59 | |
| 60 | HB_MARK_AS_FLAG_T (hb_buffer_flags_t); |
| 61 | HB_MARK_AS_FLAG_T (hb_buffer_serialize_flags_t); |
| 62 | HB_MARK_AS_FLAG_T (hb_buffer_diff_flags_t); |
| 63 | |
/* Bit flags kept in hb_buffer_t::scratch_flags.  Each enumerator occupies
 * a single bit; the low bits are general flags and bits 24..27 are set
 * aside for shapers. */
enum hb_buffer_scratch_flags_t {
  HB_BUFFER_SCRATCH_FLAG_DEFAULT                = 0u,
  HB_BUFFER_SCRATCH_FLAG_HAS_NON_ASCII          = 1u << 0,
  HB_BUFFER_SCRATCH_FLAG_HAS_DEFAULT_IGNORABLES = 1u << 1,
  HB_BUFFER_SCRATCH_FLAG_HAS_SPACE_FALLBACK     = 1u << 2,
  HB_BUFFER_SCRATCH_FLAG_HAS_GPOS_ATTACHMENT    = 1u << 3,
  HB_BUFFER_SCRATCH_FLAG_HAS_UNSAFE_TO_BREAK    = 1u << 4,
  HB_BUFFER_SCRATCH_FLAG_HAS_CGJ                = 1u << 5,

  /* Reserved for complex shapers' internal use. */
  HB_BUFFER_SCRATCH_FLAG_COMPLEX0               = 1u << 24,
  HB_BUFFER_SCRATCH_FLAG_COMPLEX1               = 1u << 25,
  HB_BUFFER_SCRATCH_FLAG_COMPLEX2               = 1u << 26,
  HB_BUFFER_SCRATCH_FLAG_COMPLEX3               = 1u << 27,
};
/* Register the scratch-flag enum with HB_MARK_AS_FLAG_T (macro defined outside
 * this file; presumably what lets scratch_flags be combined with |= -- confirm). */
HB_MARK_AS_FLAG_T (hb_buffer_scratch_flags_t);
| 80 | |
| 81 | |
| 82 | /* |
| 83 | * hb_buffer_t |
| 84 | */ |
| 85 | |
| 86 | struct hb_buffer_t |
| 87 | { |
| 88 | hb_object_header_t ; |
| 89 | |
| 90 | /* Information about how the text in the buffer should be treated */ |
| 91 | hb_unicode_funcs_t *unicode; /* Unicode functions */ |
| 92 | hb_buffer_flags_t flags; /* BOT / EOT / etc. */ |
| 93 | hb_buffer_cluster_level_t cluster_level; |
| 94 | hb_codepoint_t replacement; /* U+FFFD or something else. */ |
| 95 | hb_codepoint_t invisible; /* 0 or something else. */ |
| 96 | hb_buffer_scratch_flags_t scratch_flags; /* Have space-fallback, etc. */ |
| 97 | unsigned int max_len; /* Maximum allowed len. */ |
| 98 | int max_ops; /* Maximum allowed operations. */ |
| 99 | |
| 100 | /* Buffer contents */ |
| 101 | hb_buffer_content_type_t content_type; |
| 102 | hb_segment_properties_t props; /* Script, language, direction */ |
| 103 | |
| 104 | bool successful; /* Allocations successful */ |
| 105 | bool have_output; /* Whether we have an output buffer going on */ |
| 106 | bool have_positions; /* Whether we have positions */ |
| 107 | |
| 108 | unsigned int idx; /* Cursor into ->info and ->pos arrays */ |
| 109 | unsigned int len; /* Length of ->info and ->pos arrays */ |
| 110 | unsigned int out_len; /* Length of ->out array if have_output */ |
| 111 | |
| 112 | unsigned int allocated; /* Length of allocated arrays */ |
| 113 | hb_glyph_info_t *info; |
| 114 | hb_glyph_info_t *out_info; |
| 115 | hb_glyph_position_t *pos; |
| 116 | |
| 117 | unsigned int serial; |
| 118 | |
| 119 | /* Text before / after the main buffer contents. |
| 120 | * Always in Unicode, and ordered outward. |
| 121 | * Index 0 is for "pre-context", 1 for "post-context". */ |
| 122 | static constexpr unsigned CONTEXT_LENGTH = 5u; |
| 123 | hb_codepoint_t context[2][CONTEXT_LENGTH]; |
| 124 | unsigned int context_len[2]; |
| 125 | |
| 126 | /* Debugging API */ |
| 127 | #ifndef HB_NO_BUFFER_MESSAGE |
| 128 | hb_buffer_message_func_t message_func; |
| 129 | void *message_data; |
| 130 | hb_destroy_func_t message_destroy; |
| 131 | #endif |
| 132 | |
| 133 | /* Internal debugging. */ |
| 134 | /* The bits here reflect current allocations of the bytes in glyph_info_t's var1 and var2. */ |
| 135 | #ifndef HB_NDEBUG |
| 136 | uint8_t allocated_var_bits; |
| 137 | #endif |
| 138 | |
| 139 | |
| 140 | /* Methods */ |
| 141 | |
| 142 | bool in_error () const { return !successful; } |
| 143 | |
| 144 | void allocate_var (unsigned int start, unsigned int count) |
| 145 | { |
| 146 | #ifndef HB_NDEBUG |
| 147 | unsigned int end = start + count; |
| 148 | assert (end <= 8); |
| 149 | unsigned int bits = (1u<<end) - (1u<<start); |
| 150 | assert (0 == (allocated_var_bits & bits)); |
| 151 | allocated_var_bits |= bits; |
| 152 | #endif |
| 153 | } |
| 154 | void deallocate_var (unsigned int start, unsigned int count) |
| 155 | { |
| 156 | #ifndef HB_NDEBUG |
| 157 | unsigned int end = start + count; |
| 158 | assert (end <= 8); |
| 159 | unsigned int bits = (1u<<end) - (1u<<start); |
| 160 | assert (bits == (allocated_var_bits & bits)); |
| 161 | allocated_var_bits &= ~bits; |
| 162 | #endif |
| 163 | } |
| 164 | void assert_var (unsigned int start, unsigned int count) |
| 165 | { |
| 166 | #ifndef HB_NDEBUG |
| 167 | unsigned int end = start + count; |
| 168 | assert (end <= 8); |
| 169 | unsigned int bits = (1u<<end) - (1u<<start); |
| 170 | assert (bits == (allocated_var_bits & bits)); |
| 171 | #endif |
| 172 | } |
| 173 | void deallocate_var_all () |
| 174 | { |
| 175 | #ifndef HB_NDEBUG |
| 176 | allocated_var_bits = 0; |
| 177 | #endif |
| 178 | } |
| 179 | |
| 180 | hb_glyph_info_t &cur (unsigned int i = 0) { return info[idx + i]; } |
| 181 | hb_glyph_info_t cur (unsigned int i = 0) const { return info[idx + i]; } |
| 182 | |
| 183 | hb_glyph_position_t &cur_pos (unsigned int i = 0) { return pos[idx + i]; } |
| 184 | hb_glyph_position_t cur_pos (unsigned int i = 0) const { return pos[idx + i]; } |
| 185 | |
| 186 | hb_glyph_info_t &prev () { return out_info[out_len ? out_len - 1 : 0]; } |
| 187 | hb_glyph_info_t prev () const { return out_info[out_len ? out_len - 1 : 0]; } |
| 188 | |
| 189 | bool has_separate_output () const { return info != out_info; } |
| 190 | |
| 191 | |
| 192 | HB_INTERNAL void reset (); |
| 193 | HB_INTERNAL void clear (); |
| 194 | |
| 195 | unsigned int backtrack_len () const { return have_output? out_len : idx; } |
| 196 | unsigned int lookahead_len () const { return len - idx; } |
| 197 | unsigned int next_serial () { return serial++; } |
| 198 | |
| 199 | HB_INTERNAL void add (hb_codepoint_t codepoint, |
| 200 | unsigned int cluster); |
| 201 | HB_INTERNAL void add_info (const hb_glyph_info_t &glyph_info); |
| 202 | |
| 203 | HB_INTERNAL void reverse_range (unsigned int start, unsigned int end); |
| 204 | HB_INTERNAL void reverse (); |
| 205 | HB_INTERNAL void reverse_clusters (); |
| 206 | HB_INTERNAL void guess_segment_properties (); |
| 207 | |
| 208 | HB_INTERNAL void swap_buffers (); |
| 209 | HB_INTERNAL void remove_output (); |
| 210 | HB_INTERNAL void clear_output (); |
| 211 | HB_INTERNAL void clear_positions (); |
| 212 | |
| 213 | HB_INTERNAL void replace_glyphs (unsigned int num_in, |
| 214 | unsigned int num_out, |
| 215 | const hb_codepoint_t *glyph_data); |
| 216 | |
| 217 | void replace_glyph (hb_codepoint_t glyph_index) |
| 218 | { |
| 219 | if (unlikely (out_info != info || out_len != idx)) { |
| 220 | if (unlikely (!make_room_for (1, 1))) return; |
| 221 | out_info[out_len] = info[idx]; |
| 222 | } |
| 223 | out_info[out_len].codepoint = glyph_index; |
| 224 | |
| 225 | idx++; |
| 226 | out_len++; |
| 227 | } |
| 228 | /* Makes a copy of the glyph at idx to output and replace glyph_index */ |
| 229 | hb_glyph_info_t & output_glyph (hb_codepoint_t glyph_index) |
| 230 | { |
| 231 | if (unlikely (!make_room_for (0, 1))) return Crap(hb_glyph_info_t); |
| 232 | |
| 233 | if (unlikely (idx == len && !out_len)) |
| 234 | return Crap(hb_glyph_info_t); |
| 235 | |
| 236 | out_info[out_len] = idx < len ? info[idx] : out_info[out_len - 1]; |
| 237 | out_info[out_len].codepoint = glyph_index; |
| 238 | |
| 239 | out_len++; |
| 240 | |
| 241 | return out_info[out_len - 1]; |
| 242 | } |
| 243 | void output_info (const hb_glyph_info_t &glyph_info) |
| 244 | { |
| 245 | if (unlikely (!make_room_for (0, 1))) return; |
| 246 | |
| 247 | out_info[out_len] = glyph_info; |
| 248 | |
| 249 | out_len++; |
| 250 | } |
| 251 | /* Copies glyph at idx to output but doesn't advance idx */ |
| 252 | void copy_glyph () |
| 253 | { |
| 254 | if (unlikely (!make_room_for (0, 1))) return; |
| 255 | |
| 256 | out_info[out_len] = info[idx]; |
| 257 | |
| 258 | out_len++; |
| 259 | } |
| 260 | /* Copies glyph at idx to output and advance idx. |
| 261 | * If there's no output, just advance idx. */ |
| 262 | void |
| 263 | next_glyph () |
| 264 | { |
| 265 | if (have_output) |
| 266 | { |
| 267 | if (out_info != info || out_len != idx) |
| 268 | { |
| 269 | if (unlikely (!make_room_for (1, 1))) return; |
| 270 | out_info[out_len] = info[idx]; |
| 271 | } |
| 272 | out_len++; |
| 273 | } |
| 274 | |
| 275 | idx++; |
| 276 | } |
| 277 | /* Copies n glyphs at idx to output and advance idx. |
| 278 | * If there's no output, just advance idx. */ |
| 279 | void |
| 280 | next_glyphs (unsigned int n) |
| 281 | { |
| 282 | if (have_output) |
| 283 | { |
| 284 | if (out_info != info || out_len != idx) |
| 285 | { |
| 286 | if (unlikely (!make_room_for (n, n))) return; |
| 287 | memmove (out_info + out_len, info + idx, n * sizeof (out_info[0])); |
| 288 | } |
| 289 | out_len += n; |
| 290 | } |
| 291 | |
| 292 | idx += n; |
| 293 | } |
| 294 | /* Advance idx without copying to output. */ |
| 295 | void skip_glyph () { idx++; } |
| 296 | void reset_masks (hb_mask_t mask) |
| 297 | { |
| 298 | for (unsigned int j = 0; j < len; j++) |
| 299 | info[j].mask = mask; |
| 300 | } |
| 301 | void add_masks (hb_mask_t mask) |
| 302 | { |
| 303 | for (unsigned int j = 0; j < len; j++) |
| 304 | info[j].mask |= mask; |
| 305 | } |
| 306 | HB_INTERNAL void set_masks (hb_mask_t value, hb_mask_t mask, |
| 307 | unsigned int cluster_start, unsigned int cluster_end); |
| 308 | |
| 309 | void merge_clusters (unsigned int start, unsigned int end) |
| 310 | { |
| 311 | if (end - start < 2) |
| 312 | return; |
| 313 | merge_clusters_impl (start, end); |
| 314 | } |
| 315 | HB_INTERNAL void merge_clusters_impl (unsigned int start, unsigned int end); |
| 316 | HB_INTERNAL void merge_out_clusters (unsigned int start, unsigned int end); |
| 317 | /* Merge clusters for deleting current glyph, and skip it. */ |
| 318 | HB_INTERNAL void delete_glyph (); |
| 319 | |
| 320 | void unsafe_to_break (unsigned int start, |
| 321 | unsigned int end) |
| 322 | { |
| 323 | if (end - start < 2) |
| 324 | return; |
| 325 | unsafe_to_break_impl (start, end); |
| 326 | } |
| 327 | HB_INTERNAL void unsafe_to_break_impl (unsigned int start, unsigned int end); |
| 328 | HB_INTERNAL void unsafe_to_break_from_outbuffer (unsigned int start, unsigned int end); |
| 329 | |
| 330 | |
| 331 | /* Internal methods */ |
| 332 | HB_INTERNAL bool move_to (unsigned int i); /* i is output-buffer index. */ |
| 333 | |
| 334 | HB_INTERNAL bool enlarge (unsigned int size); |
| 335 | |
| 336 | bool ensure (unsigned int size) |
| 337 | { return likely (!size || size < allocated) ? true : enlarge (size); } |
| 338 | |
| 339 | bool ensure_inplace (unsigned int size) |
| 340 | { return likely (!size || size < allocated); } |
| 341 | |
| 342 | HB_INTERNAL bool make_room_for (unsigned int num_in, unsigned int num_out); |
| 343 | HB_INTERNAL bool shift_forward (unsigned int count); |
| 344 | |
| 345 | typedef long scratch_buffer_t; |
| 346 | HB_INTERNAL scratch_buffer_t *get_scratch_buffer (unsigned int *size); |
| 347 | |
| 348 | void clear_context (unsigned int side) { context_len[side] = 0; } |
| 349 | |
| 350 | HB_INTERNAL void sort (unsigned int start, unsigned int end, int(*compar)(const hb_glyph_info_t *, const hb_glyph_info_t *)); |
| 351 | |
| 352 | bool messaging () |
| 353 | { |
| 354 | #ifdef HB_NO_BUFFER_MESSAGE |
| 355 | return false; |
| 356 | #else |
| 357 | return unlikely (message_func); |
| 358 | #endif |
| 359 | } |
| 360 | bool message (hb_font_t *font, const char *fmt, ...) HB_PRINTF_FUNC(3, 4) |
| 361 | { |
| 362 | #ifdef HB_NO_BUFFER_MESSAGE |
| 363 | return true; |
| 364 | #else |
| 365 | if (!messaging ()) |
| 366 | return true; |
| 367 | va_list ap; |
| 368 | va_start (ap, fmt); |
| 369 | bool ret = message_impl (font, fmt, ap); |
| 370 | va_end (ap); |
| 371 | return ret; |
| 372 | #endif |
| 373 | } |
| 374 | HB_INTERNAL bool message_impl (hb_font_t *font, const char *fmt, va_list ap) HB_PRINTF_FUNC(3, 0); |
| 375 | |
| 376 | static void |
| 377 | set_cluster (hb_glyph_info_t &inf, unsigned int cluster, unsigned int mask = 0) |
| 378 | { |
| 379 | if (inf.cluster != cluster) |
| 380 | { |
| 381 | if (mask & HB_GLYPH_FLAG_UNSAFE_TO_BREAK) |
| 382 | inf.mask |= HB_GLYPH_FLAG_UNSAFE_TO_BREAK; |
| 383 | else |
| 384 | inf.mask &= ~HB_GLYPH_FLAG_UNSAFE_TO_BREAK; |
| 385 | } |
| 386 | inf.cluster = cluster; |
| 387 | } |
| 388 | |
| 389 | int |
| 390 | _unsafe_to_break_find_min_cluster (const hb_glyph_info_t *infos, |
| 391 | unsigned int start, unsigned int end, |
| 392 | unsigned int cluster) const |
| 393 | { |
| 394 | for (unsigned int i = start; i < end; i++) |
| 395 | cluster = hb_min (cluster, infos[i].cluster); |
| 396 | return cluster; |
| 397 | } |
| 398 | void |
| 399 | _unsafe_to_break_set_mask (hb_glyph_info_t *infos, |
| 400 | unsigned int start, unsigned int end, |
| 401 | unsigned int cluster) |
| 402 | { |
| 403 | for (unsigned int i = start; i < end; i++) |
| 404 | if (cluster != infos[i].cluster) |
| 405 | { |
| 406 | scratch_flags |= HB_BUFFER_SCRATCH_FLAG_HAS_UNSAFE_TO_BREAK; |
| 407 | infos[i].mask |= HB_GLYPH_FLAG_UNSAFE_TO_BREAK; |
| 408 | } |
| 409 | } |
| 410 | |
| 411 | void unsafe_to_break_all () { unsafe_to_break_impl (0, len); } |
| 412 | void safe_to_break_all () |
| 413 | { |
| 414 | for (unsigned int i = 0; i < len; i++) |
| 415 | info[i].mask &= ~HB_GLYPH_FLAG_UNSAFE_TO_BREAK; |
| 416 | } |
| 417 | }; |
| 418 | DECLARE_NULL_INSTANCE (hb_buffer_t); |
| 419 | |
| 420 | |
/* Loop over clusters. Duplicated in foreach_syllable().
 *
 * Expands to a for-statement header that declares `start` and `end` as
 * unsigned loop variables; each iteration covers the cluster occupying
 * [start, end) in buffer->info.  `buffer` is parenthesized so that any
 * pointer-valued expression may be passed; it is evaluated more than once.
 *
 * NOTE(review): the increment step calls _next_cluster() even when start
 * has reached _count, which reads info[_count].cluster before the loop
 * condition ends the iteration. */
#define foreach_cluster(buffer, start, end) \
  for (unsigned int \
       _count = (buffer)->len, \
       start = 0, end = _count ? _next_cluster ((buffer), 0) : 0; \
       start < _count; \
       start = end, end = _next_cluster ((buffer), start))
| 428 | |
| 429 | static inline unsigned int |
| 430 | _next_cluster (hb_buffer_t *buffer, unsigned int start) |
| 431 | { |
| 432 | hb_glyph_info_t *info = buffer->info; |
| 433 | unsigned int count = buffer->len; |
| 434 | |
| 435 | unsigned int cluster = info[start].cluster; |
| 436 | while (++start < count && cluster == info[start].cluster) |
| 437 | ; |
| 438 | |
| 439 | return start; |
| 440 | } |
| 441 | |
| 442 | |
/* Calls b->func (offset, size) for one glyph-info variable, where offset
 * is the variable's byte offset relative to hb_glyph_info_t::var1 and
 * size is its size in bytes.  `b` is parenthesized so that any
 * pointer-valued expression may be passed; it is evaluated twice. */
#define HB_BUFFER_XALLOCATE_VAR(b, func, var) \
  (b)->func (offsetof (hb_glyph_info_t, var) - offsetof (hb_glyph_info_t, var1), \
             sizeof ((b)->info[0].var))
/* Convenience wrappers: `var` names a function-like accessor macro that is
 * invoked here as var () to obtain the member designator. */
#define HB_BUFFER_ALLOCATE_VAR(b, var) HB_BUFFER_XALLOCATE_VAR (b, allocate_var, var ())
#define HB_BUFFER_DEALLOCATE_VAR(b, var) HB_BUFFER_XALLOCATE_VAR (b, deallocate_var, var ())
#define HB_BUFFER_ASSERT_VAR(b, var) HB_BUFFER_XALLOCATE_VAR (b, assert_var, var ())
| 449 | |
| 450 | |
| 451 | #endif /* HB_BUFFER_HH */ |
| 452 | |