hb-buffer.hh 13.5 KB
Newer Older
1
/*
B
Behdad Esfahbod 已提交
2 3
 * Copyright © 1998-2004  David Turner and Werner Lemberg
 * Copyright © 2004,2007,2009,2010  Red Hat, Inc.
4
 * Copyright © 2011,2012  Google, Inc.
5
 *
6
 *  This is part of HarfBuzz, a text shaping library.
7
 *
8 9 10 11 12
 * Permission is hereby granted, without written agreement and without
 * license or royalty fees, to use, copy, modify, and distribute this
 * software and its documentation for any purpose, provided that the
 * above copyright notice and the following two paragraphs appear in
 * all copies of this software.
13
 *
14 15 16 17 18 19 20 21 22 23 24 25 26
 * IN NO EVENT SHALL THE COPYRIGHT HOLDER BE LIABLE TO ANY PARTY FOR
 * DIRECT, INDIRECT, SPECIAL, INCIDENTAL, OR CONSEQUENTIAL DAMAGES
 * ARISING OUT OF THE USE OF THIS SOFTWARE AND ITS DOCUMENTATION, EVEN
 * IF THE COPYRIGHT HOLDER HAS BEEN ADVISED OF THE POSSIBILITY OF SUCH
 * DAMAGE.
 *
 * THE COPYRIGHT HOLDER SPECIFICALLY DISCLAIMS ANY WARRANTIES, INCLUDING,
 * BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND
 * FITNESS FOR A PARTICULAR PURPOSE.  THE SOFTWARE PROVIDED HEREUNDER IS
 * ON AN "AS IS" BASIS, AND THE COPYRIGHT HOLDER HAS NO OBLIGATION TO
 * PROVIDE MAINTENANCE, SUPPORT, UPDATES, ENHANCEMENTS, OR MODIFICATIONS.
 *
 * Red Hat Author(s): Owen Taylor, Behdad Esfahbod
27
 * Google Author(s): Behdad Esfahbod
28
 */
29

30 31
#ifndef HB_BUFFER_HH
#define HB_BUFFER_HH
32

33 34
#include "hb.hh"
#include "hb-unicode.hh"
35 36


37 38
/* Buffer-length limits.  Each value is only a default: defining the macro
 * before this header is included overrides it.
 * NOTE(review): how FACTOR and MIN are combined into hb_buffer_t::max_len
 * is not visible in this header -- confirm against the callers. */
#ifndef HB_BUFFER_MAX_LEN_FACTOR
#define HB_BUFFER_MAX_LEN_FACTOR 32
#endif
#ifndef HB_BUFFER_MAX_LEN_MIN
#define HB_BUFFER_MAX_LEN_MIN 8192
#endif
#ifndef HB_BUFFER_MAX_LEN_DEFAULT
#define HB_BUFFER_MAX_LEN_DEFAULT 0x3FFFFFFF /* Shaping more than a billion chars? Let us know! */
#endif

47 48 49 50 51 52 53 54 55 56
/* Operation-count limits.  Each value is only a default: defining the macro
 * before this header is included overrides it. */
#ifndef HB_BUFFER_MAX_OPS_FACTOR
#define HB_BUFFER_MAX_OPS_FACTOR 64
#endif
#ifndef HB_BUFFER_MAX_OPS_MIN
#define HB_BUFFER_MAX_OPS_MIN 1024
#endif
#ifndef HB_BUFFER_MAX_OPS_DEFAULT
#define HB_BUFFER_MAX_OPS_DEFAULT 0x1FFFFFFF /* Shaping more than half a billion operations? Let us know! */
#endif

57 58
/* Compile-time layout checks: hb_glyph_info_t must be exactly 20 bytes, and
 * hb_glyph_position_t must have the same size as hb_glyph_info_t. */
static_assert ((sizeof (hb_glyph_info_t) == 20), "");
static_assert ((sizeof (hb_glyph_info_t) == sizeof (hb_glyph_position_t)), "");
59

C
Chun-wei Fan 已提交
60 61
/* Mark the buffer flag enums as flag types.
 * NOTE(review): HB_MARK_AS_FLAG_T is defined outside this header; presumably
 * it supplies the bitwise operators for the enum -- confirm. */
HB_MARK_AS_FLAG_T (hb_buffer_flags_t);
HB_MARK_AS_FLAG_T (hb_buffer_serialize_flags_t);
HB_MARK_AS_FLAG_T (hb_buffer_diff_flags_t);
B
Behdad Esfahbod 已提交
63

64 65
/* Bit flags kept in hb_buffer_t::scratch_flags.  The low bits record
 * properties noticed about the buffer contents; the 0x0F000000 range is set
 * aside for the complex shapers. */
enum hb_buffer_scratch_flags_t {
  HB_BUFFER_SCRATCH_FLAG_DEFAULT			= 0x00000000u,
  HB_BUFFER_SCRATCH_FLAG_HAS_NON_ASCII			= 0x00000001u,
  HB_BUFFER_SCRATCH_FLAG_HAS_DEFAULT_IGNORABLES		= 0x00000002u,
  HB_BUFFER_SCRATCH_FLAG_HAS_SPACE_FALLBACK		= 0x00000004u,
  HB_BUFFER_SCRATCH_FLAG_HAS_GPOS_ATTACHMENT		= 0x00000008u,
  HB_BUFFER_SCRATCH_FLAG_HAS_UNSAFE_TO_BREAK		= 0x00000010u,
  HB_BUFFER_SCRATCH_FLAG_HAS_CGJ			= 0x00000020u,

  /* Reserved for complex shapers' internal use. */
  HB_BUFFER_SCRATCH_FLAG_COMPLEX0			= 0x01000000u,
  HB_BUFFER_SCRATCH_FLAG_COMPLEX1			= 0x02000000u,
  HB_BUFFER_SCRATCH_FLAG_COMPLEX2			= 0x04000000u,
  HB_BUFFER_SCRATCH_FLAG_COMPLEX3			= 0x08000000u,
};
C
Chun-wei Fan 已提交
79
/* NOTE(review): HB_MARK_AS_FLAG_T is defined elsewhere; presumably it provides
 * the bitwise operators that `scratch_flags |= ...` in hb_buffer_t relies
 * on -- confirm. */
HB_MARK_AS_FLAG_T (hb_buffer_scratch_flags_t);
80

B
Behdad Esfahbod 已提交
81 82 83 84

/*
 * hb_buffer_t
 */
85

86 87
struct hb_buffer_t
{
88
  hb_object_header_t header;
89
  ASSERT_POD ();
B
Behdad Esfahbod 已提交
90 91

  /* Information about how the text in the buffer should be treated */
92
  hb_unicode_funcs_t *unicode; /* Unicode functions */
B
Behdad Esfahbod 已提交
93
  hb_buffer_flags_t flags; /* BOT / EOT / etc. */
94
  hb_buffer_cluster_level_t cluster_level;
95
  hb_codepoint_t replacement; /* U+FFFD or something else. */
96
  hb_codepoint_t invisible; /* 0 or something else. */
B
Bruce Mitchener 已提交
97
  hb_buffer_scratch_flags_t scratch_flags; /* Have space-fallback, etc. */
B
Behdad Esfahbod 已提交
98
  unsigned int max_len; /* Maximum allowed len. */
99
  int max_ops; /* Maximum allowed operations. */
B
Behdad Esfahbod 已提交
100 101

  /* Buffer contents */
102
  hb_buffer_content_type_t content_type;
103
  hb_segment_properties_t props; /* Script, language, direction */
104

B
Behdad Esfahbod 已提交
105
  bool successful; /* Allocations successful */
106 107
  bool have_output; /* Whether we have an output buffer going on */
  bool have_positions; /* Whether we have positions */
B
Behdad Esfahbod 已提交
108

109
  unsigned int idx; /* Cursor into ->info and ->pos arrays */
B
Behdad Esfahbod 已提交
110
  unsigned int len; /* Length of ->info and ->pos arrays */
111
  unsigned int out_len; /* Length of ->out array if have_output */
B
Behdad Esfahbod 已提交
112

113
  unsigned int allocated; /* Length of allocated arrays */
114 115 116
  hb_glyph_info_t     *info;
  hb_glyph_info_t     *out_info;
  hb_glyph_position_t *pos;
B
Behdad Esfahbod 已提交
117

118
  unsigned int serial;
119 120 121 122

  /* Text before / after the main buffer contents.
   * Always in Unicode, and ordered outward.
   * Index 0 is for "pre-context", 1 for "post-context". */
123
  enum { CONTEXT_LENGTH = 5 };
124 125 126
  hb_codepoint_t context[2][CONTEXT_LENGTH];
  unsigned int context_len[2];

127
  /* Debugging API */
128 129 130 131
  hb_buffer_message_func_t message_func;
  void *message_data;
  hb_destroy_func_t message_destroy;

132
  /* Internal debugging. */
133 134 135 136
  /* The bits here reflect current allocations of the bytes in glyph_info_t's var1 and var2. */
#ifndef HB_NDEBUG
  uint8_t allocated_var_bits;
#endif
B
Behdad Esfahbod 已提交
137 138 139 140


  /* Methods */

141 142 143 144 145
  inline void allocate_var (unsigned int start, unsigned int count)
  {
#ifndef HB_NDEBUG
    unsigned int end = start + count;
    assert (end <= 8);
B
Behdad Esfahbod 已提交
146
    unsigned int bits = (1u<<end) - (1u<<start);
147 148 149 150 151 152 153 154 155
    assert (0 == (allocated_var_bits & bits));
    allocated_var_bits |= bits;
#endif
  }
  inline void deallocate_var (unsigned int start, unsigned int count)
  {
#ifndef HB_NDEBUG
    unsigned int end = start + count;
    assert (end <= 8);
B
Behdad Esfahbod 已提交
156
    unsigned int bits = (1u<<end) - (1u<<start);
157 158 159 160 161 162 163 164 165
    assert (bits == (allocated_var_bits & bits));
    allocated_var_bits &= ~bits;
#endif
  }
  inline void assert_var (unsigned int start, unsigned int count)
  {
#ifndef HB_NDEBUG
    unsigned int end = start + count;
    assert (end <= 8);
B
Behdad Esfahbod 已提交
166
    unsigned int bits = (1u<<end) - (1u<<start);
167 168 169 170 171 172 173
    assert (bits == (allocated_var_bits & bits));
#endif
  }
  inline void deallocate_var_all (void)
  {
#ifndef HB_NDEBUG
    allocated_var_bits = 0;
174
#endif
175
  }
176

B
Behdad Esfahbod 已提交
177 178 179 180 181 182 183 184 185 186
  inline hb_glyph_info_t &cur (unsigned int i = 0) { return info[idx + i]; }
  inline hb_glyph_info_t cur (unsigned int i = 0) const { return info[idx + i]; }

  inline hb_glyph_position_t &cur_pos (unsigned int i = 0) { return pos[idx + i]; }
  inline hb_glyph_position_t cur_pos (unsigned int i = 0) const { return pos[idx + i]; }

  inline hb_glyph_info_t &prev (void) { return out_info[out_len ? out_len - 1 : 0]; }
  inline hb_glyph_info_t prev (void) const { return out_info[out_len ? out_len - 1 : 0]; }

  inline bool has_separate_output (void) const { return info != out_info; }
B
Behdad Esfahbod 已提交
187

188 189

  HB_INTERNAL void reset (void);
B
Behdad Esfahbod 已提交
190
  HB_INTERNAL void clear (void);
191

192
  inline unsigned int backtrack_len (void) const
193
  { return have_output? out_len : idx; }
194 195
  inline unsigned int lookahead_len (void) const
  { return len - idx; }
B
Behdad Esfahbod 已提交
196
  inline unsigned int next_serial (void) { return serial++; }
197 198 199

  HB_INTERNAL void add (hb_codepoint_t  codepoint,
			unsigned int    cluster);
200
  HB_INTERNAL void add_info (const hb_glyph_info_t &glyph_info);
201 202 203 204

  HB_INTERNAL void reverse_range (unsigned int start, unsigned int end);
  HB_INTERNAL void reverse (void);
  HB_INTERNAL void reverse_clusters (void);
205
  HB_INTERNAL void guess_segment_properties (void);
206 207

  HB_INTERNAL void swap_buffers (void);
B
Behdad Esfahbod 已提交
208
  HB_INTERNAL void remove_output (void);
209 210
  HB_INTERNAL void clear_output (void);
  HB_INTERNAL void clear_positions (void);
B
Behdad Esfahbod 已提交
211

B
Behdad Esfahbod 已提交
212 213
  HB_INTERNAL void replace_glyphs (unsigned int num_in,
				   unsigned int num_out,
B
Minor  
Behdad Esfahbod 已提交
214
				   const hb_codepoint_t *glyph_data);
B
Behdad Esfahbod 已提交
215

B
Behdad Esfahbod 已提交
216 217 218 219 220 221 222 223 224 225 226
  inline void replace_glyph (hb_codepoint_t glyph_index)
  {
    if (unlikely (out_info != info || out_len != idx)) {
      if (unlikely (!make_room_for (1, 1))) return;
      out_info[out_len] = info[idx];
    }
    out_info[out_len].codepoint = glyph_index;

    idx++;
    out_len++;
  }
227
  /* Makes a copy of the glyph at idx to output and replace glyph_index */
B
Behdad Esfahbod 已提交
228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246
  inline hb_glyph_info_t & output_glyph (hb_codepoint_t glyph_index)
  {
    if (unlikely (!make_room_for (0, 1))) return Crap(hb_glyph_info_t);

    out_info[out_len] = info[idx];
    out_info[out_len].codepoint = glyph_index;

    out_len++;

    return out_info[out_len - 1];
  }
  inline void output_info (const hb_glyph_info_t &glyph_info)
  {
    if (unlikely (!make_room_for (0, 1))) return;

    out_info[out_len] = glyph_info;

    out_len++;
  }
247
  /* Copies glyph at idx to output but doesn't advance idx */
B
Behdad Esfahbod 已提交
248 249 250 251 252 253 254 255
  inline void copy_glyph (void)
  {
    if (unlikely (!make_room_for (0, 1))) return;

    out_info[out_len] = info[idx];

    out_len++;
  }
256 257
  /* Copies glyph at idx to output and advance idx.
   * If there's no output, just advance idx. */
B
Minor  
Behdad Esfahbod 已提交
258 259 260 261 262
  inline void
  next_glyph (void)
  {
    if (have_output)
    {
263 264
      if (out_info != info || out_len != idx)
      {
265
	if (unlikely (!make_room_for (1, 1))) return;
B
Minor  
Behdad Esfahbod 已提交
266 267 268 269
	out_info[out_len] = info[idx];
      }
      out_len++;
    }
270

B
Minor  
Behdad Esfahbod 已提交
271 272
    idx++;
  }
273 274 275 276 277 278 279 280 281 282 283 284 285 286 287 288 289
  /* Copies n glyphs at idx to output and advance idx.
   * If there's no output, just advance idx. */
  inline void
  next_glyphs (unsigned int n)
  {
    if (have_output)
    {
      if (out_info != info || out_len != idx)
      {
	if (unlikely (!make_room_for (n, n))) return;
	memmove (out_info + out_len, info + idx, n * sizeof (out_info[0]));
      }
      out_len += n;
    }

    idx += n;
  }
290
  /* Advance idx without copying to output. */
B
Behdad Esfahbod 已提交
291 292 293 294
  inline void skip_glyph (void)
  {
    idx++;
  }
B
Behdad Esfahbod 已提交
295 296
  inline void reset_masks (hb_mask_t mask)
  {
B
Behdad Esfahbod 已提交
297 298
    for (unsigned int j = 0; j < len; j++)
      info[j].mask = mask;
B
Behdad Esfahbod 已提交
299 300 301
  }
  inline void add_masks (hb_mask_t mask)
  {
B
Behdad Esfahbod 已提交
302 303
    for (unsigned int j = 0; j < len; j++)
      info[j].mask |= mask;
B
Behdad Esfahbod 已提交
304
  }
305 306
  HB_INTERNAL void set_masks (hb_mask_t value, hb_mask_t mask,
			      unsigned int cluster_start, unsigned int cluster_end);
307

308
  inline void merge_clusters (unsigned int start, unsigned int end)
B
Behdad Esfahbod 已提交
309 310 311 312 313
  {
    if (end - start < 2)
      return;
    merge_clusters_impl (start, end);
  }
314 315
  HB_INTERNAL void merge_clusters_impl (unsigned int start, unsigned int end);
  HB_INTERNAL void merge_out_clusters (unsigned int start, unsigned int end);
316 317
  /* Merge clusters for deleting current glyph, and skip it. */
  HB_INTERNAL void delete_glyph (void);
318

319 320 321 322 323 324 325 326 327 328 329
  inline void unsafe_to_break (unsigned int start,
			       unsigned int end)
  {
    if (end - start < 2)
      return;
    unsafe_to_break_impl (start, end);
  }
  HB_INTERNAL void unsafe_to_break_impl (unsigned int start, unsigned int end);
  HB_INTERNAL void unsafe_to_break_from_outbuffer (unsigned int start, unsigned int end);


330
  /* Internal methods */
B
Behdad Esfahbod 已提交
331 332
  HB_INTERNAL bool move_to (unsigned int i); /* i is output-buffer index. */

333 334 335
  HB_INTERNAL bool enlarge (unsigned int size);

  inline bool ensure (unsigned int size)
336
  { return likely (!size || size < allocated) ? true : enlarge (size); }
337

338 339 340
  inline bool ensure_inplace (unsigned int size)
  { return likely (!size || size < allocated); }

341
  HB_INTERNAL bool make_room_for (unsigned int num_in, unsigned int num_out);
342
  HB_INTERNAL bool shift_forward (unsigned int count);
343

344
  typedef long scratch_buffer_t;
B
Behdad Esfahbod 已提交
345
  HB_INTERNAL scratch_buffer_t *get_scratch_buffer (unsigned int *size);
346 347

  inline void clear_context (unsigned int side) { context_len[side] = 0; }
348 349

  HB_INTERNAL void sort (unsigned int start, unsigned int end, int(*compar)(const hb_glyph_info_t *, const hb_glyph_info_t *));
350 351 352 353 354 355 356 357 358 359 360 361 362

  inline bool messaging (void) { return unlikely (message_func); }
  inline bool message (hb_font_t *font, const char *fmt, ...) HB_PRINTF_FUNC(3, 4)
  {
    if (!messaging ())
      return true;
    va_list ap;
    va_start (ap, fmt);
    bool ret = message_impl (font, fmt, ap);
    va_end (ap);
    return ret;
  }
  HB_INTERNAL bool message_impl (hb_font_t *font, const char *fmt, va_list ap) HB_PRINTF_FUNC(3, 0);
363 364

  static inline void
B
Behdad Esfahbod 已提交
365
  set_cluster (hb_glyph_info_t &inf, unsigned int cluster, unsigned int mask = 0)
366
  {
B
Behdad Esfahbod 已提交
367
    if (inf.cluster != cluster)
368 369
    {
      if (mask & HB_GLYPH_FLAG_UNSAFE_TO_BREAK)
B
Behdad Esfahbod 已提交
370
	inf.mask |= HB_GLYPH_FLAG_UNSAFE_TO_BREAK;
371
      else
B
Behdad Esfahbod 已提交
372
	inf.mask &= ~HB_GLYPH_FLAG_UNSAFE_TO_BREAK;
373
    }
B
Behdad Esfahbod 已提交
374
    inf.cluster = cluster;
375
  }
376

377
  inline int
B
Behdad Esfahbod 已提交
378
  _unsafe_to_break_find_min_cluster (const hb_glyph_info_t *infos,
379 380 381 382
				     unsigned int start, unsigned int end,
				     unsigned int cluster) const
  {
    for (unsigned int i = start; i < end; i++)
B
Behdad Esfahbod 已提交
383
      cluster = MIN<unsigned int> (cluster, infos[i].cluster);
384 385
    return cluster;
  }
386
  inline void
B
Behdad Esfahbod 已提交
387
  _unsafe_to_break_set_mask (hb_glyph_info_t *infos,
388 389 390 391
			     unsigned int start, unsigned int end,
			     unsigned int cluster)
  {
    for (unsigned int i = start; i < end; i++)
B
Behdad Esfahbod 已提交
392
      if (cluster != infos[i].cluster)
393 394
      {
	scratch_flags |= HB_BUFFER_SCRATCH_FLAG_HAS_UNSAFE_TO_BREAK;
B
Behdad Esfahbod 已提交
395
	infos[i].mask |= HB_GLYPH_FLAG_UNSAFE_TO_BREAK;
396 397
      }
  }
398 399 400 401

  inline void
  unsafe_to_break_all (void)
  {
402
    unsafe_to_break_impl (0, len);
403 404 405 406 407 408 409
  }
  inline void
  safe_to_break_all (void)
  {
    for (unsigned int i = 0; i < len; i++)
      info[i].mask &= ~HB_GLYPH_FLAG_UNSAFE_TO_BREAK;
  }
B
Behdad Esfahbod 已提交
410
};
411
/* NOTE(review): DECLARE_NULL_INSTANCE is defined elsewhere; presumably it
 * declares the shared "null" hb_buffer_t object -- confirm. */
DECLARE_NULL_INSTANCE (hb_buffer_t);
B
Behdad Esfahbod 已提交
412 413


414 415 416 417 418 419 420 421 422 423 424 425 426 427 428 429 430 431 432 433 434 435
/* Loop over clusters. Duplicated in foreach_syllable().
 *
 * Expands to a `for` header that declares `start` and `end` as loop-scoped
 * unsigned ints; on each iteration they delimit the current cluster as
 * [start, end).  The buffer length is sampled once, on entry.  `buffer` is
 * expanded more than once, so it must be free of side effects; it is
 * parenthesized so that any pointer-valued expression may be passed. */
#define foreach_cluster(buffer, start, end) \
  for (unsigned int \
       _count = (buffer)->len, \
       start = 0, end = _count ? _next_cluster ((buffer), 0) : 0; \
       start < _count; \
       start = end, end = _next_cluster ((buffer), start))

/* Returns the index one past the last glyph of the cluster that begins at
 * `start`: the first index after `start` whose cluster value differs from
 * info[start].cluster, or buffer->len if the run reaches the end.
 *
 * When `start` is already at or past buffer->len there is no glyph to
 * inspect, so `start` is returned unchanged (an empty range) without
 * reading info[].  foreach_cluster makes exactly such a call in its final
 * increment step. */
static inline unsigned int
_next_cluster (hb_buffer_t *buffer, unsigned int start)
{
  hb_glyph_info_t *info = buffer->info;
  unsigned int count = buffer->len;

  if (start >= count)
    return start;

  unsigned int cluster = info[start].cluster;
  while (++start < count && cluster == info[start].cluster)
    ;

  return start;
}


436
/* Debug bookkeeping for the scratch variables of hb_glyph_info_t.
 * HB_BUFFER_XALLOCATE_VAR calls the hb_buffer_t method `func` on `b` with
 * the byte offset of `var` relative to var1 and the size of `var`.  The three
 * wrappers select allocate_var / deallocate_var / assert_var and append `()`
 * to the variable name before passing it on. */
#define HB_BUFFER_XALLOCATE_VAR(b, func, var) \
  (b)->func (offsetof (hb_glyph_info_t, var) - offsetof(hb_glyph_info_t, var1), \
	     sizeof ((b)->info[0].var))
#define HB_BUFFER_ALLOCATE_VAR(b, var)		HB_BUFFER_XALLOCATE_VAR (b, allocate_var,   var ())
#define HB_BUFFER_DEALLOCATE_VAR(b, var)	HB_BUFFER_XALLOCATE_VAR (b, deallocate_var, var ())
#define HB_BUFFER_ASSERT_VAR(b, var)		HB_BUFFER_XALLOCATE_VAR (b, assert_var,     var ())
442 443


444
#endif /* HB_BUFFER_HH */