hb-buffer.cc 42.3 KB
Newer Older
1
/*
B
Behdad Esfahbod 已提交
2 3
 * Copyright © 1998-2004  David Turner and Werner Lemberg
 * Copyright © 2004,2007,2009,2010  Red Hat, Inc.
4
 * Copyright © 2011,2012  Google, Inc.
5
 *
6
 *  This is part of HarfBuzz, a text shaping library.
7
 *
8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26
 * Permission is hereby granted, without written agreement and without
 * license or royalty fees, to use, copy, modify, and distribute this
 * software and its documentation for any purpose, provided that the
 * above copyright notice and the following two paragraphs appear in
 * all copies of this software.
 *
 * IN NO EVENT SHALL THE COPYRIGHT HOLDER BE LIABLE TO ANY PARTY FOR
 * DIRECT, INDIRECT, SPECIAL, INCIDENTAL, OR CONSEQUENTIAL DAMAGES
 * ARISING OUT OF THE USE OF THIS SOFTWARE AND ITS DOCUMENTATION, EVEN
 * IF THE COPYRIGHT HOLDER HAS BEEN ADVISED OF THE POSSIBILITY OF SUCH
 * DAMAGE.
 *
 * THE COPYRIGHT HOLDER SPECIFICALLY DISCLAIMS ANY WARRANTIES, INCLUDING,
 * BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND
 * FITNESS FOR A PARTICULAR PURPOSE.  THE SOFTWARE PROVIDED HEREUNDER IS
 * ON AN "AS IS" BASIS, AND THE COPYRIGHT HOLDER HAS NO OBLIGATION TO
 * PROVIDE MAINTENANCE, SUPPORT, UPDATES, ENHANCEMENTS, OR MODIFICATIONS.
 *
 * Red Hat Author(s): Owen Taylor, Behdad Esfahbod
27
 * Google Author(s): Behdad Esfahbod
28 29
 */

30
#include "hb-buffer-private.hh"
31
#include "hb-utf-private.hh"
32

33

B
Behdad Esfahbod 已提交
34 35 36 37
#ifndef HB_DEBUG_BUFFER
#define HB_DEBUG_BUFFER (HB_DEBUG+0)
#endif

38 39 40 41 42 43 44 45 46
/**
 * SECTION: hb-buffer
 * @title: Buffers
 * @short_description: Input and output buffers
 * @include: hb.h
 *
 * Buffers serve a dual role in HarfBuzz; they hold the input characters that are
 * passed to hb_shape(), and after shaping they hold the output glyphs.
 **/
47

S
Sascha Brawer 已提交
48
/**
B
Behdad Esfahbod 已提交
49
 * hb_segment_properties_equal:
K
Khaled Hosny 已提交
50 51 52 53 54
 * @a: first #hb_segment_properties_t to compare.
 * @b: second #hb_segment_properties_t to compare.
 *
 * Checks the equality of two #hb_segment_properties_t's.
 *
B
Behdad Esfahbod 已提交
55
 * Return value:
K
Khaled Hosny 已提交
56
 * %true if all properties of @a equal those of @b, %false otherwise.
B
Behdad Esfahbod 已提交
57
 *
S
Sascha Brawer 已提交
58 59
 * Since: 0.9.7
 **/
60 61 62 63 64 65 66 67 68 69 70 71
hb_bool_t
hb_segment_properties_equal (const hb_segment_properties_t *a,
			     const hb_segment_properties_t *b)
{
  /* Field-by-field comparison; stop at the first member that differs. */
  if (a->direction != b->direction) return false;
  if (a->script    != b->script)    return false;
  if (a->language  != b->language)  return false;
  if (a->reserved1 != b->reserved1) return false;

  return a->reserved2 == b->reserved2;
}

S
Sascha Brawer 已提交
72
/**
B
Behdad Esfahbod 已提交
73
 * hb_segment_properties_hash:
K
Khaled Hosny 已提交
74 75 76 77 78 79
 * @p: #hb_segment_properties_t to hash.
 *
 * Creates a hash representing @p.
 *
 * Return value:
 * A hash of @p.
B
Behdad Esfahbod 已提交
80
 *
S
Sascha Brawer 已提交
81 82
 * Since: 0.9.7
 **/
83 84 85 86 87 88 89 90 91 92
unsigned int
hb_segment_properties_hash (const hb_segment_properties_t *p)
{
  /* XOR the three identifying members together; the reserved members
   * do not take part in the hash. */
  unsigned int hash = (unsigned int) p->direction;

  hash ^= (unsigned int) p->script;
  hash ^= (intptr_t) (p->language);

  return hash;
}



93 94
/* Here is how the buffer works internally:
 *
B
Behdad Esfahbod 已提交
95 96
 * There are two info pointers: info and out_info.  They always have
 * the same allocated size, but different lengths.
97
 *
98
 * As an optimization, both info and out_info may point to the
99
 * same piece of memory, which is owned by info.  This remains the
100
 * case as long as out_len doesn't exceed i at any time.
101
 * In that case, swap_buffers() is no-op and the glyph operations operate
B
Behdad Esfahbod 已提交
102
 * mostly in-place.
103
 *
104
 * As soon as out_info gets longer than info, out_info is moved over
B
Behdad Esfahbod 已提交
105 106
 * to an alternate buffer (which we reuse the pos buffer for!), and its
 * current contents (out_len entries) are copied to the new place.
107
 * This should all remain transparent to the user.  swap_buffers() then
B
Behdad Esfahbod 已提交
108
 * switches info and out_info.
109 110
 */

B
Behdad Esfahbod 已提交
111

112 113 114 115 116

/* Internal API */

bool
hb_buffer_t::enlarge (unsigned int size)
117
{
118
  if (unlikely (in_error))
119
    return false;
B
Behdad Esfahbod 已提交
120 121 122 123 124
  if (unlikely (size > max_len))
  {
    in_error = true;
    return false;
  }
125

126
  unsigned int new_allocated = allocated;
B
Behdad Esfahbod 已提交
127 128
  hb_glyph_position_t *new_pos = NULL;
  hb_glyph_info_t *new_info = NULL;
129
  bool separate_out = out_info != info;
130

131
  if (unlikely (_hb_unsigned_int_mul_overflows (size, sizeof (info[0]))))
B
Behdad Esfahbod 已提交
132
    goto done;
133

134
  while (size >= new_allocated)
135
    new_allocated += (new_allocated >> 1) + 32;
136

137 138
  ASSERT_STATIC (sizeof (info[0]) == sizeof (pos[0]));
  if (unlikely (_hb_unsigned_int_mul_overflows (new_allocated, sizeof (info[0]))))
B
Behdad Esfahbod 已提交
139 140
    goto done;

141 142
  new_pos = (hb_glyph_position_t *) realloc (pos, new_allocated * sizeof (pos[0]));
  new_info = (hb_glyph_info_t *) realloc (info, new_allocated * sizeof (info[0]));
143

B
Behdad Esfahbod 已提交
144
done:
145
  if (unlikely (!new_pos || !new_info))
146
    in_error = true;
147 148

  if (likely (new_pos))
149
    pos = new_pos;
150 151

  if (likely (new_info))
152 153 154 155 156 157 158 159 160 161 162 163 164
    info = new_info;

  out_info = separate_out ? (hb_glyph_info_t *) pos : info;
  if (likely (!in_error))
    allocated = new_allocated;

  return likely (!in_error);
}

bool
hb_buffer_t::make_room_for (unsigned int num_in,
			    unsigned int num_out)
{
165
  if (unlikely (!ensure (out_len + num_out))) return false;
166 167 168 169 170 171 172 173 174 175

  if (out_info == info &&
      out_len + num_out > idx + num_in)
  {
    assert (have_output);

    out_info = (hb_glyph_info_t *) pos;
    memcpy (out_info, info, out_len * sizeof (out_info[0]));
  }

176
  return true;
177 178
}

179 180 181 182 183 184 185 186 187 188 189 190 191
/* Moves the unread input, info[idx..len), forward by @count entries,
 * opening a gap of @count entries in front of it, and advances both
 * idx and len by @count.  Requires have_output.  Returns false if the
 * buffer could not be grown. */
bool
hb_buffer_t::shift_forward (unsigned int count)
{
  assert (have_output);
  if (unlikely (!ensure (len + count))) return false;

  memmove (info + idx + count, info + idx, (len - idx) * sizeof (info[0]));

  if (idx + count > len)
  {
    /* The moved tail now starts beyond the old end of the array, so
     * entries [len, idx + count) were never written by anyone.  Zero
     * them so no uninitialised memory ends up inside the buffer. */
    memset (info + len, 0, (idx + count - len) * sizeof (info[0]));
  }

  len += count;
  idx += count;

  return true;
}

B
Behdad Esfahbod 已提交
192 193
/* Hands out the pos array as scratch storage.  *@size receives the number
 * of scratch_buffer_t units that fit in it.  Output and positions state is
 * dropped first, since the pos array backs both. */
hb_buffer_t::scratch_buffer_t *
hb_buffer_t::get_scratch_buffer (unsigned int *size)
{
  have_positions = false;
  have_output = false;

  out_info = info;
  out_len = 0;

  assert ((uintptr_t) pos % sizeof (scratch_buffer_t) == 0);

  scratch_buffer_t *scratch = (scratch_buffer_t *) (void *) pos;
  *size = allocated * sizeof (pos[0]) / sizeof (scratch_buffer_t);
  return scratch;
}

206

B
Behdad Esfahbod 已提交
207

208 209 210 211 212 213 214 215 216
/* HarfBuzz-Internal API */

void
hb_buffer_t::reset (void)
{
  if (unlikely (hb_object_is_inert (this)))
    return;

  hb_unicode_funcs_destroy (unicode);
217
  unicode = hb_unicode_funcs_get_default ();
218
  flags = HB_BUFFER_FLAG_DEFAULT;
219
  replacement = HB_BUFFER_REPLACEMENT_CODEPOINT_DEFAULT;
220

B
Behdad Esfahbod 已提交
221 222 223 224 225 226 227 228 229
  clear ();
}

void
hb_buffer_t::clear (void)
{
  if (unlikely (hb_object_is_inert (this)))
    return;

230
  hb_segment_properties_t default_props = HB_SEGMENT_PROPERTIES_DEFAULT;
231
  props = default_props;
232
  scratch_flags = HB_BUFFER_SCRATCH_FLAG_DEFAULT;
233

234
  content_type = HB_BUFFER_CONTENT_TYPE_INVALID;
235 236 237
  in_error = false;
  have_output = false;
  have_positions = false;
238

239 240 241
  idx = 0;
  len = 0;
  out_len = 0;
242
  out_info = info;
243

244
  serial = 0;
245 246 247

  memset (context, 0, sizeof context);
  memset (context_len, 0, sizeof context_len);
248 249

  deallocate_var_all ();
250 251
}

252 253 254
/* Appends one zero-initialised entry carrying @codepoint and @cluster,
 * with its mask set to 1.  Silently does nothing if the buffer cannot grow. */
void
hb_buffer_t::add (hb_codepoint_t  codepoint,
		  unsigned int    cluster)
{
  if (unlikely (!ensure (len + 1)))
    return;

  /* Take the slot only after ensure(), which may have moved the array. */
  hb_glyph_info_t &slot = info[len];

  memset (&slot, 0, sizeof (slot));
  slot.codepoint = codepoint;
  slot.mask = 1;
  slot.cluster = cluster;

  len++;
}
269

270 271 272 273 274 275 276 277 278 279 280
/* Appends a copy of @glyph_info.  Silently does nothing if the buffer
 * cannot grow. */
void
hb_buffer_t::add_info (const hb_glyph_info_t &glyph_info)
{
  const bool has_room = ensure (len + 1);
  if (unlikely (!has_room))
    return;

  info[len] = glyph_info;
  len += 1;
}


B
Behdad Esfahbod 已提交
281 282 283 284 285 286 287 288 289 290 291 292 293
/* Discards any output: clears have_output and have_positions and makes
 * out_info alias info again.  Does nothing on an inert buffer. */
void
hb_buffer_t::remove_output (void)
{
  if (unlikely (hb_object_is_inert (this)))
    return;

  have_positions = false;
  have_output = false;

  out_info = info;
  out_len = 0;
}

294 295
void
hb_buffer_t::clear_output (void)
B
Behdad Esfahbod 已提交
296
{
297 298 299
  if (unlikely (hb_object_is_inert (this)))
    return;

300 301
  have_output = true;
  have_positions = false;
302

303 304 305 306 307 308 309 310 311 312
  out_len = 0;
  out_info = info;
}

void
hb_buffer_t::clear_positions (void)
{
  if (unlikely (hb_object_is_inert (this)))
    return;

313 314
  have_output = false;
  have_positions = true;
315

316 317 318
  out_len = 0;
  out_info = info;

319 320 321 322 323 324 325 326 327
  memset (pos, 0, sizeof (pos[0]) * len);
}

void
hb_buffer_t::swap_buffers (void)
{
  if (unlikely (in_error)) return;

  assert (have_output);
328
  have_output = false;
329 330

  if (out_info != info)
331
  {
332 333 334 335 336 337 338 339 340 341 342 343 344 345
    hb_glyph_info_t *tmp_string;
    tmp_string = info;
    info = out_info;
    out_info = tmp_string;
    pos = (hb_glyph_position_t *) out_info;
  }

  unsigned int tmp;
  tmp = len;
  len = out_len;
  out_len = tmp;

  idx = 0;
}
346

B
Behdad Esfahbod 已提交
347

B
Behdad Esfahbod 已提交
348 349 350
void
hb_buffer_t::replace_glyphs (unsigned int num_in,
			     unsigned int num_out,
B
Minor  
Behdad Esfahbod 已提交
351
			     const uint32_t *glyph_data)
B
Behdad Esfahbod 已提交
352
{
353
  if (unlikely (!make_room_for (num_in, num_out))) return;
B
Behdad Esfahbod 已提交
354

355
  merge_clusters (idx, idx + num_in);
B
Behdad Esfahbod 已提交
356

357
  hb_glyph_info_t orig_info = info[idx];
B
Behdad Esfahbod 已提交
358 359 360 361 362 363 364 365
  hb_glyph_info_t *pinfo = &out_info[out_len];
  for (unsigned int i = 0; i < num_out; i++)
  {
    *pinfo = orig_info;
    pinfo->codepoint = glyph_data[i];
    pinfo++;
  }

366
  idx  += num_in;
367
  out_len += num_out;
B
Behdad Esfahbod 已提交
368 369
}

370 371 372
/* Emits one output entry copied from the current input entry, with its
 * codepoint replaced by @glyph_index.  The input cursor is not advanced. */
void
hb_buffer_t::output_glyph (hb_codepoint_t glyph_index)
{
  if (unlikely (!make_room_for (0, 1))) return;

  hb_glyph_info_t &dst = out_info[out_len];
  dst = info[idx];
  dst.codepoint = glyph_index;

  out_len++;
}

381
void
382
hb_buffer_t::output_info (const hb_glyph_info_t &glyph_info)
383
{
384
  if (unlikely (!make_room_for (0, 1))) return;
385 386 387 388 389 390

  out_info[out_len] = glyph_info;

  out_len++;
}

391 392 393
void
hb_buffer_t::copy_glyph (void)
{
394
  if (unlikely (!make_room_for (0, 1))) return;
395 396 397 398 399 400

  out_info[out_len] = info[idx];

  out_len++;
}

401 402 403 404 405 406 407
bool
hb_buffer_t::move_to (unsigned int i)
{
  if (!have_output)
  {
    assert (i <= len);
    idx = i;
408
    return true;
409
  }
410 411
  if (unlikely (in_error))
    return false;
412 413 414 415

  assert (i <= out_len + (len - idx));

  if (out_len < i)
416 417
  {
    unsigned int count = i - out_len;
418
    if (unlikely (!make_room_for (count, count))) return false;
419 420 421 422 423 424 425 426 427 428 429 430 431 432 433 434 435 436

    memmove (out_info + out_len, info + idx, count * sizeof (out_info[0]));
    idx += count;
    out_len += count;
  }
  else if (out_len > i)
  {
    /* Tricky part: rewinding... */
    unsigned int count = out_len - i;

    if (unlikely (idx < count && !shift_forward (count + 32))) return false;

    assert (idx >= count);

    idx -= count;
    out_len -= count;
    memmove (info + idx, out_info + out_len, count * sizeof (out_info[0]));
  }
437

438 439 440
  return true;
}

441 442 443
/* Consumes one input entry and emits it with its codepoint replaced by
 * @glyph_index. */
void
hb_buffer_t::replace_glyph (hb_codepoint_t glyph_index)
{
  /* When output is in place and level with the cursor, the entry is
   * already where it needs to be and only its codepoint changes. */
  const bool already_in_place = (out_info == info) && (out_len == idx);

  if (unlikely (!already_in_place))
  {
    if (unlikely (!make_room_for (1, 1))) return;
    out_info[out_len] = info[idx];
  }

  out_info[out_len].codepoint = glyph_index;

  out_len++;
  idx++;
}

B
Behdad Esfahbod 已提交
454

455 456 457 458 459 460 461 462 463 464 465 466 467 468 469 470 471 472 473 474 475 476 477 478 479 480 481 482 483 484 485
/* For every entry whose cluster lies in [@cluster_start, @cluster_end),
 * replaces the bits selected by @mask with the corresponding bits of
 * @value.  An empty @mask is a no-op. */
void
hb_buffer_t::set_masks (hb_mask_t    value,
			hb_mask_t    mask,
			unsigned int cluster_start,
			unsigned int cluster_end)
{
  if (!mask)
    return;

  const hb_mask_t keep_bits = ~mask;
  const hb_mask_t new_bits = value & mask;

  hb_glyph_info_t *const first = info;
  hb_glyph_info_t *const last = info + len;

  /* Whole-buffer request: no need to look at cluster values. */
  if (cluster_start == 0 && cluster_end == (unsigned int)-1)
  {
    for (hb_glyph_info_t *g = first; g != last; g++)
      g->mask = (g->mask & keep_bits) | new_bits;
    return;
  }

  for (hb_glyph_info_t *g = first; g != last; g++)
  {
    if (g->cluster < cluster_start || cluster_end <= g->cluster)
      continue;
    g->mask = (g->mask & keep_bits) | new_bits;
  }
}

void
hb_buffer_t::reverse_range (unsigned int start,
			    unsigned int end)
{
  unsigned int i, j;

486
  if (end - start < 2)
487 488 489 490 491 492 493 494 495 496
    return;

  for (i = start, j = end - 1; i < j; i++, j--) {
    hb_glyph_info_t t;

    t = info[i];
    info[i] = info[j];
    info[j] = t;
  }

497
  if (have_positions) {
498 499 500 501 502 503 504 505 506 507 508 509 510 511 512 513 514 515 516 517 518 519 520 521 522 523 524 525 526 527 528 529 530 531 532 533 534 535 536 537
    for (i = start, j = end - 1; i < j; i++, j--) {
      hb_glyph_position_t t;

      t = pos[i];
      pos[i] = pos[j];
      pos[j] = t;
    }
  }
}

void
hb_buffer_t::reverse (void)
{
  if (unlikely (!len))
    return;

  reverse_range (0, len);
}

/* Reverses the order of the clusters while keeping the entries inside
 * each cluster in their original order. */
void
hb_buffer_t::reverse_clusters (void)
{
  if (unlikely (!len))
    return;

  /* First flip everything, then flip each run of equal cluster values
   * back so that its entries regain their original relative order. */
  reverse ();

  const unsigned int count = len;
  unsigned int run_start = 0;
  unsigned int run_cluster = info[0].cluster;
  unsigned int i;

  for (i = 1; i < count; i++)
  {
    if (info[i].cluster == run_cluster)
      continue;

    reverse_range (run_start, i);
    run_start = i;
    run_cluster = info[i].cluster;
  }

  /* The last run ends at the end of the buffer. */
  reverse_range (run_start, i);
}

540
void
B
Behdad Esfahbod 已提交
541 542
hb_buffer_t::merge_clusters_impl (unsigned int start,
				  unsigned int end)
543
{
544 545
  if (cluster_level == HB_BUFFER_CLUSTER_LEVEL_CHARACTERS)
    return;
B
Behdad Esfahbod 已提交
546

547
  unsigned int cluster = info[start].cluster;
548 549

  for (unsigned int i = start + 1; i < end; i++)
550 551 552 553 554 555
    cluster = MIN (cluster, info[i].cluster);

  /* Extend end */
  while (end < len && info[end - 1].cluster == info[end].cluster)
    end++;

556 557 558 559 560 561
  /* Extend start */
  while (idx < start && info[start - 1].cluster == info[start].cluster)
    start--;

  /* If we hit the start of buffer, continue in out-buffer. */
  if (idx == start)
562
    for (unsigned int i = out_len; i && out_info[i - 1].cluster == info[start].cluster; i--)
563 564
      out_info[i - 1].cluster = cluster;

565
  for (unsigned int i = start; i < end; i++)
566
    info[i].cluster = cluster;
567 568 569 570 571
}
void
hb_buffer_t::merge_out_clusters (unsigned int start,
				 unsigned int end)
{
572 573
  if (cluster_level == HB_BUFFER_CLUSTER_LEVEL_CHARACTERS)
    return;
B
Behdad Esfahbod 已提交
574

B
Minor  
Behdad Esfahbod 已提交
575
  if (unlikely (end - start < 2))
576 577
    return;

578
  unsigned int cluster = out_info[start].cluster;
579 580

  for (unsigned int i = start + 1; i < end; i++)
581
    cluster = MIN (cluster, out_info[i].cluster);
582 583 584 585 586

  /* Extend start */
  while (start && out_info[start - 1].cluster == out_info[start].cluster)
    start--;

587 588 589 590
  /* Extend end */
  while (end < out_len && out_info[end - 1].cluster == out_info[end].cluster)
    end++;

591 592
  /* If we hit the end of out-buffer, continue in buffer. */
  if (end == out_len)
593
    for (unsigned int i = idx; i < len && info[i].cluster == out_info[end - 1].cluster; i++)
594 595
      info[i].cluster = cluster;

596
  for (unsigned int i = start; i < end; i++)
597
    out_info[i].cluster = cluster;
598
}
599 600 601 602 603 604 605 606 607 608 609 610 611 612 613 614 615 616 617 618 619 620 621 622 623 624 625 626 627 628 629 630
/* Drops the current input entry.  If no other entry would keep its
 * cluster value, that value is first folded into a neighbour: preferably
 * the tail of the output, otherwise the next input entry. */
void
hb_buffer_t::delete_glyph ()
{
  const unsigned int cluster = info[idx].cluster;
  const bool has_next = idx + 1 < len;

  if (has_next && cluster == info[idx + 1].cluster)
  {
    /* The next entry carries the same cluster, so it survives as is. */
  }
  else if (out_len)
  {
    /* Merge cluster backward, into the trailing output cluster. */
    const unsigned int old_cluster = out_info[out_len - 1].cluster;
    if (cluster < old_cluster)
    {
      unsigned int k = out_len;
      while (k && out_info[k - 1].cluster == old_cluster)
      {
	out_info[k - 1].cluster = cluster;
	k--;
      }
    }
  }
  else if (has_next)
  {
    /* Nothing in the output yet: merge cluster forward instead. */
    merge_clusters (idx, idx + 2);
  }

  skip_glyph ();
}
631

632
void
633
hb_buffer_t::guess_segment_properties (void)
634
{
635 636
  assert (content_type == HB_BUFFER_CONTENT_TYPE_UNICODE ||
	  (!len && content_type == HB_BUFFER_CONTENT_TYPE_INVALID));
637

638 639 640
  /* If script is set to INVALID, guess from buffer contents */
  if (props.script == HB_SCRIPT_INVALID) {
    for (unsigned int i = 0; i < len; i++) {
641
      hb_script_t script = unicode->script (info[i].codepoint);
642 643 644 645 646 647 648 649 650 651 652 653 654 655 656 657 658 659 660 661 662 663
      if (likely (script != HB_SCRIPT_COMMON &&
		  script != HB_SCRIPT_INHERITED &&
		  script != HB_SCRIPT_UNKNOWN)) {
        props.script = script;
        break;
      }
    }
  }

  /* If direction is set to INVALID, guess from script */
  if (props.direction == HB_DIRECTION_INVALID) {
    props.direction = hb_script_get_horizontal_direction (props.script);
  }

  /* If language is not set, use default language from locale */
  if (props.language == HB_LANGUAGE_INVALID) {
    /* TODO get_default_for_script? using $LANGUAGE */
    props.language = hb_language_get_default ();
  }
}


664 665
/* Public API */

666
/**
667
 * hb_buffer_create: (Xconstructor)
668
 *
669
 * Creates a new #hb_buffer_t with all properties to defaults.
670
 *
671 672
 * Return value: (transfer full):
 * A newly allocated #hb_buffer_t with a reference count of 1. The initial
K
Khaled Hosny 已提交
673
 * reference count should be released with hb_buffer_destroy() when you are done
674 675 676
 * using the #hb_buffer_t. This function never returns %NULL. If memory cannot
 * be allocated, a special #hb_buffer_t object will be returned on which
 * hb_buffer_allocation_successful() returns %false.
677
 *
B
Behdad Esfahbod 已提交
678
 * Since: 0.9.2
679
 **/
680
hb_buffer_t *
hb_buffer_create (void)
{
  hb_buffer_t *buffer = hb_object_create<hb_buffer_t> ();

  /* Allocation failed: hand out the shared empty buffer instead of NULL. */
  if (!buffer)
    return hb_buffer_get_empty ();

  buffer->max_len = HB_BUFFER_MAX_LEN_DEFAULT;
  buffer->reset ();

  return buffer;
}
B
Behdad Esfahbod 已提交
694

695 696 697 698 699 700 701
/**
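 * hb_buffer_get_empty:
 *
 * Returns the shared, statically allocated placeholder #hb_buffer_t, which is
 * created with its error flag already set. hb_buffer_create() returns this
 * object when it cannot allocate a new buffer.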
 *
 * Return value: (transfer full):
 *
B
Behdad Esfahbod 已提交
702
 * Since: 0.9.2
703
 **/
704 705 706
hb_buffer_t *
hb_buffer_get_empty (void)
{
  /* One shared, immutable placeholder.  It is created with in_error set,
   * so enlarge() always refuses to grow it. */
  static const hb_buffer_t nil_buffer = {
    HB_OBJECT_HEADER_STATIC,

    const_cast<hb_unicode_funcs_t *> (&_hb_unicode_funcs_nil),
    HB_BUFFER_FLAG_DEFAULT,
    HB_BUFFER_CLUSTER_LEVEL_DEFAULT,
    HB_BUFFER_REPLACEMENT_CODEPOINT_DEFAULT,
    HB_BUFFER_SCRATCH_FLAG_DEFAULT,
    HB_BUFFER_MAX_LEN_DEFAULT,

    HB_BUFFER_CONTENT_TYPE_INVALID,
    HB_SEGMENT_PROPERTIES_DEFAULT,
    true, /* in_error */
    true, /* have_output */
    true  /* have_positions */

    /* Remaining members are zero-initialised. */
  };

  hb_buffer_t *empty = const_cast<hb_buffer_t *> (&nil_buffer);
  return empty;
}

729 730
/**
 * hb_buffer_reference: (skip)
731
 * @buffer: an #hb_buffer_t.
732
 *
733 734
 * Increases the reference count on @buffer by one. This prevents @buffer from
 * being destroyed until a matching call to hb_buffer_destroy() is made.
735 736
 *
 * Return value: (transfer full):
737
 * The referenced #hb_buffer_t.
738
 *
B
Behdad Esfahbod 已提交
739
 * Since: 0.9.2
740
 **/
741 742 743
hb_buffer_t *
hb_buffer_reference (hb_buffer_t *buffer)
{
  /* Reference counting is handled by the generic object machinery. */
  hb_buffer_t *referenced = hb_object_reference (buffer);
  return referenced;
}
B
Behdad Esfahbod 已提交
746

747 748
/**
 * hb_buffer_destroy: (skip)
749
 * @buffer: an #hb_buffer_t.
750
 *
751 752 753
 * Deallocate the @buffer.
 * Decreases the reference count on @buffer by one. If the result is zero, then
 * @buffer and all associated resources are freed. See hb_buffer_reference().
754
 *
B
Behdad Esfahbod 已提交
755
 * Since: 0.9.2
756
 **/
B
Behdad Esfahbod 已提交
757
void
758
hb_buffer_destroy (hb_buffer_t *buffer)
B
Behdad Esfahbod 已提交
759
{
760
  if (!hb_object_destroy (buffer)) return;
761

B
Behdad Esfahbod 已提交
762 763
  hb_unicode_funcs_destroy (buffer->unicode);

764
  free (buffer->info);
765
  free (buffer->pos);
766 767
  if (buffer->message_destroy)
    buffer->message_destroy (buffer->message_data);
768

769
  free (buffer);
B
Behdad Esfahbod 已提交
770 771
}

772 773
/**
 * hb_buffer_set_user_data: (skip)
774
 * @buffer: an #hb_buffer_t.
775 776 777 778 779 780 781 782 783
 * @key: 
 * @data: 
 * @destroy: 
 * @replace: 
 *
 * 
 *
 * Return value: 
 *
B
Behdad Esfahbod 已提交
784
 * Since: 0.9.2
785
 **/
786 787 788 789
hb_bool_t
hb_buffer_set_user_data (hb_buffer_t        *buffer,
			 hb_user_data_key_t *key,
			 void *              data,
			 hb_destroy_func_t   destroy,
			 hb_bool_t           replace)
{
  /* Thin forwarder to the generic object user-data store. */
  const hb_bool_t stored = hb_object_set_user_data (buffer, key, data, destroy, replace);
  return stored;
}

796 797
/**
 * hb_buffer_get_user_data: (skip)
798
 * @buffer: an #hb_buffer_t.
799 800 801 802 803 804
 * @key: 
 *
 * 
 *
 * Return value: 
 *
B
Behdad Esfahbod 已提交
805
 * Since: 0.9.2
806
 **/
807 808 809 810 811 812 813
void *
hb_buffer_get_user_data (hb_buffer_t        *buffer,
			 hb_user_data_key_t *key)
{
  /* Thin forwarder to the generic object user-data store. */
  void *data = hb_object_get_user_data (buffer, key);
  return data;
}

B
Behdad Esfahbod 已提交
814

815 816
/**
 * hb_buffer_set_content_type:
817
 * @buffer: an #hb_buffer_t.
818
 * @content_type: the type of buffer contents to set
819
 *
820 821
 * Sets the type of @buffer contents, buffers are either empty, contain
 * characters (before shaping) or glyphs (the result of shaping).
822
 *
S
Sascha Brawer 已提交
823
 * Since: 0.9.5
824
 **/
825 826 827 828 829 830 831
void
hb_buffer_set_content_type (hb_buffer_t              *buffer,
			    hb_buffer_content_type_t  content_type)
{
  /* Like every other setter: never write to an inert buffer.  The empty
   * buffer returned by hb_buffer_get_empty() is a static const object. */
  if (unlikely (hb_object_is_inert (buffer)))
    return;

  buffer->content_type = content_type;
}

832 833
/**
 * hb_buffer_get_content_type:
834
 * @buffer: an #hb_buffer_t.
835
 *
836
 * see hb_buffer_set_content_type().
837
 *
838 839
 * Return value:
 * The type of @buffer contents.
840
 *
S
Sascha Brawer 已提交
841
 * Since: 0.9.5
842
 **/
843 844 845 846 847 848 849
hb_buffer_content_type_t
hb_buffer_get_content_type (hb_buffer_t *buffer)
{
  const hb_buffer_content_type_t current = buffer->content_type;
  return current;
}


850 851
/**
 * hb_buffer_set_unicode_funcs:
852
 * @buffer: an #hb_buffer_t.
853 854 855 856
 * @unicode_funcs: 
 *
 * 
 *
B
Behdad Esfahbod 已提交
857
 * Since: 0.9.2
858
 **/
B
Behdad Esfahbod 已提交
859 860
void
hb_buffer_set_unicode_funcs (hb_buffer_t        *buffer,
861
			     hb_unicode_funcs_t *unicode_funcs)
B
Behdad Esfahbod 已提交
862
{
B
Behdad Esfahbod 已提交
863 864 865
  if (unlikely (hb_object_is_inert (buffer)))
    return;

866 867
  if (!unicode_funcs)
    unicode_funcs = hb_unicode_funcs_get_default ();
868

B
Behdad Esfahbod 已提交
869

870
  hb_unicode_funcs_reference (unicode_funcs);
B
Behdad Esfahbod 已提交
871
  hb_unicode_funcs_destroy (buffer->unicode);
872
  buffer->unicode = unicode_funcs;
B
Behdad Esfahbod 已提交
873 874
}

875 876
/**
 * hb_buffer_get_unicode_funcs:
877
 * @buffer: an #hb_buffer_t.
878 879 880 881 882
 *
 * 
 *
 * Return value: 
 *
B
Behdad Esfahbod 已提交
883
 * Since: 0.9.2
884
 **/
B
Behdad Esfahbod 已提交
885 886 887 888 889 890
hb_unicode_funcs_t *
hb_buffer_get_unicode_funcs (hb_buffer_t        *buffer)
{
  /* Returned as stored; no reference is added here. */
  hb_unicode_funcs_t *funcs = buffer->unicode;
  return funcs;
}

891 892
/**
 * hb_buffer_set_direction:
893
 * @buffer: an #hb_buffer_t.
894
 * @direction: the #hb_direction_t of the @buffer
895
 *
896 897 898 899 900 901 902
 * Set the text flow direction of the buffer. No shaping can happen without
 * setting @buffer direction, and it controls the visual direction for the
 * output glyphs; for RTL direction the glyphs will be reversed. Many layout
 * features depend on the proper setting of the direction, for example,
 * reversing RTL text before shaping, then shaping with LTR direction is not
 * the same as keeping the text in logical order and shaping with RTL
 * direction.
903
 *
B
Behdad Esfahbod 已提交
904
 * Since: 0.9.2
905
 **/
B
Behdad Esfahbod 已提交
906 907 908 909 910
void
hb_buffer_set_direction (hb_buffer_t    *buffer,
			 hb_direction_t  direction)

{
  /* Inert buffers are never written to. */
  if (likely (!hb_object_is_inert (buffer)))
    buffer->props.direction = direction;
}

917 918
/**
 * hb_buffer_get_direction:
919
 * @buffer: an #hb_buffer_t.
920
 *
921
 * See hb_buffer_set_direction()
922
 *
923 924
 * Return value:
 * The direction of the @buffer.
925
 *
B
Behdad Esfahbod 已提交
926
 * Since: 0.9.2
927
 **/
B
Behdad Esfahbod 已提交
928 929 930
hb_direction_t
hb_buffer_get_direction (hb_buffer_t    *buffer)
{
  const hb_segment_properties_t &segment = buffer->props;
  return segment.direction;
}

934 935
/**
 * hb_buffer_set_script:
936
 * @buffer: an #hb_buffer_t.
937
 * @script: an #hb_script_t to set.
938
 *
939 940 941 942 943 944 945 946 947
 * Sets the script of @buffer to @script.
 *
 * Script is crucial for choosing the proper shaping behaviour for scripts that
 * require it (e.g. Arabic) and for selecting which OpenType features defined in
 * the font are to be applied.
 *
 * You can pass one of the predefined #hb_script_t values, or use
 * hb_script_from_string() or hb_script_from_iso15924_tag() to get the
 * corresponding script from an ISO 15924 script tag.
948
 *
B
Behdad Esfahbod 已提交
949
 * Since: 0.9.2
950
 **/
951 952 953 954
void
hb_buffer_set_script (hb_buffer_t *buffer,
		      hb_script_t  script)
{
  /* Inert buffers are never written to. */
  if (likely (!hb_object_is_inert (buffer)))
    buffer->props.script = script;
}

961 962
/**
 * hb_buffer_get_script:
963
 * @buffer: an #hb_buffer_t.
964
 *
965
 * See hb_buffer_set_script().
966
 *
967 968
 * Return value:
 * The #hb_script_t of the @buffer.
969
 *
B
Behdad Esfahbod 已提交
970
 * Since: 0.9.2
971
 **/
972 973 974
hb_script_t
hb_buffer_get_script (hb_buffer_t *buffer)
{
  const hb_segment_properties_t &segment = buffer->props;
  return segment.script;
}

978 979
/**
 * hb_buffer_set_language:
980
 * @buffer: an #hb_buffer_t.
981
 * @language: an hb_language_t to set.
982
 *
983 984 985 986 987 988 989 990 991
 * Sets the language of @buffer to @language.
 *
 * Languages are crucial for selecting which OpenType feature to apply to the
 * buffer which can result in applying language-specific behaviour. Languages
 * are orthogonal to the scripts, and though they are related, they are
 * different concepts and should not be confused with each other.
 *
 * Use hb_language_from_string() to convert from ISO 639 language codes to
 * #hb_language_t.
992
 *
B
Behdad Esfahbod 已提交
993
 * Since: 0.9.2
994
 **/
995 996 997 998
void
hb_buffer_set_language (hb_buffer_t   *buffer,
			hb_language_t  language)
{
  /* Inert buffers are never written to. */
  if (likely (!hb_object_is_inert (buffer)))
    buffer->props.language = language;
}

1005 1006
/**
 * hb_buffer_get_language:
1007
 * @buffer: an #hb_buffer_t.
1008
 *
1009
 * See hb_buffer_set_language().
1010
 *
1011
 * Return value: (transfer none):
1012
 * The #hb_language_t of the buffer. Must not be freed by the caller.
1013
 *
B
Behdad Esfahbod 已提交
1014
 * Since: 0.9.2
1015
 **/
1016 1017 1018
hb_language_t
hb_buffer_get_language (hb_buffer_t *buffer)
{
  const hb_segment_properties_t &segment = buffer->props;
  return segment.language;
}

1022 1023
/**
 * hb_buffer_set_segment_properties:
1024
 * @buffer: an #hb_buffer_t.
K
Khaled Hosny 已提交
1025
 * @props: an #hb_segment_properties_t to use.
1026
 *
K
Khaled Hosny 已提交
1027 1028 1029
 * Sets the segment properties of the buffer, a shortcut for calling
 * hb_buffer_set_direction(), hb_buffer_set_script() and
 * hb_buffer_set_language() individually.
1030
 *
S
Sascha Brawer 已提交
1031
 * Since: 0.9.7
1032
 **/
1033 1034 1035 1036 1037 1038 1039 1040 1041 1042
void
hb_buffer_set_segment_properties (hb_buffer_t *buffer,
				  const hb_segment_properties_t *props)
{
  /* Inert buffers are never written to; otherwise copy the whole struct. */
  if (likely (!hb_object_is_inert (buffer)))
    buffer->props = *props;
}

1043 1044
/**
 * hb_buffer_get_segment_properties:
1045
 * @buffer: an #hb_buffer_t.
K
Khaled Hosny 已提交
1046
 * @props: (out): the output #hb_segment_properties_t.
1047
 *
K
Khaled Hosny 已提交
1048
 * Sets @props to the #hb_segment_properties_t of @buffer.
1049
 *
S
Sascha Brawer 已提交
1050
 * Since: 0.9.7
1051
 **/
1052 1053 1054 1055 1056 1057 1058 1059
void
hb_buffer_get_segment_properties (hb_buffer_t *buffer,
				  hb_segment_properties_t *props)
{
  /* Copy the buffer's properties out into the caller's struct. */
  const hb_segment_properties_t &current = buffer->props;
  *props = current;
}


1060 1061
/**
 * hb_buffer_set_flags:
1062
 * @buffer: an #hb_buffer_t.
1063
 * @flags: the buffer flags to set.
1064
 *
1065
 * Sets @buffer flags to @flags. See #hb_buffer_flags_t.
1066
 *
S
Sascha Brawer 已提交
1067
 * Since: 0.9.7
1068
 **/
B
Behdad Esfahbod 已提交
1069 1070 1071 1072 1073 1074 1075 1076 1077 1078
void
hb_buffer_set_flags (hb_buffer_t       *buffer,
		     hb_buffer_flags_t  flags)
{
  /* Inert buffers are never written to. */
  if (likely (!hb_object_is_inert (buffer)))
    buffer->flags = flags;
}

1079 1080
/**
 * hb_buffer_get_flags:
1081
 * @buffer: an #hb_buffer_t.
1082
 *
1083
 * See hb_buffer_set_flags().
1084 1085
 *
 * Return value: 
1086
 * The @buffer flags.
1087
 *
S
Sascha Brawer 已提交
1088
 * Since: 0.9.7
1089
 **/
B
Behdad Esfahbod 已提交
1090 1091 1092 1093 1094 1095
hb_buffer_flags_t
hb_buffer_get_flags (hb_buffer_t *buffer)
{
  const hb_buffer_flags_t current = buffer->flags;
  return current;
}

1096 1097
/**
 * hb_buffer_set_cluster_level:
1098
 * @buffer: an #hb_buffer_t.
1099 1100 1101 1102 1103 1104 1105 1106 1107 1108 1109 1110 1111 1112 1113 1114 1115 1116
 * @cluster_level: the #hb_buffer_cluster_level_t to set.
 *
 * Sets the cluster level of @buffer to @cluster_level.
 *
 * Since: 0.9.42
 **/
void
hb_buffer_set_cluster_level (hb_buffer_t       *buffer,
		     hb_buffer_cluster_level_t  cluster_level)
{
  /* Inert buffers are never written to. */
  if (likely (!hb_object_is_inert (buffer)))
    buffer->cluster_level = cluster_level;
}

/**
 * hb_buffer_get_cluster_level:
1117
 * @buffer: an #hb_buffer_t.
1118 1119 1120 1121 1122 1123 1124 1125 1126 1127 1128 1129 1130
 *
 * See hb_buffer_set_cluster_level().
 *
 * Return value:
 * The cluster level of @buffer.
 *
 * Since: 0.9.42
 **/
hb_buffer_cluster_level_t
hb_buffer_get_cluster_level (hb_buffer_t *buffer)
{
  const hb_buffer_cluster_level_t current = buffer->cluster_level;
  return current;
}

B
Behdad Esfahbod 已提交
1131

1132 1133
/**
 * hb_buffer_set_replacement_codepoint:
1134
 * @buffer: an #hb_buffer_t.
K
Khaled Hosny 已提交
1135
 * @replacement: the replacement #hb_codepoint_t
1136
 *
K
Khaled Hosny 已提交
1137 1138 1139 1140
 * Sets the #hb_codepoint_t that replaces invalid entries for a given encoding
 * when adding text to @buffer.
 *
 * Default is %HB_BUFFER_REPLACEMENT_CODEPOINT_DEFAULT.
1141
 *
S
Sascha Brawer 已提交
1142
 * Since: 0.9.31
1143 1144 1145 1146 1147 1148 1149 1150 1151 1152 1153 1154 1155
 **/
void
hb_buffer_set_replacement_codepoint (hb_buffer_t    *buffer,
				     hb_codepoint_t  replacement)
{
  /* Inert buffers are never written to. */
  if (likely (!hb_object_is_inert (buffer)))
    buffer->replacement = replacement;
}

/**
 * hb_buffer_get_replacement_codepoint:
 * @buffer: an #hb_buffer_t.
 *
 * Fetches the replacement code point stored on @buffer; see
 * hb_buffer_set_replacement_codepoint().
 *
 * Return value:
 * The @buffer replacement #hb_codepoint_t.
 *
 * Since: 0.9.31
 **/
hb_codepoint_t
hb_buffer_get_replacement_codepoint (hb_buffer_t    *buffer)
{
  const hb_codepoint_t current_replacement = buffer->replacement;
  return current_replacement;
}


1172 1173
/**
 * hb_buffer_reset:
1174
 * @buffer: an #hb_buffer_t.
1175
 *
K
Khaled Hosny 已提交
1176 1177
 * Resets the buffer to its initial status, as if it was just newly created
 * with hb_buffer_create().
1178
 *
B
Behdad Esfahbod 已提交
1179
 * Since: 0.9.2
1180
 **/
1181 1182
void
hb_buffer_reset (hb_buffer_t *buffer)
B
Behdad Esfahbod 已提交
1183
{
1184
  buffer->reset ();
B
Behdad Esfahbod 已提交
1185 1186
}

1187 1188
/**
 * hb_buffer_clear_contents:
1189
 * @buffer: an #hb_buffer_t.
1190
 *
K
Khaled Hosny 已提交
1191 1192
 * Similar to hb_buffer_reset(), but does not clear the Unicode functions and
 * the replacement code point.
1193
 *
S
Sascha Brawer 已提交
1194
 * Since: 0.9.11
1195
 **/
B
Behdad Esfahbod 已提交
1196
void
1197
hb_buffer_clear_contents (hb_buffer_t *buffer)
B
Behdad Esfahbod 已提交
1198 1199 1200 1201
{
  buffer->clear ();
}

1202 1203
/**
 * hb_buffer_pre_allocate:
1204
 * @buffer: an #hb_buffer_t.
1205
 * @size: number of items to pre allocate.
1206
 *
1207
 * Pre allocates memory for @buffer to fit at least @size number of items.
1208
 *
1209
 * Return value:
K
Khaled Hosny 已提交
1210
 * %true if @buffer memory allocation succeeded, %false otherwise.
1211
 *
B
Behdad Esfahbod 已提交
1212
 * Since: 0.9.2
1213
 **/
1214
hb_bool_t
1215
hb_buffer_pre_allocate (hb_buffer_t *buffer, unsigned int size)
B
Behdad Esfahbod 已提交
1216
{
1217
  return buffer->ensure (size);
B
Behdad Esfahbod 已提交
1218 1219
}

1220 1221
/**
 * hb_buffer_allocation_successful:
1222
 * @buffer: an #hb_buffer_t.
1223
 *
1224
 * Check if allocating memory for the buffer succeeded.
1225
 *
1226
 * Return value:
K
Khaled Hosny 已提交
1227
 * %true if @buffer memory allocation succeeded, %false otherwise.
1228
 *
B
Behdad Esfahbod 已提交
1229
 * Since: 0.9.2
1230
 **/
1231 1232 1233 1234 1235 1236
hb_bool_t
hb_buffer_allocation_successful (hb_buffer_t  *buffer)
{
  return !buffer->in_error;
}

1237 1238
/**
 * hb_buffer_add:
1239 1240 1241
 * @buffer: an #hb_buffer_t.
 * @codepoint: a Unicode code point.
 * @cluster: the cluster value of @codepoint.
1242
 *
1243 1244 1245 1246 1247
 * Appends a character with the Unicode value of @codepoint to @buffer, and
 * gives it the initial cluster value of @cluster. Clusters can be any thing
 * the client wants, they are usually used to refer to the index of the
 * character in the input text stream and are output in
 * #hb_glyph_info_t.cluster field.
1248
 *
K
Khaled Hosny 已提交
1249 1250 1251
 * This function does not check the validity of @codepoint, it is up to the
 * caller to ensure it is a valid Unicode code point.
 *
B
Behdad Esfahbod 已提交
1252
 * Since: 0.9.7
1253
 **/
1254
void
1255 1256 1257
hb_buffer_add (hb_buffer_t    *buffer,
	       hb_codepoint_t  codepoint,
	       unsigned int    cluster)
1258
{
1259
  buffer->add (codepoint, cluster);
1260
  buffer->clear_context (1);
1261 1262
}

1263 1264
/**
 * hb_buffer_set_length:
1265
 * @buffer: an #hb_buffer_t.
K
Khaled Hosny 已提交
1266
 * @length: the new length of @buffer.
1267
 *
K
Khaled Hosny 已提交
1268 1269
 * Similar to hb_buffer_pre_allocate(), but clears any new items added at the
 * end.
1270 1271
 *
 * Return value: 
K
Khaled Hosny 已提交
1272
 * %true if @buffer memory allocation succeeded, %false otherwise.
1273
 *
B
Behdad Esfahbod 已提交
1274
 * Since: 0.9.2
1275
 **/
1276 1277 1278 1279
hb_bool_t
hb_buffer_set_length (hb_buffer_t  *buffer,
		      unsigned int  length)
{
1280 1281 1282
  if (unlikely (hb_object_is_inert (buffer)))
    return length == 0;

1283
  if (!buffer->ensure (length))
1284
    return false;
1285 1286 1287 1288 1289 1290 1291 1292 1293

  /* Wipe the new space */
  if (length > buffer->len) {
    memset (buffer->info + buffer->len, 0, sizeof (buffer->info[0]) * (length - buffer->len));
    if (buffer->have_positions)
      memset (buffer->pos + buffer->len, 0, sizeof (buffer->pos[0]) * (length - buffer->len));
  }

  buffer->len = length;
1294 1295

  if (!length)
1296 1297
  {
    buffer->content_type = HB_BUFFER_CONTENT_TYPE_INVALID;
1298
    buffer->clear_context (0);
1299
  }
1300 1301
  buffer->clear_context (1);

1302
  return true;
1303 1304
}

B
Behdad Esfahbod 已提交
1305 1306
/**
 * hb_buffer_get_length:
1307
 * @buffer: an #hb_buffer_t.
B
Behdad Esfahbod 已提交
1308 1309 1310
 *
 * Returns the number of items in the buffer.
 *
1311 1312
 * Return value:
 * The @buffer length.
K
Khaled Hosny 已提交
1313
 * The value valid as long as buffer has not been modified.
B
Behdad Esfahbod 已提交
1314
 *
B
Behdad Esfahbod 已提交
1315
 * Since: 0.9.2
B
Behdad Esfahbod 已提交
1316
 **/
1317
unsigned int
1318
hb_buffer_get_length (hb_buffer_t *buffer)
1319
{
1320
  return buffer->len;
1321 1322
}

B
Behdad Esfahbod 已提交
1323 1324
/**
 * hb_buffer_get_glyph_infos:
1325
 * @buffer: an #hb_buffer_t.
B
Behdad Esfahbod 已提交
1326 1327
 * @length: (out): output array length.
 *
1328 1329
 * Returns @buffer glyph information array.  Returned pointer
 * is valid as long as @buffer contents are not modified.
B
Behdad Esfahbod 已提交
1330
 *
1331 1332
 * Return value: (transfer none) (array length=length):
 * The @buffer glyph information array.
K
Khaled Hosny 已提交
1333
 * The value valid as long as buffer has not been modified.
B
Behdad Esfahbod 已提交
1334
 *
B
Behdad Esfahbod 已提交
1335
 * Since: 0.9.2
B
Behdad Esfahbod 已提交
1336
 **/
1337
hb_glyph_info_t *
1338 1339
hb_buffer_get_glyph_infos (hb_buffer_t  *buffer,
                           unsigned int *length)
1340
{
1341 1342 1343
  if (length)
    *length = buffer->len;

1344
  return (hb_glyph_info_t *) buffer->info;
1345 1346
}

B
Behdad Esfahbod 已提交
1347 1348
/**
 * hb_buffer_get_glyph_positions:
1349
 * @buffer: an #hb_buffer_t.
B
Behdad Esfahbod 已提交
1350 1351
 * @length: (out): output length.
 *
1352 1353
 * Returns @buffer glyph position array.  Returned pointer
 * is valid as long as @buffer contents are not modified.
B
Behdad Esfahbod 已提交
1354
 *
1355 1356
 * Return value: (transfer none) (array length=length):
 * The @buffer glyph position array.
K
Khaled Hosny 已提交
1357
 * The value valid as long as buffer has not been modified.
B
Behdad Esfahbod 已提交
1358
 *
B
Behdad Esfahbod 已提交
1359
 * Since: 0.9.2
B
Behdad Esfahbod 已提交
1360
 **/
1361
hb_glyph_position_t *
1362 1363
hb_buffer_get_glyph_positions (hb_buffer_t  *buffer,
                               unsigned int *length)
1364
{
1365
  if (!buffer->have_positions)
1366
    buffer->clear_positions ();
1367

1368 1369 1370
  if (length)
    *length = buffer->len;

1371
  return (hb_glyph_position_t *) buffer->pos;
1372
}
B
Behdad Esfahbod 已提交
1373

B
Behdad Esfahbod 已提交
1374 1375
/**
 * hb_buffer_reverse:
1376
 * @buffer: an #hb_buffer_t.
B
Behdad Esfahbod 已提交
1377 1378 1379
 *
 * Reverses buffer contents.
 *
B
Behdad Esfahbod 已提交
1380
 * Since: 0.9.2
B
Behdad Esfahbod 已提交
1381
 **/
1382 1383 1384
void
hb_buffer_reverse (hb_buffer_t *buffer)
{
1385
  buffer->reverse ();
1386 1387
}

1388 1389
/**
 * hb_buffer_reverse_range:
 * @buffer: an #hb_buffer_t.
 * @start: start index.
 * @end: end index.
 *
 * Reverses the contents of @buffer between @start and @end.
 *
 * Since: 0.9.41
 **/
void
hb_buffer_reverse_range (hb_buffer_t  *buffer,
			 unsigned int  start,
			 unsigned int  end)
{
  /* All of the work lives in the buffer object itself. */
  buffer->reverse_range (start, end);
}

B
Behdad Esfahbod 已提交
1405 1406
/**
 * hb_buffer_reverse_clusters:
1407
 * @buffer: an #hb_buffer_t.
B
Behdad Esfahbod 已提交
1408 1409 1410 1411 1412
 *
 * Reverses buffer clusters.  That is, the buffer contents are
 * reversed, then each cluster (consecutive items having the
 * same cluster number) are reversed again.
 *
B
Behdad Esfahbod 已提交
1413
 * Since: 0.9.2
B
Behdad Esfahbod 已提交
1414
 **/
1415 1416 1417
void
hb_buffer_reverse_clusters (hb_buffer_t *buffer)
{
1418
  buffer->reverse_clusters ();
1419 1420
}

B
Behdad Esfahbod 已提交
1421 1422
/**
 * hb_buffer_guess_segment_properties:
1423
 * @buffer: an #hb_buffer_t.
B
Behdad Esfahbod 已提交
1424 1425 1426 1427 1428 1429 1430 1431 1432 1433 1434 1435 1436 1437 1438 1439 1440 1441 1442
 *
 * Sets unset buffer segment properties based on buffer Unicode
 * contents.  If buffer is not empty, it must have content type
 * %HB_BUFFER_CONTENT_TYPE_UNICODE.
 *
 * If buffer script is not set (ie. is %HB_SCRIPT_INVALID), it
 * will be set to the Unicode script of the first character in
 * the buffer that has a script other than %HB_SCRIPT_COMMON,
 * %HB_SCRIPT_INHERITED, and %HB_SCRIPT_UNKNOWN.
 *
 * Next, if buffer direction is not set (ie. is %HB_DIRECTION_INVALID),
 * it will be set to the natural horizontal direction of the
 * buffer script as returned by hb_script_get_horizontal_direction().
 *
 * Finally, if buffer language is not set (ie. is %HB_LANGUAGE_INVALID),
 * it will be set to the process's default language as returned by
 * hb_language_get_default().  This may change in the future by
 * taking buffer script into consideration when choosing a language.
 *
S
Sascha Brawer 已提交
1443
 * Since: 0.9.7
B
Behdad Esfahbod 已提交
1444
 **/
1445
void
1446
hb_buffer_guess_segment_properties (hb_buffer_t *buffer)
1447
{
1448
  buffer->guess_segment_properties ();
1449 1450
}

1451
template <typename utf_t>
1452 1453
static inline void
hb_buffer_add_utf (hb_buffer_t  *buffer,
1454
		   const typename utf_t::codepoint_t *text,
1455 1456 1457 1458
		   int           text_length,
		   unsigned int  item_offset,
		   int           item_length)
{
1459
  typedef typename utf_t::codepoint_t T;
1460
  const hb_codepoint_t replacement = buffer->replacement;
1461

1462 1463 1464 1465 1466 1467
  assert (buffer->content_type == HB_BUFFER_CONTENT_TYPE_UNICODE ||
	  (!buffer->len && buffer->content_type == HB_BUFFER_CONTENT_TYPE_INVALID));

  if (unlikely (hb_object_is_inert (buffer)))
    return;

B
Behdad Esfahbod 已提交
1468
  if (text_length == -1)
1469
    text_length = utf_t::strlen (text);
1470 1471 1472 1473 1474 1475

  if (item_length == -1)
    item_length = text_length - item_offset;

  buffer->ensure (buffer->len + item_length * sizeof (T) / 4);

1476 1477 1478 1479 1480 1481 1482 1483
  /* If buffer is empty and pre-context provided, install it.
   * This check is written this way, to make sure people can
   * provide pre-context in one add_utf() call, then provide
   * text in a follow-up call.  See:
   *
   * https://bugzilla.mozilla.org/show_bug.cgi?id=801410#c13
   */
  if (!buffer->len && item_offset > 0)
1484 1485 1486 1487 1488 1489 1490 1491
  {
    /* Add pre-context */
    buffer->clear_context (0);
    const T *prev = text + item_offset;
    const T *start = text;
    while (start < prev && buffer->context_len[0] < buffer->CONTEXT_LENGTH)
    {
      hb_codepoint_t u;
1492
      prev = utf_t::prev (prev, start, &u, replacement);
1493 1494 1495 1496 1497
      buffer->context[0][buffer->context_len[0]++] = u;
    }
  }

  const T *next = text + item_offset;
1498
  const T *end = next + item_length;
1499 1500
  while (next < end)
  {
1501 1502
    hb_codepoint_t u;
    const T *old_next = next;
1503
    next = utf_t::next (next, end, &u, replacement);
1504
    buffer->add (u, old_next - (const T *) text);
1505 1506 1507 1508 1509 1510 1511 1512
  }

  /* Add post-context */
  buffer->clear_context (1);
  end = text + text_length;
  while (next < end && buffer->context_len[1] < buffer->CONTEXT_LENGTH)
  {
    hb_codepoint_t u;
1513
    next = utf_t::next (next, end, &u, replacement);
1514
    buffer->context[1][buffer->context_len[1]++] = u;
1515 1516 1517
  }

  buffer->content_type = HB_BUFFER_CONTENT_TYPE_UNICODE;
1518 1519
}

1520 1521
/**
 * hb_buffer_add_utf8:
1522
 * @buffer: an #hb_buffer_t.
K
Khaled Hosny 已提交
1523 1524
 * @text: (array length=text_length) (element-type uint8_t): an array of UTF-8
 *               characters to append.
1525 1526 1527 1528
 * @text_length: the length of the @text, or -1 if it is %NULL terminated.
 * @item_offset: the offset of the first character to add to the @buffer.
 * @item_length: the number of characters to add to the @buffer, or -1 for the
 *               end of @text (assuming it is %NULL terminated).
1529
 *
1530
 * See hb_buffer_add_codepoints().
1531
 *
K
Khaled Hosny 已提交
1532 1533 1534
 * Replaces invalid UTF-8 characters with the @buffer replacement code point,
 * see hb_buffer_set_replacement_codepoint().
 *
B
Behdad Esfahbod 已提交
1535
 * Since: 0.9.2
1536
 **/
1537 1538 1539
void
hb_buffer_add_utf8 (hb_buffer_t  *buffer,
		    const char   *text,
1540
		    int           text_length,
1541
		    unsigned int  item_offset,
1542
		    int           item_length)
1543
{
1544
  hb_buffer_add_utf<hb_utf8_t> (buffer, (const uint8_t *) text, text_length, item_offset, item_length);
1545 1546
}

1547 1548
/**
 * hb_buffer_add_utf16:
1549 1550 1551 1552 1553 1554
 * @buffer: an #hb_buffer_t.
 * @text: (array length=text_length): an array of UTF-16 characters to append.
 * @text_length: the length of the @text, or -1 if it is %NULL terminated.
 * @item_offset: the offset of the first character to add to the @buffer.
 * @item_length: the number of characters to add to the @buffer, or -1 for the
 *               end of @text (assuming it is %NULL terminated).
1555
 *
1556
 * See hb_buffer_add_codepoints().
1557
 *
K
Khaled Hosny 已提交
1558 1559 1560
 * Replaces invalid UTF-16 characters with the @buffer replacement code point,
 * see hb_buffer_set_replacement_codepoint().
 *
B
Behdad Esfahbod 已提交
1561
 * Since: 0.9.2
1562
 **/
1563 1564 1565
void
hb_buffer_add_utf16 (hb_buffer_t    *buffer,
		     const uint16_t *text,
1566
		     int             text_length,
1567
		     unsigned int    item_offset,
1568
		     int             item_length)
1569
{
1570
  hb_buffer_add_utf<hb_utf16_t> (buffer, text, text_length, item_offset, item_length);
1571 1572
}

1573 1574
/**
 * hb_buffer_add_utf32:
1575 1576 1577 1578 1579 1580
 * @buffer: an #hb_buffer_t.
 * @text: (array length=text_length): an array of UTF-32 characters to append.
 * @text_length: the length of the @text, or -1 if it is %NULL terminated.
 * @item_offset: the offset of the first character to add to the @buffer.
 * @item_length: the number of characters to add to the @buffer, or -1 for the
 *               end of @text (assuming it is %NULL terminated).
1581
 *
1582
 * See hb_buffer_add_codepoints().
1583
 *
K
Khaled Hosny 已提交
1584 1585 1586
 * Replaces invalid UTF-32 characters with the @buffer replacement code point,
 * see hb_buffer_set_replacement_codepoint().
 *
B
Behdad Esfahbod 已提交
1587
 * Since: 0.9.2
1588
 **/
1589 1590 1591
void
hb_buffer_add_utf32 (hb_buffer_t    *buffer,
		     const uint32_t *text,
1592
		     int             text_length,
1593
		     unsigned int    item_offset,
1594
		     int             item_length)
1595
{
1596 1597 1598 1599 1600
  hb_buffer_add_utf<hb_utf32_t<> > (buffer, text, text_length, item_offset, item_length);
}

/**
 * hb_buffer_add_latin1:
 * @buffer: an #hb_buffer_t.
 * @text: (array length=text_length) (element-type uint8_t): an array of
 *               8-bit characters to append.
 * @text_length: the length of the @text, or -1 if it is %NULL terminated.
 * @item_offset: the offset of the first character to add to the @buffer.
 * @item_length: the number of characters to add to the @buffer, or -1 for the
 *               end of @text (assuming it is %NULL terminated).
 *
 * Like hb_buffer_add_codepoints(), except that only the first 256 Unicode
 * code points, those that fit in 8-bit strings, are reachable.
 *
 * <note>Has nothing to do with non-Unicode Latin-1 encoding.</note>
 *
 * Since: 0.9.39
 **/
void
hb_buffer_add_latin1 (hb_buffer_t   *buffer,
		      const uint8_t *text,
		      int            text_length,
		      unsigned int   item_offset,
		      int            item_length)
{
  hb_buffer_add_utf<hb_latin1_t> (buffer,
				  text, text_length,
				  item_offset, item_length);
}

/**
 * hb_buffer_add_codepoints:
 * @buffer: a #hb_buffer_t to append characters to.
 * @text: (array length=text_length): an array of Unicode code points to append.
 * @text_length: the length of the @text, or -1 if it is %NULL terminated.
 * @item_offset: the offset of the first code point to add to the @buffer.
 * @item_length: the number of code points to add to the @buffer, or -1 for the
 *               end of @text (assuming it is %NULL terminated).
 *
 * Appends characters from the @text array to @buffer.  @item_offset is the
 * position of the first character of @text that gets appended, and
 * @item_length is the number of characters.  When shaping part of a larger
 * text (e.g. a run of text from a paragraph), it is preferable to pass the
 * whole paragraph and give the run start and length as @item_offset and
 * @item_length, respectively, rather than passing only the substring for
 * the run.  That gives HarfBuzz the full context it needs, for example, to
 * do cross-run Arabic shaping or to properly handle combining marks at the
 * start of a run.
 *
 * No validation is performed on @text: the caller is responsible for making
 * sure it contains valid Unicode code points.
 *
 * Since: 0.9.31
 **/
void
hb_buffer_add_codepoints (hb_buffer_t          *buffer,
			  const hb_codepoint_t *text,
			  int                   text_length,
			  unsigned int          item_offset,
			  int                   item_length)
{
  hb_buffer_add_utf<hb_utf32_t<false> > (buffer,
					 text, text_length,
					 item_offset, item_length);
}
B
Behdad Esfahbod 已提交
1659 1660


1661 1662 1663 1664 1665 1666 1667 1668 1669 1670 1671 1672 1673 1674 1675 1676 1677 1678 1679 1680 1681 1682 1683 1684 1685 1686 1687 1688 1689 1690 1691 1692 1693 1694 1695 1696 1697 1698 1699 1700 1701 1702
/*
 * Comparison callback ordering glyph infos by descending codepoint value:
 * the result is positive when @pb holds the larger codepoint, negative when
 * @pa does, and zero when both are equal.
 *
 * The values are compared directly instead of being subtracted as ints, so
 * the result cannot be affected by signed overflow for large values.
 */
static int
compare_info_codepoint (const hb_glyph_info_t *pa,
			const hb_glyph_info_t *pb)
{
  if (pa->codepoint < pb->codepoint)
    return +1;
  if (pa->codepoint > pb->codepoint)
    return -1;
  return 0;
}

/*
 * Normalizes the glyphs of one cluster, occupying buffer positions
 * [start, end).
 *
 * The advances of all glyphs are folded into offsets, the total advance of
 * the cluster is given to a single glyph (the last one when @backward is
 * set, the first one otherwise), and the remaining glyphs are stably sorted
 * with compare_info_codepoint(), infos and positions moving together.
 */
static inline void
normalize_glyphs_cluster (hb_buffer_t *buffer,
			  unsigned int start,
			  unsigned int end,
			  bool backward)
{
  hb_glyph_position_t *pos = buffer->pos;

  /* Shift every glyph by the advances of the glyphs before it and zero its
   * own advance.  When the loop is done the running sums hold the total
   * cluster advance. */
  hb_position_t total_x_advance = 0, total_y_advance = 0;
  for (unsigned int i = start; i < end; i++)
  {
    hb_glyph_position_t &glyph_pos = pos[i];

    glyph_pos.x_offset += total_x_advance;
    glyph_pos.y_offset += total_y_advance;

    total_x_advance += glyph_pos.x_advance;
    total_y_advance += glyph_pos.y_advance;

    glyph_pos.x_advance = 0;
    glyph_pos.y_advance = 0;
  }

  const unsigned int sortable = end - start - 1;

  if (!backward)
  {
    /* Transfer all cluster advance to the first glyph. */
    pos[start].x_advance += total_x_advance;
    pos[start].y_advance += total_y_advance;
    for (unsigned int i = start + 1; i < end; i++)
    {
      pos[i].x_offset -= total_x_advance;
      pos[i].y_offset -= total_y_advance;
    }

    /* Everything but the first glyph gets sorted. */
    hb_stable_sort (buffer->info + start + 1, sortable, compare_info_codepoint, buffer->pos + start + 1);
    return;
  }

  /* Transfer all cluster advance to the last glyph. */
  pos[end - 1].x_advance = total_x_advance;
  pos[end - 1].y_advance = total_y_advance;

  /* Everything but the last glyph gets sorted. */
  hb_stable_sort (buffer->info + start, sortable, compare_info_codepoint, buffer->pos + start);
}

1716 1717
/**
 * hb_buffer_normalize_glyphs:
1718
 * @buffer: an #hb_buffer_t.
1719
 *
K
Khaled Hosny 已提交
1720 1721 1722 1723
 * Reorders a glyph buffer to have canonical in-cluster glyph order / position.
 * The resulting clusters should behave identical to pre-reordering clusters.
 *
 * <note>This has nothing to do with Unicode normalization.</note>
1724
 *
S
Sascha Brawer 已提交
1725
 * Since: 0.9.2
1726
 **/
1727 1728 1729 1730
void
hb_buffer_normalize_glyphs (hb_buffer_t *buffer)
{
  assert (buffer->have_positions);
B
Minor  
Behdad Esfahbod 已提交
1731
  assert (buffer->content_type == HB_BUFFER_CONTENT_TYPE_GLYPHS);
1732 1733 1734 1735 1736 1737 1738 1739 1740 1741 1742 1743 1744 1745 1746 1747

  bool backward = HB_DIRECTION_IS_BACKWARD (buffer->props.direction);

  unsigned int count = buffer->len;
  if (unlikely (!count)) return;
  hb_glyph_info_t *info = buffer->info;

  unsigned int start = 0;
  unsigned int end;
  for (end = start + 1; end < count; end++)
    if (info[start].cluster != info[end].cluster) {
      normalize_glyphs_cluster (buffer, start, end, backward);
      start = end;
    }
  normalize_glyphs_cluster (buffer, start, end, backward);
}
1748 1749 1750 1751 1752 1753 1754 1755 1756 1757 1758 1759 1760 1761 1762 1763 1764 1765 1766 1767 1768

/*
 * Sorts the glyph infos in [start, end) with an insertion sort driven by
 * @compar (positive result: first argument sorts after the second).
 *
 * Items are only moved past neighbours that compare strictly greater, so
 * items comparing equal keep their relative order.  Only info[] is
 * rearranged here, and the function asserts that the buffer has no
 * positions.  Whenever an item is moved, merge_clusters() is called on the
 * range the item travels across.
 */
void
hb_buffer_t::sort (unsigned int start, unsigned int end, int(*compar)(const hb_glyph_info_t *, const hb_glyph_info_t *))
{
  assert (!have_positions);
  for (unsigned int i = start + 1; i < end; i++)
  {
    /* Find the insertion point j for item i within the already-sorted
     * prefix [start, i). */
    unsigned int j = i;
    while (j > start && compar (&info[j - 1], &info[i]) > 0)
      j--;
    if (i == j)
      continue; /* Already in place. */
    /* Move item i to occupy place for item j, shift what's in between. */
    merge_clusters (j, i + 1);
    {
      /* Save item i, slide [j, i) up by one slot, then drop it at j. */
      hb_glyph_info_t t = info[i];
      memmove (&info[j + 1], &info[j], (i - j) * sizeof (hb_glyph_info_t));
      info[j] = t;
    }
  }
}
1769 1770 1771 1772 1773 1774 1775

/*
 * Debugging.
 */

/**
 * hb_buffer_set_message_func:
 * @buffer: an #hb_buffer_t.
 * @func: (closure user_data) (destroy destroy) (scope notified): the message
 *        callback to install on @buffer, or %NULL to remove the current one.
 * @user_data: data passed to @func on every invocation.
 * @destroy: function called on @user_data when the callback is replaced,
 *           or %NULL.
 *
 * Installs @func as the message callback of @buffer.  The destroy function
 * of the previously installed callback, if any, is invoked on the previous
 * user data first.
 *
 * If @buffer is an inert object nothing is installed, and @destroy (when
 * not %NULL) is called on @user_data right away.
 *
 * Since: 1.1.3
 **/
void
hb_buffer_set_message_func (hb_buffer_t *buffer,
			    hb_buffer_message_func_t func,
			    void *user_data, hb_destroy_func_t destroy)
{
  /* Like the other setters, never write to an inert buffer.  The caller
   * handed @user_data over, so release it here instead of leaking it. */
  if (unlikely (hb_object_is_inert (buffer)))
  {
    if (destroy)
      destroy (user_data);
    return;
  }

  /* Release the data of the callback being replaced. */
  if (buffer->message_destroy)
    buffer->message_destroy (buffer->message_data);

  if (func) {
    buffer->message_func = func;
    buffer->message_data = user_data;
    buffer->message_destroy = destroy;
  } else {
    buffer->message_func = NULL;
    buffer->message_data = NULL;
    buffer->message_destroy = NULL;
  }
}

/*
 * Formats a printf-style message from @fmt / @ap and passes it, together
 * with @font and the stored message data, to the installed message callback.
 * The callback's result is returned converted to bool.
 *
 * The text is formatted into a fixed 100-byte scratch area with vsnprintf().
 */
bool
hb_buffer_t::message_impl (hb_font_t *font, const char *fmt, va_list ap)
{
  char text[100];
  vsnprintf (text, sizeof (text),  fmt, ap);

  const bool result = (bool) this->message_func (this, font, text, this->message_data);
  return result;
}