Blame src/hb-set-private.hh

Packit 874993
/*
Packit 874993
 * Copyright © 2012  Google, Inc.
Packit 874993
 *
Packit 874993
 *  This is part of HarfBuzz, a text shaping library.
Packit 874993
 *
Packit 874993
 * Permission is hereby granted, without written agreement and without
Packit 874993
 * license or royalty fees, to use, copy, modify, and distribute this
Packit 874993
 * software and its documentation for any purpose, provided that the
Packit 874993
 * above copyright notice and the following two paragraphs appear in
Packit 874993
 * all copies of this software.
Packit 874993
 *
Packit 874993
 * IN NO EVENT SHALL THE COPYRIGHT HOLDER BE LIABLE TO ANY PARTY FOR
Packit 874993
 * DIRECT, INDIRECT, SPECIAL, INCIDENTAL, OR CONSEQUENTIAL DAMAGES
Packit 874993
 * ARISING OUT OF THE USE OF THIS SOFTWARE AND ITS DOCUMENTATION, EVEN
Packit 874993
 * IF THE COPYRIGHT HOLDER HAS BEEN ADVISED OF THE POSSIBILITY OF SUCH
Packit 874993
 * DAMAGE.
Packit 874993
 *
Packit 874993
 * THE COPYRIGHT HOLDER SPECIFICALLY DISCLAIMS ANY WARRANTIES, INCLUDING,
Packit 874993
 * BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND
Packit 874993
 * FITNESS FOR A PARTICULAR PURPOSE.  THE SOFTWARE PROVIDED HEREUNDER IS
Packit 874993
 * ON AN "AS IS" BASIS, AND THE COPYRIGHT HOLDER HAS NO OBLIGATION TO
Packit 874993
 * PROVIDE MAINTENANCE, SUPPORT, UPDATES, ENHANCEMENTS, OR MODIFICATIONS.
Packit 874993
 *
Packit 874993
 * Google Author(s): Behdad Esfahbod
Packit 874993
 */
Packit 874993
Packit 874993
#ifndef HB_SET_PRIVATE_HH
Packit 874993
#define HB_SET_PRIVATE_HH
Packit 874993
Packit 874993
#include "hb-private.hh"
Packit 874993
#include "hb-object-private.hh"
Packit 874993
Packit 874993
Packit 874993
/*
 * The set digests here implement various "filters" that support
 * "approximate member query".  Conceptually these are like Bloom
 * Filters and Quotient Filters, but much smaller and faster, and
 * designed to fit the requirements of our uses for glyph coverage
 * queries.
 *
 * Our filters are highly accurate if the lookup covers a fairly local
 * set of glyphs, but fully flooded and ineffective if coverage is
 * all over the place.
 *
 * The frozen-set can be used instead of a digest, to trade more
 * memory for 100% accuracy, but in practice, that doesn't look like
 * an attractive trade-off.
 */
Packit 874993
Packit 874993
template <typename mask_t, unsigned int shift>
Packit 874993
struct hb_set_digest_lowest_bits_t
Packit 874993
{
Packit 874993
  ASSERT_POD ();
Packit 874993
Packit 874993
  static const unsigned int mask_bytes = sizeof (mask_t);
Packit 874993
  static const unsigned int mask_bits = sizeof (mask_t) * 8;
Packit 874993
  static const unsigned int num_bits = 0
Packit 874993
				     + (mask_bytes >= 1 ? 3 : 0)
Packit 874993
				     + (mask_bytes >= 2 ? 1 : 0)
Packit 874993
				     + (mask_bytes >= 4 ? 1 : 0)
Packit 874993
				     + (mask_bytes >= 8 ? 1 : 0)
Packit 874993
				     + (mask_bytes >= 16? 1 : 0)
Packit 874993
				     + 0;
Packit 874993
Packit 874993
  ASSERT_STATIC (shift < sizeof (hb_codepoint_t) * 8);
Packit 874993
  ASSERT_STATIC (shift + num_bits <= sizeof (hb_codepoint_t) * 8);
Packit 874993
Packit 874993
  inline void init (void) {
Packit 874993
    mask = 0;
Packit 874993
  }
Packit 874993
Packit 874993
  inline void add (hb_codepoint_t g) {
Packit 874993
    mask |= mask_for (g);
Packit 874993
  }
Packit 874993
Packit 874993
  inline void add_range (hb_codepoint_t a, hb_codepoint_t b) {
Packit 874993
    if ((b >> shift) - (a >> shift) >= mask_bits - 1)
Packit 874993
      mask = (mask_t) -1;
Packit 874993
    else {
Packit 874993
      mask_t ma = mask_for (a);
Packit 874993
      mask_t mb = mask_for (b);
Packit 874993
      mask |= mb + (mb - ma) - (mb < ma);
Packit 874993
    }
Packit 874993
  }
Packit 874993
Packit 874993
  inline bool may_have (hb_codepoint_t g) const {
Packit 874993
    return !!(mask & mask_for (g));
Packit 874993
  }
Packit 874993
Packit 874993
  private:
Packit 874993
Packit 874993
  static inline mask_t mask_for (hb_codepoint_t g) {
Packit 874993
    return ((mask_t) 1) << ((g >> shift) & (mask_bits - 1));
Packit 874993
  }
Packit 874993
  mask_t mask;
Packit 874993
};
Packit 874993
Packit 874993
template <typename head_t, typename tail_t>
Packit 874993
struct hb_set_digest_combiner_t
Packit 874993
{
Packit 874993
  ASSERT_POD ();
Packit 874993
Packit 874993
  inline void init (void) {
Packit 874993
    head.init ();
Packit 874993
    tail.init ();
Packit 874993
  }
Packit 874993
Packit 874993
  inline void add (hb_codepoint_t g) {
Packit 874993
    head.add (g);
Packit 874993
    tail.add (g);
Packit 874993
  }
Packit 874993
Packit 874993
  inline void add_range (hb_codepoint_t a, hb_codepoint_t b) {
Packit 874993
    head.add_range (a, b);
Packit 874993
    tail.add_range (a, b);
Packit 874993
  }
Packit 874993
Packit 874993
  inline bool may_have (hb_codepoint_t g) const {
Packit 874993
    return head.may_have (g) && tail.may_have (g);
Packit 874993
  }
Packit 874993
Packit 874993
  private:
Packit 874993
  head_t head;
Packit 874993
  tail_t tail;
Packit 874993
};
Packit 874993
Packit 874993
Packit 874993
/*
Packit 874993
 * hb_set_digest_t
Packit 874993
 *
Packit 874993
 * This is a combination of digests that performs "best".
Packit 874993
 * There is not much science to this: it's a result of intuition
Packit 874993
 * and testing.
Packit 874993
 */
Packit 874993
typedef hb_set_digest_combiner_t
Packit 874993
<
Packit 874993
  hb_set_digest_lowest_bits_t<unsigned long, 4>,
Packit 874993
  hb_set_digest_combiner_t
Packit 874993
  <
Packit 874993
    hb_set_digest_lowest_bits_t<unsigned long, 0>,
Packit 874993
    hb_set_digest_lowest_bits_t<unsigned long, 9>
Packit 874993
  >
Packit 874993
> hb_set_digest_t;
Packit 874993
Packit 874993
Packit 874993
Packit 874993
/*
Packit 874993
 * hb_set_t
Packit 874993
 */
Packit 874993
Packit 874993
Packit 874993
/* TODO Make this faster and more memory-efficient. */
Packit 874993
Packit 874993
struct hb_set_t
Packit 874993
{
Packit 874993
  friend struct hb_frozen_set_t;
Packit 874993
Packit 874993
  hb_object_header_t header;
Packit 874993
  ASSERT_POD ();
Packit 874993
  bool in_error;
Packit 874993
Packit 874993
  inline void init (void) {
Packit 874993
    hb_object_init (this);
Packit 874993
    clear ();
Packit 874993
  }
Packit 874993
  inline void fini (void) {
Packit 874993
  }
Packit 874993
  inline void clear (void) {
Packit 874993
    if (unlikely (hb_object_is_inert (this)))
Packit 874993
      return;
Packit 874993
    in_error = false;
Packit 874993
    memset (elts, 0, sizeof elts);
Packit 874993
  }
Packit 874993
  inline bool is_empty (void) const {
Packit 874993
    for (unsigned int i = 0; i < ARRAY_LENGTH (elts); i++)
Packit 874993
      if (elts[i])
Packit 874993
        return false;
Packit 874993
    return true;
Packit 874993
  }
Packit 874993
  inline void add (hb_codepoint_t g)
Packit 874993
  {
Packit 874993
    if (unlikely (in_error)) return;
Packit 874993
    if (unlikely (g == INVALID)) return;
Packit 874993
    if (unlikely (g > MAX_G)) return;
Packit 874993
    elt (g) |= mask (g);
Packit 874993
  }
Packit 874993
  inline void add_range (hb_codepoint_t a, hb_codepoint_t b)
Packit 874993
  {
Packit 874993
    if (unlikely (in_error)) return;
Packit 874993
    /* TODO Speedup */
Packit 874993
    for (unsigned int i = a; i < b + 1; i++)
Packit 874993
      add (i);
Packit 874993
  }
Packit 874993
  inline void del (hb_codepoint_t g)
Packit 874993
  {
Packit 874993
    if (unlikely (in_error)) return;
Packit 874993
    if (unlikely (g > MAX_G)) return;
Packit 874993
    elt (g) &= ~mask (g);
Packit 874993
  }
Packit 874993
  inline void del_range (hb_codepoint_t a, hb_codepoint_t b)
Packit 874993
  {
Packit 874993
    if (unlikely (in_error)) return;
Packit 874993
    /* TODO Speedup */
Packit 874993
    for (unsigned int i = a; i < b + 1; i++)
Packit 874993
      del (i);
Packit 874993
  }
Packit 874993
  inline bool has (hb_codepoint_t g) const
Packit 874993
  {
Packit 874993
    if (unlikely (g > MAX_G)) return false;
Packit 874993
    return !!(elt (g) & mask (g));
Packit 874993
  }
Packit 874993
  inline bool intersects (hb_codepoint_t first,
Packit 874993
			  hb_codepoint_t last) const
Packit 874993
  {
Packit 874993
    if (unlikely (first > MAX_G)) return false;
Packit 874993
    if (unlikely (last  > MAX_G)) last = MAX_G;
Packit 874993
    unsigned int end = last + 1;
Packit 874993
    for (hb_codepoint_t i = first; i < end; i++)
Packit 874993
      if (has (i))
Packit 874993
        return true;
Packit 874993
    return false;
Packit 874993
  }
Packit 874993
  inline bool is_equal (const hb_set_t *other) const
Packit 874993
  {
Packit 874993
    for (unsigned int i = 0; i < ELTS; i++)
Packit 874993
      if (elts[i] != other->elts[i])
Packit 874993
        return false;
Packit 874993
    return true;
Packit 874993
  }
Packit 874993
  inline void set (const hb_set_t *other)
Packit 874993
  {
Packit 874993
    if (unlikely (in_error)) return;
Packit 874993
    for (unsigned int i = 0; i < ELTS; i++)
Packit 874993
      elts[i] = other->elts[i];
Packit 874993
  }
Packit 874993
  inline void union_ (const hb_set_t *other)
Packit 874993
  {
Packit 874993
    if (unlikely (in_error)) return;
Packit 874993
    for (unsigned int i = 0; i < ELTS; i++)
Packit 874993
      elts[i] |= other->elts[i];
Packit 874993
  }
Packit 874993
  inline void intersect (const hb_set_t *other)
Packit 874993
  {
Packit 874993
    if (unlikely (in_error)) return;
Packit 874993
    for (unsigned int i = 0; i < ELTS; i++)
Packit 874993
      elts[i] &= other->elts[i];
Packit 874993
  }
Packit 874993
  inline void subtract (const hb_set_t *other)
Packit 874993
  {
Packit 874993
    if (unlikely (in_error)) return;
Packit 874993
    for (unsigned int i = 0; i < ELTS; i++)
Packit 874993
      elts[i] &= ~other->elts[i];
Packit 874993
  }
Packit 874993
  inline void symmetric_difference (const hb_set_t *other)
Packit 874993
  {
Packit 874993
    if (unlikely (in_error)) return;
Packit 874993
    for (unsigned int i = 0; i < ELTS; i++)
Packit 874993
      elts[i] ^= other->elts[i];
Packit 874993
  }
Packit 874993
  inline void invert (void)
Packit 874993
  {
Packit 874993
    if (unlikely (in_error)) return;
Packit 874993
    for (unsigned int i = 0; i < ELTS; i++)
Packit 874993
      elts[i] = ~elts[i];
Packit 874993
  }
Packit 874993
  inline bool next (hb_codepoint_t *codepoint) const
Packit 874993
  {
Packit 874993
    if (unlikely (*codepoint == INVALID)) {
Packit 874993
      hb_codepoint_t i = get_min ();
Packit 874993
      if (i != INVALID) {
Packit 874993
        *codepoint = i;
Packit 874993
	return true;
Packit 874993
      } else {
Packit 874993
	*codepoint = INVALID;
Packit 874993
        return false;
Packit 874993
      }
Packit 874993
    }
Packit 874993
    for (hb_codepoint_t i = *codepoint + 1; i < MAX_G + 1; i++)
Packit 874993
      if (has (i)) {
Packit 874993
        *codepoint = i;
Packit 874993
	return true;
Packit 874993
      }
Packit 874993
    *codepoint = INVALID;
Packit 874993
    return false;
Packit 874993
  }
Packit 874993
  inline bool next_range (hb_codepoint_t *first, hb_codepoint_t *last) const
Packit 874993
  {
Packit 874993
    hb_codepoint_t i;
Packit 874993
Packit 874993
    i = *last;
Packit 874993
    if (!next (&i))
Packit 874993
    {
Packit 874993
      *last = *first = INVALID;
Packit 874993
      return false;
Packit 874993
    }
Packit 874993
Packit 874993
    *last = *first = i;
Packit 874993
    while (next (&i) && i == *last + 1)
Packit 874993
      (*last)++;
Packit 874993
Packit 874993
    return true;
Packit 874993
  }
Packit 874993
Packit 874993
  inline unsigned int get_population (void) const
Packit 874993
  {
Packit 874993
    unsigned int count = 0;
Packit 874993
    for (unsigned int i = 0; i < ELTS; i++)
Packit 874993
      count += _hb_popcount32 (elts[i]);
Packit 874993
    return count;
Packit 874993
  }
Packit 874993
  inline hb_codepoint_t get_min (void) const
Packit 874993
  {
Packit 874993
    for (unsigned int i = 0; i < ELTS; i++)
Packit 874993
      if (elts[i])
Packit 874993
	for (unsigned int j = 0; j < BITS; j++)
Packit 874993
	  if (elts[i] & (1u << j))
Packit 874993
	    return i * BITS + j;
Packit 874993
    return INVALID;
Packit 874993
  }
Packit 874993
  inline hb_codepoint_t get_max (void) const
Packit 874993
  {
Packit 874993
    for (unsigned int i = ELTS; i; i--)
Packit 874993
      if (elts[i - 1])
Packit 874993
	for (unsigned int j = BITS; j; j--)
Packit 874993
	  if (elts[i - 1] & (1u << (j - 1)))
Packit 874993
	    return (i - 1) * BITS + (j - 1);
Packit 874993
    return INVALID;
Packit 874993
  }
Packit 874993
Packit 874993
  typedef uint32_t elt_t;
Packit 874993
  static const unsigned int MAX_G = 65536 - 1; /* XXX Fix this... */
Packit 874993
  static const unsigned int SHIFT = 5;
Packit 874993
  static const unsigned int BITS = (1 << SHIFT);
Packit 874993
  static const unsigned int MASK = BITS - 1;
Packit 874993
  static const unsigned int ELTS = (MAX_G + 1 + (BITS - 1)) / BITS;
Packit 874993
  static  const hb_codepoint_t INVALID = HB_SET_VALUE_INVALID;
Packit 874993
Packit 874993
  elt_t &elt (hb_codepoint_t g) { return elts[g >> SHIFT]; }
Packit 874993
  elt_t const &elt (hb_codepoint_t g) const { return elts[g >> SHIFT]; }
Packit 874993
  elt_t mask (hb_codepoint_t g) const { return elt_t (1) << (g & MASK); }
Packit 874993
Packit 874993
  elt_t elts[ELTS]; /* XXX 8kb */
Packit 874993
Packit 874993
  ASSERT_STATIC (sizeof (elt_t) * 8 == BITS);
Packit 874993
  ASSERT_STATIC (sizeof (elt_t) * 8 * ELTS > MAX_G);
Packit 874993
};
Packit 874993
Packit 874993
struct hb_frozen_set_t
Packit 874993
{
Packit 874993
  static const unsigned int SHIFT = hb_set_t::SHIFT;
Packit 874993
  static const unsigned int BITS = hb_set_t::BITS;
Packit 874993
  static const unsigned int MASK = hb_set_t::MASK;
Packit 874993
  typedef hb_set_t::elt_t elt_t;
Packit 874993
Packit 874993
  inline void init (const hb_set_t &set)
Packit 874993
  {
Packit 874993
    start = count = 0;
Packit 874993
    elts = NULL;
Packit 874993
Packit 874993
    unsigned int max = set.get_max ();
Packit 874993
    if (max == set.INVALID)
Packit 874993
      return;
Packit 874993
    unsigned int min = set.get_min ();
Packit 874993
    const elt_t &min_elt = set.elt (min);
Packit 874993
Packit 874993
    start = min & ~MASK;
Packit 874993
    count = max - start + 1;
Packit 874993
    unsigned int num_elts = (count + BITS - 1) / BITS;
Packit 874993
    unsigned int elts_size = num_elts * sizeof (elt_t);
Packit 874993
    elts = (elt_t *) malloc (elts_size);
Packit 874993
    if (unlikely (!elts))
Packit 874993
    {
Packit 874993
      start = count = 0;
Packit 874993
      return;
Packit 874993
    }
Packit 874993
    memcpy (elts, &min_elt, elts_size);
Packit 874993
  }
Packit 874993
Packit 874993
  inline void fini (void)
Packit 874993
  {
Packit 874993
    if (elts)
Packit 874993
      free (elts);
Packit 874993
  }
Packit 874993
Packit 874993
  inline bool has (hb_codepoint_t g) const
Packit 874993
  {
Packit 874993
    /* hb_codepoint_t is unsigned. */
Packit 874993
    g -= start;
Packit 874993
    if (unlikely (g > count)) return false;
Packit 874993
    return !!(elt (g) & mask (g));
Packit 874993
  }
Packit 874993
Packit 874993
  elt_t const &elt (hb_codepoint_t g) const { return elts[g >> SHIFT]; }
Packit 874993
  elt_t mask (hb_codepoint_t g) const { return elt_t (1) << (g & MASK); }
Packit 874993
Packit 874993
  private:
Packit 874993
  hb_codepoint_t start, count;
Packit 874993
  elt_t *elts;
Packit 874993
};
Packit 874993
Packit 874993
Packit 874993
#endif /* HB_SET_PRIVATE_HH */