2017-10-15 14:09:05 +02:00
|
|
|
/*
|
|
|
|
* Copyright © 2012 Google, Inc.
|
|
|
|
*
|
|
|
|
* This is part of HarfBuzz, a text shaping library.
|
|
|
|
*
|
|
|
|
* Permission is hereby granted, without written agreement and without
|
|
|
|
* license or royalty fees, to use, copy, modify, and distribute this
|
|
|
|
* software and its documentation for any purpose, provided that the
|
|
|
|
* above copyright notice and the following two paragraphs appear in
|
|
|
|
* all copies of this software.
|
|
|
|
*
|
|
|
|
* IN NO EVENT SHALL THE COPYRIGHT HOLDER BE LIABLE TO ANY PARTY FOR
|
|
|
|
* DIRECT, INDIRECT, SPECIAL, INCIDENTAL, OR CONSEQUENTIAL DAMAGES
|
|
|
|
* ARISING OUT OF THE USE OF THIS SOFTWARE AND ITS DOCUMENTATION, EVEN
|
|
|
|
* IF THE COPYRIGHT HOLDER HAS BEEN ADVISED OF THE POSSIBILITY OF SUCH
|
|
|
|
* DAMAGE.
|
|
|
|
*
|
|
|
|
* THE COPYRIGHT HOLDER SPECIFICALLY DISCLAIMS ANY WARRANTIES, INCLUDING,
|
|
|
|
* BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND
|
|
|
|
* FITNESS FOR A PARTICULAR PURPOSE. THE SOFTWARE PROVIDED HEREUNDER IS
|
|
|
|
* ON AN "AS IS" BASIS, AND THE COPYRIGHT HOLDER HAS NO OBLIGATION TO
|
|
|
|
* PROVIDE MAINTENANCE, SUPPORT, UPDATES, ENHANCEMENTS, OR MODIFICATIONS.
|
|
|
|
*
|
|
|
|
* Google Author(s): Behdad Esfahbod
|
|
|
|
*/
|
|
|
|
|
2018-08-26 07:36:36 +02:00
|
|
|
#ifndef HB_SET_DIGEST_HH
|
|
|
|
#define HB_SET_DIGEST_HH
|
2017-10-15 14:09:05 +02:00
|
|
|
|
2018-08-26 07:36:36 +02:00
|
|
|
#include "hb.hh"
|
2017-10-15 14:09:05 +02:00
|
|
|
|
|
|
|
/*
|
2022-06-08 19:35:50 +02:00
|
|
|
* The set-digests here implement various "filters" that support
|
2017-10-15 14:09:05 +02:00
|
|
|
* "approximate member query". Conceptually these are like Bloom
|
|
|
|
* Filter and Quotient Filter, however, much smaller, faster, and
|
|
|
|
* designed to fit the requirements of our uses for glyph coverage
|
|
|
|
* queries.
|
|
|
|
*
|
|
|
|
* Our filters are highly accurate if the lookup covers a fairly local
|
|
|
|
* set of glyphs, but fully flooded and ineffective if coverage is
|
|
|
|
* all over the place.
|
|
|
|
*
|
2022-06-08 19:35:50 +02:00
|
|
|
* The way these are used is that the filter is first populated by
|
|
|
|
* a lookup's or subtable's Coverage table(s), and then when we
|
|
|
|
* want to apply the lookup or subtable to a glyph, before trying
|
|
|
|
* to apply, we ask the filter if the glyph may be covered. If it's
|
|
|
|
* not, we return early.
|
|
|
|
*
|
|
|
|
* We use these filters both at the lookup-level, and then again,
|
|
|
|
* at the subtable-level. Both yield a performance win.
|
|
|
|
*
|
2022-06-08 19:37:12 +02:00
|
|
|
* The main filter we use is a combination of three bits-pattern
|
2022-06-08 19:38:17 +02:00
|
|
|
* filters. A bits-pattern filter checks a number of bits (5 or 6)
|
2022-06-08 19:35:50 +02:00
|
|
|
* of the input number (glyph-id in this case) and checks whether
|
2022-06-08 19:45:14 +02:00
|
|
|
* its pattern is amongst the patterns of any of the accepted values.
|
|
|
|
* The accepted patterns are represented as a "long" integer. The
|
2022-06-08 19:35:50 +02:00
|
|
|
* check is done using four bitwise operations only.
|
2017-10-15 14:09:05 +02:00
|
|
|
*/
|
|
|
|
|
|
|
|
template <typename mask_t, unsigned int shift>
|
2022-06-08 19:37:12 +02:00
|
|
|
struct hb_set_digest_bits_pattern_t
|
2017-10-15 14:09:05 +02:00
|
|
|
{
|
2019-01-22 12:15:23 +01:00
|
|
|
static constexpr unsigned mask_bytes = sizeof (mask_t);
|
|
|
|
static constexpr unsigned mask_bits = sizeof (mask_t) * 8;
|
2019-01-25 16:08:25 +01:00
|
|
|
static constexpr unsigned num_bits = 0
|
|
|
|
+ (mask_bytes >= 1 ? 3 : 0)
|
|
|
|
+ (mask_bytes >= 2 ? 1 : 0)
|
|
|
|
+ (mask_bytes >= 4 ? 1 : 0)
|
|
|
|
+ (mask_bytes >= 8 ? 1 : 0)
|
|
|
|
+ (mask_bytes >= 16? 1 : 0)
|
|
|
|
+ 0;
|
2017-10-15 14:09:05 +02:00
|
|
|
|
2018-09-16 19:33:48 +02:00
|
|
|
static_assert ((shift < sizeof (hb_codepoint_t) * 8), "");
|
|
|
|
static_assert ((shift + num_bits <= sizeof (hb_codepoint_t) * 8), "");
|
2017-10-15 14:09:05 +02:00
|
|
|
|
2018-12-17 19:01:01 +01:00
|
|
|
void init () { mask = 0; }
|
2017-10-15 14:09:05 +02:00
|
|
|
|
2018-12-16 20:08:10 +01:00
|
|
|
void add (hb_codepoint_t g) { mask |= mask_for (g); }
|
2017-10-15 14:09:05 +02:00
|
|
|
|
2018-12-16 20:08:10 +01:00
|
|
|
bool add_range (hb_codepoint_t a, hb_codepoint_t b)
|
|
|
|
{
|
2017-10-15 14:09:05 +02:00
|
|
|
if ((b >> shift) - (a >> shift) >= mask_bits - 1)
|
|
|
|
mask = (mask_t) -1;
|
|
|
|
else {
|
|
|
|
mask_t ma = mask_for (a);
|
|
|
|
mask_t mb = mask_for (b);
|
|
|
|
mask |= mb + (mb - ma) - (mb < ma);
|
|
|
|
}
|
2017-12-16 15:12:06 +01:00
|
|
|
return true;
|
2017-10-15 14:09:05 +02:00
|
|
|
}
|
2017-12-15 04:33:55 +01:00
|
|
|
|
|
|
|
template <typename T>
|
2018-12-16 20:08:10 +01:00
|
|
|
void add_array (const T *array, unsigned int count, unsigned int stride=sizeof(T))
|
2017-12-15 04:33:55 +01:00
|
|
|
{
|
|
|
|
for (unsigned int i = 0; i < count; i++)
|
|
|
|
{
|
|
|
|
add (*array);
|
|
|
|
array = (const T *) (stride + (const char *) array);
|
|
|
|
}
|
|
|
|
}
|
2017-12-13 22:12:20 +01:00
|
|
|
template <typename T>
|
2021-04-02 16:32:41 +02:00
|
|
|
void add_array (const hb_array_t<const T>& arr) { add_array (&arr, arr.len ()); }
|
|
|
|
template <typename T>
|
2018-12-16 20:08:10 +01:00
|
|
|
bool add_sorted_array (const T *array, unsigned int count, unsigned int stride=sizeof(T))
|
2017-12-13 22:12:20 +01:00
|
|
|
{
|
|
|
|
for (unsigned int i = 0; i < count; i++)
|
2017-12-15 04:33:55 +01:00
|
|
|
{
|
|
|
|
add (*array);
|
|
|
|
array = (const T *) (stride + (const char *) array);
|
|
|
|
}
|
|
|
|
return true;
|
2017-12-13 22:12:20 +01:00
|
|
|
}
|
2021-04-02 16:32:41 +02:00
|
|
|
template <typename T>
|
|
|
|
bool add_sorted_array (const hb_sorted_array_t<const T>& arr) { return add_sorted_array (&arr, arr.len ()); }
|
2017-10-15 14:09:05 +02:00
|
|
|
|
2018-12-16 20:08:10 +01:00
|
|
|
bool may_have (hb_codepoint_t g) const
|
2022-05-29 14:33:34 +02:00
|
|
|
{ return mask & mask_for (g); }
|
2017-10-15 14:09:05 +02:00
|
|
|
|
|
|
|
private:
|
|
|
|
|
2018-12-16 20:08:10 +01:00
|
|
|
static mask_t mask_for (hb_codepoint_t g)
|
|
|
|
{ return ((mask_t) 1) << ((g >> shift) & (mask_bits - 1)); }
|
2017-10-15 14:09:05 +02:00
|
|
|
mask_t mask;
|
|
|
|
};
|
|
|
|
|
|
|
|
template <typename head_t, typename tail_t>
|
|
|
|
struct hb_set_digest_combiner_t
|
|
|
|
{
|
2018-12-17 19:01:01 +01:00
|
|
|
void init ()
|
2018-12-16 20:08:10 +01:00
|
|
|
{
|
2017-10-15 14:09:05 +02:00
|
|
|
head.init ();
|
|
|
|
tail.init ();
|
|
|
|
}
|
|
|
|
|
2018-12-16 20:08:10 +01:00
|
|
|
void add (hb_codepoint_t g)
|
|
|
|
{
|
2017-10-15 14:09:05 +02:00
|
|
|
head.add (g);
|
|
|
|
tail.add (g);
|
|
|
|
}
|
|
|
|
|
2018-12-16 20:08:10 +01:00
|
|
|
bool add_range (hb_codepoint_t a, hb_codepoint_t b)
|
|
|
|
{
|
2017-10-15 14:09:05 +02:00
|
|
|
head.add_range (a, b);
|
|
|
|
tail.add_range (a, b);
|
2017-12-16 15:12:06 +01:00
|
|
|
return true;
|
2017-10-15 14:09:05 +02:00
|
|
|
}
|
2017-12-13 22:12:20 +01:00
|
|
|
template <typename T>
|
2018-12-16 20:08:10 +01:00
|
|
|
void add_array (const T *array, unsigned int count, unsigned int stride=sizeof(T))
|
2017-12-15 04:33:55 +01:00
|
|
|
{
|
|
|
|
head.add_array (array, count, stride);
|
|
|
|
tail.add_array (array, count, stride);
|
|
|
|
}
|
|
|
|
template <typename T>
|
2021-04-02 16:32:41 +02:00
|
|
|
void add_array (const hb_array_t<const T>& arr) { add_array (&arr, arr.len ()); }
|
|
|
|
template <typename T>
|
2018-12-16 20:08:10 +01:00
|
|
|
bool add_sorted_array (const T *array, unsigned int count, unsigned int stride=sizeof(T))
|
2017-12-13 22:12:20 +01:00
|
|
|
{
|
2017-12-15 04:33:55 +01:00
|
|
|
head.add_sorted_array (array, count, stride);
|
|
|
|
tail.add_sorted_array (array, count, stride);
|
|
|
|
return true;
|
2017-12-13 22:12:20 +01:00
|
|
|
}
|
2021-04-02 16:32:41 +02:00
|
|
|
template <typename T>
|
|
|
|
bool add_sorted_array (const hb_sorted_array_t<const T>& arr) { return add_sorted_array (&arr, arr.len ()); }
|
2017-10-15 14:09:05 +02:00
|
|
|
|
2018-12-16 20:08:10 +01:00
|
|
|
bool may_have (hb_codepoint_t g) const
|
|
|
|
{
|
2017-10-15 14:09:05 +02:00
|
|
|
return head.may_have (g) && tail.may_have (g);
|
|
|
|
}
|
|
|
|
|
|
|
|
private:
|
|
|
|
head_t head;
|
|
|
|
tail_t tail;
|
|
|
|
};
|
|
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
* hb_set_digest_t
|
|
|
|
*
|
|
|
|
* This is a combination of digests that performs "best".
|
|
|
|
* There is not much science to this: it's a result of intuition
|
|
|
|
* and testing.
|
|
|
|
*/
|
2021-09-21 20:21:02 +02:00
|
|
|
using hb_set_digest_t =
|
2017-10-15 14:09:05 +02:00
|
|
|
hb_set_digest_combiner_t
|
|
|
|
<
|
2022-06-08 19:37:12 +02:00
|
|
|
hb_set_digest_bits_pattern_t<unsigned long, 4>,
|
2021-09-21 20:21:02 +02:00
|
|
|
hb_set_digest_combiner_t
|
|
|
|
<
|
2022-06-08 19:37:12 +02:00
|
|
|
hb_set_digest_bits_pattern_t<unsigned long, 0>,
|
|
|
|
hb_set_digest_bits_pattern_t<unsigned long, 9>
|
2021-09-21 20:21:02 +02:00
|
|
|
>
|
2017-10-15 14:09:05 +02:00
|
|
|
>
|
2021-09-21 20:21:02 +02:00
|
|
|
;
|
2017-10-15 14:09:05 +02:00
|
|
|
|
|
|
|
|
2018-08-26 07:36:36 +02:00
|
|
|
#endif /* HB_SET_DIGEST_HH */
|