1246 lines
31 KiB
C++
1246 lines
31 KiB
C++
/*
|
||
* Copyright © 2009,2010 Red Hat, Inc.
|
||
* Copyright © 2011,2012 Google, Inc.
|
||
*
|
||
* This is part of HarfBuzz, a text shaping library.
|
||
*
|
||
* Permission is hereby granted, without written agreement and without
|
||
* license or royalty fees, to use, copy, modify, and distribute this
|
||
* software and its documentation for any purpose, provided that the
|
||
* above copyright notice and the following two paragraphs appear in
|
||
* all copies of this software.
|
||
*
|
||
* IN NO EVENT SHALL THE COPYRIGHT HOLDER BE LIABLE TO ANY PARTY FOR
|
||
* DIRECT, INDIRECT, SPECIAL, INCIDENTAL, OR CONSEQUENTIAL DAMAGES
|
||
* ARISING OUT OF THE USE OF THIS SOFTWARE AND ITS DOCUMENTATION, EVEN
|
||
* IF THE COPYRIGHT HOLDER HAS BEEN ADVISED OF THE POSSIBILITY OF SUCH
|
||
* DAMAGE.
|
||
*
|
||
* THE COPYRIGHT HOLDER SPECIFICALLY DISCLAIMS ANY WARRANTIES, INCLUDING,
|
||
* BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND
|
||
* FITNESS FOR A PARTICULAR PURPOSE. THE SOFTWARE PROVIDED HEREUNDER IS
|
||
* ON AN "AS IS" BASIS, AND THE COPYRIGHT HOLDER HAS NO OBLIGATION TO
|
||
* PROVIDE MAINTENANCE, SUPPORT, UPDATES, ENHANCEMENTS, OR MODIFICATIONS.
|
||
*
|
||
* Red Hat Author(s): Behdad Esfahbod
|
||
* Google Author(s): Behdad Esfahbod
|
||
*/
|
||
|
||
#include "hb.hh"
|
||
#include "hb-machinery.hh"
|
||
|
||
#if !defined(HB_NO_SETLOCALE) && (!defined(HAVE_NEWLOCALE) || !defined(HAVE_USELOCALE))
|
||
#define HB_NO_SETLOCALE 1
|
||
#endif
|
||
|
||
#ifndef HB_NO_SETLOCALE
|
||
|
||
#include <locale.h>
|
||
#ifdef HAVE_XLOCALE_H
|
||
#include <xlocale.h> // Needed on BSD/OS X for uselocale
|
||
#endif
|
||
|
||
#ifdef WIN32
|
||
#define hb_locale_t _locale_t
|
||
#else
|
||
#define hb_locale_t locale_t
|
||
#endif
|
||
#define hb_setlocale setlocale
|
||
#define hb_uselocale uselocale
|
||
|
||
#else
|
||
|
||
#define hb_locale_t void *
|
||
#define hb_setlocale(Category, Locale) "C"
|
||
#define hb_uselocale(Locale) ((hb_locale_t) 0)
|
||
|
||
#endif
|
||
|
||
/**
|
||
* SECTION:hb-common
|
||
* @title: hb-common
|
||
* @short_description: Common data types
|
||
* @include: hb.h
|
||
*
|
||
* Common data types used across HarfBuzz are defined here.
|
||
**/
|
||
|
||
|
||
/* hb_options_t */
|
||
|
||
hb_atomic_int_t _hb_options;
|
||
|
||
void
|
||
_hb_options_init ()
|
||
{
|
||
hb_options_union_t u;
|
||
u.i = 0;
|
||
u.opts.initialized = true;
|
||
|
||
const char *c = getenv ("HB_OPTIONS");
|
||
if (c)
|
||
{
|
||
while (*c)
|
||
{
|
||
const char *p = strchr (c, ':');
|
||
if (!p)
|
||
p = c + strlen (c);
|
||
|
||
#define OPTION(name, symbol) \
|
||
if (0 == strncmp (c, name, p - c) && strlen (name) == static_cast<size_t>(p - c)) do { u.opts.symbol = true; } while (0)
|
||
|
||
OPTION ("uniscribe-bug-compatible", uniscribe_bug_compatible);
|
||
|
||
#undef OPTION
|
||
|
||
c = *p ? p + 1 : p;
|
||
}
|
||
|
||
}
|
||
|
||
/* This is idempotent and threadsafe. */
|
||
_hb_options = u.i;
|
||
}
|
||
|
||
|
||
/* hb_tag_t */
|
||
|
||
/**
|
||
* hb_tag_from_string:
|
||
* @str: (array length=len) (element-type uint8_t): String to convert
|
||
* @len: Length of @str, or -1 if it is `NULL`-terminated
|
||
*
|
||
* Converts a string into an #hb_tag_t. Valid tags
|
||
* are four characters. Shorter input strings will be
|
||
* padded with spaces. Longer input strings will be
|
||
* truncated.
|
||
*
|
||
* Return value: The #hb_tag_t corresponding to @str
|
||
*
|
||
* Since: 0.9.2
|
||
**/
|
||
hb_tag_t
|
||
hb_tag_from_string (const char *str, int len)
|
||
{
|
||
char tag[4];
|
||
unsigned int i;
|
||
|
||
if (!str || !len || !*str)
|
||
return HB_TAG_NONE;
|
||
|
||
if (len < 0 || len > 4)
|
||
len = 4;
|
||
for (i = 0; i < (unsigned) len && str[i]; i++)
|
||
tag[i] = str[i];
|
||
for (; i < 4; i++)
|
||
tag[i] = ' ';
|
||
|
||
return HB_TAG (tag[0], tag[1], tag[2], tag[3]);
|
||
}
|
||
|
||
/**
|
||
* hb_tag_to_string:
|
||
* @tag: #hb_tag_t to convert
|
||
* @buf: (out caller-allocates) (array fixed-size=4) (element-type uint8_t): Converted string
|
||
*
|
||
* Converts an #hb_tag_t to a string and returns it in @buf.
|
||
* Strings will be four characters long.
|
||
*
|
||
* Since: 0.9.5
|
||
**/
|
||
void
|
||
hb_tag_to_string (hb_tag_t tag, char *buf)
|
||
{
|
||
buf[0] = (char) (uint8_t) (tag >> 24);
|
||
buf[1] = (char) (uint8_t) (tag >> 16);
|
||
buf[2] = (char) (uint8_t) (tag >> 8);
|
||
buf[3] = (char) (uint8_t) (tag >> 0);
|
||
}
|
||
|
||
|
||
/* hb_direction_t */
|
||
|
||
static const char direction_strings[][4] = {
|
||
"ltr",
|
||
"rtl",
|
||
"ttb",
|
||
"btt"
|
||
};
|
||
|
||
/**
|
||
* hb_direction_from_string:
|
||
* @str: (array length=len) (element-type uint8_t): String to convert
|
||
* @len: Length of @str, or -1 if it is `NULL`-terminated
|
||
*
|
||
* Converts a string to an #hb_direction_t.
|
||
*
|
||
* Matching is loose and applies only to the first letter. For
|
||
* examples, "LTR" and "left-to-right" will both return #HB_DIRECTION_LTR.
|
||
*
|
||
* Unmatched strings will return #HB_DIRECTION_INVALID.
|
||
*
|
||
* Return value: The #hb_direction_t matching @str
|
||
*
|
||
* Since: 0.9.2
|
||
**/
|
||
hb_direction_t
|
||
hb_direction_from_string (const char *str, int len)
|
||
{
|
||
if (unlikely (!str || !len || !*str))
|
||
return HB_DIRECTION_INVALID;
|
||
|
||
/* Lets match loosely: just match the first letter, such that
|
||
* all of "ltr", "left-to-right", etc work!
|
||
*/
|
||
char c = TOLOWER (str[0]);
|
||
for (unsigned int i = 0; i < ARRAY_LENGTH (direction_strings); i++)
|
||
if (c == direction_strings[i][0])
|
||
return (hb_direction_t) (HB_DIRECTION_LTR + i);
|
||
|
||
return HB_DIRECTION_INVALID;
|
||
}
|
||
|
||
/**
|
||
* hb_direction_to_string:
|
||
* @direction: The #hb_direction_t to convert
|
||
*
|
||
* Converts an #hb_direction_t to a string.
|
||
*
|
||
* Return value: (transfer none): The string corresponding to @direction
|
||
*
|
||
* Since: 0.9.2
|
||
**/
|
||
const char *
|
||
hb_direction_to_string (hb_direction_t direction)
|
||
{
|
||
if (likely ((unsigned int) (direction - HB_DIRECTION_LTR)
|
||
< ARRAY_LENGTH (direction_strings)))
|
||
return direction_strings[direction - HB_DIRECTION_LTR];
|
||
|
||
return "invalid";
|
||
}
|
||
|
||
|
||
/* hb_language_t */
|
||
|
||
struct hb_language_impl_t {
|
||
const char s[1];
|
||
};
|
||
|
||
static const char canon_map[256] = {
|
||
0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
|
||
0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
|
||
0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, '-', 0, 0,
|
||
'0', '1', '2', '3', '4', '5', '6', '7', '8', '9', 0, 0, 0, 0, 0, 0,
|
||
0, 'a', 'b', 'c', 'd', 'e', 'f', 'g', 'h', 'i', 'j', 'k', 'l', 'm', 'n', 'o',
|
||
'p', 'q', 'r', 's', 't', 'u', 'v', 'w', 'x', 'y', 'z', 0, 0, 0, 0, '-',
|
||
0, 'a', 'b', 'c', 'd', 'e', 'f', 'g', 'h', 'i', 'j', 'k', 'l', 'm', 'n', 'o',
|
||
'p', 'q', 'r', 's', 't', 'u', 'v', 'w', 'x', 'y', 'z', 0, 0, 0, 0, 0
|
||
};
|
||
|
||
static bool
|
||
lang_equal (hb_language_t v1,
|
||
const void *v2)
|
||
{
|
||
const unsigned char *p1 = (const unsigned char *) v1;
|
||
const unsigned char *p2 = (const unsigned char *) v2;
|
||
|
||
while (*p1 && *p1 == canon_map[*p2]) {
|
||
p1++;
|
||
p2++;
|
||
}
|
||
|
||
return *p1 == canon_map[*p2];
|
||
}
|
||
|
||
#if 0
|
||
static unsigned int
|
||
lang_hash (const void *key)
|
||
{
|
||
const unsigned char *p = key;
|
||
unsigned int h = 0;
|
||
while (canon_map[*p])
|
||
{
|
||
h = (h << 5) - h + canon_map[*p];
|
||
p++;
|
||
}
|
||
|
||
return h;
|
||
}
|
||
#endif
|
||
|
||
|
||
struct hb_language_item_t {
|
||
|
||
struct hb_language_item_t *next;
|
||
hb_language_t lang;
|
||
|
||
bool operator == (const char *s) const
|
||
{ return lang_equal (lang, s); }
|
||
|
||
hb_language_item_t & operator = (const char *s)
|
||
{
|
||
/* We can't call strdup(), because we allow custom allocators. */
|
||
size_t len = strlen(s) + 1;
|
||
lang = (hb_language_t) hb_malloc(len);
|
||
if (likely (lang))
|
||
{
|
||
memcpy((unsigned char *) lang, s, len);
|
||
for (unsigned char *p = (unsigned char *) lang; *p; p++)
|
||
*p = canon_map[*p];
|
||
}
|
||
|
||
return *this;
|
||
}
|
||
|
||
void fini () { hb_free ((void *) lang); }
|
||
};
|
||
|
||
|
||
/* Thread-safe lockfree language list */
|
||
|
||
static hb_atomic_ptr_t <hb_language_item_t> langs;
|
||
|
||
static inline void
|
||
free_langs ()
|
||
{
|
||
retry:
|
||
hb_language_item_t *first_lang = langs;
|
||
if (unlikely (!langs.cmpexch (first_lang, nullptr)))
|
||
goto retry;
|
||
|
||
while (first_lang) {
|
||
hb_language_item_t *next = first_lang->next;
|
||
first_lang->fini ();
|
||
hb_free (first_lang);
|
||
first_lang = next;
|
||
}
|
||
}
|
||
|
||
static hb_language_item_t *
|
||
lang_find_or_insert (const char *key)
|
||
{
|
||
retry:
|
||
hb_language_item_t *first_lang = langs;
|
||
|
||
for (hb_language_item_t *lang = first_lang; lang; lang = lang->next)
|
||
if (*lang == key)
|
||
return lang;
|
||
|
||
/* Not found; allocate one. */
|
||
hb_language_item_t *lang = (hb_language_item_t *) hb_calloc (1, sizeof (hb_language_item_t));
|
||
if (unlikely (!lang))
|
||
return nullptr;
|
||
lang->next = first_lang;
|
||
*lang = key;
|
||
if (unlikely (!lang->lang))
|
||
{
|
||
hb_free (lang);
|
||
return nullptr;
|
||
}
|
||
|
||
if (unlikely (!langs.cmpexch (first_lang, lang)))
|
||
{
|
||
lang->fini ();
|
||
hb_free (lang);
|
||
goto retry;
|
||
}
|
||
|
||
if (!first_lang)
|
||
hb_atexit (free_langs); /* First person registers atexit() callback. */
|
||
|
||
return lang;
|
||
}
|
||
|
||
|
||
/**
|
||
* hb_language_from_string:
|
||
* @str: (array length=len) (element-type uint8_t): a string representing
|
||
* a BCP 47 language tag
|
||
* @len: length of the @str, or -1 if it is `NULL`-terminated.
|
||
*
|
||
* Converts @str representing a BCP 47 language tag to the corresponding
|
||
* #hb_language_t.
|
||
*
|
||
* Return value: (transfer none):
|
||
* The #hb_language_t corresponding to the BCP 47 language tag.
|
||
*
|
||
* Since: 0.9.2
|
||
**/
|
||
hb_language_t
|
||
hb_language_from_string (const char *str, int len)
|
||
{
|
||
if (!str || !len || !*str)
|
||
return HB_LANGUAGE_INVALID;
|
||
|
||
hb_language_item_t *item = nullptr;
|
||
if (len >= 0)
|
||
{
|
||
/* NUL-terminate it. */
|
||
char strbuf[64];
|
||
len = hb_min (len, (int) sizeof (strbuf) - 1);
|
||
memcpy (strbuf, str, len);
|
||
strbuf[len] = '\0';
|
||
item = lang_find_or_insert (strbuf);
|
||
}
|
||
else
|
||
item = lang_find_or_insert (str);
|
||
|
||
return likely (item) ? item->lang : HB_LANGUAGE_INVALID;
|
||
}
|
||
|
||
/**
|
||
* hb_language_to_string:
|
||
* @language: The #hb_language_t to convert
|
||
*
|
||
* Converts an #hb_language_t to a string.
|
||
*
|
||
* Return value: (transfer none):
|
||
* A `NULL`-terminated string representing the @language. Must not be freed by
|
||
* the caller.
|
||
*
|
||
* Since: 0.9.2
|
||
**/
|
||
const char *
|
||
hb_language_to_string (hb_language_t language)
|
||
{
|
||
if (unlikely (!language)) return nullptr;
|
||
|
||
return language->s;
|
||
}
|
||
|
||
/**
|
||
* hb_language_get_default:
|
||
*
|
||
* Fetch the default language from current locale.
|
||
*
|
||
* <note>Note that the first time this function is called, it calls
|
||
* "setlocale (LC_CTYPE, nullptr)" to fetch current locale. The underlying
|
||
* setlocale function is, in many implementations, NOT threadsafe. To avoid
|
||
* problems, call this function once before multiple threads can call it.
|
||
* This function is only used from hb_buffer_guess_segment_properties() by
|
||
* HarfBuzz itself.</note>
|
||
*
|
||
* Return value: (transfer none): The default language of the locale as
|
||
* an #hb_language_t
|
||
*
|
||
* Since: 0.9.2
|
||
**/
|
||
hb_language_t
|
||
hb_language_get_default ()
|
||
{
|
||
static hb_atomic_ptr_t <hb_language_t> default_language;
|
||
|
||
hb_language_t language = default_language;
|
||
if (unlikely (language == HB_LANGUAGE_INVALID))
|
||
{
|
||
language = hb_language_from_string (hb_setlocale (LC_CTYPE, nullptr), -1);
|
||
(void) default_language.cmpexch (HB_LANGUAGE_INVALID, language);
|
||
}
|
||
|
||
return language;
|
||
}
|
||
|
||
/**
|
||
* hb_language_matches:
|
||
* @language: The #hb_language_t to work on
|
||
* @specific: Another #hb_language_t
|
||
*
|
||
* Check whether a second language tag is the same or a more
|
||
* specific version of the provided language tag. For example,
|
||
* "fa_IR.utf8" is a more specific tag for "fa" or for "fa_IR".
|
||
*
|
||
* Return value: `true` if languages match, `false` otherwise.
|
||
*
|
||
* Since: 5.0.0
|
||
**/
|
||
hb_bool_t
|
||
hb_language_matches (hb_language_t language,
|
||
hb_language_t specific)
|
||
{
|
||
if (language == specific) return true;
|
||
if (!language || !specific) return false;
|
||
|
||
const char *l = language->s;
|
||
const char *s = specific->s;
|
||
unsigned ll = strlen (l);
|
||
unsigned sl = strlen (s);
|
||
|
||
if (ll > sl)
|
||
return false;
|
||
|
||
return strncmp (l, s, ll) == 0 &&
|
||
(s[ll] == '\0' || s[ll] == '-');
|
||
}
|
||
|
||
|
||
/* hb_script_t */
|
||
|
||
/**
|
||
* hb_script_from_iso15924_tag:
|
||
* @tag: an #hb_tag_t representing an ISO 15924 tag.
|
||
*
|
||
* Converts an ISO 15924 script tag to a corresponding #hb_script_t.
|
||
*
|
||
* Return value:
|
||
* An #hb_script_t corresponding to the ISO 15924 tag.
|
||
*
|
||
* Since: 0.9.2
|
||
**/
|
||
hb_script_t
|
||
hb_script_from_iso15924_tag (hb_tag_t tag)
|
||
{
|
||
if (unlikely (tag == HB_TAG_NONE))
|
||
return HB_SCRIPT_INVALID;
|
||
|
||
/* Be lenient, adjust case (one capital letter followed by three small letters) */
|
||
tag = (tag & 0xDFDFDFDFu) | 0x00202020u;
|
||
|
||
switch (tag) {
|
||
|
||
/* These graduated from the 'Q' private-area codes, but
|
||
* the old code is still aliased by Unicode, and the Qaai
|
||
* one in use by ICU. */
|
||
case HB_TAG('Q','a','a','i'): return HB_SCRIPT_INHERITED;
|
||
case HB_TAG('Q','a','a','c'): return HB_SCRIPT_COPTIC;
|
||
|
||
/* Script variants from https://unicode.org/iso15924/ */
|
||
case HB_TAG('A','r','a','n'): return HB_SCRIPT_ARABIC;
|
||
case HB_TAG('C','y','r','s'): return HB_SCRIPT_CYRILLIC;
|
||
case HB_TAG('G','e','o','k'): return HB_SCRIPT_GEORGIAN;
|
||
case HB_TAG('H','a','n','s'): return HB_SCRIPT_HAN;
|
||
case HB_TAG('H','a','n','t'): return HB_SCRIPT_HAN;
|
||
case HB_TAG('J','a','m','o'): return HB_SCRIPT_HANGUL;
|
||
case HB_TAG('L','a','t','f'): return HB_SCRIPT_LATIN;
|
||
case HB_TAG('L','a','t','g'): return HB_SCRIPT_LATIN;
|
||
case HB_TAG('S','y','r','e'): return HB_SCRIPT_SYRIAC;
|
||
case HB_TAG('S','y','r','j'): return HB_SCRIPT_SYRIAC;
|
||
case HB_TAG('S','y','r','n'): return HB_SCRIPT_SYRIAC;
|
||
}
|
||
|
||
/* If it looks right, just use the tag as a script */
|
||
if (((uint32_t) tag & 0xE0E0E0E0u) == 0x40606060u)
|
||
return (hb_script_t) tag;
|
||
|
||
/* Otherwise, return unknown */
|
||
return HB_SCRIPT_UNKNOWN;
|
||
}
|
||
|
||
/**
|
||
* hb_script_from_string:
|
||
* @str: (array length=len) (element-type uint8_t): a string representing an
|
||
* ISO 15924 tag.
|
||
* @len: length of the @str, or -1 if it is `NULL`-terminated.
|
||
*
|
||
* Converts a string @str representing an ISO 15924 script tag to a
|
||
* corresponding #hb_script_t. Shorthand for hb_tag_from_string() then
|
||
* hb_script_from_iso15924_tag().
|
||
*
|
||
* Return value:
|
||
* An #hb_script_t corresponding to the ISO 15924 tag.
|
||
*
|
||
* Since: 0.9.2
|
||
**/
|
||
hb_script_t
|
||
hb_script_from_string (const char *str, int len)
|
||
{
|
||
return hb_script_from_iso15924_tag (hb_tag_from_string (str, len));
|
||
}
|
||
|
||
/**
|
||
* hb_script_to_iso15924_tag:
|
||
* @script: an #hb_script_t to convert.
|
||
*
|
||
* Converts an #hb_script_t to a corresponding ISO 15924 script tag.
|
||
*
|
||
* Return value:
|
||
* An #hb_tag_t representing an ISO 15924 script tag.
|
||
*
|
||
* Since: 0.9.2
|
||
**/
|
||
hb_tag_t
|
||
hb_script_to_iso15924_tag (hb_script_t script)
|
||
{
|
||
return (hb_tag_t) script;
|
||
}
|
||
|
||
/**
|
||
* hb_script_get_horizontal_direction:
|
||
* @script: The #hb_script_t to query
|
||
*
|
||
* Fetches the #hb_direction_t of a script when it is
|
||
* set horizontally. All right-to-left scripts will return
|
||
* #HB_DIRECTION_RTL. All left-to-right scripts will return
|
||
* #HB_DIRECTION_LTR. Scripts that can be written either
|
||
* horizontally or vertically will return #HB_DIRECTION_INVALID.
|
||
* Unknown scripts will return #HB_DIRECTION_LTR.
|
||
*
|
||
* Return value: The horizontal #hb_direction_t of @script
|
||
*
|
||
* Since: 0.9.2
|
||
**/
|
||
hb_direction_t
|
||
hb_script_get_horizontal_direction (hb_script_t script)
|
||
{
|
||
/* https://docs.google.com/spreadsheets/d/1Y90M0Ie3MUJ6UVCRDOypOtijlMDLNNyyLk36T6iMu0o */
|
||
switch ((hb_tag_t) script)
|
||
{
|
||
/* Unicode-1.1 additions */
|
||
case HB_SCRIPT_ARABIC:
|
||
case HB_SCRIPT_HEBREW:
|
||
|
||
/* Unicode-3.0 additions */
|
||
case HB_SCRIPT_SYRIAC:
|
||
case HB_SCRIPT_THAANA:
|
||
|
||
/* Unicode-4.0 additions */
|
||
case HB_SCRIPT_CYPRIOT:
|
||
|
||
/* Unicode-4.1 additions */
|
||
case HB_SCRIPT_KHAROSHTHI:
|
||
|
||
/* Unicode-5.0 additions */
|
||
case HB_SCRIPT_PHOENICIAN:
|
||
case HB_SCRIPT_NKO:
|
||
|
||
/* Unicode-5.1 additions */
|
||
case HB_SCRIPT_LYDIAN:
|
||
|
||
/* Unicode-5.2 additions */
|
||
case HB_SCRIPT_AVESTAN:
|
||
case HB_SCRIPT_IMPERIAL_ARAMAIC:
|
||
case HB_SCRIPT_INSCRIPTIONAL_PAHLAVI:
|
||
case HB_SCRIPT_INSCRIPTIONAL_PARTHIAN:
|
||
case HB_SCRIPT_OLD_SOUTH_ARABIAN:
|
||
case HB_SCRIPT_OLD_TURKIC:
|
||
case HB_SCRIPT_SAMARITAN:
|
||
|
||
/* Unicode-6.0 additions */
|
||
case HB_SCRIPT_MANDAIC:
|
||
|
||
/* Unicode-6.1 additions */
|
||
case HB_SCRIPT_MEROITIC_CURSIVE:
|
||
case HB_SCRIPT_MEROITIC_HIEROGLYPHS:
|
||
|
||
/* Unicode-7.0 additions */
|
||
case HB_SCRIPT_MANICHAEAN:
|
||
case HB_SCRIPT_MENDE_KIKAKUI:
|
||
case HB_SCRIPT_NABATAEAN:
|
||
case HB_SCRIPT_OLD_NORTH_ARABIAN:
|
||
case HB_SCRIPT_PALMYRENE:
|
||
case HB_SCRIPT_PSALTER_PAHLAVI:
|
||
|
||
/* Unicode-8.0 additions */
|
||
case HB_SCRIPT_HATRAN:
|
||
|
||
/* Unicode-9.0 additions */
|
||
case HB_SCRIPT_ADLAM:
|
||
|
||
/* Unicode-11.0 additions */
|
||
case HB_SCRIPT_HANIFI_ROHINGYA:
|
||
case HB_SCRIPT_OLD_SOGDIAN:
|
||
case HB_SCRIPT_SOGDIAN:
|
||
|
||
/* Unicode-12.0 additions */
|
||
case HB_SCRIPT_ELYMAIC:
|
||
|
||
/* Unicode-13.0 additions */
|
||
case HB_SCRIPT_CHORASMIAN:
|
||
case HB_SCRIPT_YEZIDI:
|
||
|
||
/* Unicode-14.0 additions */
|
||
case HB_SCRIPT_OLD_UYGHUR:
|
||
|
||
return HB_DIRECTION_RTL;
|
||
|
||
|
||
/* https://github.com/harfbuzz/harfbuzz/issues/1000 */
|
||
case HB_SCRIPT_OLD_HUNGARIAN:
|
||
case HB_SCRIPT_OLD_ITALIC:
|
||
case HB_SCRIPT_RUNIC:
|
||
|
||
return HB_DIRECTION_INVALID;
|
||
}
|
||
|
||
return HB_DIRECTION_LTR;
|
||
}
|
||
|
||
|
||
/* hb_version */
|
||
|
||
|
||
/**
|
||
* SECTION:hb-version
|
||
* @title: hb-version
|
||
* @short_description: Information about the version of HarfBuzz in use
|
||
* @include: hb.h
|
||
*
|
||
* These functions and macros allow accessing version of the HarfBuzz
|
||
* library used at compile- as well as run-time, and to direct code
|
||
* conditionally based on those versions, again, at compile- or run-time.
|
||
**/
|
||
|
||
|
||
/**
|
||
* hb_version:
|
||
* @major: (out): Library major version component
|
||
* @minor: (out): Library minor version component
|
||
* @micro: (out): Library micro version component
|
||
*
|
||
* Returns library version as three integer components.
|
||
*
|
||
* Since: 0.9.2
|
||
**/
|
||
void
|
||
hb_version (unsigned int *major,
|
||
unsigned int *minor,
|
||
unsigned int *micro)
|
||
{
|
||
*major = HB_VERSION_MAJOR;
|
||
*minor = HB_VERSION_MINOR;
|
||
*micro = HB_VERSION_MICRO;
|
||
}
|
||
|
||
/**
|
||
* hb_version_string:
|
||
*
|
||
* Returns library version as a string with three components.
|
||
*
|
||
* Return value: Library version string
|
||
*
|
||
* Since: 0.9.2
|
||
**/
|
||
const char *
|
||
hb_version_string ()
|
||
{
|
||
return HB_VERSION_STRING;
|
||
}
|
||
|
||
/**
|
||
* hb_version_atleast:
|
||
* @major: Library major version component
|
||
* @minor: Library minor version component
|
||
* @micro: Library micro version component
|
||
*
|
||
* Tests the library version against a minimum value,
|
||
* as three integer components.
|
||
*
|
||
* Return value: `true` if the library is equal to or greater than
|
||
* the test value, `false` otherwise
|
||
*
|
||
* Since: 0.9.30
|
||
**/
|
||
hb_bool_t
|
||
hb_version_atleast (unsigned int major,
|
||
unsigned int minor,
|
||
unsigned int micro)
|
||
{
|
||
return HB_VERSION_ATLEAST (major, minor, micro);
|
||
}
|
||
|
||
|
||
|
||
/* hb_feature_t and hb_variation_t */
|
||
|
||
static bool
|
||
parse_space (const char **pp, const char *end)
|
||
{
|
||
while (*pp < end && ISSPACE (**pp))
|
||
(*pp)++;
|
||
return true;
|
||
}
|
||
|
||
static bool
|
||
parse_char (const char **pp, const char *end, char c)
|
||
{
|
||
parse_space (pp, end);
|
||
|
||
if (*pp == end || **pp != c)
|
||
return false;
|
||
|
||
(*pp)++;
|
||
return true;
|
||
}
|
||
|
||
static bool
|
||
parse_uint (const char **pp, const char *end, unsigned int *pv)
|
||
{
|
||
/* Intentionally use hb_parse_int inside instead of hb_parse_uint,
|
||
* such that -1 turns into "big number"... */
|
||
int v;
|
||
if (unlikely (!hb_parse_int (pp, end, &v))) return false;
|
||
|
||
*pv = v;
|
||
return true;
|
||
}
|
||
|
||
static bool
|
||
parse_uint32 (const char **pp, const char *end, uint32_t *pv)
|
||
{
|
||
/* Intentionally use hb_parse_int inside instead of hb_parse_uint,
|
||
* such that -1 turns into "big number"... */
|
||
int v;
|
||
if (unlikely (!hb_parse_int (pp, end, &v))) return false;
|
||
|
||
*pv = v;
|
||
return true;
|
||
}
|
||
|
||
static bool
|
||
parse_bool (const char **pp, const char *end, uint32_t *pv)
|
||
{
|
||
parse_space (pp, end);
|
||
|
||
const char *p = *pp;
|
||
while (*pp < end && ISALPHA(**pp))
|
||
(*pp)++;
|
||
|
||
/* CSS allows on/off as aliases 1/0. */
|
||
if (*pp - p == 2
|
||
&& TOLOWER (p[0]) == 'o'
|
||
&& TOLOWER (p[1]) == 'n')
|
||
*pv = 1;
|
||
else if (*pp - p == 3
|
||
&& TOLOWER (p[0]) == 'o'
|
||
&& TOLOWER (p[1]) == 'f'
|
||
&& TOLOWER (p[2]) == 'f')
|
||
*pv = 0;
|
||
else
|
||
return false;
|
||
|
||
return true;
|
||
}
|
||
|
||
/* hb_feature_t */
|
||
|
||
static bool
|
||
parse_feature_value_prefix (const char **pp, const char *end, hb_feature_t *feature)
|
||
{
|
||
if (parse_char (pp, end, '-'))
|
||
feature->value = 0;
|
||
else {
|
||
parse_char (pp, end, '+');
|
||
feature->value = 1;
|
||
}
|
||
|
||
return true;
|
||
}
|
||
|
||
static bool
|
||
parse_tag (const char **pp, const char *end, hb_tag_t *tag)
|
||
{
|
||
parse_space (pp, end);
|
||
|
||
char quote = 0;
|
||
|
||
if (*pp < end && (**pp == '\'' || **pp == '"'))
|
||
{
|
||
quote = **pp;
|
||
(*pp)++;
|
||
}
|
||
|
||
const char *p = *pp;
|
||
while (*pp < end && (ISALNUM(**pp) || **pp == '_'))
|
||
(*pp)++;
|
||
|
||
if (p == *pp || *pp - p > 4)
|
||
return false;
|
||
|
||
*tag = hb_tag_from_string (p, *pp - p);
|
||
|
||
if (quote)
|
||
{
|
||
/* CSS expects exactly four bytes. And we only allow quotations for
|
||
* CSS compatibility. So, enforce the length. */
|
||
if (*pp - p != 4)
|
||
return false;
|
||
if (*pp == end || **pp != quote)
|
||
return false;
|
||
(*pp)++;
|
||
}
|
||
|
||
return true;
|
||
}
|
||
|
||
static bool
|
||
parse_feature_indices (const char **pp, const char *end, hb_feature_t *feature)
|
||
{
|
||
parse_space (pp, end);
|
||
|
||
bool has_start;
|
||
|
||
feature->start = HB_FEATURE_GLOBAL_START;
|
||
feature->end = HB_FEATURE_GLOBAL_END;
|
||
|
||
if (!parse_char (pp, end, '['))
|
||
return true;
|
||
|
||
has_start = parse_uint (pp, end, &feature->start);
|
||
|
||
if (parse_char (pp, end, ':') || parse_char (pp, end, ';')) {
|
||
parse_uint (pp, end, &feature->end);
|
||
} else {
|
||
if (has_start)
|
||
feature->end = feature->start + 1;
|
||
}
|
||
|
||
return parse_char (pp, end, ']');
|
||
}
|
||
|
||
static bool
|
||
parse_feature_value_postfix (const char **pp, const char *end, hb_feature_t *feature)
|
||
{
|
||
bool had_equal = parse_char (pp, end, '=');
|
||
bool had_value = parse_uint32 (pp, end, &feature->value) ||
|
||
parse_bool (pp, end, &feature->value);
|
||
/* CSS doesn't use equal-sign between tag and value.
|
||
* If there was an equal-sign, then there *must* be a value.
|
||
* A value without an equal-sign is ok, but not required. */
|
||
return !had_equal || had_value;
|
||
}
|
||
|
||
static bool
|
||
parse_one_feature (const char **pp, const char *end, hb_feature_t *feature)
|
||
{
|
||
return parse_feature_value_prefix (pp, end, feature) &&
|
||
parse_tag (pp, end, &feature->tag) &&
|
||
parse_feature_indices (pp, end, feature) &&
|
||
parse_feature_value_postfix (pp, end, feature) &&
|
||
parse_space (pp, end) &&
|
||
*pp == end;
|
||
}
|
||
|
||
/**
|
||
* hb_feature_from_string:
|
||
* @str: (array length=len) (element-type uint8_t): a string to parse
|
||
* @len: length of @str, or -1 if string is `NULL` terminated
|
||
* @feature: (out): the #hb_feature_t to initialize with the parsed values
|
||
*
|
||
* Parses a string into a #hb_feature_t.
|
||
*
|
||
* The format for specifying feature strings follows. All valid CSS
|
||
* font-feature-settings values other than 'normal' and the global values are
|
||
* also accepted, though not documented below. CSS string escapes are not
|
||
* supported.
|
||
*
|
||
* The range indices refer to the positions between Unicode characters. The
|
||
* position before the first character is always 0.
|
||
*
|
||
* The format is Python-esque. Here is how it all works:
|
||
*
|
||
* <informaltable pgwide='1' align='left' frame='none'>
|
||
* <tgroup cols='5'>
|
||
* <thead>
|
||
* <row><entry>Syntax</entry> <entry>Value</entry> <entry>Start</entry> <entry>End</entry></row>
|
||
* </thead>
|
||
* <tbody>
|
||
* <row><entry>Setting value:</entry></row>
|
||
* <row><entry>kern</entry> <entry>1</entry> <entry>0</entry> <entry>∞</entry> <entry>Turn feature on</entry></row>
|
||
* <row><entry>+kern</entry> <entry>1</entry> <entry>0</entry> <entry>∞</entry> <entry>Turn feature on</entry></row>
|
||
* <row><entry>-kern</entry> <entry>0</entry> <entry>0</entry> <entry>∞</entry> <entry>Turn feature off</entry></row>
|
||
* <row><entry>kern=0</entry> <entry>0</entry> <entry>0</entry> <entry>∞</entry> <entry>Turn feature off</entry></row>
|
||
* <row><entry>kern=1</entry> <entry>1</entry> <entry>0</entry> <entry>∞</entry> <entry>Turn feature on</entry></row>
|
||
* <row><entry>aalt=2</entry> <entry>2</entry> <entry>0</entry> <entry>∞</entry> <entry>Choose 2nd alternate</entry></row>
|
||
* <row><entry>Setting index:</entry></row>
|
||
* <row><entry>kern[]</entry> <entry>1</entry> <entry>0</entry> <entry>∞</entry> <entry>Turn feature on</entry></row>
|
||
* <row><entry>kern[:]</entry> <entry>1</entry> <entry>0</entry> <entry>∞</entry> <entry>Turn feature on</entry></row>
|
||
* <row><entry>kern[5:]</entry> <entry>1</entry> <entry>5</entry> <entry>∞</entry> <entry>Turn feature on, partial</entry></row>
|
||
* <row><entry>kern[:5]</entry> <entry>1</entry> <entry>0</entry> <entry>5</entry> <entry>Turn feature on, partial</entry></row>
|
||
* <row><entry>kern[3:5]</entry> <entry>1</entry> <entry>3</entry> <entry>5</entry> <entry>Turn feature on, range</entry></row>
|
||
* <row><entry>kern[3]</entry> <entry>1</entry> <entry>3</entry> <entry>3+1</entry> <entry>Turn feature on, single char</entry></row>
|
||
* <row><entry>Mixing it all:</entry></row>
|
||
* <row><entry>aalt[3:5]=2</entry> <entry>2</entry> <entry>3</entry> <entry>5</entry> <entry>Turn 2nd alternate on for range</entry></row>
|
||
* </tbody>
|
||
* </tgroup>
|
||
* </informaltable>
|
||
*
|
||
* Return value:
|
||
* `true` if @str is successfully parsed, `false` otherwise
|
||
*
|
||
* Since: 0.9.5
|
||
**/
|
||
hb_bool_t
|
||
hb_feature_from_string (const char *str, int len,
|
||
hb_feature_t *feature)
|
||
{
|
||
hb_feature_t feat;
|
||
|
||
if (len < 0)
|
||
len = strlen (str);
|
||
|
||
if (likely (parse_one_feature (&str, str + len, &feat)))
|
||
{
|
||
if (feature)
|
||
*feature = feat;
|
||
return true;
|
||
}
|
||
|
||
if (feature)
|
||
memset (feature, 0, sizeof (*feature));
|
||
return false;
|
||
}
|
||
|
||
/**
|
||
* hb_feature_to_string:
|
||
* @feature: an #hb_feature_t to convert
|
||
* @buf: (array length=size) (out): output string
|
||
* @size: the allocated size of @buf
|
||
*
|
||
* Converts a #hb_feature_t into a `NULL`-terminated string in the format
|
||
* understood by hb_feature_from_string(). The client in responsible for
|
||
* allocating big enough size for @buf, 128 bytes is more than enough.
|
||
*
|
||
* Since: 0.9.5
|
||
**/
|
||
void
|
||
hb_feature_to_string (hb_feature_t *feature,
|
||
char *buf, unsigned int size)
|
||
{
|
||
if (unlikely (!size)) return;
|
||
|
||
char s[128];
|
||
unsigned int len = 0;
|
||
if (feature->value == 0)
|
||
s[len++] = '-';
|
||
hb_tag_to_string (feature->tag, s + len);
|
||
len += 4;
|
||
while (len && s[len - 1] == ' ')
|
||
len--;
|
||
if (feature->start != HB_FEATURE_GLOBAL_START || feature->end != HB_FEATURE_GLOBAL_END)
|
||
{
|
||
s[len++] = '[';
|
||
if (feature->start)
|
||
len += hb_max (0, snprintf (s + len, ARRAY_LENGTH (s) - len, "%u", feature->start));
|
||
if (feature->end != feature->start + 1) {
|
||
s[len++] = ':';
|
||
if (feature->end != HB_FEATURE_GLOBAL_END)
|
||
len += hb_max (0, snprintf (s + len, ARRAY_LENGTH (s) - len, "%u", feature->end));
|
||
}
|
||
s[len++] = ']';
|
||
}
|
||
if (feature->value > 1)
|
||
{
|
||
s[len++] = '=';
|
||
len += hb_max (0, snprintf (s + len, ARRAY_LENGTH (s) - len, "%u", feature->value));
|
||
}
|
||
assert (len < ARRAY_LENGTH (s));
|
||
len = hb_min (len, size - 1);
|
||
memcpy (buf, s, len);
|
||
buf[len] = '\0';
|
||
}
|
||
|
||
/* hb_variation_t */
|
||
|
||
static bool
|
||
parse_variation_value (const char **pp, const char *end, hb_variation_t *variation)
|
||
{
|
||
parse_char (pp, end, '='); /* Optional. */
|
||
double v;
|
||
if (unlikely (!hb_parse_double (pp, end, &v))) return false;
|
||
|
||
variation->value = v;
|
||
return true;
|
||
}
|
||
|
||
static bool
|
||
parse_one_variation (const char **pp, const char *end, hb_variation_t *variation)
|
||
{
|
||
return parse_tag (pp, end, &variation->tag) &&
|
||
parse_variation_value (pp, end, variation) &&
|
||
parse_space (pp, end) &&
|
||
*pp == end;
|
||
}
|
||
|
||
/**
|
||
* hb_variation_from_string:
|
||
* @str: (array length=len) (element-type uint8_t): a string to parse
|
||
* @len: length of @str, or -1 if string is `NULL` terminated
|
||
* @variation: (out): the #hb_variation_t to initialize with the parsed values
|
||
*
|
||
* Parses a string into a #hb_variation_t.
|
||
*
|
||
* The format for specifying variation settings follows. All valid CSS
|
||
* font-variation-settings values other than 'normal' and 'inherited' are also
|
||
* accepted, though, not documented below.
|
||
*
|
||
* The format is a tag, optionally followed by an equals sign, followed by a
|
||
* number. For example `wght=500`, or `slnt=-7.5`.
|
||
*
|
||
* Return value:
|
||
* `true` if @str is successfully parsed, `false` otherwise
|
||
*
|
||
* Since: 1.4.2
|
||
*/
|
||
hb_bool_t
|
||
hb_variation_from_string (const char *str, int len,
|
||
hb_variation_t *variation)
|
||
{
|
||
hb_variation_t var;
|
||
|
||
if (len < 0)
|
||
len = strlen (str);
|
||
|
||
if (likely (parse_one_variation (&str, str + len, &var)))
|
||
{
|
||
if (variation)
|
||
*variation = var;
|
||
return true;
|
||
}
|
||
|
||
if (variation)
|
||
memset (variation, 0, sizeof (*variation));
|
||
return false;
|
||
}
|
||
|
||
#ifndef HB_NO_SETLOCALE
|
||
|
||
static inline void free_static_C_locale ();
|
||
|
||
static struct hb_C_locale_lazy_loader_t : hb_lazy_loader_t<hb_remove_pointer<hb_locale_t>,
|
||
hb_C_locale_lazy_loader_t>
|
||
{
|
||
static hb_locale_t create ()
|
||
{
|
||
hb_locale_t l = newlocale (LC_ALL_MASK, "C", NULL);
|
||
if (!l)
|
||
return l;
|
||
|
||
hb_atexit (free_static_C_locale);
|
||
|
||
return l;
|
||
}
|
||
static void destroy (hb_locale_t l)
|
||
{
|
||
freelocale (l);
|
||
}
|
||
static hb_locale_t get_null ()
|
||
{
|
||
return (hb_locale_t) 0;
|
||
}
|
||
} static_C_locale;
|
||
|
||
static inline
|
||
void free_static_C_locale ()
|
||
{
|
||
static_C_locale.free_instance ();
|
||
}
|
||
|
||
static hb_locale_t
|
||
get_C_locale ()
|
||
{
|
||
return static_C_locale.get_unconst ();
|
||
}
|
||
|
||
#endif
|
||
|
||
/**
|
||
* hb_variation_to_string:
|
||
* @variation: an #hb_variation_t to convert
|
||
* @buf: (array length=size) (out caller-allocates): output string
|
||
* @size: the allocated size of @buf
|
||
*
|
||
* Converts an #hb_variation_t into a `NULL`-terminated string in the format
|
||
* understood by hb_variation_from_string(). The client in responsible for
|
||
* allocating big enough size for @buf, 128 bytes is more than enough.
|
||
*
|
||
* Since: 1.4.2
|
||
*/
|
||
void
|
||
hb_variation_to_string (hb_variation_t *variation,
|
||
char *buf, unsigned int size)
|
||
{
|
||
if (unlikely (!size)) return;
|
||
|
||
char s[128];
|
||
unsigned int len = 0;
|
||
hb_tag_to_string (variation->tag, s + len);
|
||
len += 4;
|
||
while (len && s[len - 1] == ' ')
|
||
len--;
|
||
s[len++] = '=';
|
||
|
||
hb_locale_t oldlocale HB_UNUSED;
|
||
oldlocale = hb_uselocale (get_C_locale ());
|
||
len += hb_max (0, snprintf (s + len, ARRAY_LENGTH (s) - len, "%g", (double) variation->value));
|
||
(void) hb_uselocale (oldlocale);
|
||
|
||
assert (len < ARRAY_LENGTH (s));
|
||
len = hb_min (len, size - 1);
|
||
memcpy (buf, s, len);
|
||
buf[len] = '\0';
|
||
}
|
||
|
||
/**
|
||
* hb_color_get_alpha:
|
||
* @color: an #hb_color_t we are interested in its channels.
|
||
*
|
||
* Fetches the alpha channel of the given @color.
|
||
*
|
||
* Return value: Alpha channel value
|
||
*
|
||
* Since: 2.1.0
|
||
*/
|
||
uint8_t
|
||
(hb_color_get_alpha) (hb_color_t color)
|
||
{
|
||
return hb_color_get_alpha (color);
|
||
}
|
||
|
||
/**
|
||
* hb_color_get_red:
|
||
* @color: an #hb_color_t we are interested in its channels.
|
||
*
|
||
* Fetches the red channel of the given @color.
|
||
*
|
||
* Return value: Red channel value
|
||
*
|
||
* Since: 2.1.0
|
||
*/
|
||
uint8_t
|
||
(hb_color_get_red) (hb_color_t color)
|
||
{
|
||
return hb_color_get_red (color);
|
||
}
|
||
|
||
/**
|
||
* hb_color_get_green:
|
||
* @color: an #hb_color_t we are interested in its channels.
|
||
*
|
||
* Fetches the green channel of the given @color.
|
||
*
|
||
* Return value: Green channel value
|
||
*
|
||
* Since: 2.1.0
|
||
*/
|
||
uint8_t
|
||
(hb_color_get_green) (hb_color_t color)
|
||
{
|
||
return hb_color_get_green (color);
|
||
}
|
||
|
||
/**
|
||
* hb_color_get_blue:
|
||
* @color: an #hb_color_t we are interested in its channels.
|
||
*
|
||
* Fetches the blue channel of the given @color.
|
||
*
|
||
* Return value: Blue channel value
|
||
*
|
||
* Since: 2.1.0
|
||
*/
|
||
uint8_t
|
||
(hb_color_get_blue) (hb_color_t color)
|
||
{
|
||
return hb_color_get_blue (color);
|
||
}
|
||
|
||
|
||
/* If there is no visibility control, then hb-static.cc will NOT
|
||
* define anything. Instead, we get it to define one set in here
|
||
* only, so only libharfbuzz.so defines them, not other libs. */
|
||
#ifdef HB_NO_VISIBILITY
|
||
#undef HB_NO_VISIBILITY
|
||
#include "hb-static.cc"
|
||
#define HB_NO_VISIBILITY 1
|
||
#endif
|