2010-05-21 14:43:49 +02:00
|
|
|
/*
|
2011-04-21 23:14:28 +02:00
|
|
|
* Copyright © 2009,2010 Red Hat, Inc.
|
|
|
|
* Copyright © 2011 Google, Inc.
|
2010-05-21 14:43:49 +02:00
|
|
|
*
|
|
|
|
* This is part of HarfBuzz, a text shaping library.
|
|
|
|
*
|
|
|
|
* Permission is hereby granted, without written agreement and without
|
|
|
|
* license or royalty fees, to use, copy, modify, and distribute this
|
|
|
|
* software and its documentation for any purpose, provided that the
|
|
|
|
* above copyright notice and the following two paragraphs appear in
|
|
|
|
* all copies of this software.
|
|
|
|
*
|
|
|
|
* IN NO EVENT SHALL THE COPYRIGHT HOLDER BE LIABLE TO ANY PARTY FOR
|
|
|
|
* DIRECT, INDIRECT, SPECIAL, INCIDENTAL, OR CONSEQUENTIAL DAMAGES
|
|
|
|
* ARISING OUT OF THE USE OF THIS SOFTWARE AND ITS DOCUMENTATION, EVEN
|
|
|
|
* IF THE COPYRIGHT HOLDER HAS BEEN ADVISED OF THE POSSIBILITY OF SUCH
|
|
|
|
* DAMAGE.
|
|
|
|
*
|
|
|
|
* THE COPYRIGHT HOLDER SPECIFICALLY DISCLAIMS ANY WARRANTIES, INCLUDING,
|
|
|
|
* BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND
|
|
|
|
* FITNESS FOR A PARTICULAR PURPOSE. THE SOFTWARE PROVIDED HEREUNDER IS
|
|
|
|
* ON AN "AS IS" BASIS, AND THE COPYRIGHT HOLDER HAS NO OBLIGATION TO
|
|
|
|
* PROVIDE MAINTENANCE, SUPPORT, UPDATES, ENHANCEMENTS, OR MODIFICATIONS.
|
|
|
|
*
|
|
|
|
* Red Hat Author(s): Behdad Esfahbod
|
2011-04-21 23:14:28 +02:00
|
|
|
* Google Author(s): Behdad Esfahbod
|
2010-05-21 14:43:49 +02:00
|
|
|
*/
|
|
|
|
|
2011-04-21 00:50:27 +02:00
|
|
|
#include "hb-private.hh"
|
2010-05-21 14:43:49 +02:00
|
|
|
|
2011-05-06 03:31:04 +02:00
|
|
|
#include "hb-version.h"
|
|
|
|
|
2011-05-05 21:14:04 +02:00
|
|
|
#include "hb-mutex-private.hh"
|
2011-05-05 21:28:37 +02:00
|
|
|
#include "hb-object-private.hh"
|
2011-05-05 21:14:04 +02:00
|
|
|
|
2011-05-06 06:04:28 +02:00
|
|
|
#include <locale.h>
|
|
|
|
|
2010-07-23 21:11:18 +02:00
|
|
|
|
|
|
|
|
2011-04-11 23:55:58 +02:00
|
|
|
/* hb_tag_t */
|
|
|
|
|
2010-05-21 14:43:49 +02:00
|
|
|
hb_tag_t
|
2011-08-26 09:18:53 +02:00
|
|
|
hb_tag_from_string (const char *s, int len)
|
2010-05-21 14:43:49 +02:00
|
|
|
{
|
|
|
|
char tag[4];
|
|
|
|
unsigned int i;
|
|
|
|
|
2011-08-26 09:18:53 +02:00
|
|
|
if (!s || !len || !*s)
|
2011-04-11 19:27:30 +02:00
|
|
|
return HB_TAG_NONE;
|
|
|
|
|
2011-08-26 09:18:53 +02:00
|
|
|
if (len < 0 || len > 4)
|
|
|
|
len = 4;
|
|
|
|
for (i = 0; i < (unsigned) len && s[i]; i++)
|
2010-05-21 14:43:49 +02:00
|
|
|
tag[i] = s[i];
|
|
|
|
for (; i < 4; i++)
|
|
|
|
tag[i] = ' ';
|
|
|
|
|
2011-04-11 19:12:37 +02:00
|
|
|
return HB_TAG_CHAR4 (tag);
|
2010-05-21 14:43:49 +02:00
|
|
|
}
|
2010-07-23 21:11:18 +02:00
|
|
|
|
|
|
|
|
2011-04-27 20:48:19 +02:00
|
|
|
/* hb_direction_t */
|
|
|
|
|
|
|
|
const char direction_strings[][4] = {
|
|
|
|
"ltr",
|
|
|
|
"rtl",
|
|
|
|
"ttb",
|
|
|
|
"btt"
|
|
|
|
};
|
|
|
|
|
|
|
|
hb_direction_t
|
2011-08-26 09:18:53 +02:00
|
|
|
hb_direction_from_string (const char *str, int len)
|
2011-04-27 20:48:19 +02:00
|
|
|
{
|
2011-08-26 09:18:53 +02:00
|
|
|
if (unlikely (!str || !len || !*str))
|
2011-04-27 20:48:19 +02:00
|
|
|
return HB_DIRECTION_INVALID;
|
|
|
|
|
|
|
|
/* Lets match loosely: just match the first letter, such that
|
|
|
|
* all of "ltr", "left-to-right", etc work!
|
|
|
|
*/
|
|
|
|
char c = TOLOWER (str[0]);
|
|
|
|
for (unsigned int i = 0; i < ARRAY_LENGTH (direction_strings); i++)
|
|
|
|
if (c == direction_strings[i][0])
|
|
|
|
return (hb_direction_t) i;
|
|
|
|
|
|
|
|
return HB_DIRECTION_INVALID;
|
|
|
|
}
|
|
|
|
|
|
|
|
const char *
|
|
|
|
hb_direction_to_string (hb_direction_t direction)
|
|
|
|
{
|
|
|
|
if (likely ((unsigned int) direction < ARRAY_LENGTH (direction_strings)))
|
|
|
|
return direction_strings[direction];
|
|
|
|
|
|
|
|
return "invalid";
|
|
|
|
}
|
|
|
|
|
|
|
|
|
2011-04-11 23:55:58 +02:00
|
|
|
/* hb_language_t */
|
|
|
|
|
2011-04-15 18:32:06 +02:00
|
|
|
struct _hb_language_t {
|
|
|
|
const char s[1];
|
|
|
|
};
|
|
|
|
|
2011-04-11 23:55:58 +02:00
|
|
|
static const char canon_map[256] = {
|
|
|
|
0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
|
|
|
|
0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
|
|
|
|
0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, '-', 0, 0,
|
|
|
|
'0', '1', '2', '3', '4', '5', '6', '7', '8', '9', 0, 0, 0, 0, 0, 0,
|
|
|
|
'-', 'a', 'b', 'c', 'd', 'e', 'f', 'g', 'h', 'i', 'j', 'k', 'l', 'm', 'n', 'o',
|
|
|
|
'p', 'q', 'r', 's', 't', 'u', 'v', 'w', 'x', 'y', 'z', 0, 0, 0, 0, '-',
|
|
|
|
0, 'a', 'b', 'c', 'd', 'e', 'f', 'g', 'h', 'i', 'j', 'k', 'l', 'm', 'n', 'o',
|
|
|
|
'p', 'q', 'r', 's', 't', 'u', 'v', 'w', 'x', 'y', 'z', 0, 0, 0, 0, 0
|
|
|
|
};
|
|
|
|
|
|
|
|
static hb_bool_t
|
|
|
|
lang_equal (const void *v1,
|
|
|
|
const void *v2)
|
|
|
|
{
|
2011-04-21 00:50:27 +02:00
|
|
|
const unsigned char *p1 = (const unsigned char *) v1;
|
|
|
|
const unsigned char *p2 = (const unsigned char *) v2;
|
2011-04-11 23:55:58 +02:00
|
|
|
|
|
|
|
while (canon_map[*p1] && canon_map[*p1] == canon_map[*p2])
|
|
|
|
{
|
|
|
|
p1++, p2++;
|
|
|
|
}
|
|
|
|
|
|
|
|
return (canon_map[*p1] == canon_map[*p2]);
|
|
|
|
}
|
|
|
|
|
|
|
|
#if 0
|
|
|
|
static unsigned int
|
|
|
|
lang_hash (const void *key)
|
|
|
|
{
|
|
|
|
const unsigned char *p = key;
|
|
|
|
unsigned int h = 0;
|
|
|
|
while (canon_map[*p])
|
|
|
|
{
|
|
|
|
h = (h << 5) - h + canon_map[*p];
|
|
|
|
p++;
|
|
|
|
}
|
|
|
|
|
|
|
|
return h;
|
|
|
|
}
|
|
|
|
#endif
|
|
|
|
|
|
|
|
|
2011-05-05 21:00:43 +02:00
|
|
|
struct hb_language_item_t {
|
|
|
|
|
|
|
|
hb_language_t lang;
|
|
|
|
|
|
|
|
inline bool operator == (const char *s) const {
|
|
|
|
return lang_equal (lang, s);
|
|
|
|
}
|
|
|
|
|
|
|
|
inline hb_language_item_t & operator = (const char *s) {
|
|
|
|
lang = (hb_language_t) strdup (s);
|
|
|
|
for (unsigned char *p = (unsigned char *) lang; *p; p++)
|
|
|
|
*p = canon_map[*p];
|
|
|
|
|
|
|
|
return *this;
|
|
|
|
}
|
|
|
|
|
|
|
|
void finish (void) { free (lang); }
|
|
|
|
};
|
|
|
|
|
2011-08-06 00:02:30 +02:00
|
|
|
static struct hb_static_lang_set_t : hb_lockable_set_t<hb_language_item_t, hb_static_mutex_t> {
|
|
|
|
~hb_static_lang_set_t (void) { this->finish (lock); }
|
|
|
|
hb_static_mutex_t lock;
|
|
|
|
} langs;
|
2011-05-05 21:14:04 +02:00
|
|
|
|
2011-04-11 23:55:58 +02:00
|
|
|
hb_language_t
|
2011-08-26 09:18:53 +02:00
|
|
|
hb_language_from_string (const char *str, int len)
|
2011-04-11 23:55:58 +02:00
|
|
|
{
|
2011-08-26 09:18:53 +02:00
|
|
|
if (!str || !len || !*str)
|
2011-05-14 04:55:32 +02:00
|
|
|
return HB_LANGUAGE_INVALID;
|
2011-04-11 23:55:58 +02:00
|
|
|
|
2011-08-26 09:18:53 +02:00
|
|
|
char strbuf[32];
|
|
|
|
if (len >= 0) {
|
|
|
|
len = MIN (len, (int) sizeof (strbuf) - 1);
|
|
|
|
str = (char *) memcpy (strbuf, str, len);
|
|
|
|
strbuf[len] = '\0';
|
|
|
|
}
|
|
|
|
|
2011-08-06 00:02:30 +02:00
|
|
|
hb_language_item_t *item = langs.find_or_insert (str, langs.lock);
|
2011-04-11 23:55:58 +02:00
|
|
|
|
2011-05-14 04:55:32 +02:00
|
|
|
return likely (item) ? item->lang : HB_LANGUAGE_INVALID;
|
2011-04-11 23:55:58 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
const char *
|
|
|
|
hb_language_to_string (hb_language_t language)
|
|
|
|
{
|
2011-05-14 04:55:32 +02:00
|
|
|
/* This is actually NULL-safe! */
|
2011-04-15 18:32:06 +02:00
|
|
|
return language->s;
|
2011-04-11 23:55:58 +02:00
|
|
|
}
|
|
|
|
|
2011-05-06 06:04:28 +02:00
|
|
|
hb_language_t
|
|
|
|
hb_language_get_default (void)
|
|
|
|
{
|
|
|
|
static hb_language_t default_language;
|
|
|
|
|
|
|
|
if (!default_language) {
|
|
|
|
/* This block is not quite threadsafe, but is not as bad as
|
|
|
|
* it looks since it's idempotent. As long as pointer ops
|
|
|
|
* are atomic, we are safe. */
|
|
|
|
|
|
|
|
/* I hear that setlocale() doesn't honor env vars on Windows,
|
|
|
|
* but for now we ignore that. */
|
|
|
|
|
2011-08-26 09:18:53 +02:00
|
|
|
default_language = hb_language_from_string (setlocale (LC_CTYPE, NULL), -1);
|
2011-05-06 06:04:28 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
return default_language;
|
|
|
|
}
|
|
|
|
|
2011-04-11 23:55:58 +02:00
|
|
|
|
2011-04-16 01:16:54 +02:00
|
|
|
/* hb_script_t */
|
|
|
|
|
|
|
|
hb_script_t
|
|
|
|
hb_script_from_iso15924_tag (hb_tag_t tag)
|
|
|
|
{
|
2011-04-20 08:54:42 +02:00
|
|
|
if (unlikely (tag == HB_TAG_NONE))
|
|
|
|
return HB_SCRIPT_INVALID;
|
|
|
|
|
2011-04-16 01:16:54 +02:00
|
|
|
/* Be lenient, adjust case (one capital letter followed by three small letters) */
|
|
|
|
tag = (tag & 0xDFDFDFDF) | 0x00202020;
|
|
|
|
|
2011-04-19 05:40:21 +02:00
|
|
|
switch (tag) {
|
2011-05-02 18:35:14 +02:00
|
|
|
|
|
|
|
/* These graduated from the 'Q' private-area codes, but
|
|
|
|
* the old code is still aliased by Unicode, and the Qaai
|
|
|
|
* one in use by ICU. */
|
|
|
|
case HB_TAG('Q','a','a','i'): return HB_SCRIPT_INHERITED;
|
|
|
|
case HB_TAG('Q','a','a','c'): return HB_SCRIPT_COPTIC;
|
|
|
|
|
|
|
|
/* Script variants from http://unicode.org/iso15924/ */
|
2011-04-19 05:40:21 +02:00
|
|
|
case HB_TAG('C','y','r','s'): return HB_SCRIPT_CYRILLIC;
|
|
|
|
case HB_TAG('L','a','t','f'): return HB_SCRIPT_LATIN;
|
|
|
|
case HB_TAG('L','a','t','g'): return HB_SCRIPT_LATIN;
|
|
|
|
case HB_TAG('S','y','r','e'): return HB_SCRIPT_SYRIAC;
|
|
|
|
case HB_TAG('S','y','r','j'): return HB_SCRIPT_SYRIAC;
|
|
|
|
case HB_TAG('S','y','r','n'): return HB_SCRIPT_SYRIAC;
|
|
|
|
}
|
2011-04-16 01:16:54 +02:00
|
|
|
|
|
|
|
/* If it looks right, just use the tag as a script */
|
|
|
|
if (((uint32_t) tag & 0xE0E0E0E0) == 0x40606060)
|
|
|
|
return (hb_script_t) tag;
|
|
|
|
|
|
|
|
/* Otherwise, return unknown */
|
|
|
|
return HB_SCRIPT_UNKNOWN;
|
|
|
|
}
|
|
|
|
|
|
|
|
hb_script_t
|
2011-08-26 09:18:53 +02:00
|
|
|
hb_script_from_string (const char *s, int len)
|
2011-04-16 01:16:54 +02:00
|
|
|
{
|
2011-08-26 09:18:53 +02:00
|
|
|
return hb_script_from_iso15924_tag (hb_tag_from_string (s, len));
|
2011-04-16 01:16:54 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
hb_tag_t
|
|
|
|
hb_script_to_iso15924_tag (hb_script_t script)
|
|
|
|
{
|
2011-04-19 05:40:21 +02:00
|
|
|
return (hb_tag_t) script;
|
2011-04-16 01:16:54 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
hb_direction_t
|
|
|
|
hb_script_get_horizontal_direction (hb_script_t script)
|
|
|
|
{
|
2012-03-07 21:52:02 +01:00
|
|
|
/* http://goo.gl/x9ilM */
|
2011-04-19 05:40:21 +02:00
|
|
|
switch ((hb_tag_t) script)
|
|
|
|
{
|
2012-03-07 21:52:02 +01:00
|
|
|
/* Unicode-1.1 additions */
|
2011-04-19 05:40:21 +02:00
|
|
|
case HB_SCRIPT_ARABIC:
|
|
|
|
case HB_SCRIPT_HEBREW:
|
2012-03-07 21:52:02 +01:00
|
|
|
|
|
|
|
/* Unicode-3.0 additions */
|
2011-04-19 05:40:21 +02:00
|
|
|
case HB_SCRIPT_SYRIAC:
|
|
|
|
case HB_SCRIPT_THAANA:
|
|
|
|
|
|
|
|
/* Unicode-4.0 additions */
|
|
|
|
case HB_SCRIPT_CYPRIOT:
|
|
|
|
|
2012-03-07 18:49:08 +01:00
|
|
|
/* Unicode-4.1 additions */
|
|
|
|
case HB_SCRIPT_KHAROSHTHI:
|
|
|
|
|
2011-04-19 05:40:21 +02:00
|
|
|
/* Unicode-5.0 additions */
|
|
|
|
case HB_SCRIPT_PHOENICIAN:
|
|
|
|
case HB_SCRIPT_NKO:
|
|
|
|
|
2012-03-07 18:49:08 +01:00
|
|
|
/* Unicode-5.1 additions */
|
|
|
|
case HB_SCRIPT_LYDIAN:
|
|
|
|
|
2011-04-19 05:40:21 +02:00
|
|
|
/* Unicode-5.2 additions */
|
|
|
|
case HB_SCRIPT_AVESTAN:
|
|
|
|
case HB_SCRIPT_IMPERIAL_ARAMAIC:
|
|
|
|
case HB_SCRIPT_INSCRIPTIONAL_PAHLAVI:
|
|
|
|
case HB_SCRIPT_INSCRIPTIONAL_PARTHIAN:
|
|
|
|
case HB_SCRIPT_OLD_SOUTH_ARABIAN:
|
|
|
|
case HB_SCRIPT_OLD_TURKIC:
|
|
|
|
case HB_SCRIPT_SAMARITAN:
|
|
|
|
|
|
|
|
/* Unicode-6.0 additions */
|
|
|
|
case HB_SCRIPT_MANDAIC:
|
|
|
|
|
2012-03-07 21:52:02 +01:00
|
|
|
/* Unicode-6.1 additions */
|
|
|
|
case HB_SCRIPT_MEROITIC_CURSIVE:
|
|
|
|
case HB_SCRIPT_MEROITIC_HIEROGLYPHS:
|
|
|
|
|
2011-04-19 05:40:21 +02:00
|
|
|
return HB_DIRECTION_RTL;
|
|
|
|
}
|
2011-04-16 01:16:54 +02:00
|
|
|
|
2011-04-19 05:40:21 +02:00
|
|
|
return HB_DIRECTION_LTR;
|
2011-04-16 01:16:54 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
|
2011-05-05 21:28:37 +02:00
|
|
|
/* hb_user_data_array_t */
|
|
|
|
|
2011-05-05 21:33:19 +02:00
|
|
|
|
|
|
|
/* NOTE: Currently we use a global lock for user_data access
|
|
|
|
* threadsafety. If one day we add a mutex to any object, we
|
|
|
|
* should switch to using that insted for these too.
|
|
|
|
*/
|
|
|
|
|
2011-05-11 01:12:49 +02:00
|
|
|
static hb_static_mutex_t user_data_lock;
|
2011-05-05 21:33:19 +02:00
|
|
|
|
2011-05-05 21:28:37 +02:00
|
|
|
bool
|
|
|
|
hb_user_data_array_t::set (hb_user_data_key_t *key,
|
|
|
|
void * data,
|
2011-08-09 00:43:24 +02:00
|
|
|
hb_destroy_func_t destroy,
|
|
|
|
hb_bool_t replace)
|
2011-05-05 21:28:37 +02:00
|
|
|
{
|
|
|
|
if (!key)
|
|
|
|
return false;
|
2011-05-05 21:33:19 +02:00
|
|
|
|
2011-08-09 00:43:24 +02:00
|
|
|
if (replace) {
|
|
|
|
if (!data && !destroy) {
|
|
|
|
items.remove (key, user_data_lock);
|
|
|
|
return true;
|
|
|
|
}
|
2011-05-05 21:28:37 +02:00
|
|
|
}
|
|
|
|
hb_user_data_item_t item = {key, data, destroy};
|
2011-08-09 00:43:24 +02:00
|
|
|
bool ret = !!items.replace_or_insert (item, user_data_lock, replace);
|
2011-05-05 21:33:19 +02:00
|
|
|
|
|
|
|
return ret;
|
2011-05-05 21:28:37 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
void *
|
|
|
|
hb_user_data_array_t::get (hb_user_data_key_t *key)
|
|
|
|
{
|
2011-05-11 01:12:49 +02:00
|
|
|
hb_user_data_item_t item = {NULL };
|
2011-05-05 21:33:19 +02:00
|
|
|
|
2011-05-11 01:12:49 +02:00
|
|
|
return items.find (key, &item, user_data_lock) ? item.data : NULL;
|
|
|
|
}
|
2011-05-05 21:33:19 +02:00
|
|
|
|
2011-05-11 01:12:49 +02:00
|
|
|
void
|
|
|
|
hb_user_data_array_t::finish (void)
|
|
|
|
{
|
|
|
|
items.finish (user_data_lock);
|
2011-05-05 21:28:37 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
|
2011-05-06 03:31:04 +02:00
|
|
|
/* hb_version */
|
|
|
|
|
|
|
|
void
|
|
|
|
hb_version (unsigned int *major,
|
|
|
|
unsigned int *minor,
|
|
|
|
unsigned int *micro)
|
|
|
|
{
|
|
|
|
*major = HB_VERSION_MAJOR;
|
|
|
|
*minor = HB_VERSION_MINOR;
|
|
|
|
*micro = HB_VERSION_MICRO;
|
|
|
|
}
|
|
|
|
|
|
|
|
const char *
|
|
|
|
hb_version_string (void)
|
|
|
|
{
|
|
|
|
return HB_VERSION_STRING;
|
|
|
|
}
|
|
|
|
|
|
|
|
hb_bool_t
|
|
|
|
hb_version_check (unsigned int major,
|
|
|
|
unsigned int minor,
|
|
|
|
unsigned int micro)
|
|
|
|
{
|
|
|
|
return HB_VERSION_CHECK (major, minor, micro);
|
|
|
|
}
|
|
|
|
|
|
|
|
|