2009-08-11 02:05:16 +02:00
|
|
|
/*
|
|
|
|
* Copyright (C) 2009 Red Hat, Inc.
|
|
|
|
*
|
2010-04-22 06:11:43 +02:00
|
|
|
* This is part of HarfBuzz, a text shaping library.
|
2009-08-11 02:05:16 +02:00
|
|
|
*
|
|
|
|
* Permission is hereby granted, without written agreement and without
|
|
|
|
* license or royalty fees, to use, copy, modify, and distribute this
|
|
|
|
* software and its documentation for any purpose, provided that the
|
|
|
|
* above copyright notice and the following two paragraphs appear in
|
|
|
|
* all copies of this software.
|
|
|
|
*
|
|
|
|
* IN NO EVENT SHALL THE COPYRIGHT HOLDER BE LIABLE TO ANY PARTY FOR
|
|
|
|
* DIRECT, INDIRECT, SPECIAL, INCIDENTAL, OR CONSEQUENTIAL DAMAGES
|
|
|
|
* ARISING OUT OF THE USE OF THIS SOFTWARE AND ITS DOCUMENTATION, EVEN
|
|
|
|
* IF THE COPYRIGHT HOLDER HAS BEEN ADVISED OF THE POSSIBILITY OF SUCH
|
|
|
|
* DAMAGE.
|
|
|
|
*
|
|
|
|
* THE COPYRIGHT HOLDER SPECIFICALLY DISCLAIMS ANY WARRANTIES, INCLUDING,
|
|
|
|
* BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND
|
|
|
|
* FITNESS FOR A PARTICULAR PURPOSE. THE SOFTWARE PROVIDED HEREUNDER IS
|
|
|
|
* ON AN "AS IS" BASIS, AND THE COPYRIGHT HOLDER HAS NO OBLIGATION TO
|
|
|
|
* PROVIDE MAINTENANCE, SUPPORT, UPDATES, ENHANCEMENTS, OR MODIFICATIONS.
|
|
|
|
*
|
|
|
|
* Red Hat Author(s): Behdad Esfahbod
|
|
|
|
*/
|
|
|
|
|
|
|
|
#ifndef HB_UNICODE_H
|
|
|
|
#define HB_UNICODE_H
|
|
|
|
|
|
|
|
#include "hb-common.h"
|
|
|
|
|
|
|
|
HB_BEGIN_DECLS
|
|
|
|
|
2010-07-23 21:11:18 +02:00
|
|
|
|
2009-08-11 02:05:16 +02:00
|
|
|
/* Unicode General Category property */
|
|
|
|
typedef enum
|
|
|
|
{
|
|
|
|
HB_CATEGORY_CONTROL,
|
|
|
|
HB_CATEGORY_FORMAT,
|
|
|
|
HB_CATEGORY_UNASSIGNED,
|
|
|
|
HB_CATEGORY_PRIVATE_USE,
|
|
|
|
HB_CATEGORY_SURROGATE,
|
|
|
|
HB_CATEGORY_LOWERCASE_LETTER,
|
|
|
|
HB_CATEGORY_MODIFIER_LETTER,
|
|
|
|
HB_CATEGORY_OTHER_LETTER,
|
|
|
|
HB_CATEGORY_TITLECASE_LETTER,
|
|
|
|
HB_CATEGORY_UPPERCASE_LETTER,
|
|
|
|
HB_CATEGORY_COMBINING_MARK,
|
|
|
|
HB_CATEGORY_ENCLOSING_MARK,
|
|
|
|
HB_CATEGORY_NON_SPACING_MARK,
|
|
|
|
HB_CATEGORY_DECIMAL_NUMBER,
|
|
|
|
HB_CATEGORY_LETTER_NUMBER,
|
|
|
|
HB_CATEGORY_OTHER_NUMBER,
|
|
|
|
HB_CATEGORY_CONNECT_PUNCTUATION,
|
|
|
|
HB_CATEGORY_DASH_PUNCTUATION,
|
|
|
|
HB_CATEGORY_CLOSE_PUNCTUATION,
|
|
|
|
HB_CATEGORY_FINAL_PUNCTUATION,
|
|
|
|
HB_CATEGORY_INITIAL_PUNCTUATION,
|
|
|
|
HB_CATEGORY_OTHER_PUNCTUATION,
|
|
|
|
HB_CATEGORY_OPEN_PUNCTUATION,
|
|
|
|
HB_CATEGORY_CURRENCY_SYMBOL,
|
|
|
|
HB_CATEGORY_MODIFIER_SYMBOL,
|
|
|
|
HB_CATEGORY_MATH_SYMBOL,
|
|
|
|
HB_CATEGORY_OTHER_SYMBOL,
|
|
|
|
HB_CATEGORY_LINE_SEPARATOR,
|
|
|
|
HB_CATEGORY_PARAGRAPH_SEPARATOR,
|
|
|
|
HB_CATEGORY_SPACE_SEPARATOR
|
|
|
|
} hb_category_t;
|
|
|
|
|
|
|
|
/* Unicode Script property */
|
|
|
|
typedef enum
|
|
|
|
{ /* ISO 15924 code */
|
|
|
|
HB_SCRIPT_INVALID_CODE = -1,
|
|
|
|
HB_SCRIPT_COMMON = 0, /* Zyyy */
|
|
|
|
HB_SCRIPT_INHERITED, /* Qaai */
|
|
|
|
HB_SCRIPT_ARABIC, /* Arab */
|
|
|
|
HB_SCRIPT_ARMENIAN, /* Armn */
|
|
|
|
HB_SCRIPT_BENGALI, /* Beng */
|
|
|
|
HB_SCRIPT_BOPOMOFO, /* Bopo */
|
|
|
|
HB_SCRIPT_CHEROKEE, /* Cher */
|
|
|
|
HB_SCRIPT_COPTIC, /* Qaac */
|
|
|
|
HB_SCRIPT_CYRILLIC, /* Cyrl (Cyrs) */
|
|
|
|
HB_SCRIPT_DESERET, /* Dsrt */
|
|
|
|
HB_SCRIPT_DEVANAGARI, /* Deva */
|
|
|
|
HB_SCRIPT_ETHIOPIC, /* Ethi */
|
|
|
|
HB_SCRIPT_GEORGIAN, /* Geor (Geon, Geoa) */
|
|
|
|
HB_SCRIPT_GOTHIC, /* Goth */
|
|
|
|
HB_SCRIPT_GREEK, /* Grek */
|
|
|
|
HB_SCRIPT_GUJARATI, /* Gujr */
|
|
|
|
HB_SCRIPT_GURMUKHI, /* Guru */
|
|
|
|
HB_SCRIPT_HAN, /* Hani */
|
|
|
|
HB_SCRIPT_HANGUL, /* Hang */
|
|
|
|
HB_SCRIPT_HEBREW, /* Hebr */
|
|
|
|
HB_SCRIPT_HIRAGANA, /* Hira */
|
|
|
|
HB_SCRIPT_KANNADA, /* Knda */
|
|
|
|
HB_SCRIPT_KATAKANA, /* Kana */
|
|
|
|
HB_SCRIPT_KHMER, /* Khmr */
|
|
|
|
HB_SCRIPT_LAO, /* Laoo */
|
|
|
|
HB_SCRIPT_LATIN, /* Latn (Latf, Latg) */
|
|
|
|
HB_SCRIPT_MALAYALAM, /* Mlym */
|
|
|
|
HB_SCRIPT_MONGOLIAN, /* Mong */
|
|
|
|
HB_SCRIPT_MYANMAR, /* Mymr */
|
|
|
|
HB_SCRIPT_OGHAM, /* Ogam */
|
|
|
|
HB_SCRIPT_OLD_ITALIC, /* Ital */
|
|
|
|
HB_SCRIPT_ORIYA, /* Orya */
|
|
|
|
HB_SCRIPT_RUNIC, /* Runr */
|
|
|
|
HB_SCRIPT_SINHALA, /* Sinh */
|
|
|
|
HB_SCRIPT_SYRIAC, /* Syrc (Syrj, Syrn, Syre) */
|
|
|
|
HB_SCRIPT_TAMIL, /* Taml */
|
|
|
|
HB_SCRIPT_TELUGU, /* Telu */
|
|
|
|
HB_SCRIPT_THAANA, /* Thaa */
|
|
|
|
HB_SCRIPT_THAI, /* Thai */
|
|
|
|
HB_SCRIPT_TIBETAN, /* Tibt */
|
|
|
|
HB_SCRIPT_CANADIAN_ABORIGINAL, /* Cans */
|
|
|
|
HB_SCRIPT_YI, /* Yiii */
|
|
|
|
HB_SCRIPT_TAGALOG, /* Tglg */
|
|
|
|
HB_SCRIPT_HANUNOO, /* Hano */
|
|
|
|
HB_SCRIPT_BUHID, /* Buhd */
|
|
|
|
HB_SCRIPT_TAGBANWA, /* Tagb */
|
|
|
|
|
|
|
|
/* Unicode-4.0 additions */
|
|
|
|
HB_SCRIPT_BRAILLE, /* Brai */
|
|
|
|
HB_SCRIPT_CYPRIOT, /* Cprt */
|
|
|
|
HB_SCRIPT_LIMBU, /* Limb */
|
|
|
|
HB_SCRIPT_OSMANYA, /* Osma */
|
|
|
|
HB_SCRIPT_SHAVIAN, /* Shaw */
|
|
|
|
HB_SCRIPT_LINEAR_B, /* Linb */
|
|
|
|
HB_SCRIPT_TAI_LE, /* Tale */
|
|
|
|
HB_SCRIPT_UGARITIC, /* Ugar */
|
|
|
|
|
|
|
|
/* Unicode-4.1 additions */
|
|
|
|
HB_SCRIPT_NEW_TAI_LUE, /* Talu */
|
|
|
|
HB_SCRIPT_BUGINESE, /* Bugi */
|
|
|
|
HB_SCRIPT_GLAGOLITIC, /* Glag */
|
|
|
|
HB_SCRIPT_TIFINAGH, /* Tfng */
|
|
|
|
HB_SCRIPT_SYLOTI_NAGRI, /* Sylo */
|
|
|
|
HB_SCRIPT_OLD_PERSIAN, /* Xpeo */
|
|
|
|
HB_SCRIPT_KHAROSHTHI, /* Khar */
|
|
|
|
|
|
|
|
/* Unicode-5.0 additions */
|
|
|
|
HB_SCRIPT_UNKNOWN, /* Zzzz */
|
|
|
|
HB_SCRIPT_BALINESE, /* Bali */
|
|
|
|
HB_SCRIPT_CUNEIFORM, /* Xsux */
|
|
|
|
HB_SCRIPT_PHOENICIAN, /* Phnx */
|
|
|
|
HB_SCRIPT_PHAGS_PA, /* Phag */
|
|
|
|
HB_SCRIPT_NKO, /* Nkoo */
|
|
|
|
|
|
|
|
/* Unicode-5.1 additions */
|
|
|
|
HB_SCRIPT_KAYAH_LI, /* Kali */
|
|
|
|
HB_SCRIPT_LEPCHA, /* Lepc */
|
|
|
|
HB_SCRIPT_REJANG, /* Rjng */
|
|
|
|
HB_SCRIPT_SUNDANESE, /* Sund */
|
|
|
|
HB_SCRIPT_SAURASHTRA, /* Saur */
|
|
|
|
HB_SCRIPT_CHAM, /* Cham */
|
|
|
|
HB_SCRIPT_OL_CHIKI, /* Olck */
|
|
|
|
HB_SCRIPT_VAI, /* Vaii */
|
|
|
|
HB_SCRIPT_CARIAN, /* Cari */
|
|
|
|
HB_SCRIPT_LYCIAN, /* Lyci */
|
2010-05-21 14:29:12 +02:00
|
|
|
HB_SCRIPT_LYDIAN, /* Lydi */
|
|
|
|
|
|
|
|
/* Unicode-5.2 additions */
|
|
|
|
HB_SCRIPT_AVESTAN, /* Avst */
|
|
|
|
HB_SCRIPT_BAMUM, /* Bamu */
|
|
|
|
HB_SCRIPT_EGYPTIAN_HIEROGLYPHS, /* Egyp */
|
|
|
|
HB_SCRIPT_IMPERIAL_ARAMAIC, /* Armi */
|
|
|
|
HB_SCRIPT_INSCRIPTIONAL_PAHLAVI, /* Phli */
|
|
|
|
HB_SCRIPT_INSCRIPTIONAL_PARTHIAN, /* Prti */
|
|
|
|
HB_SCRIPT_JAVANESE, /* Java */
|
|
|
|
HB_SCRIPT_KAITHI, /* Kthi */
|
|
|
|
HB_SCRIPT_LISU, /* Lisu */
|
|
|
|
HB_SCRIPT_MEITEI_MAYEK, /* Mtei */
|
|
|
|
HB_SCRIPT_OLD_SOUTH_ARABIAN, /* Sarb */
|
|
|
|
HB_SCRIPT_OLD_TURKIC, /* Orkh */
|
|
|
|
HB_SCRIPT_SAMARITAN, /* Samr */
|
|
|
|
HB_SCRIPT_TAI_THAM, /* Lana */
|
|
|
|
HB_SCRIPT_TAI_VIET /* Tavt */
|
2009-08-11 02:05:16 +02:00
|
|
|
} hb_script_t;
|
|
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
* hb_unicode_funcs_t
|
|
|
|
*/
|
|
|
|
|
|
|
|
typedef struct _hb_unicode_funcs_t hb_unicode_funcs_t;
|
|
|
|
|
|
|
|
hb_unicode_funcs_t *
|
|
|
|
hb_unicode_funcs_create (void);
|
|
|
|
|
|
|
|
hb_unicode_funcs_t *
|
|
|
|
hb_unicode_funcs_reference (hb_unicode_funcs_t *ufuncs);
|
|
|
|
|
|
|
|
unsigned int
|
|
|
|
hb_unicode_funcs_get_reference_count (hb_unicode_funcs_t *ufuncs);
|
|
|
|
|
|
|
|
void
|
|
|
|
hb_unicode_funcs_destroy (hb_unicode_funcs_t *ufuncs);
|
|
|
|
|
|
|
|
hb_unicode_funcs_t *
|
|
|
|
hb_unicode_funcs_copy (hb_unicode_funcs_t *ufuncs);
|
|
|
|
|
2009-08-11 05:25:28 +02:00
|
|
|
void
|
|
|
|
hb_unicode_funcs_make_immutable (hb_unicode_funcs_t *ufuncs);
|
2009-08-11 02:05:16 +02:00
|
|
|
|
|
|
|
|
|
|
|
/* funcs */
|
|
|
|
|
2009-08-11 05:35:05 +02:00
|
|
|
typedef hb_codepoint_t (*hb_unicode_get_mirroring_func_t) (hb_codepoint_t unicode);
|
2009-08-11 02:05:16 +02:00
|
|
|
typedef hb_category_t (*hb_unicode_get_general_category_func_t) (hb_codepoint_t unicode);
|
|
|
|
typedef hb_script_t (*hb_unicode_get_script_func_t) (hb_codepoint_t unicode);
|
|
|
|
typedef unsigned int (*hb_unicode_get_combining_class_func_t) (hb_codepoint_t unicode);
|
|
|
|
typedef unsigned int (*hb_unicode_get_eastasian_width_func_t) (hb_codepoint_t unicode);
|
|
|
|
|
|
|
|
|
|
|
|
void
|
2009-08-11 05:35:05 +02:00
|
|
|
hb_unicode_funcs_set_mirroring_func (hb_unicode_funcs_t *ufuncs,
|
|
|
|
hb_unicode_get_mirroring_func_t mirroring_func);
|
2009-08-11 02:05:16 +02:00
|
|
|
|
|
|
|
void
|
|
|
|
hb_unicode_funcs_set_general_category_func (hb_unicode_funcs_t *ufuncs,
|
|
|
|
hb_unicode_get_general_category_func_t general_category_func);
|
|
|
|
|
|
|
|
void
|
|
|
|
hb_unicode_funcs_set_script_func (hb_unicode_funcs_t *ufuncs,
|
|
|
|
hb_unicode_get_script_func_t script_func);
|
|
|
|
|
|
|
|
void
|
|
|
|
hb_unicode_funcs_set_combining_class_func (hb_unicode_funcs_t *ufuncs,
|
|
|
|
hb_unicode_get_combining_class_func_t combining_class_func);
|
|
|
|
|
|
|
|
void
|
|
|
|
hb_unicode_funcs_set_eastasian_width_func (hb_unicode_funcs_t *ufuncs,
|
|
|
|
hb_unicode_get_eastasian_width_func_t eastasian_width_func);
|
|
|
|
|
|
|
|
|
2009-12-20 15:29:16 +01:00
|
|
|
hb_codepoint_t
|
|
|
|
hb_unicode_get_mirroring (hb_unicode_funcs_t *ufuncs,
|
|
|
|
hb_codepoint_t unicode);
|
|
|
|
|
|
|
|
hb_category_t
|
|
|
|
hb_unicode_get_general_category (hb_unicode_funcs_t *ufuncs,
|
|
|
|
hb_codepoint_t unicode);
|
|
|
|
|
|
|
|
hb_script_t
|
|
|
|
hb_unicode_get_script (hb_unicode_funcs_t *ufuncs,
|
|
|
|
hb_codepoint_t unicode);
|
|
|
|
|
|
|
|
unsigned int
|
|
|
|
hb_unicode_get_combining_class (hb_unicode_funcs_t *ufuncs,
|
|
|
|
hb_codepoint_t unicode);
|
|
|
|
|
|
|
|
unsigned int
|
|
|
|
hb_unicode_get_eastasian_width (hb_unicode_funcs_t *ufuncs,
|
|
|
|
hb_codepoint_t unicode);
|
|
|
|
|
|
|
|
|
2009-08-11 02:05:16 +02:00
|
|
|
HB_END_DECLS
|
|
|
|
|
2009-11-05 00:12:32 +01:00
|
|
|
#endif /* HB_UNICODE_H */
|