456 lines
11 KiB
C++
456 lines
11 KiB
C++
#line 1 "hb-ot-shape-complex-khmer-machine.rl"
|
|
/*
|
|
* Copyright © 2011,2012 Google, Inc.
|
|
*
|
|
* This is part of HarfBuzz, a text shaping library.
|
|
*
|
|
* Permission is hereby granted, without written agreement and without
|
|
* license or royalty fees, to use, copy, modify, and distribute this
|
|
* software and its documentation for any purpose, provided that the
|
|
* above copyright notice and the following two paragraphs appear in
|
|
* all copies of this software.
|
|
*
|
|
* IN NO EVENT SHALL THE COPYRIGHT HOLDER BE LIABLE TO ANY PARTY FOR
|
|
* DIRECT, INDIRECT, SPECIAL, INCIDENTAL, OR CONSEQUENTIAL DAMAGES
|
|
* ARISING OUT OF THE USE OF THIS SOFTWARE AND ITS DOCUMENTATION, EVEN
|
|
* IF THE COPYRIGHT HOLDER HAS BEEN ADVISED OF THE POSSIBILITY OF SUCH
|
|
* DAMAGE.
|
|
*
|
|
* THE COPYRIGHT HOLDER SPECIFICALLY DISCLAIMS ANY WARRANTIES, INCLUDING,
|
|
* BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND
|
|
* FITNESS FOR A PARTICULAR PURPOSE. THE SOFTWARE PROVIDED HEREUNDER IS
|
|
* ON AN "AS IS" BASIS, AND THE COPYRIGHT HOLDER HAS NO OBLIGATION TO
|
|
* PROVIDE MAINTENANCE, SUPPORT, UPDATES, ENHANCEMENTS, OR MODIFICATIONS.
|
|
*
|
|
* Google Author(s): Behdad Esfahbod
|
|
*/
|
|
|
|
#ifndef HB_OT_SHAPE_COMPLEX_KHMER_MACHINE_HH
|
|
#define HB_OT_SHAPE_COMPLEX_KHMER_MACHINE_HH
|
|
|
|
#include "hb.hh"
|
|
|
|
enum khmer_syllable_type_t {
|
|
khmer_consonant_syllable,
|
|
khmer_broken_cluster,
|
|
khmer_non_khmer_cluster,
|
|
};
|
|
|
|
|
|
#line 41 "hb-ot-shape-complex-khmer-machine.hh"
|
|
#define khmer_syllable_machine_ex_C 1u
|
|
#define khmer_syllable_machine_ex_Coeng 14u
|
|
#define khmer_syllable_machine_ex_DOTTEDCIRCLE 12u
|
|
#define khmer_syllable_machine_ex_PLACEHOLDER 11u
|
|
#define khmer_syllable_machine_ex_Ra 16u
|
|
#define khmer_syllable_machine_ex_Robatic 20u
|
|
#define khmer_syllable_machine_ex_V 2u
|
|
#define khmer_syllable_machine_ex_VAbv 26u
|
|
#define khmer_syllable_machine_ex_VBlw 27u
|
|
#define khmer_syllable_machine_ex_VPre 28u
|
|
#define khmer_syllable_machine_ex_VPst 29u
|
|
#define khmer_syllable_machine_ex_Xgroup 21u
|
|
#define khmer_syllable_machine_ex_Ygroup 22u
|
|
#define khmer_syllable_machine_ex_ZWJ 6u
|
|
#define khmer_syllable_machine_ex_ZWNJ 5u
|
|
|
|
|
|
#line 59 "hb-ot-shape-complex-khmer-machine.hh"
|
|
static const unsigned char _khmer_syllable_machine_trans_keys[] = {
|
|
2u, 8u, 2u, 6u, 2u, 8u, 2u, 6u,
|
|
0u, 0u, 2u, 6u, 2u, 8u, 2u, 6u,
|
|
2u, 8u, 2u, 6u, 2u, 6u, 2u, 8u,
|
|
2u, 6u, 0u, 0u, 2u, 6u, 2u, 8u,
|
|
2u, 6u, 2u, 8u, 2u, 6u, 2u, 8u,
|
|
0u, 11u, 2u, 11u, 2u, 11u, 2u, 11u,
|
|
7u, 7u, 2u, 7u, 2u, 11u, 2u, 11u,
|
|
2u, 11u, 0u, 0u, 2u, 8u, 2u, 11u,
|
|
2u, 11u, 7u, 7u, 2u, 7u, 2u, 11u,
|
|
2u, 11u, 0u, 0u, 2u, 11u, 2u, 11u,
|
|
0u
|
|
};
|
|
|
|
static const signed char _khmer_syllable_machine_char_class[] = {
|
|
0, 0, 1, 1, 2, 2, 1, 1,
|
|
1, 1, 3, 3, 1, 4, 1, 0,
|
|
1, 1, 1, 5, 6, 7, 1, 1,
|
|
1, 8, 9, 10, 11, 0
|
|
};
|
|
|
|
static const short _khmer_syllable_machine_index_offsets[] = {
|
|
0, 7, 12, 19, 24, 25, 30, 37,
|
|
42, 49, 54, 59, 66, 71, 72, 77,
|
|
84, 89, 96, 101, 108, 120, 130, 140,
|
|
150, 151, 157, 167, 177, 187, 188, 195,
|
|
205, 215, 216, 222, 232, 242, 243, 253,
|
|
0
|
|
};
|
|
|
|
static const signed char _khmer_syllable_machine_indicies[] = {
|
|
1, 0, 0, 2, 3, 0, 4, 1,
|
|
0, 0, 0, 3, 1, 0, 0, 0,
|
|
3, 0, 4, 5, 0, 0, 0, 4,
|
|
6, 7, 0, 0, 0, 8, 9, 0,
|
|
0, 0, 10, 0, 4, 9, 0, 0,
|
|
0, 10, 11, 0, 0, 0, 12, 0,
|
|
4, 11, 0, 0, 0, 12, 14, 13,
|
|
13, 13, 15, 14, 16, 16, 16, 15,
|
|
16, 17, 18, 16, 16, 16, 17, 19,
|
|
20, 16, 16, 16, 21, 22, 16, 16,
|
|
16, 23, 16, 17, 22, 16, 16, 16,
|
|
23, 24, 16, 16, 16, 25, 16, 17,
|
|
24, 16, 16, 16, 25, 14, 16, 16,
|
|
26, 15, 16, 17, 29, 28, 30, 2,
|
|
31, 28, 15, 19, 17, 23, 25, 21,
|
|
33, 32, 34, 2, 3, 6, 4, 10,
|
|
12, 8, 35, 32, 36, 32, 3, 6,
|
|
4, 10, 12, 8, 5, 32, 36, 32,
|
|
4, 6, 32, 32, 32, 8, 6, 7,
|
|
32, 36, 32, 8, 6, 37, 32, 36,
|
|
32, 10, 6, 4, 32, 32, 8, 38,
|
|
32, 36, 32, 12, 6, 4, 10, 32,
|
|
8, 35, 32, 34, 32, 3, 6, 4,
|
|
10, 12, 8, 29, 14, 39, 39, 39,
|
|
15, 39, 17, 41, 40, 42, 40, 15,
|
|
19, 17, 23, 25, 21, 18, 40, 42,
|
|
40, 17, 19, 40, 40, 40, 21, 19,
|
|
20, 40, 42, 40, 21, 19, 43, 40,
|
|
42, 40, 23, 19, 17, 40, 40, 21,
|
|
44, 40, 42, 40, 25, 19, 17, 23,
|
|
40, 21, 45, 46, 40, 31, 26, 15,
|
|
19, 17, 23, 25, 21, 41, 40, 31,
|
|
40, 15, 19, 17, 23, 25, 21, 0
|
|
};
|
|
|
|
static const signed char _khmer_syllable_machine_index_defaults[] = {
|
|
0, 0, 0, 0, 0, 0, 0, 0,
|
|
0, 0, 13, 16, 16, 16, 16, 16,
|
|
16, 16, 16, 16, 28, 32, 32, 32,
|
|
32, 32, 32, 32, 32, 32, 39, 40,
|
|
40, 40, 40, 40, 40, 40, 40, 40,
|
|
0
|
|
};
|
|
|
|
static const signed char _khmer_syllable_machine_cond_targs[] = {
|
|
20, 1, 28, 22, 23, 3, 24, 5,
|
|
25, 7, 26, 9, 27, 20, 10, 31,
|
|
20, 32, 12, 33, 14, 34, 16, 35,
|
|
18, 36, 39, 20, 20, 21, 30, 37,
|
|
20, 0, 29, 2, 4, 6, 8, 20,
|
|
20, 11, 13, 15, 17, 38, 19, 0
|
|
};
|
|
|
|
static const signed char _khmer_syllable_machine_cond_actions[] = {
|
|
1, 0, 2, 2, 2, 0, 0, 0,
|
|
2, 0, 2, 0, 2, 3, 0, 4,
|
|
5, 2, 0, 0, 0, 2, 0, 2,
|
|
0, 2, 4, 0, 8, 2, 9, 0,
|
|
10, 0, 0, 0, 0, 0, 0, 11,
|
|
12, 0, 0, 0, 0, 4, 0, 0
|
|
};
|
|
|
|
static const signed char _khmer_syllable_machine_to_state_actions[] = {
|
|
0, 0, 0, 0, 0, 0, 0, 0,
|
|
0, 0, 0, 0, 0, 0, 0, 0,
|
|
0, 0, 0, 0, 6, 0, 0, 0,
|
|
0, 0, 0, 0, 0, 0, 0, 0,
|
|
0, 0, 0, 0, 0, 0, 0, 0,
|
|
0
|
|
};
|
|
|
|
static const signed char _khmer_syllable_machine_from_state_actions[] = {
|
|
0, 0, 0, 0, 0, 0, 0, 0,
|
|
0, 0, 0, 0, 0, 0, 0, 0,
|
|
0, 0, 0, 0, 7, 0, 0, 0,
|
|
0, 0, 0, 0, 0, 0, 0, 0,
|
|
0, 0, 0, 0, 0, 0, 0, 0,
|
|
0
|
|
};
|
|
|
|
static const signed char _khmer_syllable_machine_eof_trans[] = {
|
|
1, 1, 1, 1, 1, 1, 1, 1,
|
|
1, 1, 14, 17, 17, 17, 17, 17,
|
|
17, 17, 17, 17, 28, 33, 33, 33,
|
|
33, 33, 33, 33, 33, 33, 40, 41,
|
|
41, 41, 41, 41, 41, 41, 41, 41,
|
|
0
|
|
};
|
|
|
|
static const int khmer_syllable_machine_start = 20;
|
|
static const int khmer_syllable_machine_first_final = 20;
|
|
static const int khmer_syllable_machine_error = -1;
|
|
|
|
static const int khmer_syllable_machine_en_main = 20;
|
|
|
|
|
|
#line 43 "hb-ot-shape-complex-khmer-machine.rl"
|
|
|
|
|
|
|
|
#line 86 "hb-ot-shape-complex-khmer-machine.rl"
|
|
|
|
|
|
#define found_syllable(syllable_type) \
|
|
HB_STMT_START { \
|
|
if (0) fprintf (stderr, "syllable %d..%d %s\n", ts, te, #syllable_type); \
|
|
for (unsigned int i = ts; i < te; i++) \
|
|
info[i].syllable() = (syllable_serial << 4) | syllable_type; \
|
|
syllable_serial++; \
|
|
if (unlikely (syllable_serial == 16)) syllable_serial = 1; \
|
|
} HB_STMT_END
|
|
|
|
static void
|
|
find_syllables_khmer (hb_buffer_t *buffer)
|
|
{
|
|
unsigned int p, pe, eof, ts, te, act HB_UNUSED;
|
|
int cs;
|
|
hb_glyph_info_t *info = buffer->info;
|
|
|
|
#line 210 "hb-ot-shape-complex-khmer-machine.hh"
|
|
{
|
|
cs = (int)khmer_syllable_machine_start;
|
|
ts = 0;
|
|
te = 0;
|
|
act = 0;
|
|
}
|
|
|
|
#line 106 "hb-ot-shape-complex-khmer-machine.rl"
|
|
|
|
|
|
p = 0;
|
|
pe = eof = buffer->len;
|
|
|
|
unsigned int syllable_serial = 1;
|
|
|
|
#line 226 "hb-ot-shape-complex-khmer-machine.hh"
|
|
{
|
|
unsigned int _trans = 0;
|
|
const unsigned char * _keys;
|
|
const signed char * _inds;
|
|
int _ic;
|
|
_resume: {}
|
|
if ( p == pe && p != eof )
|
|
goto _out;
|
|
switch ( _khmer_syllable_machine_from_state_actions[cs] ) {
|
|
case 7: {
|
|
{
|
|
#line 1 "NONE"
|
|
{ts = p;}}
|
|
|
|
#line 241 "hb-ot-shape-complex-khmer-machine.hh"
|
|
|
|
|
|
break;
|
|
}
|
|
}
|
|
|
|
if ( p == eof ) {
|
|
if ( _khmer_syllable_machine_eof_trans[cs] > 0 ) {
|
|
_trans = (unsigned int)_khmer_syllable_machine_eof_trans[cs] - 1;
|
|
}
|
|
}
|
|
else {
|
|
_keys = ( _khmer_syllable_machine_trans_keys + ((cs<<1)));
|
|
_inds = ( _khmer_syllable_machine_indicies + (_khmer_syllable_machine_index_offsets[cs]));
|
|
|
|
if ( (info[p].khmer_category()) <= 29 && (info[p].khmer_category()) >= 1 ) {
|
|
_ic = (int)_khmer_syllable_machine_char_class[(int)(info[p].khmer_category()) - 1];
|
|
if ( _ic <= (int)(*( _keys+1)) && _ic >= (int)(*( _keys)) )
|
|
_trans = (unsigned int)(*( _inds + (int)( _ic - (int)(*( _keys)) ) ));
|
|
else
|
|
_trans = (unsigned int)_khmer_syllable_machine_index_defaults[cs];
|
|
}
|
|
else {
|
|
_trans = (unsigned int)_khmer_syllable_machine_index_defaults[cs];
|
|
}
|
|
|
|
}
|
|
cs = (int)_khmer_syllable_machine_cond_targs[_trans];
|
|
|
|
if ( _khmer_syllable_machine_cond_actions[_trans] != 0 ) {
|
|
|
|
switch ( _khmer_syllable_machine_cond_actions[_trans] ) {
|
|
case 2: {
|
|
{
|
|
#line 1 "NONE"
|
|
{te = p+1;}}
|
|
|
|
#line 279 "hb-ot-shape-complex-khmer-machine.hh"
|
|
|
|
|
|
break;
|
|
}
|
|
case 8: {
|
|
{
|
|
#line 82 "hb-ot-shape-complex-khmer-machine.rl"
|
|
{te = p+1;{
|
|
#line 82 "hb-ot-shape-complex-khmer-machine.rl"
|
|
found_syllable (khmer_non_khmer_cluster); }
|
|
}}
|
|
|
|
#line 292 "hb-ot-shape-complex-khmer-machine.hh"
|
|
|
|
|
|
break;
|
|
}
|
|
case 10: {
|
|
{
|
|
#line 80 "hb-ot-shape-complex-khmer-machine.rl"
|
|
{te = p;p = p - 1;{
|
|
#line 80 "hb-ot-shape-complex-khmer-machine.rl"
|
|
found_syllable (khmer_consonant_syllable); }
|
|
}}
|
|
|
|
#line 305 "hb-ot-shape-complex-khmer-machine.hh"
|
|
|
|
|
|
break;
|
|
}
|
|
case 12: {
|
|
{
|
|
#line 81 "hb-ot-shape-complex-khmer-machine.rl"
|
|
{te = p;p = p - 1;{
|
|
#line 81 "hb-ot-shape-complex-khmer-machine.rl"
|
|
found_syllable (khmer_broken_cluster); }
|
|
}}
|
|
|
|
#line 318 "hb-ot-shape-complex-khmer-machine.hh"
|
|
|
|
|
|
break;
|
|
}
|
|
case 11: {
|
|
{
|
|
#line 82 "hb-ot-shape-complex-khmer-machine.rl"
|
|
{te = p;p = p - 1;{
|
|
#line 82 "hb-ot-shape-complex-khmer-machine.rl"
|
|
found_syllable (khmer_non_khmer_cluster); }
|
|
}}
|
|
|
|
#line 331 "hb-ot-shape-complex-khmer-machine.hh"
|
|
|
|
|
|
break;
|
|
}
|
|
case 1: {
|
|
{
|
|
#line 80 "hb-ot-shape-complex-khmer-machine.rl"
|
|
{p = ((te))-1;
|
|
{
|
|
#line 80 "hb-ot-shape-complex-khmer-machine.rl"
|
|
found_syllable (khmer_consonant_syllable); }
|
|
}}
|
|
|
|
#line 345 "hb-ot-shape-complex-khmer-machine.hh"
|
|
|
|
|
|
break;
|
|
}
|
|
case 5: {
|
|
{
|
|
#line 81 "hb-ot-shape-complex-khmer-machine.rl"
|
|
{p = ((te))-1;
|
|
{
|
|
#line 81 "hb-ot-shape-complex-khmer-machine.rl"
|
|
found_syllable (khmer_broken_cluster); }
|
|
}}
|
|
|
|
#line 359 "hb-ot-shape-complex-khmer-machine.hh"
|
|
|
|
|
|
break;
|
|
}
|
|
case 3: {
|
|
{
|
|
#line 1 "NONE"
|
|
{switch( act ) {
|
|
case 2: {
|
|
p = ((te))-1;
|
|
{
|
|
#line 81 "hb-ot-shape-complex-khmer-machine.rl"
|
|
found_syllable (khmer_broken_cluster); }
|
|
break;
|
|
}
|
|
case 3: {
|
|
p = ((te))-1;
|
|
{
|
|
#line 82 "hb-ot-shape-complex-khmer-machine.rl"
|
|
found_syllable (khmer_non_khmer_cluster); }
|
|
break;
|
|
}
|
|
}}
|
|
}
|
|
|
|
#line 385 "hb-ot-shape-complex-khmer-machine.hh"
|
|
|
|
|
|
break;
|
|
}
|
|
case 4: {
|
|
{
|
|
#line 1 "NONE"
|
|
{te = p+1;}}
|
|
|
|
#line 395 "hb-ot-shape-complex-khmer-machine.hh"
|
|
|
|
{
|
|
#line 81 "hb-ot-shape-complex-khmer-machine.rl"
|
|
{act = 2;}}
|
|
|
|
#line 401 "hb-ot-shape-complex-khmer-machine.hh"
|
|
|
|
|
|
break;
|
|
}
|
|
case 9: {
|
|
{
|
|
#line 1 "NONE"
|
|
{te = p+1;}}
|
|
|
|
#line 411 "hb-ot-shape-complex-khmer-machine.hh"
|
|
|
|
{
|
|
#line 82 "hb-ot-shape-complex-khmer-machine.rl"
|
|
{act = 3;}}
|
|
|
|
#line 417 "hb-ot-shape-complex-khmer-machine.hh"
|
|
|
|
|
|
break;
|
|
}
|
|
}
|
|
|
|
}
|
|
|
|
if ( p == eof ) {
|
|
if ( cs >= 20 )
|
|
goto _out;
|
|
}
|
|
else {
|
|
switch ( _khmer_syllable_machine_to_state_actions[cs] ) {
|
|
case 6: {
|
|
{
|
|
#line 1 "NONE"
|
|
{ts = 0;}}
|
|
|
|
#line 437 "hb-ot-shape-complex-khmer-machine.hh"
|
|
|
|
|
|
break;
|
|
}
|
|
}
|
|
|
|
p += 1;
|
|
goto _resume;
|
|
}
|
|
_out: {}
|
|
}
|
|
|
|
#line 114 "hb-ot-shape-complex-khmer-machine.rl"
|
|
|
|
}
|
|
|
|
#undef found_syllable
|
|
|
|
#endif /* HB_OT_SHAPE_COMPLEX_KHMER_MACHINE_HH */
|