[aat] Improve unsafe-to-break logic
Reduces false-positives. See comments for new logic. Fixes https://github.com/harfbuzz/harfbuzz/issues/2860 Adjusts run-tests.sh to allow unhashed absolute filenames.
This commit is contained in:
parent
cf203936d7
commit
d8ea552d10
|
@ -730,6 +730,7 @@ template <typename Types, typename EntryData>
|
||||||
struct StateTableDriver
|
struct StateTableDriver
|
||||||
{
|
{
|
||||||
using StateTableT = StateTable<Types, EntryData>;
|
using StateTableT = StateTable<Types, EntryData>;
|
||||||
|
using EntryT = Entry<EntryData>;
|
||||||
|
|
||||||
StateTableDriver (const StateTableT &machine_,
|
StateTableDriver (const StateTableT &machine_,
|
||||||
hb_buffer_t *buffer_,
|
hb_buffer_t *buffer_,
|
||||||
|
@ -751,33 +752,79 @@ struct StateTableDriver
|
||||||
machine.get_class (buffer->info[buffer->idx].codepoint, num_glyphs) :
|
machine.get_class (buffer->info[buffer->idx].codepoint, num_glyphs) :
|
||||||
(unsigned) StateTableT::CLASS_END_OF_TEXT;
|
(unsigned) StateTableT::CLASS_END_OF_TEXT;
|
||||||
DEBUG_MSG (APPLY, nullptr, "c%u at %u", klass, buffer->idx);
|
DEBUG_MSG (APPLY, nullptr, "c%u at %u", klass, buffer->idx);
|
||||||
const Entry<EntryData> &entry = machine.get_entry (state, klass);
|
const EntryT &entry = machine.get_entry (state, klass);
|
||||||
|
const int next_state = machine.new_state (entry.newState);
|
||||||
|
|
||||||
/* Unsafe-to-break before this if not in state 0, as things might
|
/* Conditions under which it's guaranteed safe-to-break before current glyph:
|
||||||
* go differently if we start from state 0 here.
|
|
||||||
*
|
*
|
||||||
* Ugh. The indexing here is ugly... */
|
* 1. There was no action in this transition; and
|
||||||
if (state && buffer->backtrack_len () && buffer->idx < buffer->len)
|
*
|
||||||
{
|
* 2. If we break before current glyph, the results will be the same. That
|
||||||
/* If there's no action and we're just epsilon-transitioning to state 0,
|
* is guaranteed if:
|
||||||
* safe to break. */
|
*
|
||||||
if (c->is_actionable (this, entry) ||
|
* 2a. We were already in start-of-text state; or
|
||||||
!(entry.newState == StateTableT::STATE_START_OF_TEXT &&
|
*
|
||||||
entry.flags == context_t::DontAdvance))
|
* 2b. We are epsilon-transitioning to start-of-text state; or
|
||||||
buffer->unsafe_to_break_from_outbuffer (buffer->backtrack_len () - 1, buffer->idx + 1);
|
*
|
||||||
}
|
* 2c. Starting from start-of-text state seeing current glyph:
|
||||||
|
*
|
||||||
|
* 2c'. There won't be any actions; and
|
||||||
|
*
|
||||||
|
* 2c". We would end up in the same state that we were going to end up
|
||||||
|
* in now, including whether epsilon-transitioning.
|
||||||
|
*
|
||||||
|
* and
|
||||||
|
*
|
||||||
|
* 3. If we break before current glyph, there won't be any end-of-text action
|
||||||
|
* after previous glyph.
|
||||||
|
*
|
||||||
|
* This triples the transitions we need to look up, but is worth returning
|
||||||
|
* granular unsafe-to-break results. See eg.:
|
||||||
|
*
|
||||||
|
* https://github.com/harfbuzz/harfbuzz/issues/2860
|
||||||
|
*/
|
||||||
|
const EntryT *wouldbe_entry;
|
||||||
|
bool safe_to_break =
|
||||||
|
/* 1. */
|
||||||
|
!c->is_actionable (this, entry)
|
||||||
|
&&
|
||||||
|
/* 2. */
|
||||||
|
(
|
||||||
|
/* 2a. */
|
||||||
|
state == StateTableT::STATE_START_OF_TEXT
|
||||||
|
||
|
||||||
|
/* 2b. */
|
||||||
|
(
|
||||||
|
(entry.flags & context_t::DontAdvance) &&
|
||||||
|
next_state == StateTableT::STATE_START_OF_TEXT
|
||||||
|
)
|
||||||
|
||
|
||||||
|
/* 2c. */
|
||||||
|
(
|
||||||
|
wouldbe_entry = &machine.get_entry (StateTableT::STATE_START_OF_TEXT, klass)
|
||||||
|
,
|
||||||
|
/* 2c'. */
|
||||||
|
!c->is_actionable (this, *wouldbe_entry)
|
||||||
|
&&
|
||||||
|
/* 2c". */
|
||||||
|
(
|
||||||
|
next_state == machine.new_state (wouldbe_entry->newState)
|
||||||
|
&&
|
||||||
|
(entry.flags & context_t::DontAdvance) == (wouldbe_entry->flags & context_t::DontAdvance)
|
||||||
|
)
|
||||||
|
)
|
||||||
|
)
|
||||||
|
&&
|
||||||
|
/* 3. */
|
||||||
|
!c->is_actionable (this, machine.get_entry (state, StateTableT::CLASS_END_OF_TEXT))
|
||||||
|
;
|
||||||
|
|
||||||
/* Unsafe-to-break if end-of-text would kick in here. */
|
if (!safe_to_break && buffer->backtrack_len () && buffer->idx < buffer->len)
|
||||||
if (buffer->backtrack_len () && buffer->idx < buffer->len)
|
buffer->unsafe_to_break_from_outbuffer (buffer->backtrack_len () - 1, buffer->idx + 1);
|
||||||
{
|
|
||||||
const Entry<EntryData> &end_entry = machine.get_entry (state, StateTableT::CLASS_END_OF_TEXT);
|
|
||||||
if (c->is_actionable (this, end_entry))
|
|
||||||
buffer->unsafe_to_break_from_outbuffer (buffer->backtrack_len () - 1, buffer->idx + 1);
|
|
||||||
}
|
|
||||||
|
|
||||||
c->transition (this, entry);
|
c->transition (this, entry);
|
||||||
|
|
||||||
state = machine.new_state (entry.newState);
|
state = next_state;
|
||||||
DEBUG_MSG (APPLY, nullptr, "s%d", state);
|
DEBUG_MSG (APPLY, nullptr, "s%d", state);
|
||||||
|
|
||||||
if (buffer->idx == buffer->len || unlikely (!buffer->successful))
|
if (buffer->idx == buffer->len || unlikely (!buffer->successful))
|
||||||
|
|
|
@ -1,3 +1,6 @@
|
||||||
|
# https://github.com/harfbuzz/harfbuzz/pull/2871
|
||||||
|
/System/Library/Fonts/LucidaGrande.ttc:--font-funcs ot --show-flags:U+0041,U+0042,U+0043,U+0044:[A=0+1413|B=1+1178|C=2+1417|D=3+1534]
|
||||||
|
|
||||||
# 10.12.6 https://gist.github.com/ebraminio/1704341fa16b06979e605aafd88198cf
|
# 10.12.6 https://gist.github.com/ebraminio/1704341fa16b06979e605aafd88198cf
|
||||||
/System/Library/Fonts/Helvetica.dfont@c7bec2785a4c402b7809b5e35337c3d24c18e281:--font-funcs ot:U+006D,U+0300:[m=0+1706|gravecmb=0@-284,10+0]
|
/System/Library/Fonts/Helvetica.dfont@c7bec2785a4c402b7809b5e35337c3d24c18e281:--font-funcs ot:U+006D,U+0300:[m=0+1706|gravecmb=0@-284,10+0]
|
||||||
/System/Library/Fonts/LucidaGrande.ttc@d89a9d7e57767bfe3b5a4cfd22bb1e9dbe03a062:--font-funcs ot:U+006D,U+0300:[mgrave=0+1912]
|
/System/Library/Fonts/LucidaGrande.ttc@d89a9d7e57767bfe3b5a4cfd22bb1e9dbe03a062:--font-funcs ot:U+006D,U+0300:[mgrave=0+1912]
|
||||||
|
|
|
@ -67,17 +67,18 @@ for filename in args:
|
||||||
if os.name == 'nt': # Skip on Windows
|
if os.name == 'nt': # Skip on Windows
|
||||||
continue
|
continue
|
||||||
|
|
||||||
fontfile, expected_hash = fontfile.split('@')
|
fontfile, expected_hash = (fontfile.split('@') + [''])[:2]
|
||||||
|
|
||||||
try:
|
try:
|
||||||
with open (fontfile, 'rb') as ff:
|
with open (fontfile, 'rb') as ff:
|
||||||
actual_hash = hashlib.sha1 (ff.read()).hexdigest ().strip ()
|
if expected_hash:
|
||||||
if actual_hash != expected_hash:
|
actual_hash = hashlib.sha1 (ff.read()).hexdigest ().strip ()
|
||||||
print ('different version of %s found; Expected hash %s, got %s; skipping.' %
|
if actual_hash != expected_hash:
|
||||||
(fontfile, expected_hash, actual_hash))
|
print ('different version of %s found; Expected hash %s, got %s; skipping.' %
|
||||||
skips += 1
|
(fontfile, expected_hash, actual_hash))
|
||||||
continue
|
skips += 1
|
||||||
except:
|
continue
|
||||||
|
except IOError:
|
||||||
print ('%s not found, skip.' % fontfile)
|
print ('%s not found, skip.' % fontfile)
|
||||||
skips += 1
|
skips += 1
|
||||||
continue
|
continue
|
||||||
|
|
Loading…
Reference in New Issue