[tools] Print unicode links on gen-* tools output
As per Behdad's review.
This commit is contained in:
parent
4dc87365d7
commit
6a390df8af
|
@ -1,16 +1,17 @@
|
||||||
#!/usr/bin/env python
|
#!/usr/bin/env python
|
||||||
|
|
||||||
# Input files:
|
|
||||||
# - https://unicode.org/Public/12.0.0/ucd/ArabicShaping.txt
|
|
||||||
# - https://unicode.org/Public/12.0.0/ucd/UnicodeData.txt
|
|
||||||
# - https://unicode.org/Public/12.0.0/ucd/Blocks.txt
|
|
||||||
|
|
||||||
from __future__ import print_function, division, absolute_import
|
from __future__ import print_function, division, absolute_import
|
||||||
|
|
||||||
import io, os.path, sys
|
import io, os.path, sys
|
||||||
|
|
||||||
if len (sys.argv) != 4:
|
if len (sys.argv) != 4:
|
||||||
print ("usage: ./gen-arabic-table.py ArabicShaping.txt UnicodeData.txt Blocks.txt", file=sys.stderr)
|
print ("""usage: ./gen-arabic-table.py ArabicShaping.txt UnicodeData.txt Blocks.txt
|
||||||
|
|
||||||
|
Input files, as of Unicode 12:
|
||||||
|
* https://unicode.org/Public/UCD/latest/ucd/ArabicShaping.txt
|
||||||
|
* https://unicode.org/Public/UCD/latest/ucd/UnicodeData.txt
|
||||||
|
* https://unicode.org/Public/UCD/latest/ucd/Blocks.txt
|
||||||
|
""", file=sys.stderr)
|
||||||
sys.exit (1)
|
sys.exit (1)
|
||||||
|
|
||||||
files = [io.open (x, encoding='utf-8') for x in sys.argv[1:]]
|
files = [io.open (x, encoding='utf-8') for x in sys.argv[1:]]
|
||||||
|
|
|
@ -1,7 +1,5 @@
|
||||||
#!/usr/bin/python
|
#!/usr/bin/python
|
||||||
|
|
||||||
# Input file: https://www.unicode.org/Public/emoji/12.0/emoji-data.txt
|
|
||||||
|
|
||||||
from __future__ import print_function, division, absolute_import
|
from __future__ import print_function, division, absolute_import
|
||||||
import sys
|
import sys
|
||||||
import os.path
|
import os.path
|
||||||
|
@ -9,7 +7,10 @@ from collections import OrderedDict
|
||||||
import packTab
|
import packTab
|
||||||
|
|
||||||
if len (sys.argv) != 2:
|
if len (sys.argv) != 2:
|
||||||
print("usage: ./gen-emoji-table.py emoji-data.txt", file=sys.stderr)
|
print("""usage: ./gen-emoji-table.py emoji-data.txt
|
||||||
|
|
||||||
|
Input file, as of Unicode 12:
|
||||||
|
* https://www.unicode.org/Public/emoji/12.0/emoji-data.txt""", file=sys.stderr)
|
||||||
sys.exit (1)
|
sys.exit (1)
|
||||||
|
|
||||||
f = open(sys.argv[1])
|
f = open(sys.argv[1])
|
||||||
|
|
|
@ -1,16 +1,16 @@
|
||||||
#!/usr/bin/env python
|
#!/usr/bin/env python
|
||||||
|
|
||||||
# Input files:
|
|
||||||
# - https://unicode.org/Public/12.0.0/ucd/IndicSyllabicCategory.txt
|
|
||||||
# - https://unicode.org/Public/12.0.0/ucd/IndicPositionalCategory.txt
|
|
||||||
# - https://unicode.org/Public/12.0.0/ucd/Blocks.txt
|
|
||||||
|
|
||||||
from __future__ import print_function, division, absolute_import
|
from __future__ import print_function, division, absolute_import
|
||||||
|
|
||||||
import io, sys
|
import io, sys
|
||||||
|
|
||||||
if len (sys.argv) != 4:
|
if len (sys.argv) != 4:
|
||||||
print ("usage: ./gen-indic-table.py IndicSyllabicCategory.txt IndicPositionalCategory.txt Blocks.txt", file=sys.stderr)
|
print ("""usage: ./gen-indic-table.py IndicSyllabicCategory.txt IndicPositionalCategory.txt Blocks.txt
|
||||||
|
|
||||||
|
Input files, as of Unicode 12:
|
||||||
|
* https://unicode.org/Public/UCD/latest/ucd/IndicSyllabicCategory.txt
|
||||||
|
* https://unicode.org/Public/UCD/latest/ucd/IndicPositionalCategory.txt
|
||||||
|
* https://unicode.org/Public/UCD/latest/ucd/Blocks.txt""", file=sys.stderr)
|
||||||
sys.exit (1)
|
sys.exit (1)
|
||||||
|
|
||||||
ALLOWED_SINGLES = [0x00A0, 0x25CC]
|
ALLOWED_SINGLES = [0x00A0, 0x25CC]
|
||||||
|
|
|
@ -1,7 +1,5 @@
|
||||||
#!/usr/bin/env python
|
#!/usr/bin/env python
|
||||||
|
|
||||||
# Input file: http://unicode.org/Public/UCD/latest/ucdxml/ucd.nounihan.grouped.zip
|
|
||||||
|
|
||||||
from __future__ import print_function, division, absolute_import
|
from __future__ import print_function, division, absolute_import
|
||||||
|
|
||||||
import io, os.path, sys, re
|
import io, os.path, sys, re
|
||||||
|
@ -9,7 +7,10 @@ import logging
|
||||||
logging.basicConfig(format='%(levelname)s: %(message)s', level=logging.INFO)
|
logging.basicConfig(format='%(levelname)s: %(message)s', level=logging.INFO)
|
||||||
|
|
||||||
if len (sys.argv) not in (2, 3):
|
if len (sys.argv) not in (2, 3):
|
||||||
print("usage: ./gen-ucd-table ucd.nounihan.grouped.xml [/path/to/hb-common.h]", file=sys.stderr)
|
print("""usage: ./gen-ucd-table ucd.nounihan.grouped.xml [/path/to/hb-common.h]
|
||||||
|
|
||||||
|
Input file, as of Unicode 12:
|
||||||
|
* https://unicode.org/Public/UCD/latest/ucdxml/ucd.nounihan.grouped.zip""", file=sys.stderr)
|
||||||
sys.exit(1)
|
sys.exit(1)
|
||||||
|
|
||||||
# https://github.com/harfbuzz/packtab
|
# https://github.com/harfbuzz/packtab
|
||||||
|
|
|
@ -1,19 +1,19 @@
|
||||||
#!/usr/bin/env python
|
#!/usr/bin/env python
|
||||||
# flake8: noqa
|
# flake8: noqa
|
||||||
|
|
||||||
# Input files:
|
|
||||||
# - https://unicode.org/Public/12.0.0/ucd/IndicSyllabicCategory.txt
|
|
||||||
# - https://unicode.org/Public/12.0.0/ucd/IndicPositionalCategory.txt
|
|
||||||
# - https://unicode.org/Public/12.0.0/ucd/UnicodeData.txt
|
|
||||||
# - https://unicode.org/Public/12.0.0/ucd/Blocks.txt
|
|
||||||
|
|
||||||
from __future__ import print_function, division, absolute_import
|
from __future__ import print_function, division, absolute_import
|
||||||
|
|
||||||
import io
|
import io
|
||||||
import sys
|
import sys
|
||||||
|
|
||||||
if len (sys.argv) != 5:
|
if len (sys.argv) != 5:
|
||||||
print ("usage: ./gen-use-table.py IndicSyllabicCategory.txt IndicPositionalCategory.txt UnicodeData.txt Blocks.txt", file=sys.stderr)
|
print ("""usage: ./gen-use-table.py IndicSyllabicCategory.txt IndicPositionalCategory.txt UnicodeData.txt Blocks.txt
|
||||||
|
|
||||||
|
Input files, as of Unicode 12:
|
||||||
|
* https://unicode.org/Public/UCD/latest/ucd/IndicSyllabicCategory.txt
|
||||||
|
* https://unicode.org/Public/UCD/latest/ucd/IndicPositionalCategory.txt
|
||||||
|
* https://unicode.org/Public/UCD/latest/ucd/UnicodeData.txt
|
||||||
|
* https://unicode.org/Public/UCD/latest/ucd/Blocks.txt""", file=sys.stderr)
|
||||||
sys.exit (1)
|
sys.exit (1)
|
||||||
|
|
||||||
BLACKLISTED_BLOCKS = ["Thai", "Lao"]
|
BLACKLISTED_BLOCKS = ["Thai", "Lao"]
|
||||||
|
|
|
@ -7,7 +7,6 @@ circles into sequences prohibited by the USE script development spec.
|
||||||
This function should be used as the ``preprocess_text`` of an
|
This function should be used as the ``preprocess_text`` of an
|
||||||
``hb_ot_complex_shaper_t``.
|
``hb_ot_complex_shaper_t``.
|
||||||
|
|
||||||
Input file: https://unicode.org/Public/12.0.0/ucd/Scripts.txt
|
|
||||||
"""
|
"""
|
||||||
|
|
||||||
from __future__ import absolute_import, division, print_function, unicode_literals
|
from __future__ import absolute_import, division, print_function, unicode_literals
|
||||||
|
@ -27,7 +26,10 @@ import io
|
||||||
import sys
|
import sys
|
||||||
|
|
||||||
if len (sys.argv) != 3:
|
if len (sys.argv) != 3:
|
||||||
print ('usage: ./gen-vowel-constraints.py ms-use/IndicShapingInvalidCluster.txt Scripts.txt', file=sys.stderr)
|
print ("""usage: ./gen-vowel-constraints.py ms-use/IndicShapingInvalidCluster.txt Scripts.txt
|
||||||
|
|
||||||
|
Input file, as of Unicode 12:
|
||||||
|
* https://unicode.org/Public/UCD/latest/ucd/Scripts.txt""", file=sys.stderr)
|
||||||
sys.exit (1)
|
sys.exit (1)
|
||||||
|
|
||||||
with io.open (sys.argv[2], encoding='utf-8') as f:
|
with io.open (sys.argv[2], encoding='utf-8') as f:
|
||||||
|
|
Loading…
Reference in New Issue