Clean up some coverage files; a few accidentally included PUA values and
punctuation. Add debugging code to dump out the missing codepoints during
cache building when only a few are missing.
This commit is contained in:
Keith Packard 2002-07-12 21:06:03 +00:00
parent b4a2c1f012
commit c80d2ac486
21 changed files with 1067 additions and 1067 deletions

View File

@ -1,5 +1,5 @@
#
# $XFree86$
# $XFree86: xc/lib/fontconfig/fc-lang/bg.orth,v 1.2 2002/07/06 23:59:15 keithp Exp $
#
# Copyright © 2002 Keith Packard, member of The XFree86 Project, Inc.
#
@ -22,14 +22,15 @@
# PERFORMANCE OF THIS SOFTWARE.
#
# Bulgarian (BG)
0400
04ad
0400 # CYRILLIC CAPITAL LETTER IE WITH GRAVE
040d # CYRILLIC CAPITAL LETTER I WITH GRAVE
0410-042a
042c
042e-044a
042e-042f
0430-044a
044c
044e-044f
0450
045d
0450 # CYRILLIC SMALL LETTER IE WITH GRAVE
045d # CYRILLIC SMALL LETTER I WITH GRAVE
0462-0463
046a-046b

View File

@ -1,5 +1,5 @@
#
# $XFree86$
# $XFree86: xc/lib/fontconfig/fc-lang/bi.orth,v 1.1 2002/07/12 19:19:15 keithp Exp $
#
# Copyright © 2002 Keith Packard, member of The XFree86 Project, Inc.
#
@ -31,9 +31,9 @@
00e9
00cf
00ef
e000
e001
e002
e003
#e000 # LATIN CAPITAL LETTER M WITH MACRON (no UCS code)
#e001 # LATIN SMALL LETTER M WITH MACRON (no UCS code)
#e002 # LATIN CAPITAL LETTER P WITH MACRON (no UCS code)
#e003 # LATIN SMALL LETTER P WITH MACRON (no UCS code)
00dc
00fc

View File

@ -1,5 +1,5 @@
#
# $XFree86$
# $XFree86: xc/lib/fontconfig/fc-lang/bo.orth,v 1.1 2002/07/07 19:18:51 keithp Exp $
#
# Copyright © 2002 Keith Packard, member of The XFree86 Project, Inc.
#
@ -25,6 +25,15 @@
#
# Taken from the Unicode coverage of this language
#
0f00-0f47
0f49-0f6a
0f71-0f7f
0f40-0f47
0f49-0f69
0f71-0f76
0f78
0f7a-0f7d
0f80-0f81
0f90-0f97
0f99-0fb9
# Fixed-form subjoined consonants
# These characters are used only for transliteration and transcription.
#0fba-0fbc

View File

@ -1,5 +1,5 @@
#
# $XFree86$
# $XFree86: xc/lib/fontconfig/fc-lang/el.orth,v 1.2 2002/07/06 23:59:15 keithp Exp $
#
# Copyright © 2002 Keith Packard, member of The XFree86 Project, Inc.
#
@ -29,21 +29,3 @@
038c
038e-03a1
03a3-03ce
03d7
03da-03e1
#1f00-1f15 # only for polytonic orthography below...
#1f18-1f1d
#1f20-1f45
#1f48-1f4d
#1f50-1f57
#1f59
#1f5b
#1f5d
#1f5f-1f7d
#1f80-1fb4
#1fb6-1fc4
#1fc6-1fd3
#1fd6-1fdb
#1fdd-1fef
#1ff2-1ff4
#1ff6-1ffe

File diff suppressed because it is too large Load Diff

View File

@ -1,5 +1,5 @@
#
# $XFree86$
# $XFree86: xc/lib/fontconfig/fc-lang/ga.orth,v 1.2 2002/07/06 23:59:15 keithp Exp $
#
# Copyright © 2002 Keith Packard, member of The XFree86 Project, Inc.
#
@ -49,4 +49,4 @@
#1680-169c # Ogham
#2018-2019 # single quotes
#201c-201d # double quotes
204a # tironian sign et
#204a # tironian sign et

View File

@ -1,5 +1,5 @@
#
# $XFree86$
# $XFree86: xc/lib/fontconfig/fc-lang/gn.orth,v 1.1 2002/07/12 19:19:15 keithp Exp $
#
# Copyright © 2002 Keith Packard, member of The XFree86 Project, Inc.
#
@ -33,7 +33,7 @@
00c9
00e9
1ebd
e005
#e005 # LATIN SMALL LETTER G WITH TILDE (no UCS)
00cd
00ed
0129

View File

@ -1,5 +1,5 @@
#
# $XFree86$
# $XFree86: xc/lib/fontconfig/fc-lang/hy.orth,v 1.2 2002/07/06 23:59:15 keithp Exp $
#
# Copyright © 2002 Keith Packard, member of The XFree86 Project, Inc.
#
@ -23,6 +23,4 @@
#
# Armenian (HY)
0531-0556
055a-055f
0561-0586
0589-058a
0561-0587

View File

@ -1,5 +1,5 @@
#
# $XFree86$
# $XFree86: xc/lib/fontconfig/fc-lang/km.orth,v 1.1 2002/07/07 19:18:51 keithp Exp $
#
# Copyright © 2002 Keith Packard, member of The XFree86 Project, Inc.
#
@ -25,5 +25,5 @@
#
# Taken from the Unicode coverage of this language
#
1780-17dc
17e0-17e9
1780-17c5

View File

@ -1,5 +1,5 @@
#
# $XFree86$
# $XFree86: xc/lib/fontconfig/fc-lang/ko.orth,v 1.2 2002/07/06 23:59:16 keithp Exp $
#
# Copyright © 2002 Keith Packard, member of The XFree86 Project, Inc.
#
@ -22,9 +22,9 @@
# PERFORMANCE OF THIS SOFTWARE.
#
# Korean (KO)
0x3000 # IDEOGRAPHIC SPACE
0x3001 # IDEOGRAPHIC COMMA
0x3002 # IDEOGRAPHIC FULL STOP
#0x3000 # IDEOGRAPHIC SPACE
#0x3001 # IDEOGRAPHIC COMMA
#0x3002 # IDEOGRAPHIC FULL STOP
0x3131 # HANGUL LETTER KIYEOK
0x3132 # HANGUL LETTER SSANGKIYEOK
0x3133 # HANGUL LETTER KIYEOK-SIOS
@ -76,7 +76,7 @@
0x3161 # HANGUL LETTER EU
0x3162 # HANGUL LETTER YI
0x3163 # HANGUL LETTER I
0x3164 # HANGUL FILLER
#0x3164 # HANGUL FILLER
0x3165 # HANGUL LETTER SSANGNIEUN
0x3166 # HANGUL LETTER NIEUN-TIKEUT
0x3167 # HANGUL LETTER NIEUN-SIOS
@ -119,64 +119,64 @@
0x318C # HANGUL LETTER YU-I
0x318D # HANGUL LETTER ARAEA
0x318E # HANGUL LETTER ARAEAE
0x3200 # PARENTHESIZED HANGUL KIYEOK
0x3201 # PARENTHESIZED HANGUL NIEUN
0x3202 # PARENTHESIZED HANGUL TIKEUT
0x3203 # PARENTHESIZED HANGUL RIEUL
0x3204 # PARENTHESIZED HANGUL MIEUM
0x3205 # PARENTHESIZED HANGUL PIEUP
0x3206 # PARENTHESIZED HANGUL SIOS
0x3207 # PARENTHESIZED HANGUL IEUNG
0x3208 # PARENTHESIZED HANGUL CIEUC
0x3209 # PARENTHESIZED HANGUL CHIEUCH
0x320A # PARENTHESIZED HANGUL KHIEUKH
0x320B # PARENTHESIZED HANGUL THIEUTH
0x320C # PARENTHESIZED HANGUL PHIEUPH
0x320D # PARENTHESIZED HANGUL HIEUH
0x320E # PARENTHESIZED HANGUL KIYEOK A
0x320F # PARENTHESIZED HANGUL NIEUN A
0x3210 # PARENTHESIZED HANGUL TIKEUT A
0x3211 # PARENTHESIZED HANGUL RIEUL A
0x3212 # PARENTHESIZED HANGUL MIEUM A
0x3213 # PARENTHESIZED HANGUL PIEUP A
0x3214 # PARENTHESIZED HANGUL SIOS A
0x3215 # PARENTHESIZED HANGUL IEUNG A
0x3216 # PARENTHESIZED HANGUL CIEUC A
0x3217 # PARENTHESIZED HANGUL CHIEUCH A
0x3218 # PARENTHESIZED HANGUL KHIEUKH A
0x3219 # PARENTHESIZED HANGUL THIEUTH A
0x321A # PARENTHESIZED HANGUL PHIEUPH A
0x321B # PARENTHESIZED HANGUL HIEUH A
0x321C # PARENTHESIZED HANGUL CIEUC U
0x3260 # CIRCLED HANGUL KIYEOK
0x3261 # CIRCLED HANGUL NIEUN
0x3262 # CIRCLED HANGUL TIKEUT
0x3263 # CIRCLED HANGUL RIEUL
0x3264 # CIRCLED HANGUL MIEUM
0x3265 # CIRCLED HANGUL PIEUP
0x3266 # CIRCLED HANGUL SIOS
0x3267 # CIRCLED HANGUL IEUNG
0x3268 # CIRCLED HANGUL CIEUC
0x3269 # CIRCLED HANGUL CHIEUCH
0x326A # CIRCLED HANGUL KHIEUKH
0x326B # CIRCLED HANGUL THIEUTH
0x326C # CIRCLED HANGUL PHIEUPH
0x326D # CIRCLED HANGUL HIEUH
0x326E # CIRCLED HANGUL KIYEOK A
0x326F # CIRCLED HANGUL NIEUN A
0x3270 # CIRCLED HANGUL TIKEUT A
0x3271 # CIRCLED HANGUL RIEUL A
0x3272 # CIRCLED HANGUL MIEUM A
0x3273 # CIRCLED HANGUL PIEUP A
0x3274 # CIRCLED HANGUL SIOS A
0x3275 # CIRCLED HANGUL IEUNG A
0x3276 # CIRCLED HANGUL CIEUC A
0x3277 # CIRCLED HANGUL CHIEUCH A
0x3278 # CIRCLED HANGUL KHIEUKH A
0x3279 # CIRCLED HANGUL THIEUTH A
0x327A # CIRCLED HANGUL PHIEUPH A
0x327B # CIRCLED HANGUL HIEUH A
0x327F # KOREAN STANDARD SYMBOL
#0x3200 # PARENTHESIZED HANGUL KIYEOK
#0x3201 # PARENTHESIZED HANGUL NIEUN
#0x3202 # PARENTHESIZED HANGUL TIKEUT
#0x3203 # PARENTHESIZED HANGUL RIEUL
#0x3204 # PARENTHESIZED HANGUL MIEUM
#0x3205 # PARENTHESIZED HANGUL PIEUP
#0x3206 # PARENTHESIZED HANGUL SIOS
#0x3207 # PARENTHESIZED HANGUL IEUNG
#0x3208 # PARENTHESIZED HANGUL CIEUC
#0x3209 # PARENTHESIZED HANGUL CHIEUCH
#0x320A # PARENTHESIZED HANGUL KHIEUKH
#0x320B # PARENTHESIZED HANGUL THIEUTH
#0x320C # PARENTHESIZED HANGUL PHIEUPH
#0x320D # PARENTHESIZED HANGUL HIEUH
#0x320E # PARENTHESIZED HANGUL KIYEOK A
#0x320F # PARENTHESIZED HANGUL NIEUN A
#0x3210 # PARENTHESIZED HANGUL TIKEUT A
#0x3211 # PARENTHESIZED HANGUL RIEUL A
#0x3212 # PARENTHESIZED HANGUL MIEUM A
#0x3213 # PARENTHESIZED HANGUL PIEUP A
#0x3214 # PARENTHESIZED HANGUL SIOS A
#0x3215 # PARENTHESIZED HANGUL IEUNG A
#0x3216 # PARENTHESIZED HANGUL CIEUC A
#0x3217 # PARENTHESIZED HANGUL CHIEUCH A
#0x3218 # PARENTHESIZED HANGUL KHIEUKH A
#0x3219 # PARENTHESIZED HANGUL THIEUTH A
#0x321A # PARENTHESIZED HANGUL PHIEUPH A
#0x321B # PARENTHESIZED HANGUL HIEUH A
#0x321C # PARENTHESIZED HANGUL CIEUC U
#0x3260 # CIRCLED HANGUL KIYEOK
#0x3261 # CIRCLED HANGUL NIEUN
#0x3262 # CIRCLED HANGUL TIKEUT
#0x3263 # CIRCLED HANGUL RIEUL
#0x3264 # CIRCLED HANGUL MIEUM
#0x3265 # CIRCLED HANGUL PIEUP
#0x3266 # CIRCLED HANGUL SIOS
#0x3267 # CIRCLED HANGUL IEUNG
#0x3268 # CIRCLED HANGUL CIEUC
#0x3269 # CIRCLED HANGUL CHIEUCH
#0x326A # CIRCLED HANGUL KHIEUKH
#0x326B # CIRCLED HANGUL THIEUTH
#0x326C # CIRCLED HANGUL PHIEUPH
#0x326D # CIRCLED HANGUL HIEUH
#0x326E # CIRCLED HANGUL KIYEOK A
#0x326F # CIRCLED HANGUL NIEUN A
#0x3270 # CIRCLED HANGUL TIKEUT A
#0x3271 # CIRCLED HANGUL RIEUL A
#0x3272 # CIRCLED HANGUL MIEUM A
#0x3273 # CIRCLED HANGUL PIEUP A
#0x3274 # CIRCLED HANGUL SIOS A
#0x3275 # CIRCLED HANGUL IEUNG A
#0x3276 # CIRCLED HANGUL CIEUC A
#0x3277 # CIRCLED HANGUL CHIEUCH A
#0x3278 # CIRCLED HANGUL KHIEUKH A
#0x3279 # CIRCLED HANGUL THIEUTH A
#0x327A # CIRCLED HANGUL PHIEUPH A
#0x327B # CIRCLED HANGUL HIEUH A
#0x327F # KOREAN STANDARD SYMBOL
0x4E00 # <CJK>
0x4E01 # <CJK>
0x4E03 # <CJK>
@ -16237,4 +16237,4 @@
0xFA09 # <CJK>
0xFA0A # <CJK>
0xFA0B # <CJK>
0xFFE6 # FULLWIDTH WON SIGN
#0xFFE6 # FULLWIDTH WON SIGN

View File

@ -1,5 +1,5 @@
#
# $XFree86$
# $XFree86: xc/lib/fontconfig/fc-lang/lb.orth,v 1.1 2002/07/12 19:19:15 keithp Exp $
#
# Copyright © 2002 Keith Packard, member of The XFree86 Project, Inc.
#
@ -21,7 +21,7 @@
# TORTIOUS ACTION, ARISING OUT OF OR IN CONNECTION WITH THE USE OR
# PERFORMANCE OF THIS SOFTWARE.
#
# Hawaiian (HAW)
# Luxembourgish (Letzeburgesch) (LB)
#
# Orthography from http://www.eki.ee/letter
#
@ -51,8 +51,10 @@
00ea
00ce
00ee
e006-e007
e008-e009
#e006 # LATIN CAPITAL LETTER M WITH CIRCUMFLEX (no UCS)
#e007 # LATIN SMALL LETTER M WITH CIRCUMFLEX (no UCS)
#e008 # LATIN CAPITAL LETTER N WITH CIRCUMFLEX (no UCS)
#e009 # LATIN SMALL LETTER N WITH CIRCUMFLEX (no UCS)
00d4
00f4
00db

View File

@ -1,5 +1,5 @@
#
# $XFree86$
# $XFree86: xc/lib/fontconfig/fc-lang/mg.orth,v 1.1 2002/07/12 19:19:15 keithp Exp $
#
# Copyright © 2002 Keith Packard, member of The XFree86 Project, Inc.
#
@ -29,7 +29,7 @@
0061-007a
00c1
00e1
e010
e011
#e010 # LATIN CAPITAL LETTER N WITH DIAERESIS
#e011 # LATIN SMALL LETTER N WITH DIAERESIS
00d4
00f4

View File

@ -1,5 +1,5 @@
#
# $XFree86$
# $XFree86: xc/lib/fontconfig/fc-lang/mh.orth,v 1.1 2002/07/12 19:19:15 keithp Exp $
#
# Copyright © 2002 Keith Packard, member of The XFree86 Project, Inc.
#
@ -31,15 +31,15 @@
0101
013b
013c
e00a
e00b
e00c
e00d
#e00a # LATIN CAPITAL LETTER M WITH CEDILLA (no UCS)
#e00b # LATIN SMALL LETTER M WITH CEDILLA (no UCS)
#e00c # LATIN CAPITAL LETTER N WITH MACRON (no UCS)
#e00d # LATIN SMALL LETTER N WITH MACRON (no UCS)
0145
0146
014c
014d
e00e
e00f
#e00e # LATIN CAPITAL LETTER O WITH CEDILLA (no UCS)
#e00f # LATIN SMALL LETTER O WITH CEDILLA (no UCS)
016a
016b

View File

@ -1,5 +1,5 @@
#
# $XFree86$
# $XFree86: xc/lib/fontconfig/fc-lang/mk.orth,v 1.2 2002/07/06 23:59:17 keithp Exp $
#
# Copyright © 2002 Keith Packard, member of The XFree86 Project, Inc.
#
@ -22,17 +22,19 @@
# PERFORMANCE OF THIS SOFTWARE.
#
# Macedonian (MK)
0400
0400 # CYRILLIC CAPITAL LETTER IE WITH GRAVE
0403
0405
0408-040a
040c-040d
040c
040d # CYRILLIC CAPITAL LETTER I WITH GRAVE
040f
0410-0418
041a-0428
0450
0450 # CYRILLIC SMALL LETTER IE WITH GRAVE
0453
0455
0458-045a
045c-045d
045c
045d # CYRILLIC SMALL LETTER I WITH GRAVE
045f

View File

@ -1,5 +1,5 @@
#
# $XFree86$
# $XFree86: xc/lib/fontconfig/fc-lang/mn.orth,v 1.1 2002/07/07 19:18:51 keithp Exp $
#
# Copyright © 2002 Keith Packard, member of The XFree86 Project, Inc.
#
@ -25,7 +25,13 @@
#
# Taken from the Unicode coverage of this language
#
1800-180a
1810-1819
1820-1877
# Basic letters
1820-1842
# Todo letters
1843-185c
# Sibe letters
185d-1872
# Manchu letters
1873-1877
# Extensions for Sanskrit and Tibetan
1880-18a9

View File

@ -1,5 +1,5 @@
#
# $XFree86$
# $XFree86: xc/lib/fontconfig/fc-lang/mo.orth,v 1.2 2002/07/06 23:59:17 keithp Exp $
#
# Copyright © 2002 Keith Packard, member of The XFree86 Project, Inc.
#
@ -29,7 +29,7 @@
00e2
00ee
0102-0103
0218-021b
0218-021b # Comma below forms (preferred over cedilla)
0401
0410-044f
0451

View File

@ -1,5 +1,5 @@
#
# $XFree86$
# $XFree86: xc/lib/fontconfig/fc-lang/ro.orth,v 1.2 2002/07/06 23:59:19 keithp Exp $
#
# Copyright © 2002 Keith Packard, member of The XFree86 Project, Inc.
#
@ -29,6 +29,6 @@
00e2
00ee
0102-0103
0218-021b
0218-021b # comma-below forms (preferred over cedilla)
#2019-201a # single quotes
#201d-201e # double quotes

View File

@ -1,5 +1,5 @@
#
# $XFree86$
# $XFree86: xc/lib/fontconfig/fc-lang/si.orth,v 1.1 2002/07/07 19:18:51 keithp Exp $
#
# Copyright © 2002 Keith Packard, member of The XFree86 Project, Inc.
#
@ -25,14 +25,16 @@
#
# Taken from the Unicode coverage of this language
#
0d82-0d83
# Independent vowels
0d85-0d96
# Consonants
0d9a-0db1
0db3-0dbb
0dbd
0dc0-0dc6
0dca
# Dependent vowel signs
0dcf-0dd4
0dd6
0dd8-0ddf
# Additional dependent vowel signs
0df2-0df4

View File

@ -1,5 +1,5 @@
#
# $XFree86$
# $XFree86: xc/lib/fontconfig/fc-lang/tl.orth,v 1.1 2002/07/07 19:18:51 keithp Exp $
#
# Copyright © 2002 Keith Packard, member of The XFree86 Project, Inc.
#
@ -25,5 +25,10 @@
#
# Taken from the Unicode coverage of this language
#
1700-170c
170e-1714
# Independent vowels
1700-1702
# Consonants
1703-170c
170e-1711
# Dependent vowel signs
1712-1713

View File

@ -1,5 +1,5 @@
#
# $XFree86$
# $XFree86: xc/lib/fontconfig/fc-lang/yo.orth,v 1.1 2002/07/12 19:19:16 keithp Exp $
#
# Copyright © 2002 Keith Packard, member of The XFree86 Project, Inc.
#
@ -28,59 +28,59 @@
0041-005a
0061-007a
00c0
00e0
00c1
00e1
00c2
00e2
01cd-01ce
00c3
00c8
00e8
00c9
00e9
00ca
00cc
00cd
00ce
00d2
00d3
00d4
00d5
00d9
00da
00db
00e0
00e1
00e2
00e3
00e8
00e9
00ea
00ec
00ed
00ee
00f2
00f3
00f4
00f5
00f9
00fa
00fb
011a-011b
1eb8-1eb9
0128-0129
0143-0144
0168-0169
01cd-01ce
01cf-01d0
01d1-01d2
01d3-01d4
01f8-01f9 # LATIN LETTER N WITH GRAVE
0300
0301
0302
0303
030c
00cc
00ec
00cd
00ed
00ce
00ee
01cf-01d0
1e3e-1e3f
# LATIN CAPITAL LETTER M WITH MACRON (no UCS code)
# LATIN SMALL LETTER M WITH MACRON (no UCS code)
01f8-01f9
0143-0144
# LATIN CAPITAL LETTER N WITH MACRON (no UCS code)
# LATIN SMALL LETTER N WITH MACRON (no UCS code)
00d2
00f2
00d3
00f3
00d4
00f4
01d1-01d2
1ecc-1ecd
1e62-1e63
00d9
00f9
00da
00fa
00db
00fb
01d3-01d4
00c3
00e3
1eb8-1eb9
1ebc-1ebd
0128-0129
00d5
00f5
0168-0169
1ecc-1ecd
# LATIN CAPITAL LETTER M WITH MACRON (no UCS code)
# LATIN CAPITAL LETTER N WITH MACRON (no UCS code)
# LATIN SMALL LETTER M WITH MACRON (no UCS code)
# LATIN SMALL LETTER N WITH MACRON (no UCS code)

View File

@ -1,5 +1,5 @@
/*
* $XFree86: xc/lib/fontconfig/fc-lang/fclang.tmpl.c,v 1.1 2002/07/06 23:21:36 keithp Exp $
* $XFree86: xc/lib/fontconfig/src/fclang.c,v 1.3 2002/07/08 07:31:53 keithp Exp $
*
* Copyright © 2002 Keith Packard, member of The XFree86 Project, Inc.
*
@ -60,7 +60,36 @@ FcFreeTypeSetLang (FcPattern *pattern,
}
missing = FcCharSetSubtractCount (&fcLangCharSets[i].charset, charset);
if (FcDebug() & FC_DBG_SCANV)
printf ("%s(%d) ", fcLangCharSets[i].lang, missing);
{
if (missing && missing < 10)
{
FcCharSet *missed = FcCharSetSubtract (&fcLangCharSets[i].charset,
charset);
FcChar32 ucs4;
FcChar32 map[FC_CHARSET_MAP_SIZE];
FcChar32 next;
printf ("\n%s(%d) ", fcLangCharSets[i].lang, missing);
printf ("{");
for (ucs4 = FcCharSetFirstPage (missed, map, &next);
ucs4 != FC_CHARSET_DONE;
ucs4 = FcCharSetNextPage (missed, map, &next))
{
int i, j;
for (i = 0; i < FC_CHARSET_MAP_SIZE; i++)
if (map[i])
{
for (j = 0; j < 32; j++)
if (map[i] & (1 << j))
printf (" %04x", ucs4 + i * 32 + j);
}
}
printf (" }\n\t");
FcCharSetDestroy (missed);
}
else
printf ("%s(%d) ", fcLangCharSets[i].lang, missing);
}
if (!missing)
{
if (!FcPatternAddString (pattern, FC_LANG, fcLangCharSets[i].lang))