Commit c80d2ac4 authored by Keith Packard

Clean up some coverage files; a few accidentally included PUA values and
punctuation. Add debugging output to dump the missing codepoints during
cache building when only a few are missing.
parent b4a2c1f0
#
# $XFree86$
# $XFree86: xc/lib/fontconfig/fc-lang/bg.orth,v 1.2 2002/07/06 23:59:15 keithp Exp $
#
# Copyright © 2002 Keith Packard, member of The XFree86 Project, Inc.
#
......@@ -22,14 +22,15 @@
# PERFORMANCE OF THIS SOFTWARE.
#
# Bulgarian (BG)
0400
04ad
0400 # CYRILLIC CAPITAL LETTER IE WITH GRAVE
040d # CYRILLIC CAPITAL LETTER I WITH GRAVE
0410-042a
042c
042e-044a
042e-042f
0430-044a
044c
044e-044f
0450
045d
0450 # CYRILLIC SMALL LETTER IE WITH GRAVE
045d # CYRILLIC SMALL LETTER I WITH GRAVE
0462-0463
046a-046b
#
# $XFree86$
# $XFree86: xc/lib/fontconfig/fc-lang/bi.orth,v 1.1 2002/07/12 19:19:15 keithp Exp $
#
# Copyright © 2002 Keith Packard, member of The XFree86 Project, Inc.
#
......@@ -31,9 +31,9 @@
00e9
00cf
00ef
e000
e001
e002
e003
#e000 # LATIN CAPITAL LETTER M WITH MACRON (no UCS code)
#e001 # LATIN SMALL LETTER M WITH MACRON (no UCS code)
#e002 # LATIN CAPITAL LETTER P WITH MACRON (no UCS code)
#e003 # LATIN SMALL LETTER P WITH MACRON (no UCS code)
00dc
00fc
#
# $XFree86$
# $XFree86: xc/lib/fontconfig/fc-lang/bo.orth,v 1.1 2002/07/07 19:18:51 keithp Exp $
#
# Copyright © 2002 Keith Packard, member of The XFree86 Project, Inc.
#
......@@ -25,6 +25,15 @@
#
# Taken from the Unicode coverage of this language
#
0f00-0f47
0f49-0f6a
0f71-0f7f
0f40-0f47
0f49-0f69
0f71-0f76
0f78
0f7a-0f7d
0f80-0f81
0f90-0f97
0f99-0fb9
# Fixed-form subjoined consonants
# These characters are used only for transliteration and transcription.
#0fba-0fbc
#
# $XFree86$
# $XFree86: xc/lib/fontconfig/fc-lang/el.orth,v 1.2 2002/07/06 23:59:15 keithp Exp $
#
# Copyright © 2002 Keith Packard, member of The XFree86 Project, Inc.
#
......@@ -29,21 +29,3 @@
038c
038e-03a1
03a3-03ce
03d7
03da-03e1
#1f00-1f15 # only for polytonic orthography below...
#1f18-1f1d
#1f20-1f45
#1f48-1f4d
#1f50-1f57
#1f59
#1f5b
#1f5d
#1f5f-1f7d
#1f80-1fb4
#1fb6-1fc4
#1fc6-1fd3
#1fd6-1fdb
#1fdd-1fef
#1ff2-1ff4
#1ff6-1ffe
This source diff could not be displayed because it is too large. You can view the blob instead.
#
# $XFree86$
# $XFree86: xc/lib/fontconfig/fc-lang/ga.orth,v 1.2 2002/07/06 23:59:15 keithp Exp $
#
# Copyright © 2002 Keith Packard, member of The XFree86 Project, Inc.
#
......@@ -49,4 +49,4 @@
#1680-169c # Ogham
#2018-2019 # single quotes
#201c-201d # double quotes
204a # tironian sign et
#204a # tironian sign et
#
# $XFree86$
# $XFree86: xc/lib/fontconfig/fc-lang/gn.orth,v 1.1 2002/07/12 19:19:15 keithp Exp $
#
# Copyright © 2002 Keith Packard, member of The XFree86 Project, Inc.
#
......@@ -33,7 +33,7 @@
00c9
00e9
1ebd
e005
#e005 # LATIN SMALL LETTER G WITH TILDE (no UCS)
00cd
00ed
0129
......
#
# $XFree86$
# $XFree86: xc/lib/fontconfig/fc-lang/hy.orth,v 1.2 2002/07/06 23:59:15 keithp Exp $
#
# Copyright © 2002 Keith Packard, member of The XFree86 Project, Inc.
#
......@@ -23,6 +23,4 @@
#
# Armenian (HY)
0531-0556
055a-055f
0561-0586
0589-058a
0561-0587
#
# $XFree86$
# $XFree86: xc/lib/fontconfig/fc-lang/km.orth,v 1.1 2002/07/07 19:18:51 keithp Exp $
#
# Copyright © 2002 Keith Packard, member of The XFree86 Project, Inc.
#
......@@ -25,5 +25,5 @@
#
# Taken from the Unicode coverage of this language
#
1780-17dc
17e0-17e9
1780-17c5
#
# $XFree86$
# $XFree86: xc/lib/fontconfig/fc-lang/ko.orth,v 1.2 2002/07/06 23:59:16 keithp Exp $
#
# Copyright 2002 Keith Packard, member of The XFree86 Project, Inc.
#
......@@ -22,9 +22,9 @@
# PERFORMANCE OF THIS SOFTWARE.
#
# Korean (KO)
0x3000 # IDEOGRAPHIC SPACE
0x3001 # IDEOGRAPHIC COMMA
0x3002 # IDEOGRAPHIC FULL STOP
#0x3000 # IDEOGRAPHIC SPACE
#0x3001 # IDEOGRAPHIC COMMA
#0x3002 # IDEOGRAPHIC FULL STOP
0x3131 # HANGUL LETTER KIYEOK
0x3132 # HANGUL LETTER SSANGKIYEOK
0x3133 # HANGUL LETTER KIYEOK-SIOS
......@@ -76,7 +76,7 @@
0x3161 # HANGUL LETTER EU
0x3162 # HANGUL LETTER YI
0x3163 # HANGUL LETTER I
0x3164 # HANGUL FILLER
#0x3164 # HANGUL FILLER
0x3165 # HANGUL LETTER SSANGNIEUN
0x3166 # HANGUL LETTER NIEUN-TIKEUT
0x3167 # HANGUL LETTER NIEUN-SIOS
......@@ -119,64 +119,64 @@
0x318C # HANGUL LETTER YU-I
0x318D # HANGUL LETTER ARAEA
0x318E # HANGUL LETTER ARAEAE
0x3200 # PARENTHESIZED HANGUL KIYEOK
0x3201 # PARENTHESIZED HANGUL NIEUN
0x3202 # PARENTHESIZED HANGUL TIKEUT
0x3203 # PARENTHESIZED HANGUL RIEUL
0x3204 # PARENTHESIZED HANGUL MIEUM
0x3205 # PARENTHESIZED HANGUL PIEUP
0x3206 # PARENTHESIZED HANGUL SIOS
0x3207 # PARENTHESIZED HANGUL IEUNG
0x3208 # PARENTHESIZED HANGUL CIEUC
0x3209 # PARENTHESIZED HANGUL CHIEUCH
0x320A # PARENTHESIZED HANGUL KHIEUKH
0x320B # PARENTHESIZED HANGUL THIEUTH
0x320C # PARENTHESIZED HANGUL PHIEUPH
0x320D # PARENTHESIZED HANGUL HIEUH
0x320E # PARENTHESIZED HANGUL KIYEOK A
0x320F # PARENTHESIZED HANGUL NIEUN A
0x3210 # PARENTHESIZED HANGUL TIKEUT A
0x3211 # PARENTHESIZED HANGUL RIEUL A
0x3212 # PARENTHESIZED HANGUL MIEUM A
0x3213 # PARENTHESIZED HANGUL PIEUP A
0x3214 # PARENTHESIZED HANGUL SIOS A
0x3215 # PARENTHESIZED HANGUL IEUNG A
0x3216 # PARENTHESIZED HANGUL CIEUC A
0x3217 # PARENTHESIZED HANGUL CHIEUCH A
0x3218 # PARENTHESIZED HANGUL KHIEUKH A
0x3219 # PARENTHESIZED HANGUL THIEUTH A
0x321A # PARENTHESIZED HANGUL PHIEUPH A
0x321B # PARENTHESIZED HANGUL HIEUH A
0x321C # PARENTHESIZED HANGUL CIEUC U
0x3260 # CIRCLED HANGUL KIYEOK
0x3261 # CIRCLED HANGUL NIEUN
0x3262 # CIRCLED HANGUL TIKEUT
0x3263 # CIRCLED HANGUL RIEUL
0x3264 # CIRCLED HANGUL MIEUM
0x3265 # CIRCLED HANGUL PIEUP
0x3266 # CIRCLED HANGUL SIOS
0x3267 # CIRCLED HANGUL IEUNG
0x3268 # CIRCLED HANGUL CIEUC
0x3269 # CIRCLED HANGUL CHIEUCH
0x326A # CIRCLED HANGUL KHIEUKH
0x326B # CIRCLED HANGUL THIEUTH
0x326C # CIRCLED HANGUL PHIEUPH
0x326D # CIRCLED HANGUL HIEUH
0x326E # CIRCLED HANGUL KIYEOK A
0x326F # CIRCLED HANGUL NIEUN A
0x3270 # CIRCLED HANGUL TIKEUT A
0x3271 # CIRCLED HANGUL RIEUL A
0x3272 # CIRCLED HANGUL MIEUM A
0x3273 # CIRCLED HANGUL PIEUP A
0x3274 # CIRCLED HANGUL SIOS A
0x3275 # CIRCLED HANGUL IEUNG A
0x3276 # CIRCLED HANGUL CIEUC A
0x3277 # CIRCLED HANGUL CHIEUCH A
0x3278 # CIRCLED HANGUL KHIEUKH A
0x3279 # CIRCLED HANGUL THIEUTH A
0x327A # CIRCLED HANGUL PHIEUPH A
0x327B # CIRCLED HANGUL HIEUH A
0x327F # KOREAN STANDARD SYMBOL
#0x3200 # PARENTHESIZED HANGUL KIYEOK
#0x3201 # PARENTHESIZED HANGUL NIEUN
#0x3202 # PARENTHESIZED HANGUL TIKEUT
#0x3203 # PARENTHESIZED HANGUL RIEUL
#0x3204 # PARENTHESIZED HANGUL MIEUM
#0x3205 # PARENTHESIZED HANGUL PIEUP
#0x3206 # PARENTHESIZED HANGUL SIOS
#0x3207 # PARENTHESIZED HANGUL IEUNG
#0x3208 # PARENTHESIZED HANGUL CIEUC
#0x3209 # PARENTHESIZED HANGUL CHIEUCH
#0x320A # PARENTHESIZED HANGUL KHIEUKH
#0x320B # PARENTHESIZED HANGUL THIEUTH
#0x320C # PARENTHESIZED HANGUL PHIEUPH
#0x320D # PARENTHESIZED HANGUL HIEUH
#0x320E # PARENTHESIZED HANGUL KIYEOK A
#0x320F # PARENTHESIZED HANGUL NIEUN A
#0x3210 # PARENTHESIZED HANGUL TIKEUT A
#0x3211 # PARENTHESIZED HANGUL RIEUL A
#0x3212 # PARENTHESIZED HANGUL MIEUM A
#0x3213 # PARENTHESIZED HANGUL PIEUP A
#0x3214 # PARENTHESIZED HANGUL SIOS A
#0x3215 # PARENTHESIZED HANGUL IEUNG A
#0x3216 # PARENTHESIZED HANGUL CIEUC A
#0x3217 # PARENTHESIZED HANGUL CHIEUCH A
#0x3218 # PARENTHESIZED HANGUL KHIEUKH A
#0x3219 # PARENTHESIZED HANGUL THIEUTH A
#0x321A # PARENTHESIZED HANGUL PHIEUPH A
#0x321B # PARENTHESIZED HANGUL HIEUH A
#0x321C # PARENTHESIZED HANGUL CIEUC U
#0x3260 # CIRCLED HANGUL KIYEOK
#0x3261 # CIRCLED HANGUL NIEUN
#0x3262 # CIRCLED HANGUL TIKEUT
#0x3263 # CIRCLED HANGUL RIEUL
#0x3264 # CIRCLED HANGUL MIEUM
#0x3265 # CIRCLED HANGUL PIEUP
#0x3266 # CIRCLED HANGUL SIOS
#0x3267 # CIRCLED HANGUL IEUNG
#0x3268 # CIRCLED HANGUL CIEUC
#0x3269 # CIRCLED HANGUL CHIEUCH
#0x326A # CIRCLED HANGUL KHIEUKH
#0x326B # CIRCLED HANGUL THIEUTH
#0x326C # CIRCLED HANGUL PHIEUPH
#0x326D # CIRCLED HANGUL HIEUH
#0x326E # CIRCLED HANGUL KIYEOK A
#0x326F # CIRCLED HANGUL NIEUN A
#0x3270 # CIRCLED HANGUL TIKEUT A
#0x3271 # CIRCLED HANGUL RIEUL A
#0x3272 # CIRCLED HANGUL MIEUM A
#0x3273 # CIRCLED HANGUL PIEUP A
#0x3274 # CIRCLED HANGUL SIOS A
#0x3275 # CIRCLED HANGUL IEUNG A
#0x3276 # CIRCLED HANGUL CIEUC A
#0x3277 # CIRCLED HANGUL CHIEUCH A
#0x3278 # CIRCLED HANGUL KHIEUKH A
#0x3279 # CIRCLED HANGUL THIEUTH A
#0x327A # CIRCLED HANGUL PHIEUPH A
#0x327B # CIRCLED HANGUL HIEUH A
#0x327F # KOREAN STANDARD SYMBOL
0x4E00 # <CJK>
0x4E01 # <CJK>
0x4E03 # <CJK>
......@@ -16237,4 +16237,4 @@
0xFA09 # <CJK>
0xFA0A # <CJK>
0xFA0B # <CJK>
0xFFE6 # FULLWIDTH WON SIGN
#0xFFE6 # FULLWIDTH WON SIGN
#
# $XFree86$
# $XFree86: xc/lib/fontconfig/fc-lang/lb.orth,v 1.1 2002/07/12 19:19:15 keithp Exp $
#
# Copyright © 2002 Keith Packard, member of The XFree86 Project, Inc.
#
......@@ -21,7 +21,7 @@
# TORTIOUS ACTION, ARISING OUT OF OR IN CONNECTION WITH THE USE OR
# PERFORMANCE OF THIS SOFTWARE.
#
# Hawaiian (HAW)
# Luxembourgish (Letzeburgesch) (LB)
#
# Orthography from http://www.eki.ee/letter
#
......@@ -51,8 +51,10 @@
00ea
00ce
00ee
e006-e007
e008-e009
#e006 # LATIN CAPITAL LETTER M WITH CIRCUMFLEX (no UCS)
#e007 # LATIN SMALL LETTER M WITH CIRCUMFLEX (no UCS)
#e008 # LATIN CAPITAL LETTER N WITH CIRCUMFLEX (no UCS)
#e009 # LATIN SMALL LETTER N WITH CIRCUMFLEX (no UCS)
00d4
00f4
00db
......
#
# $XFree86$
# $XFree86: xc/lib/fontconfig/fc-lang/mg.orth,v 1.1 2002/07/12 19:19:15 keithp Exp $
#
# Copyright © 2002 Keith Packard, member of The XFree86 Project, Inc.
#
......@@ -29,7 +29,7 @@
0061-007a
00c1
00e1
e010
e011
#e010 # LATIN CAPITAL LETTER N WITH DIAERESIS
#e011 # LATIN SMALL LETTER N WITH DIAERESIS
00d4
00f4
#
# $XFree86$
# $XFree86: xc/lib/fontconfig/fc-lang/mh.orth,v 1.1 2002/07/12 19:19:15 keithp Exp $
#
# Copyright © 2002 Keith Packard, member of The XFree86 Project, Inc.
#
......@@ -31,15 +31,15 @@
0101
013b
013c
e00a
e00b
e00c
e00d
#e00a # LATIN CAPITAL LETTER M WITH CEDILLA (no UCS)
#e00b # LATIN SMALL LETTER M WITH CEDILLA (no UCS)
#e00c # LATIN CAPITAL LETTER N WITH MACRON (no UCS)
#e00d # LATIN SMALL LETTER N WITH MACRON (no UCS)
0145
0146
014c
014d
e00e
e00f
#e00e # LATIN CAPITAL LETTER O WITH CEDILLA (no UCS)
#e00f # LATIN SMALL LETTER O WITH CEDILLA (no UCS)
016a
016b
#
# $XFree86$
# $XFree86: xc/lib/fontconfig/fc-lang/mk.orth,v 1.2 2002/07/06 23:59:17 keithp Exp $
#
# Copyright © 2002 Keith Packard, member of The XFree86 Project, Inc.
#
......@@ -22,17 +22,19 @@
# PERFORMANCE OF THIS SOFTWARE.
#
# Macedonian (MK)
0400
0400 # CYRILLIC CAPITAL LETTER IE WITH GRAVE
0403
0405
0408-040a
040c-040d
040c
040d # CYRILLIC CAPITAL LETTER I WITH GRAVE
040f
0410-0418
041a-0428
0450
0450 # CYRILLIC SMALL LETTER IE WITH GRAVE
0453
0455
0458-045a
045c-045d
045c
045d # CYRILLIC SMALL LETTER I WITH GRAVE
045f
#
# $XFree86$
# $XFree86: xc/lib/fontconfig/fc-lang/mn.orth,v 1.1 2002/07/07 19:18:51 keithp Exp $
#
# Copyright © 2002 Keith Packard, member of The XFree86 Project, Inc.
#
......@@ -25,7 +25,13 @@
#
# Taken from the Unicode coverage of this language
#
1800-180a
1810-1819
1820-1877
# Basic letters
1820-1842
# Todo letters
1843-185c
# Sibe letters
185d-1872
# Manchu letters
1873-1877
# Extensions for Sanskrit and Tibetan
1880-18a9
#
# $XFree86$
# $XFree86: xc/lib/fontconfig/fc-lang/mo.orth,v 1.2 2002/07/06 23:59:17 keithp Exp $
#
# Copyright © 2002 Keith Packard, member of The XFree86 Project, Inc.
#
......@@ -29,7 +29,7 @@
00e2
00ee
0102-0103
0218-021b
0218-021b # Comma below forms (preferred over cedilla)
0401
0410-044f
0451
......
#
# $XFree86$
# $XFree86: xc/lib/fontconfig/fc-lang/ro.orth,v 1.2 2002/07/06 23:59:19 keithp Exp $
#
# Copyright © 2002 Keith Packard, member of The XFree86 Project, Inc.
#
......@@ -29,6 +29,6 @@
00e2
00ee
0102-0103
0218-021b
0218-021b # comma-below forms (preferred over cedilla)
#2019-201a # single quotes
#201d-201e # double quotes
#
# $XFree86$
# $XFree86: xc/lib/fontconfig/fc-lang/si.orth,v 1.1 2002/07/07 19:18:51 keithp Exp $
#
# Copyright © 2002 Keith Packard, member of The XFree86 Project, Inc.
#
......@@ -25,14 +25,16 @@
#
# Taken from the Unicode coverage of this language
#
0d82-0d83
# Independent vowels
0d85-0d96
# Consonants
0d9a-0db1
0db3-0dbb
0dbd
0dc0-0dc6
0dca
# Dependent vowel signs
0dcf-0dd4
0dd6
0dd8-0ddf
# Additional dependent vowel signs
0df2-0df4
#
# $XFree86$
# $XFree86: xc/lib/fontconfig/fc-lang/tl.orth,v 1.1 2002/07/07 19:18:51 keithp Exp $
#
# Copyright © 2002 Keith Packard, member of The XFree86 Project, Inc.
#
......@@ -25,5 +25,10 @@
#
# Taken from the Unicode coverage of this language
#
1700-170c
170e-1714
# Independent vowels
1700-1702
# Consonants
1703-170c
170e-1711
# Dependent vowel signs
1712-1713
#
# $XFree86$
# $XFree86: xc/lib/fontconfig/fc-lang/yo.orth,v 1.1 2002/07/12 19:19:16 keithp Exp $
#
# Copyright © 2002 Keith Packard, member of The XFree86 Project, Inc.
#
......@@ -28,59 +28,59 @@
0041-005a
0061-007a
00c0
00e0
00c1
00e1
00c2
00e2
01cd-01ce
00c3
00c8
00e8
00c9
00e9
00ca
00ea
011a-011b
1eb8-1eb9
0300
0301
0302
0303
030c
00cc
00ec
00cd
00ed
00ce
00ee
01cf-01d0
1e3e-1e3f
# LATIN CAPITAL LETTER M WITH MACRON (no UCS code)
# LATIN SMALL LETTER M WITH MACRON (no UCS code)
01f8-01f9
0143-0144
# LATIN CAPITAL LETTER N WITH MACRON (no UCS code)
# LATIN SMALL LETTER N WITH MACRON (no UCS code)
00d2
00f2
00d3
00f3
00d4
00f4
01d1-01d2
1ecc-1ecd
1e62-1e63
00d5
00d9
00f9
00da
00fa
00db
00fb
01d3-01d4
00c3
00e0
00e1
00e2
00e3
1ebc-1ebd
0128-0129
00d5
00e8
00e9
00ea
00ec
00ed
00ee
00f2
00f3
00f4
00f5
00f9
00fa
00fb
011a-011b
0128-0129
0143-0144
0168-0169
01cd-01ce
01cf-01d0
01d1-01d2
01d3-01d4
01f8-01f9 # LATIN LETTER N WITH GRAVE
0300
0301
0302
0303
030c
1e3e-1e3f
1e62-1e63
1eb8-1eb9
1ebc-1ebd
1ecc-1ecd
# LATIN CAPITAL LETTER M WITH MACRON (no UCS code)
# LATIN CAPITAL LETTER N WITH MACRON (no UCS code)
# LATIN SMALL LETTER M WITH MACRON (no UCS code)
# LATIN SMALL LETTER N WITH MACRON (no UCS code)
/*
* $XFree86: xc/lib/fontconfig/fc-lang/fclang.tmpl.c,v 1.1 2002/07/06 23:21:36 keithp Exp $
* $XFree86: xc/lib/fontconfig/src/fclang.c,v 1.3 2002/07/08 07:31:53 keithp Exp $
*
* Copyright 2002 Keith Packard, member of The XFree86 Project, Inc.
*
......@@ -60,7 +60,36 @@ FcFreeTypeSetLang (FcPattern *pattern,
}
missing = FcCharSetSubtractCount (&fcLangCharSets[i].charset, charset);
if (FcDebug() & FC_DBG_SCANV)
printf ("%s(%d) ", fcLangCharSets[i].lang, missing);
{
if (missing && missing < 10)
{
FcCharSet *missed = FcCharSetSubtract (&fcLangCharSets[i].charset,
charset);
FcChar32 ucs4;
FcChar32 map[FC_CHARSET_MAP_SIZE];
FcChar32 next;
printf ("\n%s(%d) ", fcLangCharSets[i].lang, missing);
printf ("{");
for (ucs4 = FcCharSetFirstPage (missed, map, &next);
ucs4 != FC_CHARSET_DONE;
ucs4 = FcCharSetNextPage (missed, map, &next))
{
int i, j;
for (i = 0; i < FC_CHARSET_MAP_SIZE; i++)
if (map[i])
{
for (j = 0; j < 32; j++)
if (map[i] & (1 << j))
printf (" %04x", ucs4 + i * 32 + j);
}
}
printf (" }\n\t");
FcCharSetDestroy (missed);
}
else
printf ("%s(%d) ", fcLangCharSets[i].lang, missing);
}
if (!missing)
{
if (!FcPatternAddString (pattern, FC_LANG, fcLangCharSets[i].lang))
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment