mirror of
https://sourceware.org/git/glibc.git
synced 2024-12-23 11:20:07 +00:00
4c7d276eb1
2000-08-31 Bruno Haible <haible@clisp.cons.org> * wctype/wcfuncs.c (iswblank): New function. * wctype/wcfuncs_l.c (__iswblank_l): New function. * wctype/wcextra.c: Remove file. * wctype/wcextra_l.c: Remove file. * wctype/Makefile (distribute): Remove wcextra and wcextra_l. 2000-08-31 Bruno Haible <haible@clisp.cons.org> * locale/programs/ld-collate.c (collate_output): Remove redundant assert call. * string/strcoll.c: Likewise. * string/strxfrm.c: Include assert.h. Add assert calls like in string/strcoll.c. 2000-08-31 Bruno Haible <haible@clisp.cons.org> * locale/categories.def (_NL_COLLATE_HASH_SIZE, _NL_COLLATE_HASH_LAYERS, _NL_COLLATE_NAMES, _NL_CTYPE_NAMES, _NL_CTYPE_HASH_SIZE, _NL_CTYPE_HASH_LAYERS): Remove definitions. * locale/langinfo.h (_NL_COLLATE_HASH_SIZE, _NL_COLLATE_HASH_LAYERS, _NL_COLLATE_NAMES): Rename to _NL_COLLATE_GAP1/2/3 respectively. (_NL_CTYPE_NAMES): Rename to _NL_CTYPE_GAP3. (_NL_CTYPE_GAP3): Rename to _NL_CTYPE_GAP4. (_NL_CTYPE_HASH_SIZE, _NL_CTYPE_HASH_LAYERS): Rename to _NL_CTYPE_GAP5/6 respectively. * locale/C-ctype.c (_nl_C_LC_CTYPE): Update. * ctype/ctype-info.c (__ctype_names, __ctype_width): Remove variables. * locale/lc-ctype.c (_nl_postload_ctype): Assume new locale format. Don't initialize __ctype_names and __ctype_width. * wctype/cname-lookup.h: Remove file. * wctype/Makefile (distribute): Remove cname-lookup.h. * wctype/wchar-lookup.h: Include stdint.h. * wctype/wctype.c (__wctype): Assume new locale format. * wctype/wctype_l.c (__wctype_l): Likewise. * wctype/iswctype.c: Don't include cname-lookup.h. (__iswctype): Assume new locale format. * wctype/iswctype_l.c: Don't include cname-lookup.h. (__iswctype_l): Assume new locale format. * wctype/wctrans.c: Don't include ctype.h. (wctrans): Assume new locale format. * wctype/wctrans_l.c (__wctrans_l): Likewise. * wctype/towctrans.c: Don't include cname-lookup.h. (__towctrans): Assume new locale format. * wctype/towctrans_l.c: Don't include cname-lookup.h. 
(__towctrans_l): Assume new locale format. * wctype/wcfuncs.c: Don't include ctype.h and cname-lookup.h. Include localeinfo.h instead. (__NO_WCTYPE): Remove unused macro. (__ctype32_b, __ctype32_toupper, __ctype32_tolower): Remove declarations. (iswalnum, iswalpha, iswcntrl, iswdigit, iswlower, iswgraph, iswprint, iswpunct, iswspace, iswupper, iswxdigit): Assume new locale format. (towlower, towupper): Likewise. * wctype/wcfuncs_l.c: Don't include cname-lookup.h. Include localeinfo.h instead. (__NO_WCTYPE): Remove unused macro. (__iswalnum_l, __iswalpha_l, __iswcntrl_l, __iswdigit_l, __iswlower_l, __iswgraph_l, __iswprint_l, __iswpunct_l, __iswspace_l, __iswupper_l, __iswxdigit_l): Assume new locale format. (__towlower_l, __towupper_l): Likewise. * wcsmbs/wcwidth.h: Don't include cname-lookup.h. (__ctype32_b): Remove declaration. (internal_wcwidth): Assume new locale format. * locale/programs/ld-ctype.c (struct locale_ctype_t): Remove fields plane_size, plane_cnt, names, width. Rename map to map_b, rename map32 to map32_b, rename width_3level to width. (ctype_output): Always create new locale format. Don't emit _NL_CTYPE_NAMES, _NL_CTYPE_HASH_SIZE, _NL_CTYPE_HASH_LAYERS any more. (allocate_arrays): Always create new locale format. * locale/C-collate.c (_nl_C_LC_COLLATE): Update. * locale/weightwc.h (findidx): Assume new locale format. * string/strcoll.c (wcscoll): Remove local variables size, layers, names. * string/strxfrm.c (wcsxfrm): Likewise. * posix/fnmatch_loop.c (internal_fnwmatch): Likewise. Change type of local variable collseq to 'const char *'. (SUFFIX): Don't use, don't undefine. * posix/fnmatch.c: Remove SUFFIX definition. * locale/programs/ld-collate.c (struct locale_collate_t): Remove fields plane_size, plane_cnt, wcheads, wcseqorder. Rename wcheads_3level to wcheads, rename wcseqorder_3level to wcseqorder. (collate_finish): Always create new locale format. Remove local variables min_total, act_size. (collate_output): Always create new locale format. 
Remove local variables table_size, names, tablewc. Rename tablewc_3level to tablewc. 2000-08-31 Bruno Haible <haible@clisp.cons.org> * locale/programs/ld-collate.c (obstack_int32_grow, obstack_int32_grow_fast): New inline functions. (output_weightwc, collate_output): Use them where possible.
142 lines
4.6 KiB
C
142 lines
4.6 KiB
C
/* Copyright (C) 2000 Free Software Foundation, Inc.
|
|
This file is part of the GNU C Library.
|
|
Contributed by Bruno Haible <haible@clisp.cons.org>, 2000.
|
|
|
|
The GNU C Library is free software; you can redistribute it and/or
|
|
modify it under the terms of the GNU Library General Public License as
|
|
published by the Free Software Foundation; either version 2 of the
|
|
License, or (at your option) any later version.
|
|
|
|
The GNU C Library is distributed in the hope that it will be useful,
|
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
Library General Public License for more details.
|
|
|
|
You should have received a copy of the GNU Library General Public
|
|
License along with the GNU C Library; see the file COPYING.LIB. If not,
|
|
write to the Free Software Foundation, Inc., 59 Temple Place - Suite 330,
|
|
Boston, MA 02111-1307, USA. */
|
|
|
|
#include <stdint.h>
|
|
|
|
/* Tables indexed by a wide character are compressed through the use
|
|
of a multi-level lookup. The compression effect comes from blocks
|
|
that don't need particular data and from blocks that can share their
|
|
data. */
|
|
|
|
/* Bit tables are accessed by cutting wc in four blocks of bits:
|
|
- the high 32-q-p-5 bits,
|
|
- the next q bits,
|
|
- the next p bits,
|
|
- the next 5 bits.
|
|
|
|
            +------------------+-----+-----+-----+
     wc  =  |     32-q-p-5     |  q  |  p  |  5  |
            +------------------+-----+-----+-----+
|
|
|
|
p and q are variable. For 16-bit Unicode it is sufficient to
|
|
choose p and q such that q+p+5 <= 16.
|
|
|
|
The table contains the following uint32_t words:
|
|
- q+p+5,
|
|
- s = upper exclusive bound for wc >> (q+p+5),
|
|
- p+5,
|
|
- 2^q-1,
|
|
- 2^p-1,
|
|
- 1st-level table: s offsets, pointing into the 2nd-level table,
|
|
- 2nd-level table: k*2^q offsets, pointing into the 3rd-level table,
|
|
- 3rd-level table: j*2^p words, each containing 32 bits of data.
|
|
*/
|
|
|
|
/* Test the bit stored for WC in a three-level bit table.

   TABLE begins with five uint32_t header words, immediately followed
   by the first-level entries.  First- and second-level entries are
   byte offsets measured from the start of TABLE; an entry of zero
   means nothing is stored below it.

   Returns the bit found for WC (0 or 1).  Returns 0 when the high
   bits of WC are at or beyond the bound in header word 1, or when a
   zero entry is reached on the way down.  */
static __inline int
wctype_table_lookup (const char *table, uint32_t wc)
{
  const uint32_t *header = (const uint32_t *) table;
  const uint32_t *block;
  uint32_t slot;
  uint32_t offset;

  /* Level 1: the bits of WC above header[0] select an entry located
     right after the five header words.  */
  slot = wc >> header[0];
  if (slot >= header[1])
    return 0;
  offset = header[5 + slot];
  if (offset == 0)
    return 0;

  /* Level 2: shift by header[2] and mask with header[3] to select a
     word inside the block the first-level entry points to.  */
  block = (const uint32_t *) (table + offset);
  offset = block[(wc >> header[2]) & header[3]];
  if (offset == 0)
    return 0;

  /* Level 3: every word carries 32 bits, so WC >> 5 (masked with
     header[4]) selects the word and the low five bits of WC select
     the bit inside it.  */
  block = (const uint32_t *) (table + offset);
  return (block[(wc >> 5) & header[4]] >> (wc & 0x1f)) & 1;
}
|
|
|
|
/* Byte tables are similar to bit tables, except that the addressing
|
|
unit is a single byte, and no 5 bits are used as a word index. */
|
|
|
|
/* Fetch the byte stored for WC in a three-level byte table.

   TABLE begins with five uint32_t header words, immediately followed
   by the first-level entries.  First- and second-level entries are
   byte offsets measured from the start of TABLE; an entry of zero
   means nothing is stored below it.

   Returns the stored byte as a value in the range 0..255.  Returns
   0xff when the high bits of WC are at or beyond the bound in header
   word 1, or when a zero entry is reached on the way down.  */
static __inline int
wcwidth_table_lookup (const char *table, uint32_t wc)
{
  const uint32_t *header = (const uint32_t *) table;
  const uint32_t *block;
  uint32_t slot;
  uint32_t offset;

  /* Level 1: the bits of WC above header[0] select an entry located
     right after the five header words.  */
  slot = wc >> header[0];
  if (slot >= header[1])
    return 0xff;
  offset = header[5 + slot];
  if (offset == 0)
    return 0xff;

  /* Level 2: shift by header[2] and mask with header[3] to select a
     word inside the block the first-level entry points to.  */
  block = (const uint32_t *) (table + offset);
  offset = block[(wc >> header[2]) & header[3]];
  if (offset == 0)
    return 0xff;

  /* Level 3: the lowest bits of WC, masked with header[4], index
     directly into an array of bytes.  */
  return ((const uint8_t *) (table + offset))[wc & header[4]];
}
|
|
|
|
/* Mapping tables are similar to bit tables, except that the
|
|
addressing unit is a single signed 32-bit word, containing the
|
|
difference between the desired result and the argument, and no 5
|
|
bits are used as a word index. */
|
|
|
|
/* Map WC through a three-level mapping table.

   TABLE begins with five uint32_t header words, immediately followed
   by the first-level entries.  First- and second-level entries are
   byte offsets measured from the start of TABLE; an entry of zero
   means nothing is stored below it.  The third level holds signed
   32-bit differences that are added to WC.

   Returns WC plus the stored difference.  Returns WC unchanged when
   the high bits of WC are at or beyond the bound in header word 1,
   or when a zero entry is reached on the way down.  */
static __inline uint32_t
wctrans_table_lookup (const char *table, uint32_t wc)
{
  const uint32_t *header = (const uint32_t *) table;
  const uint32_t *block;
  uint32_t slot;
  uint32_t offset;
  int32_t delta;

  /* Level 1: the bits of WC above header[0] select an entry located
     right after the five header words.  */
  slot = wc >> header[0];
  if (slot >= header[1])
    return wc;
  offset = header[5 + slot];
  if (offset == 0)
    return wc;

  /* Level 2: shift by header[2] and mask with header[3] to select a
     word inside the block the first-level entry points to.  */
  block = (const uint32_t *) (table + offset);
  offset = block[(wc >> header[2]) & header[3]];
  if (offset == 0)
    return wc;

  /* Level 3: the lowest bits of WC, masked with header[4], index
     into an array of signed differences.  */
  delta = ((const int32_t *) (table + offset))[wc & header[4]];
  return wc + delta;
}
|