minix/lib/libc/locale/rune.c
Ben Gras 2fe8fb192f Full switch to clang/ELF. Drop ack. Simplify.
There is important information about booting non-ack images in
docs/UPDATING. ack/aout-format images can't be built any more, and
booting clang/ELF-format ones is a little different. Updating to the
new boot monitor is recommended.

Changes in this commit:

	. drop boot monitor -> allowing dropping ack support
	. facility to copy ELF boot files to /boot so that old boot monitor
	  can still boot fairly easily, see UPDATING
	. no more ack-format libraries -> single-case libraries
	. some cleanup of OBJECT_FMT, COMPILER_TYPE, etc cases
	. drop several ack toolchain commands, but not all support
	  commands (e.g. aal is gone but acksize is not yet).
	. a few libc files moved to netbsd libc dir
	. new /bin/date as minix date used code in libc/
	. test compile fix
	. harmonize includes
	. /usr/lib is no longer special: without ack, /usr/lib plays no
	  kind of special bootstrapping role any more and bootstrapping
	  is done exclusively through packages, so releases depend even
	  less on the state of the machine making them now.
	. rename nbsd_lib* to lib*
	. reduce mtree
2012-02-14 14:52:02 +01:00

351 lines
9.4 KiB
C

/* $NetBSD: rune.c,v 1.41 2010/11/30 15:25:05 tnozaki Exp $ */
/*-
* Copyright (c)2010 Citrus Project,
* All rights reserved.
*
* Redistribution and use in source and binary forms, with or without
* modification, are permitted provided that the following conditions
* are met:
* 1. Redistributions of source code must retain the above copyright
* notice, this list of conditions and the following disclaimer.
* 2. Redistributions in binary form must reproduce the above copyright
* notice, this list of conditions and the following disclaimer in the
* documentation and/or other materials provided with the distribution.
*
* THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
* ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
* IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
* ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
* FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
* DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
* OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
* HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
* LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
* OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
* SUCH DAMAGE.
*/
#include <sys/endian.h>
#include <sys/mman.h>
#include <sys/stat.h>
#include <assert.h>
#include <errno.h>
#include <fcntl.h>
#define __SETLOCALE_SOURCE__
#include <locale.h>
#include <stddef.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <unistd.h>
#include <wchar.h>
#include "setlocale_local.h"
#include "citrus_module.h"
#include "citrus_ctype.h"
#include "runetype_local.h"
#include "bsdctype_local.h"
#include "multibyte.h"
#include "_wctype_local.h"
#include "_wctrans_local.h"
/*
 * Allocation unit used by the loaders in this file: the _RuneLocale that is
 * handed back to the caller, followed by the storage that its table
 * pointers refer to.  _rune_init_priv() points rl.rl_ctype_tab,
 * rl.rl_tolower_tab, rl.rl_toupper_tab and rl.rl_codeset at the arrays
 * declared below.
 */
typedef struct {
_RuneLocale rl;
/*
 * Each table has one slot more than _CTYPE_NUM_CHARS: slot 0 is filled
 * by _rune_init_priv() (0 for the class table, EOF for the case tables)
 * and the entry for character value i is stored at index i + 1.
 */
unsigned char rlp_ctype_tab [_CTYPE_NUM_CHARS + 1];
short rlp_tolower_tab[_CTYPE_NUM_CHARS + 1];
short rlp_toupper_tab[_CTYPE_NUM_CHARS + 1];
/*
 * NUL-terminated codeset name: written by _rune_find_codeset() in
 * _rune_read_file(), set to the empty string by _rune_read_bsdctype().
 */
char rlp_codeset[33]; /* XXX */
} _RuneLocalePriv;
/*
 * Seed the wctype table of `rl' with a byte-for-byte copy of the table
 * held in _DefaultRuneLocale.
 */
static __inline void
_rune_wctype_init(_RuneLocale *rl)
{
	const size_t table_bytes = sizeof(rl->rl_wctype);

	memcpy(&rl->rl_wctype, &_DefaultRuneLocale.rl_wctype, table_bytes);
}
/*
 * Fill in the two wctrans entries ("tolower" and "toupper") of `rl' so
 * that each one refers to the matching cached map and extended range map
 * stored inside the same locale.
 */
static __inline void
_rune_wctrans_init(_RuneLocale *rl)
{
	/* Names by which the transformations are looked up. */
	rl->rl_wctrans[_WCTRANS_INDEX_LOWER].te_name = "tolower";
	rl->rl_wctrans[_WCTRANS_INDEX_UPPER].te_name = "toupper";

	/* Direct-indexed maps. */
	rl->rl_wctrans[_WCTRANS_INDEX_LOWER].te_cached = rl->rl_maplower;
	rl->rl_wctrans[_WCTRANS_INDEX_UPPER].te_cached = rl->rl_mapupper;

	/* Extended range maps. */
	rl->rl_wctrans[_WCTRANS_INDEX_LOWER].te_extmap = &rl->rl_maplower_ext;
	rl->rl_wctrans[_WCTRANS_INDEX_UPPER].te_extmap = &rl->rl_mapupper_ext;
}
/*
 * Put a freshly allocated _RuneLocalePriv into its baseline state:
 *  - the table/codeset pointers of the embedded _RuneLocale are aimed at
 *    the private arrays,
 *  - slot 0 of every table gets its fixed value (0 / EOF),
 *  - when the table is larger than the cache, the slots past the cached
 *    range get "no class, maps to itself",
 *  - the wctype and wctrans tables are initialised.
 * The slots for the cached range (1 .. _CTYPE_CACHE_SIZE) are left for the
 * caller to fill.
 */
static __inline void
_rune_init_priv(_RuneLocalePriv *rlp)
{
#if _CTYPE_CACHE_SIZE != _CTYPE_NUM_CHARS
	int slot;
#endif

	rlp->rl.rl_ctype_tab = (const unsigned char *)rlp->rlp_ctype_tab;
	rlp->rl.rl_tolower_tab = (const short *)rlp->rlp_tolower_tab;
	rlp->rl.rl_toupper_tab = (const short *)rlp->rlp_toupper_tab;
	rlp->rl.rl_codeset = (const char *)rlp->rlp_codeset;

	/* Slot 0 precedes the entry for character value 0. */
	rlp->rlp_ctype_tab[0] = 0;
	rlp->rlp_tolower_tab[0] = EOF;
	rlp->rlp_toupper_tab[0] = EOF;

#if _CTYPE_CACHE_SIZE != _CTYPE_NUM_CHARS
	/* Table index `slot' describes character value `slot - 1'. */
	for (slot = _CTYPE_CACHE_SIZE + 1; slot <= _CTYPE_NUM_CHARS; ++slot) {
		rlp->rlp_ctype_tab[slot] = 0;
		rlp->rlp_tolower_tab[slot] = slot - 1;
		rlp->rlp_toupper_tab[slot] = slot - 1;
	}
#endif

	_rune_wctype_init(&rlp->rl);
	_rune_wctrans_init(&rlp->rl);
}
/*
 * Look for the _RUNE_CODESET key inside the buffer `var' (*plenvar bytes)
 * and extract the value that follows it.
 *
 *	s, n	 destination buffer and its size; always NUL-terminated on
 *		 return, and left empty when the key is not found
 *	var	 buffer to search; on a match the first byte of the key is
 *		 overwritten with NUL
 *	plenvar	 in: length of `var'; out (on a match): offset of the key,
 *		 i.e. the length of the data preceding it
 *
 * The value ends at the first space or tab, at the end of the buffer, or
 * when `s' has room for no more than the terminating NUL.  A key is only
 * recognised if at least one byte follows it.
 */
static __inline void
_rune_find_codeset(char *s, size_t n,
    char *var, size_t *plenvar)
{
#define _RUNE_CODESET_LEN (sizeof(_RUNE_CODESET)-1)
	size_t remaining = *plenvar;
	char *cursor = var;

	while (remaining > _RUNE_CODESET_LEN) {
		if (memcmp(cursor, _RUNE_CODESET, _RUNE_CODESET_LEN) == 0) {
			const char *value = cursor + _RUNE_CODESET_LEN;
			const size_t avail = remaining - _RUNE_CODESET_LEN;
			const size_t room = (n > 1) ? n - 1 : 0;
			const size_t limit = (avail < room) ? avail : room;
			size_t k;

			/* Cut the buffer off where the key starts. */
			*cursor = '\0';
			*plenvar -= remaining;

			for (k = 0; k < limit; ++k) {
				const char ch = value[k];

				if (ch == ' ' || ch == '\t')
					break;
				*s++ = ch;
			}
			break;
		}
		++cursor;
		--remaining;
	}
	*s = '\0';
}
/*
 * Build a _RuneLocale from an in-memory image that starts with the
 * _RUNECT10_MAGIC signature.
 *
 *	var, lenvar	the image and its length in bytes
 *	prl		receives the new locale on success
 *
 * Layout consumed from the image, in this order:
 *	_FileRuneLocale header
 *	runetype / maplower / mapupper range entries (_FileRuneEntry)
 *	one uint32_t array of rune types per range entry whose map is 0
 *	frl_variable_len bytes of variable data
 *
 * Everything is copied, converting from big-endian, into a single malloc()
 * block laid out as
 *	_RuneLocalePriv | _RuneEntry[] | rune types | variable data
 *
 * Returns 0 on success, EFTYPE for a malformed image, ENOMEM when the
 * block cannot be allocated, EINVAL when the encoding needs more bytes
 * per character than __mb_len_max_runtime, or the error reported by the
 * citrus ctype routines.  Nothing is stored through `prl' on failure.
 *
 * All counts and lengths come from the image and are therefore checked
 * without relying on arithmetic that could wrap.
 */
static __inline int
_rune_read_file(const char * __restrict var, size_t lenvar,
    _RuneLocale ** __restrict prl)
{
	int ret, i;
	const _FileRuneLocale *frl;
	const _FileRuneEntry *fre;
	const uint32_t *frune;
	_RuneLocalePriv *rlp;
	_RuneLocale *rl;
	_RuneEntry *re;
	uint32_t *rune;
	uint32_t runetype_len, maplower_len, mapupper_len, variable_len;
	size_t len, n, max_entries;

	if (lenvar < sizeof(*frl))
		return EFTYPE;
	lenvar -= sizeof(*frl);

	frl = (const _FileRuneLocale *)(const void *)var;
	if (memcmp(_RUNECT10_MAGIC, &frl->frl_magic[0], sizeof(frl->frl_magic)))
		return EFTYPE;

	runetype_len = be32toh(frl->frl_runetype_ext.frr_nranges);
	maplower_len = be32toh(frl->frl_maplower_ext.frr_nranges);
	mapupper_len = be32toh(frl->frl_mapupper_ext.frr_nranges);
	variable_len = be32toh((uint32_t)frl->frl_variable_len);

	/*
	 * The three counts must fit, together, in what is left of the
	 * image.  Checking them one after the other keeps their sum from
	 * wrapping, which would make `len' smaller than the number of
	 * entries READ_RANGE() walks below.
	 */
	max_entries = lenvar / sizeof(*fre);
	if (runetype_len > max_entries ||
	    maplower_len > max_entries - runetype_len ||
	    mapupper_len > max_entries - runetype_len - maplower_len)
		return EFTYPE;
	len = (size_t)runetype_len + maplower_len + mapupper_len;

	n = len * sizeof(*fre);		/* <= lenvar, cannot wrap */
	if (lenvar - n < variable_len)
		return EFTYPE;
	/* From here on lenvar counts only the bytes of rune-type arrays. */
	lenvar -= n + variable_len;

	fre = (const _FileRuneEntry *)(const void *)(frl + 1);
	frune = (const uint32_t *)(const void *)(fre + len);

	/*
	 * Size of the block: private header, converted range entries,
	 * rune-type arrays and the variable data.  The variable data is
	 * copied right behind the rune types, so it has to be part of the
	 * allocation.
	 */
	n = lenvar + variable_len;	/* both are parts of the image */
	if (n > (size_t)-1 - sizeof(*rlp) ||
	    len > ((size_t)-1 - sizeof(*rlp) - n) / sizeof(*re))
		return ENOMEM;
	n += sizeof(*rlp) + (len * sizeof(*re));
	rlp = (_RuneLocalePriv *)malloc(n);
	if (rlp == NULL)
		return ENOMEM;
	_rune_init_priv(rlp);

	rl = &rlp->rl;
	re = (_RuneEntry *)(void *)(rlp + 1);
	rune = (uint32_t *)(void *)(re + len);

	for (i = 0; i < _CTYPE_CACHE_SIZE; ++i) {
		rl->rl_runetype[i] = be32toh(frl->frl_runetype[i]);
		rl->rl_maplower[i] = be32toh((uint32_t)frl->frl_maplower[i]);
		rl->rl_mapupper[i] = be32toh((uint32_t)frl->frl_mapupper[i]);
	}

/*
 * Convert the `name##_len' range entries at `fre' into `re'.  An entry
 * whose map is 0 owns the next (max - min + 1) words at `frune'; they are
 * converted into `rune' and charged against lenvar.  The bound is tested
 * by division so that a huge element count cannot wrap the byte count.
 * Clobbers `len' and `n'.
 */
#define READ_RANGE(name)						\
do {									\
	const _FileRuneEntry *end_fre;					\
	const uint32_t *end_frune;					\
									\
	rl->rl_##name##_ext.rr_nranges = name##_len;			\
	rl->rl_##name##_ext.rr_rune_ranges = re;			\
									\
	end_fre = fre + name##_len;					\
	while (fre < end_fre) {						\
		re->re_min = be32toh((uint32_t)fre->fre_min);		\
		re->re_max = be32toh((uint32_t)fre->fre_max);		\
		re->re_map = be32toh((uint32_t)fre->fre_map);		\
		if (re->re_map != 0) {					\
			re->re_rune_types = NULL;			\
		} else {						\
			re->re_rune_types = rune;			\
			len = re->re_max - re->re_min + 1;		\
			if (len > lenvar / sizeof(*frune)) {		\
				ret = EFTYPE;				\
				goto err;				\
			}						\
			n = len * sizeof(*frune);			\
			lenvar -= n;					\
			end_frune = frune + len;			\
			while (frune < end_frune)			\
				*rune++ = be32toh(*frune++);		\
		}							\
		++fre, ++re;						\
	}								\
} while (/*CONSTCOND*/0)

	READ_RANGE(runetype);
	READ_RANGE(maplower);
	READ_RANGE(mapupper);

	/*
	 * The ranges must account for every rune-type byte; only then does
	 * `frune' point at the variable data.  Check before copying.
	 */
	if (lenvar > 0) {
		ret = EFTYPE;
		goto err;
	}

	memcpy((void *)rune, (void const *)frune, variable_len);
	rl->rl_variable_len = variable_len;
	rl->rl_variable = (void *)rune;

	/* Splits the codeset name off the copied variable data. */
	_rune_find_codeset(rlp->rlp_codeset, sizeof(rlp->rlp_codeset),
	    (char *)rl->rl_variable, &rl->rl_variable_len);

	ret = _citrus_ctype_open(&rl->rl_citrus_ctype, frl->frl_encoding,
	    rl->rl_variable, rl->rl_variable_len, _PRIVSIZE);
	if (ret)
		goto err;
	/*
	 * NOTE(review): the error paths below free `rlp' but do not release
	 * the handle obtained from _citrus_ctype_open(); whether it needs an
	 * explicit close cannot be told from this file -- confirm.
	 */
	if (__mb_len_max_runtime <
	    _citrus_ctype_get_mb_cur_max(rl->rl_citrus_ctype)) {
		ret = EINVAL;
		goto err;
	}

	/*
	 * Derive the single-byte tables: entry i + 1 describes byte value i.
	 * Bytes that are not characters on their own get no class bits and
	 * map to themselves.
	 */
	for (i = 0; i < _CTYPE_CACHE_SIZE; ++i) {
		wint_t wc;

		ret = _citrus_ctype_btowc(rl->rl_citrus_ctype, i, &wc);
		if (ret)
			goto err;
		if (wc == WEOF) {
			rlp->rlp_ctype_tab[i + 1] = 0;
			rlp->rlp_tolower_tab[i + 1] = i;
			rlp->rlp_toupper_tab[i + 1] = i;
		} else {
			rlp->rlp_ctype_tab[i + 1] = (unsigned char)
			    _runetype_to_ctype(_runetype_priv(rl, wc));

/*
 * Store the case mapping of byte i; fall back to i itself when the
 * character maps to itself or the result is not a single byte.
 */
#define CONVERT_MAP(name)						\
do {									\
	wint_t map;							\
	int c;								\
									\
	map = _towctrans_priv(wc, _wctrans_##name(rl));			\
	if (map == wc || (_citrus_ctype_wctob(rl->rl_citrus_ctype,	\
	    map, &c) || c == EOF))					\
		c = i;							\
	rlp->rlp_to##name##_tab[i + 1] = (short)c;			\
} while (/*CONSTCOND*/0)

			CONVERT_MAP(lower);
			CONVERT_MAP(upper);
		}
	}
	*prl = rl;
	return 0;

err:
	free(rlp);
	return ret;
}
/*
 * Build a _RuneLocale from an in-memory image in the _FileBSDCTypeLocale
 * format.
 *
 *	var, lenvar	the image and its length in bytes
 *	prl		receives the new locale on success
 *
 * The image is accepted only if it is at least sizeof(_FileBSDCTypeLocale)
 * bytes long, carries the _CTYPE_ID signature, has revision _CTYPE_REV
 * and describes exactly _CTYPE_CACHE_SIZE characters.
 *
 * Returns 0 on success, EFTYPE when the image is rejected and ENOMEM when
 * allocation fails.  The resulting codeset name is empty.
 */
static __inline int
_rune_read_bsdctype(const char * __restrict var, size_t lenvar,
    _RuneLocale ** __restrict prl)
{
	const _FileBSDCTypeLocale *image;
	_RuneLocalePriv *priv;
	_RuneLocale *locale;
	int ch;

	if (lenvar < sizeof(*image))
		return EFTYPE;
	image = (const _FileBSDCTypeLocale *)(const void *)var;

	if (memcmp(&image->fbl_id[0], _CTYPE_ID, sizeof(image->fbl_id)) != 0)
		return EFTYPE;
	if ((uint32_t)be32toh(image->fbl_rev) != _CTYPE_REV)
		return EFTYPE;
	if ((uint32_t)be32toh(image->fbl_num_chars) != _CTYPE_CACHE_SIZE)
		return EFTYPE;

	priv = (_RuneLocalePriv *)malloc(sizeof(*priv));
	if (priv == NULL)
		return ENOMEM;
	_rune_init_priv(priv);
	priv->rlp_codeset[0] = '\0';
	locale = &priv->rl;

	/* Table index ch + 1 holds the data for character value ch. */
	for (ch = 0; ch < _CTYPE_CACHE_SIZE; ++ch) {
		const int class_bits = image->fbl_ctype_tab[ch];
		const uint16_t to_lower = be16toh(image->fbl_tolower_tab[ch]);
		const uint16_t to_upper = be16toh(image->fbl_toupper_tab[ch]);
		const int slot = ch + 1;

		/* Single-byte tables. */
		priv->rlp_ctype_tab[slot] = (unsigned char)class_bits;
		priv->rlp_tolower_tab[slot] = (short)to_lower;
		priv->rlp_toupper_tab[slot] = (short)to_upper;

		/* Rune tables derived from the same data. */
		locale->rl_runetype[ch] = _runetype_from_ctype(class_bits, ch);
		locale->rl_maplower[ch] = (__nbrune_t)to_lower;
		locale->rl_mapupper[ch] = (__nbrune_t)to_upper;
	}

	*prl = locale;
	return 0;
}
/*
 * Create a _RuneLocale from the locale image `var' of `lenvar' bytes.
 *
 * The first byte selects the parser: 'R' is handed to _rune_read_file(),
 * 'B' to _rune_read_bsdctype().  An empty image or any other first byte
 * yields EFTYPE; otherwise the parser's result is returned and, on
 * success (0), the new locale is stored through `prl'.
 */
int
_rune_load(const char * __restrict var, size_t lenvar,
    _RuneLocale ** __restrict prl)
{
	_DIAGASSERT(var != NULL || lenvar < 1);
	_DIAGASSERT(prl != NULL);

	if (lenvar < 1)
		return EFTYPE;

	if (*var == 'R')
		return _rune_read_file(var, lenvar, prl);
	if (*var == 'B')
		return _rune_read_bsdctype(var, lenvar, prl);

	return EFTYPE;
}