fd1b5c0fb6
2000-04-09 Ulrich Drepper <drepper@redhat.com> Implement handling of restartable conversion functions according to ISO C. * iconv/gconv.h (__gconv_fct): Add additional parameter. * iconv/gconv_int.h (__BUILTIN_TRANS): Likewise. * iconv/gconv.c: Pass additional parameter to conversion function. * iconv/gconv_simple.c (internal_ucs4_loop_single): New function. (internal_ucs4le_loop_single): New function. (__gconv_transform_ascii_internal): Define ONE_DIRECTION. (__gconv_transform_internal_ascii): Likewise. (__gconv_transform_internal_utf8): Likewise. (__gconv_transform_utf8_internal): Likewise. (__gconv_transform_ucs2_internal): Likewise. (__gconv_transform_internal_ucs2): Likewise. (__gconv_transform_ucs2reverse_internal): Likewise. (__gconv_transform_internal_ucs2reverse): Likewise. (internal_ucs4le_loop_unaligned): Before return __GCONV_INCOMPLETE_INPUT check that the remaining bytes really form a valid character. Otherwise return __GCONV_ILLEGAL_INPUT. (__gconv_transform_utf8_internal): Define STORE_REST and UNPACK_BYTES. * iconv/loop.c: Fit in definition of function to convert one character for processing of left-over bytes from the state object. * iconv/skeleton.c (gconv): Rename inbuf to inptrp and inbufend to inend to match names in loop functions. (RESET_INPUT_BUFFER): Change appropriately. (gconv): If needed, call function to process bytes from the state object. Similar at the end: store left over bytes if input is incomplete. Take extra argument and add new argument to all calls of the conversion function. * iconvdata/iso-2022-cn.c: Adjust numeric values used to store information in the state object to not conflict with length count. * iconvdata/iso-2022-jp.c: Likewise. * iconvdata/iso-2022-kr.c: Likewise. * iconvdata/unicode.c: Adjust for change in parameters of skeleton function. * iconvdata/utf-16.c: Likewise. * libio/iofwide.c: Add new parameter to all calls of conversion function. * wcsmbs/btowc.c: Likewise. * wcsmbs/mbrtowc.c: Likewise. 
* wcsmbs/mbsnrtowcs.c: Likewise. * wcsmbs/mbsrtowcs.c: Likewise. * wcsmbs/wcrtomb.c: Likewise. * wcsmbs/wcsnrtombs.c: Likewise. * wcsmbs/wcsrtombs.c: Likewise. * wcsmbs/wctob.c: Likewise. * iconvdata/gbgbk.c: Always define MAX_NEEDED_OUTPUT and MAX_NEEDED_INPUT.
143 lines
4.0 KiB
C
143 lines
4.0 KiB
C
/* Copyright (C) 1996, 1997, 1998, 1999, 2000 Free Software Foundation, Inc.
   This file is part of the GNU C Library.
   Contributed by Ulrich Drepper <drepper@gnu.org>, 1996.

   The GNU C Library is free software; you can redistribute it and/or
   modify it under the terms of the GNU Library General Public License as
   published by the Free Software Foundation; either version 2 of the
   License, or (at your option) any later version.

   The GNU C Library is distributed in the hope that it will be useful,
   but WITHOUT ANY WARRANTY; without even the implied warranty of
   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
   Library General Public License for more details.

   You should have received a copy of the GNU Library General Public
   License along with the GNU C Library; see the file COPYING.LIB.  If not,
   write to the Free Software Foundation, Inc., 59 Temple Place - Suite 330,
   Boston, MA 02111-1307, USA.  */
|
|
|
|
#include <errno.h>
|
|
#include <gconv.h>
|
|
#include <stdlib.h>
|
|
#include <string.h>
|
|
#include <wchar.h>
|
|
#include <wcsmbsload.h>
|
|
|
|
#include <assert.h>
|
|
|
|
#ifndef EILSEQ
|
|
# define EILSEQ EINVAL
|
|
#endif
|
|
|
|
|
|
/* This is the private state used if PS is NULL. */
|
|
/* Static storage duration means this object starts out zero-initialized.
   __mbsrtowcs points data.__statep at it whenever the caller's PS is
   NULL, so all such calls share this single object.  */
static mbstate_t state;
|
|
|
|
size_t
|
|
__mbsrtowcs (dst, src, len, ps)
|
|
wchar_t *dst;
|
|
const char **src;
|
|
size_t len;
|
|
mbstate_t *ps;
|
|
{
|
|
struct __gconv_step_data data;
|
|
size_t result;
|
|
int status;
|
|
struct __gconv_step *towc;
|
|
size_t non_reversible;
|
|
|
|
/* Tell where we want the result. */
|
|
data.__invocation_counter = 0;
|
|
data.__internal_use = 1;
|
|
data.__is_last = 1;
|
|
data.__statep = ps ?: &state;
|
|
|
|
/* Make sure we use the correct function. */
|
|
update_conversion_ptrs ();
|
|
|
|
/* Get the structure with the function pointers. */
|
|
towc = __wcsmbs_gconv_fcts.towc;
|
|
|
|
/* We have to handle DST == NULL special. */
|
|
if (dst == NULL)
|
|
{
|
|
mbstate_t temp_state;
|
|
wchar_t buf[64]; /* Just an arbitrary size. */
|
|
const unsigned char *inbuf = (const unsigned char *) *src;
|
|
const unsigned char *srcend = inbuf + strlen (inbuf) + 1;
|
|
|
|
temp_state = *data.__statep;
|
|
data.__statep = &temp_state;
|
|
|
|
result = 0;
|
|
data.__outbufend = (char *) buf + sizeof (buf);
|
|
do
|
|
{
|
|
data.__outbuf = (char *) buf;
|
|
|
|
status = (*towc->__fct) (__wcsmbs_gconv_fcts.towc, &data, &inbuf,
|
|
srcend, &non_reversible, 0, 1);
|
|
|
|
result += (wchar_t *) data.__outbuf - buf;
|
|
}
|
|
while (status == __GCONV_FULL_OUTPUT);
|
|
|
|
if (status == __GCONV_OK || status == __GCONV_EMPTY_INPUT)
|
|
{
|
|
/* There better should be a NUL wide char at the end. */
|
|
assert (((wchar_t *) data.__outbuf)[-1] == L'\0');
|
|
/* Don't count the NUL character in. */
|
|
--result;
|
|
}
|
|
}
|
|
else
|
|
{
|
|
/* This code is based on the safe assumption that all internal
|
|
multi-byte encodings use the NUL byte only to mark the end
|
|
of the string. */
|
|
const unsigned char *srcend;
|
|
|
|
srcend = (const unsigned char *) (*src
|
|
+ __strnlen (*src, len * MB_CUR_MAX)
|
|
+ 1);
|
|
|
|
data.__outbuf = (unsigned char *) dst;
|
|
data.__outbufend = data.__outbuf + len * sizeof (wchar_t);
|
|
|
|
status = (*towc->__fct) (__wcsmbs_gconv_fcts.towc, &data,
|
|
(const unsigned char **) src, srcend,
|
|
&non_reversible, 0, 1);
|
|
|
|
result = (wchar_t *) data.__outbuf - dst;
|
|
|
|
/* We have to determine whether the last character converted
|
|
is the NUL character. */
|
|
if ((status == __GCONV_OK || status == __GCONV_EMPTY_INPUT)
|
|
&& ((wchar_t *) dst)[result - 1] == L'\0')
|
|
{
|
|
assert (result > 0);
|
|
assert (__mbsinit (data.__statep));
|
|
*src = NULL;
|
|
--result;
|
|
}
|
|
}
|
|
|
|
/* There must not be any problems with the conversion but illegal input
|
|
characters. */
|
|
assert (status == __GCONV_OK || status == __GCONV_EMPTY_INPUT
|
|
|| status == __GCONV_ILLEGAL_INPUT
|
|
|| status == __GCONV_INCOMPLETE_INPUT
|
|
|| status == __GCONV_FULL_OUTPUT);
|
|
|
|
if (status != __GCONV_OK && status != __GCONV_FULL_OUTPUT
|
|
&& status != __GCONV_EMPTY_INPUT)
|
|
{
|
|
result = (size_t) -1;
|
|
__set_errno (EILSEQ);
|
|
}
|
|
|
|
return result;
|
|
}
|
|
/* Make the implementation above also available under the name
   mbsrtowcs.  NOTE(review): weak_alias is defined outside this file;
   presumably it emits a weak symbol alias -- confirm against its
   definition.  */
weak_alias (__mbsrtowcs, mbsrtowcs)
|