mirror of
git://sourceware.org/git/newlib-cygwin.git
synced 2025-01-16 19:40:07 +08:00
d16a56306d
- Remove charset parameter from low level __foo_wctomb/__foo_mbtowc calls. - Instead, create array of function for ISO and Windows codepages to point to function which does not require to evaluate the charset string on each call. Create matching helper functions. I.e., __iso_wctomb, __iso_mbtowc, __cp_wctomb and __cp_mbtowc are functions returning the right function pointer now. - Create __WCTOMB/__MBTOWC macros utilizing per-reent locale and replace calls to __wctomb/__mbtowc with calls to __WCTOMB/__MBTOWC. - Drop global __wctomb/__mbtowc vars. - Utilize aforementioned changes in Cygwin to get rid of charset in other, calling functions and simplify the code. - In Cygwin restrict global cygheap locale info to the job performed by internal_setlocale. Use UTF-8 instead of ASCII on the fly in internal conversion functions. - In Cygwin dll_entry, make sure to initialize a TLS area with a NULL _REENT->_locale pointer. Add comment to explain why. Signed-off by: Corinna Vinschen <corinna@vinschen.de>
82 lines
1.9 KiB
C
82 lines
1.9 KiB
C
/*
|
|
FUNCTION
|
|
<<mblen>>---minimal multibyte length function
|
|
|
|
INDEX
|
|
mblen
|
|
|
|
ANSI_SYNOPSIS
|
|
#include <stdlib.h>
|
|
int mblen(const char *<[s]>, size_t <[n]>);
|
|
|
|
TRAD_SYNOPSIS
|
|
#include <stdlib.h>
|
|
int mblen(<[s]>, <[n]>)
|
|
const char *<[s]>;
|
|
size_t <[n]>;
|
|
|
|
DESCRIPTION
|
|
When _MB_CAPABLE is not defined, this is a minimal ANSI-conforming
|
|
implementation of <<mblen>>. In this case, the
|
|
only ``multi-byte character sequences'' recognized are single bytes,
|
|
and thus <<1>> is returned unless <[s]> is the null pointer,
|
|
points to the empty string, or <[n]> is 0.
|
|
|
|
When _MB_CAPABLE is defined, this routine calls <<_mbtowc_r>> to perform
|
|
the conversion, passing a state variable to allow state dependent
|
|
decoding. The result is based on the locale setting which may
|
|
be restricted to a defined set of locales.
|
|
|
|
RETURNS
|
|
This implementation of <<mblen>> returns <<0>> if
|
|
<[s]> is <<NULL>> or the empty string; it returns <<1>> if not _MB_CAPABLE or
|
|
the character is a single-byte character; it returns <<-1>>
|
|
if the multi-byte character is invalid; otherwise it returns
|
|
the number of bytes in the multibyte character.
|
|
|
|
PORTABILITY
|
|
<<mblen>> is required in the ANSI C standard. However, the precise
|
|
effects vary with the locale.
|
|
|
|
<<mblen>> requires no supporting OS subroutines.
|
|
*/
|
|
|
|
#ifndef _REENT_ONLY
|
|
|
|
#include <newlib.h>
|
|
#include <stdlib.h>
|
|
#include <wchar.h>
|
|
#include "local.h"
|
|
|
|
int
|
|
_DEFUN (mblen, (s, n),
|
|
const char *s _AND
|
|
size_t n)
|
|
{
|
|
#ifdef _MB_CAPABLE
|
|
int retval = 0;
|
|
struct _reent *reent = _REENT;
|
|
mbstate_t *state;
|
|
|
|
_REENT_CHECK_MISC(reent);
|
|
state = &(_REENT_MBLEN_STATE(reent));
|
|
retval = __MBTOWC (reent, NULL, s, n, state);
|
|
if (retval < 0)
|
|
{
|
|
state->__count = 0;
|
|
return -1;
|
|
}
|
|
else
|
|
return retval;
|
|
|
|
#else /* not _MB_CAPABLE */
|
|
if (s == NULL || *s == '\0')
|
|
return 0;
|
|
if (n == 0)
|
|
return -1;
|
|
return 1;
|
|
#endif /* not _MB_CAPABLE */
|
|
}
|
|
|
|
#endif /* !_REENT_ONLY */
|