/* Convert the next multibyte character of S (looking at no more than N
   bytes) into UTF-16 code units, one code unit per call.

   PC16  where the produced 16-bit unit is stored.  It is ignored for the
         result of a normal conversion when NULL, and it is forced to NULL
         when S is NULL.
   S     the multibyte input; NULL is treated like the string "" with
         N == 1.
   N     upper bound on the number of input bytes to inspect.
   PS    conversion state; when NULL the object `state' (defined outside
         this function) is used instead.

   Visible return values: (size_t) -3 when the pending second half of a
   surrogate pair is handed out; otherwise RESULT is set to 0 when the
   NUL character was converted or to the number of input bytes consumed.
   The high bit of PS->__count marks "second surrogate pending" and
   PS->__value.__wch holds that pending unit.  */
size_t
mbrtoc16 (char16_t *pc16, const char *s, size_t n, mbstate_t *ps)
{
  if (ps == NULL)
    ps = &state;

  /* The standard text does not say that S being NULL means the state
     is reset even if the second half of a surrogate still has to be
     returned.  In fact, the error code description indicates
     otherwise.  Therefore always first try to return a second
     half.  */
  if (ps->__count & 0x80000000)
    {
      /* We have to return the second word for a surrogate.  Clear the
         "pending" flag, hand out the stored unit and wipe it from the
         state.  NOTE(review): PC16 is dereferenced here without a NULL
         check, unlike the paths below -- confirm this is intended.  */
      ps->__count &= 0x7fffffff;
      *pc16 = ps->__value.__wch;
      ps->__value.__wch = L'\0';
      return (size_t) -3;
    }

  wchar_t wc;
  struct __gconv_step_data data;
  int status;
  size_t result;
  size_t dummy;
  const unsigned char *inbuf, *endbuf;
  /* The conversion step writes its single wide character directly
     into WC.  */
  unsigned char *outbuf = (unsigned char *) &wc;
  const struct gconv_fcts *fcts;

  /* Set information for this step.  */
  data.__invocation_counter = 0;
  data.__internal_use = 1;
  data.__flags = __GCONV_IS_LAST;
  data.__statep = ps;
  data.__trans = NULL;

  /* A first special case is if S is NULL.  This means put PS in the
     initial state.  This is done by converting the empty string and
     discarding the result (PC16 is set to NULL).  */
  if (s == NULL)
    {
      pc16 = NULL;
      s = "";
      n = 1;
    }

  /* Tell where we want the result: room for exactly one wchar_t.  */
  data.__outbuf = outbuf;
  data.__outbufend = outbuf + sizeof (wchar_t);

  /* Get the conversion functions.  */
  fcts = get_gconv_fcts (_NL_CURRENT_DATA (LC_CTYPE));

  /* Do a normal conversion.  */
  inbuf = (const unsigned char *) s;
  endbuf = inbuf + n;
  /* If INBUF + N wrapped around, clamp the end to the highest address.
     If INBUF already is that address there is no input at all and the
     code jumps to the `ilseq' label.  */
  if (__glibc_unlikely (endbuf < inbuf))
    {
      endbuf = (const unsigned char *) ~(uintptr_t) 0;
      if (endbuf == inbuf)
        goto ilseq;
    }
  __gconv_fct fct = fcts->towc->__fct;
  /* The function pointer is demangled only when the step has a shared
     object handle.  */
#ifdef PTR_DEMANGLE
  if (fcts->towc->__shlib_handle != NULL)
    PTR_DEMANGLE (fct);
#endif

  status = DL_CALL_FCT (fct, (fcts->towc, &data, &inbuf, endbuf,
                              NULL, &dummy, 0, 1));

  /* There must not be any problems with the conversion but illegal
     input characters.  The output buffer must be large enough,
     otherwise the definition of MB_CUR_MAX is not correct.  All the
     other possible errors also must not happen.  */
  assert (status == __GCONV_OK || status == __GCONV_EMPTY_INPUT
          || status == __GCONV_ILLEGAL_INPUT
          || status == __GCONV_INCOMPLETE_INPUT
          || status == __GCONV_FULL_OUTPUT);

  if (status == __GCONV_OK || status == __GCONV_EMPTY_INPUT
      || status == __GCONV_FULL_OUTPUT)
    {
      /* Number of input bytes the conversion step consumed.  */
      result = inbuf - (const unsigned char *) s;

      if (wc < 0x10000)
        {
          /* The character fits into a single 16-bit unit.  */
          if (pc16 != NULL)
            *pc16 = wc;

          /* Only treat WC as a converted NUL if the step actually
             advanced its output pointer.  */
          if (data.__outbuf != outbuf && wc == L'\0')
            {
              /* The converted character is the NUL character.  */
              assert (__mbsinit (data.__statep));
              result = 0;
            }
        }
      else
        {
          /* This is a surrogate.  Return the high half now;
             0xd7c0 + (wc >> 10) equals 0xd800 + ((wc - 0x10000) >> 10).
             The low half is stored in the state and flagged as pending
             so the next call returns it.  */
          if (pc16 != NULL)
            *pc16 = 0xd7c0 + (wc >> 10);

          ps->__count |= 0x80000000;
          ps->__value.__wch = 0xdc00 + (wc & 0x3ff);
        }
    }
  /* NOTE(review): the function body is not closed at this point in the
     file: the handling of the remaining status values, the `ilseq'
     label targeted above and the final return are missing here --
     confirm against the complete source.  */
size_t __mbrtowc (wchar_t *pwc, const char *s, size_t n, mbstate_t *ps) { wchar_t buf[1]; struct __gconv_step_data data; int status; size_t result; size_t dummy; const unsigned char *inbuf; char *outbuf = (char *) (pwc ?: buf); /* Set information for this step. */ data.__invocation_counter = 0; data.__internal_use = 1; data.__flags = __GCONV_IS_LAST; data.__statep = ps ?: &state; data.__trans = NULL; /* A first special case is if S is NULL. This means put PS in the initial state. */ if (s == NULL) { outbuf = (char *) buf; s = ""; n = 1; } /* Tell where we want the result. */ data.__outbuf = outbuf; data.__outbufend = outbuf + sizeof (wchar_t); /* Make sure we use the correct function. */ update_conversion_ptrs (); /* Do a normal conversion. */ inbuf = (const unsigned char *) s; status = DL_CALL_FCT (__wcsmbs_gconv_fcts.towc->__fct, (__wcsmbs_gconv_fcts.towc, &data, &inbuf, inbuf + n, NULL, &dummy, 0, 1)); /* There must not be any problems with the conversion but illegal input characters. The output buffer must be large enough, otherwise the definition of MB_CUR_MAX is not correct. All the other possible errors also must not happen. */ assert (status == __GCONV_OK || status == __GCONV_EMPTY_INPUT || status == __GCONV_ILLEGAL_INPUT || status == __GCONV_INCOMPLETE_INPUT || status == __GCONV_FULL_OUTPUT); if (status == __GCONV_OK || status == __GCONV_EMPTY_INPUT || status == __GCONV_FULL_OUTPUT) { if (data.__outbuf != (unsigned char *) outbuf && *(wchar_t *) outbuf == L'\0') { /* The converted character is the NUL character. */ assert (__mbsinit (data.__statep)); result = 0; } else result = inbuf - (const unsigned char *) s; } else if (status == __GCONV_INCOMPLETE_INPUT) result = (size_t) -2; else { result = (size_t) -1; __set_errno (EILSEQ); } return result; }
/* Convert the NUL-terminated multibyte string *SRC into wide characters
   using the LC_CTYPE conversion functions of locale L.

   DST  output array with room for LEN wide characters, or NULL to only
        count how many wide characters the string would produce.
   SRC  address of the input pointer.  When DST is not NULL it is
        updated to point behind the last byte consumed, or set to NULL
        if the terminating NUL was converted.  It is left untouched
        when DST is NULL.
   LEN  capacity of DST in wide characters; ignored when DST is NULL.
   PS   conversion state.  It must not be NULL.  When DST is NULL the
        function works on a private copy, so *PS is not modified.
   L    locale supplying the conversion functions.

   Returns the number of wide characters produced, not counting a
   terminating NUL, or (size_t) -1 with errno set to EILSEQ if the
   conversion step reports a status other than OK, full output, empty
   input or incomplete input.  */
size_t
attribute_hidden
__mbsrtowcs_l (wchar_t *dst, const char **src, size_t len, mbstate_t *ps,
               locale_t l)
{
  struct __gconv_step_data data;
  size_t result;
  int status;
  struct __gconv_step *towc;
  size_t non_reversible;
  const struct gconv_fcts *fcts;

  /* Set information for this step.  */
  data.__invocation_counter = 0;
  data.__internal_use = 1;
  data.__flags = __GCONV_IS_LAST;
  data.__statep = ps;

  /* Get the conversion functions.  */
  fcts = get_gconv_fcts (l->__locales[LC_CTYPE]);

  /* Get the structure with the function pointers.  */
  towc = fcts->towc;
  __gconv_fct fct = towc->__fct;
  /* The function pointer is demangled only when the step has a shared
     object handle.  */
#ifdef PTR_DEMANGLE
  if (towc->__shlib_handle != NULL)
    PTR_DEMANGLE (fct);
#endif

  /* We have to handle DST == NULL special.  */
  if (dst == NULL)
    {
      mbstate_t temp_state;
      wchar_t buf[64];          /* Just an arbitrary size.  */
      const unsigned char *inbuf = (const unsigned char *) *src;
      /* Include the terminating NUL byte in the input.  */
      const unsigned char *srcend = inbuf + strlen (*src) + 1;

      /* Count on a copy of the state so the caller's state is not
         changed by a pure length query.  */
      temp_state = *data.__statep;
      data.__statep = &temp_state;

      result = 0;
      data.__outbufend = (unsigned char *) buf + sizeof (buf);
      do
        {
          /* Reuse the scratch buffer for every chunk; only the number
             of wide characters written matters.  */
          data.__outbuf = (unsigned char *) buf;

          status = DL_CALL_FCT (fct, (towc, &data, &inbuf, srcend, NULL,
                                      &non_reversible, 0, 1));

          result += (wchar_t *) data.__outbuf - buf;
        }
      while (status == __GCONV_FULL_OUTPUT);

      if (status == __GCONV_OK || status == __GCONV_EMPTY_INPUT)
        {
          /* The last wide character written must be the NUL.  */
          assert (((wchar_t *) data.__outbuf)[-1] == L'\0');
          /* Don't count the NUL character in.  */
          --result;
        }
    }
  else
    {
      /* This code is based on the safe assumption that all internal
         multi-byte encodings use the NUL byte only to mark the end
         of the string.  */
      const unsigned char *srcp = (const unsigned char *) *src;
      const unsigned char *srcend;

      data.__outbuf = (unsigned char *) dst;
      data.__outbufend = data.__outbuf + len * sizeof (wchar_t);

      /* If LEN is zero the loop is skipped; report that as a full
         output buffer.  */
      status = __GCONV_FULL_OUTPUT;

      while (len > 0)
        {
          /* Pessimistic guess as to how much input we can use.  In the
             worst case we need one input byte for one output wchar_t.  */
          srcend = srcp + __strnlen ((const char *) srcp, len) + 1;

          status = DL_CALL_FCT (fct, (towc, &data, &srcp, srcend, NULL,
                                      &non_reversible, 0, 1));
          if ((status != __GCONV_EMPTY_INPUT
               && status != __GCONV_INCOMPLETE_INPUT)
              /* Not all input read.  */
              || srcp != srcend
              /* Reached the end of the input.  */
              || srcend[-1] == '\0')
            break;

          /* Space left in DST, in wide characters.  */
          len = (wchar_t *) data.__outbufend - (wchar_t *) data.__outbuf;
        }

      /* Make the end of the input known to the caller.  */
      *src = (const char *) srcp;

      result = (wchar_t *) data.__outbuf - dst;

      /* We have to determine whether the last character converted
         is the NUL character.  Check that something was written before
         looking at DST[RESULT - 1], so that an empty result can never
         cause a read in front of the buffer.  */
      if ((status == __GCONV_OK || status == __GCONV_EMPTY_INPUT)
          && result > 0
          && ((wchar_t *) dst)[result - 1] == L'\0')
        {
          assert (__mbsinit (data.__statep));
          *src = NULL;
          --result;
        }
    }

  /* There must not be any problems with the conversion but illegal
     input characters.  */
  assert (status == __GCONV_OK || status == __GCONV_EMPTY_INPUT
          || status == __GCONV_ILLEGAL_INPUT
          || status == __GCONV_INCOMPLETE_INPUT
          || status == __GCONV_FULL_OUTPUT);

  if (status != __GCONV_OK && status != __GCONV_FULL_OUTPUT
      && status != __GCONV_EMPTY_INPUT
      && status != __GCONV_INCOMPLETE_INPUT)
    {
      result = (size_t) -1;
      __set_errno (EILSEQ);
    }

  return result;
}