xref: /minix3/lib/libc/citrus/modules/citrus_utf8.c (revision 84d9c625bfea59e274550651111ae9edfdc40fbd)
1*84d9c625SLionel Sambuc /*	$NetBSD: citrus_utf8.c,v 1.18 2013/05/28 16:57:56 joerg Exp $	*/
22fe8fb19SBen Gras 
32fe8fb19SBen Gras /*-
42fe8fb19SBen Gras  * Copyright (c)2002 Citrus Project,
52fe8fb19SBen Gras  * All rights reserved.
62fe8fb19SBen Gras  *
72fe8fb19SBen Gras  * Redistribution and use in source and binary forms, with or without
82fe8fb19SBen Gras  * modification, are permitted provided that the following conditions
92fe8fb19SBen Gras  * are met:
102fe8fb19SBen Gras  * 1. Redistributions of source code must retain the above copyright
112fe8fb19SBen Gras  *    notice, this list of conditions and the following disclaimer.
122fe8fb19SBen Gras  * 2. Redistributions in binary form must reproduce the above copyright
132fe8fb19SBen Gras  *    notice, this list of conditions and the following disclaimer in the
142fe8fb19SBen Gras  *    documentation and/or other materials provided with the distribution.
152fe8fb19SBen Gras  *
162fe8fb19SBen Gras  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
172fe8fb19SBen Gras  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
182fe8fb19SBen Gras  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
192fe8fb19SBen Gras  * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
202fe8fb19SBen Gras  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
212fe8fb19SBen Gras  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
222fe8fb19SBen Gras  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
232fe8fb19SBen Gras  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
242fe8fb19SBen Gras  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
252fe8fb19SBen Gras  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
262fe8fb19SBen Gras  * SUCH DAMAGE.
272fe8fb19SBen Gras  */
282fe8fb19SBen Gras 
292fe8fb19SBen Gras /*-
302fe8fb19SBen Gras  * Copyright (c) 1993
312fe8fb19SBen Gras  *	The Regents of the University of California.  All rights reserved.
322fe8fb19SBen Gras  *
332fe8fb19SBen Gras  * This code is derived from software contributed to Berkeley by
342fe8fb19SBen Gras  * Paul Borman at Krystal Technologies.
352fe8fb19SBen Gras  *
362fe8fb19SBen Gras  * Redistribution and use in source and binary forms, with or without
372fe8fb19SBen Gras  * modification, are permitted provided that the following conditions
382fe8fb19SBen Gras  * are met:
392fe8fb19SBen Gras  * 1. Redistributions of source code must retain the above copyright
402fe8fb19SBen Gras  *    notice, this list of conditions and the following disclaimer.
412fe8fb19SBen Gras  * 2. Redistributions in binary form must reproduce the above copyright
422fe8fb19SBen Gras  *    notice, this list of conditions and the following disclaimer in the
432fe8fb19SBen Gras  *    documentation and/or other materials provided with the distribution.
442fe8fb19SBen Gras  * 3. Neither the name of the University nor the names of its contributors
452fe8fb19SBen Gras  *    may be used to endorse or promote products derived from this software
462fe8fb19SBen Gras  *    without specific prior written permission.
472fe8fb19SBen Gras  *
482fe8fb19SBen Gras  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
492fe8fb19SBen Gras  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
502fe8fb19SBen Gras  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
512fe8fb19SBen Gras  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
522fe8fb19SBen Gras  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
532fe8fb19SBen Gras  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
542fe8fb19SBen Gras  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
552fe8fb19SBen Gras  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
562fe8fb19SBen Gras  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
572fe8fb19SBen Gras  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
582fe8fb19SBen Gras  * SUCH DAMAGE.
592fe8fb19SBen Gras  */
602fe8fb19SBen Gras 
612fe8fb19SBen Gras #include <sys/cdefs.h>
622fe8fb19SBen Gras #if defined(LIBC_SCCS) && !defined(lint)
63*84d9c625SLionel Sambuc __RCSID("$NetBSD: citrus_utf8.c,v 1.18 2013/05/28 16:57:56 joerg Exp $");
642fe8fb19SBen Gras #endif /* LIBC_SCCS and not lint */
652fe8fb19SBen Gras 
662fe8fb19SBen Gras #include <assert.h>
672fe8fb19SBen Gras #include <errno.h>
682fe8fb19SBen Gras #include <string.h>
692fe8fb19SBen Gras #include <stdio.h>
702fe8fb19SBen Gras #include <stdlib.h>
712fe8fb19SBen Gras #include <stddef.h>
722fe8fb19SBen Gras #include <wchar.h>
732fe8fb19SBen Gras #include <sys/types.h>
742fe8fb19SBen Gras #include <limits.h>
752fe8fb19SBen Gras 
762fe8fb19SBen Gras #include "citrus_namespace.h"
772fe8fb19SBen Gras #include "citrus_types.h"
782fe8fb19SBen Gras #include "citrus_module.h"
792fe8fb19SBen Gras #include "citrus_ctype.h"
802fe8fb19SBen Gras #include "citrus_stdenc.h"
812fe8fb19SBen Gras #include "citrus_utf8.h"
822fe8fb19SBen Gras 
832fe8fb19SBen Gras 
/* ----------------------------------------------------------------------
 * private definitions used by the template headers
 */
872fe8fb19SBen Gras 
/*
 * Lead-byte length table.  _UTF8_init_count() fills it so that entry b
 * holds the total length of a sequence whose first byte is b, or 0 when
 * b cannot start a sequence.
 */
static int _UTF8_count_array[256];

/* NULL until _UTF8_init_count() has run; afterwards points at the table. */
static const int *_UTF8_count = NULL;

/*
 * Value boundaries per encoded length: a value v is encoded in k bytes
 * when _UTF8_range[k] <= v < _UTF8_range[k + 1], for k = 1..6.
 */
static const u_int32_t _UTF8_range[] = {
	0,	/* dummy, so that the index equals the byte count */
	0x00000000, 0x00000080, 0x00000800, 0x00010000,
	0x00200000, 0x04000000, 0x80000000,
};
962fe8fb19SBen Gras 
/*
 * Conversion state: the bytes of a multibyte character that has been
 * started but not yet completed.
 */
typedef struct {
	char ch[6];	/* bytes collected so far */
	int chlen;	/* number of bytes held in ch[]; 0 means nothing pending */
} _UTF8State;

/* Per-encoding information; this struct has no members. */
typedef struct {
} _UTF8EncodingInfo;

/*
 * ctype-side container: the encoding information plus one private
 * conversion state per stateful libc entry point.
 */
typedef struct {
	_UTF8EncodingInfo	ei;
	struct {
		/* for future multi-locale facility */
		_UTF8State	s_mblen;
		_UTF8State	s_mbrlen;
		_UTF8State	s_mbrtowc;
		_UTF8State	s_mbtowc;
		_UTF8State	s_mbsrtowcs;
		_UTF8State	s_mbsnrtowcs;
		_UTF8State	s_wcrtomb;
		_UTF8State	s_wcsrtombs;
		_UTF8State	s_wcsnrtombs;
		_UTF8State	s_wctomb;
	} states;
} _UTF8CTypeInfo;
1212fe8fb19SBen Gras 
/* Accessors from a _UTF8CTypeInfo pointer to its parts. */
#define _CEI_TO_EI(_cei_)		(&(_cei_)->ei)
#define _CEI_TO_STATE(_ei_, _func_)	(_ei_)->states.s_##_func_

/*
 * Names and properties of this encoding; these are defined before the
 * template headers are included further down in this file.
 */
#define _FUNCNAME(m)			_citrus_UTF8_##m
#define _ENCODING_INFO			_UTF8EncodingInfo
#define _CTYPE_INFO			_UTF8CTypeInfo
#define _ENCODING_STATE			_UTF8State
/* longest sequence handled here is six bytes */
#define _ENCODING_MB_CUR_MAX(_ei_)	6
#define _ENCODING_IS_STATE_DEPENDENT	0
#define _STATE_NEEDS_EXPLICIT_INIT(_ps_)	0
1322fe8fb19SBen Gras 
1332fe8fb19SBen Gras 
1342fe8fb19SBen Gras static __inline void
_UTF8_init_count(void)1352fe8fb19SBen Gras _UTF8_init_count(void)
1362fe8fb19SBen Gras {
1372fe8fb19SBen Gras 	int i;
1382fe8fb19SBen Gras 	if (!_UTF8_count) {
1392fe8fb19SBen Gras 		memset(_UTF8_count_array, 0, sizeof(_UTF8_count_array));
1402fe8fb19SBen Gras 		for (i = 0; i <= 0x7f; i++)
1412fe8fb19SBen Gras 			_UTF8_count_array[i] = 1;
1422fe8fb19SBen Gras 		for (i = 0xc0; i <= 0xdf; i++)
1432fe8fb19SBen Gras 			_UTF8_count_array[i] = 2;
1442fe8fb19SBen Gras 		for (i = 0xe0; i <= 0xef; i++)
1452fe8fb19SBen Gras 			_UTF8_count_array[i] = 3;
1462fe8fb19SBen Gras 		for (i = 0xf0; i <= 0xf7; i++)
1472fe8fb19SBen Gras 			_UTF8_count_array[i] = 4;
1482fe8fb19SBen Gras 		for (i = 0xf8; i <= 0xfb; i++)
1492fe8fb19SBen Gras 			_UTF8_count_array[i] = 5;
1502fe8fb19SBen Gras 		for (i = 0xfc; i <= 0xfd; i++)
1512fe8fb19SBen Gras 			_UTF8_count_array[i] = 6;
1522fe8fb19SBen Gras 		_UTF8_count = _UTF8_count_array;
1532fe8fb19SBen Gras 	}
1542fe8fb19SBen Gras }
1552fe8fb19SBen Gras 
1562fe8fb19SBen Gras static int
_UTF8_findlen(wchar_t v)1572fe8fb19SBen Gras _UTF8_findlen(wchar_t v)
1582fe8fb19SBen Gras {
1592fe8fb19SBen Gras 	int i;
1602fe8fb19SBen Gras 	u_int32_t c;
1612fe8fb19SBen Gras 
1622fe8fb19SBen Gras 	c = (u_int32_t)v;	/*XXX*/
1632fe8fb19SBen Gras 	for (i = 1; i < sizeof(_UTF8_range) / sizeof(_UTF8_range[0]) - 1; i++)
1642fe8fb19SBen Gras 		if (c >= _UTF8_range[i] && c < _UTF8_range[i + 1])
1652fe8fb19SBen Gras 			return i;
1662fe8fb19SBen Gras 
1672fe8fb19SBen Gras 	return -1;	/*out of range*/
1682fe8fb19SBen Gras }
1692fe8fb19SBen Gras 
/* Return 1 when wc lies in the range 0xd800..0xdfff, 0 otherwise. */
static __inline int
_UTF8_surrogate(wchar_t wc)
{
	if (wc < 0xd800)
		return 0;
	return wc <= 0xdfff;
}
1752fe8fb19SBen Gras 
1762fe8fb19SBen Gras static __inline void
1772fe8fb19SBen Gras /*ARGSUSED*/
_citrus_UTF8_init_state(_UTF8EncodingInfo * ei,_UTF8State * s)1782fe8fb19SBen Gras _citrus_UTF8_init_state(_UTF8EncodingInfo *ei, _UTF8State *s)
1792fe8fb19SBen Gras {
1802fe8fb19SBen Gras 	s->chlen = 0;
1812fe8fb19SBen Gras }
1822fe8fb19SBen Gras 
1832fe8fb19SBen Gras static __inline void
1842fe8fb19SBen Gras /*ARGSUSED*/
_citrus_UTF8_pack_state(_UTF8EncodingInfo * ei,void * pspriv,const _UTF8State * s)1852fe8fb19SBen Gras _citrus_UTF8_pack_state(_UTF8EncodingInfo *ei, void *pspriv,
1862fe8fb19SBen Gras 			const _UTF8State *s)
1872fe8fb19SBen Gras {
1882fe8fb19SBen Gras 	memcpy(pspriv, (const void *)s, sizeof(*s));
1892fe8fb19SBen Gras }
1902fe8fb19SBen Gras 
1912fe8fb19SBen Gras static __inline void
1922fe8fb19SBen Gras /*ARGSUSED*/
_citrus_UTF8_unpack_state(_UTF8EncodingInfo * ei,_UTF8State * s,const void * pspriv)1932fe8fb19SBen Gras _citrus_UTF8_unpack_state(_UTF8EncodingInfo *ei, _UTF8State *s,
1942fe8fb19SBen Gras 			  const void *pspriv)
1952fe8fb19SBen Gras {
1962fe8fb19SBen Gras 	memcpy((void *)s, pspriv, sizeof(*s));
1972fe8fb19SBen Gras }
1982fe8fb19SBen Gras 
1992fe8fb19SBen Gras static int
_citrus_UTF8_mbrtowc_priv(_UTF8EncodingInfo * ei,wchar_t * pwc,const char ** s,size_t n,_UTF8State * psenc,size_t * nresult)2002fe8fb19SBen Gras _citrus_UTF8_mbrtowc_priv(_UTF8EncodingInfo *ei, wchar_t *pwc, const char **s,
2012fe8fb19SBen Gras 			  size_t n, _UTF8State *psenc, size_t *nresult)
2022fe8fb19SBen Gras {
2032fe8fb19SBen Gras 	wchar_t wchar;
2042fe8fb19SBen Gras 	const char *s0;
2052fe8fb19SBen Gras 	int c;
2062fe8fb19SBen Gras 	int i;
2072fe8fb19SBen Gras 
2082fe8fb19SBen Gras 	_DIAGASSERT(nresult != 0);
2092fe8fb19SBen Gras 	_DIAGASSERT(s != NULL);
2102fe8fb19SBen Gras 	_DIAGASSERT(psenc != NULL);
2112fe8fb19SBen Gras 
2122fe8fb19SBen Gras 	s0 = *s;
2132fe8fb19SBen Gras 
2142fe8fb19SBen Gras 	if (s0 == NULL) {
2152fe8fb19SBen Gras 		_citrus_UTF8_init_state(ei, psenc);
2162fe8fb19SBen Gras 		*nresult = 0; /* state independent */
2172fe8fb19SBen Gras 		return 0;
2182fe8fb19SBen Gras 	}
2192fe8fb19SBen Gras 
2202fe8fb19SBen Gras 	/* make sure we have the first byte in the buffer */
2212fe8fb19SBen Gras 	if (psenc->chlen == 0) {
2222fe8fb19SBen Gras 		if (n-- < 1)
2232fe8fb19SBen Gras 			goto restart;
2242fe8fb19SBen Gras 		psenc->ch[psenc->chlen++] = *s0++;
2252fe8fb19SBen Gras 	}
2262fe8fb19SBen Gras 
2272fe8fb19SBen Gras 	c = _UTF8_count[psenc->ch[0] & 0xff];
2282fe8fb19SBen Gras 	if (c < 1 || c < psenc->chlen)
2292fe8fb19SBen Gras 		goto ilseq;
2302fe8fb19SBen Gras 
2312fe8fb19SBen Gras 	if (c == 1)
2322fe8fb19SBen Gras 		wchar = psenc->ch[0] & 0xff;
2332fe8fb19SBen Gras 	else {
2342fe8fb19SBen Gras 		while (psenc->chlen < c) {
2352fe8fb19SBen Gras 			if (n-- < 1)
2362fe8fb19SBen Gras 				goto restart;
2372fe8fb19SBen Gras 			psenc->ch[psenc->chlen++] = *s0++;
2382fe8fb19SBen Gras 		}
2392fe8fb19SBen Gras 		wchar = psenc->ch[0] & (0x7f >> c);
2402fe8fb19SBen Gras 		for (i = 1; i < c; i++) {
2412fe8fb19SBen Gras 			if ((psenc->ch[i] & 0xc0) != 0x80)
2422fe8fb19SBen Gras 				goto ilseq;
2432fe8fb19SBen Gras 			wchar <<= 6;
2442fe8fb19SBen Gras 			wchar |= (psenc->ch[i] & 0x3f);
2452fe8fb19SBen Gras 		}
2462fe8fb19SBen Gras 		if (_UTF8_surrogate(wchar) || _UTF8_findlen(wchar) != c)
2472fe8fb19SBen Gras 			goto ilseq;
2482fe8fb19SBen Gras 	}
2492fe8fb19SBen Gras 	if (pwc != NULL)
2502fe8fb19SBen Gras 		*pwc = wchar;
2512fe8fb19SBen Gras 	*nresult = (wchar == 0) ? 0 : s0 - *s;
2522fe8fb19SBen Gras 	*s = s0;
2532fe8fb19SBen Gras 	psenc->chlen = 0;
2542fe8fb19SBen Gras 
2552fe8fb19SBen Gras 	return 0;
2562fe8fb19SBen Gras 
2572fe8fb19SBen Gras ilseq:
2582fe8fb19SBen Gras 	*nresult = (size_t)-1;
2592fe8fb19SBen Gras 	return EILSEQ;
2602fe8fb19SBen Gras 
2612fe8fb19SBen Gras restart:
2622fe8fb19SBen Gras 	*s = s0;
2632fe8fb19SBen Gras 	*nresult = (size_t)-2;
2642fe8fb19SBen Gras 	return 0;
2652fe8fb19SBen Gras }
2662fe8fb19SBen Gras 
2672fe8fb19SBen Gras static int
_citrus_UTF8_wcrtomb_priv(_UTF8EncodingInfo * ei,char * s,size_t n,wchar_t wc,_UTF8State * psenc,size_t * nresult)2682fe8fb19SBen Gras _citrus_UTF8_wcrtomb_priv(_UTF8EncodingInfo *ei, char *s, size_t n, wchar_t wc,
2692fe8fb19SBen Gras 			  _UTF8State *psenc, size_t *nresult)
2702fe8fb19SBen Gras {
2712fe8fb19SBen Gras 	int cnt, i, ret;
2722fe8fb19SBen Gras 	wchar_t c;
2732fe8fb19SBen Gras 
2742fe8fb19SBen Gras 	_DIAGASSERT(nresult != 0);
2752fe8fb19SBen Gras 	_DIAGASSERT(s != NULL);
2762fe8fb19SBen Gras 
2772fe8fb19SBen Gras 	if (_UTF8_surrogate(wc)) {
2782fe8fb19SBen Gras 		ret = EILSEQ;
2792fe8fb19SBen Gras 		goto err;
2802fe8fb19SBen Gras 	}
2812fe8fb19SBen Gras 	cnt = _UTF8_findlen(wc);
2822fe8fb19SBen Gras 	if (cnt <= 0 || cnt > 6) {
2832fe8fb19SBen Gras 		/* invalid UCS4 value */
2842fe8fb19SBen Gras 		ret = EILSEQ;
2852fe8fb19SBen Gras 		goto err;
2862fe8fb19SBen Gras 	}
2872fe8fb19SBen Gras 	if (n < cnt) {
2882fe8fb19SBen Gras 		/* bound check failure */
2892fe8fb19SBen Gras 		ret = E2BIG;
2902fe8fb19SBen Gras 		goto err;
2912fe8fb19SBen Gras 	}
2922fe8fb19SBen Gras 
2932fe8fb19SBen Gras 	c = wc;
2942fe8fb19SBen Gras 	if (s) {
2952fe8fb19SBen Gras 		for (i = cnt - 1; i > 0; i--) {
2962fe8fb19SBen Gras 			s[i] = 0x80 | (c & 0x3f);
2972fe8fb19SBen Gras 			c >>= 6;
2982fe8fb19SBen Gras 		}
2992fe8fb19SBen Gras 		s[0] = c;
3002fe8fb19SBen Gras 		if (cnt == 1)
3012fe8fb19SBen Gras 			s[0] &= 0x7f;
3022fe8fb19SBen Gras 		else {
3032fe8fb19SBen Gras 			s[0] &= (0x7f >> cnt);
3042fe8fb19SBen Gras 			s[0] |= ((0xff00 >> cnt) & 0xff);
3052fe8fb19SBen Gras 		}
3062fe8fb19SBen Gras 	}
3072fe8fb19SBen Gras 
3082fe8fb19SBen Gras 	*nresult = (size_t)cnt;
3092fe8fb19SBen Gras 	return 0;
3102fe8fb19SBen Gras 
3112fe8fb19SBen Gras err:
3122fe8fb19SBen Gras 	*nresult = (size_t)-1;
3132fe8fb19SBen Gras 	return ret;
3142fe8fb19SBen Gras }
3152fe8fb19SBen Gras 
3162fe8fb19SBen Gras static __inline int
3172fe8fb19SBen Gras /*ARGSUSED*/
_citrus_UTF8_stdenc_wctocs(_UTF8EncodingInfo * __restrict ei,_csid_t * __restrict csid,_index_t * __restrict idx,wchar_t wc)3182fe8fb19SBen Gras _citrus_UTF8_stdenc_wctocs(_UTF8EncodingInfo * __restrict ei,
3192fe8fb19SBen Gras 			   _csid_t * __restrict csid,
3202fe8fb19SBen Gras 			   _index_t * __restrict idx,
3212fe8fb19SBen Gras 			   wchar_t wc)
3222fe8fb19SBen Gras {
3232fe8fb19SBen Gras 
3242fe8fb19SBen Gras 	_DIAGASSERT(csid != NULL && idx != NULL);
3252fe8fb19SBen Gras 
3262fe8fb19SBen Gras 	*csid = 0;
3272fe8fb19SBen Gras 	*idx = (_citrus_index_t)wc;
3282fe8fb19SBen Gras 
3292fe8fb19SBen Gras 	return (0);
3302fe8fb19SBen Gras }
3312fe8fb19SBen Gras 
3322fe8fb19SBen Gras static __inline int
3332fe8fb19SBen Gras /*ARGSUSED*/
_citrus_UTF8_stdenc_cstowc(_UTF8EncodingInfo * __restrict ei,wchar_t * __restrict wc,_csid_t csid,_index_t idx)3342fe8fb19SBen Gras _citrus_UTF8_stdenc_cstowc(_UTF8EncodingInfo * __restrict ei,
3352fe8fb19SBen Gras 			   wchar_t * __restrict wc,
3362fe8fb19SBen Gras 			   _csid_t csid, _index_t idx)
3372fe8fb19SBen Gras {
3382fe8fb19SBen Gras 
3392fe8fb19SBen Gras 	_DIAGASSERT(wc != NULL);
3402fe8fb19SBen Gras 
3412fe8fb19SBen Gras 	if (csid != 0)
3422fe8fb19SBen Gras 		return (EILSEQ);
3432fe8fb19SBen Gras 
3442fe8fb19SBen Gras 	*wc = (wchar_t)idx;
3452fe8fb19SBen Gras 
3462fe8fb19SBen Gras 	return (0);
3472fe8fb19SBen Gras }
3482fe8fb19SBen Gras 
3492fe8fb19SBen Gras static __inline int
3502fe8fb19SBen Gras /*ARGSUSED*/
_citrus_UTF8_stdenc_get_state_desc_generic(_UTF8EncodingInfo * __restrict ei,_UTF8State * __restrict psenc,int * __restrict rstate)3512fe8fb19SBen Gras _citrus_UTF8_stdenc_get_state_desc_generic(_UTF8EncodingInfo * __restrict ei,
3522fe8fb19SBen Gras 					   _UTF8State * __restrict psenc,
3532fe8fb19SBen Gras 					   int * __restrict rstate)
3542fe8fb19SBen Gras {
3552fe8fb19SBen Gras 
3562fe8fb19SBen Gras 	if (psenc->chlen == 0)
3572fe8fb19SBen Gras 		*rstate = _STDENC_SDGEN_INITIAL;
3582fe8fb19SBen Gras 	else
3592fe8fb19SBen Gras 		*rstate = _STDENC_SDGEN_INCOMPLETE_CHAR;
3602fe8fb19SBen Gras 
3612fe8fb19SBen Gras 	return 0;
3622fe8fb19SBen Gras }
3632fe8fb19SBen Gras 
3642fe8fb19SBen Gras static int
3652fe8fb19SBen Gras /*ARGSUSED*/
_citrus_UTF8_encoding_module_init(_UTF8EncodingInfo * __restrict ei,const void * __restrict var,size_t lenvar)3662fe8fb19SBen Gras _citrus_UTF8_encoding_module_init(_UTF8EncodingInfo * __restrict ei,
3672fe8fb19SBen Gras 				  const void * __restrict var, size_t lenvar)
3682fe8fb19SBen Gras {
3692fe8fb19SBen Gras 	_UTF8_init_count();
3702fe8fb19SBen Gras 
3712fe8fb19SBen Gras 	return 0;
3722fe8fb19SBen Gras }
3732fe8fb19SBen Gras 
3742fe8fb19SBen Gras static void
3752fe8fb19SBen Gras /*ARGSUSED*/
_citrus_UTF8_encoding_module_uninit(_UTF8EncodingInfo * ei)3762fe8fb19SBen Gras _citrus_UTF8_encoding_module_uninit(_UTF8EncodingInfo *ei)
3772fe8fb19SBen Gras {
3782fe8fb19SBen Gras }
3792fe8fb19SBen Gras 
3802fe8fb19SBen Gras 
3812fe8fb19SBen Gras /* ----------------------------------------------------------------------
3822fe8fb19SBen Gras  * public interface for ctype
3832fe8fb19SBen Gras  */
3842fe8fb19SBen Gras 
3852fe8fb19SBen Gras _CITRUS_CTYPE_DECLS(UTF8);
3862fe8fb19SBen Gras _CITRUS_CTYPE_DEF_OPS(UTF8);
3872fe8fb19SBen Gras 
3882fe8fb19SBen Gras #include "citrus_ctype_template.h"
3892fe8fb19SBen Gras 
3902fe8fb19SBen Gras /* ----------------------------------------------------------------------
3912fe8fb19SBen Gras  * public interface for stdenc
3922fe8fb19SBen Gras  */
3932fe8fb19SBen Gras 
3942fe8fb19SBen Gras _CITRUS_STDENC_DECLS(UTF8);
3952fe8fb19SBen Gras _CITRUS_STDENC_DEF_OPS(UTF8);
3962fe8fb19SBen Gras 
3972fe8fb19SBen Gras #include "citrus_stdenc_template.h"
398