/* $NetBSD: citrus_utf8.c,v 1.18 2013/05/28 16:57:56 joerg Exp $ */

/*-
 * Copyright (c)2002 Citrus Project,
 * All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 *
 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
 * SUCH DAMAGE.
 */
282fe8fb19SBen Gras
/*-
 * Copyright (c) 1993
 * The Regents of the University of California. All rights reserved.
 *
 * This code is derived from software contributed to Berkeley by
 * Paul Borman at Krystal Technologies.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 * 3. Neither the name of the University nor the names of its contributors
 *    may be used to endorse or promote products derived from this software
 *    without specific prior written permission.
 *
 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
 * SUCH DAMAGE.
 */
602fe8fb19SBen Gras
612fe8fb19SBen Gras #include <sys/cdefs.h>
622fe8fb19SBen Gras #if defined(LIBC_SCCS) && !defined(lint)
63*84d9c625SLionel Sambuc __RCSID("$NetBSD: citrus_utf8.c,v 1.18 2013/05/28 16:57:56 joerg Exp $");
642fe8fb19SBen Gras #endif /* LIBC_SCCS and not lint */
652fe8fb19SBen Gras
662fe8fb19SBen Gras #include <assert.h>
672fe8fb19SBen Gras #include <errno.h>
682fe8fb19SBen Gras #include <string.h>
692fe8fb19SBen Gras #include <stdio.h>
702fe8fb19SBen Gras #include <stdlib.h>
712fe8fb19SBen Gras #include <stddef.h>
722fe8fb19SBen Gras #include <wchar.h>
732fe8fb19SBen Gras #include <sys/types.h>
742fe8fb19SBen Gras #include <limits.h>
752fe8fb19SBen Gras
762fe8fb19SBen Gras #include "citrus_namespace.h"
772fe8fb19SBen Gras #include "citrus_types.h"
782fe8fb19SBen Gras #include "citrus_module.h"
792fe8fb19SBen Gras #include "citrus_ctype.h"
802fe8fb19SBen Gras #include "citrus_stdenc.h"
812fe8fb19SBen Gras #include "citrus_utf8.h"
822fe8fb19SBen Gras
832fe8fb19SBen Gras
/* ----------------------------------------------------------------------
 * private stuff used by templates
 */

/*
 * Lead-byte lookup table.  _UTF8_count_array[b] holds the total length in
 * bytes of a sequence whose first byte is b, or 0 when b cannot start a
 * sequence.  _UTF8_count stays NULL until the table has been filled in,
 * after which it points at _UTF8_count_array.
 */
static int _UTF8_count_array[256];
static int const *_UTF8_count = NULL;

/*
 * _UTF8_range[n] is the smallest value that requires an n-byte encoding and
 * _UTF8_range[n + 1] is the exclusive upper bound for n bytes.  Index 0 is
 * a placeholder so that the index equals the byte count.
 */
static const u_int32_t _UTF8_range[] = {
	0, /*dummy*/
	0x00000000, 0x00000080, 0x00000800, 0x00010000,
	0x00200000, 0x04000000, 0x80000000,
};
962fe8fb19SBen Gras
/*
 * Conversion state: the bytes of a multibyte character that has only been
 * partially read so far.
 */
typedef struct {
	char ch[6];	/* bytes collected so far */
	int chlen;	/* number of valid bytes in ch[]; 0 is the initial state */
} _UTF8State;
1012fe8fb19SBen Gras
/*
 * Per-encoding parameters.  This struct has no members; it exists so the
 * shared templates have an encoding-info type to pass around.
 */
typedef struct {
} _UTF8EncodingInfo;
1042fe8fb19SBen Gras
1052fe8fb19SBen Gras typedef struct {
1062fe8fb19SBen Gras _UTF8EncodingInfo ei;
1072fe8fb19SBen Gras struct {
1082fe8fb19SBen Gras /* for future multi-locale facility */
1092fe8fb19SBen Gras _UTF8State s_mblen;
1102fe8fb19SBen Gras _UTF8State s_mbrlen;
1112fe8fb19SBen Gras _UTF8State s_mbrtowc;
1122fe8fb19SBen Gras _UTF8State s_mbtowc;
1132fe8fb19SBen Gras _UTF8State s_mbsrtowcs;
114*84d9c625SLionel Sambuc _UTF8State s_mbsnrtowcs;
1152fe8fb19SBen Gras _UTF8State s_wcrtomb;
1162fe8fb19SBen Gras _UTF8State s_wcsrtombs;
117*84d9c625SLionel Sambuc _UTF8State s_wcsnrtombs;
1182fe8fb19SBen Gras _UTF8State s_wctomb;
1192fe8fb19SBen Gras } states;
1202fe8fb19SBen Gras } _UTF8CTypeInfo;
1212fe8fb19SBen Gras
/* Accessors from a _UTF8CTypeInfo to its encoding info / per-function state. */
#define _CEI_TO_EI(_cei_)		(&(_cei_)->ei)
#define _CEI_TO_STATE(_ei_, _func_)	(_ei_)->states.s_##_func_

/*
 * Configuration consumed by the template headers included at the bottom of
 * this file.
 */
#define _FUNCNAME(m)			_citrus_UTF8_##m
#define _ENCODING_INFO			_UTF8EncodingInfo
#define _CTYPE_INFO			_UTF8CTypeInfo
#define _ENCODING_STATE			_UTF8State
/* longest sequence this module reads or writes is six bytes */
#define _ENCODING_MB_CUR_MAX(_ei_)	6
#define _ENCODING_IS_STATE_DEPENDENT	0
#define _STATE_NEEDS_EXPLICIT_INIT(_ps_)	0
1322fe8fb19SBen Gras
1332fe8fb19SBen Gras
1342fe8fb19SBen Gras static __inline void
_UTF8_init_count(void)1352fe8fb19SBen Gras _UTF8_init_count(void)
1362fe8fb19SBen Gras {
1372fe8fb19SBen Gras int i;
1382fe8fb19SBen Gras if (!_UTF8_count) {
1392fe8fb19SBen Gras memset(_UTF8_count_array, 0, sizeof(_UTF8_count_array));
1402fe8fb19SBen Gras for (i = 0; i <= 0x7f; i++)
1412fe8fb19SBen Gras _UTF8_count_array[i] = 1;
1422fe8fb19SBen Gras for (i = 0xc0; i <= 0xdf; i++)
1432fe8fb19SBen Gras _UTF8_count_array[i] = 2;
1442fe8fb19SBen Gras for (i = 0xe0; i <= 0xef; i++)
1452fe8fb19SBen Gras _UTF8_count_array[i] = 3;
1462fe8fb19SBen Gras for (i = 0xf0; i <= 0xf7; i++)
1472fe8fb19SBen Gras _UTF8_count_array[i] = 4;
1482fe8fb19SBen Gras for (i = 0xf8; i <= 0xfb; i++)
1492fe8fb19SBen Gras _UTF8_count_array[i] = 5;
1502fe8fb19SBen Gras for (i = 0xfc; i <= 0xfd; i++)
1512fe8fb19SBen Gras _UTF8_count_array[i] = 6;
1522fe8fb19SBen Gras _UTF8_count = _UTF8_count_array;
1532fe8fb19SBen Gras }
1542fe8fb19SBen Gras }
1552fe8fb19SBen Gras
1562fe8fb19SBen Gras static int
_UTF8_findlen(wchar_t v)1572fe8fb19SBen Gras _UTF8_findlen(wchar_t v)
1582fe8fb19SBen Gras {
1592fe8fb19SBen Gras int i;
1602fe8fb19SBen Gras u_int32_t c;
1612fe8fb19SBen Gras
1622fe8fb19SBen Gras c = (u_int32_t)v; /*XXX*/
1632fe8fb19SBen Gras for (i = 1; i < sizeof(_UTF8_range) / sizeof(_UTF8_range[0]) - 1; i++)
1642fe8fb19SBen Gras if (c >= _UTF8_range[i] && c < _UTF8_range[i + 1])
1652fe8fb19SBen Gras return i;
1662fe8fb19SBen Gras
1672fe8fb19SBen Gras return -1; /*out of range*/
1682fe8fb19SBen Gras }
1692fe8fb19SBen Gras
/*
 * Return non-zero when wc lies in the range 0xd800..0xdfff (the UTF-16
 * surrogate code points), zero otherwise.
 */
static __inline int
_UTF8_surrogate(wchar_t wc)
{
	return wc >= 0xd800 && wc <= 0xdfff;
}
1752fe8fb19SBen Gras
1762fe8fb19SBen Gras static __inline void
1772fe8fb19SBen Gras /*ARGSUSED*/
_citrus_UTF8_init_state(_UTF8EncodingInfo * ei,_UTF8State * s)1782fe8fb19SBen Gras _citrus_UTF8_init_state(_UTF8EncodingInfo *ei, _UTF8State *s)
1792fe8fb19SBen Gras {
1802fe8fb19SBen Gras s->chlen = 0;
1812fe8fb19SBen Gras }
1822fe8fb19SBen Gras
1832fe8fb19SBen Gras static __inline void
1842fe8fb19SBen Gras /*ARGSUSED*/
_citrus_UTF8_pack_state(_UTF8EncodingInfo * ei,void * pspriv,const _UTF8State * s)1852fe8fb19SBen Gras _citrus_UTF8_pack_state(_UTF8EncodingInfo *ei, void *pspriv,
1862fe8fb19SBen Gras const _UTF8State *s)
1872fe8fb19SBen Gras {
1882fe8fb19SBen Gras memcpy(pspriv, (const void *)s, sizeof(*s));
1892fe8fb19SBen Gras }
1902fe8fb19SBen Gras
1912fe8fb19SBen Gras static __inline void
1922fe8fb19SBen Gras /*ARGSUSED*/
_citrus_UTF8_unpack_state(_UTF8EncodingInfo * ei,_UTF8State * s,const void * pspriv)1932fe8fb19SBen Gras _citrus_UTF8_unpack_state(_UTF8EncodingInfo *ei, _UTF8State *s,
1942fe8fb19SBen Gras const void *pspriv)
1952fe8fb19SBen Gras {
1962fe8fb19SBen Gras memcpy((void *)s, pspriv, sizeof(*s));
1972fe8fb19SBen Gras }
1982fe8fb19SBen Gras
1992fe8fb19SBen Gras static int
_citrus_UTF8_mbrtowc_priv(_UTF8EncodingInfo * ei,wchar_t * pwc,const char ** s,size_t n,_UTF8State * psenc,size_t * nresult)2002fe8fb19SBen Gras _citrus_UTF8_mbrtowc_priv(_UTF8EncodingInfo *ei, wchar_t *pwc, const char **s,
2012fe8fb19SBen Gras size_t n, _UTF8State *psenc, size_t *nresult)
2022fe8fb19SBen Gras {
2032fe8fb19SBen Gras wchar_t wchar;
2042fe8fb19SBen Gras const char *s0;
2052fe8fb19SBen Gras int c;
2062fe8fb19SBen Gras int i;
2072fe8fb19SBen Gras
2082fe8fb19SBen Gras _DIAGASSERT(nresult != 0);
2092fe8fb19SBen Gras _DIAGASSERT(s != NULL);
2102fe8fb19SBen Gras _DIAGASSERT(psenc != NULL);
2112fe8fb19SBen Gras
2122fe8fb19SBen Gras s0 = *s;
2132fe8fb19SBen Gras
2142fe8fb19SBen Gras if (s0 == NULL) {
2152fe8fb19SBen Gras _citrus_UTF8_init_state(ei, psenc);
2162fe8fb19SBen Gras *nresult = 0; /* state independent */
2172fe8fb19SBen Gras return 0;
2182fe8fb19SBen Gras }
2192fe8fb19SBen Gras
2202fe8fb19SBen Gras /* make sure we have the first byte in the buffer */
2212fe8fb19SBen Gras if (psenc->chlen == 0) {
2222fe8fb19SBen Gras if (n-- < 1)
2232fe8fb19SBen Gras goto restart;
2242fe8fb19SBen Gras psenc->ch[psenc->chlen++] = *s0++;
2252fe8fb19SBen Gras }
2262fe8fb19SBen Gras
2272fe8fb19SBen Gras c = _UTF8_count[psenc->ch[0] & 0xff];
2282fe8fb19SBen Gras if (c < 1 || c < psenc->chlen)
2292fe8fb19SBen Gras goto ilseq;
2302fe8fb19SBen Gras
2312fe8fb19SBen Gras if (c == 1)
2322fe8fb19SBen Gras wchar = psenc->ch[0] & 0xff;
2332fe8fb19SBen Gras else {
2342fe8fb19SBen Gras while (psenc->chlen < c) {
2352fe8fb19SBen Gras if (n-- < 1)
2362fe8fb19SBen Gras goto restart;
2372fe8fb19SBen Gras psenc->ch[psenc->chlen++] = *s0++;
2382fe8fb19SBen Gras }
2392fe8fb19SBen Gras wchar = psenc->ch[0] & (0x7f >> c);
2402fe8fb19SBen Gras for (i = 1; i < c; i++) {
2412fe8fb19SBen Gras if ((psenc->ch[i] & 0xc0) != 0x80)
2422fe8fb19SBen Gras goto ilseq;
2432fe8fb19SBen Gras wchar <<= 6;
2442fe8fb19SBen Gras wchar |= (psenc->ch[i] & 0x3f);
2452fe8fb19SBen Gras }
2462fe8fb19SBen Gras if (_UTF8_surrogate(wchar) || _UTF8_findlen(wchar) != c)
2472fe8fb19SBen Gras goto ilseq;
2482fe8fb19SBen Gras }
2492fe8fb19SBen Gras if (pwc != NULL)
2502fe8fb19SBen Gras *pwc = wchar;
2512fe8fb19SBen Gras *nresult = (wchar == 0) ? 0 : s0 - *s;
2522fe8fb19SBen Gras *s = s0;
2532fe8fb19SBen Gras psenc->chlen = 0;
2542fe8fb19SBen Gras
2552fe8fb19SBen Gras return 0;
2562fe8fb19SBen Gras
2572fe8fb19SBen Gras ilseq:
2582fe8fb19SBen Gras *nresult = (size_t)-1;
2592fe8fb19SBen Gras return EILSEQ;
2602fe8fb19SBen Gras
2612fe8fb19SBen Gras restart:
2622fe8fb19SBen Gras *s = s0;
2632fe8fb19SBen Gras *nresult = (size_t)-2;
2642fe8fb19SBen Gras return 0;
2652fe8fb19SBen Gras }
2662fe8fb19SBen Gras
2672fe8fb19SBen Gras static int
_citrus_UTF8_wcrtomb_priv(_UTF8EncodingInfo * ei,char * s,size_t n,wchar_t wc,_UTF8State * psenc,size_t * nresult)2682fe8fb19SBen Gras _citrus_UTF8_wcrtomb_priv(_UTF8EncodingInfo *ei, char *s, size_t n, wchar_t wc,
2692fe8fb19SBen Gras _UTF8State *psenc, size_t *nresult)
2702fe8fb19SBen Gras {
2712fe8fb19SBen Gras int cnt, i, ret;
2722fe8fb19SBen Gras wchar_t c;
2732fe8fb19SBen Gras
2742fe8fb19SBen Gras _DIAGASSERT(nresult != 0);
2752fe8fb19SBen Gras _DIAGASSERT(s != NULL);
2762fe8fb19SBen Gras
2772fe8fb19SBen Gras if (_UTF8_surrogate(wc)) {
2782fe8fb19SBen Gras ret = EILSEQ;
2792fe8fb19SBen Gras goto err;
2802fe8fb19SBen Gras }
2812fe8fb19SBen Gras cnt = _UTF8_findlen(wc);
2822fe8fb19SBen Gras if (cnt <= 0 || cnt > 6) {
2832fe8fb19SBen Gras /* invalid UCS4 value */
2842fe8fb19SBen Gras ret = EILSEQ;
2852fe8fb19SBen Gras goto err;
2862fe8fb19SBen Gras }
2872fe8fb19SBen Gras if (n < cnt) {
2882fe8fb19SBen Gras /* bound check failure */
2892fe8fb19SBen Gras ret = E2BIG;
2902fe8fb19SBen Gras goto err;
2912fe8fb19SBen Gras }
2922fe8fb19SBen Gras
2932fe8fb19SBen Gras c = wc;
2942fe8fb19SBen Gras if (s) {
2952fe8fb19SBen Gras for (i = cnt - 1; i > 0; i--) {
2962fe8fb19SBen Gras s[i] = 0x80 | (c & 0x3f);
2972fe8fb19SBen Gras c >>= 6;
2982fe8fb19SBen Gras }
2992fe8fb19SBen Gras s[0] = c;
3002fe8fb19SBen Gras if (cnt == 1)
3012fe8fb19SBen Gras s[0] &= 0x7f;
3022fe8fb19SBen Gras else {
3032fe8fb19SBen Gras s[0] &= (0x7f >> cnt);
3042fe8fb19SBen Gras s[0] |= ((0xff00 >> cnt) & 0xff);
3052fe8fb19SBen Gras }
3062fe8fb19SBen Gras }
3072fe8fb19SBen Gras
3082fe8fb19SBen Gras *nresult = (size_t)cnt;
3092fe8fb19SBen Gras return 0;
3102fe8fb19SBen Gras
3112fe8fb19SBen Gras err:
3122fe8fb19SBen Gras *nresult = (size_t)-1;
3132fe8fb19SBen Gras return ret;
3142fe8fb19SBen Gras }
3152fe8fb19SBen Gras
3162fe8fb19SBen Gras static __inline int
3172fe8fb19SBen Gras /*ARGSUSED*/
_citrus_UTF8_stdenc_wctocs(_UTF8EncodingInfo * __restrict ei,_csid_t * __restrict csid,_index_t * __restrict idx,wchar_t wc)3182fe8fb19SBen Gras _citrus_UTF8_stdenc_wctocs(_UTF8EncodingInfo * __restrict ei,
3192fe8fb19SBen Gras _csid_t * __restrict csid,
3202fe8fb19SBen Gras _index_t * __restrict idx,
3212fe8fb19SBen Gras wchar_t wc)
3222fe8fb19SBen Gras {
3232fe8fb19SBen Gras
3242fe8fb19SBen Gras _DIAGASSERT(csid != NULL && idx != NULL);
3252fe8fb19SBen Gras
3262fe8fb19SBen Gras *csid = 0;
3272fe8fb19SBen Gras *idx = (_citrus_index_t)wc;
3282fe8fb19SBen Gras
3292fe8fb19SBen Gras return (0);
3302fe8fb19SBen Gras }
3312fe8fb19SBen Gras
3322fe8fb19SBen Gras static __inline int
3332fe8fb19SBen Gras /*ARGSUSED*/
_citrus_UTF8_stdenc_cstowc(_UTF8EncodingInfo * __restrict ei,wchar_t * __restrict wc,_csid_t csid,_index_t idx)3342fe8fb19SBen Gras _citrus_UTF8_stdenc_cstowc(_UTF8EncodingInfo * __restrict ei,
3352fe8fb19SBen Gras wchar_t * __restrict wc,
3362fe8fb19SBen Gras _csid_t csid, _index_t idx)
3372fe8fb19SBen Gras {
3382fe8fb19SBen Gras
3392fe8fb19SBen Gras _DIAGASSERT(wc != NULL);
3402fe8fb19SBen Gras
3412fe8fb19SBen Gras if (csid != 0)
3422fe8fb19SBen Gras return (EILSEQ);
3432fe8fb19SBen Gras
3442fe8fb19SBen Gras *wc = (wchar_t)idx;
3452fe8fb19SBen Gras
3462fe8fb19SBen Gras return (0);
3472fe8fb19SBen Gras }
3482fe8fb19SBen Gras
3492fe8fb19SBen Gras static __inline int
3502fe8fb19SBen Gras /*ARGSUSED*/
_citrus_UTF8_stdenc_get_state_desc_generic(_UTF8EncodingInfo * __restrict ei,_UTF8State * __restrict psenc,int * __restrict rstate)3512fe8fb19SBen Gras _citrus_UTF8_stdenc_get_state_desc_generic(_UTF8EncodingInfo * __restrict ei,
3522fe8fb19SBen Gras _UTF8State * __restrict psenc,
3532fe8fb19SBen Gras int * __restrict rstate)
3542fe8fb19SBen Gras {
3552fe8fb19SBen Gras
3562fe8fb19SBen Gras if (psenc->chlen == 0)
3572fe8fb19SBen Gras *rstate = _STDENC_SDGEN_INITIAL;
3582fe8fb19SBen Gras else
3592fe8fb19SBen Gras *rstate = _STDENC_SDGEN_INCOMPLETE_CHAR;
3602fe8fb19SBen Gras
3612fe8fb19SBen Gras return 0;
3622fe8fb19SBen Gras }
3632fe8fb19SBen Gras
3642fe8fb19SBen Gras static int
3652fe8fb19SBen Gras /*ARGSUSED*/
_citrus_UTF8_encoding_module_init(_UTF8EncodingInfo * __restrict ei,const void * __restrict var,size_t lenvar)3662fe8fb19SBen Gras _citrus_UTF8_encoding_module_init(_UTF8EncodingInfo * __restrict ei,
3672fe8fb19SBen Gras const void * __restrict var, size_t lenvar)
3682fe8fb19SBen Gras {
3692fe8fb19SBen Gras _UTF8_init_count();
3702fe8fb19SBen Gras
3712fe8fb19SBen Gras return 0;
3722fe8fb19SBen Gras }
3732fe8fb19SBen Gras
3742fe8fb19SBen Gras static void
3752fe8fb19SBen Gras /*ARGSUSED*/
_citrus_UTF8_encoding_module_uninit(_UTF8EncodingInfo * ei)3762fe8fb19SBen Gras _citrus_UTF8_encoding_module_uninit(_UTF8EncodingInfo *ei)
3772fe8fb19SBen Gras {
3782fe8fb19SBen Gras }
3792fe8fb19SBen Gras
3802fe8fb19SBen Gras
3812fe8fb19SBen Gras /* ----------------------------------------------------------------------
3822fe8fb19SBen Gras * public interface for ctype
3832fe8fb19SBen Gras */
3842fe8fb19SBen Gras
3852fe8fb19SBen Gras _CITRUS_CTYPE_DECLS(UTF8);
3862fe8fb19SBen Gras _CITRUS_CTYPE_DEF_OPS(UTF8);
3872fe8fb19SBen Gras
3882fe8fb19SBen Gras #include "citrus_ctype_template.h"
3892fe8fb19SBen Gras
3902fe8fb19SBen Gras /* ----------------------------------------------------------------------
3912fe8fb19SBen Gras * public interface for stdenc
3922fe8fb19SBen Gras */
3932fe8fb19SBen Gras
3942fe8fb19SBen Gras _CITRUS_STDENC_DECLS(UTF8);
3952fe8fb19SBen Gras _CITRUS_STDENC_DEF_OPS(UTF8);
3962fe8fb19SBen Gras
3972fe8fb19SBen Gras #include "citrus_stdenc_template.h"
398