/*	$NetBSD: citrus_utf7.c,v 1.6 2013/05/28 16:57:56 joerg Exp $	*/

/*-
 * Copyright (c)2004, 2005 Citrus Project,
 * All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 *
 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
 * SUCH DAMAGE.
 *
 */
292fe8fb19SBen Gras
302fe8fb19SBen Gras #include <sys/cdefs.h>
312fe8fb19SBen Gras #if defined(LIB_SCCS) && !defined(lint)
32*84d9c625SLionel Sambuc __RCSID("$NetBSD: citrus_utf7.c,v 1.6 2013/05/28 16:57:56 joerg Exp $");
332fe8fb19SBen Gras #endif /* LIB_SCCS and not lint */
342fe8fb19SBen Gras
352fe8fb19SBen Gras #include <assert.h>
362fe8fb19SBen Gras #include <errno.h>
372fe8fb19SBen Gras #include <string.h>
382fe8fb19SBen Gras #include <stdio.h>
392fe8fb19SBen Gras #include <stdint.h>
402fe8fb19SBen Gras #include <stdlib.h>
412fe8fb19SBen Gras #include <limits.h>
422fe8fb19SBen Gras #include <wchar.h>
432fe8fb19SBen Gras
442fe8fb19SBen Gras #include "citrus_namespace.h"
452fe8fb19SBen Gras #include "citrus_types.h"
462fe8fb19SBen Gras #include "citrus_module.h"
472fe8fb19SBen Gras #include "citrus_ctype.h"
482fe8fb19SBen Gras #include "citrus_stdenc.h"
492fe8fb19SBen Gras #include "citrus_utf7.h"
502fe8fb19SBen Gras
/* ----------------------------------------------------------------------
 * private definitions used by templates
 */
542fe8fb19SBen Gras
/*
 * Bit layout of one _UTF7EncodingInfo cell: the low byte (EI_MASK) is a
 * small number, the bits above it are character-class flags.
 */
#define EI_MASK		UINT16_C(0xff)
#define EI_DIRECT	UINT16_C(0x100)
#define EI_OPTION	UINT16_C(0x200)
#define EI_SPACE	UINT16_C(0x400)

/* Classification table with one cell per 7-bit character code. */
typedef struct {
	uint16_t	cell[128];
} _UTF7EncodingInfo;
622fe8fb19SBen Gras
/*
 * Conversion state.  The four bit-fields share one unsigned int
 * (1 + 4 + 22 + 1 = 28 bits).
 */
typedef struct {
	unsigned int	mode : 1;	/* non-zero while in base64 mode */
	unsigned int	bits : 4;	/* must be able to hold 0 - 15 */
	unsigned int	cache : 22;	/* 22 = BASE64_BIT + UTF16_BIT */
	unsigned int	surrogate : 1;	/* non-zero inside a surrogate pair */
	int		chlen;		/* number of bytes held in ch[] */
	/*
	 * BASE64_IN followed by three base64 characters: 3 * 6 = 18 bits,
	 * the multiple of six closest to UTF16_BIT.
	 */
	char		ch[4];
} _UTF7State;
722fe8fb19SBen Gras
732fe8fb19SBen Gras typedef struct {
742fe8fb19SBen Gras _UTF7EncodingInfo ei;
752fe8fb19SBen Gras struct {
762fe8fb19SBen Gras /* for future multi-locale facility */
772fe8fb19SBen Gras _UTF7State s_mblen;
782fe8fb19SBen Gras _UTF7State s_mbrlen;
792fe8fb19SBen Gras _UTF7State s_mbrtowc;
802fe8fb19SBen Gras _UTF7State s_mbtowc;
812fe8fb19SBen Gras _UTF7State s_mbsrtowcs;
82*84d9c625SLionel Sambuc _UTF7State s_mbsnrtowcs;
832fe8fb19SBen Gras _UTF7State s_wcrtomb;
842fe8fb19SBen Gras _UTF7State s_wcsrtombs;
85*84d9c625SLionel Sambuc _UTF7State s_wcsnrtombs;
862fe8fb19SBen Gras _UTF7State s_wctomb;
872fe8fb19SBen Gras } states;
882fe8fb19SBen Gras } _UTF7CTypeInfo;
892fe8fb19SBen Gras
/*
 * Glue macros: names and properties of this encoding, spelled the way
 * the generic template code expects them.
 */
#define _FUNCNAME(m)			_citrus_UTF7_##m
#define _ENCODING_INFO			_UTF7EncodingInfo
#define _CTYPE_INFO			_UTF7CTypeInfo
#define _ENCODING_STATE			_UTF7State

/* Accessors for the members of a _UTF7CTypeInfo. */
#define _CEI_TO_EI(_cei_)		(&(_cei_)->ei)
#define _CEI_TO_STATE(_cei_, _func_)	(_cei_)->states.s_##_func_

/*
 * NOTE(review): encoding one character outside the BMP from the initial
 * state appears to emit 6 bytes ('+', two base64 characters for the high
 * surrogate and three for the low one) -- confirm that the template
 * callers tolerate more than the 4 bytes advertised here.
 */
#define _ENCODING_MB_CUR_MAX(_ei_)		4
#define _ENCODING_IS_STATE_DEPENDENT		1
#define _STATE_NEEDS_EXPLICIT_INIT(_ps_)	0
1002fe8fb19SBen Gras
1012fe8fb19SBen Gras static __inline void
1022fe8fb19SBen Gras /*ARGSUSED*/
_citrus_UTF7_init_state(_UTF7EncodingInfo * __restrict ei,_UTF7State * __restrict s)1032fe8fb19SBen Gras _citrus_UTF7_init_state(_UTF7EncodingInfo * __restrict ei,
1042fe8fb19SBen Gras _UTF7State * __restrict s)
1052fe8fb19SBen Gras {
1062fe8fb19SBen Gras /* ei appears to be unused */
1072fe8fb19SBen Gras _DIAGASSERT(s != NULL);
1082fe8fb19SBen Gras
1092fe8fb19SBen Gras memset((void *)s, 0, sizeof(*s));
1102fe8fb19SBen Gras }
1112fe8fb19SBen Gras
1122fe8fb19SBen Gras static __inline void
1132fe8fb19SBen Gras /*ARGSUSED*/
_citrus_UTF7_pack_state(_UTF7EncodingInfo * __restrict ei,void * __restrict pspriv,const _UTF7State * __restrict s)1142fe8fb19SBen Gras _citrus_UTF7_pack_state(_UTF7EncodingInfo * __restrict ei,
1152fe8fb19SBen Gras void *__restrict pspriv, const _UTF7State * __restrict s)
1162fe8fb19SBen Gras {
1172fe8fb19SBen Gras /* ei seem to be unused */
1182fe8fb19SBen Gras _DIAGASSERT(pspriv != NULL);
1192fe8fb19SBen Gras _DIAGASSERT(s != NULL);
1202fe8fb19SBen Gras
1212fe8fb19SBen Gras memcpy(pspriv, (const void *)s, sizeof(*s));
1222fe8fb19SBen Gras }
1232fe8fb19SBen Gras
1242fe8fb19SBen Gras static __inline void
1252fe8fb19SBen Gras /*ARGSUSED*/
_citrus_UTF7_unpack_state(_UTF7EncodingInfo * __restrict ei,_UTF7State * __restrict s,const void * __restrict pspriv)1262fe8fb19SBen Gras _citrus_UTF7_unpack_state(_UTF7EncodingInfo * __restrict ei,
1272fe8fb19SBen Gras _UTF7State * __restrict s, const void * __restrict pspriv)
1282fe8fb19SBen Gras {
1292fe8fb19SBen Gras /* ei seem to be unused */
1302fe8fb19SBen Gras _DIAGASSERT(s != NULL);
1312fe8fb19SBen Gras _DIAGASSERT(pspriv != NULL);
1322fe8fb19SBen Gras
1332fe8fb19SBen Gras memcpy((void *)s, pspriv, sizeof(*s));
1342fe8fb19SBen Gras }
1352fe8fb19SBen Gras
/* Modified base64 alphabet; the index of a character is its 6-bit value. */
static const char base64[] =
	"ABCDEFGHIJKLMNOPQRSTUVWXYZ"
	"abcdefghijklmnopqrstuvwxyz"
	"0123456789+/";

/*
 * RFC 2152 "Set D": characters that are always written as themselves.
 * The set contains the apostrophe; '+' and '=' are deliberately absent.
 */
static const char direct[] =
	"ABCDEFGHIJKLMNOPQRSTUVWXYZ"
	"abcdefghijklmnopqrstuvwxyz"
	"0123456789'(),-./:?";

/*
 * RFC 2152 "Set O": characters that may optionally appear as themselves.
 * The set contains '*'; '\' and '~' are deliberately absent.
 */
static const char option[] = "!\"#$%&*;<=>@[]^_`{|}";

/* White space that is passed through unencoded. */
static const char spaces[] = " \t\r\n";
1482fe8fb19SBen Gras
/* Width in bits of one base64 digit and of one UTF-16 code unit. */
#define BASE64_BIT	6
#define UTF16_BIT	16

/* Largest value of a base64 digit, a UTF-16 unit and a code point. */
#define BASE64_MAX	0x3f
#define UTF16_MAX	UINT16_C(0xffff)
#define UTF32_MAX	UINT32_C(0x10ffff)

/* Characters that open and close a base64 run. */
#define BASE64_IN	'+'
#define BASE64_OUT	'-'

/* Non-zero when c does not fit in seven bits. */
#define SHIFT7BIT(c)	((c) >> 7)
/* NUL and the shift-in character are handled specially. */
#define ISSPECIAL(c)	((c) == '\0' || (c) == BASE64_IN)

/*
 * Low byte of the cell for c, minus one; -1 when c is not a 7-bit
 * character or its cell has an empty low byte.
 */
#define FINDLEN(ei, c)							\
	(SHIFT7BIT((c)) ? -1 : (((ei)->cell[(c)] & EI_MASK) - 1))

/* c is 7-bit and either special or flagged direct, optional or space. */
#define ISDIRECT(ei, c)							\
	(!SHIFT7BIT((c)) && (ISSPECIAL((c)) ||				\
	    (ei)->cell[(c)] & (EI_DIRECT | EI_OPTION | EI_SPACE)))

/* As ISDIRECT, but the optional class does not qualify. */
#define ISSAFE(ei, c)							\
	(!SHIFT7BIT((c)) && (ISSPECIAL((c)) ||				\
	    ((c) < 0x80 && (ei)->cell[(c)] & (EI_DIRECT | EI_SPACE))))

/* surrogate pair */
#define SRG_BASE	UINT32_C(0x10000)
#define HISRG_MIN	UINT16_C(0xd800)
#define HISRG_MAX	UINT16_C(0xdbff)
#define LOSRG_MIN	UINT16_C(0xdc00)
#define LOSRG_MAX	UINT16_C(0xdfff)
1772fe8fb19SBen Gras
1782fe8fb19SBen Gras static int
_citrus_UTF7_mbtoutf16(_UTF7EncodingInfo * __restrict ei,uint16_t * __restrict u16,const char ** __restrict s,size_t n,_UTF7State * __restrict psenc,size_t * __restrict nresult)1792fe8fb19SBen Gras _citrus_UTF7_mbtoutf16(_UTF7EncodingInfo * __restrict ei,
1802fe8fb19SBen Gras uint16_t * __restrict u16, const char ** __restrict s, size_t n,
1812fe8fb19SBen Gras _UTF7State * __restrict psenc, size_t * __restrict nresult)
1822fe8fb19SBen Gras {
1832fe8fb19SBen Gras _UTF7State sv;
1842fe8fb19SBen Gras const char *s0;
1852fe8fb19SBen Gras int i, done, len;
1862fe8fb19SBen Gras
1872fe8fb19SBen Gras _DIAGASSERT(ei != NULL);
1882fe8fb19SBen Gras _DIAGASSERT(s != NULL && *s != NULL);
1892fe8fb19SBen Gras _DIAGASSERT(psenc != NULL);
1902fe8fb19SBen Gras
1912fe8fb19SBen Gras s0 = *s;
1922fe8fb19SBen Gras sv = *psenc;
1932fe8fb19SBen Gras
1942fe8fb19SBen Gras for (i = 0, done = 0; done == 0; i++) {
1952fe8fb19SBen Gras _DIAGASSERT(i <= psenc->chlen);
1962fe8fb19SBen Gras if (i == psenc->chlen) {
1972fe8fb19SBen Gras if (n-- < 1) {
1982fe8fb19SBen Gras *nresult = (size_t)-2;
1992fe8fb19SBen Gras *s = s0;
2002fe8fb19SBen Gras sv.chlen = psenc->chlen;
2012fe8fb19SBen Gras *psenc = sv;
2022fe8fb19SBen Gras return 0;
2032fe8fb19SBen Gras }
2042fe8fb19SBen Gras psenc->ch[psenc->chlen++] = *s0++;
2052fe8fb19SBen Gras }
2062fe8fb19SBen Gras if (SHIFT7BIT((int)psenc->ch[i]))
2072fe8fb19SBen Gras goto ilseq;
2082fe8fb19SBen Gras if (!psenc->mode) {
2092fe8fb19SBen Gras if (psenc->bits > 0 || psenc->cache > 0)
2102fe8fb19SBen Gras return EINVAL;
2112fe8fb19SBen Gras if (psenc->ch[i] == BASE64_IN) {
2122fe8fb19SBen Gras psenc->mode = 1;
2132fe8fb19SBen Gras } else {
2142fe8fb19SBen Gras if (!ISDIRECT(ei, (int)psenc->ch[i]))
2152fe8fb19SBen Gras goto ilseq;
2162fe8fb19SBen Gras *u16 = (uint16_t)psenc->ch[i];
2172fe8fb19SBen Gras done = 1;
2182fe8fb19SBen Gras continue;
2192fe8fb19SBen Gras }
2202fe8fb19SBen Gras } else {
2212fe8fb19SBen Gras if (psenc->ch[i] == BASE64_OUT && psenc->cache == 0) {
2222fe8fb19SBen Gras psenc->mode = 0;
2232fe8fb19SBen Gras *u16 = (uint16_t)BASE64_IN;
2242fe8fb19SBen Gras done = 1;
2252fe8fb19SBen Gras continue;
2262fe8fb19SBen Gras }
2272fe8fb19SBen Gras len = FINDLEN(ei, (int)psenc->ch[i]);
2282fe8fb19SBen Gras if (len < 0) {
2292fe8fb19SBen Gras if (psenc->bits >= BASE64_BIT)
2302fe8fb19SBen Gras return EINVAL;
2312fe8fb19SBen Gras psenc->mode = 0;
2322fe8fb19SBen Gras psenc->bits = psenc->cache = 0;
2332fe8fb19SBen Gras if (psenc->ch[i] != BASE64_OUT) {
2342fe8fb19SBen Gras if (!ISDIRECT(ei, (int)psenc->ch[i]))
2352fe8fb19SBen Gras goto ilseq;
2362fe8fb19SBen Gras *u16 = (uint16_t)psenc->ch[i];
2372fe8fb19SBen Gras done = 1;
2382fe8fb19SBen Gras }
2392fe8fb19SBen Gras } else {
2402fe8fb19SBen Gras psenc->cache =
2412fe8fb19SBen Gras (psenc->cache << BASE64_BIT) | len;
2422fe8fb19SBen Gras switch (psenc->bits) {
2432fe8fb19SBen Gras case 0: case 2: case 4: case 6: case 8:
2442fe8fb19SBen Gras psenc->bits += BASE64_BIT;
2452fe8fb19SBen Gras break;
2462fe8fb19SBen Gras case 10: case 12: case 14:
2472fe8fb19SBen Gras psenc->bits -= (UTF16_BIT - BASE64_BIT);
2482fe8fb19SBen Gras *u16 = (psenc->cache >> psenc->bits)
2492fe8fb19SBen Gras & UTF16_MAX;
2502fe8fb19SBen Gras done = 1;
2512fe8fb19SBen Gras break;
2522fe8fb19SBen Gras default:
2532fe8fb19SBen Gras return EINVAL;
2542fe8fb19SBen Gras }
2552fe8fb19SBen Gras }
2562fe8fb19SBen Gras }
2572fe8fb19SBen Gras }
2582fe8fb19SBen Gras
2592fe8fb19SBen Gras if (psenc->chlen > i)
2602fe8fb19SBen Gras return EINVAL;
2612fe8fb19SBen Gras psenc->chlen = 0;
2622fe8fb19SBen Gras *nresult = (size_t)((*u16 == 0) ? 0 : s0 - *s);
2632fe8fb19SBen Gras *s = s0;
2642fe8fb19SBen Gras
2652fe8fb19SBen Gras return 0;
2662fe8fb19SBen Gras
2672fe8fb19SBen Gras ilseq:
2682fe8fb19SBen Gras *nresult = (size_t)-1;
2692fe8fb19SBen Gras return EILSEQ;
2702fe8fb19SBen Gras }
2712fe8fb19SBen Gras
2722fe8fb19SBen Gras static int
_citrus_UTF7_mbrtowc_priv(_UTF7EncodingInfo * __restrict ei,wchar_t * __restrict pwc,const char ** __restrict s,size_t n,_UTF7State * __restrict psenc,size_t * __restrict nresult)2732fe8fb19SBen Gras _citrus_UTF7_mbrtowc_priv(_UTF7EncodingInfo * __restrict ei,
2742fe8fb19SBen Gras wchar_t * __restrict pwc, const char ** __restrict s, size_t n,
2752fe8fb19SBen Gras _UTF7State * __restrict psenc, size_t * __restrict nresult)
2762fe8fb19SBen Gras {
2772fe8fb19SBen Gras const char *s0;
2782fe8fb19SBen Gras uint32_t u32;
2792fe8fb19SBen Gras uint16_t hi, lo;
2802fe8fb19SBen Gras size_t siz, nr;
2812fe8fb19SBen Gras int err;
2822fe8fb19SBen Gras
2832fe8fb19SBen Gras _DIAGASSERT(ei != NULL);
2842fe8fb19SBen Gras /* pwc may be null */
2852fe8fb19SBen Gras _DIAGASSERT(s != NULL);
2862fe8fb19SBen Gras _DIAGASSERT(psenc != NULL);
2872fe8fb19SBen Gras
2882fe8fb19SBen Gras if (*s == NULL) {
2892fe8fb19SBen Gras _citrus_UTF7_init_state(ei, psenc);
2902fe8fb19SBen Gras *nresult = (size_t)_ENCODING_IS_STATE_DEPENDENT;
2912fe8fb19SBen Gras return 0;
2922fe8fb19SBen Gras }
2932fe8fb19SBen Gras s0 = *s;
2942fe8fb19SBen Gras if (psenc->surrogate) {
2952fe8fb19SBen Gras hi = (psenc->cache >> 2) & UTF16_MAX;
2962fe8fb19SBen Gras if (hi < HISRG_MIN || hi > HISRG_MAX)
2972fe8fb19SBen Gras return EINVAL;
2982fe8fb19SBen Gras siz = 0;
2992fe8fb19SBen Gras } else {
3002fe8fb19SBen Gras err = _citrus_UTF7_mbtoutf16(ei, &hi, &s0, n, psenc, &nr);
3012fe8fb19SBen Gras if (nr == (size_t)-1 || nr == (size_t)-2) {
3022fe8fb19SBen Gras *nresult = nr;
3032fe8fb19SBen Gras return err;
3042fe8fb19SBen Gras }
3052fe8fb19SBen Gras if (err != 0)
3062fe8fb19SBen Gras return err;
3072fe8fb19SBen Gras n -= nr;
3082fe8fb19SBen Gras siz = nr;
3092fe8fb19SBen Gras if (hi < HISRG_MIN || hi > HISRG_MAX) {
3102fe8fb19SBen Gras u32 = (uint32_t)hi;
3112fe8fb19SBen Gras goto done;
3122fe8fb19SBen Gras }
3132fe8fb19SBen Gras psenc->surrogate = 1;
3142fe8fb19SBen Gras }
3152fe8fb19SBen Gras err = _citrus_UTF7_mbtoutf16(ei, &lo, &s0, n, psenc, &nr);
3162fe8fb19SBen Gras if (nr == (size_t)-1 || nr == (size_t)-2) {
3172fe8fb19SBen Gras *nresult = nr;
3182fe8fb19SBen Gras return err;
3192fe8fb19SBen Gras }
3202fe8fb19SBen Gras if (err != 0)
3212fe8fb19SBen Gras return err;
3222fe8fb19SBen Gras hi -= HISRG_MIN;
3232fe8fb19SBen Gras lo -= LOSRG_MIN;
3242fe8fb19SBen Gras u32 = (hi << 10 | lo) + SRG_BASE;
3252fe8fb19SBen Gras siz += nr;
3262fe8fb19SBen Gras done:
3272fe8fb19SBen Gras *s = s0;
3282fe8fb19SBen Gras if (pwc != NULL)
3292fe8fb19SBen Gras *pwc = (wchar_t)u32;
3302fe8fb19SBen Gras if (u32 == (uint32_t)0) {
3312fe8fb19SBen Gras *nresult = (size_t)0;
3322fe8fb19SBen Gras _citrus_UTF7_init_state(ei, psenc);
3332fe8fb19SBen Gras } else {
3342fe8fb19SBen Gras *nresult = siz;
3352fe8fb19SBen Gras psenc->surrogate = 0;
3362fe8fb19SBen Gras }
3372fe8fb19SBen Gras return err;
3382fe8fb19SBen Gras }
3392fe8fb19SBen Gras
3402fe8fb19SBen Gras static int
_citrus_UTF7_utf16tomb(_UTF7EncodingInfo * __restrict ei,char * __restrict s,size_t n,uint16_t u16,_UTF7State * __restrict psenc,size_t * __restrict nresult)3412fe8fb19SBen Gras _citrus_UTF7_utf16tomb(_UTF7EncodingInfo * __restrict ei,
3422fe8fb19SBen Gras char * __restrict s, size_t n, uint16_t u16,
3432fe8fb19SBen Gras _UTF7State * __restrict psenc, size_t * __restrict nresult)
3442fe8fb19SBen Gras {
3452fe8fb19SBen Gras int bits, i;
3462fe8fb19SBen Gras
3472fe8fb19SBen Gras _DIAGASSERT(ei != NULL);
3482fe8fb19SBen Gras _DIAGASSERT(psenc != NULL);
3492fe8fb19SBen Gras
3502fe8fb19SBen Gras if (psenc->chlen != 0 || psenc->bits > BASE64_BIT)
3512fe8fb19SBen Gras return EINVAL;
3522fe8fb19SBen Gras
3532fe8fb19SBen Gras if (ISSAFE(ei, u16)) {
3542fe8fb19SBen Gras if (psenc->mode) {
3552fe8fb19SBen Gras if (psenc->bits > 0) {
3562fe8fb19SBen Gras bits = BASE64_BIT - psenc->bits;
3572fe8fb19SBen Gras i = (psenc->cache << bits) & BASE64_MAX;
3582fe8fb19SBen Gras psenc->ch[psenc->chlen++] = base64[i];
3592fe8fb19SBen Gras psenc->bits = psenc->cache = 0;
3602fe8fb19SBen Gras }
3612fe8fb19SBen Gras if (u16 == BASE64_OUT || FINDLEN(ei, u16) >= 0)
3622fe8fb19SBen Gras psenc->ch[psenc->chlen++] = BASE64_OUT;
3632fe8fb19SBen Gras psenc->mode = 0;
3642fe8fb19SBen Gras }
3652fe8fb19SBen Gras if (psenc->bits != 0)
3662fe8fb19SBen Gras return EINVAL;
3672fe8fb19SBen Gras psenc->ch[psenc->chlen++] = (char)u16;
3682fe8fb19SBen Gras if (u16 == BASE64_IN)
3692fe8fb19SBen Gras psenc->ch[psenc->chlen++] = BASE64_OUT;
3702fe8fb19SBen Gras } else {
3712fe8fb19SBen Gras if (!psenc->mode) {
3722fe8fb19SBen Gras if (psenc->bits > 0)
3732fe8fb19SBen Gras return EINVAL;
3742fe8fb19SBen Gras psenc->ch[psenc->chlen++] = BASE64_IN;
3752fe8fb19SBen Gras psenc->mode = 1;
3762fe8fb19SBen Gras }
3772fe8fb19SBen Gras psenc->cache = (psenc->cache << UTF16_BIT) | u16;
3782fe8fb19SBen Gras bits = UTF16_BIT + psenc->bits;
3792fe8fb19SBen Gras psenc->bits = bits % BASE64_BIT;
3802fe8fb19SBen Gras while ((bits -= BASE64_BIT) >= 0) {
3812fe8fb19SBen Gras i = (psenc->cache >> bits) & BASE64_MAX;
3822fe8fb19SBen Gras psenc->ch[psenc->chlen++] = base64[i];
3832fe8fb19SBen Gras }
3842fe8fb19SBen Gras }
3852fe8fb19SBen Gras memcpy(s, psenc->ch, psenc->chlen);
3862fe8fb19SBen Gras *nresult = psenc->chlen;
3872fe8fb19SBen Gras psenc->chlen = 0;
3882fe8fb19SBen Gras
3892fe8fb19SBen Gras return 0;
3902fe8fb19SBen Gras }
3912fe8fb19SBen Gras
3922fe8fb19SBen Gras static int
_citrus_UTF7_wcrtomb_priv(_UTF7EncodingInfo * __restrict ei,char * __restrict s,size_t n,wchar_t wchar,_UTF7State * __restrict psenc,size_t * __restrict nresult)3932fe8fb19SBen Gras _citrus_UTF7_wcrtomb_priv(_UTF7EncodingInfo * __restrict ei,
3942fe8fb19SBen Gras char * __restrict s, size_t n, wchar_t wchar,
3952fe8fb19SBen Gras _UTF7State * __restrict psenc, size_t * __restrict nresult)
3962fe8fb19SBen Gras {
3972fe8fb19SBen Gras uint32_t u32;
3982fe8fb19SBen Gras uint16_t u16[2];
3992fe8fb19SBen Gras int err, len, i;
4002fe8fb19SBen Gras size_t siz, nr;
4012fe8fb19SBen Gras
4022fe8fb19SBen Gras _DIAGASSERT(ei != NULL);
4032fe8fb19SBen Gras _DIAGASSERT(s != NULL);
4042fe8fb19SBen Gras _DIAGASSERT(psenc != NULL);
4052fe8fb19SBen Gras _DIAGASSERT(nresult != NULL);
4062fe8fb19SBen Gras
4072fe8fb19SBen Gras u32 = (uint32_t)wchar;
4082fe8fb19SBen Gras if (u32 <= UTF16_MAX) {
4092fe8fb19SBen Gras u16[0] = (uint16_t)u32;
4102fe8fb19SBen Gras len = 1;
4112fe8fb19SBen Gras } else if (u32 <= UTF32_MAX) {
4122fe8fb19SBen Gras u32 -= SRG_BASE;
4132fe8fb19SBen Gras u16[0] = (u32 >> 10) + HISRG_MIN;
4142fe8fb19SBen Gras u16[1] = ((uint16_t)(u32 & UINT32_C(0x3ff))) + LOSRG_MIN;
4152fe8fb19SBen Gras len = 2;
4162fe8fb19SBen Gras } else {
4172fe8fb19SBen Gras *nresult = (size_t)-1;
4182fe8fb19SBen Gras return EILSEQ;
4192fe8fb19SBen Gras }
4202fe8fb19SBen Gras siz = 0;
4212fe8fb19SBen Gras for (i = 0; i < len; ++i) {
4222fe8fb19SBen Gras err = _citrus_UTF7_utf16tomb(ei, s, n, u16[i], psenc, &nr);
4232fe8fb19SBen Gras if (err != 0)
4242fe8fb19SBen Gras return err; /* XXX: state has been modified */
4252fe8fb19SBen Gras s += nr;
4262fe8fb19SBen Gras n -= nr;
4272fe8fb19SBen Gras siz += nr;
4282fe8fb19SBen Gras }
4292fe8fb19SBen Gras *nresult = siz;
4302fe8fb19SBen Gras
4312fe8fb19SBen Gras return 0;
4322fe8fb19SBen Gras }
4332fe8fb19SBen Gras
4342fe8fb19SBen Gras static int
4352fe8fb19SBen Gras /* ARGSUSED */
_citrus_UTF7_put_state_reset(_UTF7EncodingInfo * __restrict ei,char * __restrict s,size_t n,_UTF7State * __restrict psenc,size_t * __restrict nresult)4362fe8fb19SBen Gras _citrus_UTF7_put_state_reset(_UTF7EncodingInfo * __restrict ei,
4372fe8fb19SBen Gras char * __restrict s, size_t n, _UTF7State * __restrict psenc,
4382fe8fb19SBen Gras size_t * __restrict nresult)
4392fe8fb19SBen Gras {
4402fe8fb19SBen Gras int bits, pos;
4412fe8fb19SBen Gras
4422fe8fb19SBen Gras _DIAGASSERT(ei != NULL);
4432fe8fb19SBen Gras _DIAGASSERT(s != NULL);
4442fe8fb19SBen Gras _DIAGASSERT(psenc != NULL);
4452fe8fb19SBen Gras _DIAGASSERT(nresult != NULL);
4462fe8fb19SBen Gras
4472fe8fb19SBen Gras if (psenc->chlen != 0 || psenc->bits > BASE64_BIT || psenc->surrogate)
4482fe8fb19SBen Gras return EINVAL;
4492fe8fb19SBen Gras
4502fe8fb19SBen Gras if (psenc->mode) {
4512fe8fb19SBen Gras if (psenc->bits > 0) {
4522fe8fb19SBen Gras if (n-- < 1)
4532fe8fb19SBen Gras return E2BIG;
4542fe8fb19SBen Gras bits = BASE64_BIT - psenc->bits;
4552fe8fb19SBen Gras pos = (psenc->cache << bits) & BASE64_MAX;
4562fe8fb19SBen Gras psenc->ch[psenc->chlen++] = base64[pos];
4572fe8fb19SBen Gras psenc->ch[psenc->chlen++] = BASE64_OUT;
4582fe8fb19SBen Gras psenc->bits = psenc->cache = 0;
4592fe8fb19SBen Gras }
4602fe8fb19SBen Gras psenc->mode = 0;
4612fe8fb19SBen Gras }
4622fe8fb19SBen Gras if (psenc->bits != 0)
4632fe8fb19SBen Gras return EINVAL;
4642fe8fb19SBen Gras if (n-- < 1)
4652fe8fb19SBen Gras return E2BIG;
4662fe8fb19SBen Gras
4672fe8fb19SBen Gras _DIAGASSERT(n >= psenc->chlen);
4682fe8fb19SBen Gras *nresult = (size_t)psenc->chlen;
4692fe8fb19SBen Gras if (psenc->chlen > 0) {
4702fe8fb19SBen Gras memcpy(s, psenc->ch, psenc->chlen);
4712fe8fb19SBen Gras psenc->chlen = 0;
4722fe8fb19SBen Gras }
4732fe8fb19SBen Gras
4742fe8fb19SBen Gras return 0;
4752fe8fb19SBen Gras }
4762fe8fb19SBen Gras
4772fe8fb19SBen Gras static __inline int
4782fe8fb19SBen Gras /*ARGSUSED*/
_citrus_UTF7_stdenc_wctocs(_UTF7EncodingInfo * __restrict ei,_csid_t * __restrict csid,_index_t * __restrict idx,wchar_t wc)4792fe8fb19SBen Gras _citrus_UTF7_stdenc_wctocs(_UTF7EncodingInfo * __restrict ei,
4802fe8fb19SBen Gras _csid_t * __restrict csid,
4812fe8fb19SBen Gras _index_t * __restrict idx, wchar_t wc)
4822fe8fb19SBen Gras {
4832fe8fb19SBen Gras /* ei seem to be unused */
4842fe8fb19SBen Gras _DIAGASSERT(csid != NULL);
4852fe8fb19SBen Gras _DIAGASSERT(idx != NULL);
4862fe8fb19SBen Gras
4872fe8fb19SBen Gras *csid = 0;
4882fe8fb19SBen Gras *idx = (_index_t)wc;
4892fe8fb19SBen Gras
4902fe8fb19SBen Gras return 0;
4912fe8fb19SBen Gras }
4922fe8fb19SBen Gras
4932fe8fb19SBen Gras static __inline int
4942fe8fb19SBen Gras /*ARGSUSED*/
_citrus_UTF7_stdenc_cstowc(_UTF7EncodingInfo * __restrict ei,wchar_t * __restrict wc,_csid_t csid,_index_t idx)4952fe8fb19SBen Gras _citrus_UTF7_stdenc_cstowc(_UTF7EncodingInfo * __restrict ei,
4962fe8fb19SBen Gras wchar_t * __restrict wc,
4972fe8fb19SBen Gras _csid_t csid, _index_t idx)
4982fe8fb19SBen Gras {
4992fe8fb19SBen Gras /* ei seem to be unused */
5002fe8fb19SBen Gras _DIAGASSERT(wc != NULL);
5012fe8fb19SBen Gras
5022fe8fb19SBen Gras if (csid != 0)
5032fe8fb19SBen Gras return EILSEQ;
5042fe8fb19SBen Gras *wc = (wchar_t)idx;
5052fe8fb19SBen Gras
5062fe8fb19SBen Gras return 0;
5072fe8fb19SBen Gras }
5082fe8fb19SBen Gras
5092fe8fb19SBen Gras static __inline int
5102fe8fb19SBen Gras /*ARGSUSED*/
_citrus_UTF7_stdenc_get_state_desc_generic(_UTF7EncodingInfo * __restrict ei,_UTF7State * __restrict psenc,int * __restrict rstate)5112fe8fb19SBen Gras _citrus_UTF7_stdenc_get_state_desc_generic(_UTF7EncodingInfo * __restrict ei,
5122fe8fb19SBen Gras _UTF7State * __restrict psenc,
5132fe8fb19SBen Gras int * __restrict rstate)
5142fe8fb19SBen Gras {
5152fe8fb19SBen Gras
5162fe8fb19SBen Gras if (psenc->chlen == 0)
5172fe8fb19SBen Gras *rstate = _STDENC_SDGEN_INITIAL;
5182fe8fb19SBen Gras else
5192fe8fb19SBen Gras *rstate = _STDENC_SDGEN_INCOMPLETE_CHAR;
5202fe8fb19SBen Gras
5212fe8fb19SBen Gras return 0;
5222fe8fb19SBen Gras }
5232fe8fb19SBen Gras
5242fe8fb19SBen Gras static void
5252fe8fb19SBen Gras /*ARGSUSED*/
_citrus_UTF7_encoding_module_uninit(_UTF7EncodingInfo * ei)5262fe8fb19SBen Gras _citrus_UTF7_encoding_module_uninit(_UTF7EncodingInfo *ei)
5272fe8fb19SBen Gras {
5282fe8fb19SBen Gras /* ei seems to be unused */
5292fe8fb19SBen Gras }
5302fe8fb19SBen Gras
5312fe8fb19SBen Gras static int
5322fe8fb19SBen Gras /*ARGSUSED*/
_citrus_UTF7_encoding_module_init(_UTF7EncodingInfo * __restrict ei,const void * __restrict var,size_t lenvar)5332fe8fb19SBen Gras _citrus_UTF7_encoding_module_init(_UTF7EncodingInfo * __restrict ei,
5342fe8fb19SBen Gras const void * __restrict var, size_t lenvar)
5352fe8fb19SBen Gras {
5362fe8fb19SBen Gras const char *s;
5372fe8fb19SBen Gras
5382fe8fb19SBen Gras _DIAGASSERT(ei != NULL);
5392fe8fb19SBen Gras /* var may be null */
5402fe8fb19SBen Gras
5412fe8fb19SBen Gras memset(ei, 0, sizeof(*ei));
5422fe8fb19SBen Gras
5432fe8fb19SBen Gras #define FILL(str, flag) \
5442fe8fb19SBen Gras do { \
5452fe8fb19SBen Gras for (s = str; *s != '\0'; s++) \
5462fe8fb19SBen Gras ei->cell[*s & 0x7f] |= flag; \
5472fe8fb19SBen Gras } while (/*CONSTCOND*/0)
5482fe8fb19SBen Gras
5492fe8fb19SBen Gras FILL(base64, (s - base64) + 1);
5502fe8fb19SBen Gras FILL(direct, EI_DIRECT);
5512fe8fb19SBen Gras FILL(option, EI_OPTION);
5522fe8fb19SBen Gras FILL(spaces, EI_SPACE);
5532fe8fb19SBen Gras
5542fe8fb19SBen Gras return 0;
5552fe8fb19SBen Gras }
5562fe8fb19SBen Gras
5572fe8fb19SBen Gras /* ----------------------------------------------------------------------
5582fe8fb19SBen Gras * public interface for ctype
5592fe8fb19SBen Gras */
5602fe8fb19SBen Gras
5612fe8fb19SBen Gras _CITRUS_CTYPE_DECLS(UTF7);
5622fe8fb19SBen Gras _CITRUS_CTYPE_DEF_OPS(UTF7);
5632fe8fb19SBen Gras
5642fe8fb19SBen Gras #include "citrus_ctype_template.h"
5652fe8fb19SBen Gras
5662fe8fb19SBen Gras /* ----------------------------------------------------------------------
5672fe8fb19SBen Gras * public interface for stdenc
5682fe8fb19SBen Gras */
5692fe8fb19SBen Gras
5702fe8fb19SBen Gras _CITRUS_STDENC_DECLS(UTF7);
5712fe8fb19SBen Gras _CITRUS_STDENC_DEF_OPS(UTF7);
5722fe8fb19SBen Gras
5732fe8fb19SBen Gras #include "citrus_stdenc_template.h"
574