usr.bin/mail/mime_header.c

*ba2b5111Schristos/*	$NetBSD: mime_header.c,v 1.9 2013/02/14 18:23:45 christos Exp $	*/
8207b28aSchristos
8207b28aSchristos/*-
8207b28aSchristos * Copyright (c) 2006 The NetBSD Foundation, Inc.
8207b28aSchristos * All rights reserved.
8207b28aSchristos *
8207b28aSchristos * This code is derived from software contributed to The NetBSD Foundation
8207b28aSchristos * by Anon Ymous.
8207b28aSchristos *
8207b28aSchristos * Redistribution and use in source and binary forms, with or without
8207b28aSchristos * modification, are permitted provided that the following conditions
8207b28aSchristos * are met:
8207b28aSchristos * 1. Redistributions of source code must retain the above copyright
8207b28aSchristos *    notice, this list of conditions and the following disclaimer.
8207b28aSchristos * 2. Redistributions in binary form must reproduce the above copyright
8207b28aSchristos *    notice, this list of conditions and the following disclaimer in the
8207b28aSchristos *    documentation and/or other materials provided with the distribution.
8207b28aSchristos *
8207b28aSchristos * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
8207b28aSchristos * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
8207b28aSchristos * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
8207b28aSchristos * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
8207b28aSchristos * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
8207b28aSchristos * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
8207b28aSchristos * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
8207b28aSchristos * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
8207b28aSchristos * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
8207b28aSchristos * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
8207b28aSchristos * POSSIBILITY OF SUCH DAMAGE.
8207b28aSchristos */
8207b28aSchristos
8207b28aSchristos
8207b28aSchristos/*
8207b28aSchristos * This module contains the core MIME header decoding routines.
8207b28aSchristos * Please refer to RFC 2047 and RFC 2822.
8207b28aSchristos */
8207b28aSchristos
8207b28aSchristos#ifdef MIME_SUPPORT
8207b28aSchristos
8207b28aSchristos#include <sys/cdefs.h>
8207b28aSchristos#ifndef __lint__
*ba2b5111Schristos__RCSID("$NetBSD: mime_header.c,v 1.9 2013/02/14 18:23:45 christos Exp $");
8207b28aSchristos#endif /* not __lint__ */
8207b28aSchristos
ca13337dSchristos#include <assert.h>
8207b28aSchristos#include <stdio.h>
8207b28aSchristos#include <stdlib.h>
8207b28aSchristos#include <string.h>
8207b28aSchristos
8207b28aSchristos#include "def.h"
8207b28aSchristos#include "extern.h"
8207b28aSchristos#include "mime.h"
8207b28aSchristos#include "mime_header.h"
8207b28aSchristos#include "mime_codecs.h"
8207b28aSchristos
/*
 * Copy the charset name of an encoded-word into from_cs.
 *
 * p points just past the leading "=?".  Characters are copied up to,
 * but not including, the next '?', and the copy is NUL terminated.
 *
 * Returns a pointer to the character following that '?', or NULL if
 * the string ends before a '?' is seen or if the name does not fit in
 * from_cs_len bytes (including the terminating NUL).
 */
static const char *
grab_charset(char *from_cs, size_t from_cs_len, const char *p)
{
	char *out = from_cs;
	char *const limit = from_cs + from_cs_len - 1;	/* slot kept for NUL */

	while (*p != '?') {
		if (*p == '\0')
			return NULL;	/* ran out of input */
		if (out >= limit)
			return NULL;	/* ran out of room */
		*out++ = *p++;
	}
	*out = '\0';
	return p + 1;	/* step over the '?' that stopped the loop */
}
8207b28aSchristos
8207b28aSchristos/*
8207b28aSchristos * An encoded word is a string of at most 75 non-white space
8207b28aSchristos * characters of the following form:
8207b28aSchristos *
8207b28aSchristos *  =?charset?X?encoding?=
8207b28aSchristos *
8207b28aSchristos * where:
8207b28aSchristos *   'charset'	is the original character set of the unencoded string.
8207b28aSchristos *
8207b28aSchristos *   'X'	is the encoding type 'B' or 'Q' for "base64" or
8207b28aSchristos *              "quoted-printable", respectively,
8207b28aSchristos *   'encoding'	is the encoded string.
8207b28aSchristos *
8207b28aSchristos * Both 'charset' and 'X' are case independent and 'encoding' cannot
8207b28aSchristos * contain any whitespace or '?' characters.  The 'encoding' must also
8207b28aSchristos * be fully contained within the encoded words, i.e., it cannot be
8207b28aSchristos * split between encoded words.
8207b28aSchristos *
8207b28aSchristos * Note: the 'B' encoding is a slightly modified "quoted-printable"
8207b28aSchristos * encoding.  In particular, spaces (' ') may be encoded as '_' to
8207b28aSchristos * improve undecoded readability.
8207b28aSchristos */
8207b28aSchristosstatic int
8207b28aSchristosdecode_word(const char **ibuf, char **obuf, char *oend, const char *to_cs)
8207b28aSchristos{
8207b28aSchristos	ssize_t declen;
8207b28aSchristos	size_t enclen, dstlen;
8207b28aSchristos	char decword[LINESIZE];
8207b28aSchristos	char from_cs[LINESIZE];
8207b28aSchristos	const char *encword, *iend, *p;
8207b28aSchristos	char *dstend;
8207b28aSchristos	char enctype;
8207b28aSchristos
8207b28aSchristos	p = *ibuf;
8207b28aSchristos	if (p[0] != '=' && p[1] != '?')
8207b28aSchristos		return -1;
8207b28aSchristos	if (strlen(p) <  2 + 1 + 3 + 1 + 2)
8207b28aSchristos		return -1;
8207b28aSchristos	p = grab_charset(from_cs, sizeof(from_cs), p + 2);
8207b28aSchristos	if (p == NULL)
8207b28aSchristos		return -1;
8207b28aSchristos	enctype = *p++;
8207b28aSchristos	if (*p++ != '?')
8207b28aSchristos		return -1;
8207b28aSchristos	encword = p;
8207b28aSchristos	p = strchr(p, '?');
8207b28aSchristos	if (p == NULL || p[1] != '=')
8207b28aSchristos		return -1;
8207b28aSchristos	enclen = p - encword;	/* length of encoded substring */
8207b28aSchristos	iend = p + 2;
8207b28aSchristos	/* encoded words are at most 75 characters (RFC 2047, sec 2) */
8207b28aSchristos	if (iend > *ibuf + 75)
8207b28aSchristos		return -1;
8207b28aSchristos
ca13337dSchristos	if (oend < *obuf + 1) {
ca13337dSchristos		assert(/*CONSTCOND*/ 0);	/* We have a coding error! */
ca13337dSchristos		return -1;
ca13337dSchristos	}
8207b28aSchristos	dstend = to_cs ? decword : *obuf;
c172e3b9Slukem	dstlen = (to_cs ? sizeof(decword) : (size_t)(oend - *obuf)) - 1;
8207b28aSchristos
*ba2b5111Schristos	declen = mime_rfc2047_decode(enctype, dstend, dstlen, encword, enclen);
8207b28aSchristos	if (declen == -1)
8207b28aSchristos		return -1;
8207b28aSchristos
8207b28aSchristos	dstend += declen;
8207b28aSchristos#ifdef CHARSET_SUPPORT
8207b28aSchristos	if (to_cs != NULL) {
8207b28aSchristos		iconv_t cd;
8207b28aSchristos		const char *src;
8207b28aSchristos		size_t srclen;
8207b28aSchristos		size_t cnt;
8207b28aSchristos
8207b28aSchristos		cd = iconv_open(to_cs, from_cs);
8207b28aSchristos		if (cd == (iconv_t)-1)
8207b28aSchristos			return -1;
8207b28aSchristos
8207b28aSchristos		src = decword;
8207b28aSchristos		srclen = declen;
8207b28aSchristos		dstend = *obuf;
8207b28aSchristos		dstlen = oend - *obuf - 1;
8207b28aSchristos		cnt = mime_iconv(cd, &src, &srclen, &dstend, &dstlen);
8207b28aSchristos
8207b28aSchristos		(void)iconv_close(cd);
8207b28aSchristos		if (cnt == (size_t)-1)
8207b28aSchristos			return -1;
8207b28aSchristos	}
8207b28aSchristos#endif /* CHARSET_SUPPORT */
8207b28aSchristos	*dstend = '\0';
8207b28aSchristos	*ibuf = iend;
8207b28aSchristos	*obuf = dstend;
8207b28aSchristos	return 0;
8207b28aSchristos}
8207b28aSchristos
8207b28aSchristos
/*
 * Folding White Space.  See RFC 2822.
 *
 * Note: RFC 2822 specifies that '\n' and '\r' only occur as CRLF
 * pairs (i.e., "\r\n") and never separately.  However, by the time
 * mail(1) sees the messages, all CRLF pairs have been converted to
 * '\n' characters, so '\r' is not treated as white space here.
 *
 * Returns 1 if c is a space, tab, or newline, and 0 otherwise.
 *
 * XXX - pull is_FWS() and skip_FWS() up to def.h?
 */
static inline int
is_FWS(int c)
{
	switch (c) {
	case ' ':
	case '\t':
	case '\n':
		return 1;
	default:
		return 0;
	}
}
8207b28aSchristos
/*
 * Return a pointer to the first character at or after p that is not
 * folding white space.  A NUL is not white space, so the scan stops
 * at the end of a NUL terminated string.
 */
static inline const char *
skip_FWS(const char *p)
{
	for (; is_FWS(*p); p++)
		continue;
	return p;
}
8207b28aSchristos
/*
 * Flush white space that was skipped after an encoded-word.
 *
 * If *src is not NULL, copy the characters in [*src, srcend) to *dst,
 * stopping early if dstend is reached, then advance *dst past what was
 * written and reset *src to NULL so the same run is not copied twice.
 * If *src is NULL nothing is pending and nothing is changed.
 */
static inline void
copy_skipped_FWS(char **dst, char *dstend, const char **src, const char *srcend)
{
	const char *in = *src;
	char *out = *dst;

	if (in == NULL)
		return;		/* nothing pending */

	for (; in < srcend && out < dstend; in++, out++)
		*out = *in;

	*dst = out;
	*src = NULL;
}
8207b28aSchristos
8207b28aSchristos/*
8207b28aSchristos * Decode an unstructured field.
8207b28aSchristos *
8207b28aSchristos * See RFC 2822 Sec 2.2.1 and 3.6.5.
8207b28aSchristos * Encoded words may occur anywhere in unstructured fields provided
8207b28aSchristos * they are separated from any other text or encoded words by at least
8207b28aSchristos * one linear-white-space character. (See RFC 2047 sec 5.1.)  If two
8207b28aSchristos * encoded words occur sequentially (separated by only FWS) then the
8207b28aSchristos * separating FWS is removed.
8207b28aSchristos *
8207b28aSchristos * NOTE: unstructured fields cannot contain 'quoted-pairs' (see
8207b28aSchristos * RFC2822 sec 3.2.6 and RFC 2047), but that is no problem as a '\\'
8207b28aSchristos * (or any non-whitespace character) immediately before an
8207b28aSchristos * encoded-word will prevent it from being decoded.
8207b28aSchristos *
8207b28aSchristos * hstring should be a NULL terminated string.
8207b28aSchristos * outbuf should be sufficiently large to hold the result.
8207b28aSchristos */
8207b28aSchristosstatic void
8207b28aSchristosmime_decode_usfield(char *outbuf, size_t outsize, const char *hstring)
8207b28aSchristos{
8207b28aSchristos	const char *p, *p0;
8207b28aSchristos	char *q, *qend;
8207b28aSchristos	int lastc;
8207b28aSchristos	const char *charset;
8207b28aSchristos
8207b28aSchristos	charset = value(ENAME_MIME_CHARSET);
8207b28aSchristos	qend = outbuf + outsize - 1; /* Make sure there is room for the trailing NULL! */
8207b28aSchristos	q = outbuf;
8207b28aSchristos	p = hstring;
8207b28aSchristos	p0 = NULL;
8207b28aSchristos	lastc = (unsigned char)' ';
8207b28aSchristos	while (*p && q < qend) {
8207b28aSchristos		const char *p1;
8207b28aSchristos		char *q1;
8207b28aSchristos		if (is_FWS(lastc) && p[0] == '=' && p[1] == '?' &&
8207b28aSchristos		    decode_word((p1 = p, &p1), (q1 = q, &q1), qend, charset) == 0 &&
d727506fSchristos		    (*p1 == '\0' || is_FWS(*p1))) {
8207b28aSchristos			p0 = p1;  /* pointer to first character after encoded word */
8207b28aSchristos			q = q1;
8207b28aSchristos			p = skip_FWS(p1);
8207b28aSchristos			lastc = (unsigned char)*p0;
8207b28aSchristos		}
8207b28aSchristos		else {
8207b28aSchristos			copy_skipped_FWS(&q, qend, &p0, p);
8207b28aSchristos			lastc = (unsigned char)*p;
8207b28aSchristos			if (q < qend)
8207b28aSchristos				*q++ = *p++;
8207b28aSchristos		}
8207b28aSchristos	}
8207b28aSchristos	copy_skipped_FWS(&q, qend, &p0, p);
8207b28aSchristos	*q = '\0';
8207b28aSchristos}
8207b28aSchristos
/*
 * Decode a field comment.
 *
 * Comments only occur in structured fields, can be nested (rfc 2822,
 * sec 3.2.3), and can contain 'encoded-words' and 'quoted-pairs'.
 * Otherwise, they can be regarded as unstructured fields that are
 * bounded by '(' and ')' characters.
 *
 * On entry *ibuf points just past the opening '(' (which the caller
 * has already copied) and *obuf at the next free output byte.  Input
 * is consumed up to and including the matching ')', or until iend or
 * oend is reached; *ibuf and *obuf are updated to reflect what was
 * consumed and written.
 *
 * Returns 0, or -1 if a nested call returned -1 (in which case *ibuf
 * and *obuf are not updated).
 */
static int
decode_comment(char **obuf, char *oend, const char **ibuf, const char *iend, const char *charset)
{
	const char *in = *ibuf;
	const char *pending = NULL;	/* FWS skipped after an encoded-word */
	char *out = *obuf;
	int prev = ' ';			/* lets an encoded-word follow the '(' */

	while (in < iend && out < oend) {
		const char *wend = in;
		char *wout = out;

		if (is_FWS(prev) && in[0] == '=' && in[1] == '?' &&
		    decode_word(&wend, &wout, oend, charset) == 0 &&
		    (*wend == ')' || is_FWS(*wend))) {
			prev = (unsigned char)*wend;
			pending = wend;
			out = wout;
			in = skip_FWS(wend);
			/*
			 * XXX - this check should be unnecessary as *iend
			 * should be '\0' which will stop skip_FWS()
			 */
			if (in > iend)
				in = iend;
			continue;
		}

		/* Not an encoded-word: the skipped FWS is significant. */
		copy_skipped_FWS(&out, oend, &pending, in);
		if (out >= oend)	/* XXX - out > oend cannot happen */
			break;

		if (*in == ')') {
			*out++ = *in++;	/* copy the closing ')' */
			break;		/* and get out of here! */
		}

		if (*in == '(') {
			*out++ = *in++;	/* copy the opening '(' */
			if (decode_comment(&out, oend, &in, iend, charset) == -1)
				return -1;	/* is this right or should we update? */
			prev = ')';
			continue;
		}

		if (*in == '\\' && in + 1 < iend) {	/* quoted-pair */
			/* keep the '\\' only where it is still needed */
			switch (in[1]) {
			case '(':
			case ')':
			case '\\':
				*out++ = *in;
				break;
			default:
				break;
			}
			in++;
			prev = (unsigned char)*in;
			if (out < oend)
				*out++ = *in++;
			continue;
		}

		prev = (unsigned char)*in;
		*out++ = *in++;
	}
	*ibuf = in;
	*obuf = out;
	return 0;
}
8207b28aSchristos
/*
 * Decode a quoted-string or no-fold-quote.
 *
 * These cannot contain encoded words.  They can contain quoted-pairs,
 * making '\\' special.  They have no other structure.  See RFC 2822
 * sec 3.2.5 and 3.6.4.
 *
 * On entry *ibuf points just past the opening '"'.  Text is copied to
 * *obuf up to and including the closing '"', or until iend or oend is
 * reached.  The '\\' of a quoted-pair is kept only in front of '"' and
 * '\\'; in front of anything else it is dropped.  *ibuf and *obuf are
 * advanced past what was consumed and written.
 */
static void
decode_quoted_string(char **obuf, char *oend, const char **ibuf, const char *iend)
{
	const char *in = *ibuf;
	char *out = *obuf;

	while (in < iend && out < oend) {
		if (*in == '"') {
			*out++ = *in++;	/* copy the closing '"' */
			break;
		}
		if (*in == '\\' && in + 1 < iend) { /* quoted-pair */
			const char escaped = in[1];

			if (escaped == '"' || escaped == '\\') {
				*out++ = '\\';
				if (out >= oend)
					break;	/* no room for the escaped char */
			}
			in++;	/* step over the '\\' */
		}
		*out++ = *in++;
	}
	*ibuf = in;
	*obuf = out;
}
8207b28aSchristos
/*
 * Decode a domain-literal or no-fold-literal.
 *
 * These cannot contain encoded words.  They can have quoted pairs and
 * are delimited by '[' and ']' making '\\', '[', and ']' special.
 * They have no other structure.  See RFC 2822 sec 3.4.1 and 3.6.4.
 *
 * On entry *ibuf points just past the opening '['.  Text is copied to
 * *obuf up to and including the closing ']', or until iend or oend is
 * reached.  The '\\' of a quoted-pair is kept only in front of '[',
 * ']' and '\\'; in front of anything else it is dropped.  *ibuf and
 * *obuf are advanced past what was consumed and written.
 */
static void
decode_domain_literal(char **obuf, char *oend, const char **ibuf, const char *iend)
{
	const char *in = *ibuf;
	char *out = *obuf;

	while (in < iend && out < oend) {
		if (*in == ']') {
			*out++ = *in++;	/* copy the closing ']' */
			break;
		}
		if (*in == '\\' && in + 1 < iend) { /* quoted-pair */
			const char escaped = in[1];

			if (escaped == '[' || escaped == ']' || escaped == '\\') {
				*out++ = '\\';
				if (out >= oend)
					break;	/* no room for the escaped char */
			}
			in++;	/* step over the '\\' */
		}
		*out++ = *in++;
	}
	*ibuf = in;
	*obuf = out;
}
8207b28aSchristos
/*
 * Specials: see RFC 2822 sec 3.2.1.
 *
 * Returns 1 if c is one of
 *	( ) < > [ ] : ; @ \ , . "
 * and 0 for every other value, including values outside 0..127.
 */
static inline int
is_specials(int c)
{
	switch (c) {
	case '"':
	case '(':
	case ')':
	case ',':
	case '.':
	case ':':
	case ';':
	case '<':
	case '>':
	case '@':
	case '[':
	case '\\':
	case ']':
		return 1;
	default:
		return 0;
	}
}
8207b28aSchristos
8207b28aSchristos/*
8207b28aSchristos * Decode a structured field.
8207b28aSchristos *
8207b28aSchristos * At the top level, structured fields can only contain encoded-words
8207b28aSchristos * via 'phrases' and 'comments'.  See RFC 2047 sec 5.
8207b28aSchristos */
8207b28aSchristosstatic void
8207b28aSchristosmime_decode_sfield(char *linebuf, size_t bufsize, const char *hstring)
8207b28aSchristos{
8207b28aSchristos	const char *p, *pend, *p0;
8207b28aSchristos	char *q, *qend;
8207b28aSchristos	const char *charset;
8207b28aSchristos	int lastc;
8207b28aSchristos
8207b28aSchristos	charset = value(ENAME_MIME_CHARSET);
8207b28aSchristos
8207b28aSchristos	p = hstring;
8207b28aSchristos	q = linebuf;
8207b28aSchristos	pend = hstring + strlen(hstring);
8207b28aSchristos	qend = linebuf + bufsize - 1;	/* save room for the NULL terminator */
8207b28aSchristos	lastc = (unsigned char)' ';
8207b28aSchristos	p0 = NULL;
8207b28aSchristos	while (p < pend && q < qend) {
8207b28aSchristos		const char *p1;
8207b28aSchristos		char *q1;
8207b28aSchristos
8207b28aSchristos		if (*p != '=') {
8207b28aSchristos			copy_skipped_FWS(&q, qend, &p0, p);
8207b28aSchristos			if (q >= qend)
8207b28aSchristos				break;
8207b28aSchristos		}
8207b28aSchristos
8207b28aSchristos		switch (*p) {
8207b28aSchristos		case '(':	/* start of comment */
8207b28aSchristos			*q++ = *p++;	/* copy the opening '(' */
8207b28aSchristos			(void)decode_comment(&q, qend, &p, pend, charset);
8207b28aSchristos			lastc = (unsigned char)p[-1];
8207b28aSchristos			break;
8207b28aSchristos
8207b28aSchristos		case '"':	/* start of quoted-string or no-fold-quote */
8207b28aSchristos			*q++ = *p++;	/* copy the opening '"' */
8207b28aSchristos			decode_quoted_string(&q, qend, &p, pend);
8207b28aSchristos			lastc = (unsigned char)p[-1];
8207b28aSchristos			break;
8207b28aSchristos
8207b28aSchristos		case '[':	/* start of domain-literal or no-fold-literal */
8207b28aSchristos			*q++ = *p++;	/* copy the opening '[' */
8207b28aSchristos			decode_domain_literal(&q, qend, &p, pend);
8207b28aSchristos			lastc = (unsigned char)p[-1];
8207b28aSchristos			break;
8207b28aSchristos
8207b28aSchristos		case '\\':	/* start of quoted-pair */
8207b28aSchristos			if (p + 1 < pend) {		/* quoted pair */
8207b28aSchristos				if (is_specials(p[1])) {
8207b28aSchristos					*q++ = *p;
8207b28aSchristos					if (q >= qend)
8207b28aSchristos						break;
8207b28aSchristos				}
8207b28aSchristos				p++;	/* skip the '\\' */
8207b28aSchristos			}
8207b28aSchristos			goto copy_char;
8207b28aSchristos
8207b28aSchristos		case '=':
8207b28aSchristos			/*
8207b28aSchristos			 * At this level encoded words can appear via
8207b28aSchristos			 * 'phrases' (possibly delimited by ',' as in
8207b28aSchristos			 * 'keywords').  Thus we handle them as such.
8207b28aSchristos			 * Hopefully this is sufficient.
8207b28aSchristos			 */
8207b28aSchristos			if ((lastc == ',' || is_FWS(lastc)) && p[1] == '?' &&
8207b28aSchristos			    decode_word((p1 = p, &p1), (q1 = q, &q1), qend, charset) == 0 &&
d727506fSchristos			    (*p1 == '\0' || *p1 == ',' || is_FWS(*p1))) {
8207b28aSchristos				lastc = (unsigned char)*p1;
8207b28aSchristos				p0 = p1;
8207b28aSchristos				q = q1;
8207b28aSchristos				p = skip_FWS(p1);
8207b28aSchristos				/*
8207b28aSchristos				 * XXX - this check should be
8207b28aSchristos				 * unnecessary as *pend should be '\0'
8207b28aSchristos				 * which will stop skip_FWS()
8207b28aSchristos				 */
8207b28aSchristos				if (p > pend)
8207b28aSchristos					p = pend;
8207b28aSchristos				break;
8207b28aSchristos			}
8207b28aSchristos			else {
8207b28aSchristos				copy_skipped_FWS(&q, qend, &p0, p);
8207b28aSchristos				if (q >= qend)
8207b28aSchristos					break;
8207b28aSchristos				goto copy_char;
8207b28aSchristos			}
8207b28aSchristos
8207b28aSchristos		case '<':	/* start of angle-addr, msg-id, or path. */
8207b28aSchristos			/*
8207b28aSchristos			 * A msg-id cannot contain encoded-pairs or
8207b28aSchristos			 * encoded-words, but angle-addr and path can.
8207b28aSchristos			 * Distinguishing between them seems to be
8207b28aSchristos			 * unnecessary, so let's be loose and just
8207b28aSchristos			 * decode them as if they were all the same.
8207b28aSchristos			 */
8207b28aSchristos		default:
8207b28aSchristos	copy_char:
8207b28aSchristos			lastc = (unsigned char)*p;
8207b28aSchristos			*q++ = *p++;
8207b28aSchristos			break;
8207b28aSchristos		}
8207b28aSchristos	}
8207b28aSchristos	copy_skipped_FWS(&q, qend, &p0, p);
8207b28aSchristos	*q = '\0';	/* null terminate the result! */
8207b28aSchristos}
8207b28aSchristos
8207b28aSchristos/*
8207b28aSchristos * Returns the correct hfield decoder, or NULL if none.
8207b28aSchristos * Info extracted from RFC 2822.
a2fe0ba0Schristos *
a2fe0ba0Schristos * name - pointer to field name of header line (with colon).
8207b28aSchristos */
8207b28aSchristosPUBLIC hfield_decoder_t
a2fe0ba0Schristosmime_hfield_decoder(const char *name)
8207b28aSchristos{
8207b28aSchristos	static const struct field_decoder_tbl_s {
8207b28aSchristos		const char *field_name;
a2fe0ba0Schristos		size_t field_len;
8207b28aSchristos		hfield_decoder_t decoder;
8207b28aSchristos	} field_decoder_tbl[] = {
a2fe0ba0Schristos#define X(s)	s, sizeof(s) - 1
a2fe0ba0Schristos		{ X("Received:"),			NULL },
a2fe0ba0Schristos
a2fe0ba0Schristos		{ X("Content-Type:"),			NULL },
a2fe0ba0Schristos		{ X("Content-Disposition:"),		NULL },
a2fe0ba0Schristos		{ X("Content-Transfer-Encoding:"),	NULL },
a2fe0ba0Schristos		{ X("Content-Description:"),		mime_decode_sfield },
a2fe0ba0Schristos		{ X("Content-ID:"),			mime_decode_sfield },
a2fe0ba0Schristos		{ X("MIME-Version:"),			mime_decode_sfield },
a2fe0ba0Schristos
a2fe0ba0Schristos		{ X("Bcc:"),				mime_decode_sfield },
a2fe0ba0Schristos		{ X("Cc:"),				mime_decode_sfield },
a2fe0ba0Schristos		{ X("Date:"),				mime_decode_sfield },
a2fe0ba0Schristos		{ X("From:"),				mime_decode_sfield },
a2fe0ba0Schristos		{ X("In-Reply-To:"),			mime_decode_sfield },
a2fe0ba0Schristos		{ X("Keywords:"),			mime_decode_sfield },
a2fe0ba0Schristos		{ X("Message-ID:"),			mime_decode_sfield },
a2fe0ba0Schristos		{ X("References:"),			mime_decode_sfield },
a2fe0ba0Schristos		{ X("Reply-To:"),			mime_decode_sfield },
a2fe0ba0Schristos		{ X("Return-Path:"),			mime_decode_sfield },
a2fe0ba0Schristos		{ X("Sender:"),				mime_decode_sfield },
a2fe0ba0Schristos		{ X("To:"),				mime_decode_sfield },
a2fe0ba0Schristos		{ X("Subject:"),			mime_decode_usfield },
a2fe0ba0Schristos		{ X("Comments:"),			mime_decode_usfield },
a2fe0ba0Schristos		{ X("X-"),				mime_decode_usfield },
a2fe0ba0Schristos		{ NULL, 0,				mime_decode_usfield },	/* optional-fields */
a2fe0ba0Schristos#undef X
8207b28aSchristos	};
8207b28aSchristos	const struct field_decoder_tbl_s *fp;
8207b28aSchristos
8207b28aSchristos	/* XXX - this begs for a hash table! */
8207b28aSchristos	for (fp = field_decoder_tbl; fp->field_name; fp++)
a2fe0ba0Schristos		if (strncasecmp(name, fp->field_name, fp->field_len) == 0)
a2fe0ba0Schristos			break;
8207b28aSchristos	return fp->decoder;
8207b28aSchristos}
8207b28aSchristos
8207b28aSchristos#endif /* MIME_SUPPORT */