1*00b67f09SDavid van Moolenbroek /* $NetBSD: selectiveencode.c,v 1.4 2014/12/10 04:37:56 christos Exp $ */
2*00b67f09SDavid van Moolenbroek
3*00b67f09SDavid van Moolenbroek #ifndef lint
4*00b67f09SDavid van Moolenbroek static char *rcsid = "Id: selectiveencode.c,v 1.1 2003/06/04 00:27:07 marka Exp ";
5*00b67f09SDavid van Moolenbroek #endif
6*00b67f09SDavid van Moolenbroek
7*00b67f09SDavid van Moolenbroek /*
8*00b67f09SDavid van Moolenbroek * Copyright (c) 2000,2002 Japan Network Information Center.
9*00b67f09SDavid van Moolenbroek * All rights reserved.
10*00b67f09SDavid van Moolenbroek *
11*00b67f09SDavid van Moolenbroek * By using this file, you agree to the terms and conditions set forth bellow.
12*00b67f09SDavid van Moolenbroek *
13*00b67f09SDavid van Moolenbroek * LICENSE TERMS AND CONDITIONS
14*00b67f09SDavid van Moolenbroek *
15*00b67f09SDavid van Moolenbroek * The following License Terms and Conditions apply, unless a different
16*00b67f09SDavid van Moolenbroek * license is obtained from Japan Network Information Center ("JPNIC"),
17*00b67f09SDavid van Moolenbroek * a Japanese association, Kokusai-Kougyou-Kanda Bldg 6F, 2-3-4 Uchi-Kanda,
18*00b67f09SDavid van Moolenbroek * Chiyoda-ku, Tokyo 101-0047, Japan.
19*00b67f09SDavid van Moolenbroek *
20*00b67f09SDavid van Moolenbroek * 1. Use, Modification and Redistribution (including distribution of any
21*00b67f09SDavid van Moolenbroek * modified or derived work) in source and/or binary forms is permitted
22*00b67f09SDavid van Moolenbroek * under this License Terms and Conditions.
23*00b67f09SDavid van Moolenbroek *
24*00b67f09SDavid van Moolenbroek * 2. Redistribution of source code must retain the copyright notices as they
25*00b67f09SDavid van Moolenbroek * appear in each source code file, this License Terms and Conditions.
26*00b67f09SDavid van Moolenbroek *
27*00b67f09SDavid van Moolenbroek * 3. Redistribution in binary form must reproduce the Copyright Notice,
28*00b67f09SDavid van Moolenbroek * this License Terms and Conditions, in the documentation and/or other
29*00b67f09SDavid van Moolenbroek * materials provided with the distribution. For the purposes of binary
30*00b67f09SDavid van Moolenbroek * distribution the "Copyright Notice" refers to the following language:
31*00b67f09SDavid van Moolenbroek * "Copyright (c) 2000-2002 Japan Network Information Center. All rights reserved."
32*00b67f09SDavid van Moolenbroek *
33*00b67f09SDavid van Moolenbroek * 4. The name of JPNIC may not be used to endorse or promote products
34*00b67f09SDavid van Moolenbroek * derived from this Software without specific prior written approval of
35*00b67f09SDavid van Moolenbroek * JPNIC.
36*00b67f09SDavid van Moolenbroek *
37*00b67f09SDavid van Moolenbroek * 5. Disclaimer/Limitation of Liability: THIS SOFTWARE IS PROVIDED BY JPNIC
38*00b67f09SDavid van Moolenbroek * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
39*00b67f09SDavid van Moolenbroek * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A
40*00b67f09SDavid van Moolenbroek * PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL JPNIC BE LIABLE
41*00b67f09SDavid van Moolenbroek * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
42*00b67f09SDavid van Moolenbroek * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
43*00b67f09SDavid van Moolenbroek * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
44*00b67f09SDavid van Moolenbroek * BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
45*00b67f09SDavid van Moolenbroek * WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR
46*00b67f09SDavid van Moolenbroek * OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF
47*00b67f09SDavid van Moolenbroek * ADVISED OF THE POSSIBILITY OF SUCH DAMAGES.
48*00b67f09SDavid van Moolenbroek */
49*00b67f09SDavid van Moolenbroek
50*00b67f09SDavid van Moolenbroek #include <config.h>
51*00b67f09SDavid van Moolenbroek
52*00b67f09SDavid van Moolenbroek #include <stddef.h>
53*00b67f09SDavid van Moolenbroek
54*00b67f09SDavid van Moolenbroek #include <idn/assert.h>
55*00b67f09SDavid van Moolenbroek #include <idn/logmacro.h>
56*00b67f09SDavid van Moolenbroek #include <idn/result.h>
57*00b67f09SDavid van Moolenbroek #include <idn/utf8.h>
58*00b67f09SDavid van Moolenbroek #include <idn/debug.h>
59*00b67f09SDavid van Moolenbroek
60*00b67f09SDavid van Moolenbroek #include "selectiveencode.h"
61*00b67f09SDavid van Moolenbroek
62*00b67f09SDavid van Moolenbroek static int is_domain_delimiter(char c);
63*00b67f09SDavid van Moolenbroek static char *find_nonascii(const char *s);
64*00b67f09SDavid van Moolenbroek
65*00b67f09SDavid van Moolenbroek idn_result_t
idn_selectiveencode_findregion(const char * s,char ** startp,char ** endp)66*00b67f09SDavid van Moolenbroek idn_selectiveencode_findregion(const char *s,
67*00b67f09SDavid van Moolenbroek char **startp, char **endp)
68*00b67f09SDavid van Moolenbroek {
69*00b67f09SDavid van Moolenbroek char *non_ascii;
70*00b67f09SDavid van Moolenbroek char *start, *end;
71*00b67f09SDavid van Moolenbroek
72*00b67f09SDavid van Moolenbroek assert(s != NULL && startp != NULL && endp != NULL);
73*00b67f09SDavid van Moolenbroek
74*00b67f09SDavid van Moolenbroek TRACE(("idn_selectiveencode_findregion(s=\"%s\")\n",
75*00b67f09SDavid van Moolenbroek idn__debug_xstring(s, 20)));
76*00b67f09SDavid van Moolenbroek
77*00b67f09SDavid van Moolenbroek /*
78*00b67f09SDavid van Moolenbroek * Scan the specified string looking for non-ascii character.
79*00b67f09SDavid van Moolenbroek */
80*00b67f09SDavid van Moolenbroek if ((non_ascii = find_nonascii(s)) == NULL)
81*00b67f09SDavid van Moolenbroek return (idn_notfound);
82*00b67f09SDavid van Moolenbroek
83*00b67f09SDavid van Moolenbroek /*
84*00b67f09SDavid van Moolenbroek * Non-ascii character found.
85*00b67f09SDavid van Moolenbroek * Determine the region to encode.
86*00b67f09SDavid van Moolenbroek */
87*00b67f09SDavid van Moolenbroek
88*00b67f09SDavid van Moolenbroek /*
89*00b67f09SDavid van Moolenbroek * First, we scan backwards to find the beginning of the region
90*00b67f09SDavid van Moolenbroek * that should be converted.
91*00b67f09SDavid van Moolenbroek */
92*00b67f09SDavid van Moolenbroek start = non_ascii;
93*00b67f09SDavid van Moolenbroek while (start > s) {
94*00b67f09SDavid van Moolenbroek char *prev = idn_utf8_findfirstbyte(start - 1, s);
95*00b67f09SDavid van Moolenbroek if (is_domain_delimiter(*prev))
96*00b67f09SDavid van Moolenbroek break; /* Found */
97*00b67f09SDavid van Moolenbroek start = prev;
98*00b67f09SDavid van Moolenbroek }
99*00b67f09SDavid van Moolenbroek *startp = start;
100*00b67f09SDavid van Moolenbroek
101*00b67f09SDavid van Moolenbroek /*
102*00b67f09SDavid van Moolenbroek * Next we scan forwards looking for the end of the region.
103*00b67f09SDavid van Moolenbroek */
104*00b67f09SDavid van Moolenbroek end = non_ascii + idn_utf8_mblen(non_ascii);
105*00b67f09SDavid van Moolenbroek while (!is_domain_delimiter(*end))
106*00b67f09SDavid van Moolenbroek end += idn_utf8_mblen(end);
107*00b67f09SDavid van Moolenbroek *endp = end;
108*00b67f09SDavid van Moolenbroek
109*00b67f09SDavid van Moolenbroek return (idn_success);
110*00b67f09SDavid van Moolenbroek }
111*00b67f09SDavid van Moolenbroek
/*
 * Return 1 if 'c' delimits a domain name, 0 otherwise.
 *
 * A delimiter is any ASCII byte (including NUL) other than a letter,
 * a digit, '-' or '.'.  Bytes >= 0x80 are never delimiters.
 */
static int
is_domain_delimiter(char c) {
	unsigned char byte = (unsigned char)c;

	/* Non-ASCII bytes always belong to the name. */
	if (byte >= 0x80)
		return (0);

	/* ASCII letters and digits belong to the name. */
	if (('A' <= byte && byte <= 'Z') ||
	    ('a' <= byte && byte <= 'z') ||
	    ('0' <= byte && byte <= '9'))
		return (0);

	/* So do the hyphen and the label separator. */
	if (byte == '-' || byte == '.')
		return (0);

	return (1);
}
120*00b67f09SDavid van Moolenbroek
/*
 * Return a pointer to the first byte >= 0x80 in the NUL-terminated
 * string 's', or NULL if every byte before the terminator is ASCII.
 */
static char *
find_nonascii(const char *s) {
	const unsigned char *p;

	for (p = (const unsigned char *)s; *p != '\0'; p++) {
		if (*p >= 0x80)
			return ((char *)p);
	}
	return (NULL);
}
130