1 /* $NetBSD: vis.c,v 1.45 2012/12/14 21:38:18 christos Exp $ */ 2 3 /*- 4 * Copyright (c) 1989, 1993 5 * The Regents of the University of California. All rights reserved. 6 * 7 * Redistribution and use in source and binary forms, with or without 8 * modification, are permitted provided that the following conditions 9 * are met: 10 * 1. Redistributions of source code must retain the above copyright 11 * notice, this list of conditions and the following disclaimer. 12 * 2. Redistributions in binary form must reproduce the above copyright 13 * notice, this list of conditions and the following disclaimer in the 14 * documentation and/or other materials provided with the distribution. 15 * 3. Neither the name of the University nor the names of its contributors 16 * may be used to endorse or promote products derived from this software 17 * without specific prior written permission. 18 * 19 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND 20 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 21 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 22 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE 23 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 24 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 25 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 26 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 27 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 28 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 29 * SUCH DAMAGE. 30 */ 31 32 /*- 33 * Copyright (c) 1999, 2005 The NetBSD Foundation, Inc. 34 * All rights reserved. 35 * 36 * Redistribution and use in source and binary forms, with or without 37 * modification, are permitted provided that the following conditions 38 * are met: 39 * 1. Redistributions of source code must retain the above copyright 40 * notice, this list of conditions and the following disclaimer. 41 * 2. Redistributions in binary form must reproduce the above copyright 42 * notice, this list of conditions and the following disclaimer in the 43 * documentation and/or other materials provided with the distribution. 44 * 45 * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS 46 * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED 47 * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR 48 * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS 49 * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR 50 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF 51 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS 52 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN 53 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) 54 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE 55 * POSSIBILITY OF SUCH DAMAGE. 56 */ 57 58 #include <sys/cdefs.h> 59 #if defined(LIBC_SCCS) && !defined(lint) 60 __RCSID("$NetBSD: vis.c,v 1.45 2012/12/14 21:38:18 christos Exp $"); 61 #endif /* LIBC_SCCS and not lint */ 62 63 #include "namespace.h" 64 #include <sys/types.h> 65 66 #include <assert.h> 67 #include <vis.h> 68 #include <errno.h> 69 #include <stdlib.h> 70 71 #ifdef __weak_alias 72 __weak_alias(strvisx,_strvisx) 73 #endif 74 75 #if !HAVE_VIS || !HAVE_SVIS 76 #include <ctype.h> 77 #include <limits.h> 78 #include <stdio.h> 79 #include <string.h> 80 81 static char *do_svis(char *, size_t *, int, int, int, const char *); 82 83 #undef BELL 84 #define BELL '\a' 85 86 #define isoctal(c) (((u_char)(c)) >= '0' && ((u_char)(c)) <= '7') 87 #define iswhite(c) (c == ' ' || c == '\t' || c == '\n') 88 #define issafe(c) (c == '\b' || c == BELL || c == '\r') 89 #define xtoa(c) "0123456789abcdef"[c] 90 #define XTOA(c) "0123456789ABCDEF"[c] 91 92 #define MAXEXTRAS 9 93 94 #define MAKEEXTRALIST(flag, extra, orig_str) \ 95 do { \ 96 const char *orig = orig_str; \ 97 const char *o = orig; \ 98 char *e; \ 99 while (*o++) \ 100 continue; \ 101 extra = malloc((size_t)((o - orig) + MAXEXTRAS)); \ 102 if (!extra) break; \ 103 for (o = orig, e = extra; (*e++ = *o++) != '\0';) \ 104 continue; \ 105 e--; \ 106 if (flag & VIS_GLOB) { \ 107 *e++ = '*'; \ 108 *e++ = '?'; \ 109 *e++ = '['; \ 110 *e++ = '#'; \ 111 } \ 112 if (flag & VIS_SP) *e++ = ' '; \ 113 if (flag & VIS_TAB) *e++ = '\t'; \ 114 if (flag & VIS_NL) *e++ = '\n'; \ 115 if ((flag & VIS_NOSLASH) == 0) *e++ = '\\'; \ 116 *e = '\0'; \ 117 } while (/*CONSTCOND*/0) 118 119 /* 120 * This is do_hvis, for HTTP style (RFC 1808) 121 */ 122 static char * 123 do_hvis(char *dst, size_t *dlen, int c, int flag, int nextc, const char *extra) 124 { 125 126 if ((isascii(c) && isalnum(c)) 127 /* safe */ 128 || c == '$' || c == '-' || c == '_' || c == '.' || c == '+' 129 /* extra */ 130 || c == '!' || c == '*' || c == '\'' || c == '(' || c == ')' 131 || c == ',') { 132 dst = do_svis(dst, dlen, c, flag, nextc, extra); 133 } else { 134 if (dlen) { 135 if (*dlen < 3) 136 return NULL; 137 *dlen -= 3; 138 } 139 *dst++ = '%'; 140 *dst++ = xtoa(((unsigned int)c >> 4) & 0xf); 141 *dst++ = xtoa((unsigned int)c & 0xf); 142 } 143 144 return dst; 145 } 146 147 /* 148 * This is do_mvis, for Quoted-Printable MIME (RFC 2045) 149 * NB: No handling of long lines or CRLF. 150 */ 151 static char * 152 do_mvis(char *dst, size_t *dlen, int c, int flag, int nextc, const char *extra) 153 { 154 if ((c != '\n') && 155 /* Space at the end of the line */ 156 ((isspace(c) && (nextc == '\r' || nextc == '\n')) || 157 /* Out of range */ 158 (!isspace(c) && (c < 33 || (c > 60 && c < 62) || c > 126)) || 159 /* Specific char to be escaped */ 160 strchr("#$@[\\]^`{|}~", c) != NULL)) { 161 if (dlen) { 162 if (*dlen < 3) 163 return NULL; 164 *dlen -= 3; 165 } 166 *dst++ = '='; 167 *dst++ = XTOA(((unsigned int)c >> 4) & 0xf); 168 *dst++ = XTOA((unsigned int)c & 0xf); 169 } else { 170 dst = do_svis(dst, dlen, c, flag, nextc, extra); 171 } 172 return dst; 173 } 174 175 /* 176 * This is do_vis, the central code of vis. 177 * dst: Pointer to the destination buffer 178 * c: Character to encode 179 * flag: Flag word 180 * nextc: The character following 'c' 181 * extra: Pointer to the list of extra characters to be 182 * backslash-protected. 183 */ 184 static char * 185 do_svis(char *dst, size_t *dlen, int c, int flag, int nextc, const char *extra) 186 { 187 int isextra; 188 size_t odlen = dlen ? *dlen : 0; 189 190 isextra = strchr(extra, c) != NULL; 191 #define HAVE(x) \ 192 do { \ 193 if (dlen) { \ 194 if (*dlen < (x)) \ 195 goto out; \ 196 *dlen -= (x); \ 197 } \ 198 } while (/*CONSTCOND*/0) 199 if (!isextra && isascii(c) && (isgraph(c) || iswhite(c) || 200 ((flag & VIS_SAFE) && issafe(c)))) { 201 HAVE(1); 202 *dst++ = c; 203 return dst; 204 } 205 if (flag & VIS_CSTYLE) { 206 HAVE(2); 207 switch (c) { 208 case '\n': 209 *dst++ = '\\'; *dst++ = 'n'; 210 return dst; 211 case '\r': 212 *dst++ = '\\'; *dst++ = 'r'; 213 return dst; 214 case '\b': 215 *dst++ = '\\'; *dst++ = 'b'; 216 return dst; 217 case BELL: 218 *dst++ = '\\'; *dst++ = 'a'; 219 return dst; 220 case '\v': 221 *dst++ = '\\'; *dst++ = 'v'; 222 return dst; 223 case '\t': 224 *dst++ = '\\'; *dst++ = 't'; 225 return dst; 226 case '\f': 227 *dst++ = '\\'; *dst++ = 'f'; 228 return dst; 229 case ' ': 230 *dst++ = '\\'; *dst++ = 's'; 231 return dst; 232 case '\0': 233 *dst++ = '\\'; *dst++ = '0'; 234 if (isoctal(nextc)) { 235 HAVE(2); 236 *dst++ = '0'; 237 *dst++ = '0'; 238 } 239 return dst; 240 default: 241 if (isgraph(c)) { 242 *dst++ = '\\'; *dst++ = c; 243 return dst; 244 } 245 if (dlen) 246 *dlen = odlen; 247 } 248 } 249 if (isextra || ((c & 0177) == ' ') || (flag & VIS_OCTAL)) { 250 HAVE(4); 251 *dst++ = '\\'; 252 *dst++ = (u_char)(((u_int32_t)(u_char)c >> 6) & 03) + '0'; 253 *dst++ = (u_char)(((u_int32_t)(u_char)c >> 3) & 07) + '0'; 254 *dst++ = (c & 07) + '0'; 255 } else { 256 if ((flag & VIS_NOSLASH) == 0) { 257 HAVE(1); 258 *dst++ = '\\'; 259 } 260 261 if (c & 0200) { 262 HAVE(1); 263 c &= 0177; *dst++ = 'M'; 264 } 265 266 if (iscntrl(c)) { 267 HAVE(2); 268 *dst++ = '^'; 269 if (c == 0177) 270 *dst++ = '?'; 271 else 272 *dst++ = c + '@'; 273 } else { 274 HAVE(2); 275 *dst++ = '-'; *dst++ = c; 276 } 277 } 278 return dst; 279 out: 280 *dlen = odlen; 281 return NULL; 282 } 283 284 typedef char *(*visfun_t)(char *, size_t *, int, int, int, const char *); 285 286 /* 287 * Return the appropriate encoding function depending on the flags given. 288 */ 289 static visfun_t 290 getvisfun(int flag) 291 { 292 if (flag & VIS_HTTPSTYLE) 293 return do_hvis; 294 if (flag & VIS_MIMESTYLE) 295 return do_mvis; 296 return do_svis; 297 } 298 299 /* 300 * isnvis - visually encode characters, also encoding the characters 301 * pointed to by `extra' 302 */ 303 static char * 304 isnvis(char *dst, size_t *dlen, int c, int flag, int nextc, const char *extra) 305 { 306 char *nextra = NULL; 307 visfun_t f; 308 309 _DIAGASSERT(dst != NULL); 310 _DIAGASSERT(extra != NULL); 311 MAKEEXTRALIST(flag, nextra, extra); 312 if (!nextra) { 313 if (dlen && *dlen == 0) { 314 errno = ENOSPC; 315 return NULL; 316 } 317 *dst = '\0'; /* can't create nextra, return "" */ 318 return dst; 319 } 320 f = getvisfun(flag); 321 dst = (*f)(dst, dlen, c, flag, nextc, nextra); 322 free(nextra); 323 if (dst == NULL || (dlen && *dlen == 0)) { 324 errno = ENOSPC; 325 return NULL; 326 } 327 *dst = '\0'; 328 return dst; 329 } 330 331 char * 332 svis(char *dst, int c, int flag, int nextc, const char *extra) 333 { 334 return isnvis(dst, NULL, c, flag, nextc, extra); 335 } 336 337 char * 338 snvis(char *dst, size_t dlen, int c, int flag, int nextc, const char *extra) 339 { 340 return isnvis(dst, &dlen, c, flag, nextc, extra); 341 } 342 343 344 /* 345 * strsvis, strsvisx - visually encode characters from src into dst 346 * 347 * Extra is a pointer to a \0-terminated list of characters to 348 * be encoded, too. These functions are useful e. g. to 349 * encode strings in such a way so that they are not interpreted 350 * by a shell. 351 * 352 * Dst must be 4 times the size of src to account for possible 353 * expansion. The length of dst, not including the trailing NULL, 354 * is returned. 355 * 356 * Strsvisx encodes exactly len bytes from src into dst. 357 * This is useful for encoding a block of data. 358 */ 359 static int 360 istrsnvis(char *dst, size_t *dlen, const char *csrc, int flag, const char *extra) 361 { 362 int c; 363 char *start; 364 char *nextra = NULL; 365 const unsigned char *src = (const unsigned char *)csrc; 366 visfun_t f; 367 368 _DIAGASSERT(dst != NULL); 369 _DIAGASSERT(src != NULL); 370 _DIAGASSERT(extra != NULL); 371 MAKEEXTRALIST(flag, nextra, extra); 372 if (!nextra) { 373 *dst = '\0'; /* can't create nextra, return "" */ 374 return 0; 375 } 376 f = getvisfun(flag); 377 for (start = dst; (c = *src++) != '\0'; /* empty */) { 378 dst = (*f)(dst, dlen, c, flag, *src, nextra); 379 if (dst == NULL) { 380 errno = ENOSPC; 381 return -1; 382 } 383 } 384 free(nextra); 385 if (dlen && *dlen == 0) { 386 errno = ENOSPC; 387 return -1; 388 } 389 *dst = '\0'; 390 return (int)(dst - start); 391 } 392 393 int 394 strsvis(char *dst, const char *csrc, int flag, const char *extra) 395 { 396 return istrsnvis(dst, NULL, csrc, flag, extra); 397 } 398 399 int 400 strsnvis(char *dst, size_t dlen, const char *csrc, int flag, const char *extra) 401 { 402 return istrsnvis(dst, &dlen, csrc, flag, extra); 403 } 404 405 static int 406 istrsnvisx(char *dst, size_t *dlen, const char *csrc, size_t len, int flag, 407 const char *extra) 408 { 409 unsigned char c; 410 char *start; 411 char *nextra = NULL; 412 const unsigned char *src = (const unsigned char *)csrc; 413 visfun_t f; 414 415 _DIAGASSERT(dst != NULL); 416 _DIAGASSERT(src != NULL); 417 _DIAGASSERT(extra != NULL); 418 MAKEEXTRALIST(flag, nextra, extra); 419 if (! nextra) { 420 if (dlen && *dlen == 0) { 421 errno = ENOSPC; 422 return -1; 423 } 424 *dst = '\0'; /* can't create nextra, return "" */ 425 return 0; 426 } 427 428 f = getvisfun(flag); 429 for (start = dst; len > 0; len--) { 430 c = *src++; 431 dst = (*f)(dst, dlen, c, flag, len > 1 ? *src : '\0', nextra); 432 if (dst == NULL) { 433 errno = ENOSPC; 434 return -1; 435 } 436 } 437 free(nextra); 438 if (dlen && *dlen == 0) { 439 errno = ENOSPC; 440 return -1; 441 } 442 *dst = '\0'; 443 return (int)(dst - start); 444 } 445 446 int 447 strsvisx(char *dst, const char *csrc, size_t len, int flag, const char *extra) 448 { 449 return istrsnvisx(dst, NULL, csrc, len, flag, extra); 450 } 451 452 int 453 strsnvisx(char *dst, size_t dlen, const char *csrc, size_t len, int flag, 454 const char *extra) 455 { 456 return istrsnvisx(dst, &dlen, csrc, len, flag, extra); 457 } 458 #endif 459 460 #if !HAVE_VIS 461 /* 462 * vis - visually encode characters 463 */ 464 static char * 465 invis(char *dst, size_t *dlen, int c, int flag, int nextc) 466 { 467 char *extra = NULL; 468 unsigned char uc = (unsigned char)c; 469 visfun_t f; 470 471 _DIAGASSERT(dst != NULL); 472 473 MAKEEXTRALIST(flag, extra, ""); 474 if (! extra) { 475 if (dlen && *dlen == 0) { 476 errno = ENOSPC; 477 return NULL; 478 } 479 *dst = '\0'; /* can't create extra, return "" */ 480 return dst; 481 } 482 f = getvisfun(flag); 483 dst = (*f)(dst, dlen, uc, flag, nextc, extra); 484 free(extra); 485 if (dst == NULL || (dlen && *dlen == 0)) { 486 errno = ENOSPC; 487 return NULL; 488 } 489 *dst = '\0'; 490 return dst; 491 } 492 493 char * 494 vis(char *dst, int c, int flag, int nextc) 495 { 496 return invis(dst, NULL, c, flag, nextc); 497 } 498 499 char * 500 nvis(char *dst, size_t dlen, int c, int flag, int nextc) 501 { 502 return invis(dst, &dlen, c, flag, nextc); 503 } 504 505 506 /* 507 * strvis, strvisx - visually encode characters from src into dst 508 * 509 * Dst must be 4 times the size of src to account for possible 510 * expansion. The length of dst, not including the trailing NULL, 511 * is returned. 512 * 513 * Strvisx encodes exactly len bytes from src into dst. 514 * This is useful for encoding a block of data. 515 */ 516 static int 517 istrnvis(char *dst, size_t *dlen, const char *src, int flag) 518 { 519 char *extra = NULL; 520 int rv; 521 522 MAKEEXTRALIST(flag, extra, ""); 523 if (!extra) { 524 if (dlen && *dlen == 0) { 525 errno = ENOSPC; 526 return -1; 527 } 528 *dst = '\0'; /* can't create extra, return "" */ 529 return 0; 530 } 531 rv = istrsnvis(dst, dlen, src, flag, extra); 532 free(extra); 533 return rv; 534 } 535 536 int 537 strvis(char *dst, const char *src, int flag) 538 { 539 return istrnvis(dst, NULL, src, flag); 540 } 541 542 int 543 strnvis(char *dst, size_t dlen, const char *src, int flag) 544 { 545 return istrnvis(dst, &dlen, src, flag); 546 } 547 548 static int 549 istrnvisx(char *dst, size_t *dlen, const char *src, size_t len, int flag) 550 { 551 char *extra = NULL; 552 int rv; 553 554 MAKEEXTRALIST(flag, extra, ""); 555 if (!extra) { 556 if (dlen && *dlen == 0) { 557 errno = ENOSPC; 558 return -1; 559 } 560 *dst = '\0'; /* can't create extra, return "" */ 561 return 0; 562 } 563 rv = istrsnvisx(dst, dlen, src, len, flag, extra); 564 free(extra); 565 return rv; 566 } 567 568 int 569 strvisx(char *dst, const char *src, size_t len, int flag) 570 { 571 return istrnvisx(dst, NULL, src, len, flag); 572 } 573 574 int 575 strnvisx(char *dst, size_t dlen, const char *src, size_t len, int flag) 576 { 577 return istrnvisx(dst, &dlen, src, len, flag); 578 } 579 580 #endif 581