1 /* $NetBSD: vis.c,v 1.24 2014/09/26 02:20:39 wiz Exp $ */ 2 3 /*- 4 * Copyright (c) 1989, 1993 5 * The Regents of the University of California. All rights reserved. 6 * 7 * Redistribution and use in source and binary forms, with or without 8 * modification, are permitted provided that the following conditions 9 * are met: 10 * 1. Redistributions of source code must retain the above copyright 11 * notice, this list of conditions and the following disclaimer. 12 * 2. Redistributions in binary form must reproduce the above copyright 13 * notice, this list of conditions and the following disclaimer in the 14 * documentation and/or other materials provided with the distribution. 15 * 3. Neither the name of the University nor the names of its contributors 16 * may be used to endorse or promote products derived from this software 17 * without specific prior written permission. 18 * 19 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND 20 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 21 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 22 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE 23 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 24 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 25 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 26 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 27 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 28 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 29 * SUCH DAMAGE. 30 */ 31 32 #include <sys/cdefs.h> 33 #ifndef lint 34 __COPYRIGHT("@(#) Copyright (c) 1989, 1993\ 35 The Regents of the University of California. All rights reserved."); 36 #endif /* not lint */ 37 38 #ifndef lint 39 #if 0 40 static char sccsid[] = "@(#)vis.c 8.1 (Berkeley) 6/6/93"; 41 #endif 42 __RCSID("$NetBSD: vis.c,v 1.24 2014/09/26 02:20:39 wiz Exp $"); 43 #endif /* not lint */ 44 45 #include <stdio.h> 46 #include <string.h> 47 #include <stdlib.h> 48 #include <string.h> 49 #include <errno.h> 50 #include <wchar.h> 51 #include <limits.h> 52 #include <unistd.h> 53 #include <err.h> 54 #include <vis.h> 55 56 #include "extern.h" 57 58 static int eflags, fold, foldwidth = 80, none, markeol; 59 #ifdef DEBUG 60 int debug; 61 #endif 62 static const char *extra = ""; 63 64 static void process(FILE *); 65 66 int 67 main(int argc, char *argv[]) 68 { 69 FILE *fp; 70 int ch; 71 int rval; 72 73 while ((ch = getopt(argc, argv, "bcde:F:fhlMmnoSstw")) != -1) 74 switch((char)ch) { 75 case 'b': 76 eflags |= VIS_NOSLASH; 77 break; 78 case 'c': 79 eflags |= VIS_CSTYLE; 80 break; 81 #ifdef DEBUG 82 case 'd': 83 debug++; 84 break; 85 #endif 86 case 'e': 87 extra = optarg; 88 break; 89 case 'F': 90 if ((foldwidth = atoi(optarg)) < 5) { 91 errx(1, "can't fold lines to less than 5 cols"); 92 /* NOTREACHED */ 93 } 94 markeol++; 95 break; 96 case 'f': 97 fold++; /* fold output lines to 80 cols */ 98 break; /* using hidden newline */ 99 case 'h': 100 eflags |= VIS_HTTPSTYLE; 101 break; 102 case 'l': 103 markeol++; /* mark end of line with \$ */ 104 break; 105 case 'm': 106 eflags |= VIS_MIMESTYLE; 107 if (foldwidth == 80) 108 foldwidth = 76; 109 break; 110 case 'M': 111 eflags |= VIS_META; 112 break; 113 case 'n': 114 none++; 115 break; 116 case 'o': 117 eflags |= VIS_OCTAL; 118 break; 119 case 's': 120 eflags |= VIS_SAFE; 121 break; 122 case 'S': 123 eflags |= VIS_SHELL; 124 break; 125 case 't': 126 eflags |= VIS_TAB; 127 break; 128 case 'w': 129 eflags |= VIS_WHITE; 130 break; 131 case '?': 132 default: 133 (void)fprintf(stderr, 134 "Usage: %s [-bcfhlMmnoSstw] [-e extra]" 135 " [-F foldwidth] [file ...]\n", getprogname()); 136 return 1; 137 } 138 139 if ((eflags & (VIS_HTTPSTYLE|VIS_MIMESTYLE)) == 140 (VIS_HTTPSTYLE|VIS_MIMESTYLE)) 141 errx(1, "Can't specify -m and -h at the same time"); 142 143 argc -= optind; 144 argv += optind; 145 146 rval = 0; 147 148 if (*argv) 149 while (*argv) { 150 if ((fp = fopen(*argv, "r")) != NULL) { 151 process(fp); 152 (void)fclose(fp); 153 } else { 154 warn("%s", *argv); 155 rval = 1; 156 } 157 argv++; 158 } 159 else 160 process(stdin); 161 return rval; 162 } 163 164 static void 165 process(FILE *fp) 166 { 167 static int col = 0; 168 static char nul[] = "\0"; 169 char *cp = nul + 1; /* so *(cp-1) starts out != '\n' */ 170 wint_t c, c1, rachar; 171 char mbibuff[2 * MB_LEN_MAX + 1]; /* max space for 2 wchars */ 172 char buff[4 * MB_LEN_MAX + 1]; /* max encoding length for one char */ 173 int mbilen, cerr = 0, raerr = 0; 174 175 /* 176 * The input stream is considered to be multibyte characters. 177 * The input loop will read this data inputing one character, 178 * possibly multiple bytes, at a time and converting each to 179 * a wide character wchar_t. 180 * 181 * The vis(3) functions, however, require single either bytes 182 * or a multibyte string as their arguments. So we convert 183 * our input wchar_t and the following look-ahead wchar_t to 184 * a multibyte string for processing by vis(3). 185 */ 186 187 /* Read one multibyte character, store as wchar_t */ 188 c = getwc(fp); 189 if (c == WEOF && errno == EILSEQ) { 190 /* Error in multibyte data. Read one byte. */ 191 c = (wint_t)getc(fp); 192 cerr = 1; 193 } 194 while (c != WEOF) { 195 /* Clear multibyte input buffer. */ 196 memset(mbibuff, 0, sizeof(mbibuff)); 197 /* Read-ahead next multibyte character. */ 198 if (!cerr) 199 rachar = getwc(fp); 200 if (cerr || (rachar == WEOF && errno == EILSEQ)) { 201 /* Error in multibyte data. Read one byte. */ 202 rachar = (wint_t)getc(fp); 203 raerr = 1; 204 } 205 if (none) { 206 /* Handle -n flag. */ 207 cp = buff; 208 *cp++ = c; 209 if (c == '\\') 210 *cp++ = '\\'; 211 *cp = '\0'; 212 } else if (markeol && c == '\n') { 213 /* Handle -l flag. */ 214 cp = buff; 215 if ((eflags & VIS_NOSLASH) == 0) 216 *cp++ = '\\'; 217 *cp++ = '$'; 218 *cp++ = '\n'; 219 *cp = '\0'; 220 } else { 221 /* 222 * Convert character using vis(3) library. 223 * At this point we will process one character. 224 * But we must pass the vis(3) library this 225 * character plus the next one because the next 226 * one is used as a look-ahead to decide how to 227 * encode this one under certain circumstances. 228 * 229 * Since our characters may be multibyte, e.g., 230 * in the UTF-8 locale, we cannot use vis() and 231 * svis() which require byte input, so we must 232 * create a multibyte string and use strvisx(). 233 */ 234 /* Treat EOF as a NUL char. */ 235 c1 = rachar; 236 if (c1 == WEOF) 237 c1 = L'\0'; 238 /* 239 * If we hit a multibyte conversion error above, 240 * insert byte directly into string buff because 241 * wctomb() will fail. Else convert wchar_t to 242 * multibyte using wctomb(). 243 */ 244 if (cerr) { 245 *mbibuff = (char)c; 246 mbilen = 1; 247 } else 248 mbilen = wctomb(mbibuff, c); 249 /* Same for look-ahead character. */ 250 if (raerr) 251 mbibuff[mbilen] = (char)c1; 252 else 253 wctomb(mbibuff + mbilen, c1); 254 /* Perform encoding on just first character. */ 255 (void) strsenvisx(buff, 4 * MB_LEN_MAX, mbibuff, 256 1, eflags, extra, &cerr); 257 } 258 259 cp = buff; 260 if (fold) { 261 #ifdef DEBUG 262 if (debug) 263 (void)printf("<%02d,", col); 264 #endif 265 col = foldit(cp, col, foldwidth, eflags); 266 #ifdef DEBUG 267 if (debug) 268 (void)printf("%02d>", col); 269 #endif 270 } 271 do { 272 (void)putchar(*cp); 273 } while (*++cp); 274 c = rachar; 275 cerr = raerr; 276 } 277 /* 278 * terminate partial line with a hidden newline 279 */ 280 if (fold && *(cp - 1) != '\n') 281 (void)printf(eflags & VIS_MIMESTYLE ? "=\n" : "\\\n"); 282 } 283