1 /* $OpenBSD: main.c,v 1.41 2020/10/13 06:07:54 martijn Exp $ */ 2 3 /*- 4 * Copyright (c) 1992 Diomidis Spinellis. 5 * Copyright (c) 1992, 1993 6 * The Regents of the University of California. All rights reserved. 7 * 8 * This code is derived from software contributed to Berkeley by 9 * Diomidis Spinellis of Imperial College, University of London. 10 * 11 * Redistribution and use in source and binary forms, with or without 12 * modification, are permitted provided that the following conditions 13 * are met: 14 * 1. Redistributions of source code must retain the above copyright 15 * notice, this list of conditions and the following disclaimer. 16 * 2. Redistributions in binary form must reproduce the above copyright 17 * notice, this list of conditions and the following disclaimer in the 18 * documentation and/or other materials provided with the distribution. 19 * 3. Neither the name of the University nor the names of its contributors 20 * may be used to endorse or promote products derived from this software 21 * without specific prior written permission. 22 * 23 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND 24 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 25 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 26 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE 27 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 28 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 29 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 30 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 31 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 32 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 33 * SUCH DAMAGE. 34 */ 35 36 #include <sys/types.h> 37 #include <sys/ioctl.h> 38 #include <sys/stat.h> 39 40 #include <ctype.h> 41 #include <errno.h> 42 #include <fcntl.h> 43 #include <limits.h> 44 #include <regex.h> 45 #include <stddef.h> 46 #include <stdio.h> 47 #include <stdlib.h> 48 #include <string.h> 49 #include <unistd.h> 50 #include <libgen.h> 51 52 #include "defs.h" 53 #include "extern.h" 54 55 /* 56 * Linked list of units (strings and files) to be compiled 57 */ 58 struct s_compunit { 59 struct s_compunit *next; 60 enum e_cut {CU_FILE, CU_STRING} type; 61 char *s; /* Pointer to string or fname */ 62 }; 63 64 /* 65 * Linked list pointer to compilation units and pointer to current 66 * next pointer. 67 */ 68 static struct s_compunit *script, **cu_nextp = &script; 69 70 /* 71 * Linked list of files to be processed 72 */ 73 struct s_flist { 74 char *fname; 75 struct s_flist *next; 76 }; 77 78 /* 79 * Linked list pointer to files and pointer to current 80 * next pointer. 81 */ 82 static struct s_flist *files, **fl_nextp = &files; 83 84 FILE *infile; /* Current input file */ 85 FILE *outfile; /* Current output file */ 86 87 int Eflag, aflag, eflag, nflag; 88 static int rval; /* Exit status */ 89 90 /* 91 * Current file and line number; line numbers restart across compilation 92 * units, but span across input files. The latter is optional if editing 93 * in place. 94 */ 95 const char *fname; /* File name. */ 96 const char *outfname; /* Output file name */ 97 static char oldfname[PATH_MAX]; /* Old file name (for in-place editing) */ 98 static char tmpfname[PATH_MAX]; /* Temporary file name (for in-place editing) */ 99 char *inplace; /* Inplace edit file extension */ 100 u_long linenum; 101 102 static void add_compunit(enum e_cut, char *); 103 static void add_file(char *); 104 static int next_files_have_lines(void); 105 106 int termwidth; 107 108 int pledge_wpath, pledge_rpath; 109 110 int 111 main(int argc, char *argv[]) 112 { 113 struct winsize win; 114 int c, fflag; 115 char *p; 116 117 fflag = 0; 118 inplace = NULL; 119 while ((c = getopt(argc, argv, "Eae:f:i::nru")) != -1) 120 switch (c) { 121 case 'E': 122 case 'r': 123 Eflag = 1; 124 break; 125 case 'a': 126 aflag = 1; 127 break; 128 case 'e': 129 eflag = 1; 130 add_compunit(CU_STRING, optarg); 131 break; 132 case 'f': 133 fflag = 1; 134 add_compunit(CU_FILE, optarg); 135 break; 136 case 'i': 137 inplace = optarg ? optarg : ""; 138 break; 139 case 'n': 140 nflag = 1; 141 break; 142 case 'u': 143 setvbuf(stdout, NULL, _IOLBF, 0); 144 break; 145 default: 146 case '?': 147 (void)fprintf(stderr, 148 "usage: sed [-aEnru] [-i[extension]] command [file ...]\n" 149 " sed [-aEnru] [-e command] [-f command_file] [-i[extension]] [file ...]\n"); 150 exit(1); 151 } 152 argc -= optind; 153 argv += optind; 154 155 termwidth = 0; 156 if ((p = getenv("COLUMNS")) != NULL) 157 termwidth = strtonum(p, 0, INT_MAX, NULL); 158 if (termwidth == 0 && ioctl(STDOUT_FILENO, TIOCGWINSZ, &win) == 0 && 159 win.ws_col > 0) 160 termwidth = win.ws_col; 161 if (termwidth == 0) 162 termwidth = 80; 163 if (termwidth <= 8) 164 termwidth = 1; 165 else 166 termwidth -= 8; 167 168 if (inplace != NULL) { 169 if (pledge("stdio rpath wpath cpath fattr chown", NULL) == -1) 170 error(FATAL, "pledge: %s", strerror(errno)); 171 } else { 172 if (pledge("stdio rpath wpath cpath", NULL) == -1) 173 error(FATAL, "pledge: %s", strerror(errno)); 174 } 175 176 /* First usage case; script is the first arg */ 177 if (!eflag && !fflag && *argv) { 178 add_compunit(CU_STRING, *argv); 179 argv++; 180 } 181 182 compile(); 183 184 /* Continue with first and start second usage */ 185 if (*argv) { 186 if (!pledge_wpath && inplace == NULL) { 187 if (pledge("stdio rpath", NULL) == -1) 188 error(FATAL, "pledge: %s", strerror(errno)); 189 } 190 for (; *argv; argv++) 191 add_file(*argv); 192 } else { 193 if (!pledge_wpath && !pledge_rpath) { 194 if (pledge("stdio", NULL) == -1) 195 error(FATAL, "pledge: %s", strerror(errno)); 196 } else if (pledge_rpath) { 197 if (pledge("stdio rpath", NULL) == -1) 198 error(FATAL, "pledge: %s", strerror(errno)); 199 } else if (pledge_wpath) { 200 if (pledge("stdio wpath cpath", NULL) == -1) 201 error(FATAL, "pledge: %s", strerror(errno)); 202 } 203 add_file(NULL); 204 } 205 process(); 206 cfclose(prog, NULL); 207 if (fclose(stdout)) 208 error(FATAL, "stdout: %s", strerror(errno)); 209 exit (rval); 210 } 211 212 /* 213 * Like fgets, but go through the chain of compilation units chaining them 214 * together. Empty strings and files are ignored. 215 */ 216 char * 217 cu_fgets(char **outbuf, size_t *outsize) 218 { 219 static enum {ST_EOF, ST_FILE, ST_STRING} state = ST_EOF; 220 static FILE *f; /* Current open file */ 221 static char *s; /* Current pointer inside string */ 222 static char string_ident[30]; 223 size_t len; 224 char *p; 225 226 if (*outbuf == NULL) 227 *outsize = 0; 228 229 again: 230 switch (state) { 231 case ST_EOF: 232 if (script == NULL) 233 return (NULL); 234 linenum = 0; 235 switch (script->type) { 236 case CU_FILE: 237 if ((f = fopen(script->s, "r")) == NULL) 238 error(FATAL, 239 "%s: %s", script->s, strerror(errno)); 240 fname = script->s; 241 state = ST_FILE; 242 goto again; 243 case CU_STRING: 244 len = snprintf(string_ident, sizeof(string_ident), 245 "\"%s\"", script->s); 246 if (len >= sizeof(string_ident)) 247 strlcpy(string_ident + 248 sizeof(string_ident) - 6, " ...\"", 5); 249 fname = string_ident; 250 s = script->s; 251 state = ST_STRING; 252 goto again; 253 } 254 case ST_FILE: 255 if ((p = fgetln(f, &len)) != NULL) { 256 linenum++; 257 if (len >= *outsize) { 258 free(*outbuf); 259 *outsize = ROUNDLEN(len + 1); 260 *outbuf = xmalloc(*outsize); 261 } 262 memcpy(*outbuf, p, len); 263 (*outbuf)[len] = '\0'; 264 if (linenum == 1 && p[0] == '#' && p[1] == 'n') 265 nflag = 1; 266 return (*outbuf); 267 } 268 script = script->next; 269 (void)fclose(f); 270 state = ST_EOF; 271 goto again; 272 case ST_STRING: 273 if (linenum == 0 && s[0] == '#' && s[1] == 'n') 274 nflag = 1; 275 p = *outbuf; 276 len = *outsize; 277 for (;;) { 278 if (len <= 1) { 279 *outbuf = xrealloc(*outbuf, 280 *outsize + _POSIX2_LINE_MAX); 281 p = *outbuf + *outsize - len; 282 len += _POSIX2_LINE_MAX; 283 *outsize += _POSIX2_LINE_MAX; 284 } 285 switch (*s) { 286 case '\0': 287 state = ST_EOF; 288 if (s == script->s) { 289 script = script->next; 290 goto again; 291 } else { 292 script = script->next; 293 *p = '\0'; 294 linenum++; 295 return (*outbuf); 296 } 297 case '\n': 298 *p++ = '\n'; 299 *p = '\0'; 300 s++; 301 linenum++; 302 return (*outbuf); 303 default: 304 *p++ = *s++; 305 len--; 306 } 307 } 308 } 309 310 return (NULL); 311 } 312 313 void 314 finish_file(void) 315 { 316 if (infile != NULL) { 317 fclose(infile); 318 if (*oldfname != '\0') { 319 if (rename(fname, oldfname) != 0) { 320 warning("rename()"); 321 unlink(tmpfname); 322 exit(1); 323 } 324 *oldfname = '\0'; 325 } 326 if (*tmpfname != '\0') { 327 if (outfile != NULL && outfile != stdout) 328 fclose(outfile); 329 outfile = NULL; 330 rename(tmpfname, fname); 331 *tmpfname = '\0'; 332 } 333 outfname = NULL; 334 } 335 } 336 337 /* 338 * Like fgets, but go through the list of files chaining them together. 339 * Set len to the length of the line. 340 */ 341 int 342 mf_fgets(SPACE *sp, enum e_spflag spflag) 343 { 344 struct stat sb; 345 size_t len; 346 char dirbuf[PATH_MAX]; 347 char *p; 348 int c, fd; 349 static int firstfile; 350 351 if (infile == NULL) { 352 /* stdin? */ 353 if (files->fname == NULL) { 354 if (inplace != NULL) 355 error(FATAL, "-i may not be used with stdin"); 356 infile = stdin; 357 fname = "stdin"; 358 outfile = stdout; 359 outfname = "stdout"; 360 } 361 362 firstfile = 1; 363 } 364 365 for (;;) { 366 if (infile != NULL && (c = getc(infile)) != EOF) { 367 (void)ungetc(c, infile); 368 break; 369 } 370 /* If we are here then either eof or no files are open yet */ 371 if (infile == stdin) { 372 sp->len = 0; 373 return (0); 374 } 375 finish_file(); 376 if (firstfile == 0) 377 files = files->next; 378 else 379 firstfile = 0; 380 if (files == NULL) { 381 sp->len = 0; 382 return (0); 383 } 384 fname = files->fname; 385 if (inplace != NULL) { 386 if (lstat(fname, &sb) != 0) 387 error(FATAL, "%s: %s", fname, 388 strerror(errno ? errno : EIO)); 389 if (!S_ISREG(sb.st_mode)) 390 error(FATAL, "%s: %s %s", fname, 391 "in-place editing only", 392 "works for regular files"); 393 if (*inplace != '\0') { 394 strlcpy(oldfname, fname, 395 sizeof(oldfname)); 396 len = strlcat(oldfname, inplace, 397 sizeof(oldfname)); 398 if (len > sizeof(oldfname)) 399 error(FATAL, "%s: name too long", fname); 400 } 401 strlcpy(dirbuf, fname, sizeof(dirbuf)); 402 len = snprintf(tmpfname, sizeof(tmpfname), 403 "%s/sedXXXXXXXXXX", dirname(dirbuf)); 404 if (len >= sizeof(tmpfname)) 405 error(FATAL, "%s: name too long", fname); 406 if ((fd = mkstemp(tmpfname)) == -1) 407 error(FATAL, "%s: %s", fname, strerror(errno)); 408 if ((outfile = fdopen(fd, "w")) == NULL) { 409 unlink(tmpfname); 410 error(FATAL, "%s", fname); 411 } 412 fchown(fileno(outfile), sb.st_uid, sb.st_gid); 413 fchmod(fileno(outfile), sb.st_mode & ALLPERMS); 414 outfname = tmpfname; 415 linenum = 0; 416 resetstate(); 417 } else { 418 outfile = stdout; 419 outfname = "stdout"; 420 } 421 if ((infile = fopen(fname, "r")) == NULL) { 422 warning("%s", strerror(errno)); 423 rval = 1; 424 continue; 425 } 426 } 427 428 /* 429 * We are here only when infile is open and we still have something 430 * to read from it. 431 * 432 * Use fgetln so that we can handle essentially infinite input data. 433 * Can't use the pointer into the stdio buffer as the process space 434 * because the ungetc() can cause it to move. 435 */ 436 p = fgetln(infile, &len); 437 if (ferror(infile)) 438 error(FATAL, "%s: %s", fname, strerror(errno ? errno : EIO)); 439 if (len != 0 && p[len - 1] == '\n') { 440 sp->append_newline = 1; 441 len--; 442 } else if (!lastline()) { 443 sp->append_newline = 1; 444 } else { 445 sp->append_newline = 0; 446 } 447 cspace(sp, p, len, spflag); 448 449 linenum++; 450 451 return (1); 452 } 453 454 /* 455 * Add a compilation unit to the linked list 456 */ 457 static void 458 add_compunit(enum e_cut type, char *s) 459 { 460 struct s_compunit *cu; 461 462 cu = xmalloc(sizeof(struct s_compunit)); 463 cu->type = type; 464 cu->s = s; 465 cu->next = NULL; 466 *cu_nextp = cu; 467 cu_nextp = &cu->next; 468 } 469 470 /* 471 * Add a file to the linked list 472 */ 473 static void 474 add_file(char *s) 475 { 476 struct s_flist *fp; 477 478 fp = xmalloc(sizeof(struct s_flist)); 479 fp->next = NULL; 480 *fl_nextp = fp; 481 fp->fname = s; 482 fl_nextp = &fp->next; 483 } 484 485 486 static int 487 next_files_have_lines() 488 { 489 struct s_flist *file; 490 FILE *file_fd; 491 int ch; 492 493 file = files; 494 while ((file = file->next) != NULL) { 495 if ((file_fd = fopen(file->fname, "r")) == NULL) 496 continue; 497 498 if ((ch = getc(file_fd)) != EOF) { 499 /* 500 * This next file has content, therefore current 501 * file doesn't contains the last line. 502 */ 503 ungetc(ch, file_fd); 504 fclose(file_fd); 505 return (1); 506 } 507 fclose(file_fd); 508 } 509 return (0); 510 } 511 512 int 513 lastline(void) 514 { 515 int ch; 516 517 if (feof(infile)) { 518 return !( 519 (inplace == NULL) && 520 next_files_have_lines()); 521 } 522 if ((ch = getc(infile)) == EOF) { 523 return !( 524 (inplace == NULL) && 525 next_files_have_lines()); 526 } 527 ungetc(ch, infile); 528 return (0); 529 } 530