xref: /openbsd-src/usr.bin/patch/inp.c (revision 6f05df2d9be0954bec42d51d943d77bd250fb664)
1 /*	$OpenBSD: inp.c,v 1.41 2014/11/25 10:22:08 tobias Exp $	*/
2 
3 /*
4  * patch - a program to apply diffs to original files
5  *
6  * Copyright 1986, Larry Wall
7  *
8  * Redistribution and use in source and binary forms, with or without
9  * modification, are permitted provided that the following condition is met:
10  * 1. Redistributions of source code must retain the above copyright notice,
11  * this condition and the following disclaimer.
12  *
13  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND ANY
14  * EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
15  * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
16  * DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE FOR
17  * ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
18  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
19  * SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
20  * CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
21  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
22  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
23  * SUCH DAMAGE.
24  *
25  * -C option added in 1998, original code by Marc Espie, based on FreeBSD
26  * behaviour
27  */
28 
29 #include <sys/types.h>
30 #include <sys/file.h>
31 #include <sys/stat.h>
32 #include <sys/mman.h>
33 
34 #include <ctype.h>
35 #include <libgen.h>
36 #include <limits.h>
37 #include <stddef.h>
38 #include <stdio.h>
39 #include <stdlib.h>
40 #include <string.h>
41 #include <unistd.h>
42 
43 #include "common.h"
44 #include "util.h"
45 #include "pch.h"
46 #include "inp.h"
47 
48 
/*
 * Input-file-with-indexable-lines abstract type
 *
 * The file being patched is indexed either by plan_a(), which maps the
 * whole file into memory, or by plan_b(), which copies it into a
 * temporary file of fixed-length records.  ifetch() returns a line from
 * whichever representation is active.
 */

/* Plan A state */
static off_t	i_size;		/* size of the input file */
static char	*i_womp;	/* plan a buffer for entire file (mmap'ed) */
static char	**i_ptr;	/* pointers to lines in i_womp; line 1 is i_ptr[1] */

/* Plan B state */
static int	tifd = -1;	/* plan b virtual string array (fd of TMPINNAME) */
static char	*tibuf[2];	/* plan b buffers, each caching one block of records */
static LINENUM	tiline[2] = {-1, -1};	/* 1st line in each buffer; -1 = nothing loaded */
static LINENUM	lines_per_buf;	/* how many lines per buffer */
static int	tireclen;	/* length of records in tmp file */

/* true if the string contains the wanted revision (or none is wanted) */
static bool	rev_in_string(const char *);
/* grows i_ptr; returns false (after releasing plan a state) on failure */
static bool	reallocate_lines(size_t *);

/* returns false if insufficient memory */
static bool	plan_a(const char *);

/* fallback used by scan_input() when plan_a() returns false */
static void	plan_b(const char *);
68 
69 /* New patch--prepare to edit another file. */
70 
71 void
72 re_input(void)
73 {
74 	if (using_plan_a) {
75 		free(i_ptr);
76 		i_ptr = NULL;
77 		if (i_womp != NULL) {
78 			munmap(i_womp, i_size);
79 			i_womp = NULL;
80 		}
81 		i_size = 0;
82 	} else {
83 		using_plan_a = true;	/* maybe the next one is smaller */
84 		close(tifd);
85 		tifd = -1;
86 		free(tibuf[0]);
87 		free(tibuf[1]);
88 		tibuf[0] = tibuf[1] = NULL;
89 		tiline[0] = tiline[1] = -1;
90 		tireclen = 0;
91 	}
92 }
93 
94 /* Construct the line index, somehow or other. */
95 
96 void
97 scan_input(const char *filename)
98 {
99 	if (!plan_a(filename))
100 		plan_b(filename);
101 	if (verbose) {
102 		say("Patching file %s using Plan %s...\n", filename,
103 		    (using_plan_a ? "A" : "B"));
104 	}
105 }
106 
107 static bool
108 reallocate_lines(size_t *lines_allocated)
109 {
110 	char	**p;
111 	size_t	new_size;
112 
113 	new_size = *lines_allocated * 3 / 2;
114 	p = reallocarray(i_ptr, new_size + 2, sizeof(char *));
115 	if (p == NULL) {	/* shucks, it was a near thing */
116 		munmap(i_womp, i_size);
117 		i_womp = NULL;
118 		free(i_ptr);
119 		i_ptr = NULL;
120 		*lines_allocated = 0;
121 		return false;
122 	}
123 	*lines_allocated = new_size;
124 	i_ptr = p;
125 	return true;
126 }
127 
128 /* Try keeping everything in memory. */
129 
130 static bool
131 plan_a(const char *filename)
132 {
133 	int		ifd, statfailed;
134 	char		*p, *s, lbuf[MAXLINELEN];
135 	struct stat	filestat;
136 	off_t		i;
137 	ptrdiff_t	sz;
138 	size_t		iline, lines_allocated;
139 
140 #ifdef DEBUGGING
141 	if (debug & 8)
142 		return false;
143 #endif
144 
145 	if (filename == NULL || *filename == '\0')
146 		return false;
147 
148 	statfailed = stat(filename, &filestat);
149 	if (statfailed && ok_to_create_file) {
150 		if (verbose)
151 			say("(Creating file %s...)\n", filename);
152 
153 		/*
154 		 * in check_patch case, we still display `Creating file' even
155 		 * though we're not. The rule is that -C should be as similar
156 		 * to normal patch behavior as possible
157 		 */
158 		if (check_only)
159 			return true;
160 		makedirs(filename, true);
161 		close(creat(filename, 0666));
162 		statfailed = stat(filename, &filestat);
163 	}
164 	if (statfailed && check_only)
165 		fatal("%s not found, -C mode, can't probe further\n", filename);
166 	/* For nonexistent or read-only files, look for RCS versions.  */
167 	if (statfailed ||
168 	    /* No one can write to it.  */
169 	    (filestat.st_mode & 0222) == 0 ||
170 	    /* I can't write to it.  */
171 	    ((filestat.st_mode & 0022) == 0 && filestat.st_uid != getuid())) {
172 		char	*cs = NULL, *filebase, *filedir;
173 		struct stat	cstat;
174 
175 		filebase = basename(filename);
176 		filedir = dirname(filename);
177 
178 		/* Leave room in lbuf for the diff command.  */
179 		s = lbuf + 20;
180 
181 #define try(f, a1, a2, a3) \
182 	(snprintf(s, sizeof lbuf - 20, f, a1, a2, a3), stat(s, &cstat) == 0)
183 
184 		if (try("%s/RCS/%s%s", filedir, filebase, RCSSUFFIX) ||
185 		    try("%s/RCS/%s%s", filedir, filebase, "") ||
186 		    try("%s/%s%s", filedir, filebase, RCSSUFFIX)) {
187 			snprintf(buf, sizeof buf, CHECKOUT, filename);
188 			snprintf(lbuf, sizeof lbuf, RCSDIFF, filename);
189 			cs = "RCS";
190 		} else if (statfailed)
191 			fatal("can't find %s\n", filename);
192 		/*
193 		 * else we can't write to it but it's not under a version
194 		 * control system, so just proceed.
195 		 */
196 		if (cs) {
197 			if (!statfailed) {
198 				if ((filestat.st_mode & 0222) != 0)
199 					/* The owner can write to it.  */
200 					fatal("file %s seems to be locked "
201 					    "by somebody else under %s\n",
202 					    filename, cs);
203 				/*
204 				 * It might be checked out unlocked.  See if
205 				 * it's safe to check out the default version
206 				 * locked.
207 				 */
208 				if (verbose)
209 					say("Comparing file %s to default "
210 					    "%s version...\n",
211 					    filename, cs);
212 				if (system(lbuf))
213 					fatal("can't check out file %s: "
214 					    "differs from default %s version\n",
215 					    filename, cs);
216 			}
217 			if (verbose)
218 				say("Checking out file %s from %s...\n",
219 				    filename, cs);
220 			if (system(buf) || stat(filename, &filestat))
221 				fatal("can't check out file %s from %s\n",
222 				    filename, cs);
223 		}
224 	}
225 	filemode = filestat.st_mode;
226 	if (!S_ISREG(filemode))
227 		fatal("%s is not a normal file--can't patch\n", filename);
228 	i_size = filestat.st_size;
229 	if (out_of_mem) {
230 		set_hunkmax();	/* make sure dynamic arrays are allocated */
231 		out_of_mem = false;
232 		return false;	/* force plan b because plan a bombed */
233 	}
234 	if (i_size > SIZE_MAX) {
235 		say("block too large to mmap\n");
236 		return false;
237 	}
238 	if ((ifd = open(filename, O_RDONLY)) < 0)
239 		pfatal("can't open file %s", filename);
240 
241 	if (i_size) {
242 		i_womp = mmap(NULL, i_size, PROT_READ, MAP_PRIVATE, ifd, 0);
243 		if (i_womp == MAP_FAILED) {
244 			perror("mmap failed");
245 			i_womp = NULL;
246 			close(ifd);
247 			return false;
248 		}
249 	} else {
250 		i_womp = NULL;
251 	}
252 
253 	close(ifd);
254 	if (i_size)
255 		madvise(i_womp, i_size, MADV_SEQUENTIAL);
256 
257 	/* estimate the number of lines */
258 	lines_allocated = i_size / 25;
259 	if (lines_allocated < 100)
260 		lines_allocated = 100;
261 
262 	if (!reallocate_lines(&lines_allocated))
263 		return false;
264 
265 	/* now scan the buffer and build pointer array */
266 	iline = 1;
267 	i_ptr[iline] = i_womp;
268 	/* test for NUL too, to maintain the behavior of the original code */
269 	for (s = i_womp, i = 0; i < i_size && *s != '\0'; s++, i++) {
270 		if (*s == '\n') {
271 			if (iline == lines_allocated) {
272 				if (!reallocate_lines(&lines_allocated))
273 					return false;
274 			}
275 			/* these are NOT NUL terminated */
276 			i_ptr[++iline] = s + 1;
277 		}
278 	}
279 	/* if the last line contains no EOL, append one */
280 	if (i_size > 0 && i_womp[i_size - 1] != '\n') {
281 		last_line_missing_eol = true;
282 		/* fix last line */
283 		sz = s - i_ptr[iline];
284 		p = malloc(sz + 1);
285 		if (p == NULL) {
286 			free(i_ptr);
287 			i_ptr = NULL;
288 			munmap(i_womp, i_size);
289 			i_womp = NULL;
290 			return false;
291 		}
292 
293 		memcpy(p, i_ptr[iline], sz);
294 		p[sz] = '\n';
295 		i_ptr[iline] = p;
296 		/* count the extra line and make it point to some valid mem */
297 		i_ptr[++iline] = "";
298 	} else
299 		last_line_missing_eol = false;
300 
301 	input_lines = iline - 1;
302 
303 	/* now check for revision, if any */
304 
305 	if (revision != NULL) {
306 		if (i_womp == NULL || !rev_in_string(i_womp)) {
307 			if (force) {
308 				if (verbose)
309 					say("Warning: this file doesn't appear "
310 					    "to be the %s version--patching anyway.\n",
311 					    revision);
312 			} else if (batch) {
313 				fatal("this file doesn't appear to be the "
314 				    "%s version--aborting.\n",
315 				    revision);
316 			} else {
317 				ask("This file doesn't appear to be the "
318 				    "%s version--patch anyway? [n] ",
319 				    revision);
320 				if (*buf != 'y')
321 					fatal("aborted\n");
322 			}
323 		} else if (verbose)
324 			say("Good.  This file appears to be the %s version.\n",
325 			    revision);
326 	}
327 	return true;		/* plan a will work */
328 }
329 
330 /* Keep (virtually) nothing in memory. */
331 
332 static void
333 plan_b(const char *filename)
334 {
335 	FILE	*ifp;
336 	size_t	i = 0, j, maxlen = 1;
337 	char	*p;
338 	bool	found_revision = (revision == NULL);
339 
340 	using_plan_a = false;
341 	if ((ifp = fopen(filename, "r")) == NULL)
342 		pfatal("can't open file %s", filename);
343 	(void) unlink(TMPINNAME);
344 	if ((tifd = open(TMPINNAME, O_EXCL | O_CREAT | O_WRONLY, 0666)) < 0)
345 		pfatal("can't open file %s", TMPINNAME);
346 	while (fgets(buf, sizeof buf, ifp) != NULL) {
347 		if (revision != NULL && !found_revision && rev_in_string(buf))
348 			found_revision = true;
349 		if ((i = strlen(buf)) > maxlen)
350 			maxlen = i;	/* find longest line */
351 	}
352 	last_line_missing_eol = i > 0 && buf[i - 1] != '\n';
353 	if (last_line_missing_eol && maxlen == i)
354 		maxlen++;
355 
356 	if (revision != NULL) {
357 		if (!found_revision) {
358 			if (force) {
359 				if (verbose)
360 					say("Warning: this file doesn't appear "
361 					    "to be the %s version--patching anyway.\n",
362 					    revision);
363 			} else if (batch) {
364 				fatal("this file doesn't appear to be the "
365 				    "%s version--aborting.\n",
366 				    revision);
367 			} else {
368 				ask("This file doesn't appear to be the %s "
369 				    "version--patch anyway? [n] ",
370 				    revision);
371 				if (*buf != 'y')
372 					fatal("aborted\n");
373 			}
374 		} else if (verbose)
375 			say("Good.  This file appears to be the %s version.\n",
376 			    revision);
377 	}
378 	fseek(ifp, 0L, SEEK_SET);	/* rewind file */
379 	lines_per_buf = BUFFERSIZE / maxlen;
380 	tireclen = maxlen;
381 	tibuf[0] = malloc(BUFFERSIZE + 1);
382 	if (tibuf[0] == NULL)
383 		fatal("out of memory\n");
384 	tibuf[1] = malloc(BUFFERSIZE + 1);
385 	if (tibuf[1] == NULL)
386 		fatal("out of memory\n");
387 	for (i = 1;; i++) {
388 		p = tibuf[0] + maxlen * (i % lines_per_buf);
389 		if (i % lines_per_buf == 0)	/* new block */
390 			if (write(tifd, tibuf[0], BUFFERSIZE) < BUFFERSIZE)
391 				pfatal("can't write temp file");
392 		if (fgets(p, maxlen + 1, ifp) == NULL) {
393 			input_lines = i - 1;
394 			if (i % lines_per_buf != 0)
395 				if (write(tifd, tibuf[0], BUFFERSIZE) < BUFFERSIZE)
396 					pfatal("can't write temp file");
397 			break;
398 		}
399 		j = strlen(p);
400 		/* These are '\n' terminated strings, so no need to add a NUL */
401 		if (j == 0 || p[j - 1] != '\n')
402 			p[j] = '\n';
403 	}
404 	fclose(ifp);
405 	close(tifd);
406 	if ((tifd = open(TMPINNAME, O_RDONLY)) < 0)
407 		pfatal("can't reopen file %s", TMPINNAME);
408 }
409 
410 /*
411  * Fetch a line from the input file, \n terminated, not necessarily \0.
412  */
413 char *
414 ifetch(LINENUM line, int whichbuf)
415 {
416 	if (line < 1 || line > input_lines) {
417 		if (warn_on_invalid_line) {
418 			say("No such line %ld in input file, ignoring\n", line);
419 			warn_on_invalid_line = false;
420 		}
421 		return NULL;
422 	}
423 	if (using_plan_a)
424 		return i_ptr[line];
425 	else {
426 		LINENUM	offline = line % lines_per_buf;
427 		LINENUM	baseline = line - offline;
428 
429 		if (tiline[0] == baseline)
430 			whichbuf = 0;
431 		else if (tiline[1] == baseline)
432 			whichbuf = 1;
433 		else {
434 			tiline[whichbuf] = baseline;
435 
436 			if (lseek(tifd, (off_t) (baseline / lines_per_buf *
437 			    BUFFERSIZE), SEEK_SET) < 0)
438 				pfatal("cannot seek in the temporary input file");
439 
440 			if (read(tifd, tibuf[whichbuf], BUFFERSIZE) < 0)
441 				pfatal("error reading tmp file %s", TMPINNAME);
442 		}
443 		return tibuf[whichbuf] + (tireclen * offline);
444 	}
445 }
446 
447 /*
448  * True if the string argument contains the revision number we want.
449  */
450 static bool
451 rev_in_string(const char *string)
452 {
453 	const char	*s;
454 	size_t		patlen;
455 
456 	if (revision == NULL)
457 		return true;
458 	patlen = strlen(revision);
459 	if (strnEQ(string, revision, patlen) &&
460 	    isspace((unsigned char)string[patlen]))
461 		return true;
462 	for (s = string; *s; s++) {
463 		if (isspace((unsigned char)*s) && strnEQ(s + 1, revision, patlen) &&
464 		    isspace((unsigned char)s[patlen + 1])) {
465 			return true;
466 		}
467 	}
468 	return false;
469 }
470