xref: /netbsd-src/bin/ed/sub.c (revision a3542600fb90a091eaaa565870223a5fc9ee33e4)
/*	$NetBSD: sub.c,v 1.7 2014/03/23 05:06:42 dholland Exp $	*/

/* sub.c: This file contains the substitution routines for the ed
   line editor */
/*-
 * Copyright (c) 1993 Andrew Moore, Talke Studio.
 * All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 *
 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
 * SUCH DAMAGE.
 */

318b7ade1aSthorpej #include <sys/cdefs.h>
321357f155Salm #ifndef lint
3349f0ad86Scgd #if 0
341357f155Salm static char *rcsid = "@(#)sub.c,v 1.1 1994/02/01 00:34:44 alm Exp";
3549f0ad86Scgd #else
36*a3542600Sdholland __RCSID("$NetBSD: sub.c,v 1.7 2014/03/23 05:06:42 dholland Exp $");
3749f0ad86Scgd #endif
381357f155Salm #endif /* not lint */
391357f155Salm 
401357f155Salm #include "ed.h"
411357f155Salm 
421357f155Salm 
char *rhbuf;			/* rhs substitution (template) buffer */
int rhbufsz;			/* allocated size of rhbuf */
int rhbufi;			/* length of the template held in rhbuf */
461357f155Salm 
471357f155Salm /* extract_subst_tail: extract substitution tail from the command buffer */
481357f155Salm int
extract_subst_tail(int * flagp,long * np)49d33a7206Sxtraeme extract_subst_tail(int *flagp, long *np)
501357f155Salm {
511357f155Salm 	char delimiter;
521357f155Salm 
531357f155Salm 	*flagp = *np = 0;
541357f155Salm 	if ((delimiter = *ibufp) == '\n') {
551357f155Salm 		rhbufi = 0;
561357f155Salm 		*flagp = GPR;
571357f155Salm 		return 0;
581357f155Salm 	} else if (extract_subst_template() == NULL)
591357f155Salm 		return  ERR;
601357f155Salm 	else if (*ibufp == '\n') {
611357f155Salm 		*flagp = GPR;
621357f155Salm 		return 0;
631357f155Salm 	} else if (*ibufp == delimiter)
641357f155Salm 		ibufp++;
651357f155Salm 	if ('1' <= *ibufp && *ibufp <= '9') {
661357f155Salm 		STRTOL(*np, ibufp);
671357f155Salm 		return 0;
681357f155Salm 	} else if (*ibufp == 'g') {
691357f155Salm 		ibufp++;
701357f155Salm 		*flagp = GSG;
711357f155Salm 		return 0;
721357f155Salm 	}
731357f155Salm 	return 0;
741357f155Salm }
751357f155Salm 
761357f155Salm 
771357f155Salm /* extract_subst_template: return pointer to copy of substitution template
781357f155Salm    in the command buffer */
791357f155Salm char *
extract_subst_template(void)80d33a7206Sxtraeme extract_subst_template(void)
811357f155Salm {
821357f155Salm 	int n = 0;
831357f155Salm 	int i = 0;
841357f155Salm 	char c;
851357f155Salm 	char delimiter = *ibufp++;
861357f155Salm 
871357f155Salm 	if (*ibufp == '%' && *(ibufp + 1) == delimiter) {
881357f155Salm 		ibufp++;
89*a3542600Sdholland 		if (!rhbuf) {
90*a3542600Sdholland 			seterrmsg("no previous substitution");
91*a3542600Sdholland 		}
921357f155Salm 		return rhbuf;
931357f155Salm 	}
941357f155Salm 	while (*ibufp != delimiter) {
951357f155Salm 		REALLOC(rhbuf, rhbufsz, i + 2, NULL);
961357f155Salm 		if ((c = rhbuf[i++] = *ibufp++) == '\n' && *ibufp == '\0') {
971357f155Salm 			i--, ibufp--;
981357f155Salm 			break;
991357f155Salm 		} else if (c != '\\')
1001357f155Salm 			;
1011357f155Salm 		else if ((rhbuf[i++] = *ibufp++) != '\n')
1021357f155Salm 			;
1031357f155Salm 		else if (!isglobal) {
1041357f155Salm 			while ((n = get_tty_line()) == 0 ||
1058b7ade1aSthorpej 			    (n > 0 && ibuf[n - 1] != '\n'))
1061357f155Salm 				clearerr(stdin);
1071357f155Salm 			if (n < 0)
1081357f155Salm 				return NULL;
1091357f155Salm 		}
1101357f155Salm 	}
1111357f155Salm 	REALLOC(rhbuf, rhbufsz, i + 1, NULL);
1121357f155Salm 	rhbuf[rhbufi = i] = '\0';
1131357f155Salm 	return  rhbuf;
1141357f155Salm }
1151357f155Salm 
1161357f155Salm 
char *rbuf;			/* substitute_matching_text result buffer */
int rbufsz;			/* allocated size of rbuf */
1191357f155Salm 
1201357f155Salm /* search_and_replace: for each line in a range, change text matching a pattern
1211357f155Salm    according to a substitution template; return status  */
1221357f155Salm int
search_and_replace(pattern_t * pat,int gflag,int kth)123d33a7206Sxtraeme search_and_replace(pattern_t *pat, int gflag, int kth)
1241357f155Salm {
1251357f155Salm 	undo_t *up;
1261357f155Salm 	char *txt;
1271357f155Salm 	char *eot;
1281357f155Salm 	long lc;
1299154deaeSmycroft 	long xa = current_addr;
1301357f155Salm 	int nsubs = 0;
1311357f155Salm 	line_t *lp;
1321357f155Salm 	int len;
1331357f155Salm 
1341357f155Salm 	current_addr = first_addr - 1;
1351357f155Salm 	for (lc = 0; lc <= second_addr - first_addr; lc++) {
1361357f155Salm 		lp = get_addressed_line_node(++current_addr);
1371357f155Salm 		if ((len = substitute_matching_text(pat, lp, gflag, kth)) < 0)
1381357f155Salm 			return ERR;
1391357f155Salm 		else if (len) {
1401357f155Salm 			up = NULL;
1411357f155Salm 			if (delete_lines(current_addr, current_addr) < 0)
1421357f155Salm 				return ERR;
1431357f155Salm 			txt = rbuf;
1441357f155Salm 			eot = rbuf + len;
1451357f155Salm 			SPL1();
1461357f155Salm 			do {
1471357f155Salm 				if ((txt = put_sbuf_line(txt)) == NULL) {
1481357f155Salm 					SPL0();
1491357f155Salm 					return ERR;
1501357f155Salm 				} else if (up)
1511357f155Salm 					up->t = get_addressed_line_node(current_addr);
1521357f155Salm 				else if ((up = push_undo_stack(UADD,
1531357f155Salm 				    current_addr, current_addr)) == NULL) {
1541357f155Salm 					SPL0();
1551357f155Salm 					return ERR;
1561357f155Salm 				}
1571357f155Salm 			} while (txt != eot);
1581357f155Salm 			SPL0();
1591357f155Salm 			nsubs++;
1609154deaeSmycroft 			xa = current_addr;
1611357f155Salm 		}
1621357f155Salm 	}
1639154deaeSmycroft 	current_addr = xa;
1641357f155Salm 	if  (nsubs == 0 && !(gflag & GLB)) {
165*a3542600Sdholland 		seterrmsg("no match");
1661357f155Salm 		return ERR;
1671357f155Salm 	} else if ((gflag & (GPR | GLS | GNP)) &&
1681357f155Salm 	    display_lines(current_addr, current_addr, gflag) < 0)
1691357f155Salm 		return ERR;
1701357f155Salm 	return 0;
1711357f155Salm }
1721357f155Salm 
1731357f155Salm 
1741357f155Salm /* substitute_matching_text: replace text matched by a pattern according to
1751357f155Salm    a substitution template; return pointer to the modified text */
1761357f155Salm int
substitute_matching_text(pattern_t * pat,line_t * lp,int gflag,int kth)177d33a7206Sxtraeme substitute_matching_text(pattern_t *pat, line_t *lp, int gflag, int kth)
1781357f155Salm {
1791357f155Salm 	int off = 0;
1801357f155Salm 	int changed = 0;
1811357f155Salm 	int matchno = 0;
1821357f155Salm 	int i = 0;
1831357f155Salm 	regmatch_t rm[SE_MAX];
1841357f155Salm 	char *txt;
1851357f155Salm 	char *eot;
1861357f155Salm 
1871357f155Salm 	if ((txt = get_sbuf_line(lp)) == NULL)
1881357f155Salm 		return ERR;
1891357f155Salm 	if (isbinary)
1901357f155Salm 		NUL_TO_NEWLINE(txt, lp->len);
1911357f155Salm 	eot = txt + lp->len;
1921357f155Salm 	if (!regexec(pat, txt, SE_MAX, rm, 0)) {
1931357f155Salm 		do {
1941357f155Salm 			if (!kth || kth == ++matchno) {
1951357f155Salm 				changed++;
1961357f155Salm 				i = rm[0].rm_so;
1971357f155Salm 				REALLOC(rbuf, rbufsz, off + i, ERR);
1981357f155Salm 				if (isbinary)
1991357f155Salm 					NEWLINE_TO_NUL(txt, rm[0].rm_eo);
2001357f155Salm 				memcpy(rbuf + off, txt, i);
2011357f155Salm 				off += i;
2021357f155Salm 				if ((off = apply_subst_template(txt, rm, off,
2031357f155Salm 				    pat->re_nsub)) < 0)
2041357f155Salm 					return ERR;
2051357f155Salm 			} else {
2061357f155Salm 				i = rm[0].rm_eo;
2071357f155Salm 				REALLOC(rbuf, rbufsz, off + i, ERR);
2081357f155Salm 				if (isbinary)
2091357f155Salm 					NEWLINE_TO_NUL(txt, i);
2101357f155Salm 				memcpy(rbuf + off, txt, i);
2111357f155Salm 				off += i;
2121357f155Salm 			}
2131357f155Salm 			txt += rm[0].rm_eo;
2148b7ade1aSthorpej 		} while (*txt && (!changed || ((gflag & GSG) && rm[0].rm_eo))
2158b7ade1aSthorpej 		    && !regexec(pat, txt, SE_MAX, rm, REG_NOTBOL));
2161357f155Salm 		i = eot - txt;
2171357f155Salm 		REALLOC(rbuf, rbufsz, off + i + 2, ERR);
2181357f155Salm 		if (i > 0 && !rm[0].rm_eo && (gflag & GSG)) {
219*a3542600Sdholland 			seterrmsg("infinite substitution loop");
2201357f155Salm 			return  ERR;
2211357f155Salm 		}
2221357f155Salm 		if (isbinary)
2231357f155Salm 			NEWLINE_TO_NUL(txt, i);
2241357f155Salm 		memcpy(rbuf + off, txt, i);
2251357f155Salm 		memcpy(rbuf + off + i, "\n", 2);
2261357f155Salm 	}
2271357f155Salm 	return changed ? off + i + 1 : 0;
2281357f155Salm }
2291357f155Salm 
2301357f155Salm 
2311357f155Salm /* apply_subst_template: modify text according to a substitution template;
2321357f155Salm    return offset to end of modified text */
2331357f155Salm int
apply_subst_template(char * boln,regmatch_t * rm,int off,int re_nsub)234d33a7206Sxtraeme apply_subst_template(char *boln, regmatch_t *rm, int off, int re_nsub)
2351357f155Salm {
2361357f155Salm 	int j = 0;
2371357f155Salm 	int k = 0;
2381357f155Salm 	int n;
2391357f155Salm 	char *sub = rhbuf;
2401357f155Salm 
2411357f155Salm 	for (; sub - rhbuf < rhbufi; sub++)
2421357f155Salm 		if (*sub == '&') {
2431357f155Salm 			j = rm[0].rm_so;
2441357f155Salm 			k = rm[0].rm_eo;
2451357f155Salm 			REALLOC(rbuf, rbufsz, off + k - j, ERR);
2461357f155Salm 			while (j < k)
2471357f155Salm 				rbuf[off++] = boln[j++];
2481357f155Salm 		} else if (*sub == '\\' && '1' <= *++sub && *sub <= '9' &&
2491357f155Salm 		    (n = *sub - '0') <= re_nsub) {
2501357f155Salm 			j = rm[n].rm_so;
2511357f155Salm 			k = rm[n].rm_eo;
2521357f155Salm 			REALLOC(rbuf, rbufsz, off + k - j, ERR);
2531357f155Salm 			while (j < k)
2541357f155Salm 				rbuf[off++] = boln[j++];
2551357f155Salm 		} else {
2561357f155Salm 			REALLOC(rbuf, rbufsz, off + 1, ERR);
2571357f155Salm 			rbuf[off++] = *sub;
2581357f155Salm 		}
2591357f155Salm 	REALLOC(rbuf, rbufsz, off + 1, ERR);
2601357f155Salm 	rbuf[off] = '\0';
2611357f155Salm 	return off;
2621357f155Salm }
263