xref: /dflybsd-src/contrib/bmake/for.c (revision 9e7ae5a0527a977cab412aede3a532cfe2903bbb)
/*	$NetBSD: for.c,v 1.170 2022/09/03 00:50:07 rillig Exp $	*/

/*
 * Copyright (c) 1992, The Regents of the University of California.
 * All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 * 3. Neither the name of the University nor the names of its contributors
 *    may be used to endorse or promote products derived from this software
 *    without specific prior written permission.
 *
 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
 * SUCH DAMAGE.
 */
3101e196c8SJohn Marino 
/*
 * Handling of .for/.endfor loops in a makefile.
 *
 * For loops have the form:
 *
 *	.for <varname...> in <value...>
 *	# the body
 *	.endfor
 *
 * When a .for line is parsed, the following lines are copied to the body of
 * the .for loop, until the corresponding .endfor line is reached.  In this
 * phase, the body is not yet evaluated.  This also applies to any nested
 * .for loops.
 *
 * After reaching the .endfor, the values from the .for line are grouped
 * according to the number of variables.  For each such group, the unexpanded
 * body is scanned for variable expressions, and those that match the
 * variable names are replaced with expressions of the form ${:U...}.  After
 * that, the body is treated like a file from an .include directive.
 *
 * Interface:
 *	For_Eval	Evaluate the loop in the passed line.
 *
 *	For_Run		Run accumulated loop
 */
5701e196c8SJohn Marino 
5801e196c8SJohn Marino #include "make.h"
5901e196c8SJohn Marino 
60a34d5fb1SAntonio Huete Jimenez /*	"@(#)for.c	8.1 (Berkeley) 6/6/93"	*/
61*6eef5f0cSAntonio Huete Jimenez MAKE_RCSID("$NetBSD: for.c,v 1.170 2022/09/03 00:50:07 rillig Exp $");
6201e196c8SJohn Marino 
6301e196c8SJohn Marino 
64a34d5fb1SAntonio Huete Jimenez typedef struct ForLoop {
65*6eef5f0cSAntonio Huete Jimenez 	Vector /* of 'char *' */ vars; /* Iteration variables */
66*6eef5f0cSAntonio Huete Jimenez 	SubstringWords items;	/* Substitution items */
67a34d5fb1SAntonio Huete Jimenez 	Buffer body;		/* Unexpanded body of the loop */
68*6eef5f0cSAntonio Huete Jimenez 	unsigned int nextItem;	/* Where to continue iterating */
69a34d5fb1SAntonio Huete Jimenez } ForLoop;
70a34d5fb1SAntonio Huete Jimenez 
71a34d5fb1SAntonio Huete Jimenez 
72a34d5fb1SAntonio Huete Jimenez static ForLoop *accumFor;	/* Loop being accumulated */
7301e196c8SJohn Marino 
7401e196c8SJohn Marino 
75a34d5fb1SAntonio Huete Jimenez static ForLoop *
ForLoop_New(void)76a34d5fb1SAntonio Huete Jimenez ForLoop_New(void)
7701e196c8SJohn Marino {
78a34d5fb1SAntonio Huete Jimenez 	ForLoop *f = bmake_malloc(sizeof *f);
7901e196c8SJohn Marino 
80*6eef5f0cSAntonio Huete Jimenez 	Vector_Init(&f->vars, sizeof(char *));
81*6eef5f0cSAntonio Huete Jimenez 	SubstringWords_Init(&f->items);
82a34d5fb1SAntonio Huete Jimenez 	Buf_Init(&f->body);
83*6eef5f0cSAntonio Huete Jimenez 	f->nextItem = 0;
84a34d5fb1SAntonio Huete Jimenez 
85a34d5fb1SAntonio Huete Jimenez 	return f;
8601e196c8SJohn Marino }
8701e196c8SJohn Marino 
88*6eef5f0cSAntonio Huete Jimenez void
ForLoop_Free(ForLoop * f)89a34d5fb1SAntonio Huete Jimenez ForLoop_Free(ForLoop *f)
9001e196c8SJohn Marino {
91*6eef5f0cSAntonio Huete Jimenez 	while (f->vars.len > 0)
92*6eef5f0cSAntonio Huete Jimenez 		free(*(char **)Vector_Pop(&f->vars));
93a34d5fb1SAntonio Huete Jimenez 	Vector_Done(&f->vars);
94a34d5fb1SAntonio Huete Jimenez 
95*6eef5f0cSAntonio Huete Jimenez 	SubstringWords_Free(f->items);
96*6eef5f0cSAntonio Huete Jimenez 	Buf_Done(&f->body);
97a34d5fb1SAntonio Huete Jimenez 
98a34d5fb1SAntonio Huete Jimenez 	free(f);
9901e196c8SJohn Marino }
10001e196c8SJohn Marino 
101*6eef5f0cSAntonio Huete Jimenez char *
ForLoop_Details(ForLoop * f)102*6eef5f0cSAntonio Huete Jimenez ForLoop_Details(ForLoop *f)
103a34d5fb1SAntonio Huete Jimenez {
104*6eef5f0cSAntonio Huete Jimenez 	size_t i, n;
105*6eef5f0cSAntonio Huete Jimenez 	const char **vars;
106*6eef5f0cSAntonio Huete Jimenez 	const Substring *items;
107*6eef5f0cSAntonio Huete Jimenez 	Buffer buf;
108*6eef5f0cSAntonio Huete Jimenez 
109*6eef5f0cSAntonio Huete Jimenez 	n = f->vars.len;
110*6eef5f0cSAntonio Huete Jimenez 	vars = f->vars.items;
111*6eef5f0cSAntonio Huete Jimenez 	assert(f->nextItem >= n);
112*6eef5f0cSAntonio Huete Jimenez 	items = f->items.words + f->nextItem - n;
113*6eef5f0cSAntonio Huete Jimenez 
114*6eef5f0cSAntonio Huete Jimenez 	Buf_Init(&buf);
115*6eef5f0cSAntonio Huete Jimenez 	for (i = 0; i < n; i++) {
116*6eef5f0cSAntonio Huete Jimenez 		if (i > 0)
117*6eef5f0cSAntonio Huete Jimenez 			Buf_AddStr(&buf, ", ");
118*6eef5f0cSAntonio Huete Jimenez 		Buf_AddStr(&buf, vars[i]);
119*6eef5f0cSAntonio Huete Jimenez 		Buf_AddStr(&buf, " = ");
120*6eef5f0cSAntonio Huete Jimenez 		Buf_AddBytesBetween(&buf, items[i].start, items[i].end);
121*6eef5f0cSAntonio Huete Jimenez 	}
122*6eef5f0cSAntonio Huete Jimenez 	return Buf_DoneData(&buf);
123a34d5fb1SAntonio Huete Jimenez }
124a34d5fb1SAntonio Huete Jimenez 
125*6eef5f0cSAntonio Huete Jimenez static bool
ForLoop_ParseVarnames(ForLoop * f,const char ** pp)126a34d5fb1SAntonio Huete Jimenez ForLoop_ParseVarnames(ForLoop *f, const char **pp)
127a34d5fb1SAntonio Huete Jimenez {
128a34d5fb1SAntonio Huete Jimenez 	const char *p = *pp;
129a34d5fb1SAntonio Huete Jimenez 
130a34d5fb1SAntonio Huete Jimenez 	for (;;) {
131a34d5fb1SAntonio Huete Jimenez 		size_t len;
132a34d5fb1SAntonio Huete Jimenez 
133a34d5fb1SAntonio Huete Jimenez 		cpp_skip_whitespace(&p);
134a34d5fb1SAntonio Huete Jimenez 		if (*p == '\0') {
135a34d5fb1SAntonio Huete Jimenez 			Parse_Error(PARSE_FATAL, "missing `in' in for");
136*6eef5f0cSAntonio Huete Jimenez 			return false;
137a34d5fb1SAntonio Huete Jimenez 		}
138a34d5fb1SAntonio Huete Jimenez 
139a34d5fb1SAntonio Huete Jimenez 		/*
140a34d5fb1SAntonio Huete Jimenez 		 * XXX: This allows arbitrary variable names;
141a34d5fb1SAntonio Huete Jimenez 		 * see directive-for.mk.
142a34d5fb1SAntonio Huete Jimenez 		 */
143a34d5fb1SAntonio Huete Jimenez 		for (len = 1; p[len] != '\0' && !ch_isspace(p[len]); len++)
144a34d5fb1SAntonio Huete Jimenez 			continue;
145a34d5fb1SAntonio Huete Jimenez 
146a34d5fb1SAntonio Huete Jimenez 		if (len == 2 && p[0] == 'i' && p[1] == 'n') {
147a34d5fb1SAntonio Huete Jimenez 			p += 2;
148a34d5fb1SAntonio Huete Jimenez 			break;
149a34d5fb1SAntonio Huete Jimenez 		}
150a34d5fb1SAntonio Huete Jimenez 
151*6eef5f0cSAntonio Huete Jimenez 		*(char **)Vector_Push(&f->vars) = bmake_strldup(p, len);
152a34d5fb1SAntonio Huete Jimenez 		p += len;
153a34d5fb1SAntonio Huete Jimenez 	}
154a34d5fb1SAntonio Huete Jimenez 
155a34d5fb1SAntonio Huete Jimenez 	if (f->vars.len == 0) {
156a34d5fb1SAntonio Huete Jimenez 		Parse_Error(PARSE_FATAL, "no iteration variables in for");
157*6eef5f0cSAntonio Huete Jimenez 		return false;
158a34d5fb1SAntonio Huete Jimenez 	}
159a34d5fb1SAntonio Huete Jimenez 
160a34d5fb1SAntonio Huete Jimenez 	*pp = p;
161*6eef5f0cSAntonio Huete Jimenez 	return true;
162a34d5fb1SAntonio Huete Jimenez }
163a34d5fb1SAntonio Huete Jimenez 
164*6eef5f0cSAntonio Huete Jimenez static bool
ForLoop_ParseItems(ForLoop * f,const char * p)165a34d5fb1SAntonio Huete Jimenez ForLoop_ParseItems(ForLoop *f, const char *p)
166a34d5fb1SAntonio Huete Jimenez {
167a34d5fb1SAntonio Huete Jimenez 	char *items;
168a34d5fb1SAntonio Huete Jimenez 
169a34d5fb1SAntonio Huete Jimenez 	cpp_skip_whitespace(&p);
170a34d5fb1SAntonio Huete Jimenez 
171a34d5fb1SAntonio Huete Jimenez 	if (Var_Subst(p, SCOPE_GLOBAL, VARE_WANTRES, &items) != VPR_OK) {
172a34d5fb1SAntonio Huete Jimenez 		Parse_Error(PARSE_FATAL, "Error in .for loop items");
173*6eef5f0cSAntonio Huete Jimenez 		return false;
174a34d5fb1SAntonio Huete Jimenez 	}
175a34d5fb1SAntonio Huete Jimenez 
176*6eef5f0cSAntonio Huete Jimenez 	f->items = Substring_Words(items, false);
177a34d5fb1SAntonio Huete Jimenez 	free(items);
178a34d5fb1SAntonio Huete Jimenez 
179*6eef5f0cSAntonio Huete Jimenez 	if (f->items.len == 1 && Substring_IsEmpty(f->items.words[0]))
180a34d5fb1SAntonio Huete Jimenez 		f->items.len = 0;	/* .for var in ${:U} */
181a34d5fb1SAntonio Huete Jimenez 
182*6eef5f0cSAntonio Huete Jimenez 	if (f->items.len % f->vars.len != 0) {
183a34d5fb1SAntonio Huete Jimenez 		Parse_Error(PARSE_FATAL,
184a34d5fb1SAntonio Huete Jimenez 		    "Wrong number of words (%u) in .for "
185a34d5fb1SAntonio Huete Jimenez 		    "substitution list with %u variables",
186a34d5fb1SAntonio Huete Jimenez 		    (unsigned)f->items.len, (unsigned)f->vars.len);
187*6eef5f0cSAntonio Huete Jimenez 		return false;
188a34d5fb1SAntonio Huete Jimenez 	}
189a34d5fb1SAntonio Huete Jimenez 
190*6eef5f0cSAntonio Huete Jimenez 	return true;
191a34d5fb1SAntonio Huete Jimenez }
192a34d5fb1SAntonio Huete Jimenez 
/* Whether p starts with the word "for" followed by whitespace. */
static bool
IsFor(const char *p)
{
	return p[0] == 'f' && p[1] == 'o' && p[2] == 'r' && ch_isspace(p[3]);
}
198a34d5fb1SAntonio Huete Jimenez 
/*
 * Whether p starts with the word "endfor", followed by either whitespace
 * or the end of the string.
 */
static bool
IsEndfor(const char *p)
{
	return p[0] == 'e' && strncmp(p, "endfor", 6) == 0 &&
	       (p[6] == '\0' || ch_isspace(p[6]));
}
205a34d5fb1SAntonio Huete Jimenez 
206a34d5fb1SAntonio Huete Jimenez /*
207a34d5fb1SAntonio Huete Jimenez  * Evaluate the for loop in the passed line. The line looks like this:
208a34d5fb1SAntonio Huete Jimenez  *	.for <varname...> in <value...>
20901e196c8SJohn Marino  *
21001e196c8SJohn Marino  * Results:
211*6eef5f0cSAntonio Huete Jimenez  *	0	not a .for directive
212*6eef5f0cSAntonio Huete Jimenez  *	1	found a .for directive
213*6eef5f0cSAntonio Huete Jimenez  *	-1	erroneous .for directive
21401e196c8SJohn Marino  */
21501e196c8SJohn Marino int
For_Eval(const char * line)216a34d5fb1SAntonio Huete Jimenez For_Eval(const char *line)
21701e196c8SJohn Marino {
218a34d5fb1SAntonio Huete Jimenez 	const char *p;
219*6eef5f0cSAntonio Huete Jimenez 	ForLoop *f;
22001e196c8SJohn Marino 
221a34d5fb1SAntonio Huete Jimenez 	p = line + 1;		/* skip the '.' */
222a34d5fb1SAntonio Huete Jimenez 	cpp_skip_whitespace(&p);
22301e196c8SJohn Marino 
224*6eef5f0cSAntonio Huete Jimenez 	if (IsFor(p)) {
225a34d5fb1SAntonio Huete Jimenez 		p += 3;
22601e196c8SJohn Marino 
227a34d5fb1SAntonio Huete Jimenez 		f = ForLoop_New();
228a34d5fb1SAntonio Huete Jimenez 		if (!ForLoop_ParseVarnames(f, &p)) {
229a34d5fb1SAntonio Huete Jimenez 			ForLoop_Free(f);
23001e196c8SJohn Marino 			return -1;
23101e196c8SJohn Marino 		}
232*6eef5f0cSAntonio Huete Jimenez 		if (!ForLoop_ParseItems(f, p))
233*6eef5f0cSAntonio Huete Jimenez 			f->items.len = 0;	/* don't iterate */
23401e196c8SJohn Marino 
235a34d5fb1SAntonio Huete Jimenez 		accumFor = f;
23601e196c8SJohn Marino 		return 1;
237*6eef5f0cSAntonio Huete Jimenez 	} else if (IsEndfor(p)) {
238*6eef5f0cSAntonio Huete Jimenez 		Parse_Error(PARSE_FATAL, "for-less endfor");
239*6eef5f0cSAntonio Huete Jimenez 		return -1;
240*6eef5f0cSAntonio Huete Jimenez 	} else
241*6eef5f0cSAntonio Huete Jimenez 		return 0;
24201e196c8SJohn Marino }
24301e196c8SJohn Marino 
24401e196c8SJohn Marino /*
245a34d5fb1SAntonio Huete Jimenez  * Add another line to the .for loop that is being built up.
246*6eef5f0cSAntonio Huete Jimenez  * Returns false when the matching .endfor is reached.
24701e196c8SJohn Marino  */
248*6eef5f0cSAntonio Huete Jimenez bool
For_Accum(const char * line,int * forLevel)249*6eef5f0cSAntonio Huete Jimenez For_Accum(const char *line, int *forLevel)
25001e196c8SJohn Marino {
251a34d5fb1SAntonio Huete Jimenez 	const char *p = line;
25201e196c8SJohn Marino 
253a34d5fb1SAntonio Huete Jimenez 	if (*p == '.') {
254a34d5fb1SAntonio Huete Jimenez 		p++;
255a34d5fb1SAntonio Huete Jimenez 		cpp_skip_whitespace(&p);
25601e196c8SJohn Marino 
257a34d5fb1SAntonio Huete Jimenez 		if (IsEndfor(p)) {
258*6eef5f0cSAntonio Huete Jimenez 			DEBUG1(FOR, "For: end for %d\n", *forLevel);
259*6eef5f0cSAntonio Huete Jimenez 			if (--*forLevel == 0)
260*6eef5f0cSAntonio Huete Jimenez 				return false;
261a34d5fb1SAntonio Huete Jimenez 		} else if (IsFor(p)) {
262*6eef5f0cSAntonio Huete Jimenez 			(*forLevel)++;
263*6eef5f0cSAntonio Huete Jimenez 			DEBUG1(FOR, "For: new loop %d\n", *forLevel);
26401e196c8SJohn Marino 		}
26501e196c8SJohn Marino 	}
26601e196c8SJohn Marino 
267a34d5fb1SAntonio Huete Jimenez 	Buf_AddStr(&accumFor->body, line);
268a34d5fb1SAntonio Huete Jimenez 	Buf_AddByte(&accumFor->body, '\n');
269*6eef5f0cSAntonio Huete Jimenez 	return true;
27001e196c8SJohn Marino }
27101e196c8SJohn Marino 
/*
 * When the body of a '.for i' loop is prepared for an iteration, each
 * occurrence of $i in the body is replaced with ${:U...}, inserting the
 * value of the item.  If this item contains a '$', it may be the start of a
 * variable expression.  This expression is copied verbatim, its length is
 * determined here, in a rather naive way, ignoring escape characters and
 * funny delimiters in modifiers like ':S}from}to}'.
 *
 * s points to the character after the '$', e to the end of the item.
 *
 * Returns the number of characters after the '$' that belong to the
 * expression: 1 for a single-character variable, the length up to and
 * including the matching closing delimiter for ${...} and $(...), or 0 if
 * nothing follows the '$' or the closing delimiter is missing, in which
 * case the caller has to escape the '$'.
 */
static size_t
ExprLen(const char *s, const char *e)
{
	char expr_open, expr_close;
	int depth;
	const char *p;

	if (s == e)
		return 0;	/* just escape the '$' */

	expr_open = s[0];
	if (expr_open == '(')
		expr_close = ')';
	else if (expr_open == '{')
		expr_close = '}';
	else
		return 1;	/* Single char variable */

	/* Only delimiters of the same kind as the opening one are counted. */
	depth = 1;
	for (p = s + 1; p != e; p++) {
		if (*p == expr_open)
			depth++;
		else if (*p == expr_close && --depth == 0)
			return (size_t)(p + 1 - s);
	}

	/* Expression end not found, escape the $ */
	return 0;
}
30901e196c8SJohn Marino 
310a34d5fb1SAntonio Huete Jimenez /*
311a34d5fb1SAntonio Huete Jimenez  * The .for loop substitutes the items as ${:U<value>...}, which means
312a34d5fb1SAntonio Huete Jimenez  * that characters that break this syntax must be backslash-escaped.
313a34d5fb1SAntonio Huete Jimenez  */
314*6eef5f0cSAntonio Huete Jimenez static bool
NeedsEscapes(Substring value,char endc)315*6eef5f0cSAntonio Huete Jimenez NeedsEscapes(Substring value, char endc)
31601e196c8SJohn Marino {
317a34d5fb1SAntonio Huete Jimenez 	const char *p;
318a34d5fb1SAntonio Huete Jimenez 
319*6eef5f0cSAntonio Huete Jimenez 	for (p = value.start; p != value.end; p++) {
320*6eef5f0cSAntonio Huete Jimenez 		if (*p == ':' || *p == '$' || *p == '\\' || *p == endc ||
321*6eef5f0cSAntonio Huete Jimenez 		    *p == '\n')
322*6eef5f0cSAntonio Huete Jimenez 			return true;
323a34d5fb1SAntonio Huete Jimenez 	}
324*6eef5f0cSAntonio Huete Jimenez 	return false;
325a34d5fb1SAntonio Huete Jimenez }
326a34d5fb1SAntonio Huete Jimenez 
327a34d5fb1SAntonio Huete Jimenez /*
328a34d5fb1SAntonio Huete Jimenez  * While expanding the body of a .for loop, write the item in the ${:U...}
329*6eef5f0cSAntonio Huete Jimenez  * expression, escaping characters as needed.  The result is later unescaped
330*6eef5f0cSAntonio Huete Jimenez  * by ApplyModifier_Defined.
331a34d5fb1SAntonio Huete Jimenez  */
332a34d5fb1SAntonio Huete Jimenez static void
AddEscaped(Buffer * cmds,Substring item,char endc)333*6eef5f0cSAntonio Huete Jimenez AddEscaped(Buffer *cmds, Substring item, char endc)
334a34d5fb1SAntonio Huete Jimenez {
335*6eef5f0cSAntonio Huete Jimenez 	const char *p;
33601e196c8SJohn Marino 	char ch;
33701e196c8SJohn Marino 
338a34d5fb1SAntonio Huete Jimenez 	if (!NeedsEscapes(item, endc)) {
339*6eef5f0cSAntonio Huete Jimenez 		Buf_AddBytesBetween(cmds, item.start, item.end);
34001e196c8SJohn Marino 		return;
34101e196c8SJohn Marino 	}
34201e196c8SJohn Marino 
343*6eef5f0cSAntonio Huete Jimenez 	for (p = item.start; p != item.end;) {
344*6eef5f0cSAntonio Huete Jimenez 		ch = *p;
34501e196c8SJohn Marino 		if (ch == '$') {
346*6eef5f0cSAntonio Huete Jimenez 			size_t len = ExprLen(p + 1, item.end);
34701e196c8SJohn Marino 			if (len != 0) {
348*6eef5f0cSAntonio Huete Jimenez 				/*
349*6eef5f0cSAntonio Huete Jimenez 				 * XXX: Should a '\' be added here?
350*6eef5f0cSAntonio Huete Jimenez 				 * See directive-for-escape.mk, ExprLen.
351*6eef5f0cSAntonio Huete Jimenez 				 */
352*6eef5f0cSAntonio Huete Jimenez 				Buf_AddBytes(cmds, p, 1 + len);
353*6eef5f0cSAntonio Huete Jimenez 				p += 1 + len;
35401e196c8SJohn Marino 				continue;
35501e196c8SJohn Marino 			}
35601e196c8SJohn Marino 			Buf_AddByte(cmds, '\\');
357a34d5fb1SAntonio Huete Jimenez 		} else if (ch == ':' || ch == '\\' || ch == endc)
35801e196c8SJohn Marino 			Buf_AddByte(cmds, '\\');
359*6eef5f0cSAntonio Huete Jimenez 		else if (ch == '\n') {
360*6eef5f0cSAntonio Huete Jimenez 			Parse_Error(PARSE_FATAL, "newline in .for value");
361*6eef5f0cSAntonio Huete Jimenez 			ch = ' ';	/* prevent newline injection */
362*6eef5f0cSAntonio Huete Jimenez 		}
36301e196c8SJohn Marino 		Buf_AddByte(cmds, ch);
364*6eef5f0cSAntonio Huete Jimenez 		p++;
36501e196c8SJohn Marino 	}
36601e196c8SJohn Marino }
36701e196c8SJohn Marino 
368a34d5fb1SAntonio Huete Jimenez /*
369*6eef5f0cSAntonio Huete Jimenez  * When expanding the body of a .for loop, replace the variable name of an
370a34d5fb1SAntonio Huete Jimenez  * expression like ${i} or ${i:...} or $(i) or $(i:...) with ":Uvalue".
371a34d5fb1SAntonio Huete Jimenez  */
372a34d5fb1SAntonio Huete Jimenez static void
ForLoop_SubstVarLong(ForLoop * f,unsigned int firstItem,Buffer * body,const char ** pp,char endc,const char ** inout_mark)373*6eef5f0cSAntonio Huete Jimenez ForLoop_SubstVarLong(ForLoop *f, unsigned int firstItem, Buffer *body,
374*6eef5f0cSAntonio Huete Jimenez 		     const char **pp, char endc, const char **inout_mark)
37501e196c8SJohn Marino {
376a34d5fb1SAntonio Huete Jimenez 	size_t i;
377*6eef5f0cSAntonio Huete Jimenez 	const char *start = *pp;
378*6eef5f0cSAntonio Huete Jimenez 	const char **vars = Vector_Get(&f->vars, 0);
37901e196c8SJohn Marino 
380a34d5fb1SAntonio Huete Jimenez 	for (i = 0; i < f->vars.len; i++) {
381*6eef5f0cSAntonio Huete Jimenez 		const char *p = start;
382a34d5fb1SAntonio Huete Jimenez 
383*6eef5f0cSAntonio Huete Jimenez 		if (!cpp_skip_string(&p, vars[i]))
384a34d5fb1SAntonio Huete Jimenez 			continue;
385a34d5fb1SAntonio Huete Jimenez 		/* XXX: why test for backslash here? */
386*6eef5f0cSAntonio Huete Jimenez 		if (*p != ':' && *p != endc && *p != '\\')
387a34d5fb1SAntonio Huete Jimenez 			continue;
388a34d5fb1SAntonio Huete Jimenez 
389a34d5fb1SAntonio Huete Jimenez 		/*
390a34d5fb1SAntonio Huete Jimenez 		 * Found a variable match.  Skip over the variable name and
391a34d5fb1SAntonio Huete Jimenez 		 * instead add ':U<value>' to the current body.
392a34d5fb1SAntonio Huete Jimenez 		 */
393*6eef5f0cSAntonio Huete Jimenez 		Buf_AddBytesBetween(body, *inout_mark, start);
394*6eef5f0cSAntonio Huete Jimenez 		Buf_AddStr(body, ":U");
395*6eef5f0cSAntonio Huete Jimenez 		AddEscaped(body, f->items.words[firstItem + i], endc);
396a34d5fb1SAntonio Huete Jimenez 
397a34d5fb1SAntonio Huete Jimenez 		*inout_mark = p;
398a34d5fb1SAntonio Huete Jimenez 		*pp = p;
399a34d5fb1SAntonio Huete Jimenez 		return;
400a34d5fb1SAntonio Huete Jimenez 	}
401a34d5fb1SAntonio Huete Jimenez }
402a34d5fb1SAntonio Huete Jimenez 
403a34d5fb1SAntonio Huete Jimenez /*
404*6eef5f0cSAntonio Huete Jimenez  * When expanding the body of a .for loop, replace single-character
405a34d5fb1SAntonio Huete Jimenez  * variable expressions like $i with their ${:U...} expansion.
406a34d5fb1SAntonio Huete Jimenez  */
407a34d5fb1SAntonio Huete Jimenez static void
ForLoop_SubstVarShort(ForLoop * f,unsigned int firstItem,Buffer * body,const char * p,const char ** inout_mark)408*6eef5f0cSAntonio Huete Jimenez ForLoop_SubstVarShort(ForLoop *f, unsigned int firstItem, Buffer *body,
409*6eef5f0cSAntonio Huete Jimenez 		      const char *p, const char **inout_mark)
410a34d5fb1SAntonio Huete Jimenez {
411a34d5fb1SAntonio Huete Jimenez 	const char ch = *p;
412*6eef5f0cSAntonio Huete Jimenez 	const char **vars;
413a34d5fb1SAntonio Huete Jimenez 	size_t i;
414a34d5fb1SAntonio Huete Jimenez 
415a34d5fb1SAntonio Huete Jimenez 	/* Skip $$ and stupid ones. */
416*6eef5f0cSAntonio Huete Jimenez 	if (ch == '}' || ch == ')' || ch == ':' || ch == '$')
417a34d5fb1SAntonio Huete Jimenez 		return;
418a34d5fb1SAntonio Huete Jimenez 
419a34d5fb1SAntonio Huete Jimenez 	vars = Vector_Get(&f->vars, 0);
420a34d5fb1SAntonio Huete Jimenez 	for (i = 0; i < f->vars.len; i++) {
421*6eef5f0cSAntonio Huete Jimenez 		const char *varname = vars[i];
422a34d5fb1SAntonio Huete Jimenez 		if (varname[0] == ch && varname[1] == '\0')
423a34d5fb1SAntonio Huete Jimenez 			goto found;
424a34d5fb1SAntonio Huete Jimenez 	}
425a34d5fb1SAntonio Huete Jimenez 	return;
426a34d5fb1SAntonio Huete Jimenez 
427a34d5fb1SAntonio Huete Jimenez found:
428*6eef5f0cSAntonio Huete Jimenez 	Buf_AddBytesBetween(body, *inout_mark, p);
429*6eef5f0cSAntonio Huete Jimenez 	*inout_mark = p + 1;
430*6eef5f0cSAntonio Huete Jimenez 
431a34d5fb1SAntonio Huete Jimenez 	/* Replace $<ch> with ${:U<value>} */
432*6eef5f0cSAntonio Huete Jimenez 	Buf_AddStr(body, "{:U");
433*6eef5f0cSAntonio Huete Jimenez 	AddEscaped(body, f->items.words[firstItem + i], '}');
434*6eef5f0cSAntonio Huete Jimenez 	Buf_AddByte(body, '}');
435a34d5fb1SAntonio Huete Jimenez }
436a34d5fb1SAntonio Huete Jimenez 
437a34d5fb1SAntonio Huete Jimenez /*
438a34d5fb1SAntonio Huete Jimenez  * Compute the body for the current iteration by copying the unexpanded body,
439a34d5fb1SAntonio Huete Jimenez  * replacing the expressions for the iteration variables on the way.
440a34d5fb1SAntonio Huete Jimenez  *
441a34d5fb1SAntonio Huete Jimenez  * Using variable expressions ensures that the .for loop can't generate
442a34d5fb1SAntonio Huete Jimenez  * syntax, and that the later parsing will still see a variable.
443a34d5fb1SAntonio Huete Jimenez  * This code assumes that the variable with the empty name will never be
444a34d5fb1SAntonio Huete Jimenez  * defined, see unit-tests/varname-empty.mk for more details.
445a34d5fb1SAntonio Huete Jimenez  *
446a34d5fb1SAntonio Huete Jimenez  * The detection of substitutions of the loop control variables is naive.
447*6eef5f0cSAntonio Huete Jimenez  * Many of the modifiers use '\$' instead of '$$' to escape '$', so it is
448*6eef5f0cSAntonio Huete Jimenez  * possible to contrive a makefile where an unwanted substitution happens.
449a34d5fb1SAntonio Huete Jimenez  */
450a34d5fb1SAntonio Huete Jimenez static void
ForLoop_SubstBody(ForLoop * f,unsigned int firstItem,Buffer * body)451*6eef5f0cSAntonio Huete Jimenez ForLoop_SubstBody(ForLoop *f, unsigned int firstItem, Buffer *body)
452a34d5fb1SAntonio Huete Jimenez {
453*6eef5f0cSAntonio Huete Jimenez 	const char *p, *end;
454*6eef5f0cSAntonio Huete Jimenez 	const char *mark;	/* where the last substitution left off */
455a34d5fb1SAntonio Huete Jimenez 
456*6eef5f0cSAntonio Huete Jimenez 	Buf_Clear(body);
457a34d5fb1SAntonio Huete Jimenez 
458a34d5fb1SAntonio Huete Jimenez 	mark = f->body.data;
459*6eef5f0cSAntonio Huete Jimenez 	end = f->body.data + f->body.len;
460a34d5fb1SAntonio Huete Jimenez 	for (p = mark; (p = strchr(p, '$')) != NULL;) {
461a34d5fb1SAntonio Huete Jimenez 		if (p[1] == '{' || p[1] == '(') {
462*6eef5f0cSAntonio Huete Jimenez 			char endc = p[1] == '{' ? '}' : ')';
463a34d5fb1SAntonio Huete Jimenez 			p += 2;
464*6eef5f0cSAntonio Huete Jimenez 			ForLoop_SubstVarLong(f, firstItem, body,
465*6eef5f0cSAntonio Huete Jimenez 			    &p, endc, &mark);
466a34d5fb1SAntonio Huete Jimenez 		} else if (p[1] != '\0') {
467*6eef5f0cSAntonio Huete Jimenez 			ForLoop_SubstVarShort(f, firstItem, body,
468*6eef5f0cSAntonio Huete Jimenez 			    p + 1, &mark);
469a34d5fb1SAntonio Huete Jimenez 			p += 2;
470a34d5fb1SAntonio Huete Jimenez 		} else
471a34d5fb1SAntonio Huete Jimenez 			break;
472a34d5fb1SAntonio Huete Jimenez 	}
473a34d5fb1SAntonio Huete Jimenez 
474*6eef5f0cSAntonio Huete Jimenez 	Buf_AddBytesBetween(body, mark, end);
475a34d5fb1SAntonio Huete Jimenez }
476a34d5fb1SAntonio Huete Jimenez 
477a34d5fb1SAntonio Huete Jimenez /*
478a34d5fb1SAntonio Huete Jimenez  * Compute the body for the current iteration by copying the unexpanded body,
479a34d5fb1SAntonio Huete Jimenez  * replacing the expressions for the iteration variables on the way.
480a34d5fb1SAntonio Huete Jimenez  */
481*6eef5f0cSAntonio Huete Jimenez bool
For_NextIteration(ForLoop * f,Buffer * body)482*6eef5f0cSAntonio Huete Jimenez For_NextIteration(ForLoop *f, Buffer *body)
483a34d5fb1SAntonio Huete Jimenez {
484*6eef5f0cSAntonio Huete Jimenez 	if (f->nextItem == f->items.len)
485*6eef5f0cSAntonio Huete Jimenez 		return false;
486a34d5fb1SAntonio Huete Jimenez 
487*6eef5f0cSAntonio Huete Jimenez 	f->nextItem += (unsigned int)f->vars.len;
488*6eef5f0cSAntonio Huete Jimenez 	ForLoop_SubstBody(f, f->nextItem - (unsigned int)f->vars.len, body);
489*6eef5f0cSAntonio Huete Jimenez 	DEBUG1(FOR, "For: loop body:\n%s", body->data);
490*6eef5f0cSAntonio Huete Jimenez 	return true;
49101e196c8SJohn Marino }
49201e196c8SJohn Marino 
493*6eef5f0cSAntonio Huete Jimenez /* Break out of the .for loop. */
494*6eef5f0cSAntonio Huete Jimenez void
For_Break(ForLoop * f)495*6eef5f0cSAntonio Huete Jimenez For_Break(ForLoop *f)
496*6eef5f0cSAntonio Huete Jimenez {
497*6eef5f0cSAntonio Huete Jimenez 	f->nextItem = (unsigned int)f->items.len;
49801e196c8SJohn Marino }
49901e196c8SJohn Marino 
500a34d5fb1SAntonio Huete Jimenez /* Run the .for loop, imitating the actions of an include file. */
50101e196c8SJohn Marino void
For_Run(unsigned headLineno,unsigned bodyReadLines)502*6eef5f0cSAntonio Huete Jimenez For_Run(unsigned headLineno, unsigned bodyReadLines)
50301e196c8SJohn Marino {
504*6eef5f0cSAntonio Huete Jimenez 	Buffer buf;
505a34d5fb1SAntonio Huete Jimenez 	ForLoop *f = accumFor;
50601e196c8SJohn Marino 	accumFor = NULL;
50701e196c8SJohn Marino 
508*6eef5f0cSAntonio Huete Jimenez 	if (f->items.len > 0) {
509*6eef5f0cSAntonio Huete Jimenez 		Buf_Init(&buf);
510*6eef5f0cSAntonio Huete Jimenez 		Parse_PushInput(NULL, headLineno, bodyReadLines, buf, f);
511*6eef5f0cSAntonio Huete Jimenez 	} else
512a34d5fb1SAntonio Huete Jimenez 		ForLoop_Free(f);
51301e196c8SJohn Marino }
514