xref: /netbsd-src/external/cddl/osnet/dist/tools/ctf/cvt/stabs.c (revision ba2539a9805a0544ff82c0003cc02fe1eee5603d)
1a864dc36Sdarran /*
2a864dc36Sdarran  * CDDL HEADER START
3a864dc36Sdarran  *
4a864dc36Sdarran  * The contents of this file are subject to the terms of the
5a864dc36Sdarran  * Common Development and Distribution License (the "License").
6a864dc36Sdarran  * You may not use this file except in compliance with the License.
7a864dc36Sdarran  *
8a864dc36Sdarran  * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
9a864dc36Sdarran  * or http://www.opensolaris.org/os/licensing.
10a864dc36Sdarran  * See the License for the specific language governing permissions
11a864dc36Sdarran  * and limitations under the License.
12a864dc36Sdarran  *
13a864dc36Sdarran  * When distributing Covered Code, include this CDDL HEADER in each
14a864dc36Sdarran  * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
15a864dc36Sdarran  * If applicable, add the following below this CDDL HEADER, with the
16a864dc36Sdarran  * fields enclosed by brackets "[]" replaced with your own identifying
17a864dc36Sdarran  * information: Portions Copyright [yyyy] [name of copyright owner]
18a864dc36Sdarran  *
19a864dc36Sdarran  * CDDL HEADER END
20a864dc36Sdarran  */
21a864dc36Sdarran /*
22a864dc36Sdarran  * Copyright 2006 Sun Microsystems, Inc.  All rights reserved.
23a864dc36Sdarran  * Use is subject to license terms.
24a864dc36Sdarran  */
25a864dc36Sdarran 
26a864dc36Sdarran #pragma ident	"%Z%%M%	%I%	%E% SMI"
27a864dc36Sdarran 
28a864dc36Sdarran /*
29a864dc36Sdarran  * Routines used to read stabs data from a file, and to build a tdata structure
30a864dc36Sdarran  * based on the interesting parts of that data.
31a864dc36Sdarran  */
32a864dc36Sdarran 
3389300bd9Sdarran #if HAVE_NBTOOL_CONFIG_H
3489300bd9Sdarran # include "nbtool_config.h"
3589300bd9Sdarran #endif
3689300bd9Sdarran 
37a864dc36Sdarran #include <stdio.h>
38a864dc36Sdarran #include <stdlib.h>
39a864dc36Sdarran #include <fcntl.h>
40a864dc36Sdarran #include <unistd.h>
41a864dc36Sdarran #include <assert.h>
42a864dc36Sdarran #include <string.h>
43a864dc36Sdarran #include <libgen.h>
44a864dc36Sdarran #include <errno.h>
45a864dc36Sdarran #include <sys/types.h>
46a864dc36Sdarran #include <sys/param.h>
47a864dc36Sdarran 
48a864dc36Sdarran #include "ctftools.h"
49a864dc36Sdarran #include "list.h"
50a864dc36Sdarran #include "stack.h"
51a864dc36Sdarran #include "memory.h"
52a864dc36Sdarran #include "traverse.h"
53a864dc36Sdarran 
54bb8023b5Sdarran char *curhdr;
55a864dc36Sdarran 
56a864dc36Sdarran /*
57a864dc36Sdarran  * The stabs generator will sometimes reference types before they've been
58a864dc36Sdarran  * defined.  If this is the case, a TYPEDEF_UNRES tdesc will be generated.
59a864dc36Sdarran  * Note that this is different from a forward declaration, in which the
60a864dc36Sdarran  * stab is defined, but is defined as something that doesn't exist yet.
61a864dc36Sdarran  * When we have read all of the stabs from the file, we can go back and
62a864dc36Sdarran  * fix up all of the unresolved types.  We should be able to fix all of them.
63a864dc36Sdarran  */
64a864dc36Sdarran /*ARGSUSED2*/
65a864dc36Sdarran static int
resolve_tou_node(tdesc_t * node,tdesc_t ** nodep,void * private __unused)66bb8023b5Sdarran resolve_tou_node(tdesc_t *node, tdesc_t **nodep, void *private __unused)
67a864dc36Sdarran {
68a864dc36Sdarran 	tdesc_t *new;
69a864dc36Sdarran 
70a864dc36Sdarran 	debug(3, "Trying to resolve %s (%d)\n", tdesc_name(node), node->t_id);
71a864dc36Sdarran 	new = lookup(node->t_id);
72a864dc36Sdarran 
73a864dc36Sdarran 	if (new == NULL) {
74a864dc36Sdarran 		terminate("Couldn't resolve type %d\n", node->t_id);
75a864dc36Sdarran 	}
76a864dc36Sdarran 
77a864dc36Sdarran 	debug(3, " Resolving to %d\n", new->t_id);
78a864dc36Sdarran 
79a864dc36Sdarran 	*nodep = new;
80a864dc36Sdarran 
81a864dc36Sdarran 	return (1);
82a864dc36Sdarran }
83a864dc36Sdarran 
84a864dc36Sdarran /*ARGSUSED*/
85a864dc36Sdarran static int
resolve_fwd_node(tdesc_t * node,tdesc_t ** nodep,void * private __unused)86bb8023b5Sdarran resolve_fwd_node(tdesc_t *node, tdesc_t **nodep, void *private __unused)
87a864dc36Sdarran {
88a864dc36Sdarran 	tdesc_t *new = lookupname(node->t_name);
89a864dc36Sdarran 
90a864dc36Sdarran 	debug(3, "Trying to unforward %s (%d)\n", tdesc_name(node), node->t_id);
91a864dc36Sdarran 
92a864dc36Sdarran 	if (!new || (new->t_type != STRUCT && new->t_type != UNION))
93a864dc36Sdarran 		return (0);
94a864dc36Sdarran 
95a864dc36Sdarran 	debug(3, " Unforwarded to %d\n", new->t_id);
96a864dc36Sdarran 
97a864dc36Sdarran 	*nodep = new;
98a864dc36Sdarran 
99a864dc36Sdarran 	return (1);
100a864dc36Sdarran }
101a864dc36Sdarran 
102a864dc36Sdarran static tdtrav_cb_f resolve_cbs[] = {
103a864dc36Sdarran 	NULL,
104a864dc36Sdarran 	NULL,			/* intrinsic */
105a864dc36Sdarran 	NULL,			/* pointer */
106a864dc36Sdarran 	NULL,			/* array */
107a864dc36Sdarran 	NULL,			/* function */
108a864dc36Sdarran 	NULL,			/* struct */
109a864dc36Sdarran 	NULL,			/* union */
110a864dc36Sdarran 	NULL,			/* enum */
111a864dc36Sdarran 	resolve_fwd_node,	/* forward */
112a864dc36Sdarran 	NULL,			/* typedef */
113a864dc36Sdarran 	resolve_tou_node,	/* typedef unres */
114a864dc36Sdarran 	NULL,			/* volatile */
115a864dc36Sdarran 	NULL,			/* const */
116a864dc36Sdarran 	NULL,			/* restrict */
117a864dc36Sdarran };
118a864dc36Sdarran 
119a864dc36Sdarran static void
resolve_nodes(tdata_t * td)120a864dc36Sdarran resolve_nodes(tdata_t *td)
121a864dc36Sdarran {
122a864dc36Sdarran 	debug(2, "Resolving unresolved stabs\n");
123a864dc36Sdarran 
124a864dc36Sdarran 	(void) iitraverse_hash(td->td_iihash, &td->td_curvgen, resolve_cbs,
125a864dc36Sdarran 	    NULL, NULL, td);
126a864dc36Sdarran }
127a864dc36Sdarran 
128a864dc36Sdarran static char *
concat(char * s1,char * s2,int s2strip)129a864dc36Sdarran concat(char *s1, char *s2, int s2strip)
130a864dc36Sdarran {
131a864dc36Sdarran 	int savelen = strlen(s2) - s2strip;
132a864dc36Sdarran 	int newlen = (s1 ? strlen(s1) : 0) + savelen + 1;
133a864dc36Sdarran 	char *out;
134a864dc36Sdarran 
135a864dc36Sdarran 	out = xrealloc(s1, newlen);
136a864dc36Sdarran 	if (s1)
137a864dc36Sdarran 		strncpy(out + strlen(out), s2, savelen);
138a864dc36Sdarran 	else
139a864dc36Sdarran 		strncpy(out, s2, savelen);
140a864dc36Sdarran 
141a864dc36Sdarran 	out[newlen - 1] = '\0';
142a864dc36Sdarran 
143a864dc36Sdarran 	return (out);
144a864dc36Sdarran }
145a864dc36Sdarran 
146a864dc36Sdarran /*
147a864dc36Sdarran  * N_FUN stabs come with their arguments in promoted form.  In order to get the
148a864dc36Sdarran  * actual arguments, we need to wait for the N_PSYM stabs that will come towards
149a864dc36Sdarran  * the end of the function.  These routines free the arguments (fnarg_free) we
150a864dc36Sdarran  * got from the N_FUN stab and add (fnarg_add) the ones from the N_PSYM stabs.
151a864dc36Sdarran  */
152a864dc36Sdarran static void
fnarg_add(iidesc_t * curfun,iidesc_t * arg)153a864dc36Sdarran fnarg_add(iidesc_t *curfun, iidesc_t *arg)
154a864dc36Sdarran {
155a864dc36Sdarran 	curfun->ii_nargs++;
156a864dc36Sdarran 
157a864dc36Sdarran 	if (curfun->ii_nargs == 1)
158a864dc36Sdarran 		curfun->ii_args = xmalloc(sizeof (tdesc_t *) * FUNCARG_DEF);
159a864dc36Sdarran 	else if (curfun->ii_nargs > FUNCARG_DEF) {
160a864dc36Sdarran 		curfun->ii_args = xrealloc(curfun->ii_args,
161a864dc36Sdarran 		    sizeof (tdesc_t *) * curfun->ii_nargs);
162a864dc36Sdarran 	}
163a864dc36Sdarran 
164a864dc36Sdarran 	curfun->ii_args[curfun->ii_nargs - 1] = arg->ii_dtype;
165a864dc36Sdarran 	arg->ii_dtype = NULL;
166a864dc36Sdarran }
167a864dc36Sdarran 
168a864dc36Sdarran static void
fnarg_free(iidesc_t * ii)169a864dc36Sdarran fnarg_free(iidesc_t *ii)
170a864dc36Sdarran {
171a864dc36Sdarran 	ii->ii_nargs = 0;
172a864dc36Sdarran 	free(ii->ii_args);
173a864dc36Sdarran 	ii->ii_args = NULL;
174a864dc36Sdarran }
175a864dc36Sdarran 
176a864dc36Sdarran /*
177a864dc36Sdarran  * Read the stabs from the stab ELF section, and turn them into a tdesc tree,
178a864dc36Sdarran  * assembled under an iidesc list.
179a864dc36Sdarran  */
180a864dc36Sdarran int
stabs_read(tdata_t * td,Elf * elf,char * file)181bb8023b5Sdarran stabs_read(tdata_t *td, Elf *elf, char *file)
182a864dc36Sdarran {
183a864dc36Sdarran 	Elf_Scn *scn;
184a864dc36Sdarran 	Elf_Data *data;
185a864dc36Sdarran 	stab_t *stab;
186a864dc36Sdarran 	stk_t *file_stack;
187a864dc36Sdarran 	iidesc_t *iidescp;
188a864dc36Sdarran 	iidesc_t *curfun = NULL;
189a864dc36Sdarran 	char curpath[MAXPATHLEN];
190a864dc36Sdarran 	char *curfile = NULL;
191a864dc36Sdarran 	char *str;
192a864dc36Sdarran 	char *fstr = NULL, *ofstr = NULL;
193*ba2539a9Schs 	int stabidx, stabstridx;
194a864dc36Sdarran 	int nstabs, rc, i;
195a864dc36Sdarran 	int scope = 0;
196a864dc36Sdarran 
197a864dc36Sdarran 	if (!((stabidx = findelfsecidx(elf, file, ".stab.excl")) >= 0 &&
198a864dc36Sdarran 	    (stabstridx = findelfsecidx(elf, file, ".stab.exclstr")) >= 0) &&
199a864dc36Sdarran 	    !((stabidx = findelfsecidx(elf, file, ".stab")) >= 0 &&
200a864dc36Sdarran 	    (stabstridx = findelfsecidx(elf, file, ".stabstr")) >= 0)) {
201a864dc36Sdarran 		errno = ENOENT;
202a864dc36Sdarran 		return (-1);
203a864dc36Sdarran 	}
204a864dc36Sdarran 
205a864dc36Sdarran 	file_stack = stack_new(free);
206a864dc36Sdarran 
207bb8023b5Sdarran 	stack_push(file_stack, file);
208a864dc36Sdarran 	curhdr = file;
209a864dc36Sdarran 
210a864dc36Sdarran 	debug(3, "Found stabs in %d, strings in %d\n", stabidx, stabstridx);
211a864dc36Sdarran 
212a864dc36Sdarran 	scn = elf_getscn(elf, stabidx);
213a864dc36Sdarran 	data = elf_rawdata(scn, NULL);
214a864dc36Sdarran 	nstabs = data->d_size / sizeof (stab_t);
215a864dc36Sdarran 
216a864dc36Sdarran 	parse_init(td);
217a864dc36Sdarran 	for (i = 0; i < nstabs; i++) {
218a864dc36Sdarran 		stab = &((stab_t *)data->d_buf)[i];
219a864dc36Sdarran 
220a864dc36Sdarran 		/* We don't want any local definitions */
221a864dc36Sdarran 		if (stab->n_type == N_LBRAC) {
222a864dc36Sdarran 			scope++;
223a864dc36Sdarran 			debug(3, "stab %d: opening scope (%d)\n", i + 1, scope);
224a864dc36Sdarran 			continue;
225a864dc36Sdarran 		} else if (stab->n_type == N_RBRAC) {
226a864dc36Sdarran 			scope--;
227a864dc36Sdarran 			debug(3, "stab %d: closing scope (%d)\n", i + 1, scope);
228a864dc36Sdarran 			continue;
229a864dc36Sdarran 		} else if (stab->n_type == N_EINCL) {
230a864dc36Sdarran 			/*
231a864dc36Sdarran 			 * There's a bug in the 5.2 (Taz) compilers that causes
232a864dc36Sdarran 			 * them to emit an extra N_EINCL if there's no actual
233a864dc36Sdarran 			 * text in the file being compiled.  To work around this
234a864dc36Sdarran 			 * bug, we explicitly check to make sure we're not
235a864dc36Sdarran 			 * trying to pop a stack that only has the outer scope
236a864dc36Sdarran 			 * on it.
237a864dc36Sdarran 			 */
238a864dc36Sdarran 			if (stack_level(file_stack) != 1) {
239a864dc36Sdarran 				str = (char *)stack_pop(file_stack);
240a864dc36Sdarran 				free(str);
241a864dc36Sdarran 				curhdr = (char *)stack_peek(file_stack);
242a864dc36Sdarran 			}
243a864dc36Sdarran 		}
244a864dc36Sdarran 
245a864dc36Sdarran 		/* We only care about a subset of the stabs */
246a864dc36Sdarran 		if (!(stab->n_type == N_FUN || stab->n_type == N_GSYM ||
247a864dc36Sdarran 		    stab->n_type == N_LCSYM || stab->n_type == N_LSYM ||
248a864dc36Sdarran 		    stab->n_type == N_PSYM || stab->n_type == N_ROSYM ||
249a864dc36Sdarran 		    stab->n_type == N_RSYM ||
250a864dc36Sdarran 		    stab->n_type == N_STSYM || stab->n_type == N_BINCL ||
251a864dc36Sdarran 		    stab->n_type == N_SO || stab->n_type == N_OPT))
252a864dc36Sdarran 			continue;
253a864dc36Sdarran 
254a864dc36Sdarran 		if ((str = elf_strptr(elf, stabstridx,
255a864dc36Sdarran 		    (size_t)stab->n_strx)) == NULL) {
256a864dc36Sdarran 			terminate("%s: Can't find string at %u for stab %d\n",
257a864dc36Sdarran 			    file, stab->n_strx, i);
258a864dc36Sdarran 		}
259a864dc36Sdarran 
260a864dc36Sdarran 		if (stab->n_type == N_BINCL) {
261a864dc36Sdarran 			curhdr = xstrdup(str);
262bb8023b5Sdarran 			stack_push(file_stack, curhdr);
263a864dc36Sdarran 			continue;
264a864dc36Sdarran 		} else if (stab->n_type == N_SO) {
265a864dc36Sdarran 			if (str[strlen(str) - 1] != '/') {
266a864dc36Sdarran 				strcpy(curpath, str);
267a864dc36Sdarran 				curfile = basename(curpath);
268a864dc36Sdarran 			}
269a864dc36Sdarran 			continue;
270a864dc36Sdarran 		} else if (stab->n_type == N_OPT) {
271a864dc36Sdarran 			if (strcmp(str, "gcc2_compiled.") == 0) {
272a864dc36Sdarran 				terminate("%s: GCC-generated stabs are "
273a864dc36Sdarran 				    "unsupported. Use DWARF instead.\n", file);
274a864dc36Sdarran 			}
275a864dc36Sdarran 			continue;
276a864dc36Sdarran 		}
277a864dc36Sdarran 
278a864dc36Sdarran 		if (str[strlen(str) - 1] == '\\') {
279a864dc36Sdarran 			int offset = 1;
280a864dc36Sdarran 			/*
281a864dc36Sdarran 			 * There's a bug in the compilers that causes them to
282a864dc36Sdarran 			 * generate \ for continuations with just -g (this is
283a864dc36Sdarran 			 * ok), and \\ for continuations with -g -O (this is
284a864dc36Sdarran 			 * broken).  This bug is "fixed" in the 6.2 compilers
285a864dc36Sdarran 			 * via the elimination of continuation stabs.
286a864dc36Sdarran 			 */
287a864dc36Sdarran 			if (str[strlen(str) - 2] == '\\')
288a864dc36Sdarran 				offset = 2;
289a864dc36Sdarran 			fstr = concat(fstr, str, offset);
290a864dc36Sdarran 			continue;
291a864dc36Sdarran 		} else
292a864dc36Sdarran 			fstr = concat(fstr, str, 0);
293a864dc36Sdarran 
294a864dc36Sdarran 		debug(3, "%4d: .stabs \"%s\", %#x, %d, %hd, %d (from %s)\n", i,
295a864dc36Sdarran 		    fstr, stab->n_type, 0, stab->n_desc,
296a864dc36Sdarran 		    stab->n_value, curhdr);
297a864dc36Sdarran 
298a864dc36Sdarran 		if (debug_level >= 3)
299a864dc36Sdarran 			check_hash();
300a864dc36Sdarran 
301a864dc36Sdarran 		/*
302a864dc36Sdarran 		 * Sometimes the compiler stutters, and emits the same stab
303a864dc36Sdarran 		 * twice.  This is bad for the parser, which will attempt to
304a864dc36Sdarran 		 * redefine the type IDs indicated in the stabs.  This is
305a864dc36Sdarran 		 * compiler bug 4433511.
306a864dc36Sdarran 		 */
307a864dc36Sdarran 		if (ofstr && strcmp(fstr, ofstr) == 0) {
308a864dc36Sdarran 			debug(3, "Stutter stab\n");
309a864dc36Sdarran 			free(fstr);
310a864dc36Sdarran 			fstr = NULL;
311a864dc36Sdarran 			continue;
312a864dc36Sdarran 		}
313a864dc36Sdarran 
314a864dc36Sdarran 		if (ofstr)
315a864dc36Sdarran 			free(ofstr);
316a864dc36Sdarran 		ofstr = fstr;
317a864dc36Sdarran 
318a864dc36Sdarran 		iidescp = NULL;
319a864dc36Sdarran 
320a864dc36Sdarran 		if ((rc = parse_stab(stab, fstr, &iidescp)) < 0) {
321a864dc36Sdarran 			terminate("%s: Couldn't parse stab \"%s\" "
322a864dc36Sdarran 			    "(source file %s)\n", file, str, curhdr);
323a864dc36Sdarran 		}
324a864dc36Sdarran 
325a864dc36Sdarran 		if (rc == 0)
326a864dc36Sdarran 			goto parse_loop_end;
327a864dc36Sdarran 
328a864dc36Sdarran 		/* Make sure the scope tracking is working correctly */
329a864dc36Sdarran 		assert(stab->n_type != N_FUN || (iidescp->ii_type != II_GFUN &&
330a864dc36Sdarran 		    iidescp->ii_type != II_SFUN) || scope == 0);
331a864dc36Sdarran 
332a864dc36Sdarran 		/*
333a864dc36Sdarran 		 * The only things we care about that are in local scope are
334a864dc36Sdarran 		 * the N_PSYM stabs.
335a864dc36Sdarran 		 */
336a864dc36Sdarran 		if (scope && stab->n_type != N_PSYM) {
337a864dc36Sdarran 			if (iidescp)
338a864dc36Sdarran 				iidesc_free(iidescp, NULL);
339a864dc36Sdarran 			goto parse_loop_end;
340a864dc36Sdarran 		}
341a864dc36Sdarran 
342a864dc36Sdarran 		switch (iidescp->ii_type) {
343a864dc36Sdarran 		case II_SFUN:
344a864dc36Sdarran 			iidescp->ii_owner = xstrdup(curfile);
345a864dc36Sdarran 			/*FALLTHROUGH*/
346a864dc36Sdarran 		case II_GFUN:
347a864dc36Sdarran 			curfun = iidescp;
348a864dc36Sdarran 			fnarg_free(iidescp);
349a864dc36Sdarran 			iidesc_add(td->td_iihash, iidescp);
350a864dc36Sdarran 			break;
351a864dc36Sdarran 
352a864dc36Sdarran 		case II_SVAR:
353a864dc36Sdarran 			iidescp->ii_owner = xstrdup(curfile);
354a864dc36Sdarran 			/*FALLTHROUGH*/
355a864dc36Sdarran 		case II_GVAR:
356a864dc36Sdarran 		case II_TYPE:
357a864dc36Sdarran 		case II_SOU:
358a864dc36Sdarran 			iidesc_add(td->td_iihash, iidescp);
359a864dc36Sdarran 			break;
360a864dc36Sdarran 
361a864dc36Sdarran 		case II_PSYM:
362a864dc36Sdarran 			fnarg_add(curfun, iidescp);
363a864dc36Sdarran 			iidesc_free(iidescp, NULL);
364a864dc36Sdarran 			break;
365a864dc36Sdarran 		default:
366a864dc36Sdarran 			aborterr("invalid ii_type %d for stab type %d",
367a864dc36Sdarran 			    iidescp->ii_type, stab->n_type);
368a864dc36Sdarran 		}
369a864dc36Sdarran 
370a864dc36Sdarran parse_loop_end:
371a864dc36Sdarran 		fstr = NULL;
372a864dc36Sdarran 	}
373a864dc36Sdarran 
374a864dc36Sdarran 	if (ofstr)
375a864dc36Sdarran 		free(ofstr);
376a864dc36Sdarran 
377a864dc36Sdarran 	resolve_nodes(td);
378a864dc36Sdarran 	resolve_typed_bitfields();
379a864dc36Sdarran 	parse_finish(td);
380a864dc36Sdarran 
381a864dc36Sdarran 	cvt_fixstabs(td);
382a864dc36Sdarran 	cvt_fixups(td, elf_ptrsz(elf));
383a864dc36Sdarran 
384a864dc36Sdarran 	return (0);
385a864dc36Sdarran }
386