xref: /netbsd-src/external/bsd/elftoolchain/dist/libelf/libelf_ar_util.c (revision 5ac3bc719ce6e70593039505b491894133237d12)
1*5ac3bc71Schristos /*	$NetBSD: libelf_ar_util.c,v 1.5 2024/03/03 17:37:34 christos Exp $	*/
2e81373b4Schristos 
39dd9d0cfSchristos /*-
49dd9d0cfSchristos  * Copyright (c) 2006,2009,2010 Joseph Koshy
59dd9d0cfSchristos  * All rights reserved.
69dd9d0cfSchristos  *
79dd9d0cfSchristos  * Redistribution and use in source and binary forms, with or without
89dd9d0cfSchristos  * modification, are permitted provided that the following conditions
99dd9d0cfSchristos  * are met:
109dd9d0cfSchristos  * 1. Redistributions of source code must retain the above copyright
119dd9d0cfSchristos  *    notice, this list of conditions and the following disclaimer.
129dd9d0cfSchristos  * 2. Redistributions in binary form must reproduce the above copyright
139dd9d0cfSchristos  *    notice, this list of conditions and the following disclaimer in the
149dd9d0cfSchristos  *    documentation and/or other materials provided with the distribution.
159dd9d0cfSchristos  *
169dd9d0cfSchristos  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS `AS IS' AND
179dd9d0cfSchristos  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
189dd9d0cfSchristos  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
199dd9d0cfSchristos  * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
209dd9d0cfSchristos  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
219dd9d0cfSchristos  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
229dd9d0cfSchristos  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
239dd9d0cfSchristos  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
249dd9d0cfSchristos  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
259dd9d0cfSchristos  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
269dd9d0cfSchristos  * SUCH DAMAGE.
279dd9d0cfSchristos  */
289dd9d0cfSchristos 
29e81373b4Schristos #if HAVE_NBTOOL_CONFIG_H
30e81373b4Schristos # include "nbtool_config.h"
31e81373b4Schristos #endif
32e81373b4Schristos 
339dd9d0cfSchristos #include <sys/cdefs.h>
349dd9d0cfSchristos 
359dd9d0cfSchristos #include <assert.h>
369dd9d0cfSchristos #include <libelf.h>
379dd9d0cfSchristos #include <stdlib.h>
389dd9d0cfSchristos #include <string.h>
399dd9d0cfSchristos 
409dd9d0cfSchristos #include "_libelf.h"
419dd9d0cfSchristos #include "_libelf_ar.h"
429dd9d0cfSchristos 
43*5ac3bc71Schristos __RCSID("$NetBSD: libelf_ar_util.c,v 1.5 2024/03/03 17:37:34 christos Exp $");
44*5ac3bc71Schristos ELFTC_VCSID("Id: libelf_ar_util.c 3977 2022-05-01 06:45:34Z jkoshy");
459dd9d0cfSchristos 
/*
 * Convert a string bounded by `src' and `src+sz' (exclusive) to a
 * number in the specified base.
 *
 * Leading blanks are skipped.  Conversion stops at the first blank that
 * follows the digits, at the first decimal digit that is not valid in
 * `base', or at the end of the field.  A field holding no digits
 * converts to zero.
 *
 * Returns 1 and stores the converted value in `*ret' on success.
 * Returns 0, leaving `*ret' untouched, if a character other than a
 * blank or a decimal digit is encountered, or if the value cannot be
 * represented in a size_t.
 */
int
_libelf_ar_get_number(const char *src, size_t sz, unsigned int base,
    size_t *ret)
{
	size_t r;
	unsigned int c, v;
	const unsigned char *e, *s;
	const size_t maxval = ~(size_t) 0;

	assert(base <= 10);

	s = (const unsigned char *) src;
	e = s + sz;

	/* Skip leading blanks. */
	while (s < e && *s == ' ')
		s++;

	r = 0;
	for (; s < e; s++) {
		c = *s;
		if (c == ' ')		/* End of the number. */
			break;
		if (c < '0' || c > '9')
			return (0);
		v = c - '0';
		if (v >= base)		/* Illegal digit. */
			break;

		/*
		 * Reject values that would wrap around: archive headers
		 * are untrusted input and a wrapped size would defeat
		 * later bounds checks.  `base' is non-zero here, since
		 * `v >= base' was false.
		 */
		if (r > (maxval - v) / base)
			return (0);

		r = r * base + v;
	}

	*ret = r;

	return (1);
}
849dd9d0cfSchristos 
859dd9d0cfSchristos /*
869dd9d0cfSchristos  * Return the translated name for an archive member.
879dd9d0cfSchristos  */
889dd9d0cfSchristos char *
_libelf_ar_get_translated_name(const struct ar_hdr * arh,Elf * ar)899dd9d0cfSchristos _libelf_ar_get_translated_name(const struct ar_hdr *arh, Elf *ar)
909dd9d0cfSchristos {
9142bd3019Schristos 	char *s;
9242bd3019Schristos 	unsigned char c;
939dd9d0cfSchristos 	size_t len, offset;
9442bd3019Schristos 	const unsigned char *buf, *p, *q, *r;
959dd9d0cfSchristos 	const size_t bufsize = sizeof(arh->ar_name);
969dd9d0cfSchristos 
979dd9d0cfSchristos 	assert(arh != NULL);
989dd9d0cfSchristos 	assert(ar->e_kind == ELF_K_AR);
9942bd3019Schristos 	assert((const unsigned char *) arh >= ar->e_rawfile &&
10042bd3019Schristos 	    (const unsigned char *) arh < ar->e_rawfile + ar->e_rawsize);
1019dd9d0cfSchristos 
10242bd3019Schristos 	buf = (const unsigned char *) arh->ar_name;
1039dd9d0cfSchristos 
1049dd9d0cfSchristos 	/*
1059dd9d0cfSchristos 	 * Check for extended naming.
1069dd9d0cfSchristos 	 *
1079dd9d0cfSchristos 	 * If the name matches the pattern "^/[0-9]+", it is an
1089dd9d0cfSchristos 	 * SVR4-style extended name.  If the name matches the pattern
1099dd9d0cfSchristos 	 * "#1/[0-9]+", the entry uses BSD style extended naming.
1109dd9d0cfSchristos 	 */
1119dd9d0cfSchristos 	if (buf[0] == '/' && (c = buf[1]) >= '0' && c <= '9') {
1129dd9d0cfSchristos 		/*
1139dd9d0cfSchristos 		 * The value in field ar_name is a decimal offset into
1149dd9d0cfSchristos 		 * the archive string table where the actual name
1159dd9d0cfSchristos 		 * resides.
1169dd9d0cfSchristos 		 */
11742bd3019Schristos 		if (_libelf_ar_get_number((const char *) (buf + 1),
11842bd3019Schristos 			bufsize - 1, 10, &offset) == 0) {
1199dd9d0cfSchristos 			LIBELF_SET_ERROR(ARCHIVE, 0);
1209dd9d0cfSchristos 			return (NULL);
1219dd9d0cfSchristos 		}
1229dd9d0cfSchristos 
1239dd9d0cfSchristos 		if (offset > ar->e_u.e_ar.e_rawstrtabsz) {
1249dd9d0cfSchristos 			LIBELF_SET_ERROR(ARCHIVE, 0);
1259dd9d0cfSchristos 			return (NULL);
1269dd9d0cfSchristos 		}
1279dd9d0cfSchristos 
1289dd9d0cfSchristos 		p = q = ar->e_u.e_ar.e_rawstrtab + offset;
1299dd9d0cfSchristos 		r = ar->e_u.e_ar.e_rawstrtab + ar->e_u.e_ar.e_rawstrtabsz;
1309dd9d0cfSchristos 
1319dd9d0cfSchristos 		for (; p < r && *p != '/'; p++)
1329dd9d0cfSchristos 			;
13342bd3019Schristos 		len = (size_t) (p - q + 1); /* space for the trailing NUL */
1349dd9d0cfSchristos 
1359dd9d0cfSchristos 		if ((s = malloc(len)) == NULL) {
1369dd9d0cfSchristos 			LIBELF_SET_ERROR(RESOURCE, 0);
1379dd9d0cfSchristos 			return (NULL);
1389dd9d0cfSchristos 		}
1399dd9d0cfSchristos 
14042bd3019Schristos 		(void) strncpy(s, (const char *) q, len - 1);
1419dd9d0cfSchristos 		s[len - 1] = '\0';
1429dd9d0cfSchristos 
1439dd9d0cfSchristos 		return (s);
1449dd9d0cfSchristos 	} else if (IS_EXTENDED_BSD_NAME(buf)) {
1459dd9d0cfSchristos 		r = buf + LIBELF_AR_BSD_EXTENDED_NAME_PREFIX_SIZE;
1469dd9d0cfSchristos 
14742bd3019Schristos 		if (_libelf_ar_get_number((const char *) r, bufsize -
1489dd9d0cfSchristos 			LIBELF_AR_BSD_EXTENDED_NAME_PREFIX_SIZE, 10,
1499dd9d0cfSchristos 			&len) == 0) {
1509dd9d0cfSchristos 			LIBELF_SET_ERROR(ARCHIVE, 0);
1519dd9d0cfSchristos 			return (NULL);
1529dd9d0cfSchristos 		}
1539dd9d0cfSchristos 
1549dd9d0cfSchristos 		/*
1559dd9d0cfSchristos 		 * Allocate space for the file name plus a
1569dd9d0cfSchristos 		 * trailing NUL.
1579dd9d0cfSchristos 		 */
1589dd9d0cfSchristos 		if ((s = malloc(len + 1)) == NULL) {
1599dd9d0cfSchristos 			LIBELF_SET_ERROR(RESOURCE, 0);
1609dd9d0cfSchristos 			return (NULL);
1619dd9d0cfSchristos 		}
1629dd9d0cfSchristos 
1639dd9d0cfSchristos 		/*
1649dd9d0cfSchristos 		 * The file name follows the archive header.
1659dd9d0cfSchristos 		 */
16642bd3019Schristos 		q = (const unsigned char *) (arh + 1);
1679dd9d0cfSchristos 
16842bd3019Schristos 		(void) strncpy(s, (const char *) q, len);
1699dd9d0cfSchristos 		s[len] = '\0';
1709dd9d0cfSchristos 
1719dd9d0cfSchristos 		return (s);
1729dd9d0cfSchristos 	}
1739dd9d0cfSchristos 
1749dd9d0cfSchristos 	/*
1759dd9d0cfSchristos 	 * A 'normal' name.
1769dd9d0cfSchristos 	 *
1779dd9d0cfSchristos 	 * Skip back over trailing blanks from the end of the field.
1789dd9d0cfSchristos 	 * In the SVR4 format, a '/' is used as a terminator for
1799dd9d0cfSchristos 	 * non-special names.
1809dd9d0cfSchristos 	 */
1819dd9d0cfSchristos 	for (q = buf + bufsize - 1; q >= buf && *q == ' '; --q)
1829dd9d0cfSchristos 		;
1839dd9d0cfSchristos 
1849dd9d0cfSchristos 	if (q >= buf) {
1859dd9d0cfSchristos 		if (*q == '/') {
1869dd9d0cfSchristos 			/*
1879dd9d0cfSchristos 			 * SVR4 style names: ignore the trailing
1889dd9d0cfSchristos 			 * character '/', but only if the name is not
1899dd9d0cfSchristos 			 * one of the special names "/" and "//".
1909dd9d0cfSchristos 			 */
1919dd9d0cfSchristos 			if (q > buf + 1 ||
1929dd9d0cfSchristos 			    (q == (buf + 1) && *buf != '/'))
1939dd9d0cfSchristos 				q--;
1949dd9d0cfSchristos 		}
1959dd9d0cfSchristos 
19642bd3019Schristos 		len = (size_t) (q - buf + 2); /* Space for a trailing NUL. */
1979dd9d0cfSchristos 	} else {
1989dd9d0cfSchristos 		/* The buffer only had blanks. */
19942bd3019Schristos 		buf = (const unsigned char *) "";
2009dd9d0cfSchristos 		len = 1;
2019dd9d0cfSchristos 	}
2029dd9d0cfSchristos 
2039dd9d0cfSchristos 	if ((s = malloc(len)) == NULL) {
2049dd9d0cfSchristos 		LIBELF_SET_ERROR(RESOURCE, 0);
2059dd9d0cfSchristos 		return (NULL);
2069dd9d0cfSchristos 	}
2079dd9d0cfSchristos 
20842bd3019Schristos 	(void) strncpy(s, (const char *) buf, len - 1);
2099dd9d0cfSchristos 	s[len - 1] = '\0';
2109dd9d0cfSchristos 
2119dd9d0cfSchristos 	return (s);
2129dd9d0cfSchristos }
2139dd9d0cfSchristos 
2149dd9d0cfSchristos /*
2159dd9d0cfSchristos  * Return the raw name for an archive member, inclusive of any
2169dd9d0cfSchristos  * formatting characters.
2179dd9d0cfSchristos  */
2189dd9d0cfSchristos char *
_libelf_ar_get_raw_name(const struct ar_hdr * arh)2199dd9d0cfSchristos _libelf_ar_get_raw_name(const struct ar_hdr *arh)
2209dd9d0cfSchristos {
2219dd9d0cfSchristos 	char *rawname;
2229dd9d0cfSchristos 	const size_t namesz = sizeof(arh->ar_name);
2239dd9d0cfSchristos 
2249dd9d0cfSchristos 	if ((rawname = malloc(namesz + 1)) == NULL) {
2259dd9d0cfSchristos 		LIBELF_SET_ERROR(RESOURCE, 0);
2269dd9d0cfSchristos 		return (NULL);
2279dd9d0cfSchristos 	}
2289dd9d0cfSchristos 
2299dd9d0cfSchristos 	(void) strncpy(rawname, arh->ar_name, namesz);
2309dd9d0cfSchristos 	rawname[namesz] = '\0';
2319dd9d0cfSchristos 	return (rawname);
2329dd9d0cfSchristos }
2339dd9d0cfSchristos 
2349dd9d0cfSchristos /*
2359dd9d0cfSchristos  * Open an 'ar' archive.
2369dd9d0cfSchristos  */
2379dd9d0cfSchristos Elf *
_libelf_ar_open(Elf * e,int reporterror)2389dd9d0cfSchristos _libelf_ar_open(Elf *e, int reporterror)
2399dd9d0cfSchristos {
2409dd9d0cfSchristos 	size_t sz;
2419dd9d0cfSchristos 	int scanahead;
2429dd9d0cfSchristos 	struct ar_hdr arh;
24342bd3019Schristos 	unsigned char *s, *end;
2449dd9d0cfSchristos 
2459dd9d0cfSchristos 	_libelf_init_elf(e, ELF_K_AR);
2469dd9d0cfSchristos 
2479dd9d0cfSchristos 	e->e_u.e_ar.e_nchildren = 0;
2489dd9d0cfSchristos 	e->e_u.e_ar.e_next = (off_t) -1;
2499dd9d0cfSchristos 
2509dd9d0cfSchristos 	/*
2519dd9d0cfSchristos 	 * Look for special members.
2529dd9d0cfSchristos 	 */
2539dd9d0cfSchristos 
2549dd9d0cfSchristos 	s = e->e_rawfile + SARMAG;
2559dd9d0cfSchristos 	end = e->e_rawfile + e->e_rawsize;
2569dd9d0cfSchristos 
2579dd9d0cfSchristos 	assert(e->e_rawsize > 0);
2589dd9d0cfSchristos 
2599dd9d0cfSchristos 	/*
2609dd9d0cfSchristos 	 * We use heuristics to determine the flavor of the archive we
2619dd9d0cfSchristos 	 * are examining.
2629dd9d0cfSchristos 	 *
2639dd9d0cfSchristos 	 * SVR4 flavor archives use the name "/ " and "// " for
2649dd9d0cfSchristos 	 * special members.
2659dd9d0cfSchristos 	 *
2669dd9d0cfSchristos 	 * In BSD flavor archives the symbol table, if present, is the
2679dd9d0cfSchristos 	 * first archive with name "__.SYMDEF".
2689dd9d0cfSchristos 	 */
2699dd9d0cfSchristos 
2709dd9d0cfSchristos #define	READ_AR_HEADER(S, ARH, SZ, END)					\
2719dd9d0cfSchristos 	do {								\
2729dd9d0cfSchristos 		if ((S) + sizeof((ARH)) > (END))			\
2739dd9d0cfSchristos 		        goto error;					\
2749dd9d0cfSchristos 		(void) memcpy(&(ARH), (S), sizeof((ARH)));		\
2759dd9d0cfSchristos 		if ((ARH).ar_fmag[0] != '`' || (ARH).ar_fmag[1] != '\n') \
2769dd9d0cfSchristos 			goto error;					\
27742bd3019Schristos 		if (_libelf_ar_get_number((char *) (ARH).ar_size,	\
2789dd9d0cfSchristos 		    sizeof((ARH).ar_size), 10, &(SZ)) == 0)		\
2799dd9d0cfSchristos 			goto error;					\
280*5ac3bc71Schristos 	} while (/* CONSTCOND */ 0)
2819dd9d0cfSchristos 
2829dd9d0cfSchristos 	READ_AR_HEADER(s, arh, sz, end);
2839dd9d0cfSchristos 
2849dd9d0cfSchristos 	/*
2859dd9d0cfSchristos 	 * Handle special archive members for the SVR4 format.
2869dd9d0cfSchristos 	 */
2879dd9d0cfSchristos 	if (arh.ar_name[0] == '/') {
28842bd3019Schristos 		if (sz == 0)
28942bd3019Schristos 			goto error;
2909dd9d0cfSchristos 
2919dd9d0cfSchristos 		e->e_flags |= LIBELF_F_AR_VARIANT_SVR4;
2929dd9d0cfSchristos 
2939dd9d0cfSchristos 		scanahead = 0;
2949dd9d0cfSchristos 
2959dd9d0cfSchristos 		/*
2969dd9d0cfSchristos 		 * The symbol table (file name "/ ") always comes before the
2979dd9d0cfSchristos 		 * string table (file name "// ").
2989dd9d0cfSchristos 		 */
2999dd9d0cfSchristos 		if (arh.ar_name[1] == ' ') {
3009dd9d0cfSchristos 			/* "/ " => symbol table. */
3019dd9d0cfSchristos 			scanahead = 1;	/* The string table to follow. */
3029dd9d0cfSchristos 
3039dd9d0cfSchristos 			s += sizeof(arh);
3049dd9d0cfSchristos 			e->e_u.e_ar.e_rawsymtab = s;
3059dd9d0cfSchristos 			e->e_u.e_ar.e_rawsymtabsz = sz;
3069dd9d0cfSchristos 
3079dd9d0cfSchristos 			sz = LIBELF_ADJUST_AR_SIZE(sz);
3089dd9d0cfSchristos 			s += sz;
3099dd9d0cfSchristos 
3109dd9d0cfSchristos 		} else if (arh.ar_name[1] == '/' && arh.ar_name[2] == ' ') {
3119dd9d0cfSchristos 			/* "// " => string table for long file names. */
3129dd9d0cfSchristos 			s += sizeof(arh);
3139dd9d0cfSchristos 			e->e_u.e_ar.e_rawstrtab = s;
3149dd9d0cfSchristos 			e->e_u.e_ar.e_rawstrtabsz = sz;
3159dd9d0cfSchristos 
3169dd9d0cfSchristos 			sz = LIBELF_ADJUST_AR_SIZE(sz);
3179dd9d0cfSchristos 			s += sz;
3189dd9d0cfSchristos 		}
3199dd9d0cfSchristos 
3209dd9d0cfSchristos 		/*
3219dd9d0cfSchristos 		 * If the string table hasn't been seen yet, look for
3229dd9d0cfSchristos 		 * it in the next member.
3239dd9d0cfSchristos 		 */
3249dd9d0cfSchristos 		if (scanahead) {
3259dd9d0cfSchristos 			READ_AR_HEADER(s, arh, sz, end);
3269dd9d0cfSchristos 
3279dd9d0cfSchristos 			/* "// " => string table for long file names. */
3289dd9d0cfSchristos 			if (arh.ar_name[0] == '/' && arh.ar_name[1] == '/' &&
3299dd9d0cfSchristos 			    arh.ar_name[2] == ' ') {
3309dd9d0cfSchristos 
3319dd9d0cfSchristos 				s += sizeof(arh);
3329dd9d0cfSchristos 
3339dd9d0cfSchristos 				e->e_u.e_ar.e_rawstrtab = s;
3349dd9d0cfSchristos 				e->e_u.e_ar.e_rawstrtabsz = sz;
3359dd9d0cfSchristos 
3369dd9d0cfSchristos 				sz = LIBELF_ADJUST_AR_SIZE(sz);
3379dd9d0cfSchristos 				s += sz;
3389dd9d0cfSchristos 			}
3399dd9d0cfSchristos 		}
3409dd9d0cfSchristos 	} else if (strncmp(arh.ar_name, LIBELF_AR_BSD_SYMTAB_NAME,
3419dd9d0cfSchristos 		sizeof(LIBELF_AR_BSD_SYMTAB_NAME) - 1) == 0) {
3429dd9d0cfSchristos 		/*
3439dd9d0cfSchristos 		 * BSD style archive symbol table.
3449dd9d0cfSchristos 		 */
3459dd9d0cfSchristos 		s += sizeof(arh);
3469dd9d0cfSchristos 		e->e_u.e_ar.e_rawsymtab = s;
3479dd9d0cfSchristos 		e->e_u.e_ar.e_rawsymtabsz = sz;
3489dd9d0cfSchristos 
3499dd9d0cfSchristos 		sz = LIBELF_ADJUST_AR_SIZE(sz);
3509dd9d0cfSchristos 		s += sz;
3519dd9d0cfSchristos 	}
3529dd9d0cfSchristos 
3539dd9d0cfSchristos 	/*
3549dd9d0cfSchristos 	 * Update the 'next' offset, so that a subsequent elf_begin()
3559dd9d0cfSchristos 	 * works as expected.
3569dd9d0cfSchristos 	 */
3579dd9d0cfSchristos 	e->e_u.e_ar.e_next = (off_t) (s - e->e_rawfile);
3589dd9d0cfSchristos 
3599dd9d0cfSchristos 	return (e);
3609dd9d0cfSchristos 
3619dd9d0cfSchristos error:
3629dd9d0cfSchristos 	if (!reporterror) {
3639dd9d0cfSchristos 		e->e_kind = ELF_K_NONE;
3649dd9d0cfSchristos 		return (e);
3659dd9d0cfSchristos 	}
3669dd9d0cfSchristos 
3679dd9d0cfSchristos 	LIBELF_SET_ERROR(ARCHIVE, 0);
3689dd9d0cfSchristos 	return (NULL);
3699dd9d0cfSchristos }
370