/*	$NetBSD: libelf_ar_util.c,v 1.5 2024/03/03 17:37:34 christos Exp $	*/
2e81373b4Schristos
/*-
 * Copyright (c) 2006,2009,2010 Joseph Koshy
 * All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 *
 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS `AS IS' AND
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
 * SUCH DAMAGE.
 */
289dd9d0cfSchristos
29e81373b4Schristos #if HAVE_NBTOOL_CONFIG_H
30e81373b4Schristos # include "nbtool_config.h"
31e81373b4Schristos #endif
32e81373b4Schristos
339dd9d0cfSchristos #include <sys/cdefs.h>
349dd9d0cfSchristos
359dd9d0cfSchristos #include <assert.h>
369dd9d0cfSchristos #include <libelf.h>
379dd9d0cfSchristos #include <stdlib.h>
389dd9d0cfSchristos #include <string.h>
399dd9d0cfSchristos
409dd9d0cfSchristos #include "_libelf.h"
419dd9d0cfSchristos #include "_libelf_ar.h"
429dd9d0cfSchristos
43*5ac3bc71Schristos __RCSID("$NetBSD: libelf_ar_util.c,v 1.5 2024/03/03 17:37:34 christos Exp $");
44*5ac3bc71Schristos ELFTC_VCSID("Id: libelf_ar_util.c 3977 2022-05-01 06:45:34Z jkoshy");
459dd9d0cfSchristos
/*
 * Convert the text held in the `sz' bytes starting at `src' to a
 * number in the specified base, which must not exceed 10.
 *
 * Leading blanks are skipped.  Conversion stops at the end of the
 * field, at the first blank following the digits, or at the first
 * decimal digit that is not a legal digit in `base'.  A field that
 * holds no digits at all converts to zero.
 *
 * Returns 1 and stores the converted value in `*ret' on success.
 * Returns 0, leaving `*ret' untouched, if a character that is neither
 * a blank nor a decimal digit is encountered, or if the value is too
 * large to be represented in a `size_t'.
 */
int
_libelf_ar_get_number(const char *src, size_t sz, unsigned int base,
    size_t *ret)
{
	size_t r;
	unsigned int v;
	const unsigned char *e, *s;
	const size_t maxval = (size_t) -1;

	assert(base <= 10);

	s = (const unsigned char *) src;
	e = s + sz;

	/* Skip leading blanks. */
	while (s < e && *s == ' ')
		s++;

	r = 0;
	for (; s < e && *s != ' '; s++) {
		if (*s < '0' || *s > '9')
			return (0);
		v = (unsigned int) (*s - '0');
		if (v >= base)		/* Illegal digit. */
			break;
		/*
		 * Refuse values that would wrap around: a silently
		 * truncated size or offset taken from a corrupt header
		 * is worse than a reported failure.  `base' is non-zero
		 * here, since `v >= base' holds for every digit
		 * otherwise.
		 */
		if (r > (maxval - v) / base)
			return (0);
		r = r * base + v;
	}

	*ret = r;

	return (1);
}
849dd9d0cfSchristos
859dd9d0cfSchristos /*
869dd9d0cfSchristos * Return the translated name for an archive member.
879dd9d0cfSchristos */
889dd9d0cfSchristos char *
_libelf_ar_get_translated_name(const struct ar_hdr * arh,Elf * ar)899dd9d0cfSchristos _libelf_ar_get_translated_name(const struct ar_hdr *arh, Elf *ar)
909dd9d0cfSchristos {
9142bd3019Schristos char *s;
9242bd3019Schristos unsigned char c;
939dd9d0cfSchristos size_t len, offset;
9442bd3019Schristos const unsigned char *buf, *p, *q, *r;
959dd9d0cfSchristos const size_t bufsize = sizeof(arh->ar_name);
969dd9d0cfSchristos
979dd9d0cfSchristos assert(arh != NULL);
989dd9d0cfSchristos assert(ar->e_kind == ELF_K_AR);
9942bd3019Schristos assert((const unsigned char *) arh >= ar->e_rawfile &&
10042bd3019Schristos (const unsigned char *) arh < ar->e_rawfile + ar->e_rawsize);
1019dd9d0cfSchristos
10242bd3019Schristos buf = (const unsigned char *) arh->ar_name;
1039dd9d0cfSchristos
1049dd9d0cfSchristos /*
1059dd9d0cfSchristos * Check for extended naming.
1069dd9d0cfSchristos *
1079dd9d0cfSchristos * If the name matches the pattern "^/[0-9]+", it is an
1089dd9d0cfSchristos * SVR4-style extended name. If the name matches the pattern
1099dd9d0cfSchristos * "#1/[0-9]+", the entry uses BSD style extended naming.
1109dd9d0cfSchristos */
1119dd9d0cfSchristos if (buf[0] == '/' && (c = buf[1]) >= '0' && c <= '9') {
1129dd9d0cfSchristos /*
1139dd9d0cfSchristos * The value in field ar_name is a decimal offset into
1149dd9d0cfSchristos * the archive string table where the actual name
1159dd9d0cfSchristos * resides.
1169dd9d0cfSchristos */
11742bd3019Schristos if (_libelf_ar_get_number((const char *) (buf + 1),
11842bd3019Schristos bufsize - 1, 10, &offset) == 0) {
1199dd9d0cfSchristos LIBELF_SET_ERROR(ARCHIVE, 0);
1209dd9d0cfSchristos return (NULL);
1219dd9d0cfSchristos }
1229dd9d0cfSchristos
1239dd9d0cfSchristos if (offset > ar->e_u.e_ar.e_rawstrtabsz) {
1249dd9d0cfSchristos LIBELF_SET_ERROR(ARCHIVE, 0);
1259dd9d0cfSchristos return (NULL);
1269dd9d0cfSchristos }
1279dd9d0cfSchristos
1289dd9d0cfSchristos p = q = ar->e_u.e_ar.e_rawstrtab + offset;
1299dd9d0cfSchristos r = ar->e_u.e_ar.e_rawstrtab + ar->e_u.e_ar.e_rawstrtabsz;
1309dd9d0cfSchristos
1319dd9d0cfSchristos for (; p < r && *p != '/'; p++)
1329dd9d0cfSchristos ;
13342bd3019Schristos len = (size_t) (p - q + 1); /* space for the trailing NUL */
1349dd9d0cfSchristos
1359dd9d0cfSchristos if ((s = malloc(len)) == NULL) {
1369dd9d0cfSchristos LIBELF_SET_ERROR(RESOURCE, 0);
1379dd9d0cfSchristos return (NULL);
1389dd9d0cfSchristos }
1399dd9d0cfSchristos
14042bd3019Schristos (void) strncpy(s, (const char *) q, len - 1);
1419dd9d0cfSchristos s[len - 1] = '\0';
1429dd9d0cfSchristos
1439dd9d0cfSchristos return (s);
1449dd9d0cfSchristos } else if (IS_EXTENDED_BSD_NAME(buf)) {
1459dd9d0cfSchristos r = buf + LIBELF_AR_BSD_EXTENDED_NAME_PREFIX_SIZE;
1469dd9d0cfSchristos
14742bd3019Schristos if (_libelf_ar_get_number((const char *) r, bufsize -
1489dd9d0cfSchristos LIBELF_AR_BSD_EXTENDED_NAME_PREFIX_SIZE, 10,
1499dd9d0cfSchristos &len) == 0) {
1509dd9d0cfSchristos LIBELF_SET_ERROR(ARCHIVE, 0);
1519dd9d0cfSchristos return (NULL);
1529dd9d0cfSchristos }
1539dd9d0cfSchristos
1549dd9d0cfSchristos /*
1559dd9d0cfSchristos * Allocate space for the file name plus a
1569dd9d0cfSchristos * trailing NUL.
1579dd9d0cfSchristos */
1589dd9d0cfSchristos if ((s = malloc(len + 1)) == NULL) {
1599dd9d0cfSchristos LIBELF_SET_ERROR(RESOURCE, 0);
1609dd9d0cfSchristos return (NULL);
1619dd9d0cfSchristos }
1629dd9d0cfSchristos
1639dd9d0cfSchristos /*
1649dd9d0cfSchristos * The file name follows the archive header.
1659dd9d0cfSchristos */
16642bd3019Schristos q = (const unsigned char *) (arh + 1);
1679dd9d0cfSchristos
16842bd3019Schristos (void) strncpy(s, (const char *) q, len);
1699dd9d0cfSchristos s[len] = '\0';
1709dd9d0cfSchristos
1719dd9d0cfSchristos return (s);
1729dd9d0cfSchristos }
1739dd9d0cfSchristos
1749dd9d0cfSchristos /*
1759dd9d0cfSchristos * A 'normal' name.
1769dd9d0cfSchristos *
1779dd9d0cfSchristos * Skip back over trailing blanks from the end of the field.
1789dd9d0cfSchristos * In the SVR4 format, a '/' is used as a terminator for
1799dd9d0cfSchristos * non-special names.
1809dd9d0cfSchristos */
1819dd9d0cfSchristos for (q = buf + bufsize - 1; q >= buf && *q == ' '; --q)
1829dd9d0cfSchristos ;
1839dd9d0cfSchristos
1849dd9d0cfSchristos if (q >= buf) {
1859dd9d0cfSchristos if (*q == '/') {
1869dd9d0cfSchristos /*
1879dd9d0cfSchristos * SVR4 style names: ignore the trailing
1889dd9d0cfSchristos * character '/', but only if the name is not
1899dd9d0cfSchristos * one of the special names "/" and "//".
1909dd9d0cfSchristos */
1919dd9d0cfSchristos if (q > buf + 1 ||
1929dd9d0cfSchristos (q == (buf + 1) && *buf != '/'))
1939dd9d0cfSchristos q--;
1949dd9d0cfSchristos }
1959dd9d0cfSchristos
19642bd3019Schristos len = (size_t) (q - buf + 2); /* Space for a trailing NUL. */
1979dd9d0cfSchristos } else {
1989dd9d0cfSchristos /* The buffer only had blanks. */
19942bd3019Schristos buf = (const unsigned char *) "";
2009dd9d0cfSchristos len = 1;
2019dd9d0cfSchristos }
2029dd9d0cfSchristos
2039dd9d0cfSchristos if ((s = malloc(len)) == NULL) {
2049dd9d0cfSchristos LIBELF_SET_ERROR(RESOURCE, 0);
2059dd9d0cfSchristos return (NULL);
2069dd9d0cfSchristos }
2079dd9d0cfSchristos
20842bd3019Schristos (void) strncpy(s, (const char *) buf, len - 1);
2099dd9d0cfSchristos s[len - 1] = '\0';
2109dd9d0cfSchristos
2119dd9d0cfSchristos return (s);
2129dd9d0cfSchristos }
2139dd9d0cfSchristos
2149dd9d0cfSchristos /*
2159dd9d0cfSchristos * Return the raw name for an archive member, inclusive of any
2169dd9d0cfSchristos * formatting characters.
2179dd9d0cfSchristos */
2189dd9d0cfSchristos char *
_libelf_ar_get_raw_name(const struct ar_hdr * arh)2199dd9d0cfSchristos _libelf_ar_get_raw_name(const struct ar_hdr *arh)
2209dd9d0cfSchristos {
2219dd9d0cfSchristos char *rawname;
2229dd9d0cfSchristos const size_t namesz = sizeof(arh->ar_name);
2239dd9d0cfSchristos
2249dd9d0cfSchristos if ((rawname = malloc(namesz + 1)) == NULL) {
2259dd9d0cfSchristos LIBELF_SET_ERROR(RESOURCE, 0);
2269dd9d0cfSchristos return (NULL);
2279dd9d0cfSchristos }
2289dd9d0cfSchristos
2299dd9d0cfSchristos (void) strncpy(rawname, arh->ar_name, namesz);
2309dd9d0cfSchristos rawname[namesz] = '\0';
2319dd9d0cfSchristos return (rawname);
2329dd9d0cfSchristos }
2339dd9d0cfSchristos
2349dd9d0cfSchristos /*
2359dd9d0cfSchristos * Open an 'ar' archive.
2369dd9d0cfSchristos */
2379dd9d0cfSchristos Elf *
_libelf_ar_open(Elf * e,int reporterror)2389dd9d0cfSchristos _libelf_ar_open(Elf *e, int reporterror)
2399dd9d0cfSchristos {
2409dd9d0cfSchristos size_t sz;
2419dd9d0cfSchristos int scanahead;
2429dd9d0cfSchristos struct ar_hdr arh;
24342bd3019Schristos unsigned char *s, *end;
2449dd9d0cfSchristos
2459dd9d0cfSchristos _libelf_init_elf(e, ELF_K_AR);
2469dd9d0cfSchristos
2479dd9d0cfSchristos e->e_u.e_ar.e_nchildren = 0;
2489dd9d0cfSchristos e->e_u.e_ar.e_next = (off_t) -1;
2499dd9d0cfSchristos
2509dd9d0cfSchristos /*
2519dd9d0cfSchristos * Look for special members.
2529dd9d0cfSchristos */
2539dd9d0cfSchristos
2549dd9d0cfSchristos s = e->e_rawfile + SARMAG;
2559dd9d0cfSchristos end = e->e_rawfile + e->e_rawsize;
2569dd9d0cfSchristos
2579dd9d0cfSchristos assert(e->e_rawsize > 0);
2589dd9d0cfSchristos
2599dd9d0cfSchristos /*
2609dd9d0cfSchristos * We use heuristics to determine the flavor of the archive we
2619dd9d0cfSchristos * are examining.
2629dd9d0cfSchristos *
2639dd9d0cfSchristos * SVR4 flavor archives use the name "/ " and "// " for
2649dd9d0cfSchristos * special members.
2659dd9d0cfSchristos *
2669dd9d0cfSchristos * In BSD flavor archives the symbol table, if present, is the
2679dd9d0cfSchristos * first archive with name "__.SYMDEF".
2689dd9d0cfSchristos */
2699dd9d0cfSchristos
2709dd9d0cfSchristos #define READ_AR_HEADER(S, ARH, SZ, END) \
2719dd9d0cfSchristos do { \
2729dd9d0cfSchristos if ((S) + sizeof((ARH)) > (END)) \
2739dd9d0cfSchristos goto error; \
2749dd9d0cfSchristos (void) memcpy(&(ARH), (S), sizeof((ARH))); \
2759dd9d0cfSchristos if ((ARH).ar_fmag[0] != '`' || (ARH).ar_fmag[1] != '\n') \
2769dd9d0cfSchristos goto error; \
27742bd3019Schristos if (_libelf_ar_get_number((char *) (ARH).ar_size, \
2789dd9d0cfSchristos sizeof((ARH).ar_size), 10, &(SZ)) == 0) \
2799dd9d0cfSchristos goto error; \
280*5ac3bc71Schristos } while (/* CONSTCOND */ 0)
2819dd9d0cfSchristos
2829dd9d0cfSchristos READ_AR_HEADER(s, arh, sz, end);
2839dd9d0cfSchristos
2849dd9d0cfSchristos /*
2859dd9d0cfSchristos * Handle special archive members for the SVR4 format.
2869dd9d0cfSchristos */
2879dd9d0cfSchristos if (arh.ar_name[0] == '/') {
28842bd3019Schristos if (sz == 0)
28942bd3019Schristos goto error;
2909dd9d0cfSchristos
2919dd9d0cfSchristos e->e_flags |= LIBELF_F_AR_VARIANT_SVR4;
2929dd9d0cfSchristos
2939dd9d0cfSchristos scanahead = 0;
2949dd9d0cfSchristos
2959dd9d0cfSchristos /*
2969dd9d0cfSchristos * The symbol table (file name "/ ") always comes before the
2979dd9d0cfSchristos * string table (file name "// ").
2989dd9d0cfSchristos */
2999dd9d0cfSchristos if (arh.ar_name[1] == ' ') {
3009dd9d0cfSchristos /* "/ " => symbol table. */
3019dd9d0cfSchristos scanahead = 1; /* The string table to follow. */
3029dd9d0cfSchristos
3039dd9d0cfSchristos s += sizeof(arh);
3049dd9d0cfSchristos e->e_u.e_ar.e_rawsymtab = s;
3059dd9d0cfSchristos e->e_u.e_ar.e_rawsymtabsz = sz;
3069dd9d0cfSchristos
3079dd9d0cfSchristos sz = LIBELF_ADJUST_AR_SIZE(sz);
3089dd9d0cfSchristos s += sz;
3099dd9d0cfSchristos
3109dd9d0cfSchristos } else if (arh.ar_name[1] == '/' && arh.ar_name[2] == ' ') {
3119dd9d0cfSchristos /* "// " => string table for long file names. */
3129dd9d0cfSchristos s += sizeof(arh);
3139dd9d0cfSchristos e->e_u.e_ar.e_rawstrtab = s;
3149dd9d0cfSchristos e->e_u.e_ar.e_rawstrtabsz = sz;
3159dd9d0cfSchristos
3169dd9d0cfSchristos sz = LIBELF_ADJUST_AR_SIZE(sz);
3179dd9d0cfSchristos s += sz;
3189dd9d0cfSchristos }
3199dd9d0cfSchristos
3209dd9d0cfSchristos /*
3219dd9d0cfSchristos * If the string table hasn't been seen yet, look for
3229dd9d0cfSchristos * it in the next member.
3239dd9d0cfSchristos */
3249dd9d0cfSchristos if (scanahead) {
3259dd9d0cfSchristos READ_AR_HEADER(s, arh, sz, end);
3269dd9d0cfSchristos
3279dd9d0cfSchristos /* "// " => string table for long file names. */
3289dd9d0cfSchristos if (arh.ar_name[0] == '/' && arh.ar_name[1] == '/' &&
3299dd9d0cfSchristos arh.ar_name[2] == ' ') {
3309dd9d0cfSchristos
3319dd9d0cfSchristos s += sizeof(arh);
3329dd9d0cfSchristos
3339dd9d0cfSchristos e->e_u.e_ar.e_rawstrtab = s;
3349dd9d0cfSchristos e->e_u.e_ar.e_rawstrtabsz = sz;
3359dd9d0cfSchristos
3369dd9d0cfSchristos sz = LIBELF_ADJUST_AR_SIZE(sz);
3379dd9d0cfSchristos s += sz;
3389dd9d0cfSchristos }
3399dd9d0cfSchristos }
3409dd9d0cfSchristos } else if (strncmp(arh.ar_name, LIBELF_AR_BSD_SYMTAB_NAME,
3419dd9d0cfSchristos sizeof(LIBELF_AR_BSD_SYMTAB_NAME) - 1) == 0) {
3429dd9d0cfSchristos /*
3439dd9d0cfSchristos * BSD style archive symbol table.
3449dd9d0cfSchristos */
3459dd9d0cfSchristos s += sizeof(arh);
3469dd9d0cfSchristos e->e_u.e_ar.e_rawsymtab = s;
3479dd9d0cfSchristos e->e_u.e_ar.e_rawsymtabsz = sz;
3489dd9d0cfSchristos
3499dd9d0cfSchristos sz = LIBELF_ADJUST_AR_SIZE(sz);
3509dd9d0cfSchristos s += sz;
3519dd9d0cfSchristos }
3529dd9d0cfSchristos
3539dd9d0cfSchristos /*
3549dd9d0cfSchristos * Update the 'next' offset, so that a subsequent elf_begin()
3559dd9d0cfSchristos * works as expected.
3569dd9d0cfSchristos */
3579dd9d0cfSchristos e->e_u.e_ar.e_next = (off_t) (s - e->e_rawfile);
3589dd9d0cfSchristos
3599dd9d0cfSchristos return (e);
3609dd9d0cfSchristos
3619dd9d0cfSchristos error:
3629dd9d0cfSchristos if (!reporterror) {
3639dd9d0cfSchristos e->e_kind = ELF_K_NONE;
3649dd9d0cfSchristos return (e);
3659dd9d0cfSchristos }
3669dd9d0cfSchristos
3679dd9d0cfSchristos LIBELF_SET_ERROR(ARCHIVE, 0);
3689dd9d0cfSchristos return (NULL);
3699dd9d0cfSchristos }
370