1327e51cbSPeter Avalos /*
2327e51cbSPeter Avalos * Copyright (c) Ian F. Darwin 1986-1995.
3327e51cbSPeter Avalos * Software written by Ian F. Darwin and others;
4327e51cbSPeter Avalos * maintained 1995-present by Christos Zoulas and others.
5327e51cbSPeter Avalos *
6327e51cbSPeter Avalos * Redistribution and use in source and binary forms, with or without
7327e51cbSPeter Avalos * modification, are permitted provided that the following conditions
8327e51cbSPeter Avalos * are met:
9327e51cbSPeter Avalos * 1. Redistributions of source code must retain the above copyright
10327e51cbSPeter Avalos * notice immediately at the beginning of the file, without modification,
11327e51cbSPeter Avalos * this list of conditions, and the following disclaimer.
12327e51cbSPeter Avalos * 2. Redistributions in binary form must reproduce the above copyright
13327e51cbSPeter Avalos * notice, this list of conditions and the following disclaimer in the
14327e51cbSPeter Avalos * documentation and/or other materials provided with the distribution.
15327e51cbSPeter Avalos *
16327e51cbSPeter Avalos * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
17327e51cbSPeter Avalos * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
18327e51cbSPeter Avalos * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
19327e51cbSPeter Avalos * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE FOR
20327e51cbSPeter Avalos * ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
21327e51cbSPeter Avalos * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
22327e51cbSPeter Avalos * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
23327e51cbSPeter Avalos * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
24327e51cbSPeter Avalos * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
25327e51cbSPeter Avalos * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
26327e51cbSPeter Avalos * SUCH DAMAGE.
27327e51cbSPeter Avalos */
28327e51cbSPeter Avalos /*
29327e51cbSPeter Avalos * apprentice - make one pass through /etc/magic, learning its secrets.
30327e51cbSPeter Avalos */
31327e51cbSPeter Avalos
32327e51cbSPeter Avalos #include "file.h"
3379343712SPeter Avalos
3479343712SPeter Avalos #ifndef lint
35*3b9cdfa3SAntonio Huete Jimenez FILE_RCSID("@(#)$File: apprentice.c,v 1.326 2022/09/13 18:46:07 christos Exp $")
3679343712SPeter Avalos #endif /* lint */
3779343712SPeter Avalos
38327e51cbSPeter Avalos #include "magic.h"
39327e51cbSPeter Avalos #include <stdlib.h>
40327e51cbSPeter Avalos #ifdef HAVE_UNISTD_H
41327e51cbSPeter Avalos #include <unistd.h>
42327e51cbSPeter Avalos #endif
43e8af9738SPeter Avalos #include <stddef.h>
44327e51cbSPeter Avalos #include <string.h>
45327e51cbSPeter Avalos #include <assert.h>
46327e51cbSPeter Avalos #include <ctype.h>
47327e51cbSPeter Avalos #include <fcntl.h>
48327e51cbSPeter Avalos #ifdef QUICK
49327e51cbSPeter Avalos #include <sys/mman.h>
50327e51cbSPeter Avalos #endif
5179343712SPeter Avalos #include <dirent.h>
52e8af9738SPeter Avalos #include <limits.h>
53*3b9cdfa3SAntonio Huete Jimenez #ifdef HAVE_BYTESWAP_H
54*3b9cdfa3SAntonio Huete Jimenez #include <byteswap.h>
55*3b9cdfa3SAntonio Huete Jimenez #endif
56*3b9cdfa3SAntonio Huete Jimenez #ifdef HAVE_SYS_BSWAP_H
57*3b9cdfa3SAntonio Huete Jimenez #include <sys/bswap.h>
58*3b9cdfa3SAntonio Huete Jimenez #endif
59e8af9738SPeter Avalos
60327e51cbSPeter Avalos
/*
 * EATAB: advance the in-scope pointer `l' past a run of ASCII whitespace.
 * It relies on a variable literally named `l' at the point of use.
 *
 * LOWCASE(l): yield tolower(l) when l is an upper-case letter, otherwise
 * l itself.  The argument is expanded more than once, so it must be free
 * of side effects.
 */
616fca56fbSSascha Wildner #define EATAB {while (isascii(CAST(unsigned char, *l)) && \
626fca56fbSSascha Wildner isspace(CAST(unsigned char, *l))) ++l;}
636fca56fbSSascha Wildner #define LOWCASE(l) (isupper(CAST(unsigned char, l)) ? \
646fca56fbSSascha Wildner tolower(CAST(unsigned char, l)) : (l))
65327e51cbSPeter Avalos /*
66327e51cbSPeter Avalos * Work around a bug in headers on Digital Unix.
67327e51cbSPeter Avalos * At least confirmed for: OSF1 V4.0 878
68327e51cbSPeter Avalos */
69327e51cbSPeter Avalos #if defined(__osf__) && defined(__DECC)
70327e51cbSPeter Avalos #ifdef MAP_FAILED
71327e51cbSPeter Avalos #undef MAP_FAILED
72327e51cbSPeter Avalos #endif
73327e51cbSPeter Avalos #endif
74327e51cbSPeter Avalos
75327e51cbSPeter Avalos #ifndef MAP_FAILED
76327e51cbSPeter Avalos #define MAP_FAILED (void *) -1
77327e51cbSPeter Avalos #endif
78327e51cbSPeter Avalos
79327e51cbSPeter Avalos #ifndef MAP_FILE
80327e51cbSPeter Avalos #define MAP_FILE 0
81327e51cbSPeter Avalos #endif
82327e51cbSPeter Avalos
836fca56fbSSascha Wildner #define ALLOC_CHUNK CAST(size_t, 10)
846fca56fbSSascha Wildner #define ALLOC_INCR CAST(size_t, 200)
85e8af9738SPeter Avalos
/*
 * Values of magic_map.type.  apprentice_unmap() selects how to release
 * the map from them: USER buffers are left alone, MALLOC buffers are
 * free()d and MMAP buffers are munmap()ed.
 */
86c30bd091SSascha Wildner #define MAP_TYPE_USER 0
8782c5fa3eSPeter Avalos #define MAP_TYPE_MALLOC 1
88c30bd091SSascha Wildner #define MAP_TYPE_MMAP 2
8982c5fa3eSPeter Avalos
/*
 * One magic entry as handed to the line parsers: a pointer to its
 * struct magic records plus two counters.
 * NOTE(review): presumably cont_count is the number of records in use and
 * max_count the allocated capacity of mp -- confirm against parse().
 */
90327e51cbSPeter Avalos struct magic_entry {
91327e51cbSPeter Avalos struct magic *mp;
92327e51cbSPeter Avalos uint32_t cont_count;
93327e51cbSPeter Avalos uint32_t max_count;
94327e51cbSPeter Avalos };
95327e51cbSPeter Avalos
/*
 * A collection of magic_entry records with two counters.
 * NOTE(review): presumably count is the number of entries used and max
 * the allocated capacity of me -- confirm against the loader.
 */
96e8af9738SPeter Avalos struct magic_entry_set {
97e8af9738SPeter Avalos struct magic_entry *me;
98e8af9738SPeter Avalos uint32_t count;
99e8af9738SPeter Avalos uint32_t max;
100e8af9738SPeter Avalos };
101e8af9738SPeter Avalos
/*
 * A loaded magic database.
 *   p, len  - the backing buffer and its size; passed to munmap() or
 *             free() by apprentice_unmap().
 *   type    - one of the MAP_TYPE_* values; selects how p is released.
 *   magic   - per-set arrays of struct magic, read by add_mlist().
 *   nmagic  - per-set element counts matching magic[].
 */
102e8af9738SPeter Avalos struct magic_map {
103e8af9738SPeter Avalos void *p;
104e8af9738SPeter Avalos size_t len;
10582c5fa3eSPeter Avalos int type;
106e8af9738SPeter Avalos struct magic *magic[MAGIC_SETS];
107e8af9738SPeter Avalos uint32_t nmagic[MAGIC_SETS];
108e8af9738SPeter Avalos };
109e8af9738SPeter Avalos
/*
 * Per-type lookup tables, indexed by FILE_* type code and filled in by
 * init_file_tables(): file_names[type] is the type's keyword and
 * file_formats[type] its FILE_FMT_* class.  The *_n* constants publish
 * the array sizes.
 */
110327e51cbSPeter Avalos int file_formats[FILE_NAMES_SIZE];
111327e51cbSPeter Avalos const size_t file_nformats = FILE_NAMES_SIZE;
112327e51cbSPeter Avalos const char *file_names[FILE_NAMES_SIZE];
113327e51cbSPeter Avalos const size_t file_nnames = FILE_NAMES_SIZE;
114327e51cbSPeter Avalos
115327e51cbSPeter Avalos private int getvalue(struct magic_set *ms, struct magic *, const char **, int);
116327e51cbSPeter Avalos private int hextoint(int);
11779343712SPeter Avalos private const char *getstr(struct magic_set *, struct magic *, const char *,
11879343712SPeter Avalos int);
119e8af9738SPeter Avalos private int parse(struct magic_set *, struct magic_entry *, const char *,
120e8af9738SPeter Avalos size_t, int);
121327e51cbSPeter Avalos private void eatsize(const char **);
122e8af9738SPeter Avalos private int apprentice_1(struct magic_set *, const char *, int);
123*3b9cdfa3SAntonio Huete Jimenez private ssize_t apprentice_magic_strength_1(const struct magic *);
124*3b9cdfa3SAntonio Huete Jimenez private size_t apprentice_magic_strength(const struct magic *, size_t);
125327e51cbSPeter Avalos private int apprentice_sort(const void *, const void *);
126e4d4ce0cSPeter Avalos private void apprentice_list(struct mlist *, int );
127e8af9738SPeter Avalos private struct magic_map *apprentice_load(struct magic_set *,
128327e51cbSPeter Avalos const char *, int);
129e8af9738SPeter Avalos private struct mlist *mlist_alloc(void);
130c990e5baSDaniel Fojt private void mlist_free_all(struct magic_set *);
131e8af9738SPeter Avalos private void mlist_free(struct mlist *);
132327e51cbSPeter Avalos private void byteswap(struct magic *, uint32_t);
133327e51cbSPeter Avalos private void bs1(struct magic *);
134*3b9cdfa3SAntonio Huete Jimenez
135*3b9cdfa3SAntonio Huete Jimenez #if defined(HAVE_BYTESWAP_H)
136*3b9cdfa3SAntonio Huete Jimenez #define swap2(x) bswap_16(x)
137*3b9cdfa3SAntonio Huete Jimenez #define swap4(x) bswap_32(x)
138*3b9cdfa3SAntonio Huete Jimenez #define swap8(x) bswap_64(x)
139*3b9cdfa3SAntonio Huete Jimenez #elif defined(HAVE_SYS_BSWAP_H)
140*3b9cdfa3SAntonio Huete Jimenez #define swap2(x) bswap16(x)
141*3b9cdfa3SAntonio Huete Jimenez #define swap4(x) bswap32(x)
142*3b9cdfa3SAntonio Huete Jimenez #define swap8(x) bswap64(x)
143*3b9cdfa3SAntonio Huete Jimenez #else
144327e51cbSPeter Avalos private uint16_t swap2(uint16_t);
145327e51cbSPeter Avalos private uint32_t swap4(uint32_t);
146327e51cbSPeter Avalos private uint64_t swap8(uint64_t);
147*3b9cdfa3SAntonio Huete Jimenez #endif
148*3b9cdfa3SAntonio Huete Jimenez
14979343712SPeter Avalos private char *mkdbname(struct magic_set *, const char *, int);
15082c5fa3eSPeter Avalos private struct magic_map *apprentice_buf(struct magic_set *, struct magic *,
15182c5fa3eSPeter Avalos size_t);
152e8af9738SPeter Avalos private struct magic_map *apprentice_map(struct magic_set *, const char *);
15382c5fa3eSPeter Avalos private int check_buffer(struct magic_set *, struct magic_map *, const char *);
154e8af9738SPeter Avalos private void apprentice_unmap(struct magic_map *);
155e8af9738SPeter Avalos private int apprentice_compile(struct magic_set *, struct magic_map *,
156327e51cbSPeter Avalos const char *);
157c30bd091SSascha Wildner private int check_format_type(const char *, int, const char **);
158327e51cbSPeter Avalos private int check_format(struct magic_set *, struct magic *);
159327e51cbSPeter Avalos private int get_op(char);
160c990e5baSDaniel Fojt private int parse_mime(struct magic_set *, struct magic_entry *, const char *,
161c990e5baSDaniel Fojt size_t);
162c990e5baSDaniel Fojt private int parse_strength(struct magic_set *, struct magic_entry *,
163c990e5baSDaniel Fojt const char *, size_t);
164c990e5baSDaniel Fojt private int parse_apple(struct magic_set *, struct magic_entry *, const char *,
165c990e5baSDaniel Fojt size_t);
166c990e5baSDaniel Fojt private int parse_ext(struct magic_set *, struct magic_entry *, const char *,
167c990e5baSDaniel Fojt size_t);
16879343712SPeter Avalos
169327e51cbSPeter Avalos
/*
 * Size of struct magic as compiled; apprentice_1() refuses to run when it
 * differs from FILE_MAGICSIZE.
 */
170327e51cbSPeter Avalos private size_t magicsize = sizeof(struct magic);
171327e51cbSPeter Avalos
/*
 * Tab-separated column header naming the fields of a magic line.
 * NOTE(review): its consumer is outside this part of the file.
 */
17279343712SPeter Avalos private const char usg_hdr[] = "cont\toffset\ttype\topcode\tmask\tvalue\tdesc";
17379343712SPeter Avalos
/*
 * Dispatch table mapping a keyword to its parse_<keyword>() handler.
 * DECLARE_FIELD(x) expands to { "x", strlen("x"), parse_x }; the table
 * ends with an all-NULL sentinel.
 * NOTE(review): presumably these are the "!:keyword" annotation lines of
 * a magic file -- confirm where bang[] is searched.
 */
17479343712SPeter Avalos private struct {
17579343712SPeter Avalos const char *name;
17679343712SPeter Avalos size_t len;
177c990e5baSDaniel Fojt int (*fun)(struct magic_set *, struct magic_entry *, const char *,
178c990e5baSDaniel Fojt size_t);
17979343712SPeter Avalos } bang[] = {
18079343712SPeter Avalos #define DECLARE_FIELD(name) { # name, sizeof(# name) - 1, parse_ ## name }
18179343712SPeter Avalos DECLARE_FIELD(mime),
18279343712SPeter Avalos DECLARE_FIELD(apple),
183c30bd091SSascha Wildner DECLARE_FIELD(ext),
18479343712SPeter Avalos DECLARE_FIELD(strength),
18579343712SPeter Avalos #undef DECLARE_FIELD
18679343712SPeter Avalos { NULL, 0, NULL }
18779343712SPeter Avalos };
188327e51cbSPeter Avalos
#ifdef COMPILE_ONLY

int main(int, char *[]);

/*
 * Stand-alone driver built only with COMPILE_ONLY: compiles the magic
 * file named by the single command-line argument.
 *
 * Returns 0 on success and 1 on a usage error, a magic_open() failure or
 * a magic_compile() failure; each failure is reported on stderr.
 */
int
main(int argc, char *argv[])
{
	struct magic_set *ms;
	char *progname;
	int ret = 0;

	/* Report errors under the basename of argv[0]. */
	progname = strrchr(argv[0], '/');
	progname = progname == NULL ? argv[0] : progname + 1;

	if (argc != 2) {
		(void)fprintf(stderr, "Usage: %s file\n", progname);
		return 1;
	}

	ms = magic_open(MAGIC_CHECK);
	if (ms == NULL) {
		(void)fprintf(stderr, "%s: %s\n", progname, strerror(errno));
		return 1;
	}

	if (magic_compile(ms, argv[1]) == -1) {
		ret = 1;
		(void)fprintf(stderr, "%s: %s\n", progname, magic_error(ms));
	}
	magic_close(ms);
	return ret;
}
#endif /* COMPILE_ONLY */
221327e51cbSPeter Avalos
/*
 * One row of a type-keyword table.
 *   name   - the keyword text (at most 15 characters plus NUL).
 *   len    - length of name; 0 marks the terminating row.
 *   type   - the FILE_* type code the keyword selects.
 *   format - the FILE_FMT_* class recorded for that type.
 */
222e8af9738SPeter Avalos struct type_tbl_s {
22379343712SPeter Avalos const char name[16];
224327e51cbSPeter Avalos const size_t len;
225327e51cbSPeter Avalos const int type;
226327e51cbSPeter Avalos const int format;
227e8af9738SPeter Avalos };
228e8af9738SPeter Avalos
229e8af9738SPeter Avalos /*
230e8af9738SPeter Avalos * XXX - the actual Single UNIX Specification says that "long" means "long",
231e8af9738SPeter Avalos * as in the C data type, but we treat it as meaning "4-byte integer".
232e8af9738SPeter Avalos * Given that the OS X version of file 5.04 did the same, I guess that passes
233e8af9738SPeter Avalos * the actual test; having "long" be dependent on how big a "long" is on
234e8af9738SPeter Avalos * the machine running "file" is silly.
235e8af9738SPeter Avalos */
/*
 * Master table of type keywords.  init_file_tables() walks it to fill
 * file_names[] and file_formats[], and asserts that it holds exactly
 * FILE_NAMES_SIZE rows before the terminator.
 */
236e8af9738SPeter Avalos static const struct type_tbl_s type_tbl[] = {
/* XX(s) supplies both the name literal and its length for one row. */
237327e51cbSPeter Avalos # define XX(s) s, (sizeof(s) - 1)
/* XX_NULL supplies the empty name and zero length of the terminator. */
23879343712SPeter Avalos # define XX_NULL "", 0
239e8af9738SPeter Avalos { XX("invalid"), FILE_INVALID, FILE_FMT_NONE },
240327e51cbSPeter Avalos { XX("byte"), FILE_BYTE, FILE_FMT_NUM },
241327e51cbSPeter Avalos { XX("short"), FILE_SHORT, FILE_FMT_NUM },
242e8af9738SPeter Avalos { XX("default"), FILE_DEFAULT, FILE_FMT_NONE },
243327e51cbSPeter Avalos { XX("long"), FILE_LONG, FILE_FMT_NUM },
244327e51cbSPeter Avalos { XX("string"), FILE_STRING, FILE_FMT_STR },
245327e51cbSPeter Avalos { XX("date"), FILE_DATE, FILE_FMT_STR },
246327e51cbSPeter Avalos { XX("beshort"), FILE_BESHORT, FILE_FMT_NUM },
247327e51cbSPeter Avalos { XX("belong"), FILE_BELONG, FILE_FMT_NUM },
248327e51cbSPeter Avalos { XX("bedate"), FILE_BEDATE, FILE_FMT_STR },
249327e51cbSPeter Avalos { XX("leshort"), FILE_LESHORT, FILE_FMT_NUM },
250327e51cbSPeter Avalos { XX("lelong"), FILE_LELONG, FILE_FMT_NUM },
251327e51cbSPeter Avalos { XX("ledate"), FILE_LEDATE, FILE_FMT_STR },
252327e51cbSPeter Avalos { XX("pstring"), FILE_PSTRING, FILE_FMT_STR },
253327e51cbSPeter Avalos { XX("ldate"), FILE_LDATE, FILE_FMT_STR },
254327e51cbSPeter Avalos { XX("beldate"), FILE_BELDATE, FILE_FMT_STR },
255327e51cbSPeter Avalos { XX("leldate"), FILE_LELDATE, FILE_FMT_STR },
256327e51cbSPeter Avalos { XX("regex"), FILE_REGEX, FILE_FMT_STR },
257327e51cbSPeter Avalos { XX("bestring16"), FILE_BESTRING16, FILE_FMT_STR },
258327e51cbSPeter Avalos { XX("lestring16"), FILE_LESTRING16, FILE_FMT_STR },
259327e51cbSPeter Avalos { XX("search"), FILE_SEARCH, FILE_FMT_STR },
260327e51cbSPeter Avalos { XX("medate"), FILE_MEDATE, FILE_FMT_STR },
261327e51cbSPeter Avalos { XX("meldate"), FILE_MELDATE, FILE_FMT_STR },
262327e51cbSPeter Avalos { XX("melong"), FILE_MELONG, FILE_FMT_NUM },
263327e51cbSPeter Avalos { XX("quad"), FILE_QUAD, FILE_FMT_QUAD },
264327e51cbSPeter Avalos { XX("lequad"), FILE_LEQUAD, FILE_FMT_QUAD },
265327e51cbSPeter Avalos { XX("bequad"), FILE_BEQUAD, FILE_FMT_QUAD },
266327e51cbSPeter Avalos { XX("qdate"), FILE_QDATE, FILE_FMT_STR },
267327e51cbSPeter Avalos { XX("leqdate"), FILE_LEQDATE, FILE_FMT_STR },
268327e51cbSPeter Avalos { XX("beqdate"), FILE_BEQDATE, FILE_FMT_STR },
269327e51cbSPeter Avalos { XX("qldate"), FILE_QLDATE, FILE_FMT_STR },
270327e51cbSPeter Avalos { XX("leqldate"), FILE_LEQLDATE, FILE_FMT_STR },
271327e51cbSPeter Avalos { XX("beqldate"), FILE_BEQLDATE, FILE_FMT_STR },
272327e51cbSPeter Avalos { XX("float"), FILE_FLOAT, FILE_FMT_FLOAT },
273327e51cbSPeter Avalos { XX("befloat"), FILE_BEFLOAT, FILE_FMT_FLOAT },
274327e51cbSPeter Avalos { XX("lefloat"), FILE_LEFLOAT, FILE_FMT_FLOAT },
275327e51cbSPeter Avalos { XX("double"), FILE_DOUBLE, FILE_FMT_DOUBLE },
276327e51cbSPeter Avalos { XX("bedouble"), FILE_BEDOUBLE, FILE_FMT_DOUBLE },
277327e51cbSPeter Avalos { XX("ledouble"), FILE_LEDOUBLE, FILE_FMT_DOUBLE },
27879343712SPeter Avalos { XX("leid3"), FILE_LEID3, FILE_FMT_NUM },
27979343712SPeter Avalos { XX("beid3"), FILE_BEID3, FILE_FMT_NUM },
280e8af9738SPeter Avalos { XX("indirect"), FILE_INDIRECT, FILE_FMT_NUM },
281e8af9738SPeter Avalos { XX("qwdate"), FILE_QWDATE, FILE_FMT_STR },
282e8af9738SPeter Avalos { XX("leqwdate"), FILE_LEQWDATE, FILE_FMT_STR },
283e8af9738SPeter Avalos { XX("beqwdate"), FILE_BEQWDATE, FILE_FMT_STR },
284e8af9738SPeter Avalos { XX("name"), FILE_NAME, FILE_FMT_NONE },
285e8af9738SPeter Avalos { XX("use"), FILE_USE, FILE_FMT_NONE },
286e8af9738SPeter Avalos { XX("clear"), FILE_CLEAR, FILE_FMT_NONE },
287c30bd091SSascha Wildner { XX("der"), FILE_DER, FILE_FMT_STR },
288c990e5baSDaniel Fojt { XX("guid"), FILE_GUID, FILE_FMT_STR },
289c990e5baSDaniel Fojt { XX("offset"), FILE_OFFSET, FILE_FMT_QUAD },
290614728caSSascha Wildner { XX("bevarint"), FILE_BEVARINT, FILE_FMT_STR },
291614728caSSascha Wildner { XX("levarint"), FILE_LEVARINT, FILE_FMT_STR },
292*3b9cdfa3SAntonio Huete Jimenez { XX("msdosdate"), FILE_MSDOSDATE, FILE_FMT_STR },
293*3b9cdfa3SAntonio Huete Jimenez { XX("lemsdosdate"), FILE_LEMSDOSDATE, FILE_FMT_STR },
294*3b9cdfa3SAntonio Huete Jimenez { XX("bemsdosdate"), FILE_BEMSDOSDATE, FILE_FMT_STR },
295*3b9cdfa3SAntonio Huete Jimenez { XX("msdostime"), FILE_MSDOSTIME, FILE_FMT_STR },
296*3b9cdfa3SAntonio Huete Jimenez { XX("lemsdostime"), FILE_LEMSDOSTIME, FILE_FMT_STR },
297*3b9cdfa3SAntonio Huete Jimenez { XX("bemsdostime"), FILE_BEMSDOSTIME, FILE_FMT_STR },
298*3b9cdfa3SAntonio Huete Jimenez { XX("octal"), FILE_OCTAL, FILE_FMT_STR },
/* Terminator: len == 0 stops the table scans. */
299327e51cbSPeter Avalos { XX_NULL, FILE_INVALID, FILE_FMT_NONE },
300327e51cbSPeter Avalos };
301327e51cbSPeter Avalos
302e8af9738SPeter Avalos /*
303e8af9738SPeter Avalos * These are not types, and cannot be preceded by "u" to make them
304e8af9738SPeter Avalos * unsigned.
305e8af9738SPeter Avalos */
/* Same row layout as type_tbl; the len == 0 row terminates the table. */
306e8af9738SPeter Avalos static const struct type_tbl_s special_tbl[] = {
307c30bd091SSascha Wildner { XX("der"), FILE_DER, FILE_FMT_STR },
308e8af9738SPeter Avalos { XX("name"), FILE_NAME, FILE_FMT_STR },
309e8af9738SPeter Avalos { XX("use"), FILE_USE, FILE_FMT_STR },
310*3b9cdfa3SAntonio Huete Jimenez { XX("octal"), FILE_OCTAL, FILE_FMT_STR },
311e8af9738SPeter Avalos { XX_NULL, FILE_INVALID, FILE_FMT_NONE },
312e8af9738SPeter Avalos };
/* The row-building helpers are only needed for the two tables above. */
313e8af9738SPeter Avalos # undef XX
314e8af9738SPeter Avalos # undef XX_NULL
315e8af9738SPeter Avalos
316327e51cbSPeter Avalos private int
get_type(const struct type_tbl_s * tbl,const char * l,const char ** t)317e8af9738SPeter Avalos get_type(const struct type_tbl_s *tbl, const char *l, const char **t)
318327e51cbSPeter Avalos {
319327e51cbSPeter Avalos const struct type_tbl_s *p;
320327e51cbSPeter Avalos
321e8af9738SPeter Avalos for (p = tbl; p->len; p++) {
322327e51cbSPeter Avalos if (strncmp(l, p->name, p->len) == 0) {
323327e51cbSPeter Avalos if (t)
324327e51cbSPeter Avalos *t = l + p->len;
325327e51cbSPeter Avalos break;
326327e51cbSPeter Avalos }
327327e51cbSPeter Avalos }
328327e51cbSPeter Avalos return p->type;
329327e51cbSPeter Avalos }
330327e51cbSPeter Avalos
3316fca56fbSSascha Wildner private off_t
maxoff_t(void)3326fca56fbSSascha Wildner maxoff_t(void) {
3336fca56fbSSascha Wildner if (/*CONSTCOND*/sizeof(off_t) == sizeof(int))
3346fca56fbSSascha Wildner return CAST(off_t, INT_MAX);
3356fca56fbSSascha Wildner if (/*CONSTCOND*/sizeof(off_t) == sizeof(long))
3366fca56fbSSascha Wildner return CAST(off_t, LONG_MAX);
3376fca56fbSSascha Wildner return 0x7fffffff;
3386fca56fbSSascha Wildner }
3396fca56fbSSascha Wildner
340e8af9738SPeter Avalos private int
get_standard_integer_type(const char * l,const char ** t)341e8af9738SPeter Avalos get_standard_integer_type(const char *l, const char **t)
342e8af9738SPeter Avalos {
343e8af9738SPeter Avalos int type;
344e8af9738SPeter Avalos
3456fca56fbSSascha Wildner if (isalpha(CAST(unsigned char, l[1]))) {
346e8af9738SPeter Avalos switch (l[1]) {
347e8af9738SPeter Avalos case 'C':
348e8af9738SPeter Avalos /* "dC" and "uC" */
349e8af9738SPeter Avalos type = FILE_BYTE;
350e8af9738SPeter Avalos break;
351e8af9738SPeter Avalos case 'S':
352e8af9738SPeter Avalos /* "dS" and "uS" */
353e8af9738SPeter Avalos type = FILE_SHORT;
354e8af9738SPeter Avalos break;
355e8af9738SPeter Avalos case 'I':
356e8af9738SPeter Avalos case 'L':
357e8af9738SPeter Avalos /*
358e8af9738SPeter Avalos * "dI", "dL", "uI", and "uL".
359e8af9738SPeter Avalos *
360e8af9738SPeter Avalos * XXX - the actual Single UNIX Specification says
361e8af9738SPeter Avalos * that "L" means "long", as in the C data type,
362e8af9738SPeter Avalos * but we treat it as meaning "4-byte integer".
363e8af9738SPeter Avalos * Given that the OS X version of file 5.04 did
364e8af9738SPeter Avalos * the same, I guess that passes the actual SUS
365e8af9738SPeter Avalos * validation suite; having "dL" be dependent on
366e8af9738SPeter Avalos * how big a "long" is on the machine running
367e8af9738SPeter Avalos * "file" is silly.
368e8af9738SPeter Avalos */
369e8af9738SPeter Avalos type = FILE_LONG;
370e8af9738SPeter Avalos break;
371e8af9738SPeter Avalos case 'Q':
372e8af9738SPeter Avalos /* "dQ" and "uQ" */
373e8af9738SPeter Avalos type = FILE_QUAD;
374e8af9738SPeter Avalos break;
375e8af9738SPeter Avalos default:
376e8af9738SPeter Avalos /* "d{anything else}", "u{anything else}" */
377e8af9738SPeter Avalos return FILE_INVALID;
378e8af9738SPeter Avalos }
379e8af9738SPeter Avalos l += 2;
3806fca56fbSSascha Wildner } else if (isdigit(CAST(unsigned char, l[1]))) {
381e8af9738SPeter Avalos /*
382e8af9738SPeter Avalos * "d{num}" and "u{num}"; we only support {num} values
383e8af9738SPeter Avalos * of 1, 2, 4, and 8 - the Single UNIX Specification
384e8af9738SPeter Avalos * doesn't say anything about whether arbitrary
385e8af9738SPeter Avalos * values should be supported, but both the Solaris 10
386e8af9738SPeter Avalos * and OS X Mountain Lion versions of file passed the
387e8af9738SPeter Avalos * Single UNIX Specification validation suite, and
388e8af9738SPeter Avalos * neither of them support values bigger than 8 or
389e8af9738SPeter Avalos * non-power-of-2 values.
390e8af9738SPeter Avalos */
3916fca56fbSSascha Wildner if (isdigit(CAST(unsigned char, l[2]))) {
392e8af9738SPeter Avalos /* Multi-digit, so > 9 */
393e8af9738SPeter Avalos return FILE_INVALID;
394e8af9738SPeter Avalos }
395e8af9738SPeter Avalos switch (l[1]) {
396e8af9738SPeter Avalos case '1':
397e8af9738SPeter Avalos type = FILE_BYTE;
398e8af9738SPeter Avalos break;
399e8af9738SPeter Avalos case '2':
400e8af9738SPeter Avalos type = FILE_SHORT;
401e8af9738SPeter Avalos break;
402e8af9738SPeter Avalos case '4':
403e8af9738SPeter Avalos type = FILE_LONG;
404e8af9738SPeter Avalos break;
405e8af9738SPeter Avalos case '8':
406e8af9738SPeter Avalos type = FILE_QUAD;
407e8af9738SPeter Avalos break;
408e8af9738SPeter Avalos default:
409e8af9738SPeter Avalos /* XXX - what about 3, 5, 6, or 7? */
410e8af9738SPeter Avalos return FILE_INVALID;
411e8af9738SPeter Avalos }
412e8af9738SPeter Avalos l += 2;
413e8af9738SPeter Avalos } else {
414e8af9738SPeter Avalos /*
415e8af9738SPeter Avalos * "d" or "u" by itself.
416e8af9738SPeter Avalos */
417e8af9738SPeter Avalos type = FILE_LONG;
418e8af9738SPeter Avalos ++l;
419e8af9738SPeter Avalos }
420e8af9738SPeter Avalos if (t)
421e8af9738SPeter Avalos *t = l;
422e8af9738SPeter Avalos return type;
423e8af9738SPeter Avalos }
424e8af9738SPeter Avalos
425327e51cbSPeter Avalos private void
init_file_tables(void)426327e51cbSPeter Avalos init_file_tables(void)
427327e51cbSPeter Avalos {
428327e51cbSPeter Avalos static int done = 0;
429327e51cbSPeter Avalos const struct type_tbl_s *p;
430327e51cbSPeter Avalos
431327e51cbSPeter Avalos if (done)
432327e51cbSPeter Avalos return;
433327e51cbSPeter Avalos done++;
434327e51cbSPeter Avalos
43579343712SPeter Avalos for (p = type_tbl; p->len; p++) {
436327e51cbSPeter Avalos assert(p->type < FILE_NAMES_SIZE);
437327e51cbSPeter Avalos file_names[p->type] = p->name;
438327e51cbSPeter Avalos file_formats[p->type] = p->format;
439327e51cbSPeter Avalos }
440e8af9738SPeter Avalos assert(p - type_tbl == FILE_NAMES_SIZE);
441e8af9738SPeter Avalos }
442e8af9738SPeter Avalos
443e8af9738SPeter Avalos private int
add_mlist(struct mlist * mlp,struct magic_map * map,size_t idx)444e8af9738SPeter Avalos add_mlist(struct mlist *mlp, struct magic_map *map, size_t idx)
445e8af9738SPeter Avalos {
446e8af9738SPeter Avalos struct mlist *ml;
447e8af9738SPeter Avalos
448c30bd091SSascha Wildner mlp->map = NULL;
449e8af9738SPeter Avalos if ((ml = CAST(struct mlist *, malloc(sizeof(*ml)))) == NULL)
450e8af9738SPeter Avalos return -1;
451e8af9738SPeter Avalos
452c30bd091SSascha Wildner ml->map = idx == 0 ? map : NULL;
453e8af9738SPeter Avalos ml->magic = map->magic[idx];
454e8af9738SPeter Avalos ml->nmagic = map->nmagic[idx];
455*3b9cdfa3SAntonio Huete Jimenez if (ml->nmagic) {
456*3b9cdfa3SAntonio Huete Jimenez ml->magic_rxcomp = CAST(file_regex_t **,
457*3b9cdfa3SAntonio Huete Jimenez calloc(ml->nmagic, sizeof(*ml->magic_rxcomp)));
458*3b9cdfa3SAntonio Huete Jimenez if (ml->magic_rxcomp == NULL) {
459*3b9cdfa3SAntonio Huete Jimenez free(ml);
460*3b9cdfa3SAntonio Huete Jimenez return -1;
461*3b9cdfa3SAntonio Huete Jimenez }
462*3b9cdfa3SAntonio Huete Jimenez } else
463*3b9cdfa3SAntonio Huete Jimenez ml->magic_rxcomp = NULL;
464e8af9738SPeter Avalos mlp->prev->next = ml;
465e8af9738SPeter Avalos ml->prev = mlp->prev;
466e8af9738SPeter Avalos ml->next = mlp;
467e8af9738SPeter Avalos mlp->prev = ml;
468e8af9738SPeter Avalos return 0;
469327e51cbSPeter Avalos }
470327e51cbSPeter Avalos
471327e51cbSPeter Avalos /*
47279343712SPeter Avalos * Handle one file or directory.
473327e51cbSPeter Avalos */
474327e51cbSPeter Avalos private int
apprentice_1(struct magic_set * ms,const char * fn,int action)475e8af9738SPeter Avalos apprentice_1(struct magic_set *ms, const char *fn, int action)
476327e51cbSPeter Avalos {
477e8af9738SPeter Avalos struct magic_map *map;
47882c5fa3eSPeter Avalos #ifndef COMPILE_ONLY
47982c5fa3eSPeter Avalos struct mlist *ml;
480e8af9738SPeter Avalos size_t i;
48182c5fa3eSPeter Avalos #endif
482327e51cbSPeter Avalos
483327e51cbSPeter Avalos if (magicsize != FILE_MAGICSIZE) {
484327e51cbSPeter Avalos file_error(ms, 0, "magic element size %lu != %lu",
4856fca56fbSSascha Wildner CAST(unsigned long, sizeof(*map->magic[0])),
4866fca56fbSSascha Wildner CAST(unsigned long, FILE_MAGICSIZE));
487327e51cbSPeter Avalos return -1;
488327e51cbSPeter Avalos }
489327e51cbSPeter Avalos
490327e51cbSPeter Avalos if (action == FILE_COMPILE) {
491e8af9738SPeter Avalos map = apprentice_load(ms, fn, action);
492e8af9738SPeter Avalos if (map == NULL)
493327e51cbSPeter Avalos return -1;
494e8af9738SPeter Avalos return apprentice_compile(ms, map, fn);
495327e51cbSPeter Avalos }
496327e51cbSPeter Avalos
497327e51cbSPeter Avalos #ifndef COMPILE_ONLY
498e8af9738SPeter Avalos map = apprentice_map(ms, fn);
499e8af9738SPeter Avalos if (map == NULL) {
500327e51cbSPeter Avalos if (ms->flags & MAGIC_CHECK)
501327e51cbSPeter Avalos file_magwarn(ms, "using regular magic file `%s'", fn);
502e8af9738SPeter Avalos map = apprentice_load(ms, fn, action);
503e8af9738SPeter Avalos if (map == NULL)
504327e51cbSPeter Avalos return -1;
505327e51cbSPeter Avalos }
506327e51cbSPeter Avalos
507e8af9738SPeter Avalos for (i = 0; i < MAGIC_SETS; i++) {
508e8af9738SPeter Avalos if (add_mlist(ms->mlist[i], map, i) == -1) {
509c990e5baSDaniel Fojt /* failed to add to any list, free explicitly */
510c990e5baSDaniel Fojt if (i == 0)
511c990e5baSDaniel Fojt apprentice_unmap(map);
512c990e5baSDaniel Fojt else
513c990e5baSDaniel Fojt mlist_free_all(ms);
514327e51cbSPeter Avalos file_oomem(ms, sizeof(*ml));
515c30bd091SSascha Wildner return -1;
516327e51cbSPeter Avalos }
517e8af9738SPeter Avalos }
518327e51cbSPeter Avalos
519e4d4ce0cSPeter Avalos if (action == FILE_LIST) {
520e8af9738SPeter Avalos for (i = 0; i < MAGIC_SETS; i++) {
52182c5fa3eSPeter Avalos printf("Set %" SIZE_T_FORMAT "u:\nBinary patterns:\n",
52282c5fa3eSPeter Avalos i);
523e8af9738SPeter Avalos apprentice_list(ms->mlist[i], BINTEST);
524e4d4ce0cSPeter Avalos printf("Text patterns:\n");
525e8af9738SPeter Avalos apprentice_list(ms->mlist[i], TEXTTEST);
526e8af9738SPeter Avalos }
527e4d4ce0cSPeter Avalos }
52882c5fa3eSPeter Avalos return 0;
52982c5fa3eSPeter Avalos #else
530327e51cbSPeter Avalos return 0;
531327e51cbSPeter Avalos #endif /* COMPILE_ONLY */
532327e51cbSPeter Avalos }
533327e51cbSPeter Avalos
534327e51cbSPeter Avalos protected void
file_ms_free(struct magic_set * ms)535e8af9738SPeter Avalos file_ms_free(struct magic_set *ms)
536327e51cbSPeter Avalos {
537e8af9738SPeter Avalos size_t i;
538e8af9738SPeter Avalos if (ms == NULL)
539327e51cbSPeter Avalos return;
540e8af9738SPeter Avalos for (i = 0; i < MAGIC_SETS; i++)
541e8af9738SPeter Avalos mlist_free(ms->mlist[i]);
542e8af9738SPeter Avalos free(ms->o.pbuf);
543e8af9738SPeter Avalos free(ms->o.buf);
544e8af9738SPeter Avalos free(ms->c.li);
545*3b9cdfa3SAntonio Huete Jimenez #ifdef USE_C_LOCALE
546*3b9cdfa3SAntonio Huete Jimenez freelocale(ms->c_lc_ctype);
547*3b9cdfa3SAntonio Huete Jimenez #endif
548e8af9738SPeter Avalos free(ms);
549327e51cbSPeter Avalos }
550e8af9738SPeter Avalos
551e8af9738SPeter Avalos protected struct magic_set *
file_ms_alloc(int flags)552e8af9738SPeter Avalos file_ms_alloc(int flags)
553e8af9738SPeter Avalos {
554e8af9738SPeter Avalos struct magic_set *ms;
555e8af9738SPeter Avalos size_t i, len;
556e8af9738SPeter Avalos
5576fca56fbSSascha Wildner if ((ms = CAST(struct magic_set *, calloc(CAST(size_t, 1u),
558e8af9738SPeter Avalos sizeof(struct magic_set)))) == NULL)
559e8af9738SPeter Avalos return NULL;
560e8af9738SPeter Avalos
561e8af9738SPeter Avalos if (magic_setflags(ms, flags) == -1) {
562e8af9738SPeter Avalos errno = EINVAL;
563e8af9738SPeter Avalos goto free;
564e8af9738SPeter Avalos }
565e8af9738SPeter Avalos
566e8af9738SPeter Avalos ms->o.buf = ms->o.pbuf = NULL;
567c990e5baSDaniel Fojt ms->o.blen = 0;
568e8af9738SPeter Avalos len = (ms->c.len = 10) * sizeof(*ms->c.li);
569e8af9738SPeter Avalos
570e8af9738SPeter Avalos if ((ms->c.li = CAST(struct level_info *, malloc(len))) == NULL)
571e8af9738SPeter Avalos goto free;
572e8af9738SPeter Avalos
573e8af9738SPeter Avalos ms->event_flags = 0;
574e8af9738SPeter Avalos ms->error = -1;
575e8af9738SPeter Avalos for (i = 0; i < MAGIC_SETS; i++)
576e8af9738SPeter Avalos ms->mlist[i] = NULL;
577e8af9738SPeter Avalos ms->file = "unknown";
578e8af9738SPeter Avalos ms->line = 0;
57982c5fa3eSPeter Avalos ms->indir_max = FILE_INDIR_MAX;
58082c5fa3eSPeter Avalos ms->name_max = FILE_NAME_MAX;
58182c5fa3eSPeter Avalos ms->elf_shnum_max = FILE_ELF_SHNUM_MAX;
58282c5fa3eSPeter Avalos ms->elf_phnum_max = FILE_ELF_PHNUM_MAX;
58382c5fa3eSPeter Avalos ms->elf_notes_max = FILE_ELF_NOTES_MAX;
584c30bd091SSascha Wildner ms->regex_max = FILE_REGEX_MAX;
585c30bd091SSascha Wildner ms->bytes_max = FILE_BYTES_MAX;
586970935fdSSascha Wildner ms->encoding_max = FILE_ENCODING_MAX;
587*3b9cdfa3SAntonio Huete Jimenez #ifdef USE_C_LOCALE
588*3b9cdfa3SAntonio Huete Jimenez ms->c_lc_ctype = newlocale(LC_CTYPE_MASK, "C", 0);
589*3b9cdfa3SAntonio Huete Jimenez assert(ms->c_lc_ctype != NULL);
590*3b9cdfa3SAntonio Huete Jimenez #endif
591e8af9738SPeter Avalos return ms;
592e8af9738SPeter Avalos free:
593e8af9738SPeter Avalos free(ms);
594e8af9738SPeter Avalos return NULL;
595e8af9738SPeter Avalos }
596e8af9738SPeter Avalos
597e8af9738SPeter Avalos private void
apprentice_unmap(struct magic_map * map)598e8af9738SPeter Avalos apprentice_unmap(struct magic_map *map)
599e8af9738SPeter Avalos {
600c30bd091SSascha Wildner size_t i;
601614728caSSascha Wildner char *p;
602e8af9738SPeter Avalos if (map == NULL)
603e8af9738SPeter Avalos return;
60482c5fa3eSPeter Avalos
60582c5fa3eSPeter Avalos switch (map->type) {
606c30bd091SSascha Wildner case MAP_TYPE_USER:
607c30bd091SSascha Wildner break;
608c30bd091SSascha Wildner case MAP_TYPE_MALLOC:
609614728caSSascha Wildner p = CAST(char *, map->p);
610c30bd091SSascha Wildner for (i = 0; i < MAGIC_SETS; i++) {
611614728caSSascha Wildner char *b = RCAST(char *, map->magic[i]);
612614728caSSascha Wildner if (p != NULL && b >= p && b <= p + map->len)
613c30bd091SSascha Wildner continue;
614614728caSSascha Wildner free(b);
615c30bd091SSascha Wildner }
616614728caSSascha Wildner free(p);
617c30bd091SSascha Wildner break;
618e8af9738SPeter Avalos #ifdef QUICK
61982c5fa3eSPeter Avalos case MAP_TYPE_MMAP:
620c30bd091SSascha Wildner if (map->p && map->p != MAP_FAILED)
621e8af9738SPeter Avalos (void)munmap(map->p, map->len);
62282c5fa3eSPeter Avalos break;
623e8af9738SPeter Avalos #endif
62482c5fa3eSPeter Avalos default:
625*3b9cdfa3SAntonio Huete Jimenez fprintf(stderr, "Bad map type %d", map->type);
62682c5fa3eSPeter Avalos abort();
62782c5fa3eSPeter Avalos }
628e8af9738SPeter Avalos free(map);
629e8af9738SPeter Avalos }
630e8af9738SPeter Avalos
631e8af9738SPeter Avalos private struct mlist *
mlist_alloc(void)632e8af9738SPeter Avalos mlist_alloc(void)
633e8af9738SPeter Avalos {
634e8af9738SPeter Avalos struct mlist *mlist;
635e8af9738SPeter Avalos if ((mlist = CAST(struct mlist *, calloc(1, sizeof(*mlist)))) == NULL) {
636e8af9738SPeter Avalos return NULL;
637e8af9738SPeter Avalos }
638e8af9738SPeter Avalos mlist->next = mlist->prev = mlist;
639e8af9738SPeter Avalos return mlist;
640e8af9738SPeter Avalos }
641e8af9738SPeter Avalos
642e8af9738SPeter Avalos private void
mlist_free_all(struct magic_set * ms)643c990e5baSDaniel Fojt mlist_free_all(struct magic_set *ms)
644c990e5baSDaniel Fojt {
645c990e5baSDaniel Fojt size_t i;
646c990e5baSDaniel Fojt
647c990e5baSDaniel Fojt for (i = 0; i < MAGIC_SETS; i++) {
648c990e5baSDaniel Fojt mlist_free(ms->mlist[i]);
649c990e5baSDaniel Fojt ms->mlist[i] = NULL;
650c990e5baSDaniel Fojt }
651c990e5baSDaniel Fojt }
652c990e5baSDaniel Fojt
653c990e5baSDaniel Fojt private void
mlist_free_one(struct mlist * ml)6546fca56fbSSascha Wildner mlist_free_one(struct mlist *ml)
6556fca56fbSSascha Wildner {
656*3b9cdfa3SAntonio Huete Jimenez size_t i;
657*3b9cdfa3SAntonio Huete Jimenez
6586fca56fbSSascha Wildner if (ml->map)
6596fca56fbSSascha Wildner apprentice_unmap(CAST(struct magic_map *, ml->map));
660*3b9cdfa3SAntonio Huete Jimenez
661*3b9cdfa3SAntonio Huete Jimenez for (i = 0; i < ml->nmagic; ++i) {
662*3b9cdfa3SAntonio Huete Jimenez if (ml->magic_rxcomp[i]) {
663*3b9cdfa3SAntonio Huete Jimenez file_regfree(ml->magic_rxcomp[i]);
664*3b9cdfa3SAntonio Huete Jimenez free(ml->magic_rxcomp[i]);
665*3b9cdfa3SAntonio Huete Jimenez ml->magic_rxcomp[i] = NULL;
666*3b9cdfa3SAntonio Huete Jimenez }
667*3b9cdfa3SAntonio Huete Jimenez }
668*3b9cdfa3SAntonio Huete Jimenez free(ml->magic_rxcomp);
669*3b9cdfa3SAntonio Huete Jimenez ml->magic_rxcomp = NULL;
6706fca56fbSSascha Wildner free(ml);
6716fca56fbSSascha Wildner }
6726fca56fbSSascha Wildner
6736fca56fbSSascha Wildner private void
mlist_free(struct mlist * mlist)674e8af9738SPeter Avalos mlist_free(struct mlist *mlist)
675e8af9738SPeter Avalos {
67682c5fa3eSPeter Avalos struct mlist *ml, *next;
677e8af9738SPeter Avalos
678e8af9738SPeter Avalos if (mlist == NULL)
679e8af9738SPeter Avalos return;
680e8af9738SPeter Avalos
681c990e5baSDaniel Fojt for (ml = mlist->next; ml != mlist;) {
6826fca56fbSSascha Wildner next = ml->next;
6836fca56fbSSascha Wildner mlist_free_one(ml);
684c990e5baSDaniel Fojt ml = next;
685e8af9738SPeter Avalos }
6866fca56fbSSascha Wildner mlist_free_one(mlist);
687327e51cbSPeter Avalos }
688327e51cbSPeter Avalos
68982c5fa3eSPeter Avalos #ifndef COMPILE_ONLY
69082c5fa3eSPeter Avalos /* void **bufs: an array of compiled magic files */
69182c5fa3eSPeter Avalos protected int
buffer_apprentice(struct magic_set * ms,struct magic ** bufs,size_t * sizes,size_t nbufs)69282c5fa3eSPeter Avalos buffer_apprentice(struct magic_set *ms, struct magic **bufs,
69382c5fa3eSPeter Avalos size_t *sizes, size_t nbufs)
69482c5fa3eSPeter Avalos {
69582c5fa3eSPeter Avalos size_t i, j;
69682c5fa3eSPeter Avalos struct mlist *ml;
69782c5fa3eSPeter Avalos struct magic_map *map;
69882c5fa3eSPeter Avalos
69982c5fa3eSPeter Avalos if (nbufs == 0)
70082c5fa3eSPeter Avalos return -1;
70182c5fa3eSPeter Avalos
702c30bd091SSascha Wildner (void)file_reset(ms, 0);
70382c5fa3eSPeter Avalos
70482c5fa3eSPeter Avalos init_file_tables();
70582c5fa3eSPeter Avalos
70682c5fa3eSPeter Avalos for (i = 0; i < MAGIC_SETS; i++) {
70782c5fa3eSPeter Avalos mlist_free(ms->mlist[i]);
70882c5fa3eSPeter Avalos if ((ms->mlist[i] = mlist_alloc()) == NULL) {
70982c5fa3eSPeter Avalos file_oomem(ms, sizeof(*ms->mlist[i]));
71082c5fa3eSPeter Avalos goto fail;
71182c5fa3eSPeter Avalos }
71282c5fa3eSPeter Avalos }
71382c5fa3eSPeter Avalos
71482c5fa3eSPeter Avalos for (i = 0; i < nbufs; i++) {
71582c5fa3eSPeter Avalos map = apprentice_buf(ms, bufs[i], sizes[i]);
71682c5fa3eSPeter Avalos if (map == NULL)
71782c5fa3eSPeter Avalos goto fail;
71882c5fa3eSPeter Avalos
71982c5fa3eSPeter Avalos for (j = 0; j < MAGIC_SETS; j++) {
72082c5fa3eSPeter Avalos if (add_mlist(ms->mlist[j], map, j) == -1) {
72182c5fa3eSPeter Avalos file_oomem(ms, sizeof(*ml));
72282c5fa3eSPeter Avalos goto fail;
72382c5fa3eSPeter Avalos }
72482c5fa3eSPeter Avalos }
72582c5fa3eSPeter Avalos }
72682c5fa3eSPeter Avalos
72782c5fa3eSPeter Avalos return 0;
72882c5fa3eSPeter Avalos fail:
729c990e5baSDaniel Fojt mlist_free_all(ms);
73082c5fa3eSPeter Avalos return -1;
73182c5fa3eSPeter Avalos }
73282c5fa3eSPeter Avalos #endif
73382c5fa3eSPeter Avalos
73479343712SPeter Avalos /* const char *fn: list of magic files and directories */
735e8af9738SPeter Avalos protected int
file_apprentice(struct magic_set * ms,const char * fn,int action)736327e51cbSPeter Avalos file_apprentice(struct magic_set *ms, const char *fn, int action)
737327e51cbSPeter Avalos {
73879343712SPeter Avalos char *p, *mfn;
7396fca56fbSSascha Wildner int fileerr, errs = -1;
740c990e5baSDaniel Fojt size_t i, j;
741e8af9738SPeter Avalos
742c30bd091SSascha Wildner (void)file_reset(ms, 0);
743327e51cbSPeter Avalos
744f72f8299SJan Lentfer if ((fn = magic_getpath(fn, action)) == NULL)
745e8af9738SPeter Avalos return -1;
746327e51cbSPeter Avalos
747f72f8299SJan Lentfer init_file_tables();
748327e51cbSPeter Avalos
749327e51cbSPeter Avalos if ((mfn = strdup(fn)) == NULL) {
750327e51cbSPeter Avalos file_oomem(ms, strlen(fn));
751e8af9738SPeter Avalos return -1;
752e8af9738SPeter Avalos }
753e8af9738SPeter Avalos
754e8af9738SPeter Avalos for (i = 0; i < MAGIC_SETS; i++) {
755e8af9738SPeter Avalos mlist_free(ms->mlist[i]);
756e8af9738SPeter Avalos if ((ms->mlist[i] = mlist_alloc()) == NULL) {
757e8af9738SPeter Avalos file_oomem(ms, sizeof(*ms->mlist[i]));
758c990e5baSDaniel Fojt for (j = 0; j < i; j++) {
759c990e5baSDaniel Fojt mlist_free(ms->mlist[j]);
760c990e5baSDaniel Fojt ms->mlist[j] = NULL;
761e8af9738SPeter Avalos }
762e8af9738SPeter Avalos free(mfn);
763e8af9738SPeter Avalos return -1;
764e8af9738SPeter Avalos }
765327e51cbSPeter Avalos }
766327e51cbSPeter Avalos fn = mfn;
767327e51cbSPeter Avalos
768327e51cbSPeter Avalos while (fn) {
769*3b9cdfa3SAntonio Huete Jimenez p = CCAST(char *, strchr(fn, PATHSEP));
770327e51cbSPeter Avalos if (p)
771327e51cbSPeter Avalos *p++ = '\0';
772327e51cbSPeter Avalos if (*fn == '\0')
773327e51cbSPeter Avalos break;
7746fca56fbSSascha Wildner fileerr = apprentice_1(ms, fn, action);
7756fca56fbSSascha Wildner errs = MAX(errs, fileerr);
776327e51cbSPeter Avalos fn = p;
777327e51cbSPeter Avalos }
778e8af9738SPeter Avalos
779e8af9738SPeter Avalos free(mfn);
780e8af9738SPeter Avalos
781327e51cbSPeter Avalos if (errs == -1) {
782e8af9738SPeter Avalos for (i = 0; i < MAGIC_SETS; i++) {
783e8af9738SPeter Avalos mlist_free(ms->mlist[i]);
784e8af9738SPeter Avalos ms->mlist[i] = NULL;
785327e51cbSPeter Avalos }
786e8af9738SPeter Avalos file_error(ms, 0, "could not find any valid magic files!");
787e8af9738SPeter Avalos return -1;
788e8af9738SPeter Avalos }
789e8af9738SPeter Avalos
790e8af9738SPeter Avalos #if 0
791e8af9738SPeter Avalos /*
792e8af9738SPeter Avalos * Always leave the database loaded
793e8af9738SPeter Avalos */
794e8af9738SPeter Avalos if (action == FILE_LOAD)
795e8af9738SPeter Avalos return 0;
796e8af9738SPeter Avalos
797e8af9738SPeter Avalos for (i = 0; i < MAGIC_SETS; i++) {
798e8af9738SPeter Avalos mlist_free(ms->mlist[i]);
799e8af9738SPeter Avalos ms->mlist[i] = NULL;
800e8af9738SPeter Avalos }
801e8af9738SPeter Avalos #endif
802e8af9738SPeter Avalos
803e8af9738SPeter Avalos switch (action) {
804e8af9738SPeter Avalos case FILE_LOAD:
805e8af9738SPeter Avalos case FILE_COMPILE:
806e8af9738SPeter Avalos case FILE_CHECK:
807e8af9738SPeter Avalos case FILE_LIST:
808e8af9738SPeter Avalos return 0;
809e8af9738SPeter Avalos default:
810e8af9738SPeter Avalos file_error(ms, 0, "Invalid action %d", action);
811e8af9738SPeter Avalos return -1;
812e8af9738SPeter Avalos }
813e8af9738SPeter Avalos }
814e8af9738SPeter Avalos
/*
 * Estimate how specific a regular expression is by counting the
 * characters that must match literally:
 *	- a backslash together with the character it escapes counts 1
 *	- the magic characters ? * . + ^ $ count 0
 *	- a [] expression counts 1 (through its closing ']')
 *	- a {} expression counts 0
 *	- every other character counts 1
 * The result is never 0; an expression that scores nothing yields 1.
 */
private size_t
nonmagic(const char *str)
{
	const char *cp = str;
	size_t count = 0;

	while (*cp != '\0') {
		switch (*cp) {
		case '\\':
			/* Step onto the escaped character unless it is NUL. */
			if (cp[1] != '\0')
				cp++;
			count++;
			break;
		case '?':
		case '*':
		case '.':
		case '+':
		case '^':
		case '$':
			break;
		case '[':
			while (*cp != '\0' && *cp != ']')
				cp++;
			/*
			 * Back up one so the next step lands on the ']' (which
			 * is then counted as an ordinary character) or on the
			 * terminating NUL of an unclosed bracket.
			 */
			cp--;
			break;
		case '{':
			while (*cp != '\0' && *cp != '}')
				cp++;
			/* Unclosed brace: make the next step land on the NUL. */
			if (*cp == '\0')
				cp--;
			break;
		default:
			count++;
			break;
		}
		cp++;
	}

	return count == 0 ? 1 : count;
}
863327e51cbSPeter Avalos
864c30bd091SSascha Wildner
865c30bd091SSascha Wildner private size_t
typesize(int type)866c30bd091SSascha Wildner typesize(int type)
867c30bd091SSascha Wildner {
868c30bd091SSascha Wildner switch (type) {
869c30bd091SSascha Wildner case FILE_BYTE:
870c30bd091SSascha Wildner return 1;
871c30bd091SSascha Wildner
872c30bd091SSascha Wildner case FILE_SHORT:
873c30bd091SSascha Wildner case FILE_LESHORT:
874c30bd091SSascha Wildner case FILE_BESHORT:
875*3b9cdfa3SAntonio Huete Jimenez case FILE_MSDOSDATE:
876*3b9cdfa3SAntonio Huete Jimenez case FILE_BEMSDOSDATE:
877*3b9cdfa3SAntonio Huete Jimenez case FILE_LEMSDOSDATE:
878*3b9cdfa3SAntonio Huete Jimenez case FILE_MSDOSTIME:
879*3b9cdfa3SAntonio Huete Jimenez case FILE_BEMSDOSTIME:
880*3b9cdfa3SAntonio Huete Jimenez case FILE_LEMSDOSTIME:
881c30bd091SSascha Wildner return 2;
882c30bd091SSascha Wildner
883c30bd091SSascha Wildner case FILE_LONG:
884c30bd091SSascha Wildner case FILE_LELONG:
885c30bd091SSascha Wildner case FILE_BELONG:
886c30bd091SSascha Wildner case FILE_MELONG:
887c30bd091SSascha Wildner return 4;
888c30bd091SSascha Wildner
889c30bd091SSascha Wildner case FILE_DATE:
890c30bd091SSascha Wildner case FILE_LEDATE:
891c30bd091SSascha Wildner case FILE_BEDATE:
892c30bd091SSascha Wildner case FILE_MEDATE:
893c30bd091SSascha Wildner case FILE_LDATE:
894c30bd091SSascha Wildner case FILE_LELDATE:
895c30bd091SSascha Wildner case FILE_BELDATE:
896c30bd091SSascha Wildner case FILE_MELDATE:
897c30bd091SSascha Wildner case FILE_FLOAT:
898c30bd091SSascha Wildner case FILE_BEFLOAT:
899c30bd091SSascha Wildner case FILE_LEFLOAT:
900*3b9cdfa3SAntonio Huete Jimenez case FILE_BEID3:
901*3b9cdfa3SAntonio Huete Jimenez case FILE_LEID3:
902c30bd091SSascha Wildner return 4;
903c30bd091SSascha Wildner
904c30bd091SSascha Wildner case FILE_QUAD:
905c30bd091SSascha Wildner case FILE_BEQUAD:
906c30bd091SSascha Wildner case FILE_LEQUAD:
907c30bd091SSascha Wildner case FILE_QDATE:
908c30bd091SSascha Wildner case FILE_LEQDATE:
909c30bd091SSascha Wildner case FILE_BEQDATE:
910c30bd091SSascha Wildner case FILE_QLDATE:
911c30bd091SSascha Wildner case FILE_LEQLDATE:
912c30bd091SSascha Wildner case FILE_BEQLDATE:
913c30bd091SSascha Wildner case FILE_QWDATE:
914c30bd091SSascha Wildner case FILE_LEQWDATE:
915c30bd091SSascha Wildner case FILE_BEQWDATE:
916c30bd091SSascha Wildner case FILE_DOUBLE:
917c30bd091SSascha Wildner case FILE_BEDOUBLE:
918c30bd091SSascha Wildner case FILE_LEDOUBLE:
919c990e5baSDaniel Fojt case FILE_OFFSET:
920614728caSSascha Wildner case FILE_BEVARINT:
921614728caSSascha Wildner case FILE_LEVARINT:
922c30bd091SSascha Wildner return 8;
923c990e5baSDaniel Fojt
924c990e5baSDaniel Fojt case FILE_GUID:
925c990e5baSDaniel Fojt return 16;
926c990e5baSDaniel Fojt
927c30bd091SSascha Wildner default:
928c990e5baSDaniel Fojt return FILE_BADSIZE;
929c30bd091SSascha Wildner }
930c30bd091SSascha Wildner }
931c30bd091SSascha Wildner
932327e51cbSPeter Avalos /*
933327e51cbSPeter Avalos * Get weight of this magic entry, for sorting purposes.
934327e51cbSPeter Avalos */
935*3b9cdfa3SAntonio Huete Jimenez private ssize_t
apprentice_magic_strength_1(const struct magic * m)936*3b9cdfa3SAntonio Huete Jimenez apprentice_magic_strength_1(const struct magic *m)
937327e51cbSPeter Avalos {
9386fca56fbSSascha Wildner #define MULT 10U
9396fca56fbSSascha Wildner size_t ts, v;
9406fca56fbSSascha Wildner ssize_t val = 2 * MULT; /* baseline strength */
941327e51cbSPeter Avalos
942327e51cbSPeter Avalos switch (m->type) {
943327e51cbSPeter Avalos case FILE_DEFAULT: /* make sure this sorts last */
944*3b9cdfa3SAntonio Huete Jimenez if (m->factor_op != FILE_FACTOR_OP_NONE) {
945*3b9cdfa3SAntonio Huete Jimenez fprintf(stderr, "Bad factor_op %d", m->factor_op);
94679343712SPeter Avalos abort();
947*3b9cdfa3SAntonio Huete Jimenez }
948327e51cbSPeter Avalos return 0;
949327e51cbSPeter Avalos
950327e51cbSPeter Avalos case FILE_BYTE:
951327e51cbSPeter Avalos case FILE_SHORT:
952327e51cbSPeter Avalos case FILE_LESHORT:
953327e51cbSPeter Avalos case FILE_BESHORT:
954327e51cbSPeter Avalos case FILE_LONG:
955327e51cbSPeter Avalos case FILE_LELONG:
956327e51cbSPeter Avalos case FILE_BELONG:
957327e51cbSPeter Avalos case FILE_MELONG:
958c30bd091SSascha Wildner case FILE_DATE:
959c30bd091SSascha Wildner case FILE_LEDATE:
960c30bd091SSascha Wildner case FILE_BEDATE:
961c30bd091SSascha Wildner case FILE_MEDATE:
962c30bd091SSascha Wildner case FILE_LDATE:
963c30bd091SSascha Wildner case FILE_LELDATE:
964c30bd091SSascha Wildner case FILE_BELDATE:
965c30bd091SSascha Wildner case FILE_MELDATE:
966c30bd091SSascha Wildner case FILE_FLOAT:
967c30bd091SSascha Wildner case FILE_BEFLOAT:
968c30bd091SSascha Wildner case FILE_LEFLOAT:
969c30bd091SSascha Wildner case FILE_QUAD:
970c30bd091SSascha Wildner case FILE_BEQUAD:
971c30bd091SSascha Wildner case FILE_LEQUAD:
972c30bd091SSascha Wildner case FILE_QDATE:
973c30bd091SSascha Wildner case FILE_LEQDATE:
974c30bd091SSascha Wildner case FILE_BEQDATE:
975c30bd091SSascha Wildner case FILE_QLDATE:
976c30bd091SSascha Wildner case FILE_LEQLDATE:
977c30bd091SSascha Wildner case FILE_BEQLDATE:
978c30bd091SSascha Wildner case FILE_QWDATE:
979c30bd091SSascha Wildner case FILE_LEQWDATE:
980c30bd091SSascha Wildner case FILE_BEQWDATE:
981c30bd091SSascha Wildner case FILE_DOUBLE:
982c30bd091SSascha Wildner case FILE_BEDOUBLE:
983c30bd091SSascha Wildner case FILE_LEDOUBLE:
984614728caSSascha Wildner case FILE_BEVARINT:
985614728caSSascha Wildner case FILE_LEVARINT:
986c990e5baSDaniel Fojt case FILE_GUID:
987*3b9cdfa3SAntonio Huete Jimenez case FILE_BEID3:
988*3b9cdfa3SAntonio Huete Jimenez case FILE_LEID3:
989c990e5baSDaniel Fojt case FILE_OFFSET:
990*3b9cdfa3SAntonio Huete Jimenez case FILE_MSDOSDATE:
991*3b9cdfa3SAntonio Huete Jimenez case FILE_BEMSDOSDATE:
992*3b9cdfa3SAntonio Huete Jimenez case FILE_LEMSDOSDATE:
993*3b9cdfa3SAntonio Huete Jimenez case FILE_MSDOSTIME:
994*3b9cdfa3SAntonio Huete Jimenez case FILE_BEMSDOSTIME:
995*3b9cdfa3SAntonio Huete Jimenez case FILE_LEMSDOSTIME:
996c30bd091SSascha Wildner ts = typesize(m->type);
997*3b9cdfa3SAntonio Huete Jimenez if (ts == FILE_BADSIZE) {
998*3b9cdfa3SAntonio Huete Jimenez (void)fprintf(stderr, "Bad size for type %d\n",
999*3b9cdfa3SAntonio Huete Jimenez m->type);
1000c30bd091SSascha Wildner abort();
1001*3b9cdfa3SAntonio Huete Jimenez }
1002c30bd091SSascha Wildner val += ts * MULT;
1003327e51cbSPeter Avalos break;
1004327e51cbSPeter Avalos
1005327e51cbSPeter Avalos case FILE_PSTRING:
1006327e51cbSPeter Avalos case FILE_STRING:
1007*3b9cdfa3SAntonio Huete Jimenez case FILE_OCTAL:
1008327e51cbSPeter Avalos val += m->vallen * MULT;
1009327e51cbSPeter Avalos break;
1010327e51cbSPeter Avalos
1011327e51cbSPeter Avalos case FILE_BESTRING16:
1012327e51cbSPeter Avalos case FILE_LESTRING16:
1013327e51cbSPeter Avalos val += m->vallen * MULT / 2;
1014327e51cbSPeter Avalos break;
1015327e51cbSPeter Avalos
1016327e51cbSPeter Avalos case FILE_SEARCH:
10176fca56fbSSascha Wildner if (m->vallen == 0)
10186fca56fbSSascha Wildner break;
101979343712SPeter Avalos val += m->vallen * MAX(MULT / m->vallen, 1);
1020327e51cbSPeter Avalos break;
1021327e51cbSPeter Avalos
1022e8af9738SPeter Avalos case FILE_REGEX:
1023e8af9738SPeter Avalos v = nonmagic(m->value.s);
1024e8af9738SPeter Avalos val += v * MAX(MULT / v, 1);
1025e8af9738SPeter Avalos break;
1026e8af9738SPeter Avalos
1027e8af9738SPeter Avalos case FILE_INDIRECT:
1028e8af9738SPeter Avalos case FILE_NAME:
1029e8af9738SPeter Avalos case FILE_USE:
1030*3b9cdfa3SAntonio Huete Jimenez case FILE_CLEAR:
1031e8af9738SPeter Avalos break;
1032e8af9738SPeter Avalos
1033c30bd091SSascha Wildner case FILE_DER:
1034c30bd091SSascha Wildner val += MULT;
1035c30bd091SSascha Wildner break;
1036c30bd091SSascha Wildner
1037327e51cbSPeter Avalos default:
1038327e51cbSPeter Avalos (void)fprintf(stderr, "Bad type %d\n", m->type);
1039327e51cbSPeter Avalos abort();
1040327e51cbSPeter Avalos }
1041327e51cbSPeter Avalos
1042327e51cbSPeter Avalos switch (m->reln) {
1043327e51cbSPeter Avalos case 'x': /* matches anything penalize */
104479343712SPeter Avalos case '!': /* matches almost anything penalize */
1045327e51cbSPeter Avalos val = 0;
1046327e51cbSPeter Avalos break;
1047327e51cbSPeter Avalos
1048327e51cbSPeter Avalos case '=': /* Exact match, prefer */
1049327e51cbSPeter Avalos val += MULT;
1050327e51cbSPeter Avalos break;
1051327e51cbSPeter Avalos
1052327e51cbSPeter Avalos case '>':
1053327e51cbSPeter Avalos case '<': /* comparison match reduce strength */
1054327e51cbSPeter Avalos val -= 2 * MULT;
1055327e51cbSPeter Avalos break;
1056327e51cbSPeter Avalos
1057327e51cbSPeter Avalos case '^':
1058327e51cbSPeter Avalos case '&': /* masking bits, we could count them too */
1059327e51cbSPeter Avalos val -= MULT;
1060327e51cbSPeter Avalos break;
1061327e51cbSPeter Avalos
1062327e51cbSPeter Avalos default:
1063327e51cbSPeter Avalos (void)fprintf(stderr, "Bad relation %c\n", m->reln);
1064327e51cbSPeter Avalos abort();
1065327e51cbSPeter Avalos }
1066327e51cbSPeter Avalos
1067*3b9cdfa3SAntonio Huete Jimenez return val;
1068*3b9cdfa3SAntonio Huete Jimenez }
1069*3b9cdfa3SAntonio Huete Jimenez
1070*3b9cdfa3SAntonio Huete Jimenez
1071*3b9cdfa3SAntonio Huete Jimenez /*ARGSUSED*/
1072*3b9cdfa3SAntonio Huete Jimenez private size_t
apprentice_magic_strength(const struct magic * m,size_t nmagic)1073*3b9cdfa3SAntonio Huete Jimenez apprentice_magic_strength(const struct magic *m,
1074*3b9cdfa3SAntonio Huete Jimenez size_t nmagic __attribute__((__unused__)))
1075*3b9cdfa3SAntonio Huete Jimenez {
1076*3b9cdfa3SAntonio Huete Jimenez ssize_t val = apprentice_magic_strength_1(m);
1077*3b9cdfa3SAntonio Huete Jimenez
1078*3b9cdfa3SAntonio Huete Jimenez #ifdef notyet
1079*3b9cdfa3SAntonio Huete Jimenez if (m->desc[0] == '\0') {
1080*3b9cdfa3SAntonio Huete Jimenez size_t i;
1081*3b9cdfa3SAntonio Huete Jimenez /*
1082*3b9cdfa3SAntonio Huete Jimenez * Magic entries with no description get their continuations
1083*3b9cdfa3SAntonio Huete Jimenez * added
1084*3b9cdfa3SAntonio Huete Jimenez */
1085*3b9cdfa3SAntonio Huete Jimenez for (i = 1; m[i].cont_level != 0 && i < MIN(nmagic, 3); i++) {
1086*3b9cdfa3SAntonio Huete Jimenez ssize_t v = apprentice_magic_strength_1(&m[i]) >>
1087*3b9cdfa3SAntonio Huete Jimenez (i + 1);
1088*3b9cdfa3SAntonio Huete Jimenez val += v;
1089*3b9cdfa3SAntonio Huete Jimenez if (m[i].desc[0] != '\0')
1090*3b9cdfa3SAntonio Huete Jimenez break;
1091*3b9cdfa3SAntonio Huete Jimenez }
1092*3b9cdfa3SAntonio Huete Jimenez }
1093*3b9cdfa3SAntonio Huete Jimenez #endif
1094*3b9cdfa3SAntonio Huete Jimenez
109579343712SPeter Avalos switch (m->factor_op) {
109679343712SPeter Avalos case FILE_FACTOR_OP_NONE:
109779343712SPeter Avalos break;
109879343712SPeter Avalos case FILE_FACTOR_OP_PLUS:
109979343712SPeter Avalos val += m->factor;
110079343712SPeter Avalos break;
110179343712SPeter Avalos case FILE_FACTOR_OP_MINUS:
110279343712SPeter Avalos val -= m->factor;
110379343712SPeter Avalos break;
110479343712SPeter Avalos case FILE_FACTOR_OP_TIMES:
110579343712SPeter Avalos val *= m->factor;
110679343712SPeter Avalos break;
110779343712SPeter Avalos case FILE_FACTOR_OP_DIV:
110879343712SPeter Avalos val /= m->factor;
110979343712SPeter Avalos break;
111079343712SPeter Avalos default:
1111*3b9cdfa3SAntonio Huete Jimenez (void)fprintf(stderr, "Bad factor_op %u\n", m->factor_op);
111279343712SPeter Avalos abort();
111379343712SPeter Avalos }
111479343712SPeter Avalos
11156fca56fbSSascha Wildner if (val <= 0) /* ensure we only return 0 for FILE_DEFAULT */
11166fca56fbSSascha Wildner val = 1;
11176fca56fbSSascha Wildner
1118*3b9cdfa3SAntonio Huete Jimenez #ifndef notyet
111979343712SPeter Avalos /*
112079343712SPeter Avalos * Magic entries with no description get a bonus because they depend
112179343712SPeter Avalos * on subsequent magic entries to print something.
112279343712SPeter Avalos */
112379343712SPeter Avalos if (m->desc[0] == '\0')
112479343712SPeter Avalos val++;
1125*3b9cdfa3SAntonio Huete Jimenez #endif
1126*3b9cdfa3SAntonio Huete Jimenez
1127327e51cbSPeter Avalos return val;
1128327e51cbSPeter Avalos }
1129327e51cbSPeter Avalos
1130327e51cbSPeter Avalos /*
1131327e51cbSPeter Avalos * Sort callback for sorting entries by "strength" (basically length)
1132327e51cbSPeter Avalos */
1133327e51cbSPeter Avalos private int
apprentice_sort(const void * a,const void * b)1134327e51cbSPeter Avalos apprentice_sort(const void *a, const void *b)
1135327e51cbSPeter Avalos {
113679343712SPeter Avalos const struct magic_entry *ma = CAST(const struct magic_entry *, a);
113779343712SPeter Avalos const struct magic_entry *mb = CAST(const struct magic_entry *, b);
1138*3b9cdfa3SAntonio Huete Jimenez size_t sa = apprentice_magic_strength(ma->mp, ma->cont_count);
1139*3b9cdfa3SAntonio Huete Jimenez size_t sb = apprentice_magic_strength(mb->mp, mb->cont_count);
1140327e51cbSPeter Avalos if (sa == sb)
1141327e51cbSPeter Avalos return 0;
1142327e51cbSPeter Avalos else if (sa > sb)
1143327e51cbSPeter Avalos return -1;
1144327e51cbSPeter Avalos else
1145327e51cbSPeter Avalos return 1;
1146327e51cbSPeter Avalos }
1147327e51cbSPeter Avalos
1148e4d4ce0cSPeter Avalos /*
1149e4d4ce0cSPeter Avalos * Shows sorted patterns list in the order which is used for the matching
1150e4d4ce0cSPeter Avalos */
1151e4d4ce0cSPeter Avalos private void
apprentice_list(struct mlist * mlist,int mode)1152e4d4ce0cSPeter Avalos apprentice_list(struct mlist *mlist, int mode)
1153e4d4ce0cSPeter Avalos {
1154*3b9cdfa3SAntonio Huete Jimenez uint32_t magindex, descindex, mimeindex, lineindex;
1155e4d4ce0cSPeter Avalos struct mlist *ml;
1156e4d4ce0cSPeter Avalos for (ml = mlist->next; ml != mlist; ml = ml->next) {
1157e4d4ce0cSPeter Avalos for (magindex = 0; magindex < ml->nmagic; magindex++) {
1158e4d4ce0cSPeter Avalos struct magic *m = &ml->magic[magindex];
1159e4d4ce0cSPeter Avalos if ((m->flag & mode) != mode) {
1160e4d4ce0cSPeter Avalos /* Skip sub-tests */
1161e4d4ce0cSPeter Avalos while (magindex + 1 < ml->nmagic &&
1162e4d4ce0cSPeter Avalos ml->magic[magindex + 1].cont_level != 0)
1163e4d4ce0cSPeter Avalos ++magindex;
1164e4d4ce0cSPeter Avalos continue; /* Skip to next top-level test*/
1165e4d4ce0cSPeter Avalos }
1166e4d4ce0cSPeter Avalos
1167e4d4ce0cSPeter Avalos /*
1168e4d4ce0cSPeter Avalos * Try to iterate over the tree until we find item with
1169e4d4ce0cSPeter Avalos * description/mimetype.
1170e4d4ce0cSPeter Avalos */
1171*3b9cdfa3SAntonio Huete Jimenez lineindex = descindex = mimeindex = magindex;
1172*3b9cdfa3SAntonio Huete Jimenez for (magindex++; magindex < ml->nmagic &&
1173*3b9cdfa3SAntonio Huete Jimenez ml->magic[magindex].cont_level != 0; magindex++) {
1174*3b9cdfa3SAntonio Huete Jimenez if (*ml->magic[descindex].desc == '\0'
1175*3b9cdfa3SAntonio Huete Jimenez && *ml->magic[magindex].desc)
1176*3b9cdfa3SAntonio Huete Jimenez descindex = magindex;
1177*3b9cdfa3SAntonio Huete Jimenez if (*ml->magic[mimeindex].mimetype == '\0'
1178*3b9cdfa3SAntonio Huete Jimenez && *ml->magic[magindex].mimetype)
1179*3b9cdfa3SAntonio Huete Jimenez mimeindex = magindex;
1180*3b9cdfa3SAntonio Huete Jimenez }
1181e4d4ce0cSPeter Avalos
1182c30bd091SSascha Wildner printf("Strength = %3" SIZE_T_FORMAT "u@%u: %s [%s]\n",
1183*3b9cdfa3SAntonio Huete Jimenez apprentice_magic_strength(m, ml->nmagic - magindex),
1184*3b9cdfa3SAntonio Huete Jimenez ml->magic[lineindex].lineno,
1185*3b9cdfa3SAntonio Huete Jimenez ml->magic[descindex].desc,
1186*3b9cdfa3SAntonio Huete Jimenez ml->magic[mimeindex].mimetype);
1187e4d4ce0cSPeter Avalos }
1188e4d4ce0cSPeter Avalos }
1189e4d4ce0cSPeter Avalos }
1190e4d4ce0cSPeter Avalos
119179343712SPeter Avalos private void
set_test_type(struct magic * mstart,struct magic * m)119279343712SPeter Avalos set_test_type(struct magic *mstart, struct magic *m)
1193327e51cbSPeter Avalos {
119479343712SPeter Avalos switch (m->type) {
119579343712SPeter Avalos case FILE_BYTE:
119679343712SPeter Avalos case FILE_SHORT:
119779343712SPeter Avalos case FILE_LONG:
119879343712SPeter Avalos case FILE_DATE:
119979343712SPeter Avalos case FILE_BESHORT:
120079343712SPeter Avalos case FILE_BELONG:
120179343712SPeter Avalos case FILE_BEDATE:
120279343712SPeter Avalos case FILE_LESHORT:
120379343712SPeter Avalos case FILE_LELONG:
120479343712SPeter Avalos case FILE_LEDATE:
120579343712SPeter Avalos case FILE_LDATE:
120679343712SPeter Avalos case FILE_BELDATE:
120779343712SPeter Avalos case FILE_LELDATE:
120879343712SPeter Avalos case FILE_MEDATE:
120979343712SPeter Avalos case FILE_MELDATE:
121079343712SPeter Avalos case FILE_MELONG:
121179343712SPeter Avalos case FILE_QUAD:
121279343712SPeter Avalos case FILE_LEQUAD:
121379343712SPeter Avalos case FILE_BEQUAD:
121479343712SPeter Avalos case FILE_QDATE:
121579343712SPeter Avalos case FILE_LEQDATE:
121679343712SPeter Avalos case FILE_BEQDATE:
121779343712SPeter Avalos case FILE_QLDATE:
121879343712SPeter Avalos case FILE_LEQLDATE:
121979343712SPeter Avalos case FILE_BEQLDATE:
1220e8af9738SPeter Avalos case FILE_QWDATE:
1221e8af9738SPeter Avalos case FILE_LEQWDATE:
1222e8af9738SPeter Avalos case FILE_BEQWDATE:
122379343712SPeter Avalos case FILE_FLOAT:
122479343712SPeter Avalos case FILE_BEFLOAT:
122579343712SPeter Avalos case FILE_LEFLOAT:
122679343712SPeter Avalos case FILE_DOUBLE:
122779343712SPeter Avalos case FILE_BEDOUBLE:
122879343712SPeter Avalos case FILE_LEDOUBLE:
1229614728caSSascha Wildner case FILE_BEVARINT:
1230614728caSSascha Wildner case FILE_LEVARINT:
1231c30bd091SSascha Wildner case FILE_DER:
1232c990e5baSDaniel Fojt case FILE_GUID:
1233c990e5baSDaniel Fojt case FILE_OFFSET:
1234*3b9cdfa3SAntonio Huete Jimenez case FILE_MSDOSDATE:
1235*3b9cdfa3SAntonio Huete Jimenez case FILE_BEMSDOSDATE:
1236*3b9cdfa3SAntonio Huete Jimenez case FILE_LEMSDOSDATE:
1237*3b9cdfa3SAntonio Huete Jimenez case FILE_MSDOSTIME:
1238*3b9cdfa3SAntonio Huete Jimenez case FILE_BEMSDOSTIME:
1239*3b9cdfa3SAntonio Huete Jimenez case FILE_LEMSDOSTIME:
1240*3b9cdfa3SAntonio Huete Jimenez case FILE_OCTAL:
1241ff91a668SPeter Avalos mstart->flag |= BINTEST;
1242ff91a668SPeter Avalos break;
124379343712SPeter Avalos case FILE_STRING:
124479343712SPeter Avalos case FILE_PSTRING:
124579343712SPeter Avalos case FILE_BESTRING16:
124679343712SPeter Avalos case FILE_LESTRING16:
1247e4d4ce0cSPeter Avalos /* Allow text overrides */
1248e4d4ce0cSPeter Avalos if (mstart->str_flags & STRING_TEXTTEST)
1249e4d4ce0cSPeter Avalos mstart->flag |= TEXTTEST;
1250e4d4ce0cSPeter Avalos else
125179343712SPeter Avalos mstart->flag |= BINTEST;
125279343712SPeter Avalos break;
125379343712SPeter Avalos case FILE_REGEX:
125479343712SPeter Avalos case FILE_SEARCH:
1255f72f8299SJan Lentfer /* Check for override */
1256f72f8299SJan Lentfer if (mstart->str_flags & STRING_BINTEST)
1257f72f8299SJan Lentfer mstart->flag |= BINTEST;
1258f72f8299SJan Lentfer if (mstart->str_flags & STRING_TEXTTEST)
1259f72f8299SJan Lentfer mstart->flag |= TEXTTEST;
1260f72f8299SJan Lentfer
1261f72f8299SJan Lentfer if (mstart->flag & (TEXTTEST|BINTEST))
1262f72f8299SJan Lentfer break;
1263f72f8299SJan Lentfer
126479343712SPeter Avalos /* binary test if pattern is not text */
12656fca56fbSSascha Wildner if (file_looks_utf8(m->value.us, CAST(size_t, m->vallen), NULL,
126679343712SPeter Avalos NULL) <= 0)
126779343712SPeter Avalos mstart->flag |= BINTEST;
1268f72f8299SJan Lentfer else
1269f72f8299SJan Lentfer mstart->flag |= TEXTTEST;
127079343712SPeter Avalos break;
127179343712SPeter Avalos case FILE_DEFAULT:
127279343712SPeter Avalos /* can't deduce anything; we shouldn't see this at the
127379343712SPeter Avalos top level anyway */
127479343712SPeter Avalos break;
127579343712SPeter Avalos case FILE_INVALID:
127679343712SPeter Avalos default:
127779343712SPeter Avalos /* invalid search type, but no need to complain here */
127879343712SPeter Avalos break;
127979343712SPeter Avalos }
128079343712SPeter Avalos }
128179343712SPeter Avalos
1282e8af9738SPeter Avalos private int
addentry(struct magic_set * ms,struct magic_entry * me,struct magic_entry_set * mset)1283e8af9738SPeter Avalos addentry(struct magic_set *ms, struct magic_entry *me,
1284e8af9738SPeter Avalos struct magic_entry_set *mset)
1285e8af9738SPeter Avalos {
1286e8af9738SPeter Avalos size_t i = me->mp->type == FILE_NAME ? 1 : 0;
1287*3b9cdfa3SAntonio Huete Jimenez if (mset[i].me == NULL || mset[i].count == mset[i].max) {
1288e8af9738SPeter Avalos struct magic_entry *mp;
1289e8af9738SPeter Avalos
1290*3b9cdfa3SAntonio Huete Jimenez size_t incr = mset[i].max + ALLOC_INCR;
1291e8af9738SPeter Avalos if ((mp = CAST(struct magic_entry *,
1292*3b9cdfa3SAntonio Huete Jimenez realloc(mset[i].me, sizeof(*mp) * incr))) ==
1293e8af9738SPeter Avalos NULL) {
1294*3b9cdfa3SAntonio Huete Jimenez file_oomem(ms, sizeof(*mp) * incr);
1295e8af9738SPeter Avalos return -1;
1296e8af9738SPeter Avalos }
1297e8af9738SPeter Avalos (void)memset(&mp[mset[i].count], 0, sizeof(*mp) *
1298e8af9738SPeter Avalos ALLOC_INCR);
1299e8af9738SPeter Avalos mset[i].me = mp;
1300*3b9cdfa3SAntonio Huete Jimenez mset[i].max = CAST(uint32_t, incr);
1301*3b9cdfa3SAntonio Huete Jimenez assert(mset[i].max == incr);
1302e8af9738SPeter Avalos }
1303e8af9738SPeter Avalos mset[i].me[mset[i].count++] = *me;
1304e8af9738SPeter Avalos memset(me, 0, sizeof(*me));
1305e8af9738SPeter Avalos return 0;
1306e8af9738SPeter Avalos }
1307e8af9738SPeter Avalos
130879343712SPeter Avalos /*
130979343712SPeter Avalos * Load and parse one file.
131079343712SPeter Avalos */
131179343712SPeter Avalos private void
load_1(struct magic_set * ms,int action,const char * fn,int * errs,struct magic_entry_set * mset)131279343712SPeter Avalos load_1(struct magic_set *ms, int action, const char *fn, int *errs,
1313e8af9738SPeter Avalos struct magic_entry_set *mset)
131479343712SPeter Avalos {
1315ff91a668SPeter Avalos size_t lineno = 0, llen = 0;
1316ff91a668SPeter Avalos char *line = NULL;
1317ff91a668SPeter Avalos ssize_t len;
1318e8af9738SPeter Avalos struct magic_entry me;
1319ff91a668SPeter Avalos
132079343712SPeter Avalos FILE *f = fopen(ms->file = fn, "r");
1321327e51cbSPeter Avalos if (f == NULL) {
1322327e51cbSPeter Avalos if (errno != ENOENT)
1323327e51cbSPeter Avalos file_error(ms, errno, "cannot read magic file `%s'",
1324327e51cbSPeter Avalos fn);
132579343712SPeter Avalos (*errs)++;
1326ff91a668SPeter Avalos return;
1327ff91a668SPeter Avalos }
1328ff91a668SPeter Avalos
1329e8af9738SPeter Avalos memset(&me, 0, sizeof(me));
1330327e51cbSPeter Avalos /* read and parse this file */
1331ff91a668SPeter Avalos for (ms->line = 1; (len = getline(&line, &llen, f)) != -1;
1332f72f8299SJan Lentfer ms->line++) {
1333327e51cbSPeter Avalos if (len == 0) /* null line, garbage, etc */
1334327e51cbSPeter Avalos continue;
1335327e51cbSPeter Avalos if (line[len - 1] == '\n') {
1336327e51cbSPeter Avalos lineno++;
1337327e51cbSPeter Avalos line[len - 1] = '\0'; /* delete newline */
1338327e51cbSPeter Avalos }
1339ff91a668SPeter Avalos switch (line[0]) {
1340ff91a668SPeter Avalos case '\0': /* empty, do not parse */
1341ff91a668SPeter Avalos case '#': /* comment, do not parse */
1342327e51cbSPeter Avalos continue;
1343ff91a668SPeter Avalos case '!':
1344ff91a668SPeter Avalos if (line[1] == ':') {
134579343712SPeter Avalos size_t i;
134679343712SPeter Avalos
134779343712SPeter Avalos for (i = 0; bang[i].name != NULL; i++) {
13486fca56fbSSascha Wildner if (CAST(size_t, len - 2) > bang[i].len &&
134979343712SPeter Avalos memcmp(bang[i].name, line + 2,
135079343712SPeter Avalos bang[i].len) == 0)
135179343712SPeter Avalos break;
135279343712SPeter Avalos }
135379343712SPeter Avalos if (bang[i].name == NULL) {
135479343712SPeter Avalos file_error(ms, 0,
135579343712SPeter Avalos "Unknown !: entry `%s'", line);
135679343712SPeter Avalos (*errs)++;
135779343712SPeter Avalos continue;
135879343712SPeter Avalos }
1359e8af9738SPeter Avalos if (me.mp == NULL) {
136079343712SPeter Avalos file_error(ms, 0,
136179343712SPeter Avalos "No current entry for :!%s type",
136279343712SPeter Avalos bang[i].name);
136379343712SPeter Avalos (*errs)++;
136479343712SPeter Avalos continue;
136579343712SPeter Avalos }
1366e8af9738SPeter Avalos if ((*bang[i].fun)(ms, &me,
1367c990e5baSDaniel Fojt line + bang[i].len + 2,
1368c990e5baSDaniel Fojt len - bang[i].len - 2) != 0) {
136979343712SPeter Avalos (*errs)++;
137079343712SPeter Avalos continue;
137179343712SPeter Avalos }
137279343712SPeter Avalos continue;
137379343712SPeter Avalos }
1374ff91a668SPeter Avalos /*FALLTHROUGH*/
1375ff91a668SPeter Avalos default:
1376e8af9738SPeter Avalos again:
1377e8af9738SPeter Avalos switch (parse(ms, &me, line, lineno, action)) {
1378e8af9738SPeter Avalos case 0:
1379e8af9738SPeter Avalos continue;
1380e8af9738SPeter Avalos case 1:
1381e8af9738SPeter Avalos (void)addentry(ms, &me, mset);
1382e8af9738SPeter Avalos goto again;
1383e8af9738SPeter Avalos default:
138479343712SPeter Avalos (*errs)++;
1385ff91a668SPeter Avalos break;
1386327e51cbSPeter Avalos }
1387ff91a668SPeter Avalos }
1388e8af9738SPeter Avalos }
1389e8af9738SPeter Avalos if (me.mp)
1390e8af9738SPeter Avalos (void)addentry(ms, &me, mset);
1391ff91a668SPeter Avalos free(line);
1392327e51cbSPeter Avalos (void)fclose(f);
139379343712SPeter Avalos }
139479343712SPeter Avalos
139579343712SPeter Avalos /*
139679343712SPeter Avalos * parse a file or directory of files
139779343712SPeter Avalos * const char *fn: name of magic file or directory
139879343712SPeter Avalos */
139979343712SPeter Avalos private int
cmpstrp(const void * p1,const void * p2)1400f72f8299SJan Lentfer cmpstrp(const void *p1, const void *p2)
1401f72f8299SJan Lentfer {
14026fca56fbSSascha Wildner return strcmp(*RCAST(char *const *, p1), *RCAST(char *const *, p2));
1403f72f8299SJan Lentfer }
1404f72f8299SJan Lentfer
1405e8af9738SPeter Avalos
1406e8af9738SPeter Avalos private uint32_t
set_text_binary(struct magic_set * ms,struct magic_entry * me,uint32_t nme,uint32_t starttest)1407e8af9738SPeter Avalos set_text_binary(struct magic_set *ms, struct magic_entry *me, uint32_t nme,
1408e8af9738SPeter Avalos uint32_t starttest)
1409e8af9738SPeter Avalos {
1410e8af9738SPeter Avalos static const char text[] = "text";
1411e8af9738SPeter Avalos static const char binary[] = "binary";
1412e8af9738SPeter Avalos static const size_t len = sizeof(text);
1413e8af9738SPeter Avalos
1414e8af9738SPeter Avalos uint32_t i = starttest;
1415e8af9738SPeter Avalos
1416e8af9738SPeter Avalos do {
1417e8af9738SPeter Avalos set_test_type(me[starttest].mp, me[i].mp);
1418e8af9738SPeter Avalos if ((ms->flags & MAGIC_DEBUG) == 0)
1419e8af9738SPeter Avalos continue;
1420e8af9738SPeter Avalos (void)fprintf(stderr, "%s%s%s: %s\n",
1421e8af9738SPeter Avalos me[i].mp->mimetype,
1422e8af9738SPeter Avalos me[i].mp->mimetype[0] == '\0' ? "" : "; ",
1423e8af9738SPeter Avalos me[i].mp->desc[0] ? me[i].mp->desc : "(no description)",
1424e8af9738SPeter Avalos me[i].mp->flag & BINTEST ? binary : text);
1425e8af9738SPeter Avalos if (me[i].mp->flag & BINTEST) {
1426e8af9738SPeter Avalos char *p = strstr(me[i].mp->desc, text);
1427e8af9738SPeter Avalos if (p && (p == me[i].mp->desc ||
14286fca56fbSSascha Wildner isspace(CAST(unsigned char, p[-1]))) &&
1429e8af9738SPeter Avalos (p + len - me[i].mp->desc == MAXstring
1430e8af9738SPeter Avalos || (p[len] == '\0' ||
14316fca56fbSSascha Wildner isspace(CAST(unsigned char, p[len])))))
1432e8af9738SPeter Avalos (void)fprintf(stderr, "*** Possible "
1433e8af9738SPeter Avalos "binary test for text type\n");
1434e8af9738SPeter Avalos }
1435e8af9738SPeter Avalos } while (++i < nme && me[i].mp->cont_level != 0);
1436e8af9738SPeter Avalos return i;
1437e8af9738SPeter Avalos }
1438e8af9738SPeter Avalos
1439e8af9738SPeter Avalos private void
set_last_default(struct magic_set * ms,struct magic_entry * me,uint32_t nme)1440e8af9738SPeter Avalos set_last_default(struct magic_set *ms, struct magic_entry *me, uint32_t nme)
1441e8af9738SPeter Avalos {
1442e8af9738SPeter Avalos uint32_t i;
1443e8af9738SPeter Avalos for (i = 0; i < nme; i++) {
1444e8af9738SPeter Avalos if (me[i].mp->cont_level == 0 &&
1445e8af9738SPeter Avalos me[i].mp->type == FILE_DEFAULT) {
1446e8af9738SPeter Avalos while (++i < nme)
1447e8af9738SPeter Avalos if (me[i].mp->cont_level == 0)
1448e8af9738SPeter Avalos break;
1449e8af9738SPeter Avalos if (i != nme) {
1450e8af9738SPeter Avalos /* XXX - Ugh! */
1451e8af9738SPeter Avalos ms->line = me[i].mp->lineno;
1452e8af9738SPeter Avalos file_magwarn(ms,
1453e8af9738SPeter Avalos "level 0 \"default\" did not sort last");
1454e8af9738SPeter Avalos }
1455e8af9738SPeter Avalos return;
1456e8af9738SPeter Avalos }
1457e8af9738SPeter Avalos }
1458e8af9738SPeter Avalos }
1459e8af9738SPeter Avalos
1460f72f8299SJan Lentfer private int
coalesce_entries(struct magic_set * ms,struct magic_entry * me,uint32_t nme,struct magic ** ma,uint32_t * nma)1461e8af9738SPeter Avalos coalesce_entries(struct magic_set *ms, struct magic_entry *me, uint32_t nme,
1462e8af9738SPeter Avalos struct magic **ma, uint32_t *nma)
1463e8af9738SPeter Avalos {
1464e8af9738SPeter Avalos uint32_t i, mentrycount = 0;
1465e8af9738SPeter Avalos size_t slen;
1466e8af9738SPeter Avalos
1467e8af9738SPeter Avalos for (i = 0; i < nme; i++)
1468e8af9738SPeter Avalos mentrycount += me[i].cont_count;
1469e8af9738SPeter Avalos
1470614728caSSascha Wildner if (mentrycount == 0) {
1471614728caSSascha Wildner *ma = NULL;
1472614728caSSascha Wildner *nma = 0;
1473614728caSSascha Wildner return 0;
1474614728caSSascha Wildner }
1475614728caSSascha Wildner
1476e8af9738SPeter Avalos slen = sizeof(**ma) * mentrycount;
1477e8af9738SPeter Avalos if ((*ma = CAST(struct magic *, malloc(slen))) == NULL) {
1478e8af9738SPeter Avalos file_oomem(ms, slen);
1479e8af9738SPeter Avalos return -1;
1480e8af9738SPeter Avalos }
1481e8af9738SPeter Avalos
1482e8af9738SPeter Avalos mentrycount = 0;
1483e8af9738SPeter Avalos for (i = 0; i < nme; i++) {
1484e8af9738SPeter Avalos (void)memcpy(*ma + mentrycount, me[i].mp,
1485e8af9738SPeter Avalos me[i].cont_count * sizeof(**ma));
1486e8af9738SPeter Avalos mentrycount += me[i].cont_count;
1487e8af9738SPeter Avalos }
1488e8af9738SPeter Avalos *nma = mentrycount;
1489e8af9738SPeter Avalos return 0;
1490e8af9738SPeter Avalos }
1491e8af9738SPeter Avalos
1492e8af9738SPeter Avalos private void
magic_entry_free(struct magic_entry * me,uint32_t nme)1493e8af9738SPeter Avalos magic_entry_free(struct magic_entry *me, uint32_t nme)
1494e8af9738SPeter Avalos {
1495e8af9738SPeter Avalos uint32_t i;
1496e8af9738SPeter Avalos if (me == NULL)
1497e8af9738SPeter Avalos return;
1498e8af9738SPeter Avalos for (i = 0; i < nme; i++)
1499e8af9738SPeter Avalos free(me[i].mp);
1500e8af9738SPeter Avalos free(me);
1501e8af9738SPeter Avalos }
1502e8af9738SPeter Avalos
1503e8af9738SPeter Avalos private struct magic_map *
apprentice_load(struct magic_set * ms,const char * fn,int action)1504e8af9738SPeter Avalos apprentice_load(struct magic_set *ms, const char *fn, int action)
150579343712SPeter Avalos {
150679343712SPeter Avalos int errs = 0;
1507e8af9738SPeter Avalos uint32_t i, j;
1508e8af9738SPeter Avalos size_t files = 0, maxfiles = 0;
1509ff91a668SPeter Avalos char **filearr = NULL, *mfn;
151079343712SPeter Avalos struct stat st;
1511e8af9738SPeter Avalos struct magic_map *map;
1512e8af9738SPeter Avalos struct magic_entry_set mset[MAGIC_SETS];
151379343712SPeter Avalos DIR *dir;
151479343712SPeter Avalos struct dirent *d;
151579343712SPeter Avalos
1516e8af9738SPeter Avalos memset(mset, 0, sizeof(mset));
151779343712SPeter Avalos ms->flags |= MAGIC_CHECK; /* Enable checks for parsed files */
151879343712SPeter Avalos
1519e8af9738SPeter Avalos
1520e8af9738SPeter Avalos if ((map = CAST(struct magic_map *, calloc(1, sizeof(*map)))) == NULL)
1521e8af9738SPeter Avalos {
1522e8af9738SPeter Avalos file_oomem(ms, sizeof(*map));
1523e8af9738SPeter Avalos return NULL;
152479343712SPeter Avalos }
1525c30bd091SSascha Wildner map->type = MAP_TYPE_MALLOC;
152679343712SPeter Avalos
152779343712SPeter Avalos /* print silly verbose header for USG compat. */
152879343712SPeter Avalos if (action == FILE_CHECK)
152979343712SPeter Avalos (void)fprintf(stderr, "%s\n", usg_hdr);
153079343712SPeter Avalos
153179343712SPeter Avalos /* load directory or file */
153279343712SPeter Avalos if (stat(fn, &st) == 0 && S_ISDIR(st.st_mode)) {
153379343712SPeter Avalos dir = opendir(fn);
1534f72f8299SJan Lentfer if (!dir) {
1535f72f8299SJan Lentfer errs++;
1536f72f8299SJan Lentfer goto out;
153779343712SPeter Avalos }
1538f72f8299SJan Lentfer while ((d = readdir(dir)) != NULL) {
1539c30bd091SSascha Wildner if (d->d_name[0] == '.')
1540c30bd091SSascha Wildner continue;
1541ff91a668SPeter Avalos if (asprintf(&mfn, "%s/%s", fn, d->d_name) < 0) {
1542ff91a668SPeter Avalos file_oomem(ms,
1543ff91a668SPeter Avalos strlen(fn) + strlen(d->d_name) + 2);
1544f72f8299SJan Lentfer errs++;
15459f86ab30SPeter Avalos closedir(dir);
1546f72f8299SJan Lentfer goto out;
1547f72f8299SJan Lentfer }
1548ff91a668SPeter Avalos if (stat(mfn, &st) == -1 || !S_ISREG(st.st_mode)) {
1549ff91a668SPeter Avalos free(mfn);
1550ff91a668SPeter Avalos continue;
1551ff91a668SPeter Avalos }
1552f72f8299SJan Lentfer if (files >= maxfiles) {
1553f72f8299SJan Lentfer size_t mlen;
1554c990e5baSDaniel Fojt char **nfilearr;
1555f72f8299SJan Lentfer maxfiles = (maxfiles + 1) * 2;
1556f72f8299SJan Lentfer mlen = maxfiles * sizeof(*filearr);
1557c990e5baSDaniel Fojt if ((nfilearr = CAST(char **,
1558f72f8299SJan Lentfer realloc(filearr, mlen))) == NULL) {
1559f72f8299SJan Lentfer file_oomem(ms, mlen);
1560ff91a668SPeter Avalos free(mfn);
15619f86ab30SPeter Avalos closedir(dir);
1562f72f8299SJan Lentfer errs++;
1563f72f8299SJan Lentfer goto out;
1564f72f8299SJan Lentfer }
1565c990e5baSDaniel Fojt filearr = nfilearr;
1566f72f8299SJan Lentfer }
1567f72f8299SJan Lentfer filearr[files++] = mfn;
156879343712SPeter Avalos }
156979343712SPeter Avalos closedir(dir);
15706fca56fbSSascha Wildner if (filearr) {
1571f72f8299SJan Lentfer qsort(filearr, files, sizeof(*filearr), cmpstrp);
1572f72f8299SJan Lentfer for (i = 0; i < files; i++) {
1573e8af9738SPeter Avalos load_1(ms, action, filearr[i], &errs, mset);
1574f72f8299SJan Lentfer free(filearr[i]);
1575f72f8299SJan Lentfer }
1576f72f8299SJan Lentfer free(filearr);
1577c990e5baSDaniel Fojt filearr = NULL;
15786fca56fbSSascha Wildner }
157979343712SPeter Avalos } else
1580e8af9738SPeter Avalos load_1(ms, action, fn, &errs, mset);
1581327e51cbSPeter Avalos if (errs)
1582327e51cbSPeter Avalos goto out;
1583327e51cbSPeter Avalos
1584e8af9738SPeter Avalos for (j = 0; j < MAGIC_SETS; j++) {
158579343712SPeter Avalos /* Set types of tests */
1586e8af9738SPeter Avalos for (i = 0; i < mset[j].count; ) {
1587e8af9738SPeter Avalos if (mset[j].me[i].mp->cont_level != 0) {
158879343712SPeter Avalos i++;
158979343712SPeter Avalos continue;
159079343712SPeter Avalos }
1591e8af9738SPeter Avalos i = set_text_binary(ms, mset[j].me, mset[j].count, i);
159279343712SPeter Avalos }
1593c30bd091SSascha Wildner if (mset[j].me)
1594e8af9738SPeter Avalos qsort(mset[j].me, mset[j].count, sizeof(*mset[j].me),
1595e8af9738SPeter Avalos apprentice_sort);
159679343712SPeter Avalos
1597327e51cbSPeter Avalos /*
1598e8af9738SPeter Avalos * Make sure that any level 0 "default" line is last
1599e8af9738SPeter Avalos * (if one exists).
1600327e51cbSPeter Avalos */
1601e8af9738SPeter Avalos set_last_default(ms, mset[j].me, mset[j].count);
1602327e51cbSPeter Avalos
1603970935fdSSascha Wildner /* coalesce per file arrays into a single one, if needed */
1604970935fdSSascha Wildner if (mset[j].count == 0)
1605970935fdSSascha Wildner continue;
1606970935fdSSascha Wildner
1607e8af9738SPeter Avalos if (coalesce_entries(ms, mset[j].me, mset[j].count,
1608e8af9738SPeter Avalos &map->magic[j], &map->nmagic[j]) == -1) {
1609327e51cbSPeter Avalos errs++;
1610327e51cbSPeter Avalos goto out;
1611327e51cbSPeter Avalos }
1612327e51cbSPeter Avalos }
1613e8af9738SPeter Avalos
1614327e51cbSPeter Avalos out:
1615c990e5baSDaniel Fojt free(filearr);
1616e8af9738SPeter Avalos for (j = 0; j < MAGIC_SETS; j++)
1617e8af9738SPeter Avalos magic_entry_free(mset[j].me, mset[j].count);
1618327e51cbSPeter Avalos
1619e8af9738SPeter Avalos if (errs) {
162082c5fa3eSPeter Avalos apprentice_unmap(map);
1621e8af9738SPeter Avalos return NULL;
1622e8af9738SPeter Avalos }
1623e8af9738SPeter Avalos return map;
1624327e51cbSPeter Avalos }
1625327e51cbSPeter Avalos
1626327e51cbSPeter Avalos /*
1627327e51cbSPeter Avalos * extend the sign bit if the comparison is to be signed
1628327e51cbSPeter Avalos */
1629327e51cbSPeter Avalos protected uint64_t
file_signextend(struct magic_set * ms,struct magic * m,uint64_t v)1630327e51cbSPeter Avalos file_signextend(struct magic_set *ms, struct magic *m, uint64_t v)
1631327e51cbSPeter Avalos {
1632327e51cbSPeter Avalos if (!(m->flag & UNSIGNED)) {
1633327e51cbSPeter Avalos switch(m->type) {
1634327e51cbSPeter Avalos /*
1635327e51cbSPeter Avalos * Do not remove the casts below. They are
1636327e51cbSPeter Avalos * vital. When later compared with the data,
1637327e51cbSPeter Avalos * the sign extension must have happened.
1638327e51cbSPeter Avalos */
1639327e51cbSPeter Avalos case FILE_BYTE:
16406fca56fbSSascha Wildner v = CAST(signed char, v);
1641327e51cbSPeter Avalos break;
1642327e51cbSPeter Avalos case FILE_SHORT:
1643327e51cbSPeter Avalos case FILE_BESHORT:
1644327e51cbSPeter Avalos case FILE_LESHORT:
16456fca56fbSSascha Wildner v = CAST(short, v);
1646327e51cbSPeter Avalos break;
1647327e51cbSPeter Avalos case FILE_DATE:
1648327e51cbSPeter Avalos case FILE_BEDATE:
1649327e51cbSPeter Avalos case FILE_LEDATE:
1650327e51cbSPeter Avalos case FILE_MEDATE:
1651327e51cbSPeter Avalos case FILE_LDATE:
1652327e51cbSPeter Avalos case FILE_BELDATE:
1653327e51cbSPeter Avalos case FILE_LELDATE:
1654327e51cbSPeter Avalos case FILE_MELDATE:
1655327e51cbSPeter Avalos case FILE_LONG:
1656327e51cbSPeter Avalos case FILE_BELONG:
1657327e51cbSPeter Avalos case FILE_LELONG:
1658327e51cbSPeter Avalos case FILE_MELONG:
1659327e51cbSPeter Avalos case FILE_FLOAT:
1660327e51cbSPeter Avalos case FILE_BEFLOAT:
1661327e51cbSPeter Avalos case FILE_LEFLOAT:
1662*3b9cdfa3SAntonio Huete Jimenez case FILE_MSDOSDATE:
1663*3b9cdfa3SAntonio Huete Jimenez case FILE_BEMSDOSDATE:
1664*3b9cdfa3SAntonio Huete Jimenez case FILE_LEMSDOSDATE:
1665*3b9cdfa3SAntonio Huete Jimenez case FILE_MSDOSTIME:
1666*3b9cdfa3SAntonio Huete Jimenez case FILE_BEMSDOSTIME:
1667*3b9cdfa3SAntonio Huete Jimenez case FILE_LEMSDOSTIME:
16686fca56fbSSascha Wildner v = CAST(int32_t, v);
1669327e51cbSPeter Avalos break;
1670327e51cbSPeter Avalos case FILE_QUAD:
1671327e51cbSPeter Avalos case FILE_BEQUAD:
1672327e51cbSPeter Avalos case FILE_LEQUAD:
1673327e51cbSPeter Avalos case FILE_QDATE:
1674327e51cbSPeter Avalos case FILE_QLDATE:
1675e8af9738SPeter Avalos case FILE_QWDATE:
1676327e51cbSPeter Avalos case FILE_BEQDATE:
1677327e51cbSPeter Avalos case FILE_BEQLDATE:
1678e8af9738SPeter Avalos case FILE_BEQWDATE:
1679327e51cbSPeter Avalos case FILE_LEQDATE:
1680327e51cbSPeter Avalos case FILE_LEQLDATE:
1681e8af9738SPeter Avalos case FILE_LEQWDATE:
1682327e51cbSPeter Avalos case FILE_DOUBLE:
1683327e51cbSPeter Avalos case FILE_BEDOUBLE:
1684327e51cbSPeter Avalos case FILE_LEDOUBLE:
1685c990e5baSDaniel Fojt case FILE_OFFSET:
1686614728caSSascha Wildner case FILE_BEVARINT:
1687614728caSSascha Wildner case FILE_LEVARINT:
16886fca56fbSSascha Wildner v = CAST(int64_t, v);
1689327e51cbSPeter Avalos break;
1690327e51cbSPeter Avalos case FILE_STRING:
1691327e51cbSPeter Avalos case FILE_PSTRING:
1692327e51cbSPeter Avalos case FILE_BESTRING16:
1693327e51cbSPeter Avalos case FILE_LESTRING16:
1694327e51cbSPeter Avalos case FILE_REGEX:
1695327e51cbSPeter Avalos case FILE_SEARCH:
1696327e51cbSPeter Avalos case FILE_DEFAULT:
169779343712SPeter Avalos case FILE_INDIRECT:
1698e8af9738SPeter Avalos case FILE_NAME:
1699e8af9738SPeter Avalos case FILE_USE:
1700e8af9738SPeter Avalos case FILE_CLEAR:
1701c30bd091SSascha Wildner case FILE_DER:
1702c990e5baSDaniel Fojt case FILE_GUID:
1703*3b9cdfa3SAntonio Huete Jimenez case FILE_OCTAL:
1704327e51cbSPeter Avalos break;
1705327e51cbSPeter Avalos default:
1706327e51cbSPeter Avalos if (ms->flags & MAGIC_CHECK)
1707327e51cbSPeter Avalos file_magwarn(ms, "cannot happen: m->type=%d\n",
1708327e51cbSPeter Avalos m->type);
1709c990e5baSDaniel Fojt return FILE_BADSIZE;
1710327e51cbSPeter Avalos }
1711327e51cbSPeter Avalos }
1712327e51cbSPeter Avalos return v;
1713327e51cbSPeter Avalos }
1714327e51cbSPeter Avalos
1715327e51cbSPeter Avalos private int
string_modifier_check(struct magic_set * ms,struct magic * m)171679343712SPeter Avalos string_modifier_check(struct magic_set *ms, struct magic *m)
1717327e51cbSPeter Avalos {
1718327e51cbSPeter Avalos if ((ms->flags & MAGIC_CHECK) == 0)
1719327e51cbSPeter Avalos return 0;
1720327e51cbSPeter Avalos
172182c5fa3eSPeter Avalos if ((m->type != FILE_REGEX || (m->str_flags & REGEX_LINE_COUNT) == 0) &&
172282c5fa3eSPeter Avalos (m->type != FILE_PSTRING && (m->str_flags & PSTRING_LEN) != 0)) {
1723e4d4ce0cSPeter Avalos file_magwarn(ms,
1724e4d4ce0cSPeter Avalos "'/BHhLl' modifiers are only allowed for pascal strings\n");
1725e4d4ce0cSPeter Avalos return -1;
1726e4d4ce0cSPeter Avalos }
1727327e51cbSPeter Avalos switch (m->type) {
1728327e51cbSPeter Avalos case FILE_BESTRING16:
1729327e51cbSPeter Avalos case FILE_LESTRING16:
1730327e51cbSPeter Avalos if (m->str_flags != 0) {
173179343712SPeter Avalos file_magwarn(ms,
173279343712SPeter Avalos "no modifiers allowed for 16-bit strings\n");
1733327e51cbSPeter Avalos return -1;
1734327e51cbSPeter Avalos }
1735327e51cbSPeter Avalos break;
1736327e51cbSPeter Avalos case FILE_STRING:
1737327e51cbSPeter Avalos case FILE_PSTRING:
1738327e51cbSPeter Avalos if ((m->str_flags & REGEX_OFFSET_START) != 0) {
173979343712SPeter Avalos file_magwarn(ms,
174079343712SPeter Avalos "'/%c' only allowed on regex and search\n",
1741327e51cbSPeter Avalos CHAR_REGEX_OFFSET_START);
1742327e51cbSPeter Avalos return -1;
1743327e51cbSPeter Avalos }
1744327e51cbSPeter Avalos break;
1745327e51cbSPeter Avalos case FILE_SEARCH:
174679343712SPeter Avalos if (m->str_range == 0) {
174779343712SPeter Avalos file_magwarn(ms,
174879343712SPeter Avalos "missing range; defaulting to %d\n",
174979343712SPeter Avalos STRING_DEFAULT_RANGE);
175079343712SPeter Avalos m->str_range = STRING_DEFAULT_RANGE;
175179343712SPeter Avalos return -1;
175279343712SPeter Avalos }
1753327e51cbSPeter Avalos break;
1754327e51cbSPeter Avalos case FILE_REGEX:
1755f72f8299SJan Lentfer if ((m->str_flags & STRING_COMPACT_WHITESPACE) != 0) {
1756327e51cbSPeter Avalos file_magwarn(ms, "'/%c' not allowed on regex\n",
1757f72f8299SJan Lentfer CHAR_COMPACT_WHITESPACE);
1758327e51cbSPeter Avalos return -1;
1759327e51cbSPeter Avalos }
1760f72f8299SJan Lentfer if ((m->str_flags & STRING_COMPACT_OPTIONAL_WHITESPACE) != 0) {
1761327e51cbSPeter Avalos file_magwarn(ms, "'/%c' not allowed on regex\n",
1762f72f8299SJan Lentfer CHAR_COMPACT_OPTIONAL_WHITESPACE);
1763327e51cbSPeter Avalos return -1;
1764327e51cbSPeter Avalos }
1765327e51cbSPeter Avalos break;
1766327e51cbSPeter Avalos default:
1767327e51cbSPeter Avalos file_magwarn(ms, "coding error: m->type=%d\n",
1768327e51cbSPeter Avalos m->type);
1769327e51cbSPeter Avalos return -1;
1770327e51cbSPeter Avalos }
1771327e51cbSPeter Avalos return 0;
1772327e51cbSPeter Avalos }
1773327e51cbSPeter Avalos
1774327e51cbSPeter Avalos private int
get_op(char c)1775327e51cbSPeter Avalos get_op(char c)
1776327e51cbSPeter Avalos {
1777327e51cbSPeter Avalos switch (c) {
1778327e51cbSPeter Avalos case '&':
1779327e51cbSPeter Avalos return FILE_OPAND;
1780327e51cbSPeter Avalos case '|':
1781327e51cbSPeter Avalos return FILE_OPOR;
1782327e51cbSPeter Avalos case '^':
1783327e51cbSPeter Avalos return FILE_OPXOR;
1784327e51cbSPeter Avalos case '+':
1785327e51cbSPeter Avalos return FILE_OPADD;
1786327e51cbSPeter Avalos case '-':
1787327e51cbSPeter Avalos return FILE_OPMINUS;
1788327e51cbSPeter Avalos case '*':
1789327e51cbSPeter Avalos return FILE_OPMULTIPLY;
1790327e51cbSPeter Avalos case '/':
1791327e51cbSPeter Avalos return FILE_OPDIVIDE;
1792327e51cbSPeter Avalos case '%':
1793327e51cbSPeter Avalos return FILE_OPMODULO;
1794327e51cbSPeter Avalos default:
1795327e51cbSPeter Avalos return -1;
1796327e51cbSPeter Avalos }
1797327e51cbSPeter Avalos }
1798327e51cbSPeter Avalos
1799327e51cbSPeter Avalos #ifdef ENABLE_CONDITIONALS
1800327e51cbSPeter Avalos private int
get_cond(const char * l,const char ** t)1801327e51cbSPeter Avalos get_cond(const char *l, const char **t)
1802327e51cbSPeter Avalos {
180379343712SPeter Avalos static const struct cond_tbl_s {
180479343712SPeter Avalos char name[8];
180579343712SPeter Avalos size_t len;
180679343712SPeter Avalos int cond;
1807327e51cbSPeter Avalos } cond_tbl[] = {
1808327e51cbSPeter Avalos { "if", 2, COND_IF },
1809327e51cbSPeter Avalos { "elif", 4, COND_ELIF },
1810327e51cbSPeter Avalos { "else", 4, COND_ELSE },
181179343712SPeter Avalos { "", 0, COND_NONE },
1812327e51cbSPeter Avalos };
181379343712SPeter Avalos const struct cond_tbl_s *p;
1814327e51cbSPeter Avalos
181579343712SPeter Avalos for (p = cond_tbl; p->len; p++) {
1816327e51cbSPeter Avalos if (strncmp(l, p->name, p->len) == 0 &&
18176fca56fbSSascha Wildner isspace(CAST(unsigned char, l[p->len]))) {
1818327e51cbSPeter Avalos if (t)
1819327e51cbSPeter Avalos *t = l + p->len;
1820327e51cbSPeter Avalos break;
1821327e51cbSPeter Avalos }
1822327e51cbSPeter Avalos }
1823327e51cbSPeter Avalos return p->cond;
1824327e51cbSPeter Avalos }
1825327e51cbSPeter Avalos
1826327e51cbSPeter Avalos private int
check_cond(struct magic_set * ms,int cond,uint32_t cont_level)1827327e51cbSPeter Avalos check_cond(struct magic_set *ms, int cond, uint32_t cont_level)
1828327e51cbSPeter Avalos {
1829327e51cbSPeter Avalos int last_cond;
1830327e51cbSPeter Avalos last_cond = ms->c.li[cont_level].last_cond;
1831327e51cbSPeter Avalos
1832327e51cbSPeter Avalos switch (cond) {
1833327e51cbSPeter Avalos case COND_IF:
1834327e51cbSPeter Avalos if (last_cond != COND_NONE && last_cond != COND_ELIF) {
1835327e51cbSPeter Avalos if (ms->flags & MAGIC_CHECK)
1836327e51cbSPeter Avalos file_magwarn(ms, "syntax error: `if'");
1837327e51cbSPeter Avalos return -1;
1838327e51cbSPeter Avalos }
1839327e51cbSPeter Avalos last_cond = COND_IF;
1840327e51cbSPeter Avalos break;
1841327e51cbSPeter Avalos
1842327e51cbSPeter Avalos case COND_ELIF:
1843327e51cbSPeter Avalos if (last_cond != COND_IF && last_cond != COND_ELIF) {
1844327e51cbSPeter Avalos if (ms->flags & MAGIC_CHECK)
1845327e51cbSPeter Avalos file_magwarn(ms, "syntax error: `elif'");
1846327e51cbSPeter Avalos return -1;
1847327e51cbSPeter Avalos }
1848327e51cbSPeter Avalos last_cond = COND_ELIF;
1849327e51cbSPeter Avalos break;
1850327e51cbSPeter Avalos
1851327e51cbSPeter Avalos case COND_ELSE:
1852327e51cbSPeter Avalos if (last_cond != COND_IF && last_cond != COND_ELIF) {
1853327e51cbSPeter Avalos if (ms->flags & MAGIC_CHECK)
1854327e51cbSPeter Avalos file_magwarn(ms, "syntax error: `else'");
1855327e51cbSPeter Avalos return -1;
1856327e51cbSPeter Avalos }
1857327e51cbSPeter Avalos last_cond = COND_NONE;
1858327e51cbSPeter Avalos break;
1859327e51cbSPeter Avalos
1860327e51cbSPeter Avalos case COND_NONE:
1861327e51cbSPeter Avalos last_cond = COND_NONE;
1862327e51cbSPeter Avalos break;
1863327e51cbSPeter Avalos }
1864327e51cbSPeter Avalos
1865327e51cbSPeter Avalos ms->c.li[cont_level].last_cond = last_cond;
1866327e51cbSPeter Avalos return 0;
1867327e51cbSPeter Avalos }
1868327e51cbSPeter Avalos #endif /* ENABLE_CONDITIONALS */
1869327e51cbSPeter Avalos
187082c5fa3eSPeter Avalos private int
parse_indirect_modifier(struct magic_set * ms,struct magic * m,const char ** lp)187182c5fa3eSPeter Avalos parse_indirect_modifier(struct magic_set *ms, struct magic *m, const char **lp)
187282c5fa3eSPeter Avalos {
187382c5fa3eSPeter Avalos const char *l = *lp;
187482c5fa3eSPeter Avalos
18756fca56fbSSascha Wildner while (!isspace(CAST(unsigned char, *++l)))
187682c5fa3eSPeter Avalos switch (*l) {
187782c5fa3eSPeter Avalos case CHAR_INDIRECT_RELATIVE:
187882c5fa3eSPeter Avalos m->str_flags |= INDIRECT_RELATIVE;
187982c5fa3eSPeter Avalos break;
188082c5fa3eSPeter Avalos default:
188182c5fa3eSPeter Avalos if (ms->flags & MAGIC_CHECK)
188282c5fa3eSPeter Avalos file_magwarn(ms, "indirect modifier `%c' "
188382c5fa3eSPeter Avalos "invalid", *l);
188482c5fa3eSPeter Avalos *lp = l;
188582c5fa3eSPeter Avalos return -1;
188682c5fa3eSPeter Avalos }
188782c5fa3eSPeter Avalos *lp = l;
188882c5fa3eSPeter Avalos return 0;
188982c5fa3eSPeter Avalos }
189082c5fa3eSPeter Avalos
189182c5fa3eSPeter Avalos private void
parse_op_modifier(struct magic_set * ms,struct magic * m,const char ** lp,int op)189282c5fa3eSPeter Avalos parse_op_modifier(struct magic_set *ms, struct magic *m, const char **lp,
189382c5fa3eSPeter Avalos int op)
189482c5fa3eSPeter Avalos {
189582c5fa3eSPeter Avalos const char *l = *lp;
189682c5fa3eSPeter Avalos char *t;
189782c5fa3eSPeter Avalos uint64_t val;
189882c5fa3eSPeter Avalos
189982c5fa3eSPeter Avalos ++l;
190082c5fa3eSPeter Avalos m->mask_op |= op;
19016fca56fbSSascha Wildner val = CAST(uint64_t, strtoull(l, &t, 0));
190282c5fa3eSPeter Avalos l = t;
190382c5fa3eSPeter Avalos m->num_mask = file_signextend(ms, m, val);
190482c5fa3eSPeter Avalos eatsize(&l);
190582c5fa3eSPeter Avalos *lp = l;
190682c5fa3eSPeter Avalos }
190782c5fa3eSPeter Avalos
190882c5fa3eSPeter Avalos private int
parse_string_modifier(struct magic_set * ms,struct magic * m,const char ** lp)190982c5fa3eSPeter Avalos parse_string_modifier(struct magic_set *ms, struct magic *m, const char **lp)
191082c5fa3eSPeter Avalos {
191182c5fa3eSPeter Avalos const char *l = *lp;
191282c5fa3eSPeter Avalos char *t;
191382c5fa3eSPeter Avalos int have_range = 0;
191482c5fa3eSPeter Avalos
19156fca56fbSSascha Wildner while (!isspace(CAST(unsigned char, *++l))) {
191682c5fa3eSPeter Avalos switch (*l) {
191782c5fa3eSPeter Avalos case '0': case '1': case '2':
191882c5fa3eSPeter Avalos case '3': case '4': case '5':
191982c5fa3eSPeter Avalos case '6': case '7': case '8':
192082c5fa3eSPeter Avalos case '9':
192182c5fa3eSPeter Avalos if (have_range && (ms->flags & MAGIC_CHECK))
192282c5fa3eSPeter Avalos file_magwarn(ms, "multiple ranges");
192382c5fa3eSPeter Avalos have_range = 1;
192482c5fa3eSPeter Avalos m->str_range = CAST(uint32_t, strtoul(l, &t, 0));
192582c5fa3eSPeter Avalos if (m->str_range == 0)
192682c5fa3eSPeter Avalos file_magwarn(ms, "zero range");
192782c5fa3eSPeter Avalos l = t - 1;
192882c5fa3eSPeter Avalos break;
192982c5fa3eSPeter Avalos case CHAR_COMPACT_WHITESPACE:
193082c5fa3eSPeter Avalos m->str_flags |= STRING_COMPACT_WHITESPACE;
193182c5fa3eSPeter Avalos break;
193282c5fa3eSPeter Avalos case CHAR_COMPACT_OPTIONAL_WHITESPACE:
193382c5fa3eSPeter Avalos m->str_flags |= STRING_COMPACT_OPTIONAL_WHITESPACE;
193482c5fa3eSPeter Avalos break;
193582c5fa3eSPeter Avalos case CHAR_IGNORE_LOWERCASE:
193682c5fa3eSPeter Avalos m->str_flags |= STRING_IGNORE_LOWERCASE;
193782c5fa3eSPeter Avalos break;
193882c5fa3eSPeter Avalos case CHAR_IGNORE_UPPERCASE:
193982c5fa3eSPeter Avalos m->str_flags |= STRING_IGNORE_UPPERCASE;
194082c5fa3eSPeter Avalos break;
194182c5fa3eSPeter Avalos case CHAR_REGEX_OFFSET_START:
194282c5fa3eSPeter Avalos m->str_flags |= REGEX_OFFSET_START;
194382c5fa3eSPeter Avalos break;
194482c5fa3eSPeter Avalos case CHAR_BINTEST:
194582c5fa3eSPeter Avalos m->str_flags |= STRING_BINTEST;
194682c5fa3eSPeter Avalos break;
194782c5fa3eSPeter Avalos case CHAR_TEXTTEST:
194882c5fa3eSPeter Avalos m->str_flags |= STRING_TEXTTEST;
194982c5fa3eSPeter Avalos break;
195082c5fa3eSPeter Avalos case CHAR_TRIM:
195182c5fa3eSPeter Avalos m->str_flags |= STRING_TRIM;
195282c5fa3eSPeter Avalos break;
1953614728caSSascha Wildner case CHAR_FULL_WORD:
1954614728caSSascha Wildner m->str_flags |= STRING_FULL_WORD;
1955614728caSSascha Wildner break;
195682c5fa3eSPeter Avalos case CHAR_PSTRING_1_LE:
195782c5fa3eSPeter Avalos #define SET_LENGTH(a) m->str_flags = (m->str_flags & ~PSTRING_LEN) | (a)
195882c5fa3eSPeter Avalos if (m->type != FILE_PSTRING)
195982c5fa3eSPeter Avalos goto bad;
196082c5fa3eSPeter Avalos SET_LENGTH(PSTRING_1_LE);
196182c5fa3eSPeter Avalos break;
196282c5fa3eSPeter Avalos case CHAR_PSTRING_2_BE:
196382c5fa3eSPeter Avalos if (m->type != FILE_PSTRING)
196482c5fa3eSPeter Avalos goto bad;
196582c5fa3eSPeter Avalos SET_LENGTH(PSTRING_2_BE);
196682c5fa3eSPeter Avalos break;
196782c5fa3eSPeter Avalos case CHAR_PSTRING_2_LE:
196882c5fa3eSPeter Avalos if (m->type != FILE_PSTRING)
196982c5fa3eSPeter Avalos goto bad;
197082c5fa3eSPeter Avalos SET_LENGTH(PSTRING_2_LE);
197182c5fa3eSPeter Avalos break;
197282c5fa3eSPeter Avalos case CHAR_PSTRING_4_BE:
197382c5fa3eSPeter Avalos if (m->type != FILE_PSTRING)
197482c5fa3eSPeter Avalos goto bad;
197582c5fa3eSPeter Avalos SET_LENGTH(PSTRING_4_BE);
197682c5fa3eSPeter Avalos break;
197782c5fa3eSPeter Avalos case CHAR_PSTRING_4_LE:
197882c5fa3eSPeter Avalos switch (m->type) {
197982c5fa3eSPeter Avalos case FILE_PSTRING:
198082c5fa3eSPeter Avalos case FILE_REGEX:
198182c5fa3eSPeter Avalos break;
198282c5fa3eSPeter Avalos default:
198382c5fa3eSPeter Avalos goto bad;
198482c5fa3eSPeter Avalos }
198582c5fa3eSPeter Avalos SET_LENGTH(PSTRING_4_LE);
198682c5fa3eSPeter Avalos break;
198782c5fa3eSPeter Avalos case CHAR_PSTRING_LENGTH_INCLUDES_ITSELF:
198882c5fa3eSPeter Avalos if (m->type != FILE_PSTRING)
198982c5fa3eSPeter Avalos goto bad;
199082c5fa3eSPeter Avalos m->str_flags |= PSTRING_LENGTH_INCLUDES_ITSELF;
199182c5fa3eSPeter Avalos break;
199282c5fa3eSPeter Avalos default:
199382c5fa3eSPeter Avalos bad:
199482c5fa3eSPeter Avalos if (ms->flags & MAGIC_CHECK)
199582c5fa3eSPeter Avalos file_magwarn(ms, "string modifier `%c' "
199682c5fa3eSPeter Avalos "invalid", *l);
199782c5fa3eSPeter Avalos goto out;
199882c5fa3eSPeter Avalos }
199982c5fa3eSPeter Avalos /* allow multiple '/' for readability */
20006fca56fbSSascha Wildner if (l[1] == '/' && !isspace(CAST(unsigned char, l[2])))
200182c5fa3eSPeter Avalos l++;
200282c5fa3eSPeter Avalos }
200382c5fa3eSPeter Avalos if (string_modifier_check(ms, m) == -1)
200482c5fa3eSPeter Avalos goto out;
200582c5fa3eSPeter Avalos *lp = l;
200682c5fa3eSPeter Avalos return 0;
200782c5fa3eSPeter Avalos out:
200882c5fa3eSPeter Avalos *lp = l;
200982c5fa3eSPeter Avalos return -1;
201082c5fa3eSPeter Avalos }
201182c5fa3eSPeter Avalos
2012327e51cbSPeter Avalos /*
2013327e51cbSPeter Avalos * parse one line from magic file, put into magic[index++] if valid
2014327e51cbSPeter Avalos */
2015327e51cbSPeter Avalos private int
parse(struct magic_set * ms,struct magic_entry * me,const char * line,size_t lineno,int action)2016e8af9738SPeter Avalos parse(struct magic_set *ms, struct magic_entry *me, const char *line,
2017e8af9738SPeter Avalos size_t lineno, int action)
2018327e51cbSPeter Avalos {
2019327e51cbSPeter Avalos #ifdef ENABLE_CONDITIONALS
2020327e51cbSPeter Avalos static uint32_t last_cont_level = 0;
2021327e51cbSPeter Avalos #endif
2022327e51cbSPeter Avalos size_t i;
2023327e51cbSPeter Avalos struct magic *m;
2024327e51cbSPeter Avalos const char *l = line;
2025327e51cbSPeter Avalos char *t;
2026327e51cbSPeter Avalos int op;
2027327e51cbSPeter Avalos uint32_t cont_level;
2028e8af9738SPeter Avalos int32_t diff;
2029327e51cbSPeter Avalos
2030327e51cbSPeter Avalos cont_level = 0;
2031327e51cbSPeter Avalos
2032e8af9738SPeter Avalos /*
2033e8af9738SPeter Avalos * Parse the offset.
2034e8af9738SPeter Avalos */
2035327e51cbSPeter Avalos while (*l == '>') {
2036327e51cbSPeter Avalos ++l; /* step over */
2037327e51cbSPeter Avalos cont_level++;
2038327e51cbSPeter Avalos }
2039327e51cbSPeter Avalos #ifdef ENABLE_CONDITIONALS
2040327e51cbSPeter Avalos if (cont_level == 0 || cont_level > last_cont_level)
2041327e51cbSPeter Avalos if (file_check_mem(ms, cont_level) == -1)
2042327e51cbSPeter Avalos return -1;
2043327e51cbSPeter Avalos last_cont_level = cont_level;
2044327e51cbSPeter Avalos #endif
2045327e51cbSPeter Avalos if (cont_level != 0) {
2046e8af9738SPeter Avalos if (me->mp == NULL) {
2047e8af9738SPeter Avalos file_magerror(ms, "No current entry for continuation");
2048327e51cbSPeter Avalos return -1;
2049327e51cbSPeter Avalos }
2050e8af9738SPeter Avalos if (me->cont_count == 0) {
2051e8af9738SPeter Avalos file_magerror(ms, "Continuations present with 0 count");
2052e8af9738SPeter Avalos return -1;
2053e8af9738SPeter Avalos }
2054e8af9738SPeter Avalos m = &me->mp[me->cont_count - 1];
20556fca56fbSSascha Wildner diff = CAST(int32_t, cont_level) - CAST(int32_t, m->cont_level);
2056e8af9738SPeter Avalos if (diff > 1)
2057e8af9738SPeter Avalos file_magwarn(ms, "New continuation level %u is more "
2058e8af9738SPeter Avalos "than one larger than current level %u", cont_level,
2059e8af9738SPeter Avalos m->cont_level);
2060327e51cbSPeter Avalos if (me->cont_count == me->max_count) {
2061327e51cbSPeter Avalos struct magic *nm;
2062327e51cbSPeter Avalos size_t cnt = me->max_count + ALLOC_CHUNK;
206379343712SPeter Avalos if ((nm = CAST(struct magic *, realloc(me->mp,
206479343712SPeter Avalos sizeof(*nm) * cnt))) == NULL) {
2065327e51cbSPeter Avalos file_oomem(ms, sizeof(*nm) * cnt);
2066327e51cbSPeter Avalos return -1;
2067327e51cbSPeter Avalos }
20686fca56fbSSascha Wildner me->mp = nm;
2069f72f8299SJan Lentfer me->max_count = CAST(uint32_t, cnt);
2070327e51cbSPeter Avalos }
2071327e51cbSPeter Avalos m = &me->mp[me->cont_count++];
2072327e51cbSPeter Avalos (void)memset(m, 0, sizeof(*m));
2073327e51cbSPeter Avalos m->cont_level = cont_level;
2074327e51cbSPeter Avalos } else {
2075e8af9738SPeter Avalos static const size_t len = sizeof(*m) * ALLOC_CHUNK;
2076e8af9738SPeter Avalos if (me->mp != NULL)
2077e8af9738SPeter Avalos return 1;
207879343712SPeter Avalos if ((m = CAST(struct magic *, malloc(len))) == NULL) {
207979343712SPeter Avalos file_oomem(ms, len);
2080327e51cbSPeter Avalos return -1;
2081327e51cbSPeter Avalos }
2082327e51cbSPeter Avalos me->mp = m;
2083327e51cbSPeter Avalos me->max_count = ALLOC_CHUNK;
2084327e51cbSPeter Avalos (void)memset(m, 0, sizeof(*m));
208579343712SPeter Avalos m->factor_op = FILE_FACTOR_OP_NONE;
2086327e51cbSPeter Avalos m->cont_level = 0;
2087327e51cbSPeter Avalos me->cont_count = 1;
2088327e51cbSPeter Avalos }
2089f72f8299SJan Lentfer m->lineno = CAST(uint32_t, lineno);
2090327e51cbSPeter Avalos
2091327e51cbSPeter Avalos if (*l == '&') { /* m->cont_level == 0 checked below. */
2092327e51cbSPeter Avalos ++l; /* step over */
2093327e51cbSPeter Avalos m->flag |= OFFADD;
2094327e51cbSPeter Avalos }
2095327e51cbSPeter Avalos if (*l == '(') {
2096327e51cbSPeter Avalos ++l; /* step over */
2097327e51cbSPeter Avalos m->flag |= INDIR;
2098327e51cbSPeter Avalos if (m->flag & OFFADD)
2099327e51cbSPeter Avalos m->flag = (m->flag & ~OFFADD) | INDIROFFADD;
2100327e51cbSPeter Avalos
2101327e51cbSPeter Avalos if (*l == '&') { /* m->cont_level == 0 checked below */
2102327e51cbSPeter Avalos ++l; /* step over */
2103327e51cbSPeter Avalos m->flag |= OFFADD;
2104327e51cbSPeter Avalos }
2105327e51cbSPeter Avalos }
2106327e51cbSPeter Avalos /* Indirect offsets are not valid at level 0. */
2107c30bd091SSascha Wildner if (m->cont_level == 0 && (m->flag & (OFFADD | INDIROFFADD))) {
2108327e51cbSPeter Avalos if (ms->flags & MAGIC_CHECK)
2109327e51cbSPeter Avalos file_magwarn(ms, "relative offset at level 0");
2110c30bd091SSascha Wildner return -1;
2111c30bd091SSascha Wildner }
2112327e51cbSPeter Avalos
2113327e51cbSPeter Avalos /* get offset, then skip over it */
2114c990e5baSDaniel Fojt if (*l == '-') {
2115c990e5baSDaniel Fojt ++l; /* step over */
2116c990e5baSDaniel Fojt m->flag |= OFFNEGATIVE;
2117c990e5baSDaniel Fojt }
21186fca56fbSSascha Wildner m->offset = CAST(int32_t, strtol(l, &t, 0));
2119c30bd091SSascha Wildner if (l == t) {
2120327e51cbSPeter Avalos if (ms->flags & MAGIC_CHECK)
2121327e51cbSPeter Avalos file_magwarn(ms, "offset `%s' invalid", l);
2122c30bd091SSascha Wildner return -1;
2123c30bd091SSascha Wildner }
21246fca56fbSSascha Wildner
2125327e51cbSPeter Avalos l = t;
2126327e51cbSPeter Avalos
2127327e51cbSPeter Avalos if (m->flag & INDIR) {
2128327e51cbSPeter Avalos m->in_type = FILE_LONG;
2129327e51cbSPeter Avalos m->in_offset = 0;
2130c30bd091SSascha Wildner m->in_op = 0;
2131327e51cbSPeter Avalos /*
2132c30bd091SSascha Wildner * read [.,lbs][+-]nnnnn)
2133327e51cbSPeter Avalos */
2134c30bd091SSascha Wildner if (*l == '.' || *l == ',') {
2135c30bd091SSascha Wildner if (*l == ',')
2136c30bd091SSascha Wildner m->in_op |= FILE_OPSIGNED;
2137327e51cbSPeter Avalos l++;
2138327e51cbSPeter Avalos switch (*l) {
2139327e51cbSPeter Avalos case 'l':
2140327e51cbSPeter Avalos m->in_type = FILE_LELONG;
2141327e51cbSPeter Avalos break;
2142327e51cbSPeter Avalos case 'L':
2143327e51cbSPeter Avalos m->in_type = FILE_BELONG;
2144327e51cbSPeter Avalos break;
2145327e51cbSPeter Avalos case 'm':
2146327e51cbSPeter Avalos m->in_type = FILE_MELONG;
2147327e51cbSPeter Avalos break;
2148327e51cbSPeter Avalos case 'h':
2149327e51cbSPeter Avalos case 's':
2150327e51cbSPeter Avalos m->in_type = FILE_LESHORT;
2151327e51cbSPeter Avalos break;
2152327e51cbSPeter Avalos case 'H':
2153327e51cbSPeter Avalos case 'S':
2154327e51cbSPeter Avalos m->in_type = FILE_BESHORT;
2155327e51cbSPeter Avalos break;
2156327e51cbSPeter Avalos case 'c':
2157327e51cbSPeter Avalos case 'b':
2158327e51cbSPeter Avalos case 'C':
2159327e51cbSPeter Avalos case 'B':
2160327e51cbSPeter Avalos m->in_type = FILE_BYTE;
2161327e51cbSPeter Avalos break;
2162327e51cbSPeter Avalos case 'e':
2163327e51cbSPeter Avalos case 'f':
2164327e51cbSPeter Avalos case 'g':
2165327e51cbSPeter Avalos m->in_type = FILE_LEDOUBLE;
2166327e51cbSPeter Avalos break;
2167327e51cbSPeter Avalos case 'E':
2168327e51cbSPeter Avalos case 'F':
2169327e51cbSPeter Avalos case 'G':
2170327e51cbSPeter Avalos m->in_type = FILE_BEDOUBLE;
2171327e51cbSPeter Avalos break;
217279343712SPeter Avalos case 'i':
217379343712SPeter Avalos m->in_type = FILE_LEID3;
217479343712SPeter Avalos break;
217579343712SPeter Avalos case 'I':
217679343712SPeter Avalos m->in_type = FILE_BEID3;
217779343712SPeter Avalos break;
2178*3b9cdfa3SAntonio Huete Jimenez case 'o':
2179*3b9cdfa3SAntonio Huete Jimenez m->in_type = FILE_OCTAL;
2180*3b9cdfa3SAntonio Huete Jimenez break;
21816fca56fbSSascha Wildner case 'q':
21826fca56fbSSascha Wildner m->in_type = FILE_LEQUAD;
21836fca56fbSSascha Wildner break;
21846fca56fbSSascha Wildner case 'Q':
21856fca56fbSSascha Wildner m->in_type = FILE_BEQUAD;
21866fca56fbSSascha Wildner break;
2187327e51cbSPeter Avalos default:
2188327e51cbSPeter Avalos if (ms->flags & MAGIC_CHECK)
2189327e51cbSPeter Avalos file_magwarn(ms,
2190327e51cbSPeter Avalos "indirect offset type `%c' invalid",
2191327e51cbSPeter Avalos *l);
2192c30bd091SSascha Wildner return -1;
2193327e51cbSPeter Avalos }
2194327e51cbSPeter Avalos l++;
2195327e51cbSPeter Avalos }
2196327e51cbSPeter Avalos
2197327e51cbSPeter Avalos if (*l == '~') {
2198327e51cbSPeter Avalos m->in_op |= FILE_OPINVERSE;
2199327e51cbSPeter Avalos l++;
2200327e51cbSPeter Avalos }
2201327e51cbSPeter Avalos if ((op = get_op(*l)) != -1) {
2202327e51cbSPeter Avalos m->in_op |= op;
2203327e51cbSPeter Avalos l++;
2204327e51cbSPeter Avalos }
2205327e51cbSPeter Avalos if (*l == '(') {
2206327e51cbSPeter Avalos m->in_op |= FILE_OPINDIRECT;
2207327e51cbSPeter Avalos l++;
2208327e51cbSPeter Avalos }
22096fca56fbSSascha Wildner if (isdigit(CAST(unsigned char, *l)) || *l == '-') {
22106fca56fbSSascha Wildner m->in_offset = CAST(int32_t, strtol(l, &t, 0));
2211c30bd091SSascha Wildner if (l == t) {
2212327e51cbSPeter Avalos if (ms->flags & MAGIC_CHECK)
2213327e51cbSPeter Avalos file_magwarn(ms,
2214327e51cbSPeter Avalos "in_offset `%s' invalid", l);
2215c30bd091SSascha Wildner return -1;
2216c30bd091SSascha Wildner }
2217327e51cbSPeter Avalos l = t;
2218327e51cbSPeter Avalos }
2219327e51cbSPeter Avalos if (*l++ != ')' ||
2220c30bd091SSascha Wildner ((m->in_op & FILE_OPINDIRECT) && *l++ != ')')) {
2221327e51cbSPeter Avalos if (ms->flags & MAGIC_CHECK)
2222327e51cbSPeter Avalos file_magwarn(ms,
2223327e51cbSPeter Avalos "missing ')' in indirect offset");
2224c30bd091SSascha Wildner return -1;
2225c30bd091SSascha Wildner }
2226327e51cbSPeter Avalos }
2227327e51cbSPeter Avalos EATAB;
2228327e51cbSPeter Avalos
2229327e51cbSPeter Avalos #ifdef ENABLE_CONDITIONALS
2230327e51cbSPeter Avalos m->cond = get_cond(l, &l);
2231327e51cbSPeter Avalos if (check_cond(ms, m->cond, cont_level) == -1)
2232327e51cbSPeter Avalos return -1;
2233327e51cbSPeter Avalos
2234327e51cbSPeter Avalos EATAB;
2235327e51cbSPeter Avalos #endif
2236327e51cbSPeter Avalos
2237e8af9738SPeter Avalos /*
2238e8af9738SPeter Avalos * Parse the type.
2239e8af9738SPeter Avalos */
2240327e51cbSPeter Avalos if (*l == 'u') {
2241e8af9738SPeter Avalos /*
2242e8af9738SPeter Avalos * Try it as a keyword type prefixed by "u"; match what
2243e8af9738SPeter Avalos * follows the "u". If that fails, try it as an SUS
2244e8af9738SPeter Avalos * integer type.
2245e8af9738SPeter Avalos */
2246e8af9738SPeter Avalos m->type = get_type(type_tbl, l + 1, &l);
2247e8af9738SPeter Avalos if (m->type == FILE_INVALID) {
2248e8af9738SPeter Avalos /*
2249e8af9738SPeter Avalos * Not a keyword type; parse it as an SUS type,
2250e8af9738SPeter Avalos * 'u' possibly followed by a number or C/S/L.
2251e8af9738SPeter Avalos */
2252e8af9738SPeter Avalos m->type = get_standard_integer_type(l, &l);
2253e8af9738SPeter Avalos }
225482c5fa3eSPeter Avalos /* It's unsigned. */
2255e8af9738SPeter Avalos if (m->type != FILE_INVALID)
2256327e51cbSPeter Avalos m->flag |= UNSIGNED;
2257e8af9738SPeter Avalos } else {
2258e8af9738SPeter Avalos /*
2259e8af9738SPeter Avalos * Try it as a keyword type. If that fails, try it as
2260e8af9738SPeter Avalos * an SUS integer type if it begins with "d" or as an
2261e8af9738SPeter Avalos * SUS string type if it begins with "s". In any case,
2262e8af9738SPeter Avalos * it's not unsigned.
2263e8af9738SPeter Avalos */
2264e8af9738SPeter Avalos m->type = get_type(type_tbl, l, &l);
2265e8af9738SPeter Avalos if (m->type == FILE_INVALID) {
2266e8af9738SPeter Avalos /*
2267e8af9738SPeter Avalos * Not a keyword type; parse it as an SUS type,
2268e8af9738SPeter Avalos * either 'd' possibly followed by a number or
2269e8af9738SPeter Avalos * C/S/L, or just 's'.
2270e8af9738SPeter Avalos */
2271e8af9738SPeter Avalos if (*l == 'd')
2272e8af9738SPeter Avalos m->type = get_standard_integer_type(l, &l);
22736fca56fbSSascha Wildner else if (*l == 's'
22746fca56fbSSascha Wildner && !isalpha(CAST(unsigned char, l[1]))) {
2275e8af9738SPeter Avalos m->type = FILE_STRING;
2276e8af9738SPeter Avalos ++l;
2277e8af9738SPeter Avalos }
2278e8af9738SPeter Avalos }
2279327e51cbSPeter Avalos }
2280327e51cbSPeter Avalos
2281e8af9738SPeter Avalos if (m->type == FILE_INVALID) {
2282e8af9738SPeter Avalos /* Not found - try it as a special keyword. */
2283e8af9738SPeter Avalos m->type = get_type(special_tbl, l, &l);
2284e8af9738SPeter Avalos }
2285e8af9738SPeter Avalos
2286327e51cbSPeter Avalos if (m->type == FILE_INVALID) {
2287327e51cbSPeter Avalos if (ms->flags & MAGIC_CHECK)
2288327e51cbSPeter Avalos file_magwarn(ms, "type `%s' invalid", l);
2289327e51cbSPeter Avalos return -1;
2290327e51cbSPeter Avalos }
2291327e51cbSPeter Avalos
2292970935fdSSascha Wildner if (m->type == FILE_NAME && cont_level != 0) {
2293970935fdSSascha Wildner if (ms->flags & MAGIC_CHECK)
2294970935fdSSascha Wildner file_magwarn(ms, "`name%s' entries can only be "
2295970935fdSSascha Wildner "declared at top level", l);
2296970935fdSSascha Wildner return -1;
2297970935fdSSascha Wildner }
2298970935fdSSascha Wildner
2299327e51cbSPeter Avalos /* New-style anding: "0 byte&0x80 =0x80 dynamically linked" */
2300327e51cbSPeter Avalos /* New and improved: ~ & | ^ + - * / % -- exciting, isn't it? */
2301327e51cbSPeter Avalos
2302327e51cbSPeter Avalos m->mask_op = 0;
2303327e51cbSPeter Avalos if (*l == '~') {
2304327e51cbSPeter Avalos if (!IS_STRING(m->type))
2305327e51cbSPeter Avalos m->mask_op |= FILE_OPINVERSE;
2306327e51cbSPeter Avalos else if (ms->flags & MAGIC_CHECK)
2307327e51cbSPeter Avalos file_magwarn(ms, "'~' invalid for string types");
2308327e51cbSPeter Avalos ++l;
2309327e51cbSPeter Avalos }
231079343712SPeter Avalos m->str_range = 0;
2311e4d4ce0cSPeter Avalos m->str_flags = m->type == FILE_PSTRING ? PSTRING_1_LE : 0;
2312327e51cbSPeter Avalos if ((op = get_op(*l)) != -1) {
231382c5fa3eSPeter Avalos if (IS_STRING(m->type)) {
231482c5fa3eSPeter Avalos int r;
231582c5fa3eSPeter Avalos
231682c5fa3eSPeter Avalos if (op != FILE_OPDIVIDE) {
2317327e51cbSPeter Avalos if (ms->flags & MAGIC_CHECK)
2318327e51cbSPeter Avalos file_magwarn(ms,
231982c5fa3eSPeter Avalos "invalid string/indirect op: "
232082c5fa3eSPeter Avalos "`%c'", *t);
2321327e51cbSPeter Avalos return -1;
2322327e51cbSPeter Avalos }
232382c5fa3eSPeter Avalos
232482c5fa3eSPeter Avalos if (m->type == FILE_INDIRECT)
232582c5fa3eSPeter Avalos r = parse_indirect_modifier(ms, m, &l);
232682c5fa3eSPeter Avalos else
232782c5fa3eSPeter Avalos r = parse_string_modifier(ms, m, &l);
232882c5fa3eSPeter Avalos if (r == -1)
2329327e51cbSPeter Avalos return -1;
233082c5fa3eSPeter Avalos } else
233182c5fa3eSPeter Avalos parse_op_modifier(ms, m, &l, op);
2332327e51cbSPeter Avalos }
233382c5fa3eSPeter Avalos
2334327e51cbSPeter Avalos /*
2335327e51cbSPeter Avalos * We used to set mask to all 1's here, instead let's just not do
2336327e51cbSPeter Avalos * anything if mask = 0 (unless you have a better idea)
2337327e51cbSPeter Avalos */
2338327e51cbSPeter Avalos EATAB;
2339327e51cbSPeter Avalos
2340327e51cbSPeter Avalos switch (*l) {
2341327e51cbSPeter Avalos case '>':
2342327e51cbSPeter Avalos case '<':
234379343712SPeter Avalos m->reln = *l;
234479343712SPeter Avalos ++l;
234579343712SPeter Avalos if (*l == '=') {
234679343712SPeter Avalos if (ms->flags & MAGIC_CHECK) {
234779343712SPeter Avalos file_magwarn(ms, "%c= not supported",
234879343712SPeter Avalos m->reln);
234979343712SPeter Avalos return -1;
235079343712SPeter Avalos }
235179343712SPeter Avalos ++l;
235279343712SPeter Avalos }
235379343712SPeter Avalos break;
2354327e51cbSPeter Avalos /* Old-style anding: "0 byte &0x80 dynamically linked" */
2355327e51cbSPeter Avalos case '&':
2356327e51cbSPeter Avalos case '^':
2357327e51cbSPeter Avalos case '=':
2358327e51cbSPeter Avalos m->reln = *l;
2359327e51cbSPeter Avalos ++l;
2360327e51cbSPeter Avalos if (*l == '=') {
2361327e51cbSPeter Avalos /* HP compat: ignore &= etc. */
2362327e51cbSPeter Avalos ++l;
2363327e51cbSPeter Avalos }
2364327e51cbSPeter Avalos break;
2365327e51cbSPeter Avalos case '!':
2366327e51cbSPeter Avalos m->reln = *l;
2367327e51cbSPeter Avalos ++l;
2368327e51cbSPeter Avalos break;
2369327e51cbSPeter Avalos default:
2370327e51cbSPeter Avalos m->reln = '='; /* the default relation */
23716fca56fbSSascha Wildner if (*l == 'x' && ((isascii(CAST(unsigned char, l[1])) &&
23726fca56fbSSascha Wildner isspace(CAST(unsigned char, l[1]))) || !l[1])) {
2373327e51cbSPeter Avalos m->reln = *l;
2374327e51cbSPeter Avalos ++l;
2375327e51cbSPeter Avalos }
2376327e51cbSPeter Avalos break;
2377327e51cbSPeter Avalos }
2378327e51cbSPeter Avalos /*
2379327e51cbSPeter Avalos * Grab the value part, except for an 'x' reln.
2380327e51cbSPeter Avalos */
2381327e51cbSPeter Avalos if (m->reln != 'x' && getvalue(ms, m, &l, action))
2382327e51cbSPeter Avalos return -1;
2383327e51cbSPeter Avalos
2384327e51cbSPeter Avalos /*
2385327e51cbSPeter Avalos * TODO finish this macro and start using it!
2386c30bd091SSascha Wildner * #define offsetcheck {if (offset > ms->bytes_max -1)
2387327e51cbSPeter Avalos * magwarn("offset too big"); }
2388327e51cbSPeter Avalos */
2389327e51cbSPeter Avalos
2390327e51cbSPeter Avalos /*
2391327e51cbSPeter Avalos * Now get last part - the description
2392327e51cbSPeter Avalos */
2393327e51cbSPeter Avalos EATAB;
2394327e51cbSPeter Avalos if (l[0] == '\b') {
2395327e51cbSPeter Avalos ++l;
239679343712SPeter Avalos m->flag |= NOSPACE;
2397327e51cbSPeter Avalos } else if ((l[0] == '\\') && (l[1] == 'b')) {
2398327e51cbSPeter Avalos ++l;
2399327e51cbSPeter Avalos ++l;
240079343712SPeter Avalos m->flag |= NOSPACE;
240179343712SPeter Avalos }
2402327e51cbSPeter Avalos for (i = 0; (m->desc[i++] = *l++) != '\0' && i < sizeof(m->desc); )
2403327e51cbSPeter Avalos continue;
2404327e51cbSPeter Avalos if (i == sizeof(m->desc)) {
2405327e51cbSPeter Avalos m->desc[sizeof(m->desc) - 1] = '\0';
2406327e51cbSPeter Avalos if (ms->flags & MAGIC_CHECK)
2407327e51cbSPeter Avalos file_magwarn(ms, "description `%s' truncated", m->desc);
2408327e51cbSPeter Avalos }
2409327e51cbSPeter Avalos
2410327e51cbSPeter Avalos /*
2411327e51cbSPeter Avalos * We only do this check while compiling, or if any of the magic
2412327e51cbSPeter Avalos * files were not compiled.
2413327e51cbSPeter Avalos */
2414327e51cbSPeter Avalos if (ms->flags & MAGIC_CHECK) {
2415327e51cbSPeter Avalos if (check_format(ms, m) == -1)
2416327e51cbSPeter Avalos return -1;
2417327e51cbSPeter Avalos }
2418327e51cbSPeter Avalos #ifndef COMPILE_ONLY
2419327e51cbSPeter Avalos if (action == FILE_CHECK) {
2420327e51cbSPeter Avalos file_mdump(m);
2421327e51cbSPeter Avalos }
2422327e51cbSPeter Avalos #endif
242379343712SPeter Avalos m->mimetype[0] = '\0'; /* initialise MIME type to none */
2424327e51cbSPeter Avalos return 0;
2425327e51cbSPeter Avalos }
2426327e51cbSPeter Avalos
242779343712SPeter Avalos /*
242879343712SPeter Avalos * parse a STRENGTH annotation line from magic file, put into magic[index - 1]
242979343712SPeter Avalos * if valid
243079343712SPeter Avalos */
2431*3b9cdfa3SAntonio Huete Jimenez /*ARGSUSED*/
243279343712SPeter Avalos private int
parse_strength(struct magic_set * ms,struct magic_entry * me,const char * line,size_t len)2433c990e5baSDaniel Fojt parse_strength(struct magic_set *ms, struct magic_entry *me, const char *line,
2434c990e5baSDaniel Fojt size_t len __attribute__((__unused__)))
243579343712SPeter Avalos {
243679343712SPeter Avalos const char *l = line;
243779343712SPeter Avalos char *el;
243879343712SPeter Avalos unsigned long factor;
243979343712SPeter Avalos struct magic *m = &me->mp[0];
244079343712SPeter Avalos
244179343712SPeter Avalos if (m->factor_op != FILE_FACTOR_OP_NONE) {
244279343712SPeter Avalos file_magwarn(ms,
244379343712SPeter Avalos "Current entry already has a strength type: %c %d",
244479343712SPeter Avalos m->factor_op, m->factor);
244579343712SPeter Avalos return -1;
244679343712SPeter Avalos }
2447e8af9738SPeter Avalos if (m->type == FILE_NAME) {
2448e8af9738SPeter Avalos file_magwarn(ms, "%s: Strength setting is not supported in "
2449e8af9738SPeter Avalos "\"name\" magic entries", m->value.s);
2450e8af9738SPeter Avalos return -1;
2451e8af9738SPeter Avalos }
245279343712SPeter Avalos EATAB;
245379343712SPeter Avalos switch (*l) {
245479343712SPeter Avalos case FILE_FACTOR_OP_NONE:
245579343712SPeter Avalos case FILE_FACTOR_OP_PLUS:
245679343712SPeter Avalos case FILE_FACTOR_OP_MINUS:
245779343712SPeter Avalos case FILE_FACTOR_OP_TIMES:
245879343712SPeter Avalos case FILE_FACTOR_OP_DIV:
245979343712SPeter Avalos m->factor_op = *l++;
246079343712SPeter Avalos break;
246179343712SPeter Avalos default:
246279343712SPeter Avalos file_magwarn(ms, "Unknown factor op `%c'", *l);
246379343712SPeter Avalos return -1;
246479343712SPeter Avalos }
246579343712SPeter Avalos EATAB;
246679343712SPeter Avalos factor = strtoul(l, &el, 0);
246779343712SPeter Avalos if (factor > 255) {
246879343712SPeter Avalos file_magwarn(ms, "Too large factor `%lu'", factor);
246979343712SPeter Avalos goto out;
247079343712SPeter Avalos }
24716fca56fbSSascha Wildner if (*el && !isspace(CAST(unsigned char, *el))) {
247279343712SPeter Avalos file_magwarn(ms, "Bad factor `%s'", l);
247379343712SPeter Avalos goto out;
247479343712SPeter Avalos }
24756fca56fbSSascha Wildner m->factor = CAST(uint8_t, factor);
247679343712SPeter Avalos if (m->factor == 0 && m->factor_op == FILE_FACTOR_OP_DIV) {
247779343712SPeter Avalos file_magwarn(ms, "Cannot have factor op `%c' and factor %u",
247879343712SPeter Avalos m->factor_op, m->factor);
247979343712SPeter Avalos goto out;
248079343712SPeter Avalos }
248179343712SPeter Avalos return 0;
248279343712SPeter Avalos out:
248379343712SPeter Avalos m->factor_op = FILE_FACTOR_OP_NONE;
248479343712SPeter Avalos m->factor = 0;
248579343712SPeter Avalos return -1;
248679343712SPeter Avalos }
248779343712SPeter Avalos
/*
 * Tell whether `x' may appear in an annotation value: any ASCII letter or
 * digit, or any character found by strchr() in `extra'.  Since strchr()
 * also matches the terminator, a NUL `x' yields non-zero.
 */
private int
goodchar(unsigned char x, const char *extra)
{
	if (isascii(x) && isalnum(x))
		return 1;
	return strchr(extra, x) != NULL;
}
249382c5fa3eSPeter Avalos
249482c5fa3eSPeter Avalos private int
parse_extra(struct magic_set * ms,struct magic_entry * me,const char * line,size_t llen,off_t off,size_t len,const char * name,const char * extra,int nt)2495e8af9738SPeter Avalos parse_extra(struct magic_set *ms, struct magic_entry *me, const char *line,
2496c990e5baSDaniel Fojt size_t llen, off_t off, size_t len, const char *name, const char *extra,
2497c990e5baSDaniel Fojt int nt)
2498e8af9738SPeter Avalos {
2499e8af9738SPeter Avalos size_t i;
2500e8af9738SPeter Avalos const char *l = line;
2501e8af9738SPeter Avalos struct magic *m = &me->mp[me->cont_count == 0 ? 0 : me->cont_count - 1];
2502c30bd091SSascha Wildner char *buf = CAST(char *, CAST(void *, m)) + off;
2503e8af9738SPeter Avalos
2504e8af9738SPeter Avalos if (buf[0] != '\0') {
2505e8af9738SPeter Avalos len = nt ? strlen(buf) : len;
2506e8af9738SPeter Avalos file_magwarn(ms, "Current entry already has a %s type "
25076fca56fbSSascha Wildner "`%.*s', new type `%s'", name, CAST(int, len), buf, l);
2508e8af9738SPeter Avalos return -1;
2509e8af9738SPeter Avalos }
2510e8af9738SPeter Avalos
2511e8af9738SPeter Avalos if (*m->desc == '\0') {
2512e8af9738SPeter Avalos file_magwarn(ms, "Current entry does not yet have a "
2513e8af9738SPeter Avalos "description for adding a %s type", name);
2514e8af9738SPeter Avalos return -1;
2515e8af9738SPeter Avalos }
2516e8af9738SPeter Avalos
2517e8af9738SPeter Avalos EATAB;
2518c990e5baSDaniel Fojt for (i = 0; *l && i < llen && i < len && goodchar(*l, extra);
2519c990e5baSDaniel Fojt buf[i++] = *l++)
2520e8af9738SPeter Avalos continue;
2521e8af9738SPeter Avalos
2522e8af9738SPeter Avalos if (i == len && *l) {
2523e8af9738SPeter Avalos if (nt)
2524e8af9738SPeter Avalos buf[len - 1] = '\0';
2525e8af9738SPeter Avalos if (ms->flags & MAGIC_CHECK)
2526e8af9738SPeter Avalos file_magwarn(ms, "%s type `%s' truncated %"
2527e8af9738SPeter Avalos SIZE_T_FORMAT "u", name, line, i);
2528e8af9738SPeter Avalos } else {
25296fca56fbSSascha Wildner if (!isspace(CAST(unsigned char, *l)) && !goodchar(*l, extra))
253082c5fa3eSPeter Avalos file_magwarn(ms, "%s type `%s' has bad char '%c'",
253182c5fa3eSPeter Avalos name, line, *l);
2532e8af9738SPeter Avalos if (nt)
2533e8af9738SPeter Avalos buf[i] = '\0';
2534e8af9738SPeter Avalos }
2535e8af9738SPeter Avalos
2536e8af9738SPeter Avalos if (i > 0)
2537e8af9738SPeter Avalos return 0;
253882c5fa3eSPeter Avalos
253982c5fa3eSPeter Avalos file_magerror(ms, "Bad magic entry '%s'", line);
2540e8af9738SPeter Avalos return -1;
2541e8af9738SPeter Avalos }
2542e8af9738SPeter Avalos
254379343712SPeter Avalos /*
2544e4d4ce0cSPeter Avalos * Parse an Apple CREATOR/TYPE annotation from magic file and put it into
2545e4d4ce0cSPeter Avalos * magic[index - 1]
254679343712SPeter Avalos */
254779343712SPeter Avalos private int
parse_apple(struct magic_set * ms,struct magic_entry * me,const char * line,size_t len)2548c990e5baSDaniel Fojt parse_apple(struct magic_set *ms, struct magic_entry *me, const char *line,
2549c990e5baSDaniel Fojt size_t len)
255079343712SPeter Avalos {
2551c990e5baSDaniel Fojt return parse_extra(ms, me, line, len,
2552c30bd091SSascha Wildner CAST(off_t, offsetof(struct magic, apple)),
2553*3b9cdfa3SAntonio Huete Jimenez sizeof(me->mp[0].apple), "APPLE", "!+-./?", 0);
2554c30bd091SSascha Wildner }
2555c30bd091SSascha Wildner
2556c30bd091SSascha Wildner /*
2557c30bd091SSascha Wildner * Parse a comma-separated list of extensions
2558c30bd091SSascha Wildner */
2559c30bd091SSascha Wildner private int
parse_ext(struct magic_set * ms,struct magic_entry * me,const char * line,size_t len)2560c990e5baSDaniel Fojt parse_ext(struct magic_set *ms, struct magic_entry *me, const char *line,
2561c990e5baSDaniel Fojt size_t len)
2562c30bd091SSascha Wildner {
2563c990e5baSDaniel Fojt return parse_extra(ms, me, line, len,
2564c30bd091SSascha Wildner CAST(off_t, offsetof(struct magic, ext)),
2565*3b9cdfa3SAntonio Huete Jimenez sizeof(me->mp[0].ext), "EXTENSION", ",!+-/@?_$&", 0); /* & for b&w */
256679343712SPeter Avalos }
256779343712SPeter Avalos
256879343712SPeter Avalos /*
256979343712SPeter Avalos * parse a MIME annotation line from magic file, put into magic[index - 1]
257079343712SPeter Avalos * if valid
257179343712SPeter Avalos */
257279343712SPeter Avalos private int
parse_mime(struct magic_set * ms,struct magic_entry * me,const char * line,size_t len)2573c990e5baSDaniel Fojt parse_mime(struct magic_set *ms, struct magic_entry *me, const char *line,
2574c990e5baSDaniel Fojt size_t len)
257579343712SPeter Avalos {
2576c990e5baSDaniel Fojt return parse_extra(ms, me, line, len,
2577c30bd091SSascha Wildner CAST(off_t, offsetof(struct magic, mimetype)),
2578*3b9cdfa3SAntonio Huete Jimenez sizeof(me->mp[0].mimetype), "MIME", "+-/.$?:{}", 1);
257979343712SPeter Avalos }
258079343712SPeter Avalos
2581327e51cbSPeter Avalos private int
check_format_type(const char * ptr,int type,const char ** estr)2582c30bd091SSascha Wildner check_format_type(const char *ptr, int type, const char **estr)
2583327e51cbSPeter Avalos {
258482c5fa3eSPeter Avalos int quad = 0, h;
2585c30bd091SSascha Wildner size_t len, cnt;
2586327e51cbSPeter Avalos if (*ptr == '\0') {
2587327e51cbSPeter Avalos /* Missing format string; bad */
2588c30bd091SSascha Wildner *estr = "missing format spec";
2589327e51cbSPeter Avalos return -1;
2590327e51cbSPeter Avalos }
2591327e51cbSPeter Avalos
259282c5fa3eSPeter Avalos switch (file_formats[type]) {
2593327e51cbSPeter Avalos case FILE_FMT_QUAD:
2594327e51cbSPeter Avalos quad = 1;
2595327e51cbSPeter Avalos /*FALLTHROUGH*/
2596327e51cbSPeter Avalos case FILE_FMT_NUM:
259782c5fa3eSPeter Avalos if (quad == 0) {
259882c5fa3eSPeter Avalos switch (type) {
259982c5fa3eSPeter Avalos case FILE_BYTE:
260082c5fa3eSPeter Avalos h = 2;
260182c5fa3eSPeter Avalos break;
260282c5fa3eSPeter Avalos case FILE_SHORT:
260382c5fa3eSPeter Avalos case FILE_BESHORT:
260482c5fa3eSPeter Avalos case FILE_LESHORT:
260582c5fa3eSPeter Avalos h = 1;
260682c5fa3eSPeter Avalos break;
260782c5fa3eSPeter Avalos case FILE_LONG:
260882c5fa3eSPeter Avalos case FILE_BELONG:
260982c5fa3eSPeter Avalos case FILE_LELONG:
261082c5fa3eSPeter Avalos case FILE_MELONG:
261182c5fa3eSPeter Avalos case FILE_LEID3:
261282c5fa3eSPeter Avalos case FILE_BEID3:
261382c5fa3eSPeter Avalos case FILE_INDIRECT:
261482c5fa3eSPeter Avalos h = 0;
261582c5fa3eSPeter Avalos break;
261682c5fa3eSPeter Avalos default:
2617*3b9cdfa3SAntonio Huete Jimenez fprintf(stderr, "Bad number format %d", type);
261882c5fa3eSPeter Avalos abort();
261982c5fa3eSPeter Avalos }
262082c5fa3eSPeter Avalos } else
262182c5fa3eSPeter Avalos h = 0;
2622614728caSSascha Wildner while (*ptr && strchr("-.#", *ptr) != NULL)
2623c30bd091SSascha Wildner ptr++;
2624c30bd091SSascha Wildner #define CHECKLEN() do { \
26256fca56fbSSascha Wildner for (len = cnt = 0; isdigit(CAST(unsigned char, *ptr)); ptr++, cnt++) \
2626c30bd091SSascha Wildner len = len * 10 + (*ptr - '0'); \
2627c30bd091SSascha Wildner if (cnt > 5 || len > 1024) \
2628c30bd091SSascha Wildner goto toolong; \
2629c30bd091SSascha Wildner } while (/*CONSTCOND*/0)
2630c30bd091SSascha Wildner
2631c30bd091SSascha Wildner CHECKLEN();
2632327e51cbSPeter Avalos if (*ptr == '.')
2633327e51cbSPeter Avalos ptr++;
2634c30bd091SSascha Wildner CHECKLEN();
2635327e51cbSPeter Avalos if (quad) {
2636327e51cbSPeter Avalos if (*ptr++ != 'l')
2637c30bd091SSascha Wildner goto invalid;
2638327e51cbSPeter Avalos if (*ptr++ != 'l')
2639c30bd091SSascha Wildner goto invalid;
2640327e51cbSPeter Avalos }
2641327e51cbSPeter Avalos
2642327e51cbSPeter Avalos switch (*ptr++) {
264382c5fa3eSPeter Avalos #ifdef STRICT_FORMAT /* "long" formats are int formats for us */
264482c5fa3eSPeter Avalos /* so don't accept the 'l' modifier */
2645327e51cbSPeter Avalos case 'l':
2646327e51cbSPeter Avalos switch (*ptr++) {
2647327e51cbSPeter Avalos case 'i':
2648327e51cbSPeter Avalos case 'd':
2649327e51cbSPeter Avalos case 'u':
2650e8af9738SPeter Avalos case 'o':
2651327e51cbSPeter Avalos case 'x':
2652327e51cbSPeter Avalos case 'X':
2653c30bd091SSascha Wildner if (h == 0)
2654c30bd091SSascha Wildner return 0;
2655c30bd091SSascha Wildner /*FALLTHROUGH*/
2656327e51cbSPeter Avalos default:
2657c30bd091SSascha Wildner goto invalid;
2658327e51cbSPeter Avalos }
2659327e51cbSPeter Avalos
266082c5fa3eSPeter Avalos /*
266182c5fa3eSPeter Avalos * Don't accept h and hh modifiers. They make writing
266282c5fa3eSPeter Avalos * magic entries more complicated, for very little benefit
266382c5fa3eSPeter Avalos */
2664327e51cbSPeter Avalos case 'h':
266582c5fa3eSPeter Avalos if (h-- <= 0)
2666c30bd091SSascha Wildner goto invalid;
2667327e51cbSPeter Avalos switch (*ptr++) {
2668327e51cbSPeter Avalos case 'h':
266982c5fa3eSPeter Avalos if (h-- <= 0)
2670c30bd091SSascha Wildner goto invalid;
2671327e51cbSPeter Avalos switch (*ptr++) {
2672327e51cbSPeter Avalos case 'i':
2673327e51cbSPeter Avalos case 'd':
2674327e51cbSPeter Avalos case 'u':
2675e8af9738SPeter Avalos case 'o':
2676327e51cbSPeter Avalos case 'x':
2677327e51cbSPeter Avalos case 'X':
2678327e51cbSPeter Avalos return 0;
2679327e51cbSPeter Avalos default:
2680c30bd091SSascha Wildner goto invalid;
2681327e51cbSPeter Avalos }
268282c5fa3eSPeter Avalos case 'i':
2683327e51cbSPeter Avalos case 'd':
268482c5fa3eSPeter Avalos case 'u':
268582c5fa3eSPeter Avalos case 'o':
268682c5fa3eSPeter Avalos case 'x':
268782c5fa3eSPeter Avalos case 'X':
2688c30bd091SSascha Wildner if (h == 0)
2689c30bd091SSascha Wildner return 0;
2690c30bd091SSascha Wildner /*FALLTHROUGH*/
2691327e51cbSPeter Avalos default:
2692c30bd091SSascha Wildner goto invalid;
2693327e51cbSPeter Avalos }
269482c5fa3eSPeter Avalos #endif
2695327e51cbSPeter Avalos case 'c':
2696c30bd091SSascha Wildner if (h == 2)
2697c30bd091SSascha Wildner return 0;
2698c30bd091SSascha Wildner goto invalid;
269982c5fa3eSPeter Avalos case 'i':
2700327e51cbSPeter Avalos case 'd':
2701327e51cbSPeter Avalos case 'u':
2702e8af9738SPeter Avalos case 'o':
2703327e51cbSPeter Avalos case 'x':
2704327e51cbSPeter Avalos case 'X':
270582c5fa3eSPeter Avalos #ifdef STRICT_FORMAT
2706c30bd091SSascha Wildner if (h == 0)
2707c30bd091SSascha Wildner return 0;
2708c30bd091SSascha Wildner /*FALLTHROUGH*/
270982c5fa3eSPeter Avalos #else
2710327e51cbSPeter Avalos return 0;
271182c5fa3eSPeter Avalos #endif
2712327e51cbSPeter Avalos default:
2713c30bd091SSascha Wildner goto invalid;
2714327e51cbSPeter Avalos }
2715327e51cbSPeter Avalos
2716327e51cbSPeter Avalos case FILE_FMT_FLOAT:
2717327e51cbSPeter Avalos case FILE_FMT_DOUBLE:
2718327e51cbSPeter Avalos if (*ptr == '-')
2719327e51cbSPeter Avalos ptr++;
2720327e51cbSPeter Avalos if (*ptr == '.')
2721327e51cbSPeter Avalos ptr++;
2722c30bd091SSascha Wildner CHECKLEN();
2723327e51cbSPeter Avalos if (*ptr == '.')
2724327e51cbSPeter Avalos ptr++;
2725c30bd091SSascha Wildner CHECKLEN();
2726327e51cbSPeter Avalos switch (*ptr++) {
2727327e51cbSPeter Avalos case 'e':
2728327e51cbSPeter Avalos case 'E':
2729327e51cbSPeter Avalos case 'f':
2730327e51cbSPeter Avalos case 'F':
2731327e51cbSPeter Avalos case 'g':
2732327e51cbSPeter Avalos case 'G':
2733327e51cbSPeter Avalos return 0;
2734327e51cbSPeter Avalos
2735327e51cbSPeter Avalos default:
2736c30bd091SSascha Wildner goto invalid;
2737327e51cbSPeter Avalos }
2738327e51cbSPeter Avalos
2739327e51cbSPeter Avalos
2740327e51cbSPeter Avalos case FILE_FMT_STR:
2741327e51cbSPeter Avalos if (*ptr == '-')
2742327e51cbSPeter Avalos ptr++;
27436fca56fbSSascha Wildner while (isdigit(CAST(unsigned char, *ptr)))
2744327e51cbSPeter Avalos ptr++;
2745327e51cbSPeter Avalos if (*ptr == '.') {
2746327e51cbSPeter Avalos ptr++;
27476fca56fbSSascha Wildner while (isdigit(CAST(unsigned char , *ptr)))
2748327e51cbSPeter Avalos ptr++;
2749327e51cbSPeter Avalos }
2750327e51cbSPeter Avalos
2751327e51cbSPeter Avalos switch (*ptr++) {
2752327e51cbSPeter Avalos case 's':
2753327e51cbSPeter Avalos return 0;
2754327e51cbSPeter Avalos default:
2755c30bd091SSascha Wildner goto invalid;
2756327e51cbSPeter Avalos }
2757327e51cbSPeter Avalos
2758327e51cbSPeter Avalos default:
2759327e51cbSPeter Avalos /* internal error */
2760*3b9cdfa3SAntonio Huete Jimenez fprintf(stderr, "Bad file format %d", type);
2761327e51cbSPeter Avalos abort();
2762327e51cbSPeter Avalos }
2763c30bd091SSascha Wildner invalid:
2764c30bd091SSascha Wildner *estr = "not valid";
2765c30bd091SSascha Wildner toolong:
2766c30bd091SSascha Wildner *estr = "too long";
2767327e51cbSPeter Avalos return -1;
2768327e51cbSPeter Avalos }
2769327e51cbSPeter Avalos
2770327e51cbSPeter Avalos /*
2771327e51cbSPeter Avalos * Check that the optional printf format in description matches
2772327e51cbSPeter Avalos * the type of the magic.
2773327e51cbSPeter Avalos */
2774327e51cbSPeter Avalos private int
check_format(struct magic_set * ms,struct magic * m)2775327e51cbSPeter Avalos check_format(struct magic_set *ms, struct magic *m)
2776327e51cbSPeter Avalos {
2777327e51cbSPeter Avalos char *ptr;
2778c30bd091SSascha Wildner const char *estr;
2779327e51cbSPeter Avalos
2780327e51cbSPeter Avalos for (ptr = m->desc; *ptr; ptr++)
2781327e51cbSPeter Avalos if (*ptr == '%')
2782327e51cbSPeter Avalos break;
2783327e51cbSPeter Avalos if (*ptr == '\0') {
2784327e51cbSPeter Avalos /* No format string; ok */
2785327e51cbSPeter Avalos return 1;
2786327e51cbSPeter Avalos }
2787327e51cbSPeter Avalos
2788327e51cbSPeter Avalos assert(file_nformats == file_nnames);
2789327e51cbSPeter Avalos
2790327e51cbSPeter Avalos if (m->type >= file_nformats) {
279179343712SPeter Avalos file_magwarn(ms, "Internal error inconsistency between "
2792327e51cbSPeter Avalos "m->type and format strings");
2793327e51cbSPeter Avalos return -1;
2794327e51cbSPeter Avalos }
2795327e51cbSPeter Avalos if (file_formats[m->type] == FILE_FMT_NONE) {
279679343712SPeter Avalos file_magwarn(ms, "No format string for `%s' with description "
2797327e51cbSPeter Avalos "`%s'", m->desc, file_names[m->type]);
2798327e51cbSPeter Avalos return -1;
2799327e51cbSPeter Avalos }
2800327e51cbSPeter Avalos
2801327e51cbSPeter Avalos ptr++;
2802c30bd091SSascha Wildner if (check_format_type(ptr, m->type, &estr) == -1) {
2803327e51cbSPeter Avalos /*
2804327e51cbSPeter Avalos * TODO: this error message is unhelpful if the format
2805327e51cbSPeter Avalos * string is not one character long
2806327e51cbSPeter Avalos */
2807c30bd091SSascha Wildner file_magwarn(ms, "Printf format is %s for type "
2808c30bd091SSascha Wildner "`%s' in description `%s'", estr,
2809327e51cbSPeter Avalos file_names[m->type], m->desc);
2810327e51cbSPeter Avalos return -1;
2811327e51cbSPeter Avalos }
2812327e51cbSPeter Avalos
2813327e51cbSPeter Avalos for (; *ptr; ptr++) {
2814327e51cbSPeter Avalos if (*ptr == '%') {
281579343712SPeter Avalos file_magwarn(ms,
2816327e51cbSPeter Avalos "Too many format strings (should have at most one) "
2817327e51cbSPeter Avalos "for `%s' with description `%s'",
2818327e51cbSPeter Avalos file_names[m->type], m->desc);
2819327e51cbSPeter Avalos return -1;
2820327e51cbSPeter Avalos }
2821327e51cbSPeter Avalos }
2822327e51cbSPeter Avalos return 0;
2823327e51cbSPeter Avalos }
2824327e51cbSPeter Avalos
2825327e51cbSPeter Avalos /*
2826327e51cbSPeter Avalos * Read a numeric value from a pointer, into the value union of a magic
2827327e51cbSPeter Avalos * pointer, according to the magic type. Update the string pointer to point
2828327e51cbSPeter Avalos * just after the number read. Return 0 for success, non-zero for failure.
2829327e51cbSPeter Avalos */
2830327e51cbSPeter Avalos private int
getvalue(struct magic_set * ms,struct magic * m,const char ** p,int action)2831327e51cbSPeter Avalos getvalue(struct magic_set *ms, struct magic *m, const char **p, int action)
2832327e51cbSPeter Avalos {
28336fca56fbSSascha Wildner char *ep;
28346fca56fbSSascha Wildner uint64_t ull;
28356fca56fbSSascha Wildner
2836327e51cbSPeter Avalos switch (m->type) {
2837327e51cbSPeter Avalos case FILE_BESTRING16:
2838327e51cbSPeter Avalos case FILE_LESTRING16:
2839327e51cbSPeter Avalos case FILE_STRING:
2840327e51cbSPeter Avalos case FILE_PSTRING:
2841327e51cbSPeter Avalos case FILE_REGEX:
2842327e51cbSPeter Avalos case FILE_SEARCH:
2843e8af9738SPeter Avalos case FILE_NAME:
2844e8af9738SPeter Avalos case FILE_USE:
2845c30bd091SSascha Wildner case FILE_DER:
2846*3b9cdfa3SAntonio Huete Jimenez case FILE_OCTAL:
284779343712SPeter Avalos *p = getstr(ms, m, *p, action == FILE_COMPILE);
2848327e51cbSPeter Avalos if (*p == NULL) {
2849327e51cbSPeter Avalos if (ms->flags & MAGIC_CHECK)
2850327e51cbSPeter Avalos file_magwarn(ms, "cannot get string from `%s'",
2851327e51cbSPeter Avalos m->value.s);
2852327e51cbSPeter Avalos return -1;
2853327e51cbSPeter Avalos }
285482c5fa3eSPeter Avalos if (m->type == FILE_REGEX) {
285582c5fa3eSPeter Avalos file_regex_t rx;
2856*3b9cdfa3SAntonio Huete Jimenez int rc = file_regcomp(ms, &rx, m->value.s,
2857*3b9cdfa3SAntonio Huete Jimenez REG_EXTENDED);
2858*3b9cdfa3SAntonio Huete Jimenez if (rc == 0) {
285982c5fa3eSPeter Avalos file_regfree(&rx);
2860*3b9cdfa3SAntonio Huete Jimenez }
286182c5fa3eSPeter Avalos return rc ? -1 : 0;
286282c5fa3eSPeter Avalos }
2863327e51cbSPeter Avalos return 0;
28646fca56fbSSascha Wildner default:
28656fca56fbSSascha Wildner if (m->reln == 'x')
28666fca56fbSSascha Wildner return 0;
28676fca56fbSSascha Wildner break;
28686fca56fbSSascha Wildner }
28696fca56fbSSascha Wildner
28706fca56fbSSascha Wildner switch (m->type) {
2871327e51cbSPeter Avalos case FILE_FLOAT:
2872327e51cbSPeter Avalos case FILE_BEFLOAT:
2873327e51cbSPeter Avalos case FILE_LEFLOAT:
2874c30bd091SSascha Wildner errno = 0;
2875327e51cbSPeter Avalos #ifdef HAVE_STRTOF
2876327e51cbSPeter Avalos m->value.f = strtof(*p, &ep);
2877327e51cbSPeter Avalos #else
2878327e51cbSPeter Avalos m->value.f = (float)strtod(*p, &ep);
2879327e51cbSPeter Avalos #endif
2880c30bd091SSascha Wildner if (errno == 0)
2881327e51cbSPeter Avalos *p = ep;
2882327e51cbSPeter Avalos return 0;
2883327e51cbSPeter Avalos case FILE_DOUBLE:
2884327e51cbSPeter Avalos case FILE_BEDOUBLE:
2885327e51cbSPeter Avalos case FILE_LEDOUBLE:
2886c30bd091SSascha Wildner errno = 0;
2887327e51cbSPeter Avalos m->value.d = strtod(*p, &ep);
2888c30bd091SSascha Wildner if (errno == 0)
2889327e51cbSPeter Avalos *p = ep;
2890327e51cbSPeter Avalos return 0;
2891c990e5baSDaniel Fojt case FILE_GUID:
2892c990e5baSDaniel Fojt if (file_parse_guid(*p, m->value.guid) == -1)
2893c990e5baSDaniel Fojt return -1;
2894c990e5baSDaniel Fojt *p += FILE_GUID_SIZE - 1;
2895c990e5baSDaniel Fojt return 0;
2896327e51cbSPeter Avalos default:
2897c30bd091SSascha Wildner errno = 0;
28986fca56fbSSascha Wildner ull = CAST(uint64_t, strtoull(*p, &ep, 0));
2899c30bd091SSascha Wildner m->value.q = file_signextend(ms, m, ull);
2900c30bd091SSascha Wildner if (*p == ep) {
2901970935fdSSascha Wildner file_magwarn(ms, "Unparsable number `%s'", *p);
2902c30bd091SSascha Wildner } else {
2903c30bd091SSascha Wildner size_t ts = typesize(m->type);
2904c30bd091SSascha Wildner uint64_t x;
2905c30bd091SSascha Wildner const char *q;
2906c30bd091SSascha Wildner
2907c990e5baSDaniel Fojt if (ts == FILE_BADSIZE) {
29086fca56fbSSascha Wildner file_magwarn(ms,
29096fca56fbSSascha Wildner "Expected numeric type got `%s'",
2910c30bd091SSascha Wildner type_tbl[m->type].name);
2911c30bd091SSascha Wildner }
29126fca56fbSSascha Wildner for (q = *p; isspace(CAST(unsigned char, *q)); q++)
2913c30bd091SSascha Wildner continue;
2914c30bd091SSascha Wildner if (*q == '-')
29156fca56fbSSascha Wildner ull = -CAST(int64_t, ull);
2916c30bd091SSascha Wildner switch (ts) {
2917c30bd091SSascha Wildner case 1:
29186fca56fbSSascha Wildner x = CAST(uint64_t, ull & ~0xffULL);
2919c30bd091SSascha Wildner break;
2920c30bd091SSascha Wildner case 2:
29216fca56fbSSascha Wildner x = CAST(uint64_t, ull & ~0xffffULL);
2922c30bd091SSascha Wildner break;
2923c30bd091SSascha Wildner case 4:
29246fca56fbSSascha Wildner x = CAST(uint64_t, ull & ~0xffffffffULL);
2925c30bd091SSascha Wildner break;
2926c30bd091SSascha Wildner case 8:
2927c30bd091SSascha Wildner x = 0;
2928c30bd091SSascha Wildner break;
2929c30bd091SSascha Wildner default:
2930*3b9cdfa3SAntonio Huete Jimenez fprintf(stderr, "Bad width %zu", ts);
2931c30bd091SSascha Wildner abort();
2932c30bd091SSascha Wildner }
2933c30bd091SSascha Wildner if (x) {
29346fca56fbSSascha Wildner file_magwarn(ms, "Overflow for numeric"
29356fca56fbSSascha Wildner " type `%s' value %#" PRIx64,
2936c30bd091SSascha Wildner type_tbl[m->type].name, ull);
2937c30bd091SSascha Wildner }
2938c30bd091SSascha Wildner }
2939c30bd091SSascha Wildner if (errno == 0) {
2940327e51cbSPeter Avalos *p = ep;
2941327e51cbSPeter Avalos eatsize(p);
2942327e51cbSPeter Avalos }
2943327e51cbSPeter Avalos return 0;
2944327e51cbSPeter Avalos }
2945327e51cbSPeter Avalos }
2946327e51cbSPeter Avalos
2947327e51cbSPeter Avalos /*
2948327e51cbSPeter Avalos * Convert a string containing C character escapes. Stop at an unescaped
2949327e51cbSPeter Avalos * space or tab.
295079343712SPeter Avalos * Copy the converted version to "m->value.s", and the length in m->vallen.
295179343712SPeter Avalos * Return updated scan pointer as function result. Warn if set.
2952327e51cbSPeter Avalos */
2953327e51cbSPeter Avalos private const char *
getstr(struct magic_set * ms,struct magic * m,const char * s,int warn)295479343712SPeter Avalos getstr(struct magic_set *ms, struct magic *m, const char *s, int warn)
2955327e51cbSPeter Avalos {
2956327e51cbSPeter Avalos const char *origs = s;
295779343712SPeter Avalos char *p = m->value.s;
295879343712SPeter Avalos size_t plen = sizeof(m->value.s);
2959327e51cbSPeter Avalos char *origp = p;
2960327e51cbSPeter Avalos char *pmax = p + plen - 1;
2961327e51cbSPeter Avalos int c;
2962327e51cbSPeter Avalos int val;
2963*3b9cdfa3SAntonio Huete Jimenez size_t bracket_nesting = 0;
2964327e51cbSPeter Avalos
2965327e51cbSPeter Avalos while ((c = *s++) != '\0') {
29666fca56fbSSascha Wildner if (isspace(CAST(unsigned char, c)))
2967327e51cbSPeter Avalos break;
2968327e51cbSPeter Avalos if (p >= pmax) {
2969327e51cbSPeter Avalos file_error(ms, 0, "string too long: `%s'", origs);
2970327e51cbSPeter Avalos return NULL;
2971327e51cbSPeter Avalos }
2972*3b9cdfa3SAntonio Huete Jimenez if (c != '\\') {
2973*3b9cdfa3SAntonio Huete Jimenez if (c == '[') {
2974*3b9cdfa3SAntonio Huete Jimenez bracket_nesting++;
2975*3b9cdfa3SAntonio Huete Jimenez }
2976*3b9cdfa3SAntonio Huete Jimenez if (c == ']' && bracket_nesting > 0) {
2977*3b9cdfa3SAntonio Huete Jimenez bracket_nesting--;
2978*3b9cdfa3SAntonio Huete Jimenez }
2979*3b9cdfa3SAntonio Huete Jimenez *p++ = CAST(char, c);
2980*3b9cdfa3SAntonio Huete Jimenez continue;
2981*3b9cdfa3SAntonio Huete Jimenez }
2982327e51cbSPeter Avalos switch(c = *s++) {
2983327e51cbSPeter Avalos
2984327e51cbSPeter Avalos case '\0':
298579343712SPeter Avalos if (warn)
2986327e51cbSPeter Avalos file_magwarn(ms, "incomplete escape");
2987c30bd091SSascha Wildner s--;
2988327e51cbSPeter Avalos goto out;
2989*3b9cdfa3SAntonio Huete Jimenez case '.':
2990*3b9cdfa3SAntonio Huete Jimenez if (m->type == FILE_REGEX &&
2991*3b9cdfa3SAntonio Huete Jimenez bracket_nesting == 0 && warn) {
2992*3b9cdfa3SAntonio Huete Jimenez file_magwarn(ms, "escaped dot ('.') found, "
2993*3b9cdfa3SAntonio Huete Jimenez "use \\\\. instead");
2994*3b9cdfa3SAntonio Huete Jimenez }
2995*3b9cdfa3SAntonio Huete Jimenez warn = 0; /* already did */
2996*3b9cdfa3SAntonio Huete Jimenez /*FALLTHROUGH*/
2997327e51cbSPeter Avalos case '\t':
299879343712SPeter Avalos if (warn) {
2999327e51cbSPeter Avalos file_magwarn(ms,
3000*3b9cdfa3SAntonio Huete Jimenez "escaped tab found, use \\\\t instead");
300179343712SPeter Avalos warn = 0; /* already did */
3002327e51cbSPeter Avalos }
3003327e51cbSPeter Avalos /*FALLTHROUGH*/
3004327e51cbSPeter Avalos default:
300579343712SPeter Avalos if (warn) {
30066fca56fbSSascha Wildner if (isprint(CAST(unsigned char, c))) {
300779343712SPeter Avalos /* Allow escaping of
300879343712SPeter Avalos * ``relations'' */
3009e4d4ce0cSPeter Avalos if (strchr("<>&^=!", c) == NULL
3010e4d4ce0cSPeter Avalos && (m->type != FILE_REGEX ||
3011e4d4ce0cSPeter Avalos strchr("[]().*?^$|{}", c)
3012e4d4ce0cSPeter Avalos == NULL)) {
301379343712SPeter Avalos file_magwarn(ms, "no "
301479343712SPeter Avalos "need to escape "
301579343712SPeter Avalos "`%c'", c);
301679343712SPeter Avalos }
301779343712SPeter Avalos } else {
3018327e51cbSPeter Avalos file_magwarn(ms,
301979343712SPeter Avalos "unknown escape sequence: "
302079343712SPeter Avalos "\\%03o", c);
302179343712SPeter Avalos }
3022327e51cbSPeter Avalos }
3023327e51cbSPeter Avalos /*FALLTHROUGH*/
3024327e51cbSPeter Avalos /* space, perhaps force people to use \040? */
3025327e51cbSPeter Avalos case ' ':
3026327e51cbSPeter Avalos #if 0
3027327e51cbSPeter Avalos /*
3028327e51cbSPeter Avalos * Other things people escape, but shouldn't need to,
3029327e51cbSPeter Avalos * so we disallow them
3030327e51cbSPeter Avalos */
3031327e51cbSPeter Avalos case '\'':
3032327e51cbSPeter Avalos case '"':
3033327e51cbSPeter Avalos case '?':
3034327e51cbSPeter Avalos #endif
3035327e51cbSPeter Avalos /* Relations */
3036327e51cbSPeter Avalos case '>':
3037327e51cbSPeter Avalos case '<':
3038327e51cbSPeter Avalos case '&':
3039327e51cbSPeter Avalos case '^':
3040327e51cbSPeter Avalos case '=':
3041327e51cbSPeter Avalos case '!':
3042*3b9cdfa3SAntonio Huete Jimenez /* and backslash itself */
3043327e51cbSPeter Avalos case '\\':
30446fca56fbSSascha Wildner *p++ = CAST(char, c);
3045327e51cbSPeter Avalos break;
3046327e51cbSPeter Avalos
3047327e51cbSPeter Avalos case 'a':
3048327e51cbSPeter Avalos *p++ = '\a';
3049327e51cbSPeter Avalos break;
3050327e51cbSPeter Avalos
3051327e51cbSPeter Avalos case 'b':
3052327e51cbSPeter Avalos *p++ = '\b';
3053327e51cbSPeter Avalos break;
3054327e51cbSPeter Avalos
3055327e51cbSPeter Avalos case 'f':
3056327e51cbSPeter Avalos *p++ = '\f';
3057327e51cbSPeter Avalos break;
3058327e51cbSPeter Avalos
3059327e51cbSPeter Avalos case 'n':
3060327e51cbSPeter Avalos *p++ = '\n';
3061327e51cbSPeter Avalos break;
3062327e51cbSPeter Avalos
3063327e51cbSPeter Avalos case 'r':
3064327e51cbSPeter Avalos *p++ = '\r';
3065327e51cbSPeter Avalos break;
3066327e51cbSPeter Avalos
3067327e51cbSPeter Avalos case 't':
3068327e51cbSPeter Avalos *p++ = '\t';
3069327e51cbSPeter Avalos break;
3070327e51cbSPeter Avalos
3071327e51cbSPeter Avalos case 'v':
3072327e51cbSPeter Avalos *p++ = '\v';
3073327e51cbSPeter Avalos break;
3074327e51cbSPeter Avalos
3075327e51cbSPeter Avalos /* \ and up to 3 octal digits */
3076327e51cbSPeter Avalos case '0':
3077327e51cbSPeter Avalos case '1':
3078327e51cbSPeter Avalos case '2':
3079327e51cbSPeter Avalos case '3':
3080327e51cbSPeter Avalos case '4':
3081327e51cbSPeter Avalos case '5':
3082327e51cbSPeter Avalos case '6':
3083327e51cbSPeter Avalos case '7':
3084327e51cbSPeter Avalos val = c - '0';
3085327e51cbSPeter Avalos c = *s++; /* try for 2 */
3086327e51cbSPeter Avalos if (c >= '0' && c <= '7') {
3087327e51cbSPeter Avalos val = (val << 3) | (c - '0');
3088327e51cbSPeter Avalos c = *s++; /* try for 3 */
3089327e51cbSPeter Avalos if (c >= '0' && c <= '7')
3090327e51cbSPeter Avalos val = (val << 3) | (c-'0');
3091327e51cbSPeter Avalos else
3092327e51cbSPeter Avalos --s;
3093327e51cbSPeter Avalos }
3094327e51cbSPeter Avalos else
3095327e51cbSPeter Avalos --s;
30966fca56fbSSascha Wildner *p++ = CAST(char, val);
3097327e51cbSPeter Avalos break;
3098327e51cbSPeter Avalos
3099327e51cbSPeter Avalos /* \x and up to 2 hex digits */
3100327e51cbSPeter Avalos case 'x':
3101327e51cbSPeter Avalos val = 'x'; /* Default if no digits */
3102327e51cbSPeter Avalos c = hextoint(*s++); /* Get next char */
3103327e51cbSPeter Avalos if (c >= 0) {
3104327e51cbSPeter Avalos val = c;
3105327e51cbSPeter Avalos c = hextoint(*s++);
3106327e51cbSPeter Avalos if (c >= 0)
3107327e51cbSPeter Avalos val = (val << 4) + c;
3108327e51cbSPeter Avalos else
3109327e51cbSPeter Avalos --s;
3110327e51cbSPeter Avalos } else
3111327e51cbSPeter Avalos --s;
31126fca56fbSSascha Wildner *p++ = CAST(char, val);
3113327e51cbSPeter Avalos break;
3114327e51cbSPeter Avalos }
3115327e51cbSPeter Avalos }
3116c30bd091SSascha Wildner --s;
3117327e51cbSPeter Avalos out:
3118327e51cbSPeter Avalos *p = '\0';
3119f72f8299SJan Lentfer m->vallen = CAST(unsigned char, (p - origp));
3120c990e5baSDaniel Fojt if (m->type == FILE_PSTRING) {
3121c990e5baSDaniel Fojt size_t l = file_pstring_length_size(ms, m);
3122c990e5baSDaniel Fojt if (l == FILE_BADSIZE)
3123c990e5baSDaniel Fojt return NULL;
3124c990e5baSDaniel Fojt m->vallen += CAST(unsigned char, l);
3125c990e5baSDaniel Fojt }
3126327e51cbSPeter Avalos return s;
3127327e51cbSPeter Avalos }
3128327e51cbSPeter Avalos
3129327e51cbSPeter Avalos
3130327e51cbSPeter Avalos /* Single hex char to int; -1 if not a hex char. */
3131327e51cbSPeter Avalos private int
hextoint(int c)3132327e51cbSPeter Avalos hextoint(int c)
3133327e51cbSPeter Avalos {
31346fca56fbSSascha Wildner if (!isascii(CAST(unsigned char, c)))
3135327e51cbSPeter Avalos return -1;
31366fca56fbSSascha Wildner if (isdigit(CAST(unsigned char, c)))
3137327e51cbSPeter Avalos return c - '0';
3138327e51cbSPeter Avalos if ((c >= 'a') && (c <= 'f'))
3139327e51cbSPeter Avalos return c + 10 - 'a';
3140327e51cbSPeter Avalos if (( c>= 'A') && (c <= 'F'))
3141327e51cbSPeter Avalos return c + 10 - 'A';
3142327e51cbSPeter Avalos return -1;
3143327e51cbSPeter Avalos }
3144327e51cbSPeter Avalos
3145327e51cbSPeter Avalos
3146327e51cbSPeter Avalos /*
3147327e51cbSPeter Avalos * Print a string containing C character escapes.
3148327e51cbSPeter Avalos */
3149327e51cbSPeter Avalos protected void
file_showstr(FILE * fp,const char * s,size_t len)3150327e51cbSPeter Avalos file_showstr(FILE *fp, const char *s, size_t len)
3151327e51cbSPeter Avalos {
3152327e51cbSPeter Avalos char c;
3153327e51cbSPeter Avalos
3154327e51cbSPeter Avalos for (;;) {
3155c990e5baSDaniel Fojt if (len == FILE_BADSIZE) {
3156f72f8299SJan Lentfer c = *s++;
3157327e51cbSPeter Avalos if (c == '\0')
3158327e51cbSPeter Avalos break;
3159327e51cbSPeter Avalos }
3160327e51cbSPeter Avalos else {
3161327e51cbSPeter Avalos if (len-- == 0)
3162327e51cbSPeter Avalos break;
3163f72f8299SJan Lentfer c = *s++;
3164327e51cbSPeter Avalos }
3165327e51cbSPeter Avalos if (c >= 040 && c <= 0176) /* TODO isprint && !iscntrl */
3166327e51cbSPeter Avalos (void) fputc(c, fp);
3167327e51cbSPeter Avalos else {
3168327e51cbSPeter Avalos (void) fputc('\\', fp);
3169327e51cbSPeter Avalos switch (c) {
3170327e51cbSPeter Avalos case '\a':
3171327e51cbSPeter Avalos (void) fputc('a', fp);
3172327e51cbSPeter Avalos break;
3173327e51cbSPeter Avalos
3174327e51cbSPeter Avalos case '\b':
3175327e51cbSPeter Avalos (void) fputc('b', fp);
3176327e51cbSPeter Avalos break;
3177327e51cbSPeter Avalos
3178327e51cbSPeter Avalos case '\f':
3179327e51cbSPeter Avalos (void) fputc('f', fp);
3180327e51cbSPeter Avalos break;
3181327e51cbSPeter Avalos
3182327e51cbSPeter Avalos case '\n':
3183327e51cbSPeter Avalos (void) fputc('n', fp);
3184327e51cbSPeter Avalos break;
3185327e51cbSPeter Avalos
3186327e51cbSPeter Avalos case '\r':
3187327e51cbSPeter Avalos (void) fputc('r', fp);
3188327e51cbSPeter Avalos break;
3189327e51cbSPeter Avalos
3190327e51cbSPeter Avalos case '\t':
3191327e51cbSPeter Avalos (void) fputc('t', fp);
3192327e51cbSPeter Avalos break;
3193327e51cbSPeter Avalos
3194327e51cbSPeter Avalos case '\v':
3195327e51cbSPeter Avalos (void) fputc('v', fp);
3196327e51cbSPeter Avalos break;
3197327e51cbSPeter Avalos
3198327e51cbSPeter Avalos default:
3199327e51cbSPeter Avalos (void) fprintf(fp, "%.3o", c & 0377);
3200327e51cbSPeter Avalos break;
3201327e51cbSPeter Avalos }
3202327e51cbSPeter Avalos }
3203327e51cbSPeter Avalos }
3204327e51cbSPeter Avalos }
3205327e51cbSPeter Avalos
3206327e51cbSPeter Avalos /*
3207327e51cbSPeter Avalos * eatsize(): Eat the size spec from a number [eg. 10UL]
3208327e51cbSPeter Avalos */
3209327e51cbSPeter Avalos private void
eatsize(const char ** p)3210327e51cbSPeter Avalos eatsize(const char **p)
3211327e51cbSPeter Avalos {
3212327e51cbSPeter Avalos const char *l = *p;
3213327e51cbSPeter Avalos
3214327e51cbSPeter Avalos if (LOWCASE(*l) == 'u')
3215327e51cbSPeter Avalos l++;
3216327e51cbSPeter Avalos
3217327e51cbSPeter Avalos switch (LOWCASE(*l)) {
3218327e51cbSPeter Avalos case 'l': /* long */
3219327e51cbSPeter Avalos case 's': /* short */
3220327e51cbSPeter Avalos case 'h': /* short */
3221327e51cbSPeter Avalos case 'b': /* char/byte */
3222327e51cbSPeter Avalos case 'c': /* char/byte */
3223327e51cbSPeter Avalos l++;
3224327e51cbSPeter Avalos /*FALLTHROUGH*/
3225327e51cbSPeter Avalos default:
3226327e51cbSPeter Avalos break;
3227327e51cbSPeter Avalos }
3228327e51cbSPeter Avalos
3229327e51cbSPeter Avalos *p = l;
3230327e51cbSPeter Avalos }
3231327e51cbSPeter Avalos
3232327e51cbSPeter Avalos /*
323382c5fa3eSPeter Avalos * handle a buffer containing a compiled file.
323482c5fa3eSPeter Avalos */
323582c5fa3eSPeter Avalos private struct magic_map *
apprentice_buf(struct magic_set * ms,struct magic * buf,size_t len)323682c5fa3eSPeter Avalos apprentice_buf(struct magic_set *ms, struct magic *buf, size_t len)
323782c5fa3eSPeter Avalos {
323882c5fa3eSPeter Avalos struct magic_map *map;
323982c5fa3eSPeter Avalos
324082c5fa3eSPeter Avalos if ((map = CAST(struct magic_map *, calloc(1, sizeof(*map)))) == NULL) {
324182c5fa3eSPeter Avalos file_oomem(ms, sizeof(*map));
324282c5fa3eSPeter Avalos return NULL;
324382c5fa3eSPeter Avalos }
324482c5fa3eSPeter Avalos map->len = len;
324582c5fa3eSPeter Avalos map->p = buf;
324682c5fa3eSPeter Avalos map->type = MAP_TYPE_USER;
324782c5fa3eSPeter Avalos if (check_buffer(ms, map, "buffer") != 0) {
324882c5fa3eSPeter Avalos apprentice_unmap(map);
324982c5fa3eSPeter Avalos return NULL;
325082c5fa3eSPeter Avalos }
325182c5fa3eSPeter Avalos return map;
325282c5fa3eSPeter Avalos }
325382c5fa3eSPeter Avalos
325482c5fa3eSPeter Avalos /*
3255327e51cbSPeter Avalos * handle a compiled file.
3256327e51cbSPeter Avalos */
3257e8af9738SPeter Avalos
3258e8af9738SPeter Avalos private struct magic_map *
apprentice_map(struct magic_set * ms,const char * fn)3259e8af9738SPeter Avalos apprentice_map(struct magic_set *ms, const char *fn)
3260327e51cbSPeter Avalos {
3261327e51cbSPeter Avalos int fd;
3262327e51cbSPeter Avalos struct stat st;
326379343712SPeter Avalos char *dbname = NULL;
3264e8af9738SPeter Avalos struct magic_map *map;
3265c30bd091SSascha Wildner struct magic_map *rv = NULL;
3266e8af9738SPeter Avalos
3267e8af9738SPeter Avalos fd = -1;
3268e8af9738SPeter Avalos if ((map = CAST(struct magic_map *, calloc(1, sizeof(*map)))) == NULL) {
3269e8af9738SPeter Avalos file_oomem(ms, sizeof(*map));
3270e8af9738SPeter Avalos goto error;
3271e8af9738SPeter Avalos }
3272c30bd091SSascha Wildner map->type = MAP_TYPE_USER; /* unspecified */
3273327e51cbSPeter Avalos
327479343712SPeter Avalos dbname = mkdbname(ms, fn, 0);
3275327e51cbSPeter Avalos if (dbname == NULL)
3276e8af9738SPeter Avalos goto error;
3277327e51cbSPeter Avalos
3278327e51cbSPeter Avalos if ((fd = open(dbname, O_RDONLY|O_BINARY)) == -1)
3279e8af9738SPeter Avalos goto error;
3280327e51cbSPeter Avalos
3281327e51cbSPeter Avalos if (fstat(fd, &st) == -1) {
3282327e51cbSPeter Avalos file_error(ms, errno, "cannot stat `%s'", dbname);
3283e8af9738SPeter Avalos goto error;
3284327e51cbSPeter Avalos }
32856fca56fbSSascha Wildner if (st.st_size < 8 || st.st_size > maxoff_t()) {
3286e8af9738SPeter Avalos file_error(ms, 0, "file `%s' is too %s", dbname,
3287e8af9738SPeter Avalos st.st_size < 8 ? "small" : "large");
3288e8af9738SPeter Avalos goto error;
3289327e51cbSPeter Avalos }
3290327e51cbSPeter Avalos
32916fca56fbSSascha Wildner map->len = CAST(size_t, st.st_size);
3292327e51cbSPeter Avalos #ifdef QUICK
3293c30bd091SSascha Wildner map->type = MAP_TYPE_MMAP;
32946fca56fbSSascha Wildner if ((map->p = mmap(0, CAST(size_t, st.st_size), PROT_READ|PROT_WRITE,
32956fca56fbSSascha Wildner MAP_PRIVATE|MAP_FILE, fd, CAST(off_t, 0))) == MAP_FAILED) {
3296327e51cbSPeter Avalos file_error(ms, errno, "cannot map `%s'", dbname);
3297e8af9738SPeter Avalos goto error;
3298327e51cbSPeter Avalos }
3299327e51cbSPeter Avalos #else
3300c30bd091SSascha Wildner map->type = MAP_TYPE_MALLOC;
3301e8af9738SPeter Avalos if ((map->p = CAST(void *, malloc(map->len))) == NULL) {
3302e8af9738SPeter Avalos file_oomem(ms, map->len);
3303e8af9738SPeter Avalos goto error;
3304327e51cbSPeter Avalos }
3305e8af9738SPeter Avalos if (read(fd, map->p, map->len) != (ssize_t)map->len) {
3306327e51cbSPeter Avalos file_badread(ms);
3307e8af9738SPeter Avalos goto error;
3308327e51cbSPeter Avalos }
3309327e51cbSPeter Avalos #endif
3310327e51cbSPeter Avalos (void)close(fd);
3311327e51cbSPeter Avalos fd = -1;
331282c5fa3eSPeter Avalos
3313c30bd091SSascha Wildner if (check_buffer(ms, map, dbname) != 0) {
331482c5fa3eSPeter Avalos goto error;
3315c30bd091SSascha Wildner }
3316c30bd091SSascha Wildner #ifdef QUICK
33176fca56fbSSascha Wildner if (mprotect(map->p, CAST(size_t, st.st_size), PROT_READ) == -1) {
3318c30bd091SSascha Wildner file_error(ms, errno, "cannot mprotect `%s'", dbname);
3319c30bd091SSascha Wildner goto error;
3320c30bd091SSascha Wildner }
3321c30bd091SSascha Wildner #endif
332282c5fa3eSPeter Avalos
332382c5fa3eSPeter Avalos free(dbname);
332482c5fa3eSPeter Avalos return map;
332582c5fa3eSPeter Avalos
332682c5fa3eSPeter Avalos error:
332782c5fa3eSPeter Avalos if (fd != -1)
332882c5fa3eSPeter Avalos (void)close(fd);
332982c5fa3eSPeter Avalos apprentice_unmap(map);
333082c5fa3eSPeter Avalos free(dbname);
3331c30bd091SSascha Wildner return rv;
333282c5fa3eSPeter Avalos }
333382c5fa3eSPeter Avalos
333482c5fa3eSPeter Avalos private int
check_buffer(struct magic_set * ms,struct magic_map * map,const char * dbname)333582c5fa3eSPeter Avalos check_buffer(struct magic_set *ms, struct magic_map *map, const char *dbname)
333682c5fa3eSPeter Avalos {
333782c5fa3eSPeter Avalos uint32_t *ptr;
333882c5fa3eSPeter Avalos uint32_t entries, nentries;
333982c5fa3eSPeter Avalos uint32_t version;
334082c5fa3eSPeter Avalos int i, needsbyteswap;
334182c5fa3eSPeter Avalos
3342e8af9738SPeter Avalos ptr = CAST(uint32_t *, map->p);
3343327e51cbSPeter Avalos if (*ptr != MAGICNO) {
3344327e51cbSPeter Avalos if (swap4(*ptr) != MAGICNO) {
334579343712SPeter Avalos file_error(ms, 0, "bad magic in `%s'", dbname);
334682c5fa3eSPeter Avalos return -1;
3347327e51cbSPeter Avalos }
3348327e51cbSPeter Avalos needsbyteswap = 1;
3349327e51cbSPeter Avalos } else
3350327e51cbSPeter Avalos needsbyteswap = 0;
3351327e51cbSPeter Avalos if (needsbyteswap)
3352327e51cbSPeter Avalos version = swap4(ptr[1]);
3353327e51cbSPeter Avalos else
3354327e51cbSPeter Avalos version = ptr[1];
3355327e51cbSPeter Avalos if (version != VERSIONNO) {
3356884044a5SPeter Avalos file_error(ms, 0, "File %s supports only version %d magic "
3357884044a5SPeter Avalos "files. `%s' is version %d", VERSION,
3358327e51cbSPeter Avalos VERSIONNO, dbname, version);
335982c5fa3eSPeter Avalos return -1;
3360327e51cbSPeter Avalos }
33616fca56fbSSascha Wildner entries = CAST(uint32_t, map->len / sizeof(struct magic));
336282c5fa3eSPeter Avalos if ((entries * sizeof(struct magic)) != map->len) {
336382c5fa3eSPeter Avalos file_error(ms, 0, "Size of `%s' %" SIZE_T_FORMAT "u is not "
336482c5fa3eSPeter Avalos "a multiple of %" SIZE_T_FORMAT "u",
336582c5fa3eSPeter Avalos dbname, map->len, sizeof(struct magic));
336682c5fa3eSPeter Avalos return -1;
3367e8af9738SPeter Avalos }
3368e8af9738SPeter Avalos map->magic[0] = CAST(struct magic *, map->p) + 1;
3369e8af9738SPeter Avalos nentries = 0;
3370e8af9738SPeter Avalos for (i = 0; i < MAGIC_SETS; i++) {
3371327e51cbSPeter Avalos if (needsbyteswap)
3372e8af9738SPeter Avalos map->nmagic[i] = swap4(ptr[i + 2]);
3373e8af9738SPeter Avalos else
3374e8af9738SPeter Avalos map->nmagic[i] = ptr[i + 2];
3375e8af9738SPeter Avalos if (i != MAGIC_SETS - 1)
3376e8af9738SPeter Avalos map->magic[i + 1] = map->magic[i] + map->nmagic[i];
3377e8af9738SPeter Avalos nentries += map->nmagic[i];
3378e8af9738SPeter Avalos }
3379e8af9738SPeter Avalos if (entries != nentries + 1) {
3380e8af9738SPeter Avalos file_error(ms, 0, "Inconsistent entries in `%s' %u != %u",
3381e8af9738SPeter Avalos dbname, entries, nentries + 1);
338282c5fa3eSPeter Avalos return -1;
3383e8af9738SPeter Avalos }
3384e8af9738SPeter Avalos if (needsbyteswap)
3385e8af9738SPeter Avalos for (i = 0; i < MAGIC_SETS; i++)
3386e8af9738SPeter Avalos byteswap(map->magic[i], map->nmagic[i]);
338782c5fa3eSPeter Avalos return 0;
3388327e51cbSPeter Avalos }
3389327e51cbSPeter Avalos
3390327e51cbSPeter Avalos /*
3391327e51cbSPeter Avalos * handle an mmaped file.
3392327e51cbSPeter Avalos */
3393327e51cbSPeter Avalos private int
apprentice_compile(struct magic_set * ms,struct magic_map * map,const char * fn)3394e8af9738SPeter Avalos apprentice_compile(struct magic_set *ms, struct magic_map *map, const char *fn)
3395327e51cbSPeter Avalos {
3396e8af9738SPeter Avalos static const size_t nm = sizeof(*map->nmagic) * MAGIC_SETS;
3397e8af9738SPeter Avalos static const size_t m = sizeof(**map->magic);
33989f86ab30SPeter Avalos int fd = -1;
3399e8af9738SPeter Avalos size_t len;
340079343712SPeter Avalos char *dbname;
340179343712SPeter Avalos int rv = -1;
3402e8af9738SPeter Avalos uint32_t i;
340382c5fa3eSPeter Avalos union {
340482c5fa3eSPeter Avalos struct magic m;
340582c5fa3eSPeter Avalos uint32_t h[2 + MAGIC_SETS];
340682c5fa3eSPeter Avalos } hdr;
340779343712SPeter Avalos
340879343712SPeter Avalos dbname = mkdbname(ms, fn, 1);
3409327e51cbSPeter Avalos
3410327e51cbSPeter Avalos if (dbname == NULL)
341179343712SPeter Avalos goto out;
3412327e51cbSPeter Avalos
3413e8af9738SPeter Avalos if ((fd = open(dbname, O_WRONLY|O_CREAT|O_TRUNC|O_BINARY, 0644)) == -1)
3414e8af9738SPeter Avalos {
3415327e51cbSPeter Avalos file_error(ms, errno, "cannot open `%s'", dbname);
341679343712SPeter Avalos goto out;
3417327e51cbSPeter Avalos }
341882c5fa3eSPeter Avalos memset(&hdr, 0, sizeof(hdr));
341982c5fa3eSPeter Avalos hdr.h[0] = MAGICNO;
342082c5fa3eSPeter Avalos hdr.h[1] = VERSIONNO;
342182c5fa3eSPeter Avalos memcpy(hdr.h + 2, map->nmagic, nm);
3422327e51cbSPeter Avalos
34236fca56fbSSascha Wildner if (write(fd, &hdr, sizeof(hdr)) != CAST(ssize_t, sizeof(hdr))) {
3424327e51cbSPeter Avalos file_error(ms, errno, "error writing `%s'", dbname);
34256fca56fbSSascha Wildner goto out2;
3426327e51cbSPeter Avalos }
3427327e51cbSPeter Avalos
3428e8af9738SPeter Avalos for (i = 0; i < MAGIC_SETS; i++) {
3429e8af9738SPeter Avalos len = m * map->nmagic[i];
34306fca56fbSSascha Wildner if (write(fd, map->magic[i], len) != CAST(ssize_t, len)) {
3431327e51cbSPeter Avalos file_error(ms, errno, "error writing `%s'", dbname);
34326fca56fbSSascha Wildner goto out2;
3433327e51cbSPeter Avalos }
3434e8af9738SPeter Avalos }
3435327e51cbSPeter Avalos
34366fca56fbSSascha Wildner rv = 0;
34376fca56fbSSascha Wildner out2:
34389f86ab30SPeter Avalos if (fd != -1)
3439327e51cbSPeter Avalos (void)close(fd);
344079343712SPeter Avalos out:
3441c30bd091SSascha Wildner apprentice_unmap(map);
344279343712SPeter Avalos free(dbname);
344379343712SPeter Avalos return rv;
3444327e51cbSPeter Avalos }
3445327e51cbSPeter Avalos
3446327e51cbSPeter Avalos private const char ext[] = ".mgc";
3447327e51cbSPeter Avalos /*
3448327e51cbSPeter Avalos * make a dbname
3449327e51cbSPeter Avalos */
3450327e51cbSPeter Avalos private char *
mkdbname(struct magic_set * ms,const char * fn,int strip)345179343712SPeter Avalos mkdbname(struct magic_set *ms, const char *fn, int strip)
3452327e51cbSPeter Avalos {
345379343712SPeter Avalos const char *p, *q;
345479343712SPeter Avalos char *buf;
345579343712SPeter Avalos
3456327e51cbSPeter Avalos if (strip) {
3457327e51cbSPeter Avalos if ((p = strrchr(fn, '/')) != NULL)
3458327e51cbSPeter Avalos fn = ++p;
3459327e51cbSPeter Avalos }
3460327e51cbSPeter Avalos
346179343712SPeter Avalos for (q = fn; *q; q++)
346279343712SPeter Avalos continue;
346379343712SPeter Avalos /* Look for .mgc */
346479343712SPeter Avalos for (p = ext + sizeof(ext) - 1; p >= ext && q >= fn; p--, q--)
346579343712SPeter Avalos if (*p != *q)
346679343712SPeter Avalos break;
346779343712SPeter Avalos
346879343712SPeter Avalos /* Did not find .mgc, restore q */
346979343712SPeter Avalos if (p >= ext)
347079343712SPeter Avalos while (*q)
347179343712SPeter Avalos q++;
347279343712SPeter Avalos
347379343712SPeter Avalos q++;
347479343712SPeter Avalos /* Compatibility with old code that looked in .mime */
347579343712SPeter Avalos if (ms->flags & MAGIC_MIME) {
34766fca56fbSSascha Wildner if (asprintf(&buf, "%.*s.mime%s", CAST(int, q - fn), fn, ext)
34776fca56fbSSascha Wildner < 0)
3478e8af9738SPeter Avalos return NULL;
347979343712SPeter Avalos if (access(buf, R_OK) != -1) {
348079343712SPeter Avalos ms->flags &= MAGIC_MIME_TYPE;
348179343712SPeter Avalos return buf;
348279343712SPeter Avalos }
348379343712SPeter Avalos free(buf);
348479343712SPeter Avalos }
34856fca56fbSSascha Wildner if (asprintf(&buf, "%.*s%s", CAST(int, q - fn), fn, ext) < 0)
3486e8af9738SPeter Avalos return NULL;
348779343712SPeter Avalos
348879343712SPeter Avalos /* Compatibility with old code that looked in .mime */
3489c30bd091SSascha Wildner if (strstr(fn, ".mime") != NULL)
349079343712SPeter Avalos ms->flags &= MAGIC_MIME_TYPE;
3491327e51cbSPeter Avalos return buf;
3492327e51cbSPeter Avalos }
3493327e51cbSPeter Avalos
3494327e51cbSPeter Avalos /*
3495327e51cbSPeter Avalos * Byteswap an mmap'ed file if needed
3496327e51cbSPeter Avalos */
3497327e51cbSPeter Avalos private void
byteswap(struct magic * magic,uint32_t nmagic)3498327e51cbSPeter Avalos byteswap(struct magic *magic, uint32_t nmagic)
3499327e51cbSPeter Avalos {
3500327e51cbSPeter Avalos uint32_t i;
3501327e51cbSPeter Avalos for (i = 0; i < nmagic; i++)
3502327e51cbSPeter Avalos bs1(&magic[i]);
3503327e51cbSPeter Avalos }
3504327e51cbSPeter Avalos
3505*3b9cdfa3SAntonio Huete Jimenez #if !defined(HAVE_BYTESWAP_H) && !defined(HAVE_SYS_BSWAP_H)
3506327e51cbSPeter Avalos /*
3507327e51cbSPeter Avalos * swap a short
3508327e51cbSPeter Avalos */
3509327e51cbSPeter Avalos private uint16_t
swap2(uint16_t sv)3510327e51cbSPeter Avalos swap2(uint16_t sv)
3511327e51cbSPeter Avalos {
3512327e51cbSPeter Avalos uint16_t rv;
35136fca56fbSSascha Wildner uint8_t *s = RCAST(uint8_t *, RCAST(void *, &sv));
35146fca56fbSSascha Wildner uint8_t *d = RCAST(uint8_t *, RCAST(void *, &rv));
3515327e51cbSPeter Avalos d[0] = s[1];
3516327e51cbSPeter Avalos d[1] = s[0];
3517327e51cbSPeter Avalos return rv;
3518327e51cbSPeter Avalos }
3519327e51cbSPeter Avalos
3520327e51cbSPeter Avalos /*
3521327e51cbSPeter Avalos * swap an int
3522327e51cbSPeter Avalos */
3523327e51cbSPeter Avalos private uint32_t
swap4(uint32_t sv)3524327e51cbSPeter Avalos swap4(uint32_t sv)
3525327e51cbSPeter Avalos {
3526327e51cbSPeter Avalos uint32_t rv;
35276fca56fbSSascha Wildner uint8_t *s = RCAST(uint8_t *, RCAST(void *, &sv));
35286fca56fbSSascha Wildner uint8_t *d = RCAST(uint8_t *, RCAST(void *, &rv));
3529327e51cbSPeter Avalos d[0] = s[3];
3530327e51cbSPeter Avalos d[1] = s[2];
3531327e51cbSPeter Avalos d[2] = s[1];
3532327e51cbSPeter Avalos d[3] = s[0];
3533327e51cbSPeter Avalos return rv;
3534327e51cbSPeter Avalos }
3535327e51cbSPeter Avalos
3536327e51cbSPeter Avalos /*
3537327e51cbSPeter Avalos * swap a quad
3538327e51cbSPeter Avalos */
3539327e51cbSPeter Avalos private uint64_t
swap8(uint64_t sv)3540327e51cbSPeter Avalos swap8(uint64_t sv)
3541327e51cbSPeter Avalos {
354279343712SPeter Avalos uint64_t rv;
35436fca56fbSSascha Wildner uint8_t *s = RCAST(uint8_t *, RCAST(void *, &sv));
35446fca56fbSSascha Wildner uint8_t *d = RCAST(uint8_t *, RCAST(void *, &rv));
354579343712SPeter Avalos # if 0
3546327e51cbSPeter Avalos d[0] = s[3];
3547327e51cbSPeter Avalos d[1] = s[2];
3548327e51cbSPeter Avalos d[2] = s[1];
3549327e51cbSPeter Avalos d[3] = s[0];
3550327e51cbSPeter Avalos d[4] = s[7];
3551327e51cbSPeter Avalos d[5] = s[6];
3552327e51cbSPeter Avalos d[6] = s[5];
3553327e51cbSPeter Avalos d[7] = s[4];
355479343712SPeter Avalos # else
355579343712SPeter Avalos d[0] = s[7];
355679343712SPeter Avalos d[1] = s[6];
355779343712SPeter Avalos d[2] = s[5];
355879343712SPeter Avalos d[3] = s[4];
355979343712SPeter Avalos d[4] = s[3];
356079343712SPeter Avalos d[5] = s[2];
356179343712SPeter Avalos d[6] = s[1];
356279343712SPeter Avalos d[7] = s[0];
356379343712SPeter Avalos # endif
3564327e51cbSPeter Avalos return rv;
3565327e51cbSPeter Avalos }
3566*3b9cdfa3SAntonio Huete Jimenez #endif
3567327e51cbSPeter Avalos
3568614728caSSascha Wildner protected uintmax_t
file_varint2uintmax_t(const unsigned char * us,int t,size_t * l)3569614728caSSascha Wildner file_varint2uintmax_t(const unsigned char *us, int t, size_t *l)
3570614728caSSascha Wildner {
3571614728caSSascha Wildner uintmax_t x = 0;
3572614728caSSascha Wildner const unsigned char *c;
3573614728caSSascha Wildner if (t == FILE_LEVARINT) {
3574614728caSSascha Wildner for (c = us; *c; c++) {
3575614728caSSascha Wildner if ((*c & 0x80) == 0)
3576614728caSSascha Wildner break;
3577614728caSSascha Wildner }
3578614728caSSascha Wildner if (l)
3579614728caSSascha Wildner *l = c - us + 1;
3580614728caSSascha Wildner for (; c >= us; c--) {
3581614728caSSascha Wildner x |= *c & 0x7f;
3582614728caSSascha Wildner x <<= 7;
3583614728caSSascha Wildner }
3584614728caSSascha Wildner } else {
3585614728caSSascha Wildner for (c = us; *c; c++) {
3586614728caSSascha Wildner x |= *c & 0x7f;
3587614728caSSascha Wildner if ((*c & 0x80) == 0)
3588614728caSSascha Wildner break;
3589614728caSSascha Wildner x <<= 7;
3590614728caSSascha Wildner }
3591614728caSSascha Wildner if (l)
3592614728caSSascha Wildner *l = c - us + 1;
3593614728caSSascha Wildner }
3594614728caSSascha Wildner return x;
3595614728caSSascha Wildner }
3596614728caSSascha Wildner
3597614728caSSascha Wildner
3598327e51cbSPeter Avalos /*
3599327e51cbSPeter Avalos * byteswap a single magic entry
3600327e51cbSPeter Avalos */
3601327e51cbSPeter Avalos private void
bs1(struct magic * m)3602327e51cbSPeter Avalos bs1(struct magic *m)
3603327e51cbSPeter Avalos {
3604327e51cbSPeter Avalos m->cont_level = swap2(m->cont_level);
36056fca56fbSSascha Wildner m->offset = swap4(CAST(uint32_t, m->offset));
36066fca56fbSSascha Wildner m->in_offset = swap4(CAST(uint32_t, m->in_offset));
36076fca56fbSSascha Wildner m->lineno = swap4(CAST(uint32_t, m->lineno));
3608327e51cbSPeter Avalos if (IS_STRING(m->type)) {
360979343712SPeter Avalos m->str_range = swap4(m->str_range);
3610327e51cbSPeter Avalos m->str_flags = swap4(m->str_flags);
3611327e51cbSPeter Avalos }
3612327e51cbSPeter Avalos else {
3613327e51cbSPeter Avalos m->value.q = swap8(m->value.q);
3614327e51cbSPeter Avalos m->num_mask = swap8(m->num_mask);
3615327e51cbSPeter Avalos }
3616327e51cbSPeter Avalos }
3617e4d4ce0cSPeter Avalos
3618e4d4ce0cSPeter Avalos protected size_t
file_pstring_length_size(struct magic_set * ms,const struct magic * m)3619c990e5baSDaniel Fojt file_pstring_length_size(struct magic_set *ms, const struct magic *m)
3620e4d4ce0cSPeter Avalos {
3621e4d4ce0cSPeter Avalos switch (m->str_flags & PSTRING_LEN) {
3622e4d4ce0cSPeter Avalos case PSTRING_1_LE:
3623e4d4ce0cSPeter Avalos return 1;
3624e4d4ce0cSPeter Avalos case PSTRING_2_LE:
3625e4d4ce0cSPeter Avalos case PSTRING_2_BE:
3626e4d4ce0cSPeter Avalos return 2;
3627e4d4ce0cSPeter Avalos case PSTRING_4_LE:
3628e4d4ce0cSPeter Avalos case PSTRING_4_BE:
3629e4d4ce0cSPeter Avalos return 4;
3630e4d4ce0cSPeter Avalos default:
3631c990e5baSDaniel Fojt file_error(ms, 0, "corrupt magic file "
3632c990e5baSDaniel Fojt "(bad pascal string length %d)",
3633c990e5baSDaniel Fojt m->str_flags & PSTRING_LEN);
3634c990e5baSDaniel Fojt return FILE_BADSIZE;
3635e4d4ce0cSPeter Avalos }
3636e4d4ce0cSPeter Avalos }
3637e4d4ce0cSPeter Avalos protected size_t
file_pstring_get_length(struct magic_set * ms,const struct magic * m,const char * ss)3638c990e5baSDaniel Fojt file_pstring_get_length(struct magic_set *ms, const struct magic *m,
3639c990e5baSDaniel Fojt const char *ss)
3640e4d4ce0cSPeter Avalos {
3641e4d4ce0cSPeter Avalos size_t len = 0;
36426fca56fbSSascha Wildner const unsigned char *s = RCAST(const unsigned char *, ss);
3643c30bd091SSascha Wildner unsigned int s3, s2, s1, s0;
3644e4d4ce0cSPeter Avalos
3645e4d4ce0cSPeter Avalos switch (m->str_flags & PSTRING_LEN) {
3646e4d4ce0cSPeter Avalos case PSTRING_1_LE:
3647e4d4ce0cSPeter Avalos len = *s;
3648e4d4ce0cSPeter Avalos break;
3649e4d4ce0cSPeter Avalos case PSTRING_2_LE:
3650c30bd091SSascha Wildner s0 = s[0];
3651c30bd091SSascha Wildner s1 = s[1];
3652c30bd091SSascha Wildner len = (s1 << 8) | s0;
3653e4d4ce0cSPeter Avalos break;
3654e4d4ce0cSPeter Avalos case PSTRING_2_BE:
3655c30bd091SSascha Wildner s0 = s[0];
3656c30bd091SSascha Wildner s1 = s[1];
3657c30bd091SSascha Wildner len = (s0 << 8) | s1;
3658e4d4ce0cSPeter Avalos break;
3659e4d4ce0cSPeter Avalos case PSTRING_4_LE:
3660c30bd091SSascha Wildner s0 = s[0];
3661c30bd091SSascha Wildner s1 = s[1];
3662c30bd091SSascha Wildner s2 = s[2];
3663c30bd091SSascha Wildner s3 = s[3];
3664c30bd091SSascha Wildner len = (s3 << 24) | (s2 << 16) | (s1 << 8) | s0;
3665e4d4ce0cSPeter Avalos break;
3666e4d4ce0cSPeter Avalos case PSTRING_4_BE:
3667c30bd091SSascha Wildner s0 = s[0];
3668c30bd091SSascha Wildner s1 = s[1];
3669c30bd091SSascha Wildner s2 = s[2];
3670c30bd091SSascha Wildner s3 = s[3];
3671c30bd091SSascha Wildner len = (s0 << 24) | (s1 << 16) | (s2 << 8) | s3;
3672e4d4ce0cSPeter Avalos break;
3673e4d4ce0cSPeter Avalos default:
3674c990e5baSDaniel Fojt file_error(ms, 0, "corrupt magic file "
3675c990e5baSDaniel Fojt "(bad pascal string length %d)",
3676c990e5baSDaniel Fojt m->str_flags & PSTRING_LEN);
3677c990e5baSDaniel Fojt return FILE_BADSIZE;
3678e4d4ce0cSPeter Avalos }
3679e4d4ce0cSPeter Avalos
3680c990e5baSDaniel Fojt if (m->str_flags & PSTRING_LENGTH_INCLUDES_ITSELF) {
3681c990e5baSDaniel Fojt size_t l = file_pstring_length_size(ms, m);
3682c990e5baSDaniel Fojt if (l == FILE_BADSIZE)
3683c990e5baSDaniel Fojt return l;
3684c990e5baSDaniel Fojt len -= l;
3685c990e5baSDaniel Fojt }
3686e4d4ce0cSPeter Avalos
3687e4d4ce0cSPeter Avalos return len;
3688e4d4ce0cSPeter Avalos }
3689e8af9738SPeter Avalos
3690e8af9738SPeter Avalos protected int
file_magicfind(struct magic_set * ms,const char * name,struct mlist * v)3691e8af9738SPeter Avalos file_magicfind(struct magic_set *ms, const char *name, struct mlist *v)
3692e8af9738SPeter Avalos {
3693e8af9738SPeter Avalos uint32_t i, j;
3694e8af9738SPeter Avalos struct mlist *mlist, *ml;
3695e8af9738SPeter Avalos
3696e8af9738SPeter Avalos mlist = ms->mlist[1];
3697e8af9738SPeter Avalos
3698e8af9738SPeter Avalos for (ml = mlist->next; ml != mlist; ml = ml->next) {
3699e8af9738SPeter Avalos struct magic *ma = ml->magic;
3700*3b9cdfa3SAntonio Huete Jimenez for (i = 0; i < ml->nmagic; i++) {
3701e8af9738SPeter Avalos if (ma[i].type != FILE_NAME)
3702e8af9738SPeter Avalos continue;
3703e8af9738SPeter Avalos if (strcmp(ma[i].value.s, name) == 0) {
3704e8af9738SPeter Avalos v->magic = &ma[i];
3705*3b9cdfa3SAntonio Huete Jimenez v->magic_rxcomp = &(ml->magic_rxcomp[i]);
3706*3b9cdfa3SAntonio Huete Jimenez for (j = i + 1; j < ml->nmagic; j++)
3707e8af9738SPeter Avalos if (ma[j].cont_level == 0)
3708e8af9738SPeter Avalos break;
3709e8af9738SPeter Avalos v->nmagic = j - i;
3710e8af9738SPeter Avalos return 0;
3711e8af9738SPeter Avalos }
3712e8af9738SPeter Avalos }
3713e8af9738SPeter Avalos }
3714e8af9738SPeter Avalos return -1;
3715e8af9738SPeter Avalos }
3716