xref: /minix3/external/bsd/file/dist/src/readcdf.c (revision 0b98e8aad89f2bd4ba80b523d73cf29e9dd82ce1)
1 /*	$NetBSD: readcdf.c,v 1.8 2013/01/03 23:05:38 christos Exp $	*/
2 
3 /*-
4  * Copyright (c) 2008 Christos Zoulas
5  * All rights reserved.
6  *
7  * Redistribution and use in source and binary forms, with or without
8  * modification, are permitted provided that the following conditions
9  * are met:
10  * 1. Redistributions of source code must retain the above copyright
11  *    notice, this list of conditions and the following disclaimer.
12  * 2. Redistributions in binary form must reproduce the above copyright
13  *    notice, this list of conditions and the following disclaimer in the
14  *    documentation and/or other materials provided with the distribution.
15  *
16  * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
17  * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
18  * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
19  * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
20  * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
21  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
22  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
23  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
24  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
25  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
26  * POSSIBILITY OF SUCH DAMAGE.
27  */
28 #include "file.h"
29 
30 #ifndef lint
31 #if 0
32 FILE_RCSID("@(#)$File: readcdf.c,v 1.33 2012/06/20 21:52:36 christos Exp $")
33 #else
34 __RCSID("$NetBSD: readcdf.c,v 1.8 2013/01/03 23:05:38 christos Exp $");
35 #endif
36 #endif
37 
38 #include <stdlib.h>
39 #include <unistd.h>
40 #include <string.h>
41 #include <time.h>
42 #include <ctype.h>
43 
44 #include "cdf.h"
45 #include "magic.h"
46 
47 #ifndef __arraycount
48 #define __arraycount(a) (sizeof(a) / sizeof(a[0]))
49 #endif
50 
51 #define NOTMIME(ms) (((ms)->flags & MAGIC_MIME) == 0)
52 
53 private int
54 cdf_file_property_info(struct magic_set *ms, const cdf_property_info_t *info,
55     size_t count)
56 {
57         size_t i;
58         cdf_timestamp_t tp;
59         struct timespec ts;
60         char buf[64];
61         const char *str = NULL;
62         const char *s;
63         int len;
64 
65         for (i = 0; i < count; i++) {
66                 cdf_print_property_name(buf, sizeof(buf), info[i].pi_id);
67                 switch (info[i].pi_type) {
68                 case CDF_NULL:
69                         break;
70                 case CDF_SIGNED16:
71                         if (NOTMIME(ms) && file_printf(ms, ", %s: %hd", buf,
72                             info[i].pi_s16) == -1)
73                                 return -1;
74                         break;
75                 case CDF_SIGNED32:
76                         if (NOTMIME(ms) && file_printf(ms, ", %s: %d", buf,
77                             info[i].pi_s32) == -1)
78                                 return -1;
79                         break;
80                 case CDF_UNSIGNED32:
81                         if (NOTMIME(ms) && file_printf(ms, ", %s: %u", buf,
82                             info[i].pi_u32) == -1)
83                                 return -1;
84                         break;
85                 case CDF_FLOAT:
86                         if (NOTMIME(ms) && file_printf(ms, ", %s: %g", buf,
87                             info[i].pi_f) == -1)
88                                 return -1;
89                         break;
90                 case CDF_DOUBLE:
91                         if (NOTMIME(ms) && file_printf(ms, ", %s: %g", buf,
92                             info[i].pi_d) == -1)
93                                 return -1;
94                         break;
95                 case CDF_LENGTH32_STRING:
96                 case CDF_LENGTH32_WSTRING:
97                         len = info[i].pi_str.s_len;
98                         if (len > 1) {
99                                 char vbuf[1024];
100                                 size_t j, k = 1;
101 
102                                 if (info[i].pi_type == CDF_LENGTH32_WSTRING)
103                                     k++;
104                                 s = info[i].pi_str.s_buf;
105                                 for (j = 0; j < sizeof(vbuf) && len--;
106                                     j++, s += k) {
107                                         if (*s == '\0')
108                                                 break;
109                                         if (isprint((unsigned char)*s))
110                                                 vbuf[j] = *s;
111                                 }
112                                 if (j == sizeof(vbuf))
113                                         --j;
114                                 vbuf[j] = '\0';
115                                 if (NOTMIME(ms)) {
116                                         if (vbuf[0]) {
117                                                 if (file_printf(ms, ", %s: %s",
118                                                     buf, vbuf) == -1)
119                                                         return -1;
120                                         }
121                                 } else if (info[i].pi_id ==
122                                         CDF_PROPERTY_NAME_OF_APPLICATION) {
123                                         if (strstr(vbuf, "Word"))
124                                                 str = "msword";
125                                         else if (strstr(vbuf, "Excel"))
126                                                 str = "vnd.ms-excel";
127                                         else if (strstr(vbuf, "Powerpoint"))
128                                                 str = "vnd.ms-powerpoint";
129                                         else if (strstr(vbuf,
130                                             "Crystal Reports"))
131                                                 str = "x-rpt";
132                                 }
133                         }
134                         break;
135                 case CDF_FILETIME:
136                         tp = info[i].pi_tp;
137                         if (tp != 0) {
138 				char tbuf[64];
139                                 if (tp < 1000000000000000LL) {
140                                         cdf_print_elapsed_time(tbuf,
141                                             sizeof(tbuf), tp);
142                                         if (NOTMIME(ms) && file_printf(ms,
143                                             ", %s: %s", buf, tbuf) == -1)
144                                                 return -1;
145                                 } else {
146                                         char *c, *ec;
147                                         cdf_timestamp_to_timespec(&ts, tp);
148                                         c = cdf_ctime(&ts.tv_sec, tbuf);
149                                         if ((ec = strchr(c, '\n')) != NULL)
150                                                 *ec = '\0';
151 
152                                         if (NOTMIME(ms) && file_printf(ms,
153                                             ", %s: %s", buf, c) == -1)
154                                                 return -1;
155                                 }
156                         }
157                         break;
158                 case CDF_CLIPBOARD:
159                         break;
160                 default:
161                         return -1;
162                 }
163         }
164         if (!NOTMIME(ms)) {
165 		if (str == NULL)
166 			return 0;
167                 if (file_printf(ms, "application/%s", str) == -1)
168                         return -1;
169         }
170         return 1;
171 }
172 
173 private int
174 cdf_file_summary_info(struct magic_set *ms, const cdf_header_t *h,
175     const cdf_stream_t *sst)
176 {
177         cdf_summary_info_header_t si;
178         cdf_property_info_t *info;
179         size_t count;
180         int m;
181 
182         if (cdf_unpack_summary_info(sst, h, &si, &info, &count) == -1)
183                 return -1;
184 
185         if (NOTMIME(ms)) {
186                 if (file_printf(ms, "Composite Document File V2 Document")
187 		    == -1)
188                         return -1;
189 
190                 if (file_printf(ms, ", %s Endian",
191                     si.si_byte_order == 0xfffe ?  "Little" : "Big") == -1)
192                         return -2;
193                 switch (si.si_os) {
194                 case 2:
195                         if (file_printf(ms, ", Os: Windows, Version %d.%d",
196                             si.si_os_version & 0xff,
197                             (uint32_t)si.si_os_version >> 8) == -1)
198                                 return -2;
199                         break;
200                 case 1:
201                         if (file_printf(ms, ", Os: MacOS, Version %d.%d",
202                             (uint32_t)si.si_os_version >> 8,
203                             si.si_os_version & 0xff) == -1)
204                                 return -2;
205                         break;
206                 default:
207                         if (file_printf(ms, ", Os %d, Version: %d.%d", si.si_os,
208                             si.si_os_version & 0xff,
209                             (uint32_t)si.si_os_version >> 8) == -1)
210                                 return -2;
211                         break;
212                 }
213         }
214 
215         m = cdf_file_property_info(ms, info, count);
216         free(info);
217 
218         return m == -1 ? -2 : m;
219 }
220 
221 protected int
222 file_trycdf(struct magic_set *ms, int fd, const unsigned char *buf,
223     size_t nbytes)
224 {
225         cdf_info_t info;
226         cdf_header_t h;
227         cdf_sat_t sat, ssat;
228         cdf_stream_t sst, scn;
229         cdf_dir_t dir;
230         int i;
231         const char *expn = "";
232         const char *corrupt = "corrupt: ";
233 
234         info.i_fd = fd;
235         info.i_buf = buf;
236         info.i_len = nbytes;
237         if (ms->flags & MAGIC_APPLE)
238                 return 0;
239         if (cdf_read_header(&info, &h) == -1)
240                 return 0;
241 #ifdef CDF_DEBUG
242         cdf_dump_header(&h);
243 #endif
244 
245         if ((i = cdf_read_sat(&info, &h, &sat)) == -1) {
246                 expn = "Can't read SAT";
247                 goto out0;
248         }
249 #ifdef CDF_DEBUG
250         cdf_dump_sat("SAT", &sat, CDF_SEC_SIZE(&h));
251 #endif
252 
253         if ((i = cdf_read_ssat(&info, &h, &sat, &ssat)) == -1) {
254                 expn = "Can't read SSAT";
255                 goto out1;
256         }
257 #ifdef CDF_DEBUG
258         cdf_dump_sat("SSAT", &ssat, CDF_SHORT_SEC_SIZE(&h));
259 #endif
260 
261         if ((i = cdf_read_dir(&info, &h, &sat, &dir)) == -1) {
262                 expn = "Can't read directory";
263                 goto out2;
264         }
265 
266         if ((i = cdf_read_short_stream(&info, &h, &sat, &dir, &sst)) == -1) {
267                 expn = "Cannot read short stream";
268                 goto out3;
269         }
270 #ifdef CDF_DEBUG
271         cdf_dump_dir(&info, &h, &sat, &ssat, &sst, &dir);
272 #endif
273 
274         if ((i = cdf_read_summary_info(&info, &h, &sat, &ssat, &sst, &dir,
275             &scn)) == -1) {
276                 if (errno == ESRCH) {
277                         corrupt = expn;
278                         expn = "No summary info";
279                 } else {
280                         expn = "Cannot read summary info";
281                 }
282                 goto out4;
283         }
284 #ifdef CDF_DEBUG
285         cdf_dump_summary_info(&h, &scn);
286 #endif
287         if ((i = cdf_file_summary_info(ms, &h, &scn)) < 0)
288                 expn = "Can't expand summary_info";
289 	if (i == 0) {
290 		const char *str = "vnd.ms-office";
291 		cdf_directory_t *d;
292 		char name[__arraycount(d->d_name)];
293 		size_t j, k;
294 		for (j = 0; j < dir.dir_len; j++) {
295 		    d = &dir.dir_tab[j];
296 		    for (k = 0; k < sizeof(name); k++)
297 			name[k] = (char)cdf_tole2(d->d_name[k]);
298 		    if (strstr(name, "WordDocument") != 0) {
299 			str = "msword";
300 			break;
301 		    }
302 		    if (strstr(name, "PowerPoint") != 0) {
303 			str = "vnd.ms-powerpoint";
304 			break;
305 		    }
306 		}
307                 if (file_printf(ms, "application/%s", str) == -1)
308                         return -1;
309 		i = 1;
310 	}
311         free(scn.sst_tab);
312 out4:
313         free(sst.sst_tab);
314 out3:
315         free(dir.dir_tab);
316 out2:
317         free(ssat.sat_tab);
318 out1:
319         free(sat.sat_tab);
320 out0:
321         if (i != 1) {
322 		if (i == -1) {
323 		    if (NOTMIME(ms)) {
324 			if (file_printf(ms,
325 			    "Composite Document File V2 Document") == -1)
326 			    return -1;
327 			if (*expn)
328 			    if (file_printf(ms, ", %s%s", corrupt, expn) == -1)
329 				return -1;
330 		    } else {
331 			if (file_printf(ms, "application/CDFV2-corrupt") == -1)
332 			    return -1;
333 		    }
334 		}
335                 i = 1;
336         }
337         return i;
338 }
339