readcdf.c revision 256281
1/*-
2 * Copyright (c) 2008 Christos Zoulas
3 * All rights reserved.
4 *
5 * Redistribution and use in source and binary forms, with or without
6 * modification, are permitted provided that the following conditions
7 * are met:
8 * 1. Redistributions of source code must retain the above copyright
9 *    notice, this list of conditions and the following disclaimer.
10 * 2. Redistributions in binary form must reproduce the above copyright
11 *    notice, this list of conditions and the following disclaimer in the
12 *    documentation and/or other materials provided with the distribution.
13 *
14 * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
15 * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
16 * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
17 * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
18 * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
19 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
20 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
21 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
22 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
23 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
24 * POSSIBILITY OF SUCH DAMAGE.
25 */
26#include "file.h"
27
28#ifndef lint
29FILE_RCSID("@(#)$File: readcdf.c,v 1.29 2012/02/20 20:04:58 christos Exp $")
30#endif
31
32#include <stdlib.h>
33#include <unistd.h>
34#include <string.h>
35#include <time.h>
36#include <ctype.h>
37
38#include "cdf.h"
39#include "magic.h"
40
/* True when none of the MAGIC_MIME bits are set in the magic_set's flags. */
#define NOTMIME(ms) (!((ms)->flags & MAGIC_MIME))
42
43private int
44cdf_file_property_info(struct magic_set *ms, const cdf_property_info_t *info,
45    size_t count)
46{
47        size_t i;
48        cdf_timestamp_t tp;
49        struct timespec ts;
50        char buf[64];
51        const char *str = NULL;
52        const char *s;
53        int len;
54
55        for (i = 0; i < count; i++) {
56                cdf_print_property_name(buf, sizeof(buf), info[i].pi_id);
57                switch (info[i].pi_type) {
58                case CDF_NULL:
59                        break;
60                case CDF_SIGNED16:
61                        if (NOTMIME(ms) && file_printf(ms, ", %s: %hd", buf,
62                            info[i].pi_s16) == -1)
63                                return -1;
64                        break;
65                case CDF_SIGNED32:
66                        if (NOTMIME(ms) && file_printf(ms, ", %s: %d", buf,
67                            info[i].pi_s32) == -1)
68                                return -1;
69                        break;
70                case CDF_UNSIGNED32:
71                        if (NOTMIME(ms) && file_printf(ms, ", %s: %u", buf,
72                            info[i].pi_u32) == -1)
73                                return -1;
74                        break;
75                case CDF_FLOAT:
76                        if (NOTMIME(ms) && file_printf(ms, ", %s: %g", buf,
77                            info[i].pi_f) == -1)
78                                return -1;
79                        break;
80                case CDF_DOUBLE:
81                        if (NOTMIME(ms) && file_printf(ms, ", %s: %g", buf,
82                            info[i].pi_d) == -1)
83                                return -1;
84                        break;
85                case CDF_LENGTH32_STRING:
86                case CDF_LENGTH32_WSTRING:
87                        len = info[i].pi_str.s_len;
88                        if (len > 1) {
89                                char vbuf[1024];
90                                size_t j, k = 1;
91
92                                if (info[i].pi_type == CDF_LENGTH32_WSTRING)
93                                    k++;
94                                s = info[i].pi_str.s_buf;
95                                for (j = 0; j < sizeof(vbuf) && len--;
96                                    j++, s += k) {
97                                        if (*s == '\0')
98                                                break;
99                                        if (isprint((unsigned char)*s))
100                                                vbuf[j] = *s;
101                                }
102                                if (j == sizeof(vbuf))
103                                        --j;
104                                vbuf[j] = '\0';
105                                if (NOTMIME(ms)) {
106                                        if (vbuf[0]) {
107                                                if (file_printf(ms, ", %s: %s",
108                                                    buf, vbuf) == -1)
109                                                        return -1;
110                                        }
111                                } else if (info[i].pi_id ==
112                                        CDF_PROPERTY_NAME_OF_APPLICATION) {
113                                        if (strstr(vbuf, "Word"))
114                                                str = "msword";
115                                        else if (strstr(vbuf, "Excel"))
116                                                str = "vnd.ms-excel";
117                                        else if (strstr(vbuf, "Powerpoint"))
118                                                str = "vnd.ms-powerpoint";
119                                        else if (strstr(vbuf,
120                                            "Crystal Reports"))
121                                                str = "x-rpt";
122                                }
123                        }
124                        break;
125                case CDF_FILETIME:
126                        tp = info[i].pi_tp;
127                        if (tp != 0) {
128                                if (tp < 1000000000000000LL) {
129                                        char tbuf[64];
130                                        cdf_print_elapsed_time(tbuf,
131                                            sizeof(tbuf), tp);
132                                        if (NOTMIME(ms) && file_printf(ms,
133                                            ", %s: %s", buf, tbuf) == -1)
134                                                return -1;
135                                } else {
136                                        char *c, *ec;
137                                        cdf_timestamp_to_timespec(&ts, tp);
138                                        c = cdf_ctime(&ts.tv_sec);
139                                        if ((ec = strchr(c, '\n')) != NULL)
140                                                *ec = '\0';
141
142                                        if (NOTMIME(ms) && file_printf(ms,
143                                            ", %s: %s", buf, c) == -1)
144                                                return -1;
145                                }
146                        }
147                        break;
148                case CDF_CLIPBOARD:
149                        break;
150                default:
151                        return -1;
152                }
153        }
154        if (!NOTMIME(ms)) {
155		if (str == NULL)
156			return 0;
157                if (file_printf(ms, "application/%s", str) == -1)
158                        return -1;
159        }
160        return 1;
161}
162
163private int
164cdf_file_summary_info(struct magic_set *ms, const cdf_header_t *h,
165    const cdf_stream_t *sst)
166{
167        cdf_summary_info_header_t si;
168        cdf_property_info_t *info;
169        size_t count;
170        int m;
171
172        if (cdf_unpack_summary_info(sst, h, &si, &info, &count) == -1)
173                return -1;
174
175        if (NOTMIME(ms)) {
176                if (file_printf(ms, "Composite Document File V2 Document")
177		    == -1)
178                        return -1;
179
180                if (file_printf(ms, ", %s Endian",
181                    si.si_byte_order == 0xfffe ?  "Little" : "Big") == -1)
182                        return -2;
183                switch (si.si_os) {
184                case 2:
185                        if (file_printf(ms, ", Os: Windows, Version %d.%d",
186                            si.si_os_version & 0xff,
187                            (uint32_t)si.si_os_version >> 8) == -1)
188                                return -2;
189                        break;
190                case 1:
191                        if (file_printf(ms, ", Os: MacOS, Version %d.%d",
192                            (uint32_t)si.si_os_version >> 8,
193                            si.si_os_version & 0xff) == -1)
194                                return -2;
195                        break;
196                default:
197                        if (file_printf(ms, ", Os %d, Version: %d.%d", si.si_os,
198                            si.si_os_version & 0xff,
199                            (uint32_t)si.si_os_version >> 8) == -1)
200                                return -2;
201                        break;
202                }
203        }
204
205        m = cdf_file_property_info(ms, info, count);
206        free(info);
207
208        return m == -1 ? -2 : m;
209}
210
211protected int
212file_trycdf(struct magic_set *ms, int fd, const unsigned char *buf,
213    size_t nbytes)
214{
215        cdf_info_t info;
216        cdf_header_t h;
217        cdf_sat_t sat, ssat;
218        cdf_stream_t sst, scn;
219        cdf_dir_t dir;
220        int i;
221        const char *expn = "";
222        const char *corrupt = "corrupt: ";
223
224        info.i_fd = fd;
225        info.i_buf = buf;
226        info.i_len = nbytes;
227        if (ms->flags & MAGIC_APPLE)
228                return 0;
229        if (cdf_read_header(&info, &h) == -1)
230                return 0;
231#ifdef CDF_DEBUG
232        cdf_dump_header(&h);
233#endif
234
235        if ((i = cdf_read_sat(&info, &h, &sat)) == -1) {
236                expn = "Can't read SAT";
237                goto out0;
238        }
239#ifdef CDF_DEBUG
240        cdf_dump_sat("SAT", &sat, CDF_SEC_SIZE(&h));
241#endif
242
243        if ((i = cdf_read_ssat(&info, &h, &sat, &ssat)) == -1) {
244                expn = "Can't read SSAT";
245                goto out1;
246        }
247#ifdef CDF_DEBUG
248        cdf_dump_sat("SSAT", &ssat, CDF_SHORT_SEC_SIZE(&h));
249#endif
250
251        if ((i = cdf_read_dir(&info, &h, &sat, &dir)) == -1) {
252                expn = "Can't read directory";
253                goto out2;
254        }
255
256        if ((i = cdf_read_short_stream(&info, &h, &sat, &dir, &sst)) == -1) {
257                expn = "Cannot read short stream";
258                goto out3;
259        }
260#ifdef CDF_DEBUG
261        cdf_dump_dir(&info, &h, &sat, &ssat, &sst, &dir);
262#endif
263
264        if ((i = cdf_read_summary_info(&info, &h, &sat, &ssat, &sst, &dir,
265            &scn)) == -1) {
266                if (errno == ESRCH) {
267                        corrupt = expn;
268                        expn = "No summary info";
269                } else {
270                        expn = "Cannot read summary info";
271                }
272                goto out4;
273        }
274#ifdef CDF_DEBUG
275        cdf_dump_summary_info(&h, &scn);
276#endif
277        if ((i = cdf_file_summary_info(ms, &h, &scn)) < 0)
278                expn = "Can't expand summary_info";
279	if (i == 0) {
280		const char *str = "vnd.ms-office";
281		cdf_directory_t *d;
282		char name[__arraycount(d->d_name)];
283		size_t j, k;
284		for (j = 0; j < dir.dir_len; j++) {
285		    d = &dir.dir_tab[j];
286		    for (k = 0; k < sizeof(name); k++)
287			name[k] = (char)cdf_tole2(d->d_name[k]);
288		    if (strstr(name, "WordDocument") == 0) {
289			str = "msword";
290			break;
291		    }
292		}
293                if (file_printf(ms, "application/%s", str) == -1)
294                        return -1;
295		i = 1;
296	}
297        free(scn.sst_tab);
298out4:
299        free(sst.sst_tab);
300out3:
301        free(dir.dir_tab);
302out2:
303        free(ssat.sat_tab);
304out1:
305        free(sat.sat_tab);
306out0:
307        if (i != 1) {
308		if (i == -1)
309		    if (file_printf(ms, "Composite Document File V2 Document")
310			== -1)
311			    return -1;
312                if (*expn)
313                        if (file_printf(ms, ", %s%s", corrupt, expn) == -1)
314                                return -1;
315                i = 1;
316        }
317        return i;
318}
319