2 * Copyright (c) 2008 Christos Zoulas
5 * Redistribution and use in source and binary forms, with or without
6 * modification, are permitted provided that the following conditions
8 * 1. Redistributions of source code must retain the above copyright
9 * notice, this list of conditions and the following disclaimer.
10 * 2. Redistributions in binary form must reproduce the above copyright
11 * notice, this list of conditions and the following disclaimer in the
12 * documentation and/or other materials provided with the distribution.
14 * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
15 * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
16 * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
17 * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
18 * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
19 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
20 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
21 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
22 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
23 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
24 * POSSIBILITY OF SUCH DAMAGE.
29 FILE_RCSID("@(#)$File: readcdf.c,v 1.44 2014/05/14 23:22:48 christos Exp $")
38 #if defined(HAVE_LOCALE_H)
45 #define NOTMIME(ms) (((ms)->flags & MAGIC_MIME) == 0)
47 static const struct nv {
51 { "Word", "msword", },
52 { "Excel", "vnd.ms-excel", },
53 { "Powerpoint", "vnd.ms-powerpoint", },
54 { "Crystal Reports", "x-rpt", },
55 { "Advanced Installer", "vnd.ms-msi", },
56 { "InstallShield", "vnd.ms-msi", },
57 { "Microsoft Patch Compiler", "vnd.ms-msi", },
58 { "NAnt", "vnd.ms-msi", },
59 { "Windows Installer", "vnd.ms-msi", },
62 { "WordDocument", "msword", },
63 { "PowerPoint", "vnd.ms-powerpoint", },
64 { "DigitalSignature", "vnd.ms-msi", },
67 { "WordDocument", "Microsoft Office Word",},
68 { "PowerPoint", "Microsoft PowerPoint", },
69 { "DigitalSignature", "Microsoft Installer", },
73 static const struct cv {
78 { 0x00000000000c1084LLU, 0x46000000000000c0LLU },
86 { 0x00000000000c1084LLU, 0x46000000000000c0LLU },
95 cdf_clsid_to_mime(const uint64_t clsid[2], const struct cv *cv)
98 for (i = 0; cv[i].mime != NULL; i++) {
99 if (clsid[0] == cv[i].clsid[0] && clsid[1] == cv[i].clsid[1])
106 cdf_app_to_mime(const char *vbuf, const struct nv *nv)
109 const char *rv = NULL;
112 old_lc_ctype = setlocale(LC_CTYPE, NULL);
113 assert(old_lc_ctype != NULL);
114 old_lc_ctype = strdup(old_lc_ctype);
115 assert(old_lc_ctype != NULL);
116 (void)setlocale(LC_CTYPE, "C");
117 for (i = 0; nv[i].pattern != NULL; i++)
118 if (strcasestr(vbuf, nv[i].pattern) != NULL) {
122 (void)setlocale(LC_CTYPE, old_lc_ctype);
128 cdf_file_property_info(struct magic_set *ms, const cdf_property_info_t *info,
129 size_t count, const cdf_directory_t *root_storage)
135 const char *str = NULL;
139 if (!NOTMIME(ms) && root_storage)
140 str = cdf_clsid_to_mime(root_storage->d_storage_uuid,
143 for (i = 0; i < count; i++) {
144 cdf_print_property_name(buf, sizeof(buf), info[i].pi_id);
145 switch (info[i].pi_type) {
149 if (NOTMIME(ms) && file_printf(ms, ", %s: %hd", buf,
150 info[i].pi_s16) == -1)
154 if (NOTMIME(ms) && file_printf(ms, ", %s: %d", buf,
155 info[i].pi_s32) == -1)
159 if (NOTMIME(ms) && file_printf(ms, ", %s: %u", buf,
160 info[i].pi_u32) == -1)
164 if (NOTMIME(ms) && file_printf(ms, ", %s: %g", buf,
169 if (NOTMIME(ms) && file_printf(ms, ", %s: %g", buf,
173 case CDF_LENGTH32_STRING:
174 case CDF_LENGTH32_WSTRING:
175 len = info[i].pi_str.s_len;
180 if (info[i].pi_type == CDF_LENGTH32_WSTRING)
182 s = info[i].pi_str.s_buf;
183 for (j = 0; j < sizeof(vbuf) && len--; s += k) {
186 if (isprint((unsigned char)*s))
189 if (j == sizeof(vbuf))
194 if (file_printf(ms, ", %s: %s",
198 } else if (str == NULL && info[i].pi_id ==
199 CDF_PROPERTY_NAME_OF_APPLICATION) {
200 str = cdf_app_to_mime(vbuf, app2mime);
208 if (tp < 1000000000000000LL) {
209 cdf_print_elapsed_time(tbuf,
211 if (NOTMIME(ms) && file_printf(ms,
212 ", %s: %s", buf, tbuf) == -1)
216 cdf_timestamp_to_timespec(&ts, tp);
217 c = cdf_ctime(&ts.tv_sec, tbuf);
219 (ec = strchr(c, '\n')) != NULL)
222 if (NOTMIME(ms) && file_printf(ms,
223 ", %s: %s", buf, c) == -1)
237 if (file_printf(ms, "application/%s", str) == -1)
244 cdf_file_summary_info(struct magic_set *ms, const cdf_header_t *h,
245 const cdf_stream_t *sst, const cdf_directory_t *root_storage)
247 cdf_summary_info_header_t si;
248 cdf_property_info_t *info;
252 if (cdf_unpack_summary_info(sst, h, &si, &info, &count) == -1)
258 if (file_printf(ms, "Composite Document File V2 Document")
262 if (file_printf(ms, ", %s Endian",
263 si.si_byte_order == 0xfffe ? "Little" : "Big") == -1)
267 if (file_printf(ms, ", Os: Windows, Version %d.%d",
268 si.si_os_version & 0xff,
269 (uint32_t)si.si_os_version >> 8) == -1)
273 if (file_printf(ms, ", Os: MacOS, Version %d.%d",
274 (uint32_t)si.si_os_version >> 8,
275 si.si_os_version & 0xff) == -1)
279 if (file_printf(ms, ", Os %d, Version: %d.%d", si.si_os,
280 si.si_os_version & 0xff,
281 (uint32_t)si.si_os_version >> 8) == -1)
286 str = cdf_clsid_to_mime(root_storage->d_storage_uuid,
289 if (file_printf(ms, ", %s", str) == -1)
294 m = cdf_file_property_info(ms, info, count, root_storage);
297 return m == -1 ? -2 : m;
302 format_clsid(char *buf, size_t len, const uint64_t uuid[2]) {
303 snprintf(buf, len, "%.8" PRIx64 "-%.4" PRIx64 "-%.4" PRIx64 "-%.4"
304 PRIx64 "-%.12" PRIx64,
305 (uuid[0] >> 32) & (uint64_t)0x000000000ffffffffLLU,
306 (uuid[0] >> 16) & (uint64_t)0x0000000000000ffffLLU,
307 (uuid[0] >> 0) & (uint64_t)0x0000000000000ffffLLU,
308 (uuid[1] >> 48) & (uint64_t)0x0000000000000ffffLLU,
309 (uuid[1] >> 0) & (uint64_t)0x0000fffffffffffffLLU);
315 file_trycdf(struct magic_set *ms, int fd, const unsigned char *buf,
321 cdf_stream_t sst, scn;
324 const char *expn = "";
325 const char *corrupt = "corrupt: ";
330 if (ms->flags & MAGIC_APPLE)
332 if (cdf_read_header(&info, &h) == -1)
338 if ((i = cdf_read_sat(&info, &h, &sat)) == -1) {
339 expn = "Can't read SAT";
343 cdf_dump_sat("SAT", &sat, CDF_SEC_SIZE(&h));
346 if ((i = cdf_read_ssat(&info, &h, &sat, &ssat)) == -1) {
347 expn = "Can't read SSAT";
351 cdf_dump_sat("SSAT", &ssat, CDF_SHORT_SEC_SIZE(&h));
354 if ((i = cdf_read_dir(&info, &h, &sat, &dir)) == -1) {
355 expn = "Can't read directory";
359 const cdf_directory_t *root_storage;
360 if ((i = cdf_read_short_stream(&info, &h, &sat, &dir, &sst,
361 &root_storage)) == -1) {
362 expn = "Cannot read short stream";
366 cdf_dump_dir(&info, &h, &sat, &ssat, &sst, &dir);
372 if (file_printf(ms, "CLSID %s, ",
373 format_clsid(clsbuf, sizeof(clsbuf),
374 root_storage->d_storage_uuid)) == -1)
380 if ((i = cdf_read_user_stream(&info, &h, &sat, &ssat, &sst, &dir,
381 "FileHeader", &scn)) != -1) {
382 #define HWP5_SIGNATURE "HWP Document File"
383 if (scn.sst_dirlen >= sizeof(HWP5_SIGNATURE) - 1
384 && memcmp(scn.sst_tab, HWP5_SIGNATURE,
385 sizeof(HWP5_SIGNATURE) - 1) == 0) {
388 "Hangul (Korean) Word Processor File 5.x") == -1)
391 if (file_printf(ms, "application/x-hwp") == -1)
404 if ((i = cdf_read_summary_info(&info, &h, &sat, &ssat, &sst, &dir,
406 if (errno == ESRCH) {
408 expn = "No summary info";
410 expn = "Cannot read summary info";
415 cdf_dump_summary_info(&h, &scn);
417 if ((i = cdf_file_summary_info(ms, &h, &scn, root_storage)) < 0)
418 expn = "Can't expand summary_info";
421 const char *str = NULL;
423 char name[__arraycount(d->d_name)];
426 for (j = 0; str == NULL && j < dir.dir_len; j++) {
428 for (k = 0; k < sizeof(name); k++)
429 name[k] = (char)cdf_tole2(d->d_name[k]);
430 str = cdf_app_to_mime(name,
431 NOTMIME(ms) ? name2desc : name2mime);
435 if (file_printf(ms, "%s", str) == -1)
441 str = "vnd.ms-office";
442 if (file_printf(ms, "application/%s", str) == -1)
461 "Composite Document File V2 Document") == -1)
464 if (file_printf(ms, ", %s%s", corrupt, expn) == -1)
467 if (file_printf(ms, "application/CDFV2-corrupt") == -1)