2 * Copyright (c) Ian F. Darwin 1986-1995.
3 * Software written by Ian F. Darwin and others;
4 * maintained 1995-present by Christos Zoulas and others.
6 * Redistribution and use in source and binary forms, with or without
7 * modification, are permitted provided that the following conditions
9 * 1. Redistributions of source code must retain the above copyright
10 * notice immediately at the beginning of the file, without modification,
11 * this list of conditions, and the following disclaimer.
12 * 2. Redistributions in binary form must reproduce the above copyright
13 * notice, this list of conditions and the following disclaimer in the
14 * documentation and/or other materials provided with the distribution.
16 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
17 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
18 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
19 * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE FOR
20 * ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
21 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
22 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
23 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
24 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
25 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
29 * softmagic - interpret variable magic from MAGIC
35 FILE_RCSID("@(#)$File: softmagic.c,v 1.147 2011/11/05 15:44:22 rrt Exp $")
/*
 * Forward declarations for the file-local helpers defined further down:
 * the matcher (match, mget, magiccheck), the output helpers (mprint,
 * moffset, mdebug, print_sep, handle_annotation), the data loaders
 * (mcopy, mconvert) and the per-width mask helpers (cvt_8 .. cvt_64).
 */
45 private int match(struct magic_set *, struct magic *, uint32_t,
46 const unsigned char *, size_t, int, int, int);
47 private int mget(struct magic_set *, const unsigned char *,
48 struct magic *, size_t, unsigned int, int, int);
49 private int magiccheck(struct magic_set *, struct magic *);
50 private int32_t mprint(struct magic_set *, struct magic *);
51 private int32_t moffset(struct magic_set *, struct magic *);
52 private void mdebug(uint32_t, const char *, size_t);
53 private int mcopy(struct magic_set *, union VALUETYPE *, int, int,
54 const unsigned char *, uint32_t, size_t, size_t);
55 private int mconvert(struct magic_set *, struct magic *);
56 private int print_sep(struct magic_set *, int);
57 private int handle_annotation(struct magic_set *, struct magic *);
58 private void cvt_8(union VALUETYPE *, const struct magic *);
59 private void cvt_16(union VALUETYPE *, const struct magic *);
60 private void cvt_32(union VALUETYPE *, const struct magic *);
61 private void cvt_64(union VALUETYPE *, const struct magic *);
/*
 * OFFSET_OOB(n, o, i): non-zero when o is larger than n, or when i is
 * larger than the n - o units that remain after o.  The first test
 * short-circuits, so n - o is only computed when o <= n.
 * n and o are each expanded twice, so avoid arguments with side effects.
 */
63 #define OFFSET_OOB(n, o, i) ((n) < (o) || (i) > ((n) - (o)))
65 * softmagic - look up one file in the parsed, in-memory copy of the database.
66 * Passed the magic set and a buffer (buf, nbytes) holding the data to be typed.
/*
 * file_softmagic: walk the list anchored at ms->mlist, starting at
 * ms->mlist->next and stopping when the walk comes back to ms->mlist.
 * For every list node, ml->magic and ml->nmagic are handed to match()
 * together with buf, nbytes and mode; the result is kept in rv.
 * NOTE(review): the remaining match() arguments and the handling of rv
 * are not visible here.
 */
68 /*ARGSUSED1*/ /* nbytes passed for regularity, maybe need later */
70 file_softmagic(struct magic_set *ms, const unsigned char *buf, size_t nbytes,
71 size_t level, int mode, int text)
75 for (ml = ms->mlist->next; ml != ms->mlist; ml = ml->next)
76 if ((rv = match(ms, ml->magic, ml->nmagic, buf, nbytes, mode,
84 * Go through the whole list, stopping if you find a match. Process all
85 * the continuations of that match before returning.
87 * We support multi-level continuations:
89 * At any time when processing a successful top-level match, there is a
90 * current continuation level; it represents the level of the last
91 * successfully matched continuation.
93 * Continuations above that level are skipped as, if we see one, it
94 * means that the continuation that controls them - i.e., the
95 * lower-level continuation preceding them - failed to match.
97 * Continuations below that level are processed as, if we see one,
98 * it means we've finished processing or skipping higher-level
99 * continuations under the control of a successful or unsuccessful
100 * lower-level continuation, and are now seeing the next lower-level
101 * continuation and should process it. The current continuation
102 * level reverts to the level of the one we're seeing.
104 * Continuations at the current level are processed as, if we see
105 * one, there's no lower-level continuation that may have failed.
107 * If a continuation matches, we bump the current continuation level
108 * so that higher-level continuations are processed.
/*
 * match: test the buffer s (nbytes long) against the nmagic entries of
 * magic[].  An entry with cont_level 0 is a top-level test; the entries
 * with a non-zero cont_level that follow it are its continuations.
 *
 * What the visible statements do for each top-level entry:
 *  - The entry and its continuations are skipped when it is a string
 *    type restricted to binary data while `text` is set (or restricted
 *    to text while `text` is clear), or when (m->flag & mode) != mode.
 *  - ms->offset and ms->line are loaded from the entry, the value is
 *    fetched with mget() and compared with magiccheck().
 *  - On a match handle_annotation() and print_sep() are called, mprint()
 *    runs when `print` is set, moffset() is stored in
 *    ms->c.li[cont_level].off, and the continuation entries are walked
 *    with cont_level tracking the current nesting depth.
 *  - When MAGIC_CONTINUE is not set and something was printed, returnval
 *    is returned without searching further.
 *
 * NOTE(review): the continuation loop reads magic[magindex+1].cont_level
 * before it tests ++magindex < nmagic, so with magindex == nmagic - 1 it
 * reads one element past the nmagic entries.  The loop that flushes the
 * continuations of a failed entry tests magindex < nmagic - 1 first;
 * the other loops should probably use the same order.
 * NOTE(review): OFFADD and INDIROFFADD handling index
 * ms->c.li[cont_level - 1]; confirm cont_level cannot be 0 there.
 */
111 match(struct magic_set *ms, struct magic *magic, uint32_t nmagic,
112 const unsigned char *s, size_t nbytes, int mode, int text,
115 uint32_t magindex = 0;
116 unsigned int cont_level = 0;
117 int need_separator = 0;
118 int returnval = 0, e; /* if a match is found it is set to 1*/
119 int firstline = 1; /* a flag to print X\n X\n- X */
120 int printed_something = 0;
/* Descriptions are printed only when no MAGIC_MIME or MAGIC_APPLE bit is set. */
121 int print = (ms->flags & (MAGIC_MIME|MAGIC_APPLE)) == 0;
123 if (file_check_mem(ms, cont_level) == -1)
126 for (magindex = 0; magindex < nmagic; magindex++) {
128 struct magic *m = &magic[magindex];
130 if ((IS_STRING(m->type) &&
131 ((text && (m->str_flags & (STRING_BINTEST | STRING_TEXTTEST)) == STRING_BINTEST) ||
132 (!text && (m->str_flags & (STRING_TEXTTEST | STRING_BINTEST)) == STRING_TEXTTEST))) ||
133 (m->flag & mode) != mode) {
/* NOTE(review): confirm the bound on magindex is tested before magic[magindex + 1] is read. */
135 while (magic[magindex + 1].cont_level != 0 &&
138 continue; /* Skip to next top-level test*/
141 ms->offset = m->offset;
142 ms->line = m->lineno;
144 /* if main entry matches, print it... */
145 switch (mget(ms, s, m, nbytes, cont_level, text, recursion_level + 1)) {
149 flush = m->reln != '!';
152 if (m->type == FILE_INDIRECT)
155 switch (magiccheck(ms, m)) {
169 * main entry didn't match,
170 * flush its continuations
172 while (magindex < nmagic - 1 &&
173 magic[magindex + 1].cont_level != 0)
178 if ((e = handle_annotation(ms, m)) != 0)
181 * If we are going to print something, we'll need to print
182 * a blank before we print something else.
186 printed_something = 1;
187 if (print_sep(ms, firstline) == -1)
192 if (print && mprint(ms, m) == -1)
195 ms->c.li[cont_level].off = moffset(ms, m);
197 /* and any continuations that match */
198 if (file_check_mem(ms, ++cont_level) == -1)
201 while (magic[magindex+1].cont_level != 0 &&
202 ++magindex < nmagic) {
203 m = &magic[magindex];
204 ms->line = m->lineno; /* for messages */
206 if (cont_level < m->cont_level)
208 if (cont_level > m->cont_level) {
210 * We're at the end of the level
211 * "cont_level" continuations.
213 cont_level = m->cont_level;
215 ms->offset = m->offset;
216 if (m->flag & OFFADD) {
218 ms->c.li[cont_level - 1].off;
221 #ifdef ENABLE_CONDITIONALS
222 if (m->cond == COND_ELSE ||
223 m->cond == COND_ELIF) {
224 if (ms->c.li[cont_level].last_match == 1)
228 switch (mget(ms, s, m, nbytes, cont_level, text, recursion_level + 1)) {
237 if (m->type == FILE_INDIRECT)
243 switch (flush ? 1 : magiccheck(ms, m)) {
247 #ifdef ENABLE_CONDITIONALS
248 ms->c.li[cont_level].last_match = 0;
252 #ifdef ENABLE_CONDITIONALS
253 ms->c.li[cont_level].last_match = 1;
255 if (m->type != FILE_DEFAULT)
256 ms->c.li[cont_level].got_match = 1;
257 else if (ms->c.li[cont_level].got_match) {
258 ms->c.li[cont_level].got_match = 0;
261 if ((e = handle_annotation(ms, m)) != 0)
264 * If we are going to print something,
265 * make sure that we have a separator first.
268 if (!printed_something) {
269 printed_something = 1;
270 if (print_sep(ms, firstline)
276 * This continuation matched. Print
277 * its message, with a blank before it
278 * if the previous item printed and
279 * this item isn't empty.
281 /* space if previous printed */
283 && ((m->flag & NOSPACE) == 0)
286 file_printf(ms, " ") == -1)
290 if (print && mprint(ms, m) == -1)
293 ms->c.li[cont_level].off = moffset(ms, m);
299 * If we see any continuations
303 if (file_check_mem(ms, ++cont_level) == -1)
308 if (printed_something) {
313 if ((ms->flags & MAGIC_CONTINUE) == 0 && printed_something) {
314 return returnval; /* don't keep searching */
317 return returnval; /* This is hit if -k is set or there is no match */
/*
 * check_fmt: look for a string conversion in the description m->desc.
 * A description with no percent sign is handled by the early strchr()
 * test.  Otherwise the extended regex %[-0-9\.]*s (percent sign, any
 * run of digits, dots and minus signs, then s) is compiled with
 * REG_NOSUB and executed against m->desc.  A regcomp() failure is
 * turned into text with regerror() and reported via file_magerror().
 * NOTE(review): the pattern is recompiled on every call.
 */
321 check_fmt(struct magic_set *ms, struct magic *m)
326 if (strchr(m->desc, '%') == NULL)
329 rc = regcomp(&rx, "%[-0-9\\.]*s", REG_EXTENDED|REG_NOSUB);
332 (void)regerror(rc, &rx, errmsg, sizeof(errmsg));
333 file_magerror(ms, "regex error %d, (%s)", rc, errmsg);
336 rc = regexec(&rx, m->desc, 0, 0, 0);
/*
 * Local strndup() replacement; the closing #endif names HAVE_STRNDUP as
 * the controlling configuration macro.  The loop counts at most n bytes
 * of str, stopping early at a NUL byte; len + 1 bytes are then obtained
 * from malloc() and the first len bytes of str are copied in.
 * The caller owns the returned memory.
 */
343 char * strndup(const char *, size_t);
346 strndup(const char *str, size_t n)
351 for (len = 0; len < n && str[len]; len++)
353 if ((copy = malloc(len + 1)) == NULL)
355 (void)memcpy(copy, str, len);
359 #endif /* HAVE_STRNDUP */
/*
 * mprint: print the description m->desc of a matched entry, formatting
 * the value held in ms->ms_value (p), and compute in t the offset just
 * past the data that was consumed.
 *
 * Visible handling, by the union member that is read:
 *  - p->b, p->h, p->l: the value is passed through file_signextend();
 *    check_fmt() then selects between rendering the number into buf with
 *    snprintf() and handing that string to file_printf(), or handing the
 *    number itself to file_printf().
 *  - p->q: passed through file_signextend() and printed as uint64_t.
 *  - string types: with relation = or ! the magic text m->value.s is
 *    printed and t advances by m->vallen; otherwise the file data p->s
 *    is printed (cut at the first newline when the magic text is empty)
 *    and t advances by strlen(p->s), plus the length-prefix size for
 *    FILE_PSTRING.
 *  - time values: p->l or p->q is converted with file_fmttime().
 *  - vf / vd: same check_fmt() split as the integers, using "%g".
 *  - search results: either a strndup() copy of ms->search.s limited to
 *    rm_len bytes is printed (file_oomem() on allocation failure) or
 *    m->value.s is printed; t is ms->search.offset, advanced by the
 *    match length unless REGEX_OFFSET_START is set.
 *  - any other type is reported through file_magerror().
 *
 * NOTE(review): the two file_fmttime(p->l, ...) cases advance t by
 * sizeof(time_t) although the value comes from p->l; confirm this is
 * intended where time_t is wider than that member.
 * NOTE(review): file_fmttime((uint32_t)p->q, ...) keeps only the low
 * 32 bits of the 64-bit value.
 */
362 mprint(struct magic_set *ms, struct magic *m)
369 union VALUETYPE *p = &ms->ms_value;
373 v = file_signextend(ms, m, (uint64_t)p->b);
374 switch (check_fmt(ms, m)) {
378 (void)snprintf(buf, sizeof(buf), "%c",
380 if (file_printf(ms, m->desc, buf) == -1)
384 if (file_printf(ms, m->desc, (unsigned char) v) == -1)
388 t = ms->offset + sizeof(char);
394 v = file_signextend(ms, m, (uint64_t)p->h);
395 switch (check_fmt(ms, m)) {
399 (void)snprintf(buf, sizeof(buf), "%hu",
401 if (file_printf(ms, m->desc, buf) == -1)
406 file_printf(ms, m->desc, (unsigned short) v) == -1)
410 t = ms->offset + sizeof(short);
417 v = file_signextend(ms, m, (uint64_t)p->l);
418 switch (check_fmt(ms, m)) {
422 (void)snprintf(buf, sizeof(buf), "%u", (uint32_t)v);
423 if (file_printf(ms, m->desc, buf) == -1)
427 if (file_printf(ms, m->desc, (uint32_t) v) == -1)
431 t = ms->offset + sizeof(int32_t);
437 v = file_signextend(ms, m, p->q);
438 if (file_printf(ms, m->desc, (uint64_t) v) == -1)
440 t = ms->offset + sizeof(int64_t);
445 case FILE_BESTRING16:
446 case FILE_LESTRING16:
447 if (m->reln == '=' || m->reln == '!') {
448 if (file_printf(ms, m->desc, m->value.s) == -1)
450 t = ms->offset + m->vallen;
/* An empty magic string means: print the file data up to the first newline. */
453 if (*m->value.s == '\0')
454 p->s[strcspn(p->s, "\n")] = '\0';
455 if (file_printf(ms, m->desc, p->s) == -1)
457 t = ms->offset + strlen(p->s);
458 if (m->type == FILE_PSTRING)
459 t += file_pstring_length_size(m);
467 if (file_printf(ms, m->desc, file_fmttime(p->l, 1)) == -1)
469 t = ms->offset + sizeof(time_t);
476 if (file_printf(ms, m->desc, file_fmttime(p->l, 0)) == -1)
478 t = ms->offset + sizeof(time_t);
484 if (file_printf(ms, m->desc, file_fmttime((uint32_t)p->q,
487 t = ms->offset + sizeof(uint64_t);
493 if (file_printf(ms, m->desc, file_fmttime((uint32_t)p->q,
496 t = ms->offset + sizeof(uint64_t);
503 switch (check_fmt(ms, m)) {
507 (void)snprintf(buf, sizeof(buf), "%g", vf);
508 if (file_printf(ms, m->desc, buf) == -1)
512 if (file_printf(ms, m->desc, vf) == -1)
516 t = ms->offset + sizeof(float);
523 switch (check_fmt(ms, m)) {
527 (void)snprintf(buf, sizeof(buf), "%g", vd);
528 if (file_printf(ms, m->desc, buf) == -1)
532 if (file_printf(ms, m->desc, vd) == -1)
536 t = ms->offset + sizeof(double);
/* Print a private copy of the matched text, limited to rm_len bytes. */
543 cp = strndup((const char *)ms->search.s, ms->search.rm_len);
545 file_oomem(ms, ms->search.rm_len);
548 rval = file_printf(ms, m->desc, cp);
554 if ((m->str_flags & REGEX_OFFSET_START))
555 t = ms->search.offset;
557 t = ms->search.offset + ms->search.rm_len;
562 if (file_printf(ms, m->desc, m->value.s) == -1)
564 if ((m->str_flags & REGEX_OFFSET_START))
565 t = ms->search.offset;
567 t = ms->search.offset + m->vallen;
571 if (file_printf(ms, m->desc, m->value.s) == -1)
581 file_magerror(ms, "invalid m->type (%d) in mprint()", m->type);
/*
 * moffset: return, as int32_t, the offset that follows the data consumed
 * by entry m.  The arithmetic matches the `t` computations in mprint(),
 * but nothing is printed.
 *
 *  - Fixed-width values: ms->offset plus the size of the C type shown
 *    in each return statement.
 *  - String types: ms->offset + m->vallen for relation = or !;
 *    otherwise ms->offset + strlen(p->s), plus the length-prefix size
 *    for FILE_PSTRING.
 *  - Search results: ms->search.offset, advanced by the match length
 *    unless REGEX_OFFSET_START is set in m->str_flags.
 *
 * NOTE(review): the string branch writes a NUL into p->s at the first
 * newline when the magic text is empty, so this function modifies
 * ms->ms_value as a side effect.
 * NOTE(review): the ms->offset + m->vallen return is the only one
 * without an explicit CAST(int32_t, ...).
 */
588 moffset(struct magic_set *ms, struct magic *m)
592 return CAST(int32_t, (ms->offset + sizeof(char)));
597 return CAST(int32_t, (ms->offset + sizeof(short)));
603 return CAST(int32_t, (ms->offset + sizeof(int32_t)));
608 return CAST(int32_t, (ms->offset + sizeof(int64_t)));
612 case FILE_BESTRING16:
613 case FILE_LESTRING16:
614 if (m->reln == '=' || m->reln == '!')
615 return ms->offset + m->vallen;
617 union VALUETYPE *p = &ms->ms_value;
620 if (*m->value.s == '\0')
621 p->s[strcspn(p->s, "\n")] = '\0';
622 t = CAST(uint32_t, (ms->offset + strlen(p->s)));
623 if (m->type == FILE_PSTRING)
624 t += file_pstring_length_size(m);
632 return CAST(int32_t, (ms->offset + sizeof(time_t)));
638 return CAST(int32_t, (ms->offset + sizeof(time_t)));
643 return CAST(int32_t, (ms->offset + sizeof(uint64_t)));
648 return CAST(int32_t, (ms->offset + sizeof(uint64_t)));
653 return CAST(int32_t, (ms->offset + sizeof(float)));
658 return CAST(int32_t, (ms->offset + sizeof(double)));
661 if ((m->str_flags & REGEX_OFFSET_START) != 0)
662 return CAST(int32_t, ms->search.offset);
664 return CAST(int32_t, (ms->search.offset +
668 if ((m->str_flags & REGEX_OFFSET_START) != 0)
669 return CAST(int32_t, ms->search.offset);
671 return CAST(int32_t, (ms->search.offset + m->vallen));
/*
 * DO_CVT(fld, cast): apply the numeric mask operation selected by
 * m->mask_op & FILE_OPS_MASK to the union member p->fld, with
 * m->num_mask converted by `cast` as the right-hand operand.  The
 * visible arms perform &=, |=, ^=, +=, -=, *=, /= and %=; a test of
 * FILE_OPINVERSE follows the switch.  The macro expects variables named
 * p and m to be in scope where it is expanded.
 *
 * NOTE(review): the /= and %= arms use m->num_mask as divisor with no
 * zero check visible here; confirm the mask is validated earlier.
 */
684 #define DO_CVT(fld, cast) \
686 switch (m->mask_op & FILE_OPS_MASK) { \
688 p->fld &= cast m->num_mask; \
691 p->fld |= cast m->num_mask; \
694 p->fld ^= cast m->num_mask; \
697 p->fld += cast m->num_mask; \
700 p->fld -= cast m->num_mask; \
702 case FILE_OPMULTIPLY: \
703 p->fld *= cast m->num_mask; \
705 case FILE_OPDIVIDE: \
706 p->fld /= cast m->num_mask; \
708 case FILE_OPMODULO: \
709 p->fld %= cast m->num_mask; \
712 if (m->mask_op & FILE_OPINVERSE) \
/* cvt_8: apply the mask operation of m to the 8-bit member p->b via DO_CVT. */
716 cvt_8(union VALUETYPE *p, const struct magic *m)
718 DO_CVT(b, (uint8_t));
/* cvt_16: apply the mask operation of m to the 16-bit member p->h via DO_CVT. */
722 cvt_16(union VALUETYPE *p, const struct magic *m)
724 DO_CVT(h, (uint16_t));
/* cvt_32: apply the mask operation of m to the 32-bit member p->l via DO_CVT. */
728 cvt_32(union VALUETYPE *p, const struct magic *m)
730 DO_CVT(l, (uint32_t));
/* cvt_64: apply the mask operation of m to the 64-bit member p->q via DO_CVT. */
734 cvt_64(union VALUETYPE *p, const struct magic *m)
736 DO_CVT(q, (uint64_t));
/*
 * DO_CVT2(fld, cast): reduced form of DO_CVT whose visible arms perform
 * only +=, -=, *= and /= on p->fld; it is expanded by cvt_double() for
 * the member d.  Like DO_CVT it expects p and m to be in scope.
 */
739 #define DO_CVT2(fld, cast) \
741 switch (m->mask_op & FILE_OPS_MASK) { \
743 p->fld += cast m->num_mask; \
746 p->fld -= cast m->num_mask; \
748 case FILE_OPMULTIPLY: \
749 p->fld *= cast m->num_mask; \
751 case FILE_OPDIVIDE: \
752 p->fld /= cast m->num_mask; \
/* cvt_float: mask helper for float values; presumably expands DO_CVT2 like cvt_double() - TODO confirm. */
757 cvt_float(union VALUETYPE *p, const struct magic *m)
/* cvt_double: apply the arithmetic mask operation of m to the double member p->d via DO_CVT2. */
763 cvt_double(union VALUETYPE *p, const struct magic *m)
765 DO_CVT2(d, (double));
769 * Convert the byte order of the data we are looking at
770 * While we're here, let's apply the mask operation
771 * (unless you have a better idea)
/*
 * mconvert: normalise the raw bytes in ms->ms_value (p) for entry m.
 *
 *  - String types: the last byte of p->s is forced to NUL.  For the
 *    length-prefixed form the payload starts file_pstring_length_size(m)
 *    bytes in, and the length from file_pstring_get_length() is clamped
 *    to sizeof(p->s) - 1.
 *  - Multi-byte integers are rebuilt from the byte arrays p->hs, p->hl
 *    and p->hq: index 0 most significant for the big-endian forms, index
 *    0 least significant for the little-endian forms, and byte order
 *    1,0,3,2 for the remaining 32-bit form.
 *  - An unknown type is reported through file_magerror().
 *
 * NOTE(review): some 32-bit assemblies shift p->hl[n] << 24 without a
 * cast while others cast each byte to uint32_t first.  Assuming hl[]
 * holds 8-bit values, the uncast form shifts a promoted int into its
 * sign bit; the cast form should probably be used throughout.
 */
774 mconvert(struct magic_set *ms, struct magic *m)
776 union VALUETYPE *p = &ms->ms_value;
796 case FILE_BESTRING16:
797 case FILE_LESTRING16: {
798 /* Null terminate and eat *trailing* return */
799 p->s[sizeof(p->s) - 1] = '\0';
803 char *ptr1 = p->s, *ptr2 = ptr1 + file_pstring_length_size(m);
804 size_t len = file_pstring_get_length(m, ptr1);
805 if (len >= sizeof(p->s))
806 len = sizeof(p->s) - 1;
813 p->h = (short)((p->hs[0]<<8)|(p->hs[1]));
820 ((p->hl[0]<<24)|(p->hl[1]<<16)|(p->hl[2]<<8)|(p->hl[3]));
827 (((uint64_t)p->hq[0]<<56)|((uint64_t)p->hq[1]<<48)|
828 ((uint64_t)p->hq[2]<<40)|((uint64_t)p->hq[3]<<32)|
829 ((uint64_t)p->hq[4]<<24)|((uint64_t)p->hq[5]<<16)|
830 ((uint64_t)p->hq[6]<<8)|((uint64_t)p->hq[7]));
834 p->h = (short)((p->hs[1]<<8)|(p->hs[0]));
841 ((p->hl[3]<<24)|(p->hl[2]<<16)|(p->hl[1]<<8)|(p->hl[0]));
848 (((uint64_t)p->hq[7]<<56)|((uint64_t)p->hq[6]<<48)|
849 ((uint64_t)p->hq[5]<<40)|((uint64_t)p->hq[4]<<32)|
850 ((uint64_t)p->hq[3]<<24)|((uint64_t)p->hq[2]<<16)|
851 ((uint64_t)p->hq[1]<<8)|((uint64_t)p->hq[0]));
858 ((p->hl[1]<<24)|(p->hl[0]<<16)|(p->hl[3]<<8)|(p->hl[2]));
865 p->l = ((uint32_t)p->hl[0]<<24)|((uint32_t)p->hl[1]<<16)|
866 ((uint32_t)p->hl[2]<<8) |((uint32_t)p->hl[3]);
870 p->l = ((uint32_t)p->hl[3]<<24)|((uint32_t)p->hl[2]<<16)|
871 ((uint32_t)p->hl[1]<<8) |((uint32_t)p->hl[0]);
878 p->q = ((uint64_t)p->hq[0]<<56)|((uint64_t)p->hq[1]<<48)|
879 ((uint64_t)p->hq[2]<<40)|((uint64_t)p->hq[3]<<32)|
880 ((uint64_t)p->hq[4]<<24)|((uint64_t)p->hq[5]<<16)|
881 ((uint64_t)p->hq[6]<<8) |((uint64_t)p->hq[7]);
885 p->q = ((uint64_t)p->hq[7]<<56)|((uint64_t)p->hq[6]<<48)|
886 ((uint64_t)p->hq[5]<<40)|((uint64_t)p->hq[4]<<32)|
887 ((uint64_t)p->hq[3]<<24)|((uint64_t)p->hq[2]<<16)|
888 ((uint64_t)p->hq[1]<<8) |((uint64_t)p->hq[0]);
896 file_magerror(ms, "invalid type %d in mconvert()", m->type);
/*
 * mdebug: debugging aid.  Writes "mget @<offset>: " to stderr, dumps
 * len bytes of str with file_showstr(), then emits two newlines.
 * NOTE(review): offset is uint32_t but is printed with %d; %u (or a
 * cast to int) would match the argument type.
 */
903 mdebug(uint32_t offset, const char *str, size_t len)
905 (void) fprintf(stderr, "mget @%d: ", offset);
906 file_showstr(stderr, str, len);
907 (void) fputc('\n', stderr);
908 (void) fputc('\n', stderr);
/*
 * mcopy: make the data at s + offset available for a test of `type`.
 *
 *  - Search data is not copied: ms->search.s is pointed at s + offset,
 *    with s_len = nbytes - offset and ms->search.offset = offset.
 *  - For the line-limited search region, buf is s + offset and the end
 *    is s + nbytes; the loop consumes up to linecnt line terminators
 *    (a newline, else a carriage return, found with memchr) to find
 *    `last`.  s_len, offset and rm_len (reset to 0) are then stored.
 *  - FILE_BESTRING16 / FILE_LESTRING16: bytes are taken from the source
 *    two at a time into p->s, bounded by esrc and edst; an offset that
 *    fails the pointer check is reported through file_magerror().
 *  - Everything else: p is zero-filled when offset >= nbytes; otherwise
 *    up to sizeof(*p) bytes are copied from s + offset and the rest of
 *    *p is zero-padded.
 *
 * NOTE(review): the search case computes nbytes - offset with no visible
 * guard that offset <= nbytes; since both are unsigned this would wrap.
 * NOTE(review): the b[0] / b[1] test reads b[1] after only b < end is
 * established by the loop; confirm b + 1 is inside the buffer.
 */
912 mcopy(struct magic_set *ms, union VALUETYPE *p, int type, int indir,
913 const unsigned char *s, uint32_t offset, size_t nbytes, size_t linecnt)
916 * Note: FILE_SEARCH and FILE_REGEX do not actually copy
917 * anything, but setup pointers into the source
922 ms->search.s = RCAST(const char *, s) + offset;
923 ms->search.s_len = nbytes - offset;
924 ms->search.offset = offset;
930 const char *last; /* end of search region */
931 const char *buf; /* start of search region */
936 ms->search.s_len = 0;
940 buf = RCAST(const char *, s) + offset;
941 end = last = RCAST(const char *, s) + nbytes;
942 /* mget() guarantees buf <= last */
943 for (lines = linecnt, b = buf; lines && b < end &&
944 ((b = CAST(const char *,
945 memchr(c = b, '\n', CAST(size_t, (end - b)))))
946 || (b = CAST(const char *,
947 memchr(c, '\r', CAST(size_t, (end - c))))));
950 if (b[0] == '\r' && b[1] == '\n')
954 last = RCAST(const char *, s) + nbytes;
957 ms->search.s_len = last - buf;
958 ms->search.offset = offset;
959 ms->search.rm_len = 0;
962 case FILE_BESTRING16:
963 case FILE_LESTRING16: {
964 const unsigned char *src = s + offset;
965 const unsigned char *esrc = s + nbytes;
967 char *edst = &p->s[sizeof(p->s) - 1];
969 if (type == FILE_BESTRING16)
972 /* check for pointer overflow */
974 file_magerror(ms, "invalid offset %u in mcopy()",
978 for (/*EMPTY*/; src < esrc; src += 2, dst++) {
984 if (type == FILE_BESTRING16 ?
993 case FILE_STRING: /* XXX - these two should not need */
994 case FILE_PSTRING: /* to copy anything, but do anyway. */
1000 if (offset >= nbytes) {
1001 (void)memset(p, '\0', sizeof(*p));
/* From here on nbytes is reused as the number of bytes to copy into *p. */
1004 if (nbytes - offset < sizeof(*p))
1005 nbytes = nbytes - offset;
1007 nbytes = sizeof(*p);
1009 (void)memcpy(p, s + offset, nbytes);
1012 * the usefulness of padding with zeroes eludes me, it
1013 * might even cause problems
1015 if (nbytes < sizeof(*p))
1016 (void)memset(((char *)(void *)p) + nbytes, '\0',
1017 sizeof(*p) - nbytes);
/*
 * mget: load the value that entry m refers to into ms->ms_value.
 *
 * Steps visible below:
 *  1. A recursion_level of 20 or more is rejected with
 *     "recursion nesting exceeded".
 *  2. mcopy() loads the data at ms->offset; with MAGIC_DEBUG the raw
 *     union is dumped by mdebug().
 *  3. For an indirect entry (m->flag & INDIR) the operand off starts as
 *     m->in_offset; with FILE_OPINDIRECT it is instead read from the
 *     buffer at s + offset + off, decoded according to m->in_type.
 *     The new offset is the value just loaded into p (decoded per
 *     m->in_type) combined with off by the operator in
 *     m->in_op & FILE_OPS_MASK, with a FILE_OPINVERSE test afterwards.
 *     One in_type variant then repacks the low 7 bits of each of the
 *     four bytes into a 28-bit number and adds 10.  INDIROFFADD adds the
 *     offset saved for the previous continuation level.  mcopy() is
 *     called again at the new offset and ms->offset is updated.
 *  4. OFFSET_OOB checks require 1, 2, 4, 8 or m->vallen bytes at offset,
 *     depending on the entry type.
 *  5. For the recursive case the description is printed (unless a
 *     MAGIC_MIME or MAGIC_APPLE bit is set) and file_softmagic() is run
 *     on s + offset with nbytes - offset bytes; recursion_level is
 *     passed as its level argument.
 *  6. mconvert() normalises the loaded value.
 *
 * NOTE(review): with FILE_OPINDIRECT, q = s + offset + off is read
 * without a bounds check visible here, and off comes from the magic
 * entry.  Confirm the range is validated before q is dereferenced.
 * NOTE(review): the divide and modulo arms use off as divisor with no
 * zero check visible here.
 * NOTE(review): ms->c.li[cont_level-1] is indexed when INDIROFFADD is
 * set; confirm cont_level cannot be 0 on that path.
 * NOTE(review): several byte assemblies shift a promoted int left by 24
 * before converting to int32_t; assuming the arrays hold 8-bit values,
 * casting each byte to uint32_t first would avoid shifting into the
 * sign bit.
 */
1022 mget(struct magic_set *ms, const unsigned char *s,
1023 struct magic *m, size_t nbytes, unsigned int cont_level, int text,
1024 int recursion_level)
1026 uint32_t offset = ms->offset;
1027 uint32_t count = m->str_range;
1028 union VALUETYPE *p = &ms->ms_value;
1030 if (recursion_level >= 20) {
1031 file_error(ms, 0, "recursion nesting exceeded");
1035 if (mcopy(ms, p, m->type, m->flag & INDIR, s, offset, nbytes, count) == -1)
1038 if ((ms->flags & MAGIC_DEBUG) != 0) {
1039 mdebug(offset, (char *)(void *)p, sizeof(union VALUETYPE));
1040 #ifndef COMPILE_ONLY
1045 if (m->flag & INDIR) {
1046 int off = m->in_offset;
1047 if (m->in_op & FILE_OPINDIRECT) {
1048 const union VALUETYPE *q = CAST(const union VALUETYPE *,
1049 ((const void *)(s + offset + off)));
1050 switch (m->in_type) {
1058 off = (short)((q->hs[0]<<8)|(q->hs[1]));
1061 off = (short)((q->hs[1]<<8)|(q->hs[0]));
1068 off = (int32_t)((q->hl[0]<<24)|(q->hl[1]<<16)|
1069 (q->hl[2]<<8)|(q->hl[3]));
1073 off = (int32_t)((q->hl[3]<<24)|(q->hl[2]<<16)|
1074 (q->hl[1]<<8)|(q->hl[0]));
1077 off = (int32_t)((q->hl[1]<<24)|(q->hl[0]<<16)|
1078 (q->hl[3]<<8)|(q->hl[2]));
1082 switch (m->in_type) {
1084 if (OFFSET_OOB(nbytes, offset, 1))
1087 switch (m->in_op & FILE_OPS_MASK) {
1089 offset = p->b & off;
1092 offset = p->b | off;
1095 offset = p->b ^ off;
1098 offset = p->b + off;
1101 offset = p->b - off;
1103 case FILE_OPMULTIPLY:
1104 offset = p->b * off;
1107 offset = p->b / off;
1110 offset = p->b % off;
1115 if (m->in_op & FILE_OPINVERSE)
1119 if (OFFSET_OOB(nbytes, offset, 2))
1122 switch (m->in_op & FILE_OPS_MASK) {
1124 offset = (short)((p->hs[0]<<8)|
1129 offset = (short)((p->hs[0]<<8)|
1134 offset = (short)((p->hs[0]<<8)|
1139 offset = (short)((p->hs[0]<<8)|
1144 offset = (short)((p->hs[0]<<8)|
1148 case FILE_OPMULTIPLY:
1149 offset = (short)((p->hs[0]<<8)|
1154 offset = (short)((p->hs[0]<<8)|
1159 offset = (short)((p->hs[0]<<8)|
1165 offset = (short)((p->hs[0]<<8)|
1167 if (m->in_op & FILE_OPINVERSE)
1171 if (OFFSET_OOB(nbytes, offset, 2))
1174 switch (m->in_op & FILE_OPS_MASK) {
1176 offset = (short)((p->hs[1]<<8)|
1181 offset = (short)((p->hs[1]<<8)|
1186 offset = (short)((p->hs[1]<<8)|
1191 offset = (short)((p->hs[1]<<8)|
1196 offset = (short)((p->hs[1]<<8)|
1200 case FILE_OPMULTIPLY:
1201 offset = (short)((p->hs[1]<<8)|
1206 offset = (short)((p->hs[1]<<8)|
1211 offset = (short)((p->hs[1]<<8)|
1217 offset = (short)((p->hs[1]<<8)|
1219 if (m->in_op & FILE_OPINVERSE)
1223 if (OFFSET_OOB(nbytes, offset, 2))
1226 switch (m->in_op & FILE_OPS_MASK) {
1228 offset = p->h & off;
1231 offset = p->h | off;
1234 offset = p->h ^ off;
1237 offset = p->h + off;
1240 offset = p->h - off;
1242 case FILE_OPMULTIPLY:
1243 offset = p->h * off;
1246 offset = p->h / off;
1249 offset = p->h % off;
1255 if (m->in_op & FILE_OPINVERSE)
1260 if (OFFSET_OOB(nbytes, offset, 4))
1263 switch (m->in_op & FILE_OPS_MASK) {
1265 offset = (int32_t)((p->hl[0]<<24)|
1272 offset = (int32_t)((p->hl[0]<<24)|
1279 offset = (int32_t)((p->hl[0]<<24)|
1286 offset = (int32_t)((p->hl[0]<<24)|
1293 offset = (int32_t)((p->hl[0]<<24)|
1299 case FILE_OPMULTIPLY:
1300 offset = (int32_t)((p->hl[0]<<24)|
1307 offset = (int32_t)((p->hl[0]<<24)|
1314 offset = (int32_t)((p->hl[0]<<24)|
1322 offset = (int32_t)((p->hl[0]<<24)|
1326 if (m->in_op & FILE_OPINVERSE)
1331 if (OFFSET_OOB(nbytes, offset, 4))
1334 switch (m->in_op & FILE_OPS_MASK) {
1336 offset = (int32_t)((p->hl[3]<<24)|
1343 offset = (int32_t)((p->hl[3]<<24)|
1350 offset = (int32_t)((p->hl[3]<<24)|
1357 offset = (int32_t)((p->hl[3]<<24)|
1364 offset = (int32_t)((p->hl[3]<<24)|
1370 case FILE_OPMULTIPLY:
1371 offset = (int32_t)((p->hl[3]<<24)|
1378 offset = (int32_t)((p->hl[3]<<24)|
1385 offset = (int32_t)((p->hl[3]<<24)|
1393 offset = (int32_t)((p->hl[3]<<24)|
1397 if (m->in_op & FILE_OPINVERSE)
1401 if (OFFSET_OOB(nbytes, offset, 4))
1404 switch (m->in_op & FILE_OPS_MASK) {
1406 offset = (int32_t)((p->hl[1]<<24)|
1413 offset = (int32_t)((p->hl[1]<<24)|
1420 offset = (int32_t)((p->hl[1]<<24)|
1427 offset = (int32_t)((p->hl[1]<<24)|
1434 offset = (int32_t)((p->hl[1]<<24)|
1440 case FILE_OPMULTIPLY:
1441 offset = (int32_t)((p->hl[1]<<24)|
1448 offset = (int32_t)((p->hl[1]<<24)|
1455 offset = (int32_t)((p->hl[1]<<24)|
1463 offset = (int32_t)((p->hl[1]<<24)|
1467 if (m->in_op & FILE_OPINVERSE)
1471 if (OFFSET_OOB(nbytes, offset, 4))
1474 switch (m->in_op & FILE_OPS_MASK) {
1476 offset = p->l & off;
1479 offset = p->l | off;
1482 offset = p->l ^ off;
1485 offset = p->l + off;
1488 offset = p->l - off;
1490 case FILE_OPMULTIPLY:
1491 offset = p->l * off;
1494 offset = p->l / off;
1497 offset = p->l % off;
1502 if (m->in_op & FILE_OPINVERSE)
1507 switch (m->in_type) {
/* Keep the low 7 bits of each of the four bytes, pack them into 28 bits, then add 10. */
1510 offset = ((((offset >> 0) & 0x7f) << 0) |
1511 (((offset >> 8) & 0x7f) << 7) |
1512 (((offset >> 16) & 0x7f) << 14) |
1513 (((offset >> 24) & 0x7f) << 21)) + 10;
1519 if (m->flag & INDIROFFADD) {
1520 offset += ms->c.li[cont_level-1].off;
1522 if (mcopy(ms, p, m->type, 0, s, offset, nbytes, count) == -1)
1524 ms->offset = offset;
1526 if ((ms->flags & MAGIC_DEBUG) != 0) {
1527 mdebug(offset, (char *)(void *)p,
1528 sizeof(union VALUETYPE));
1529 #ifndef COMPILE_ONLY
1535 /* Verify we have enough data to match magic type */
1538 if (OFFSET_OOB(nbytes, offset, 1))
1545 if (OFFSET_OOB(nbytes, offset, 2))
1564 if (OFFSET_OOB(nbytes, offset, 4))
1571 if (OFFSET_OOB(nbytes, offset, 8))
1578 if (OFFSET_OOB(nbytes, offset, m->vallen))
1583 if (nbytes < offset)
1590 if ((ms->flags & (MAGIC_MIME|MAGIC_APPLE)) == 0 &&
1591 file_printf(ms, "%s", m->desc) == -1)
1593 if (nbytes < offset)
1595 return file_softmagic(ms, s + offset, nbytes - offset,
1596 recursion_level, BINTEST, text);
1598 case FILE_DEFAULT: /* nothing to check */
1602 if (!mconvert(ms, m))
/*
 * file_strncmp: compare up to len bytes of s1 and s2 as unsigned
 * characters, honouring the STRING_* bits in flags.
 *
 * The difference is computed as *b - *a with a = s1 and b = s2, so the
 * sign of the result is that of (s2 - s1), the opposite of strncmp().
 * With flags == 0 a plain byte comparison is used.  Otherwise, per byte:
 *  - STRING_IGNORE_LOWERCASE compares tolower(*b) against *a;
 *  - STRING_IGNORE_UPPERCASE compares toupper(*b) against *a;
 *  - STRING_COMPACT_WHITESPACE and STRING_COMPACT_OPTIONAL_WHITESPACE
 *    select the whitespace-aware branches (isspace() on the s2 side);
 *  - anything else falls back to the plain byte difference.
 * NOTE(review): the extra condition on each flag test is not visible
 * here; confirm which side of the comparison it inspects.
 */
1608 file_strncmp(const char *s1, const char *s2, size_t len, uint32_t flags)
1611 * Convert the source args to unsigned here so that (1) the
1612 * compare will be unsigned as it is in strncmp() and (2) so
1613 * the ctype functions will work correctly without extra
1616 const unsigned char *a = (const unsigned char *)s1;
1617 const unsigned char *b = (const unsigned char *)s2;
1621 * What we want here is v = strncmp(s1, s2, len),
1622 * but ignoring any nulls.
1625 if (0L == flags) { /* normal string: do it fast */
1627 if ((v = *b++ - *a++) != '\0')
1630 else { /* combine the others */
1632 if ((flags & STRING_IGNORE_LOWERCASE) &&
1634 if ((v = tolower(*b++) - *a++) != '\0')
1637 else if ((flags & STRING_IGNORE_UPPERCASE) &&
1639 if ((v = toupper(*b++) - *a++) != '\0')
1642 else if ((flags & STRING_COMPACT_WHITESPACE) &&
1645 if (isspace(*b++)) {
1655 else if ((flags & STRING_COMPACT_OPTIONAL_WHITESPACE) &&
1662 if ((v = *b++ - *a++) != '\0')
/*
 * file_strncmp16: comparison entry point for the 16-bit string types.
 * It currently forwards all four arguments unchanged to file_strncmp(),
 * so the data is compared byte by byte.
 */
1671 file_strncmp16(const char *a, const char *b, size_t len, uint32_t flags)
1674 * XXX - The 16-bit string compare probably needs to be done
1675 * differently, especially if the flags are to be supported.
1676 * At the moment, I am unsure.
1679 return file_strncmp(a, b, len, flags);
/*
 * magiccheck: compare the value loaded into ms->ms_value (p) with the
 * expectation stored in entry m.  l starts out as m->value.q.
 *
 *  - String types: v = file_strncmp(m->value.s, p->s, m->vallen,
 *    m->str_flags); the 16-bit types go through file_strncmp16().
 *  - FILE_SEARCH: slen is m->vallen capped at sizeof(m->value.s).  idx
 *    runs from 0, bounded by m->str_range when that is non-zero, and the
 *    scan stops once slen + idx exceeds ms->search.s_len.  On a hit
 *    ms->search.offset is advanced by idx.
 *  - Regex: m->value.s is compiled with REG_EXTENDED|REG_NEWLINE (plus
 *    REG_ICASE for STRING_IGNORE_CASE) and executed over the range
 *    [0, ms->search.s_len) passed in pmatch[0] with REG_STARTEND.  Where
 *    REG_STARTEND is not defined it is defined as 0 and the last byte of
 *    the region is temporarily replaced by NUL, then restored.  On a
 *    match ms->search.s and ms->search.offset advance by rm_so and the
 *    match length rm_eo - rm_so is recorded.  regcomp()/regexec()
 *    failures are reported through file_magerror().
 *  - Numeric path: v is passed through file_signextend() and tested
 *    against l according to the relation: any value, !=, ==, > and <
 *    (unsigned when m->flag has UNSIGNED, otherwise as int64_t),
 *    (v & l) == l and (v & l) != l.  Each test prints a trace line to
 *    stderr under MAGIC_DEBUG.  An unknown relation or type is reported
 *    through file_magerror().
 *
 * NOTE(review): in the fallback without REG_STARTEND,
 * ms->search.s_len - 1 wraps when s_len is 0, and the write goes
 * through a pointer whose const qualifier was cast away.
 * NOTE(review): that fallback declares a local size_t l which shadows
 * the uint64_t l at the top of the function.
 */
1683 magiccheck(struct magic_set *ms, struct magic *m)
1685 uint64_t l = m->value.q;
1690 union VALUETYPE *p = &ms->ms_value;
1758 file_magerror(ms, "cannot happen with float: invalid relation `%c'",
1792 file_magerror(ms, "cannot happen with double: invalid relation `%c'", m->reln);
1805 v = file_strncmp(m->value.s, p->s, (size_t)m->vallen, m->str_flags);
1808 case FILE_BESTRING16:
1809 case FILE_LESTRING16:
1811 v = file_strncmp16(m->value.s, p->s, (size_t)m->vallen, m->str_flags);
1814 case FILE_SEARCH: { /* search ms->search.s for the string m->value.s */
1818 if (ms->search.s == NULL)
1821 slen = MIN(m->vallen, sizeof(m->value.s));
1825 for (idx = 0; m->str_range == 0 || idx < m->str_range; idx++) {
1826 if (slen + idx > ms->search.s_len)
1829 v = file_strncmp(m->value.s, ms->search.s + idx, slen, m->str_flags);
1830 if (v == 0) { /* found match */
1831 ms->search.offset += idx;
1842 if (ms->search.s == NULL)
1846 rc = regcomp(&rx, m->value.s,
1847 REG_EXTENDED|REG_NEWLINE|
1848 ((m->str_flags & STRING_IGNORE_CASE) ? REG_ICASE : 0));
1850 (void)regerror(rc, &rx, errmsg, sizeof(errmsg));
1851 file_magerror(ms, "regex error %d, (%s)",
1856 regmatch_t pmatch[1];
1857 #ifndef REG_STARTEND
1858 #define REG_STARTEND 0
1859 size_t l = ms->search.s_len - 1;
1860 char c = ms->search.s[l];
1861 ((char *)(intptr_t)ms->search.s)[l] = '\0';
1863 pmatch[0].rm_so = 0;
1864 pmatch[0].rm_eo = ms->search.s_len;
1866 rc = regexec(&rx, (const char *)ms->search.s,
1867 1, pmatch, REG_STARTEND);
1868 #if REG_STARTEND == 0
1869 ((char *)(intptr_t)ms->search.s)[l] = c;
1873 ms->search.s += (int)pmatch[0].rm_so;
1874 ms->search.offset += (size_t)pmatch[0].rm_so;
1876 (size_t)(pmatch[0].rm_eo - pmatch[0].rm_so);
1885 (void)regerror(rc, &rx, errmsg, sizeof(errmsg));
1886 file_magerror(ms, "regexec error %d, (%s)",
1893 if (v == (uint64_t)-1)
1900 file_magerror(ms, "invalid type %d in magiccheck()", m->type);
1904 v = file_signextend(ms, m, v);
1908 if ((ms->flags & MAGIC_DEBUG) != 0)
1909 (void) fprintf(stderr, "%" INT64_T_FORMAT
1910 "u == *any* = 1\n", (unsigned long long)v);
1916 if ((ms->flags & MAGIC_DEBUG) != 0)
1917 (void) fprintf(stderr, "%" INT64_T_FORMAT "u != %"
1918 INT64_T_FORMAT "u = %d\n", (unsigned long long)v,
1919 (unsigned long long)l, matched);
1924 if ((ms->flags & MAGIC_DEBUG) != 0)
1925 (void) fprintf(stderr, "%" INT64_T_FORMAT "u == %"
1926 INT64_T_FORMAT "u = %d\n", (unsigned long long)v,
1927 (unsigned long long)l, matched);
1931 if (m->flag & UNSIGNED) {
1933 if ((ms->flags & MAGIC_DEBUG) != 0)
1934 (void) fprintf(stderr, "%" INT64_T_FORMAT
1935 "u > %" INT64_T_FORMAT "u = %d\n",
1936 (unsigned long long)v,
1937 (unsigned long long)l, matched);
1940 matched = (int64_t) v > (int64_t) l;
1941 if ((ms->flags & MAGIC_DEBUG) != 0)
1942 (void) fprintf(stderr, "%" INT64_T_FORMAT
1943 "d > %" INT64_T_FORMAT "d = %d\n",
1944 (long long)v, (long long)l, matched);
1949 if (m->flag & UNSIGNED) {
1951 if ((ms->flags & MAGIC_DEBUG) != 0)
1952 (void) fprintf(stderr, "%" INT64_T_FORMAT
1953 "u < %" INT64_T_FORMAT "u = %d\n",
1954 (unsigned long long)v,
1955 (unsigned long long)l, matched);
1958 matched = (int64_t) v < (int64_t) l;
1959 if ((ms->flags & MAGIC_DEBUG) != 0)
1960 (void) fprintf(stderr, "%" INT64_T_FORMAT
1961 "d < %" INT64_T_FORMAT "d = %d\n",
1962 (long long)v, (long long)l, matched);
1967 matched = (v & l) == l;
1968 if ((ms->flags & MAGIC_DEBUG) != 0)
1969 (void) fprintf(stderr, "((%" INT64_T_FORMAT "x & %"
1970 INT64_T_FORMAT "x) == %" INT64_T_FORMAT
1971 "x) = %d\n", (unsigned long long)v,
1972 (unsigned long long)l, (unsigned long long)l,
1977 matched = (v & l) != l;
1978 if ((ms->flags & MAGIC_DEBUG) != 0)
1979 (void) fprintf(stderr, "((%" INT64_T_FORMAT "x & %"
1980 INT64_T_FORMAT "x) != %" INT64_T_FORMAT
1981 "x) = %d\n", (unsigned long long)v,
1982 (unsigned long long)l, (unsigned long long)l,
1988 file_magerror(ms, "cannot happen: invalid relation `%c'",
/*
 * handle_annotation: emit the annotation of entry m that matches the
 * output mode in ms->flags.  With MAGIC_APPLE set, at most 8 characters
 * of m->apple are printed; with MAGIC_MIME_TYPE set and a non-empty
 * m->mimetype, the MIME type is printed.  A file_printf() result of -1
 * is treated as failure in both cases.
 */
1997 handle_annotation(struct magic_set *ms, struct magic *m)
1999 if (ms->flags & MAGIC_APPLE) {
2000 if (file_printf(ms, "%.8s", m->apple) == -1)
2004 if ((ms->flags & MAGIC_MIME_TYPE) && m->mimetype[0]) {
2005 if (file_printf(ms, "%s", m->mimetype) == -1)
/*
 * print_sep: emit the separator between successive matches, which is a
 * newline followed by "- ".  The MAGIC_MIME test and the firstline
 * argument select paths that return before the separator is printed -
 * TODO confirm their return values.  Otherwise the file_printf() result
 * is returned.
 */
2013 print_sep(struct magic_set *ms, int firstline)
2015 if (ms->flags & MAGIC_MIME)
2020 * we found another match
2021 * put a newline and '-' to do some simple formatting
2023 return file_printf(ms, "\n- ");