/* * Copyright (c) Ian F. Darwin 1986-1995. * Software written by Ian F. Darwin and others; * maintained 1995-present by Christos Zoulas and others. * * Redistribution and use in source and binary forms, with or without * modification, are permitted provided that the following conditions * are met: * 1. Redistributions of source code must retain the above copyright * notice immediately at the beginning of the file, without modification, * this list of conditions, and the following disclaimer. * 2. Redistributions in binary form must reproduce the above copyright * notice, this list of conditions and the following disclaimer in the * documentation and/or other materials provided with the distribution. * * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE FOR * ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF * SUCH DAMAGE. */ /* * file - find type of a file or files - main program. */ #include "file.h" #include "magic.h" #include #include #include #include #include #include /* for MAXPATHLEN */ #include #include /* for open() */ #ifdef RESTORE_TIME # if (__COHERENT__ >= 0x420) # include # else # ifdef USE_UTIMES # include # else # include # endif # endif #endif #ifdef HAVE_UNISTD_H #include /* for read() */ #endif #ifdef HAVE_LOCALE_H #include #endif #ifdef HAVE_WCHAR_H #include #endif #ifdef HAVE_GETOPT_H #include /* for long options (is this portable?)*/ #else #undef HAVE_GETOPT_LONG #endif #include /* for byte swapping */ #include "patchlevel.h" #ifndef lint FILE_RCSID("@(#)$Id: file.c,v 1.95 2004/09/27 15:28:37 christos Exp $") #endif /* lint */ #ifdef S_IFLNK #define SYMLINKFLAG "L" #else #define SYMLINKFLAG "" #endif # define USAGE "Usage: %s [-bcik" SYMLINKFLAG "nNsvz] [-f namefile] [-F separator] [-m magicfiles] file...\n %s -C -m magicfiles\n" #ifndef MAXPATHLEN #define MAXPATHLEN 512 #endif /*@unchecked@*/ private int /* Global command-line options */ bflag = 0, /* brief output format */ nopad = 0, /* Don't pad output */ nobuffer = 0; /* Do not buffer stdout */ /*@unchecked@*/ /*@observer@*/ /*@relnull@*/ private const char *magicfile = 0; /* where the magic is */ /*@unchecked@*/ /*@observer@*/ private const char *default_magicfile = MAGIC; /*@unchecked@*/ /*@observer@*/ private char *separator = ":"; /* Default field separator */ /*@unchecked@*/ /*@null@*/ private char *progname; /* used throughout */ /*@unchecked@*/ /*@only@*/ /*@null@*/ private struct magic_set *magic; private void unwrap(char *fn) /*@globals fileSystem, internalState @*/ /*@modifies fileSystem, internalState @*/; private void usage(void) /*@globals fileSystem @*/ /*@modifies fileSystem @*/; #ifdef HAVE_GETOPT_LONG private void help(void) /*@globals fileSystem @*/ /*@modifies fileSystem @*/; #endif #if 0 private int byteconv4(int, int, int) /*@*/; private short byteconv2(int, int, int) /*@*/; #endif private void process(const char *inname, int wid) /*@globals magic, fileSystem, internalState @*/ /*@modifies magic, fileSystem, internalState @*/; private void load(const char *m, int flags) /*@globals magic, fileSystem, internalState @*/ /*@modifies magic, fileSystem, internalState @*/; /* * main - parse arguments and handle options */ int main(int argc, char *argv[]) /*@globals bflag, default_magicfile, magic, magicfile, nobuffer, nopad, optind, progname, separator, fileSystem, internalState @*/ /*@modifies argv, bflag, default_magicfile, magic, magicfile, nobuffer, nopad, optind, progname, separator, fileSystem, internalState @*/ { int c; int action = 0, didsomefiles = 0, errflg = 0; int flags = 0; char *home, *usermagic; struct stat sb; #define OPTSTRING "bcCdf:F:ikLm:nNprsvz" #ifdef HAVE_GETOPT_LONG int longindex; /*@observer@*/ /*@-nullassign -readonlytrans@*/ private struct option long_options[] = { {"version", 0, 0, 'v'}, {"help", 0, 0, 0}, {"brief", 0, 0, 'b'}, {"checking-printout", 0, 0, 'c'}, {"debug", 0, 0, 'd'}, {"files-from", 1, 0, 'f'}, {"separator", 1, 0, 'F'}, {"mime", 0, 0, 'i'}, {"keep-going", 0, 0, 'k'}, #ifdef S_IFLNK {"dereference", 0, 0, 'L'}, #endif {"magic-file", 1, 0, 'm'}, #if defined(HAVE_UTIME) || defined(HAVE_UTIMES) {"preserve-date", 0, 0, 'p'}, #endif {"uncompress", 0, 0, 'z'}, {"raw", 0, 0, 'r'}, {"no-buffer", 0, 0, 'n'}, {"no-pad", 0, 0, 'N'}, {"special-files", 0, 0, 's'}, {"compile", 0, 0, 'C'}, {0, 0, 0, 0}, }; /*@=nullassign =readonlytrans@*/ #endif #ifdef LC_CTYPE setlocale(LC_CTYPE, ""); /* makes islower etc work for other langs */ #endif #ifdef __EMX__ /* sh-like wildcard expansion! Shouldn't hurt at least ... */ _wildcard(&argc, &argv); #endif if ((progname = strrchr(argv[0], '/')) != NULL) progname++; else progname = argv[0]; magicfile = default_magicfile; if ((usermagic = getenv("MAGIC")) != NULL) magicfile = usermagic; else if ((home = getenv("HOME")) != NULL) { if ((usermagic = malloc(strlen(home) + 8)) != NULL) { (void)strcpy(usermagic, home); (void)strcat(usermagic, "/.magic"); if (stat(usermagic, &sb)<0) free(usermagic); else magicfile = usermagic; } } /*@-moduncon@*/ #ifndef HAVE_GETOPT_LONG while ((c = getopt(argc, argv, OPTSTRING)) != -1) #else while ((c = getopt_long(argc, argv, OPTSTRING, long_options, &longindex)) != -1) #endif /*@=moduncon@*/ switch (c) { #ifdef HAVE_GETOPT_LONG case 0 : if (longindex == 1) help(); /*@switchbreak@*/ break; #endif case 'b': ++bflag; /*@switchbreak@*/ break; case 'c': action = FILE_CHECK; /*@switchbreak@*/ break; case 'C': action = FILE_COMPILE; /*@switchbreak@*/ break; case 'd': flags |= MAGIC_DEBUG|MAGIC_CHECK; /*@switchbreak@*/ break; case 'f': if(action) usage(); load(magicfile, flags); unwrap(optarg); ++didsomefiles; /*@switchbreak@*/ break; case 'F': separator = optarg; /*@switchbreak@*/ break; case 'i': flags |= MAGIC_MIME; /*@switchbreak@*/ break; case 'k': flags |= MAGIC_CONTINUE; /*@switchbreak@*/ break; case 'm': magicfile = optarg; /*@switchbreak@*/ break; case 'n': ++nobuffer; /*@switchbreak@*/ break; case 'N': ++nopad; /*@switchbreak@*/ break; #if defined(HAVE_UTIME) || defined(HAVE_UTIMES) case 'p': flags |= MAGIC_PRESERVE_ATIME; /*@switchbreak@*/ break; #endif case 'r': flags |= MAGIC_RAW; /*@switchbreak@*/ break; case 's': flags |= MAGIC_DEVICES; /*@switchbreak@*/ break; case 'v': (void) fprintf(stdout, "%s-%d.%.2d\n", progname, FILE_VERSION_MAJOR, patchlevel); (void) fprintf(stdout, "magic file from %s\n", magicfile); return 1; case 'z': flags |= MAGIC_COMPRESS; /*@switchbreak@*/ break; #ifdef S_IFLNK case 'L': flags |= MAGIC_SYMLINK; /*@switchbreak@*/ break; #endif case '?': default: errflg++; /*@switchbreak@*/ break; } if (errflg) { usage(); } switch(action) { case FILE_CHECK: case FILE_COMPILE: magic = magic_open(flags|MAGIC_CHECK); if (magic == NULL) { (void)fprintf(stderr, "%s: %s\n", progname, strerror(errno)); return 1; } c = action == FILE_CHECK ? magic_check(magic, magicfile) : magic_compile(magic, magicfile); if (c == -1) { (void)fprintf(stderr, "%s: %s\n", progname, magic_error(magic)); return -1; } return 0; default: load(magicfile, flags); break; } if (optind == argc) { if (!didsomefiles) { usage(); } } else { int i, wid, nw; for (wid = 0, i = optind; i < argc; i++) { nw = file_mbswidth(argv[i]); if (nw > wid) wid = nw; } for (; optind < argc; optind++) process(argv[optind], wid); } magic_close(magic); magic = NULL; return 0; } private void load(/*@unused@*/ const char *m, int flags) { if (magic) return; magic = magic_open(flags); if (magic == NULL) { (void)fprintf(stderr, "%s: %s\n", progname, strerror(errno)); exit(EXIT_FAILURE); } if (magic_load(magic, magicfile) == -1) { (void)fprintf(stderr, "%s: %s\n", progname, magic_error(magic)); exit(EXIT_FAILURE); } } /* * unwrap -- read a file of filenames, do each one. */ private void unwrap(char *fn) { char buf[MAXPATHLEN]; FILE *f; int wid = 0, cwid; if (strcmp("-", fn) == 0) { f = stdin; wid = 1; } else { if ((f = fopen(fn, "r")) == NULL) { (void)fprintf(stderr, "%s: Cannot open `%s' (%s).\n", progname, fn, strerror(errno)); exit(EXIT_FAILURE); } while (fgets(buf, MAXPATHLEN, f) != NULL) { cwid = file_mbswidth(buf) - 1; if (cwid > wid) wid = cwid; } rewind(f); } while (fgets(buf, MAXPATHLEN, f) != NULL) { // cut off CR, we _need_ bytes here, not characters buf[strlen(buf)-1] = '\0'; process(buf, wid); if(nobuffer) (void) fflush(stdout); } (void) fclose(f); } private void process(const char *inname, int wid) { const char *type; int std_in = strcmp(inname, "-") == 0; if (wid > 0 && !bflag) (void) printf("%s%s%*s ", std_in ? "/dev/stdin" : inname, separator, (int) (nopad ? 0 : (wid - file_mbswidth(inname))), ""); type = magic_file(magic, std_in ? NULL : inname); if (type == NULL) printf("ERROR: %s\n", magic_error(magic)); else printf("%s\n", type); } #if 0 /* * byteconv4 * Input: * from 4 byte quantity to convert * same whether to perform byte swapping * big_endian whether we are a big endian host */ private int byteconv4(int from, int same, int big_endian) { if (same) return from; else if (big_endian) { /* lsb -> msb conversion on msb */ union { int i; char c[4]; } retval, tmpval; tmpval.i = from; retval.c[0] = tmpval.c[3]; retval.c[1] = tmpval.c[2]; retval.c[2] = tmpval.c[1]; retval.c[3] = tmpval.c[0]; return retval.i; } else return ntohl(from); /* msb -> lsb conversion on lsb */ } /* * byteconv2 * Same as byteconv4, but for shorts */ private short byteconv2(int from, int same, int big_endian) { if (same) return from; else if (big_endian) { /* lsb -> msb conversion on msb */ union { short s; char c[2]; } retval, tmpval; tmpval.s = (short) from; retval.c[0] = tmpval.c[1]; retval.c[1] = tmpval.c[0]; return retval.s; } else return ntohs(from); /* msb -> lsb conversion on lsb */ } #endif size_t file_mbswidth(const char *s) { #if defined(HAVE_WCHAR_H) && defined(HAVE_MBRTOWC) && defined(HAVE_WCWIDTH) size_t bytesconsumed, old_n, n, width = 0; mbstate_t state; wchar_t nextchar; (void)memset(&state, 0, sizeof(mbstate_t)); old_n = n = strlen(s); while (n > 0) { bytesconsumed = mbrtowc(&nextchar, s, n, &state); if (bytesconsumed == (size_t)(-1) || bytesconsumed == (size_t)(-2)) { /* Something went wrong, return something reasonable */ return old_n; } if (s[0] == '\n') { /* * do what strlen() would do, so that caller * is always right */ width++; } else width += wcwidth(nextchar); s += bytesconsumed, n -= bytesconsumed; } return width; #else return strlen(s); #endif } private void usage(void) { (void)fprintf(stderr, USAGE, progname, progname); #ifdef HAVE_GETOPT_LONG (void)fputs("Try `file --help' for more information.\n", stderr); #endif exit(EXIT_FAILURE); } #ifdef HAVE_GETOPT_LONG private void help(void) { puts( "Usage: file [OPTION]... [FILE]...\n" "Determine file type of FILEs.\n" "\n" " -m, --magic-file LIST use LIST as a colon-separated list of magic\n" " number files\n" " -z, --uncompress try to look inside compressed files\n" " -b, --brief do not prepend filenames to output lines\n" " -c, --checking-printout print the parsed form of the magic file, use in\n" " conjunction with -m to debug a new magic file\n" " before installing it\n" " -f, --files-from FILE read the filenames to be examined from FILE\n" " -F, --separator string use string as separator instead of `:'\n" " -i, --mime output mime type strings\n" " -k, --keep-going don't stop at the first match\n" " -L, --dereference causes symlinks to be followed\n" " -n, --no-buffer do not buffer output\n" " -N, --no-pad do not pad output\n" " -p, --preserve-date preserve access times on files\n" " -r, --raw don't translate unprintable chars to \\ooo\n" " -s, --special-files treat special (block/char devices) files as\n" " ordinary ones\n" " --help display this help and exit\n" " --version output version information and exit\n" ); exit(EXIT_SUCCESS); } #endif