root/ext/fileinfo/libmagic/names.h

/* [<][>][^][v][top][bottom][index][help] */
   1 /*
   2  * Copyright (c) Ian F. Darwin 1986-1995.
   3  * Software written by Ian F. Darwin and others;
   4  * maintained 1995-present by Christos Zoulas and others.
   5  * 
   6  * Redistribution and use in source and binary forms, with or without
   7  * modification, are permitted provided that the following conditions
   8  * are met:
   9  * 1. Redistributions of source code must retain the above copyright
  10  *    notice immediately at the beginning of the file, without modification,
  11  *    this list of conditions, and the following disclaimer.
  12  * 2. Redistributions in binary form must reproduce the above copyright
  13  *    notice, this list of conditions and the following disclaimer in the
  14  *    documentation and/or other materials provided with the distribution.
  15  *  
  16  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
  17  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
  18  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  19  * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE FOR
  20  * ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
  21  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
  22  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
  23  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
  24  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
  25  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
  26  * SUCH DAMAGE.
  27  */
  28 /*
  29  * Names.h - names and types used by ascmagic in file(1).
  30  * These tokens are here because they can appear anywhere in
  31  * the first HOWMANY bytes, while tokens in MAGIC must
  32  * appear at fixed offsets into the file. Don't make HOWMANY
  33  * too high unless you have a very fast CPU.
  34  *
  35  * $File: names.h,v 1.32 2008/02/11 00:19:29 rrt Exp $
  36  */
  37 
  38 /*
  39         modified by Chris Lowth - 9 April 2000
  40         to add mime type strings to the types table.
  41 */
  42 
  43 /* these types are used to index the table 'types': keep em in sync! */
  44 #define L_C     0               /* first and foremost on UNIX */
  45 #define L_CC    1               /* Bjarne's postincrement */
  46 #define L_MAKE  2               /* Makefiles */
  47 #define L_PLI   3               /* PL/1 */
  48 #define L_MACH  4               /* some kinda assembler */
  49 #define L_ENG   5               /* English */
  50 #define L_PAS   6               /* Pascal */
  51 #define L_MAIL  7               /* Electronic mail */
  52 #define L_NEWS  8               /* Usenet Netnews */
  53 #define L_JAVA  9               /* Java code */
  54 #define L_HTML  10              /* HTML */
  55 #define L_BCPL  11              /* BCPL */
  56 #define L_M4    12              /* M4 */
  57 #define L_PO    13              /* PO */
  58 
  59 static const struct {
  60         char human[48];
  61         char mime[16];
  62 } types[] = {
  63         { "C program",                                  "text/x-c", },
  64         { "C++ program",                                "text/x-c++" },
  65         { "make commands",                              "text/x-makefile" },
  66         { "PL/1 program",                               "text/x-pl1" },
  67         { "assembler program",                          "text/x-asm" },
  68         { "English",                                    "text/plain" },
  69         { "Pascal program",                             "text/x-pascal" },
  70         { "mail",                                       "text/x-mail" },
  71         { "news",                                       "text/x-news" },
  72         { "Java program",                               "text/x-java" },
  73         { "HTML document",                              "text/html", },
  74         { "BCPL program",                               "text/x-bcpl" },
  75         { "M4 macro language pre-processor",            "text/x-m4" },
  76         { "PO (gettext message catalogue)",             "text/x-po" },
  77         { "cannot happen error on names.h/types",       "error/x-error" }
  78 };
  79 
  80 /*
  81  * XXX - how should we distinguish Java from C++?
  82  * The trick used in a Debian snapshot, of having "extends" or "implements"
  83  * as tags for Java, doesn't work very well, given that those keywords
  84  * are often preceded by "class", which flags it as C++.
  85  *
  86  * Perhaps we need to be able to say
  87  *
  88  *      If "class" then
  89  *
  90  *              if "extends" or "implements" then
  91  *                      Java
  92  *              else
  93  *                      C++
  94  *      endif
  95  *
  96  * Or should we use other keywords, such as "package" or "import"?
  97  * Unfortunately, Ada95 uses "package", and Modula-3 uses "import",
  98  * although I infer from the language spec at
  99  *
 100  *      http://www.research.digital.com/SRC/m3defn/html/m3.html
 101  *
 102  * that Modula-3 uses "IMPORT" rather than "import", i.e. it must be
 103  * in all caps.
 104  *
 105  * So, for now, we go with "import".  We must put it before the C++
 106  * stuff, so that we don't misidentify Java as C++.  Not using "package"
 107  * means we won't identify stuff that defines a package but imports
 108  * nothing; hopefully, very little Java code imports nothing (one of the
 109  * reasons for doing OO programming is to import as much as possible
 110  * and write only what you need to, right?).
 111  *
 112  * Unfortunately, "import" may cause us to misidentify English text
 113  * as Java, as it comes after "the" and "The".  Perhaps we need a fancier
 114  * heuristic to identify Java?
 115  */
 116 static const struct names {
 117         char name[14];
 118         short type;
 119 } names[] = {
 120         /* These must be sorted by eye for optimal hit rate */
 121         /* Add to this list only after substantial meditation */
 122         {"msgid",       L_PO},
 123         {"dnl",         L_M4},
 124         {"import",      L_JAVA},
 125         {"\"libhdr\"",  L_BCPL},
 126         {"\"LIBHDR\"",  L_BCPL},
 127         {"//",          L_CC},
 128         {"template",    L_CC},
 129         {"virtual",     L_CC},
 130         {"class",       L_CC},
 131         {"public:",     L_CC},
 132         {"private:",    L_CC},
 133         {"/*",          L_C},   /* must precede "The", "the", etc. */
 134         {"#include",    L_C},
 135         {"char",        L_C},
 136         {"The",         L_ENG},
 137         {"the",         L_ENG},
 138         {"double",      L_C},
 139         {"extern",      L_C},
 140         {"float",       L_C},
 141         {"struct",      L_C},
 142         {"union",       L_C},
 143         {"CFLAGS",      L_MAKE},
 144         {"LDFLAGS",     L_MAKE},
 145         {"all:",        L_MAKE},
 146         {".PRECIOUS",   L_MAKE},
 147         {".ascii",      L_MACH},
 148         {".asciiz",     L_MACH},
 149         {".byte",       L_MACH},
 150         {".even",       L_MACH},
 151         {".globl",      L_MACH},
 152         {".text",       L_MACH},
 153         {"clr",         L_MACH},
 154         {"(input,",     L_PAS},
 155         {"program",     L_PAS},
 156         {"record",      L_PAS},
 157         {"dcl",         L_PLI},
 158         {"Received:",   L_MAIL},
 159         {">From",       L_MAIL},
 160         {"Return-Path:",L_MAIL},
 161         {"Cc:",         L_MAIL},
 162         {"Newsgroups:", L_NEWS},
 163         {"Path:",       L_NEWS},
 164         {"Organization:",L_NEWS},
 165         {"href=",       L_HTML},
 166         {"HREF=",       L_HTML},
 167         {"<body",       L_HTML},
 168         {"<BODY",       L_HTML},
 169         {"<html",       L_HTML},
 170         {"<HTML",       L_HTML},
 171         {"<!--",        L_HTML},
 172 };
 173 #define NNAMES (sizeof(names)/sizeof(struct names))

/* [<][>][^][v][top][bottom][index][help] */