1 /* 2 * Copyright (c) Ian F. Darwin 1986-1995. 3 * Software written by Ian F. Darwin and others; 4 * maintained 1995-present by Christos Zoulas and others. 5 * 6 * Redistribution and use in source and binary forms, with or without 7 * modification, are permitted provided that the following conditions 8 * are met: 9 * 1. Redistributions of source code must retain the above copyright 10 * notice immediately at the beginning of the file, without modification, 11 * this list of conditions, and the following disclaimer. 12 * 2. Redistributions in binary form must reproduce the above copyright 13 * notice, this list of conditions and the following disclaimer in the 14 * documentation and/or other materials provided with the distribution. 15 * 16 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND 17 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 18 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 19 * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE FOR 20 * ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 21 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 22 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 23 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 24 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 25 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 26 * SUCH DAMAGE. 27 */ 28 /* 29 * Names.h - names and types used by ascmagic in file(1). 30 * These tokens are here because they can appear anywhere in 31 * the first HOWMANY bytes, while tokens in MAGIC must 32 * appear at fixed offsets into the file. Don't make HOWMANY 33 * too high unless you have a very fast CPU. 34 * 35 * $File: names.h,v 1.32 2008/02/11 00:19:29 rrt Exp $ 36 */ 37 38 /* 39 modified by Chris Lowth - 9 April 2000 40 to add mime type strings to the types table. 41 */ 42 43 /* these types are used to index the table 'types': keep em in sync! */ 44 #define L_C 0 /* first and foremost on UNIX */ 45 #define L_CC 1 /* Bjarne's postincrement */ 46 #define L_MAKE 2 /* Makefiles */ 47 #define L_PLI 3 /* PL/1 */ 48 #define L_MACH 4 /* some kinda assembler */ 49 #define L_ENG 5 /* English */ 50 #define L_PAS 6 /* Pascal */ 51 #define L_MAIL 7 /* Electronic mail */ 52 #define L_NEWS 8 /* Usenet Netnews */ 53 #define L_JAVA 9 /* Java code */ 54 #define L_HTML 10 /* HTML */ 55 #define L_BCPL 11 /* BCPL */ 56 #define L_M4 12 /* M4 */ 57 #define L_PO 13 /* PO */ 58 59 static const struct { 60 char human[48]; 61 char mime[16]; 62 } types[] = { 63 { "C program", "text/x-c", }, 64 { "C++ program", "text/x-c++" }, 65 { "make commands", "text/x-makefile" }, 66 { "PL/1 program", "text/x-pl1" }, 67 { "assembler program", "text/x-asm" }, 68 { "English", "text/plain" }, 69 { "Pascal program", "text/x-pascal" }, 70 { "mail", "text/x-mail" }, 71 { "news", "text/x-news" }, 72 { "Java program", "text/x-java" }, 73 { "HTML document", "text/html", }, 74 { "BCPL program", "text/x-bcpl" }, 75 { "M4 macro language pre-processor", "text/x-m4" }, 76 { "PO (gettext message catalogue)", "text/x-po" }, 77 { "cannot happen error on names.h/types", "error/x-error" } 78 }; 79 80 /* 81 * XXX - how should we distinguish Java from C++? 82 * The trick used in a Debian snapshot, of having "extends" or "implements" 83 * as tags for Java, doesn't work very well, given that those keywords 84 * are often preceded by "class", which flags it as C++. 85 * 86 * Perhaps we need to be able to say 87 * 88 * If "class" then 89 * 90 * if "extends" or "implements" then 91 * Java 92 * else 93 * C++ 94 * endif 95 * 96 * Or should we use other keywords, such as "package" or "import"? 97 * Unfortunately, Ada95 uses "package", and Modula-3 uses "import", 98 * although I infer from the language spec at 99 * 100 * http://www.research.digital.com/SRC/m3defn/html/m3.html 101 * 102 * that Modula-3 uses "IMPORT" rather than "import", i.e. it must be 103 * in all caps. 104 * 105 * So, for now, we go with "import". We must put it before the C++ 106 * stuff, so that we don't misidentify Java as C++. Not using "package" 107 * means we won't identify stuff that defines a package but imports 108 * nothing; hopefully, very little Java code imports nothing (one of the 109 * reasons for doing OO programming is to import as much as possible 110 * and write only what you need to, right?). 111 * 112 * Unfortunately, "import" may cause us to misidentify English text 113 * as Java, as it comes after "the" and "The". Perhaps we need a fancier 114 * heuristic to identify Java? 115 */ 116 static const struct names { 117 char name[14]; 118 short type; 119 } names[] = { 120 /* These must be sorted by eye for optimal hit rate */ 121 /* Add to this list only after substantial meditation */ 122 {"msgid", L_PO}, 123 {"dnl", L_M4}, 124 {"import", L_JAVA}, 125 {"\"libhdr\"", L_BCPL}, 126 {"\"LIBHDR\"", L_BCPL}, 127 {"//", L_CC}, 128 {"template", L_CC}, 129 {"virtual", L_CC}, 130 {"class", L_CC}, 131 {"public:", L_CC}, 132 {"private:", L_CC}, 133 {"/*", L_C}, /* must precede "The", "the", etc. */ 134 {"#include", L_C}, 135 {"char", L_C}, 136 {"The", L_ENG}, 137 {"the", L_ENG}, 138 {"double", L_C}, 139 {"extern", L_C}, 140 {"float", L_C}, 141 {"struct", L_C}, 142 {"union", L_C}, 143 {"CFLAGS", L_MAKE}, 144 {"LDFLAGS", L_MAKE}, 145 {"all:", L_MAKE}, 146 {".PRECIOUS", L_MAKE}, 147 {".ascii", L_MACH}, 148 {".asciiz", L_MACH}, 149 {".byte", L_MACH}, 150 {".even", L_MACH}, 151 {".globl", L_MACH}, 152 {".text", L_MACH}, 153 {"clr", L_MACH}, 154 {"(input,", L_PAS}, 155 {"program", L_PAS}, 156 {"record", L_PAS}, 157 {"dcl", L_PLI}, 158 {"Received:", L_MAIL}, 159 {">From", L_MAIL}, 160 {"Return-Path:",L_MAIL}, 161 {"Cc:", L_MAIL}, 162 {"Newsgroups:", L_NEWS}, 163 {"Path:", L_NEWS}, 164 {"Organization:",L_NEWS}, 165 {"href=", L_HTML}, 166 {"HREF=", L_HTML}, 167 {"<body", L_HTML}, 168 {"<BODY", L_HTML}, 169 {"<html", L_HTML}, 170 {"<HTML", L_HTML}, 171 {"<!--", L_HTML}, 172 }; 173 #define NNAMES (sizeof(names)/sizeof(struct names)) 174