Update to file-4.19.
[dragonfly.git] / contrib / file-4 / src / names.h
CommitLineData
ab0b56cc
JS
1/*
2 * Copyright (c) Ian F. Darwin 1986-1995.
3 * Software written by Ian F. Darwin and others;
4 * maintained 1995-present by Christos Zoulas and others.
5 *
6 * Redistribution and use in source and binary forms, with or without
7 * modification, are permitted provided that the following conditions
8 * are met:
9 * 1. Redistributions of source code must retain the above copyright
10 * notice immediately at the beginning of the file, without modification,
11 * this list of conditions, and the following disclaimer.
12 * 2. Redistributions in binary form must reproduce the above copyright
13 * notice, this list of conditions and the following disclaimer in the
14 * documentation and/or other materials provided with the distribution.
15 *
16 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
17 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
18 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
19 * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE FOR
20 * ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
21 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
22 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
23 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
24 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
25 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
26 * SUCH DAMAGE.
27 */
28/*
29 * Names.h - names and types used by ascmagic in file(1).
30 * These tokens are here because they can appear anywhere in
31 * the first HOWMANY bytes, while tokens in MAGIC must
32 * appear at fixed offsets into the file. Don't make HOWMANY
33 * too high unless you have a very fast CPU.
34 *
35 * $Id: names.h,v 1.25 2004/09/11 19:15:57 christos Exp $
36 */
37
38/*
39 modified by Chris Lowth - 9 April 2000
40 to add mime type strings to the types table.
41*/
42
43/* these types are used to index the table 'types': keep em in sync! */
44#define L_C 0 /* first and foremost on UNIX */
45#define L_CC 1 /* Bjarne's postincrement */
46#define L_FORT 2 /* the oldest one */
47#define L_MAKE 3 /* Makefiles */
48#define L_PLI 4 /* PL/1 */
49#define L_MACH 5 /* some kinda assembler */
50#define L_ENG 6 /* English */
51#define L_PAS 7 /* Pascal */
52#define L_MAIL 8 /* Electronic mail */
53#define L_NEWS 9 /* Usenet Netnews */
54#define L_JAVA 10 /* Java code */
55#define L_HTML 11 /* HTML */
56#define L_BCPL 12 /* BCPL */
57#define L_M4 13 /* M4 */
58#define L_PO 14 /* PO */
59
60static const struct {
61 const char *human;
62 const char *mime;
63} types[] = {
64 { "C program", "text/x-c", },
65 { "C++ program", "text/x-c++" },
66 { "FORTRAN program", "text/x-fortran" },
67 { "make commands", "text/x-makefile" },
68 { "PL/1 program", "text/x-pl1" },
69 { "assembler program", "text/x-asm" },
70 { "English", "text/plain" },
71 { "Pascal program", "text/x-pascal" },
72 { "mail", "text/x-mail" },
73 { "news", "text/x-news" },
74 { "Java program", "text/x-java" },
75 { "HTML document", "text/html", },
76 { "BCPL program", "text/x-bcpl" },
77 { "M4 macro language pre-processor", "text/x-m4" },
78 { "PO (gettext message catalogue)", "text/x-po" },
79 { "cannot happen error on names.h/types", "error/x-error" },
80 { 0, 0}
81};
82
83/*
84 * XXX - how should we distinguish Java from C++?
85 * The trick used in a Debian snapshot, of having "extends" or "implements"
86 * as tags for Java, doesn't work very well, given that those keywords
87 * are often preceded by "class", which flags it as C++.
88 *
89 * Perhaps we need to be able to say
90 *
91 * If "class" then
92 *
93 * if "extends" or "implements" then
94 * Java
95 * else
96 * C++
97 * endif
98 *
99 * Or should we use other keywords, such as "package" or "import"?
100 * Unfortunately, Ada95 uses "package", and Modula-3 uses "import",
101 * although I infer from the language spec at
102 *
103 * http://www.research.digital.com/SRC/m3defn/html/m3.html
104 *
105 * that Modula-3 uses "IMPORT" rather than "import", i.e. it must be
106 * in all caps.
107 *
108 * So, for now, we go with "import". We must put it before the C++
109 * stuff, so that we don't misidentify Java as C++. Not using "package"
110 * means we won't identify stuff that defines a package but imports
111 * nothing; hopefully, very little Java code imports nothing (one of the
112 * reasons for doing OO programming is to import as much as possible
113 * and write only what you need to, right?).
114 *
115 * Unfortunately, "import" may cause us to misidentify English text
116 * as Java, as it comes after "the" and "The". Perhaps we need a fancier
117 * heuristic to identify Java?
118 */
119static struct names {
120 const char *name;
121 short type;
122} names[] = {
123 /* These must be sorted by eye for optimal hit rate */
124 /* Add to this list only after substantial meditation */
125 {"msgid", L_PO},
126 {"dnl", L_M4},
127 {"import", L_JAVA},
128 {"\"libhdr\"", L_BCPL},
129 {"\"LIBHDR\"", L_BCPL},
130 {"//", L_CC},
131 {"template", L_CC},
132 {"virtual", L_CC},
133 {"class", L_CC},
134 {"public:", L_CC},
135 {"private:", L_CC},
136 {"/*", L_C}, /* must precede "The", "the", etc. */
137 {"#include", L_C},
138 {"char", L_C},
139 {"The", L_ENG},
140 {"the", L_ENG},
141 {"double", L_C},
142 {"extern", L_C},
143 {"float", L_C},
144 {"struct", L_C},
145 {"union", L_C},
146 {"CFLAGS", L_MAKE},
147 {"LDFLAGS", L_MAKE},
148 {"all:", L_MAKE},
149 {".PRECIOUS", L_MAKE},
150/* Too many files of text have these words in them. Find another way
151 * to recognize Fortrash.
152 */
153#ifdef NOTDEF
154 {"subroutine", L_FORT},
155 {"function", L_FORT},
156 {"block", L_FORT},
157 {"common", L_FORT},
158 {"dimension", L_FORT},
159 {"integer", L_FORT},
160 {"data", L_FORT},
161#endif /*NOTDEF*/
162 {".ascii", L_MACH},
163 {".asciiz", L_MACH},
164 {".byte", L_MACH},
165 {".even", L_MACH},
166 {".globl", L_MACH},
167 {".text", L_MACH},
168 {"clr", L_MACH},
169 {"(input,", L_PAS},
170 {"dcl", L_PLI},
171 {"Received:", L_MAIL},
172 {">From", L_MAIL},
173 {"Return-Path:",L_MAIL},
174 {"Cc:", L_MAIL},
175 {"Newsgroups:", L_NEWS},
176 {"Path:", L_NEWS},
177 {"Organization:",L_NEWS},
178 {"href=", L_HTML},
179 {"HREF=", L_HTML},
180 {"<body", L_HTML},
181 {"<BODY", L_HTML},
182 {"<html", L_HTML},
183 {"<HTML", L_HTML},
184 {NULL, 0}
185};
186#define NNAMES ((sizeof(names)/sizeof(struct names)) - 1)