content-bozo.c revision 1.17
1/*	$NetBSD: content-bozo.c,v 1.17 2020/09/12 12:39:28 rhialto Exp $	*/
2
3/*	$eterna: content-bozo.c,v 1.17 2011/11/18 09:21:15 mrg Exp $	*/
4
5/*
6 * Copyright (c) 1997-2018 Matthew R. Green
7 * All rights reserved.
8 *
9 * Redistribution and use in source and binary forms, with or without
10 * modification, are permitted provided that the following conditions
11 * are met:
12 * 1. Redistributions of source code must retain the above copyright
13 *    notice, this list of conditions and the following disclaimer.
14 * 2. Redistributions in binary form must reproduce the above copyright
15 *    notice, this list of conditions and the following disclaimer and
16 *    dedication in the documentation and/or other materials provided
17 *    with the distribution.
18 *
19 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
20 * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
21 * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
22 * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
23 * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING,
24 * BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
25 * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED
26 * AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
27 * OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
28 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
29 * SUCH DAMAGE.
30 *
31 */
32
33/* this code implements content-type handling for bozohttpd */
34
35#include <sys/param.h>
36
37#include <errno.h>
38#include <string.h>
39
40#include "bozohttpd.h"
41
42/*
43 * this map and the functions below map between filenames and the
44 * content type and content encoding definitions.  this should become
45 * a configuration file, perhaps like apache's mime.types (but that
46 * has less info per-entry).
47 */
48
49static bozo_content_map_t static_content_map[] = {
50	{ ".html",	"text/html",			"",		"", NULL },
51	{ ".htm",	"text/html",			"",		"", NULL },
52	{ ".gif",	"image/gif",			"",		"", NULL },
53	{ ".jpeg",	"image/jpeg",			"",		"", NULL },
54	{ ".jpg",	"image/jpeg",			"",		"", NULL },
55	{ ".jpe",	"image/jpeg",			"",		"", NULL },
56	{ ".png",	"image/png",			"",		"", NULL },
57	{ ".mp3",	"audio/mpeg",			"",		"", NULL },
58	{ ".css",	"text/css",			"",		"", NULL },
59	{ ".txt",	"text/plain",			"",		"", NULL },
60	{ ".swf",	"application/x-shockwave-flash","",		"", NULL },
61	{ ".dcr",	"application/x-director",	"",		"", NULL },
62	{ ".pac",	"application/x-ns-proxy-autoconfig", "",	"", NULL },
63	{ ".pa",	"application/x-ns-proxy-autoconfig", "",	"", NULL },
64	{ ".tar",	"multipart/x-tar",		"",		"", NULL },
65	{ ".gtar",	"application/x-gtar-compressed", "",		"", NULL },
66	{ ".tar.Z",	"application/x-gtar-compressed", "",		"", NULL },
67	{ ".tar.gz",	"application/x-gtar-compressed", "",		"", NULL },
68	{ ".taz",	"application/x-gtar-compressed", "",		"", NULL },
69	{ ".tgz",	"application/x-gtar-compressed", "",		"", NULL },
70	{ ".tar.z",	"application/x-gtar-compressed", "",		"", NULL },
71	{ ".Z",		"application/x-compress",	"",		"", NULL },
72	{ ".gz",	"application/x-gzip",		"",		"", NULL },
73	{ ".z",		"unknown",			"",		"", NULL },
74	{ ".bz2",	"application/x-bzip2",		"",		"", NULL },
75	{ ".ogg",	"application/x-ogg",		"",		"", NULL },
76	{ ".mkv",	"video/x-matroska",		"",		"", NULL },
77	{ ".xbel",	"text/xml",			"",		"", NULL },
78	{ ".xml",	"text/xml",			"",		"", NULL },
79	{ ".xsl",	"text/xml",			"",		"", NULL },
80	{ ".hqx",	"application/mac-binhex40",	"",		"", NULL },
81	{ ".cpt",	"application/mac-compactpro",	"",		"", NULL },
82	{ ".doc",	"application/msword",		"",		"", NULL },
83	{ ".bin",	"application/octet-stream",	"",		"", NULL },
84	{ ".dms",	"application/octet-stream",	"",		"", NULL },
85	{ ".lha",	"application/octet-stream",	"",		"", NULL },
86	{ ".lzh",	"application/octet-stream",	"",		"", NULL },
87	{ ".exe",	"application/octet-stream",	"",		"", NULL },
88	{ ".class",	"application/octet-stream",	"",		"", NULL },
89	{ ".oda",	"application/oda",		"",		"", NULL },
90	{ ".pdf",	"application/pdf",		"",		"", NULL },
91	{ ".ai",	"application/postscript",	"",		"", NULL },
92	{ ".eps",	"application/postscript",	"",		"", NULL },
93	{ ".ps",	"application/postscript",	"",		"", NULL },
94	{ ".ppt",	"application/powerpoint",	"",		"", NULL },
95	{ ".rtf",	"application/rtf",		"",		"", NULL },
96	{ ".bcpio",	"application/x-bcpio",		"",		"", NULL },
97	{ ".torrent",	"application/x-bittorrent",	"",		"", NULL },
98	{ ".vcd",	"application/x-cdlink",		"",		"", NULL },
99	{ ".cpio",	"application/x-cpio",		"",		"", NULL },
100	{ ".csh",	"application/x-csh",		"",		"", NULL },
101	{ ".dir",	"application/x-director",	"",		"", NULL },
102	{ ".dxr",	"application/x-director",	"",		"", NULL },
103	{ ".dvi",	"application/x-dvi",		"",		"", NULL },
104	{ ".hdf",	"application/x-hdf",		"",		"", NULL },
105	{ ".cgi",	"application/x-httpd-cgi",	"",		"", NULL },
106	{ ".skp",	"application/x-koan",		"",		"", NULL },
107	{ ".skd",	"application/x-koan",		"",		"", NULL },
108	{ ".skt",	"application/x-koan",		"",		"", NULL },
109	{ ".skm",	"application/x-koan",		"",		"", NULL },
110	{ ".latex",	"application/x-latex",		"",		"", NULL },
111	{ ".mif",	"application/x-mif",		"",		"", NULL },
112	{ ".nc",	"application/x-netcdf",		"",		"", NULL },
113	{ ".cdf",	"application/x-netcdf",		"",		"", NULL },
114	{ ".patch",	"application/x-patch",		"",		"", NULL },
115	{ ".sh",	"application/x-sh",		"",		"", NULL },
116	{ ".shar",	"application/x-shar",		"",		"", NULL },
117	{ ".sit",	"application/x-stuffit",	"",		"", NULL },
118	{ ".sv4cpio",	"application/x-sv4cpio",	"",		"", NULL },
119	{ ".sv4crc",	"application/x-sv4crc",		"",		"", NULL },
120	{ ".tar",	"application/x-tar",		"",		"", NULL },
121	{ ".tcl",	"application/x-tcl",		"",		"", NULL },
122	{ ".tex",	"application/x-tex",		"",		"", NULL },
123	{ ".texinfo",	"application/x-texinfo",	"",		"", NULL },
124	{ ".texi",	"application/x-texinfo",	"",		"", NULL },
125	{ ".t",		"application/x-troff",		"",		"", NULL },
126	{ ".tr",	"application/x-troff",		"",		"", NULL },
127	{ ".roff",	"application/x-troff",		"",		"", NULL },
128	{ ".man",	"application/x-troff-man",	"",		"", NULL },
129	{ ".me",	"application/x-troff-me",	"",		"", NULL },
130	{ ".ms",	"application/x-troff-ms",	"",		"", NULL },
131	{ ".ustar",	"application/x-ustar",		"",		"", NULL },
132	{ ".src",	"application/x-wais-source",	"",		"", NULL },
133	{ ".zip",	"application/zip",		"",		"", NULL },
134	{ ".au",	"audio/basic",			"",		"", NULL },
135	{ ".snd",	"audio/basic",			"",		"", NULL },
136	{ ".mpga",	"audio/mpeg",			"",		"", NULL },
137	{ ".mp2",	"audio/mpeg",			"",		"", NULL },
138	{ ".m4a",	"audio/mpeg",			"",		"", NULL },
139	{ ".aif",	"audio/x-aiff",			"",		"", NULL },
140	{ ".aiff",	"audio/x-aiff",			"",		"", NULL },
141	{ ".aifc",	"audio/x-aiff",			"",		"", NULL },
142	{ ".ram",	"audio/x-pn-realaudio",		"",		"", NULL },
143	{ ".rpm",	"audio/x-pn-realaudio-plugin",	"",		"", NULL },
144	{ ".ra",	"audio/x-realaudio",		"",		"", NULL },
145	{ ".wav",	"audio/x-wav",			"",		"", NULL },
146	{ ".pdb",	"chemical/x-pdb",		"",		"", NULL },
147	{ ".xyz",	"chemical/x-pdb",		"",		"", NULL },
148	{ ".ief",	"image/ief",			"",		"", NULL },
149	{ ".tiff",	"image/tiff",			"",		"", NULL },
150	{ ".tif",	"image/tiff",			"",		"", NULL },
151	{ ".ras",	"image/x-cmu-raster",		"",		"", NULL },
152	{ ".pnm",	"image/x-portable-anymap",	"",		"", NULL },
153	{ ".pbm",	"image/x-portable-bitmap",	"",		"", NULL },
154	{ ".pgm",	"image/x-portable-graymap",	"",		"", NULL },
155	{ ".ppm",	"image/x-portable-pixmap",	"",		"", NULL },
156	{ ".rgb",	"image/x-rgb",			"",		"", NULL },
157	{ ".xbm",	"image/x-xbitmap",		"",		"", NULL },
158	{ ".xpm",	"image/x-xpixmap",		"",		"", NULL },
159	{ ".xwd",	"image/x-xwindowdump",		"",		"", NULL },
160	{ ".rtx",	"text/richtext",		"",		"", NULL },
161	{ ".tsv",	"text/tab-separated-values",	"",		"", NULL },
162	{ ".etx",	"text/x-setext",		"",		"", NULL },
163	{ ".sgml",	"text/x-sgml",			"",		"", NULL },
164	{ ".sgm",	"text/x-sgml",			"",		"", NULL },
165	{ ".mpeg",	"video/mpeg",			"",		"", NULL },
166	{ ".mpg",	"video/mpeg",			"",		"", NULL },
167	{ ".mpe",	"video/mpeg",			"",		"", NULL },
168	{ ".ts",	"video/mpeg",			"",		"", NULL },
169	{ ".vob",	"video/mpeg",			"",		"", NULL },
170	{ ".mp4",	"video/mp4",			"",		"", NULL },
171	{ ".m4v",	"video/mp4",			"",		"", NULL },
172	{ ".qt",	"video/quicktime",		"",		"", NULL },
173	{ ".mov",	"video/quicktime",		"",		"", NULL },
174	{ ".avi",	"video/x-msvideo",		"",		"", NULL },
175	{ ".movie",	"video/x-sgi-movie",		"",		"", NULL },
176	{ ".ice",	"x-conference/x-cooltalk",	"",		"", NULL },
177	{ ".wrl",	"x-world/x-vrml",		"",		"", NULL },
178	{ ".vrml",	"x-world/x-vrml",		"",		"", NULL },
179	{ ".svg",	"image/svg+xml",		"",		"", NULL },
180	{ NULL,		NULL,		NULL,		NULL, NULL }
181};
182
183static bozo_content_map_t *
184search_map(bozo_content_map_t *map, const char *name, size_t len)
185{
186
187	for ( ; map && map->name; map++) {
188		const size_t namelen = strlen(map->name);
189
190		if (namelen < len &&
191		    strcasecmp(map->name, name + (len - namelen)) == 0)
192			return map;
193	}
194	return NULL;
195}
196
197/* match a suffix on a file - dynamiconly means no static content search */
198bozo_content_map_t *
199bozo_match_content_map(bozohttpd_t *httpd, const char *name,
200		       const int dynamiconly)
201{
202	bozo_content_map_t	*map;
203	size_t			 len;
204
205	len = strlen(name);
206	map = search_map(httpd->dynamic_content_map, name, len);
207	if (map == NULL && !dynamiconly)
208		map = search_map(static_content_map, name, len);
209
210	return map;
211}
212
213/*
214 * given the file name, return a valid Content-Type: value.
215 */
216/* ARGSUSED */
217const char *
218bozo_content_type(bozo_httpreq_t *request, const char *file)
219{
220	bozohttpd_t *httpd = request->hr_httpd;
221	bozo_content_map_t	*map;
222
223	map = bozo_match_content_map(httpd, file, 0);
224	if (map)
225		return map->type;
226	return httpd->consts.text_plain;
227}
228
229/*
230 * given the file name, return a valid Content-Encoding: value.
231 */
232const char *
233bozo_content_encoding(bozo_httpreq_t *request, const char *file)
234{
235	bozohttpd_t *httpd = request->hr_httpd;
236	bozo_content_map_t	*map;
237
238	map = bozo_match_content_map(httpd, file, 0);
239	if (map)
240		return (request->hr_proto == httpd->consts.http_11) ?
241		    map->encoding11 : map->encoding;
242	return NULL;
243}
244
245#ifndef NO_DYNAMIC_CONTENT
246
247bozo_content_map_t *
248bozo_get_content_map(bozohttpd_t *httpd, const char *name)
249{
250	bozo_content_map_t	*map;
251
252	if ((map = bozo_match_content_map(httpd, name, 1)) != NULL)
253		return map;
254
255	httpd->dynamic_content_map_size++;
256	httpd->dynamic_content_map = bozorealloc(httpd,
257		httpd->dynamic_content_map,
258		(httpd->dynamic_content_map_size + 1) * sizeof *map);
259	if (httpd->dynamic_content_map == NULL)
260		bozoerr(httpd, 1, "out of memory allocating content map");
261	map = &httpd->dynamic_content_map[httpd->dynamic_content_map_size];
262	map->name = map->type = map->encoding = map->encoding11 =
263		map->cgihandler = NULL;
264	map--;
265
266	return map;
267}
268
269/*
270 * mime content maps look like:
271 *	".name type encoding encoding11"
272 * where any of type, encoding or encoding11 a dash "-" means "".
273 * eg the .gtar, .tar.Z from above  could be written like:
274 *	".gtar multipart/x-gtar - -"
275 *	".tar.Z multipart/x-tar x-compress compress"
276 * or
277 *	".gtar multipart/x-gtar"
278 *	".tar.Z multipart/x-tar x-compress compress"
279 * NOTE: we destroy 'arg'
280 */
281void
282bozo_add_content_map_mime(bozohttpd_t *httpd, const char *cmap0,
283		const char *cmap1, const char *cmap2, const char *cmap3)
284{
285	bozo_content_map_t *map;
286
287	debug((httpd, DEBUG_FAT,
288		"add_content_map: name %s type %s enc %s enc11 %s ",
289		cmap0, cmap1, cmap2, cmap3));
290
291	map = bozo_get_content_map(httpd, cmap0);
292#define CHECKMAP(s)	(!s || ((s)[0] == '-' && (s)[1] == '\0') ? "" : (s))
293	map->name = CHECKMAP(cmap0);
294	map->type = CHECKMAP(cmap1);
295	map->encoding = CHECKMAP(cmap2);
296	map->encoding11 = CHECKMAP(cmap3);
297#undef CHECKMAP
298	map->cgihandler = NULL;
299}
300#endif /* NO_DYNAMIC_CONTENT */
301