1#	$OpenBSD: compress,v 1.7 2015/10/05 22:36:23 nicm Exp $
2
3#------------------------------------------------------------------------------
4# compress:  file(1) magic for pure-compression formats (no archives)
5#
6# compress, gzip, pack, compact, huf, squeeze, crunch, freeze, yabba, etc.
7#
8# Formats for various forms of compressed data
9# Formats for "compress" proper have been moved into "compress.c",
10# because it tries to uncompress it to figure out what's inside.
11
12# standard unix compress
130	string		\037\235	compress'd data
14!:mime	application/x-compress
15!:apple	LZIVZIVU
16>2	byte&0x80	>0		block compressed
17>2	byte&0x1f	x		%d bits
18
19# gzip (GNU zip, not to be confused with Info-ZIP or PKWARE zip archiver)
20#   Edited by Chris Chittleborough <cchittleborough@yahoo.com.au>, March 2002
21#	* Original filename is only at offset 10 if "extra field" absent
22#	* Produce shorter output - notably, only report compression methods
23#         other than 8 ("deflate", the only method defined in RFC 1952).
240       string          \037\213        gzip compressed data
25!:mime	application/x-gzip
26!:strength * 2
27>2	byte		<8		\b, reserved method
28>2	byte		>8		\b, unknown method
29>3	byte		&0x01		\b, ASCII
30>3	byte		&0x02		\b, has CRC
31>3	byte		&0x04		\b, extra field
32>3	byte&0xC	=0x08
33>>10	string		x		\b, was "%s"
34>3	byte		&0x10		\b, has comment
35>3	byte		&0x20		\b, encrypted
36>4	ledate		>0		\b, last modified: %s
37>8	byte		2		\b, max compression
38>8	byte		4		\b, max speed
39>9	byte		=0x00		\b, from FAT filesystem (MS-DOS, OS/2, NT)
40>9	byte		=0x01		\b, from Amiga
41>9	byte		=0x02		\b, from VMS
42>9	byte		=0x03		\b, from Unix
43>9	byte		=0x04		\b, from VM/CMS
44>9	byte		=0x05		\b, from Atari
45>9	byte		=0x06		\b, from HPFS filesystem (OS/2, NT)
46>9	byte		=0x07		\b, from MacOS
47>9	byte		=0x08		\b, from Z-System
48>9	byte		=0x09		\b, from CP/M
49>9	byte		=0x0A		\b, from TOPS/20
50>9	byte		=0x0B		\b, from NTFS filesystem (NT)
51>9	byte		=0x0C		\b, from QDOS
52>9	byte		=0x0D		\b, from Acorn RISCOS
53
54# packed data, Huffman (minimum redundancy) codes on a byte-by-byte basis
550	string		\037\036	packed data
56!:mime	application/octet-stream
57>2	belong		>1		\b, %d characters originally
58>2	belong		=1		\b, %d character originally
59#
60# This magic number is byte-order-independent.
610	short		0x1f1f		old packed data
62!:mime	application/octet-stream
63
64# XXX - why *two* entries for "compacted data", one of which is
65# byte-order independent, and one of which is byte-order dependent?
66#
670	short		0x1fff		compacted data
68!:mime	application/octet-stream
69# This string is valid for SunOS (BE) and a matching "short" is listed
70# in the Ultrix (LE) magic file.
710	string		\377\037	compacted data
72!:mime	application/octet-stream
730	short		0145405		huf output
74!:mime	application/octet-stream
75
76# bzip2
770	string		BZh		bzip2 compressed data
78!:mime	application/x-bzip2
79>3	byte		>47		\b, block size = %c00k
80
81# lzip
820	string		LZIP		lzip compressed data
83!:mime application/x-lzip
84>4	byte		x		\b, version: %d
85
86# squeeze and crunch
87# Michael Haardt <michael@cantor.informatik.rwth-aachen.de>
880	beshort		0x76FF		squeezed data,
89>4	string		x		original name %s
900	beshort		0x76FE		crunched data,
91>2	string		x		original name %s
920	beshort		0x76FD		LZH compressed data,
93>2	string		x		original name %s
94
95# Freeze
960	string		\037\237	frozen file 2.1
970	string		\037\236	frozen file 1.0 (or gzip 0.5)
98
99# SCO compress -H (LZH)
1000	string		\037\240	SCO compress -H (LZH) data
101
102# European GSM 06.10 is a provisional standard for full-rate speech
103# transcoding, prI-ETS 300 036, which uses RPE/LTP (residual pulse
104# excitation/long term prediction) coding at 13 kbit/s.
105#
106# There's only a magic nibble (4 bits); that nibble repeats every 33
107# bytes.  This isn't suited for use, but maybe we can use it someday.
108#
109# This will cause very short GSM files to be declared as data and
110# mismatches to be declared as data too!
111#0	byte&0xF0	0xd0		data
112#>33	byte&0xF0	0xd0
113#>66	byte&0xF0	0xd0
114#>99	byte&0xF0	0xd0
115#>132	byte&0xF0	0xd0		GSM 06.10 compressed audio
116
117# bzip	a block-sorting file compressor
118#	by Julian Seward <sewardj@cs.man.ac.uk> and others
119#
120#0	string		BZ		bzip compressed data
121#>2	byte		x		\b, version: %c
122#>3	string		=1		\b, compression block size 100k
123#>3	string		=2		\b, compression block size 200k
124#>3	string		=3		\b, compression block size 300k
125#>3	string		=4		\b, compression block size 400k
126#>3	string		=5		\b, compression block size 500k
127#>3	string		=6		\b, compression block size 600k
128#>3	string		=7		\b, compression block size 700k
129#>3	string		=8		\b, compression block size 800k
130#>3	string		=9		\b, compression block size 900k
131
132# lzop from <markus.oberhumer@jk.uni-linz.ac.at>
1330	string		\x89\x4c\x5a\x4f\x00\x0d\x0a\x1a\x0a	lzop compressed data
134>9	beshort		<0x0940
135>>9	byte&0xf0	=0x00		- version 0.
136>>9	beshort&0x0fff	x		\b%03x,
137>>13	byte		1		LZO1X-1,
138>>13	byte		2		LZO1X-1(15),
139>>13	byte		3		LZO1X-999,
140## >>22	bedate		>0		last modified: %s,
141>>14	byte		=0x00		os: MS-DOS
142>>14	byte		=0x01		os: Amiga
143>>14	byte		=0x02		os: VMS
144>>14	byte		=0x03		os: Unix
145>>14	byte		=0x05		os: Atari
146>>14	byte		=0x06		os: OS/2
147>>14	byte		=0x07		os: MacOS
148>>14	byte		=0x0A		os: Tops/20
149>>14	byte		=0x0B		os: WinNT
150>>14	byte		=0x0E		os: Win32
151>9	beshort		>0x0939
152>>9	byte&0xf0	=0x00		- version 0.
153>>9	byte&0xf0	=0x10		- version 1.
154>>9	byte&0xf0	=0x20		- version 2.
155>>9	beshort&0x0fff	x		\b%03x,
156>>15	byte		1		LZO1X-1,
157>>15	byte		2		LZO1X-1(15),
158>>15	byte		3		LZO1X-999,
159## >>25	bedate		>0		last modified: %s,
160>>17	byte		=0x00		os: MS-DOS
161>>17	byte		=0x01		os: Amiga
162>>17	byte		=0x02		os: VMS
163>>17	byte		=0x03		os: Unix
164>>17	byte		=0x05		os: Atari
165>>17	byte		=0x06		os: OS/2
166>>17	byte		=0x07		os: MacOS
167>>17	byte		=0x0A		os: Tops/20
168>>17	byte		=0x0B		os: WinNT
169>>17	byte		=0x0E		os: Win32
170
171# 4.3BSD-Quasijarus Strong Compression
172# http://minnie.tuhs.org/Quasijarus/compress.html
1730	string		\037\241	Quasijarus strong compressed data
174
175# From: Cory Dikkers <cdikkers@swbell.net>
1760	string		XPKF		Amiga xpkf.library compressed data
1770	string		PP11		Power Packer 1.1 compressed data
1780	string		PP20		Power Packer 2.0 compressed data,
179>4	belong		0x09090909	fast compression
180>4	belong		0x090A0A0A	mediocre compression
181>4	belong		0x090A0B0B	good compression
182>4	belong		0x090A0C0C	very good compression
183>4	belong		0x090A0C0D	best compression
184
185# 7-zip archiver, from Thomas Klausner (wiz@danbala.tuwien.ac.at)
186# http://www.7-zip.org or DOC/7zFormat.txt
187#
1880	string		7z\274\257\047\034	7-zip archive data,
189>6	byte		x			version %d
190>7	byte		x			\b.%d
191!:mime	application/x-7z-compressed
192
193# Type: LZMA
1940	lelong&0xffffff	=0x5d
195>12	leshort		0xff			LZMA compressed data,
196!:mime	application/x-lzma
197>>5	lequad		=0xffffffffffffffff	streamed
198>>5	lequad		!0xffffffffffffffff	non-streamed, size %lld
199>12	leshort		0			LZMA compressed data,
200>>5	lequad		=0xffffffffffffffff	streamed
201>>5	lequad		!0xffffffffffffffff	non-streamed, size %lld
202
203# http://tukaani.org/xz/xz-file-format.txt
2040	ustring		\xFD7zXZ\x00		XZ compressed data
205!:strength * 2
206!:mime	application/x-xz
207
208# https://github.com/ckolivas/lrzip/blob/master/doc/magic.header.txt
2090	string		LRZI			LRZIP compressed data
210>4	byte		x			- version %d
211>5	byte		x			\b.%d
212!:mime	application/x-lrzip
213
214# http://fastcompression.blogspot.fi/2013/04/lz4-streaming-format-final.html
2150	lelong		0x184d2204	LZ4 compressed data (v1.4+)
216!:mime	application/x-lz4
217# Added by osm0sis@xda-developers.com
2180 	lelong		0x184c2103	LZ4 compressed data (v1.0-v1.3)
219!:mime	application/x-lz4
2200	lelong		0x184c2102	LZ4 compressed data (v0.1-v0.9)
221!:mime	application/x-lz4
222
223# AFX compressed files (Wolfram Kleff)
2242	string		-afx-		AFX compressed file data
225
226# Supplementary magic data for the file(1) command to support
227# rzip(1).  The format is described in magic(5).
228#
229# Copyright (C) 2003 by Andrew Tridgell.  You may do whatever you want with
230# this file.
231#
2320	string		RZIP		rzip compressed data
233>4	byte		x		- version %d
234>5	byte		x		\b.%d
235>6	belong		x		(%d bytes)
236
2370	string		ArC\x01		FreeArc archive <http://freearc.org>
238
239# Type:	DACT compressed files
2400	long	0x444354C3	DACT compressed data
241>4	byte	>-1		(version %i.
242>5	byte	>-1		%i.
243>6	byte	>-1		%i)
244>7	long	>0		, original size: %i bytes
245>15	long	>30		, block size: %i bytes
246
247# Valve Pack (VPK) files
2480	lelong	0x55aa1234	Valve Pak file
249>0x4	lelong	x		\b, version %u
250>0x8	lelong	x		\b, %u entries
251
252# Snappy framing format
253# http://code.google.com/p/snappy/source/browse/trunk/framing_format.txt
2540	string	\377\006\0\0sNaPpY	snappy framed data
255!:mime	application/x-snappy-framed
256
257# qpress, http://www.quicklz.com/
2580	string	qpress10	qpress compressed data
259!:mime	application/x-qpress
260
261# Zlib https://www.ietf.org/rfc/rfc6713.txt
2620	string/b	x
263>0	beshort%31	=0	
264>>0	byte&0xf	=8
265>>>0	byte&0x80 	=0	zlib compressed data
266!:mime	application/zlib
267