blob: 1517559c64c353429adf9bc850da81758d28ba58 [file] [log] [blame]
"Robert P. J. Day"63fc1a92006-07-02 19:47:05 +00001/* vi: set sw=4 ts=4: */
Denys Vlasenko2ab94032017-10-05 15:33:28 +02002/*
3 * uncompress for busybox -- (c) 2002 Robert Griebl
Robert Griebl94a6a952002-05-19 19:00:14 +00004 *
Eric Andersenc7bda1c2004-03-15 08:29:22 +00005 * based on the original compress42.c source
Robert Griebl94a6a952002-05-19 19:00:14 +00006 * (see disclaimer below)
7 */
Robert Griebl94a6a952002-05-19 19:00:14 +00008/* (N)compress42.c - File compression ala IEEE Computer, Mar 1992.
9 *
10 * Authors:
11 * Spencer W. Thomas (decvax!harpo!utah-cs!utah-gr!thomas)
12 * Jim McKie (decvax!mcvax!jim)
13 * Steve Davies (decvax!vax135!petsd!peora!srd)
14 * Ken Turkowski (decvax!decwrl!turtlevax!ken)
15 * James A. Woods (decvax!ihnp4!ames!jaw)
16 * Joe Orost (decvax!vax135!petsd!joe)
17 * Dave Mack (csu@alembic.acs.com)
18 * Peter Jannesen, Network Communication Systems
19 * (peter@ncs.nl)
20 *
21 * marc@suse.de : a small security fix for a buffer overflow
22 *
23 * [... History snipped ...]
Robert Griebl94a6a952002-05-19 19:00:14 +000024 */
Denis Vlasenkoe9ad84d2008-08-05 13:10:34 +000025#include "libbb.h"
Denys Vlasenkod184a722011-09-22 12:45:14 +020026#include "bb_archive.h"
Denis Vlasenkoe9ad84d2008-08-05 13:10:34 +000027
28
/* Default input buffer size */
#define IBUFSIZ 2048

/* Default output buffer size */
#define OBUFSIZ 2048

/* Defines for third byte of header */
#define BIT_MASK        0x1f    /* Mask for 'number of compression bits' */
                                /* Masks 0x20 and 0x40 are free. */
                                /* I think 0x20 should mean that there is */
                                /* a fourth header byte (for expansion). */
#define BLOCK_MODE      0x80    /* Block compression: if table is full and */
                                /* compression rate is dropping, flush tables */
/* The next two codes should not be changed lightly, as they must not */
/* lie within the contiguous general code space. */
#define FIRST   257     /* first free entry */
#define CLEAR   256     /* table clear output code */

#define INIT_BITS 9     /* initial number of bits/code */


/* machine variants which require cc -Dmachine: pdp11, z8000, DOS */
#define HBITS      17   /* 50% occupancy */
#define HSIZE      (1<<HBITS)
#define HMASK      (HSIZE-1)    /* unused */
#define HPRIME     9941         /* unused */
#define BITS       16
#define BITS_STR   "16"         /* must be kept in sync with BITS by hand */
#undef  MAXSEG_64K              /* unused */
#define MAXCODE(n) (1L << (n))

/*
 * Table accessors. They expand to expressions on variables named
 * 'htab' and 'codetab', which must be in scope at the point of use.
 * The same 'htab' byte array is used for two things: tab_suffixof()
 * indexes it from the start, while de_stack is the address of its
 * last byte.
 */
#define htabof(i)               (htab[(i)])
#define codetabof(i)            (codetab[(i)])
#define tab_prefixof(i)         codetabof(i)
#define tab_suffixof(i)         (((unsigned char *)(htab))[(i)])
#define de_stack                ((unsigned char *)&(htab[HSIZE-1]))
/* Zeroes the first 256 bytes (not 256 elements) of codetab */
#define clear_tab_prefixof()    memset(codetab, 0, 256)
Robert Griebl94a6a952002-05-19 19:00:14 +000066
Robert Griebl94a6a952002-05-19 19:00:14 +000067/*
68 * Decompress stdin to stdout. This routine adapts to the codes in the
69 * file building the "string" table on-the-fly; requiring no table to
Denis Vlasenkoe8a07882007-06-10 15:08:44 +000070 * be stored in the compressed file.
Robert Griebl94a6a952002-05-19 19:00:14 +000071 */
72
Denis Vlasenko5e34ff22009-04-21 11:09:40 +000073IF_DESKTOP(long long) int FAST_FUNC
Denys Vlasenkob4c11c12014-12-07 00:44:00 +010074unpack_Z_stream(transformer_state_t *xstate)
Robert Griebl94a6a952002-05-19 19:00:14 +000075{
Denis Vlasenko5e34ff22009-04-21 11:09:40 +000076 IF_DESKTOP(long long total_written = 0;)
77 IF_DESKTOP(long long) int retval = -1;
Glenn L McGrathfedbfe42002-11-28 09:09:47 +000078 unsigned char *stackp;
Glenn L McGrathfedbfe42002-11-28 09:09:47 +000079 int finchar;
Denis Vlasenko87468852007-04-13 23:22:00 +000080 long oldcode;
81 long incode;
Glenn L McGrathfedbfe42002-11-28 09:09:47 +000082 int inbits;
83 int posbits;
84 int outpos;
85 int insize;
86 int bitmask;
Denis Vlasenko87468852007-04-13 23:22:00 +000087 long free_ent;
88 long maxcode;
89 long maxmaxcode;
Glenn L McGrathfedbfe42002-11-28 09:09:47 +000090 int n_bits;
91 int rsize = 0;
Denis Vlasenkoe8a07882007-06-10 15:08:44 +000092 unsigned char *inbuf; /* were eating insane amounts of stack - */
93 unsigned char *outbuf; /* bad for some embedded targets */
94 unsigned char *htab;
95 unsigned short *codetab;
Denis Vlasenko447b5432007-01-05 19:49:02 +000096
97 /* Hmm, these were statics - why?! */
98 /* user settable max # bits/code */
99 int maxbits; /* = BITS; */
100 /* block compress mode -C compatible with 2.0 */
101 int block_mode; /* = BLOCK_MODE; */
102
Denys Vlasenkob4c11c12014-12-07 00:44:00 +0100103 if (check_signature16(xstate, COMPRESS_MAGIC))
Denys Vlasenko8a6a2f92012-03-06 16:27:48 +0100104 return -1;
105
Denis Vlasenkoe8a07882007-06-10 15:08:44 +0000106 inbuf = xzalloc(IBUFSIZ + 64);
107 outbuf = xzalloc(OBUFSIZ + 2048);
Denys Vlasenko59655072012-03-06 16:23:50 +0100108 htab = xzalloc(HSIZE); /* wasn't zeroed out before, maybe can xmalloc? */
Denis Vlasenkoe8a07882007-06-10 15:08:44 +0000109 codetab = xzalloc(HSIZE * sizeof(codetab[0]));
Robert Griebl94a6a952002-05-19 19:00:14 +0000110
111 insize = 0;
112
Denis Vlasenko447b5432007-01-05 19:49:02 +0000113 /* xread isn't good here, we have to return - caller may want
114 * to do some cleanup (e.g. delete incomplete unpacked file etc) */
Denys Vlasenkob4c11c12014-12-07 00:44:00 +0100115 if (full_read(xstate->src_fd, inbuf, 1) != 1) {
Denis Vlasenko447b5432007-01-05 19:49:02 +0000116 bb_error_msg("short read");
Denis Vlasenkoe8a07882007-06-10 15:08:44 +0000117 goto err;
Denis Vlasenko447b5432007-01-05 19:49:02 +0000118 }
Robert Griebl94a6a952002-05-19 19:00:14 +0000119
120 maxbits = inbuf[0] & BIT_MASK;
121 block_mode = inbuf[0] & BLOCK_MODE;
122 maxmaxcode = MAXCODE(maxbits);
123
Glenn L McGrathfedbfe42002-11-28 09:09:47 +0000124 if (maxbits > BITS) {
Denis Vlasenko447b5432007-01-05 19:49:02 +0000125 bb_error_msg("compressed with %d bits, can only handle "
Denis Vlasenkoe8a07882007-06-10 15:08:44 +0000126 BITS_STR" bits", maxbits);
127 goto err;
Robert Griebl94a6a952002-05-19 19:00:14 +0000128 }
129
Denis Vlasenko447b5432007-01-05 19:49:02 +0000130 n_bits = INIT_BITS;
131 maxcode = MAXCODE(INIT_BITS) - 1;
132 bitmask = (1 << INIT_BITS) - 1;
Robert Griebl94a6a952002-05-19 19:00:14 +0000133 oldcode = -1;
134 finchar = 0;
135 outpos = 0;
Glenn L McGrathfedbfe42002-11-28 09:09:47 +0000136 posbits = 0 << 3;
Robert Griebl94a6a952002-05-19 19:00:14 +0000137
Glenn L McGrathfedbfe42002-11-28 09:09:47 +0000138 free_ent = ((block_mode) ? FIRST : 256);
Robert Griebl94a6a952002-05-19 19:00:14 +0000139
Glenn L McGrathfedbfe42002-11-28 09:09:47 +0000140 /* As above, initialize the first 256 entries in the table. */
Denis Vlasenkoe8a07882007-06-10 15:08:44 +0000141 /*clear_tab_prefixof(); - done by xzalloc */
Robert Griebl94a6a952002-05-19 19:00:14 +0000142
Denys Vlasenkoc71547c2012-12-05 01:04:54 +0100143 {
144 int i;
145 for (i = 255; i >= 0; --i)
146 tab_suffixof(i) = (unsigned char) i;
Glenn L McGrathfedbfe42002-11-28 09:09:47 +0000147 }
Robert Griebl94a6a952002-05-19 19:00:14 +0000148
Glenn L McGrathfedbfe42002-11-28 09:09:47 +0000149 do {
Denis Vlasenko447b5432007-01-05 19:49:02 +0000150 resetbuf:
Robert Griebl94a6a952002-05-19 19:00:14 +0000151 {
Glenn L McGrathfedbfe42002-11-28 09:09:47 +0000152 int i;
153 int e;
154 int o;
Robert Griebl94a6a952002-05-19 19:00:14 +0000155
Denis Vlasenko447b5432007-01-05 19:49:02 +0000156 o = posbits >> 3;
157 e = insize - o;
Robert Griebl94a6a952002-05-19 19:00:14 +0000158
Glenn L McGrathfedbfe42002-11-28 09:09:47 +0000159 for (i = 0; i < e; ++i)
160 inbuf[i] = inbuf[i + o];
Robert Griebl94a6a952002-05-19 19:00:14 +0000161
162 insize = e;
163 posbits = 0;
164 }
165
Bernhard Reutner-Fischer5d725462006-09-06 15:28:32 +0000166 if (insize < (int) (IBUFSIZ + 64) - IBUFSIZ) {
Denys Vlasenkob4c11c12014-12-07 00:44:00 +0100167 rsize = safe_read(xstate->src_fd, inbuf + insize, IBUFSIZ);
Denys Vlasenko251fc702011-08-18 14:29:41 +0200168 if (rsize < 0)
Denys Vlasenkoa04e4c22011-08-22 04:59:41 +0200169 bb_error_msg_and_die(bb_msg_read_error);
Robert Griebl94a6a952002-05-19 19:00:14 +0000170 insize += rsize;
171 }
172
Glenn L McGrathfedbfe42002-11-28 09:09:47 +0000173 inbits = ((rsize > 0) ? (insize - insize % n_bits) << 3 :
174 (insize << 3) - (n_bits - 1));
Robert Griebl94a6a952002-05-19 19:00:14 +0000175
Glenn L McGrathfedbfe42002-11-28 09:09:47 +0000176 while (inbits > posbits) {
Denys Vlasenkoc71547c2012-12-05 01:04:54 +0100177 long code;
178
Glenn L McGrathfedbfe42002-11-28 09:09:47 +0000179 if (free_ent > maxcode) {
180 posbits =
181 ((posbits - 1) +
182 ((n_bits << 3) -
183 (posbits - 1 + (n_bits << 3)) % (n_bits << 3)));
Robert Griebl94a6a952002-05-19 19:00:14 +0000184 ++n_bits;
Glenn L McGrathfedbfe42002-11-28 09:09:47 +0000185 if (n_bits == maxbits) {
Robert Griebl94a6a952002-05-19 19:00:14 +0000186 maxcode = maxmaxcode;
Glenn L McGrathfedbfe42002-11-28 09:09:47 +0000187 } else {
188 maxcode = MAXCODE(n_bits) - 1;
189 }
190 bitmask = (1 << n_bits) - 1;
Robert Griebl94a6a952002-05-19 19:00:14 +0000191 goto resetbuf;
192 }
Glenn L McGrathfedbfe42002-11-28 09:09:47 +0000193 {
194 unsigned char *p = &inbuf[posbits >> 3];
Denys Vlasenkoc71547c2012-12-05 01:04:54 +0100195 code = ((p[0]
196 | ((long) (p[1]) << 8)
197 | ((long) (p[2]) << 16)) >> (posbits & 0x7)) & bitmask;
Robert Griebl94a6a952002-05-19 19:00:14 +0000198 }
199 posbits += n_bits;
Robert Griebl94a6a952002-05-19 19:00:14 +0000200
Glenn L McGrathfedbfe42002-11-28 09:09:47 +0000201 if (oldcode == -1) {
Denys Vlasenko251fc702011-08-18 14:29:41 +0200202 if (code >= 256)
203 bb_error_msg_and_die("corrupted data"); /* %ld", code); */
Denis Vlasenko97a8dd32006-10-01 15:55:11 +0000204 oldcode = code;
205 finchar = (int) oldcode;
206 outbuf[outpos++] = (unsigned char) finchar;
Robert Griebl94a6a952002-05-19 19:00:14 +0000207 continue;
208 }
209
Glenn L McGrathfedbfe42002-11-28 09:09:47 +0000210 if (code == CLEAR && block_mode) {
Robert Griebl94a6a952002-05-19 19:00:14 +0000211 clear_tab_prefixof();
Glenn L McGrathfedbfe42002-11-28 09:09:47 +0000212 free_ent = FIRST - 1;
213 posbits =
214 ((posbits - 1) +
215 ((n_bits << 3) -
216 (posbits - 1 + (n_bits << 3)) % (n_bits << 3)));
Denis Vlasenko447b5432007-01-05 19:49:02 +0000217 n_bits = INIT_BITS;
218 maxcode = MAXCODE(INIT_BITS) - 1;
219 bitmask = (1 << INIT_BITS) - 1;
Robert Griebl94a6a952002-05-19 19:00:14 +0000220 goto resetbuf;
221 }
222
223 incode = code;
Glenn L McGrathfedbfe42002-11-28 09:09:47 +0000224 stackp = de_stack;
Robert Griebl94a6a952002-05-19 19:00:14 +0000225
Glenn L McGrathfedbfe42002-11-28 09:09:47 +0000226 /* Special case for KwKwK string. */
227 if (code >= free_ent) {
228 if (code > free_ent) {
Denys Vlasenko4d5955e2012-12-05 11:08:30 +0100229/*
Glenn L McGrathfedbfe42002-11-28 09:09:47 +0000230 unsigned char *p;
Robert Griebl94a6a952002-05-19 19:00:14 +0000231
232 posbits -= n_bits;
Glenn L McGrathfedbfe42002-11-28 09:09:47 +0000233 p = &inbuf[posbits >> 3];
Manuel Novoa III cad53642003-03-19 09:13:01 +0000234 bb_error_msg
Glenn L McGrathfedbfe42002-11-28 09:09:47 +0000235 ("insize:%d posbits:%d inbuf:%02X %02X %02X %02X %02X (%d)",
Denys Vlasenko60cb48c2013-01-14 15:57:44 +0100236 insize, posbits, p[-1], p[0], p[1], p[2], p[3],
237 (posbits & 07));
Denys Vlasenkoa8461172012-12-05 01:06:05 +0100238*/
Denys Vlasenkoccb88a62010-05-27 02:22:54 +0200239 bb_error_msg("corrupted data");
Denis Vlasenkoe8a07882007-06-10 15:08:44 +0000240 goto err;
Robert Griebl94a6a952002-05-19 19:00:14 +0000241 }
242
Glenn L McGrathfedbfe42002-11-28 09:09:47 +0000243 *--stackp = (unsigned char) finchar;
244 code = oldcode;
Robert Griebl94a6a952002-05-19 19:00:14 +0000245 }
246
Glenn L McGrathfedbfe42002-11-28 09:09:47 +0000247 /* Generate output characters in reverse order */
Denys Vlasenkoc71547c2012-12-05 01:04:54 +0100248 while (code >= 256) {
Denys Vlasenko251fc702011-08-18 14:29:41 +0200249 if (stackp <= &htabof(0))
250 bb_error_msg_and_die("corrupted data");
Glenn L McGrathfedbfe42002-11-28 09:09:47 +0000251 *--stackp = tab_suffixof(code);
252 code = tab_prefixof(code);
Robert Griebl94a6a952002-05-19 19:00:14 +0000253 }
254
Denis Vlasenko447b5432007-01-05 19:49:02 +0000255 finchar = tab_suffixof(code);
256 *--stackp = (unsigned char) finchar;
Robert Griebl94a6a952002-05-19 19:00:14 +0000257
Glenn L McGrathfedbfe42002-11-28 09:09:47 +0000258 /* And put them out in forward order */
Robert Griebl94a6a952002-05-19 19:00:14 +0000259 {
Glenn L McGrathfedbfe42002-11-28 09:09:47 +0000260 int i;
Robert Griebl94a6a952002-05-19 19:00:14 +0000261
Denis Vlasenko447b5432007-01-05 19:49:02 +0000262 i = de_stack - stackp;
263 if (outpos + i >= OBUFSIZ) {
Glenn L McGrathfedbfe42002-11-28 09:09:47 +0000264 do {
265 if (i > OBUFSIZ - outpos) {
266 i = OBUFSIZ - outpos;
267 }
Robert Griebl94a6a952002-05-19 19:00:14 +0000268
Glenn L McGrathfedbfe42002-11-28 09:09:47 +0000269 if (i > 0) {
270 memcpy(outbuf + outpos, stackp, i);
Robert Griebl94a6a952002-05-19 19:00:14 +0000271 outpos += i;
272 }
273
Glenn L McGrathfedbfe42002-11-28 09:09:47 +0000274 if (outpos >= OBUFSIZ) {
Denys Vlasenkob4c11c12014-12-07 00:44:00 +0100275 xtransformer_write(xstate, outbuf, outpos);
Denis Vlasenko5e34ff22009-04-21 11:09:40 +0000276 IF_DESKTOP(total_written += outpos;)
Robert Griebl94a6a952002-05-19 19:00:14 +0000277 outpos = 0;
278 }
Glenn L McGrathfedbfe42002-11-28 09:09:47 +0000279 stackp += i;
Denis Vlasenko447b5432007-01-05 19:49:02 +0000280 i = de_stack - stackp;
281 } while (i > 0);
Glenn L McGrathfedbfe42002-11-28 09:09:47 +0000282 } else {
283 memcpy(outbuf + outpos, stackp, i);
Robert Griebl94a6a952002-05-19 19:00:14 +0000284 outpos += i;
285 }
286 }
287
Glenn L McGrathfedbfe42002-11-28 09:09:47 +0000288 /* Generate the new entry. */
Denys Vlasenkoc71547c2012-12-05 01:04:54 +0100289 if (free_ent < maxmaxcode) {
290 tab_prefixof(free_ent) = (unsigned short) oldcode;
291 tab_suffixof(free_ent) = (unsigned char) finchar;
292 free_ent++;
Glenn L McGrathfedbfe42002-11-28 09:09:47 +0000293 }
Robert Griebl94a6a952002-05-19 19:00:14 +0000294
Glenn L McGrathfedbfe42002-11-28 09:09:47 +0000295 /* Remember previous code. */
296 oldcode = incode;
Robert Griebl94a6a952002-05-19 19:00:14 +0000297 }
Glenn L McGrathfedbfe42002-11-28 09:09:47 +0000298 } while (rsize > 0);
Robert Griebl94a6a952002-05-19 19:00:14 +0000299
Glenn L McGrath2e41d0c2002-09-27 06:46:02 +0000300 if (outpos > 0) {
Denys Vlasenkob4c11c12014-12-07 00:44:00 +0100301 xtransformer_write(xstate, outbuf, outpos);
Denis Vlasenko5e34ff22009-04-21 11:09:40 +0000302 IF_DESKTOP(total_written += outpos;)
Glenn L McGrath2e41d0c2002-09-27 06:46:02 +0000303 }
Robert Griebl94a6a952002-05-19 19:00:14 +0000304
Denis Vlasenko5e34ff22009-04-21 11:09:40 +0000305 retval = IF_DESKTOP(total_written) + 0;
Denis Vlasenkoe8a07882007-06-10 15:08:44 +0000306 err:
307 free(inbuf);
308 free(outbuf);
309 free(htab);
310 free(codetab);
311 return retval;
Robert Griebl94a6a952002-05-19 19:00:14 +0000312}