blob: 7e30091d95de9de8a13dd14c1384672d0c697e1b [file] [log] [blame]
Denis Vlasenko052ad9a2009-04-29 12:01:51 +00001/*
2 This file is part of the lzop file compressor.
3
4 Copyright (C) 1996..2003 Markus Franz Xaver Johannes Oberhumer
5 All Rights Reserved.
6
7 Markus F.X.J. Oberhumer <markus@oberhumer.com>
8 http://www.oberhumer.com/opensource/lzop/
9
10 lzop and the LZO library are free software; you can redistribute them
11 and/or modify them under the terms of the GNU General Public License as
12 published by the Free Software Foundation; either version 2 of
13 the License, or (at your option) any later version.
14
15 This program is distributed in the hope that it will be useful,
16 but WITHOUT ANY WARRANTY; without even the implied warranty of
17 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
18 GNU General Public License for more details.
19
20 You should have received a copy of the GNU General Public License
21 along with this program; see the file COPYING.
22 If not, write to the Free Software Foundation, Inc.,
23 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.
24
25 "Minimalized" for busybox by Alain Knaff
26*/
27
Pere Orga1f4447b2011-03-27 22:40:30 +020028//usage:#define lzop_trivial_usage
29//usage: "[-cfvd123456789CF] [FILE]..."
30//usage:#define lzop_full_usage "\n\n"
Denys Vlasenko66426762011-06-05 03:58:28 +020031//usage: " -1..9 Compression level"
Pere Orga1f4447b2011-03-27 22:40:30 +020032//usage: "\n -d Decompress"
33//usage: "\n -c Write to stdout"
34//usage: "\n -f Force"
35//usage: "\n -v Verbose"
36//usage: "\n -F Don't store or verify checksum"
37//usage: "\n -C Also write checksum of compressed block"
38//usage:
39//usage:#define lzopcat_trivial_usage
40//usage: "[-vCF] [FILE]..."
41//usage:#define lzopcat_full_usage "\n\n"
42//usage: " -v Verbose"
43//usage: "\n -F Don't store or verify checksum"
44//usage:
45//usage:#define unlzop_trivial_usage
46//usage: "[-cfvCF] [FILE]..."
47//usage:#define unlzop_full_usage "\n\n"
Denys Vlasenko66426762011-06-05 03:58:28 +020048//usage: " -c Write to stdout"
Pere Orga1f4447b2011-03-27 22:40:30 +020049//usage: "\n -f Force"
50//usage: "\n -v Verbose"
51//usage: "\n -F Don't store or verify checksum"
52
Denis Vlasenko052ad9a2009-04-29 12:01:51 +000053#include "libbb.h"
Denys Vlasenkod184a722011-09-22 12:45:14 +020054#include "bb_archive.h"
Denis Vlasenko052ad9a2009-04-29 12:01:51 +000055#include "liblzo_interface.h"
56
/* Taken from lzo-2.03/src/lzo_ptr.h:
 * distance between two pointers, as an unsigned value */
#define pd(a,b) ((unsigned)((a)-(b)))

/* Value stored in the lib_version field of a header we write */
#define lzo_version() LZO_VERSION
#define lzo_sizeof_dict_t (sizeof(uint8_t*))

/* Taken from lzo-2.03/include/lzo/lzo1x.h:
 * size in bytes of the work memory handed to each compressor */
#define LZO1X_1_MEM_COMPRESS (16384 * lzo_sizeof_dict_t)
#define LZO1X_1_15_MEM_COMPRESS (32768 * lzo_sizeof_dict_t)
#define LZO1X_999_MEM_COMPRESS (14 * 16384 * sizeof(short))

/* Taken from lzo-2.03/src/lzo1x_oo.c:
 * marker meaning "no pending literal count" in lzo1x_optimize() */
#define NO_LIT UINT_MAX
70
71/**********************************************************************/
/*
 * Store two bytes at ip, taken from m_pos.
 * When off is 1, m_pos[1] is not read: m_pos[0] is stored twice.
 */
static void copy2(uint8_t* ip, const uint8_t* m_pos, unsigned off)
{
	ip[0] = m_pos[0];
	ip[1] = m_pos[off == 1 ? 0 : 1];
}
80
/*
 * Store three bytes at ip, taken from m_pos.
 * Only the first off bytes of m_pos are read when off is 1 or 2;
 * the pattern then wraps around to m_pos[0].
 */
static void copy3(uint8_t* ip, const uint8_t* m_pos, unsigned off)
{
	ip[0] = m_pos[0];
	switch (off) {
	case 1:
		ip[2] = ip[1] = m_pos[0];
		break;
	case 2:
		ip[1] = m_pos[1];
		ip[2] = m_pos[0];
		break;
	default:
		ip[1] = m_pos[1];
		ip[2] = m_pos[2];
		break;
	}
}
96
97/**********************************************************************/
98// optimize a block of data.
99/**********************************************************************/
100#define TEST_IP (ip < ip_end)
101#define TEST_OP (op <= op_end)
102
Denys Vlasenkoa7bb3c12009-10-08 12:28:08 +0200103static NOINLINE int lzo1x_optimize(uint8_t *in, unsigned in_len,
Denis Vlasenko052ad9a2009-04-29 12:01:51 +0000104 uint8_t *out, unsigned *out_len,
105 void* wrkmem UNUSED_PARAM)
106{
107 uint8_t* op;
108 uint8_t* ip;
109 unsigned t;
110 uint8_t* m_pos;
111 uint8_t* const ip_end = in + in_len;
112 uint8_t* const op_end = out + *out_len;
113 uint8_t* litp = NULL;
114 unsigned lit = 0;
115 unsigned next_lit = NO_LIT;
116 unsigned nl;
117 unsigned long o_m1_a = 0, o_m1_b = 0, o_m2 = 0, o_m3_a = 0, o_m3_b = 0;
118
119// LZO_UNUSED(wrkmem);
120
121 *out_len = 0;
122
123 op = out;
124 ip = in;
125
126 if (*ip > 17) {
127 t = *ip++ - 17;
128 if (t < 4)
129 goto match_next;
130 goto first_literal_run;
131 }
132
133 while (TEST_IP && TEST_OP) {
134 t = *ip++;
135 if (t >= 16)
136 goto match;
137 /* a literal run */
138 litp = ip - 1;
139 if (t == 0) {
140 t = 15;
141 while (*ip == 0)
142 t += 255, ip++;
143 t += *ip++;
144 }
145 lit = t + 3;
146 /* copy literals */
147 copy_literal_run:
148 *op++ = *ip++;
149 *op++ = *ip++;
150 *op++ = *ip++;
151 first_literal_run:
152 do *op++ = *ip++; while (--t > 0);
153
154 t = *ip++;
155
156 if (t >= 16)
157 goto match;
158#if defined(LZO1X)
159 m_pos = op - 1 - 0x800;
160#elif defined(LZO1Y)
161 m_pos = op - 1 - 0x400;
162#endif
163 m_pos -= t >> 2;
164 m_pos -= *ip++ << 2;
165 *op++ = *m_pos++;
166 *op++ = *m_pos++;
167 *op++ = *m_pos++;
168 lit = 0;
169 goto match_done;
170
171
172 /* handle matches */
173 do {
174 if (t < 16) { /* a M1 match */
175 m_pos = op - 1;
176 m_pos -= t >> 2;
177 m_pos -= *ip++ << 2;
178
179 if (litp == NULL)
180 goto copy_m1;
181
182 nl = ip[-2] & 3;
183 /* test if a match follows */
184 if (nl == 0 && lit == 1 && ip[0] >= 16) {
185 next_lit = nl;
186 /* adjust length of previous short run */
187 lit += 2;
188 *litp = (unsigned char)((*litp & ~3) | lit);
189 /* copy over the 2 literals that replace the match */
190 copy2(ip-2, m_pos, pd(op, m_pos));
191 o_m1_a++;
192 }
193 /* test if a literal run follows */
Denys Vlasenko6b9f1632010-01-28 02:24:24 +0100194 else
195 if (nl == 0
196 && ip[0] < 16
197 && ip[0] != 0
198 && (lit + 2 + ip[0] < 16)
199 ) {
Denis Vlasenko052ad9a2009-04-29 12:01:51 +0000200 t = *ip++;
201 /* remove short run */
202 *litp &= ~3;
203 /* copy over the 2 literals that replace the match */
204 copy2(ip-3+1,m_pos,pd(op,m_pos));
205 /* move literals 1 byte ahead */
206 litp += 2;
207 if (lit > 0)
208 memmove(litp+1, litp, lit);
209 /* insert new length of long literal run */
210 lit += 2 + t + 3;
211 *litp = (unsigned char)(lit - 3);
212
213 o_m1_b++;
214 *op++ = *m_pos++; *op++ = *m_pos++;
215 goto copy_literal_run;
216 }
217 copy_m1:
218 *op++ = *m_pos++;
219 *op++ = *m_pos++;
220 } else {
221 match:
222 if (t >= 64) { /* a M2 match */
223 m_pos = op - 1;
224#if defined(LZO1X)
225 m_pos -= (t >> 2) & 7;
226 m_pos -= *ip++ << 3;
227 t = (t >> 5) - 1;
228#elif defined(LZO1Y)
229 m_pos -= (t >> 2) & 3;
230 m_pos -= *ip++ << 2;
231 t = (t >> 4) - 3;
232#endif
233 if (litp == NULL)
234 goto copy_m;
235
236 nl = ip[-2] & 3;
237 /* test if in beetween two long literal runs */
238 if (t == 1 && lit > 3 && nl == 0
239 && ip[0] < 16 && ip[0] != 0 && (lit + 3 + ip[0] < 16)
240 ) {
241 t = *ip++;
242 /* copy over the 3 literals that replace the match */
243 copy3(ip-1-2,m_pos,pd(op,m_pos));
244 /* set new length of previous literal run */
245 lit += 3 + t + 3;
246 *litp = (unsigned char)(lit - 3);
247 o_m2++;
248 *op++ = *m_pos++;
249 *op++ = *m_pos++;
250 *op++ = *m_pos++;
251 goto copy_literal_run;
252 }
253 } else {
254 if (t >= 32) { /* a M3 match */
255 t &= 31;
256 if (t == 0) {
257 t = 31;
258 while (*ip == 0)
259 t += 255, ip++;
260 t += *ip++;
261 }
262 m_pos = op - 1;
263 m_pos -= *ip++ >> 2;
264 m_pos -= *ip++ << 6;
265 } else { /* a M4 match */
266 m_pos = op;
267 m_pos -= (t & 8) << 11;
268 t &= 7;
269 if (t == 0) {
270 t = 7;
271 while (*ip == 0)
272 t += 255, ip++;
273 t += *ip++;
274 }
275 m_pos -= *ip++ >> 2;
276 m_pos -= *ip++ << 6;
277 if (m_pos == op)
278 goto eof_found;
279 m_pos -= 0x4000;
280 }
281 if (litp == NULL)
282 goto copy_m;
283
284 nl = ip[-2] & 3;
285 /* test if in beetween two matches */
286 if (t == 1 && lit == 0 && nl == 0 && ip[0] >= 16) {
287 next_lit = nl;
288 /* make a previous short run */
289 lit += 3;
290 *litp = (unsigned char)((*litp & ~3) | lit);
291 /* copy over the 3 literals that replace the match */
292 copy3(ip-3,m_pos,pd(op,m_pos));
293 o_m3_a++;
294 }
295 /* test if a literal run follows */
296 else if (t == 1 && lit <= 3 && nl == 0
297 && ip[0] < 16 && ip[0] != 0 && (lit + 3 + ip[0] < 16)
298 ) {
299 t = *ip++;
300 /* remove short run */
301 *litp &= ~3;
302 /* copy over the 3 literals that replace the match */
303 copy3(ip-4+1,m_pos,pd(op,m_pos));
304 /* move literals 1 byte ahead */
305 litp += 2;
306 if (lit > 0)
307 memmove(litp+1,litp,lit);
308 /* insert new length of long literal run */
309 lit += 3 + t + 3;
310 *litp = (unsigned char)(lit - 3);
311
312 o_m3_b++;
313 *op++ = *m_pos++;
314 *op++ = *m_pos++;
315 *op++ = *m_pos++;
316 goto copy_literal_run;
317 }
318 }
319 copy_m:
320 *op++ = *m_pos++;
321 *op++ = *m_pos++;
322 do *op++ = *m_pos++; while (--t > 0);
323 }
324
325 match_done:
326 if (next_lit == NO_LIT) {
327 t = ip[-2] & 3;
328 lit = t;
329 litp = ip - 2;
330 }
331 else
332 t = next_lit;
333 next_lit = NO_LIT;
334 if (t == 0)
335 break;
336 /* copy literals */
337 match_next:
338 do *op++ = *ip++; while (--t > 0);
339 t = *ip++;
340 } while (TEST_IP && TEST_OP);
341 }
342
343 /* no EOF code was found */
344 *out_len = pd(op, out);
345 return LZO_E_EOF_NOT_FOUND;
346
347 eof_found:
348// LZO_UNUSED(o_m1_a); LZO_UNUSED(o_m1_b); LZO_UNUSED(o_m2);
349// LZO_UNUSED(o_m3_a); LZO_UNUSED(o_m3_b);
350 *out_len = pd(op, out);
351 return (ip == ip_end ? LZO_E_OK :
352 (ip < ip_end ? LZO_E_INPUT_NOT_CONSUMED : LZO_E_INPUT_OVERRUN));
353}
354
355/**********************************************************************/
/* OS and character-set values placed into the flags of headers we write */
#define F_OS F_OS_UNIX
#define F_CS F_CS_NATIVE

/* Starting values of the two running checksums */
#define ADLER32_INIT_VALUE 1
#define CRC32_INIT_VALUE 0
362
363/**********************************************************************/
/* Compression method identifiers, as stored in header_t.method */
enum {
	M_LZO1X_1    = 1,
	M_LZO1X_1_15 = 2,
	M_LZO1X_999  = 3,
};
368};
369
370/**********************************************************************/
371/* header flags */
/* _D: checksum of the uncompressed block data,
 * _C: checksum of the compressed block data */
#define F_ADLER32_D     0x00000001L
#define F_ADLER32_C     0x00000002L
#define F_H_EXTRA_FIELD 0x00000040L
#define F_H_GMTDIFF     0x00000080L
#define F_CRC32_D       0x00000100L
#define F_CRC32_C       0x00000200L
#define F_H_FILTER      0x00000800L
/* header checksum is CRC32 rather than Adler-32 */
#define F_H_CRC32       0x00001000L
#define F_MASK          0x00003FFFL

/* operating system & file system that created the file [mostly unused] */
#define F_OS_UNIX       0x03000000L
#define F_OS_SHIFT      24
#define F_OS_MASK       0xff000000L

/* character set for file name encoding [mostly unused] */
#define F_CS_NATIVE     0x00000000L
#define F_CS_SHIFT      20
#define F_CS_MASK       0x00f00000L

/* every bit outside the three masks above; these bits must be zero */
#define F_RESERVED      ((F_MASK | F_OS_MASK | F_CS_MASK) ^ 0xffffffffL)
394
/* A pair of running checksums; both are always updated together */
typedef struct chksum_t {
	uint32_t f_adler32;	/* running Adler-32 */
	uint32_t f_crc32;	/* running CRC32 */
} chksum_t;
399
/* In-memory form of the lzop file header */
typedef struct header_t {
	unsigned version;			/* written/read as 16 bits */
	unsigned lib_version;			/* written/read as 16 bits */
	unsigned version_needed_to_extract;	/* written/read as 16 bits */
	uint32_t flags;				/* F_xxx bits */
	uint32_t mode;
	uint32_t mtime;
	uint32_t gmtdiff;
	uint32_t header_checksum;

	uint32_t extra_field_len;
	uint32_t extra_field_checksum;

	unsigned char method;			/* one of M_LZO1X_xxx */
	unsigned char level;

	/* info */
	char name[255+1];			/* length is stored in one byte, plus NUL */
} header_t;
419
420struct globals {
Denys Vlasenko9ce642f2010-10-27 15:26:45 +0200421 /*const uint32_t *lzo_crc32_table;*/
Denis Vlasenko052ad9a2009-04-29 12:01:51 +0000422 chksum_t chksum_in;
423 chksum_t chksum_out;
Denys Vlasenko98a4c7c2010-02-04 15:00:15 +0100424} FIX_ALIASING;
Denis Vlasenko052ad9a2009-04-29 12:01:51 +0000425#define G (*(struct globals*)&bb_common_bufsiz1)
426#define INIT_G() do { } while (0)
427//#define G (*ptr_to_globals)
428//#define INIT_G() do {
Denys Vlasenkob7c9fb22011-02-03 00:05:48 +0100429// SET_PTR_TO_GLOBALS(xzalloc(sizeof(G)));
Denis Vlasenko052ad9a2009-04-29 12:01:51 +0000430//} while (0)
431
432
433/**********************************************************************/
/* lzop format version written into headers; also the newest
 * "version needed to extract" that read_header() accepts */
#define LZOP_VERSION 0x1010
//#define LZOP_VERSION_STRING "1.01"
//#define LZOP_VERSION_DATE "Apr 27th 2003"

/* The position of each letter is the bit number of its OPT_xxx flag */
#define OPTION_STRING "cfvdt123456789CF"
439
/* Option bits; bit N corresponds to character N of OPTION_STRING */
enum {
	OPT_STDOUT     = (1 << 0),	/* -c */
	OPT_FORCE      = (1 << 1),	/* -f */
	OPT_VERBOSE    = (1 << 2),	/* -v */
	OPT_DECOMPRESS = (1 << 3),	/* -d */
	OPT_TEST       = (1 << 4),	/* -t */
	OPT_1          = (1 << 5),
	OPT_2          = (1 << 6),
	OPT_3          = (1 << 7),
	OPT_4          = (1 << 8),
	OPT_5          = (1 << 9),
	OPT_6          = (1 << 10),
	OPT_789        = (7 << 11),	/* any of -7, -8, -9 */
	OPT_7          = (1 << 11),
	OPT_8          = (1 << 12),
	OPT_C          = (1 << 14),
	OPT_F          = (1 << 15),
};
457};
458
459/**********************************************************************/
460// adler32 checksum
461// adapted from free code by Mark Adler <madler@alumni.caltech.edu>
462// see http://www.zlib.org/
463/**********************************************************************/
464static FAST_FUNC uint32_t
465lzo_adler32(uint32_t adler, const uint8_t* buf, unsigned len)
466{
467 enum {
468 LZO_BASE = 65521, /* largest prime smaller than 65536 */
469 /* NMAX is the largest n such that
470 * 255n(n+1)/2 + (n+1)(BASE-1) <= 2^32-1 */
471 LZO_NMAX = 5552,
472 };
473 uint32_t s1 = adler & 0xffff;
474 uint32_t s2 = (adler >> 16) & 0xffff;
475 unsigned k;
476
477 if (buf == NULL)
478 return 1;
479
480 while (len > 0) {
481 k = len < LZO_NMAX ? (unsigned) len : LZO_NMAX;
482 len -= k;
483 if (k != 0) do {
484 s1 += *buf++;
485 s2 += s1;
486 } while (--k > 0);
487 s1 %= LZO_BASE;
488 s2 %= LZO_BASE;
489 }
490 return (s2 << 16) | s1;
491}
492
493static FAST_FUNC uint32_t
494lzo_crc32(uint32_t c, const uint8_t* buf, unsigned len)
495{
Denys Vlasenko9ce642f2010-10-27 15:26:45 +0200496 //if (buf == NULL) - impossible
497 // return 0;
Denis Vlasenko052ad9a2009-04-29 12:01:51 +0000498
Denys Vlasenko9ce642f2010-10-27 15:26:45 +0200499 return ~crc32_block_endian0(~c, buf, len, global_crc32_table);
Denis Vlasenko052ad9a2009-04-29 12:01:51 +0000500}
501
502/**********************************************************************/
503static void init_chksum(chksum_t *ct)
504{
505 ct->f_adler32 = ADLER32_INIT_VALUE;
506 ct->f_crc32 = CRC32_INIT_VALUE;
507}
508
509static void add_bytes_to_chksum(chksum_t *ct, const void* buf, int cnt)
510{
511 /* We need to handle the two checksums at once, because at the
512 * beginning of the header, we don't know yet which one we'll
513 * eventually need */
514 ct->f_adler32 = lzo_adler32(ct->f_adler32, (const uint8_t*)buf, cnt);
515 ct->f_crc32 = lzo_crc32(ct->f_crc32, (const uint8_t*)buf, cnt);
516}
517
518static uint32_t chksum_getresult(chksum_t *ct, const header_t *h)
519{
520 return (h->flags & F_H_CRC32) ? ct->f_crc32 : ct->f_adler32;
521}
522
523/**********************************************************************/
/* Read a 32-bit network-order value from fd 0 (not checksummed) */
static uint32_t read32(void)
{
	uint32_t net;

	xread(0, &net, sizeof(net));
	return ntohl(net);
}
530
/* Write v to fd 1 as a 32-bit network-order value (not checksummed) */
static void write32(uint32_t v)
{
	const uint32_t net = htonl(v);

	xwrite(1, &net, sizeof(net));
}
536
537static void f_write(const void* buf, int cnt)
538{
539 xwrite(1, buf, cnt);
540 add_bytes_to_chksum(&G.chksum_out, buf, cnt);
541}
542
543static void f_read(void* buf, int cnt)
544{
545 xread(0, buf, cnt);
546 add_bytes_to_chksum(&G.chksum_in, buf, cnt);
547}
548
/* Checksummed read of one byte; returns it as 0..255 */
static int f_read8(void)
{
	uint8_t byte;

	f_read(&byte, sizeof(byte));
	return byte;
}
555
/* Checksummed write of one byte */
static void f_write8(uint8_t v)
{
	f_write(&v, sizeof(v));
}
560
/* Checksummed read of a 16-bit network-order value */
static unsigned f_read16(void)
{
	uint16_t net;

	f_read(&net, sizeof(net));
	return ntohs(net);
}
567
/* Checksummed write of v as a 16-bit network-order value */
static void f_write16(uint16_t v)
{
	const uint16_t net = htons(v);

	f_write(&net, sizeof(net));
}
573
/* Checksummed read of a 32-bit network-order value */
static uint32_t f_read32(void)
{
	uint32_t net;

	f_read(&net, sizeof(net));
	return ntohl(net);
}
580
/* Checksummed write of v as a 32-bit network-order value */
static void f_write32(uint32_t v)
{
	const uint32_t net = htonl(v);

	f_write(&net, sizeof(net));
}
586
587/**********************************************************************/
588static int lzo_get_method(header_t *h)
589{
590 /* check method */
591 if (h->method == M_LZO1X_1) {
592 if (h->level == 0)
593 h->level = 3;
594 } else if (h->method == M_LZO1X_1_15) {
595 if (h->level == 0)
596 h->level = 1;
597 } else if (h->method == M_LZO1X_999) {
598 if (h->level == 0)
599 h->level = 9;
600 } else
601 return -1; /* not a LZO method */
602
603 /* check compression level */
604 if (h->level < 1 || h->level > 9)
605 return 15;
606
607 return 0;
608}
609
610/**********************************************************************/
/* Block size used when compressing */
#define LZO_BLOCK_SIZE (256 * 1024l)
/* Largest uncompressed block size accepted when decompressing */
#define MAX_BLOCK_SIZE (64 * 1024l * 1024l) /* DO NOT CHANGE */

/* LZO may expand uncompressible data by a small amount;
 * note that x is evaluated more than once */
#define MAX_COMPRESSED_SIZE(x) ((x) + (x) / 16 + 64 + 3)
616
617/**********************************************************************/
618// compress a file
619/**********************************************************************/
Denys Vlasenkoef5bc2c2009-10-08 14:54:18 +0200620static NOINLINE smallint lzo_compress(const header_t *h)
Denis Vlasenko052ad9a2009-04-29 12:01:51 +0000621{
622 unsigned block_size = LZO_BLOCK_SIZE;
623 int r = 0; /* LZO_E_OK */
624 uint8_t *const b1 = xzalloc(block_size);
625 uint8_t *const b2 = xzalloc(MAX_COMPRESSED_SIZE(block_size));
626 unsigned src_len = 0, dst_len = 0;
627 uint32_t d_adler32 = ADLER32_INIT_VALUE;
628 uint32_t d_crc32 = CRC32_INIT_VALUE;
629 int l;
630 smallint ok = 1;
631 uint8_t *wrk_mem = NULL;
632
633 if (h->method == M_LZO1X_1)
634 wrk_mem = xzalloc(LZO1X_1_MEM_COMPRESS);
635 else if (h->method == M_LZO1X_1_15)
636 wrk_mem = xzalloc(LZO1X_1_15_MEM_COMPRESS);
637 else if (h->method == M_LZO1X_999)
638 wrk_mem = xzalloc(LZO1X_999_MEM_COMPRESS);
639
640 for (;;) {
641 /* read a block */
642 l = full_read(0, b1, block_size);
643 src_len = (l > 0 ? l : 0);
644
645 /* write uncompressed block size */
646 write32(src_len);
647
648 /* exit if last block */
649 if (src_len == 0)
650 break;
651
652 /* compute checksum of uncompressed block */
653 if (h->flags & F_ADLER32_D)
654 d_adler32 = lzo_adler32(ADLER32_INIT_VALUE, b1, src_len);
655 if (h->flags & F_CRC32_D)
656 d_crc32 = lzo_crc32(CRC32_INIT_VALUE, b1, src_len);
657
658 /* compress */
659 if (h->method == M_LZO1X_1)
660 r = lzo1x_1_compress(b1, src_len, b2, &dst_len, wrk_mem);
661 else if (h->method == M_LZO1X_1_15)
662 r = lzo1x_1_15_compress(b1, src_len, b2, &dst_len, wrk_mem);
663#if ENABLE_LZOP_COMPR_HIGH
664 else if (h->method == M_LZO1X_999)
665 r = lzo1x_999_compress_level(b1, src_len, b2, &dst_len,
666 wrk_mem, h->level);
667#endif
668 else
669 bb_error_msg_and_die("internal error");
670
671 if (r != 0) /* not LZO_E_OK */
672 bb_error_msg_and_die("internal error - compression failed");
673
674 /* write compressed block size */
675 if (dst_len < src_len) {
676 /* optimize */
677 if (h->method == M_LZO1X_999) {
678 unsigned new_len = src_len;
679 r = lzo1x_optimize(b2, dst_len, b1, &new_len, NULL);
680 if (r != 0 /*LZO_E_OK*/ || new_len != src_len)
681 bb_error_msg_and_die("internal error - optimization failed");
682 }
683 write32(dst_len);
684 } else {
685 /* data actually expanded => store data uncompressed */
686 write32(src_len);
687 }
688
689 /* write checksum of uncompressed block */
690 if (h->flags & F_ADLER32_D)
691 write32(d_adler32);
692 if (h->flags & F_CRC32_D)
693 write32(d_crc32);
694
695 if (dst_len < src_len) {
696 /* write checksum of compressed block */
697 if (h->flags & F_ADLER32_C)
Denys Vlasenko9ce642f2010-10-27 15:26:45 +0200698 write32(lzo_adler32(ADLER32_INIT_VALUE, b2, dst_len));
Denis Vlasenko052ad9a2009-04-29 12:01:51 +0000699 if (h->flags & F_CRC32_C)
700 write32(lzo_crc32(CRC32_INIT_VALUE, b2, dst_len));
701 /* write compressed block data */
702 xwrite(1, b2, dst_len);
703 } else {
704 /* write uncompressed block data */
705 xwrite(1, b1, src_len);
706 }
707 }
708
709 free(wrk_mem);
710 free(b1);
711 free(b2);
712 return ok;
713}
714
Denys Vlasenko8ae6e9b2010-09-04 19:46:52 +0200715static FAST_FUNC void lzo_check(
716 uint32_t init,
717 uint8_t* buf, unsigned len,
718 uint32_t FAST_FUNC (*fn)(uint32_t, const uint8_t*, unsigned),
719 uint32_t ref)
Denis Vlasenko052ad9a2009-04-29 12:01:51 +0000720{
Denys Vlasenko8ae6e9b2010-09-04 19:46:52 +0200721 /* This function, by having the same order of parameters
722 * as fn, and by being marked FAST_FUNC (same as fn),
723 * saves a dozen bytes of code.
724 */
Denis Vlasenko052ad9a2009-04-29 12:01:51 +0000725 uint32_t c = fn(init, buf, len);
726 if (c != ref)
727 bb_error_msg_and_die("checksum error");
728}
729
730/**********************************************************************/
731// decompress a file
732/**********************************************************************/
Denys Vlasenkoef5bc2c2009-10-08 14:54:18 +0200733static NOINLINE smallint lzo_decompress(const header_t *h)
Denis Vlasenko052ad9a2009-04-29 12:01:51 +0000734{
735 unsigned block_size = LZO_BLOCK_SIZE;
736 int r;
737 uint32_t src_len, dst_len;
738 uint32_t c_adler32 = ADLER32_INIT_VALUE;
739 uint32_t d_adler32 = ADLER32_INIT_VALUE;
740 uint32_t c_crc32 = CRC32_INIT_VALUE, d_crc32 = CRC32_INIT_VALUE;
741 smallint ok = 1;
742 uint8_t *b1;
743 uint32_t mcs_block_size = MAX_COMPRESSED_SIZE(block_size);
744 uint8_t *b2 = NULL;
745
746 for (;;) {
747 uint8_t *dst;
748
749 /* read uncompressed block size */
750 dst_len = read32();
751
752 /* exit if last block */
753 if (dst_len == 0)
754 break;
755
756 /* error if split file */
757 if (dst_len == 0xffffffffL)
758 /* should not happen - not yet implemented */
759 bb_error_msg_and_die("this file is a split lzop file");
760
761 if (dst_len > MAX_BLOCK_SIZE)
Denys Vlasenkoccb88a62010-05-27 02:22:54 +0200762 bb_error_msg_and_die("corrupted data");
Denis Vlasenko052ad9a2009-04-29 12:01:51 +0000763
764 /* read compressed block size */
765 src_len = read32();
766 if (src_len <= 0 || src_len > dst_len)
Denys Vlasenkoccb88a62010-05-27 02:22:54 +0200767 bb_error_msg_and_die("corrupted data");
Denis Vlasenko052ad9a2009-04-29 12:01:51 +0000768
769 if (dst_len > block_size) {
770 if (b2) {
Denis Vlasenko052ad9a2009-04-29 12:01:51 +0000771 free(b2);
Denys Vlasenko8ae6e9b2010-09-04 19:46:52 +0200772 b2 = NULL;
Denis Vlasenko052ad9a2009-04-29 12:01:51 +0000773 }
774 block_size = dst_len;
775 mcs_block_size = MAX_COMPRESSED_SIZE(block_size);
776 }
777
778 /* read checksum of uncompressed block */
779 if (h->flags & F_ADLER32_D)
780 d_adler32 = read32();
781 if (h->flags & F_CRC32_D)
782 d_crc32 = read32();
783
784 /* read checksum of compressed block */
785 if (src_len < dst_len) {
786 if (h->flags & F_ADLER32_C)
787 c_adler32 = read32();
788 if (h->flags & F_CRC32_C)
789 c_crc32 = read32();
790 }
791
792 if (b2 == NULL)
793 b2 = xzalloc(mcs_block_size);
794 /* read the block into the end of our buffer */
795 b1 = b2 + mcs_block_size - src_len;
796 xread(0, b1, src_len);
797
798 if (src_len < dst_len) {
799 unsigned d = dst_len;
800
801 if (!(option_mask32 & OPT_F)) {
802 /* verify checksum of compressed block */
803 if (h->flags & F_ADLER32_C)
Denys Vlasenko8ae6e9b2010-09-04 19:46:52 +0200804 lzo_check(ADLER32_INIT_VALUE,
805 b1, src_len,
806 lzo_adler32, c_adler32);
Denis Vlasenko052ad9a2009-04-29 12:01:51 +0000807 if (h->flags & F_CRC32_C)
Denys Vlasenko8ae6e9b2010-09-04 19:46:52 +0200808 lzo_check(CRC32_INIT_VALUE,
809 b1, src_len,
810 lzo_crc32, c_crc32);
Denis Vlasenko052ad9a2009-04-29 12:01:51 +0000811 }
812
813 /* decompress */
814// if (option_mask32 & OPT_F)
815// r = lzo1x_decompress(b1, src_len, b2, &d, NULL);
816// else
817 r = lzo1x_decompress_safe(b1, src_len, b2, &d, NULL);
818
819 if (r != 0 /*LZO_E_OK*/ || dst_len != d) {
Denys Vlasenkoccb88a62010-05-27 02:22:54 +0200820 bb_error_msg_and_die("corrupted data");
Denis Vlasenko052ad9a2009-04-29 12:01:51 +0000821 }
822 dst = b2;
823 } else {
824 /* "stored" block => no decompression */
825 dst = b1;
826 }
827
828 if (!(option_mask32 & OPT_F)) {
829 /* verify checksum of uncompressed block */
830 if (h->flags & F_ADLER32_D)
Denys Vlasenko8ae6e9b2010-09-04 19:46:52 +0200831 lzo_check(ADLER32_INIT_VALUE,
832 dst, dst_len,
833 lzo_adler32, d_adler32);
Denis Vlasenko052ad9a2009-04-29 12:01:51 +0000834 if (h->flags & F_CRC32_D)
Denys Vlasenko8ae6e9b2010-09-04 19:46:52 +0200835 lzo_check(CRC32_INIT_VALUE,
836 dst, dst_len,
837 lzo_crc32, d_crc32);
Denis Vlasenko052ad9a2009-04-29 12:01:51 +0000838 }
839
840 /* write uncompressed block data */
841 xwrite(1, dst, dst_len);
842 }
843
844 free(b2);
845 return ok;
846}
847
848/**********************************************************************/
849// lzop file signature (shamelessly borrowed from PNG)
850/**********************************************************************/
851/*
852 * The first nine bytes of a lzop file always contain the following values:
853 *
854 * 0 1 2 3 4 5 6 7 8
855 * --- --- --- --- --- --- --- --- ---
856 * (hex) 89 4c 5a 4f 00 0d 0a 1a 0a
857 * (decimal) 137 76 90 79 0 13 10 26 10
858 * (C notation - ASCII) \211 L Z O \0 \r \n \032 \n
859 */
860
861/* (vda) comparison with lzop v1.02rc1 ("lzop -1 <FILE" cmd):
862 * Only slight differences in header:
863 * -00000000 89 4c 5a 4f 00 0d 0a 1a 0a 10 20 20 20 09 40 02
864 * +00000000 89 4c 5a 4f 00 0d 0a 1a 0a 10 10 20 30 09 40 02
865 * ^^^^^ ^^^^^
866 * version lib_version
867 * -00000010 01 03 00 00 0d 00 00 81 a4 49 f7 a6 3f 00 00 00
868 * +00000010 01 03 00 00 01 00 00 00 00 00 00 00 00 00 00 00
869 * ^^^^^^^^^^^ ^^^^^^^^^^^ ^^^^^^^^^^^
870 * flags mode mtime
871 * -00000020 00 00 2d 67 04 17 00 04 00 00 00 03 ed ec 9d 6d
872 * +00000020 00 00 10 5f 00 c1 00 04 00 00 00 03 ed ec 9d 6d
873 * ^^^^^^^^^^^
874 * chksum_out
875 * The rest is identical.
876*/
/* The nine signature bytes every lzop file starts with */
static const unsigned char lzop_magic[9] = {
	0x89, 'L', 'Z', 'O', 0x00, '\r', '\n', 0x1a, '\n'
};
880
881/* This coding is derived from Alexander Lehmann's pngcheck code. */
882static void check_magic(void)
883{
Denys Vlasenko9038d6f2009-07-15 20:02:19 +0200884 unsigned char magic[sizeof(lzop_magic)];
Denis Vlasenko052ad9a2009-04-29 12:01:51 +0000885 xread(0, magic, sizeof(magic));
886 if (memcmp(magic, lzop_magic, sizeof(lzop_magic)) != 0)
887 bb_error_msg_and_die("bad magic number");
888}
889
890/**********************************************************************/
891// lzop file header
892/**********************************************************************/
893static void write_header(const header_t *h)
894{
895 int l;
896
897 xwrite(1, lzop_magic, sizeof(lzop_magic));
898
899 init_chksum(&G.chksum_out);
900
901 f_write16(h->version);
902 f_write16(h->lib_version);
903 f_write16(h->version_needed_to_extract);
904 f_write8(h->method);
905 f_write8(h->level);
906 f_write32(h->flags);
907 f_write32(h->mode);
908 f_write32(h->mtime);
909 f_write32(h->gmtdiff);
910
911 l = (int) strlen(h->name);
912 f_write8(l);
913 if (l)
914 f_write(h->name, l);
915
916 f_write32(chksum_getresult(&G.chksum_out, h));
917}
918
919static int read_header(header_t *h)
920{
921 int r;
922 int l;
923 uint32_t checksum;
924
925 memset(h, 0, sizeof(*h));
926 h->version_needed_to_extract = 0x0900; /* first lzop version */
927 h->level = 0;
928
929 init_chksum(&G.chksum_in);
930
931 h->version = f_read16();
932 if (h->version < 0x0900)
933 return 3;
934 h->lib_version = f_read16();
935 if (h->version >= 0x0940) {
936 h->version_needed_to_extract = f_read16();
937 if (h->version_needed_to_extract > LZOP_VERSION)
938 return 16;
939 if (h->version_needed_to_extract < 0x0900)
940 return 3;
941 }
942 h->method = f_read8();
943 if (h->version >= 0x0940)
944 h->level = f_read8();
945 h->flags = f_read32();
946 if (h->flags & F_H_FILTER)
947 return 16; /* filter not supported */
948 h->mode = f_read32();
949 h->mtime = f_read32();
950 if (h->version >= 0x0940)
951 h->gmtdiff = f_read32();
952
953 l = f_read8();
954 if (l > 0)
955 f_read(h->name, l);
956 h->name[l] = 0;
957
958 checksum = chksum_getresult(&G.chksum_in, h);
959 h->header_checksum = f_read32();
960 if (h->header_checksum != checksum)
961 return 2;
962
963 if (h->method <= 0)
964 return 14;
965 r = lzo_get_method(h);
966 if (r != 0)
967 return r;
968
969 /* check reserved flags */
970 if (h->flags & F_RESERVED)
971 return -13;
972
973 /* skip extra field [not used yet] */
974 if (h->flags & F_H_EXTRA_FIELD) {
975 uint32_t k;
Denys Vlasenko9038d6f2009-07-15 20:02:19 +0200976
Denis Vlasenko052ad9a2009-04-29 12:01:51 +0000977 /* note: the checksum also covers the length */
978 init_chksum(&G.chksum_in);
979 h->extra_field_len = f_read32();
980 for (k = 0; k < h->extra_field_len; k++)
981 f_read8();
982 checksum = chksum_getresult(&G.chksum_in, h);
983 h->extra_field_checksum = f_read32();
984 if (h->extra_field_checksum != checksum)
985 return 3;
986 }
987
988 return 0;
989}
990
991static void p_header(header_t *h)
992{
993 int r;
994
995 r = read_header(h);
996 if (r == 0)
997 return;
998 bb_error_msg_and_die("header_error %d", r);
999}
1000
1001/**********************************************************************/
1002// compress
1003/**********************************************************************/
1004static void lzo_set_method(header_t *h)
1005{
1006 int level = 1;
1007
1008 if (option_mask32 & OPT_1) {
1009 h->method = M_LZO1X_1_15;
1010 } else if (option_mask32 & OPT_789) {
1011#if ENABLE_LZOP_COMPR_HIGH
1012 h->method = M_LZO1X_999;
1013 if (option_mask32 & OPT_7)
1014 level = 7;
1015 else if (option_mask32 & OPT_8)
1016 level = 8;
1017 else
1018 level = 9;
1019#else
1020 bb_error_msg_and_die("high compression not compiled in");
1021#endif
1022 } else { /* levels 2..6 or none (defaults to level 3) */
1023 h->method = M_LZO1X_1;
1024 level = 5; /* levels 2-6 are actually the same */
1025 }
1026
1027 h->level = level;
1028}
1029
1030static smallint do_lzo_compress(void)
1031{
1032 header_t header;
1033
1034#define h (&header)
1035 memset(h, 0, sizeof(*h));
1036
1037 lzo_set_method(h);
1038
1039 h->version = (LZOP_VERSION & 0xffff);
1040 h->version_needed_to_extract = 0x0940;
1041 h->lib_version = lzo_version() & 0xffff;
1042
1043 h->flags = (F_OS & F_OS_MASK) | (F_CS & F_CS_MASK);
1044
1045 if (!(option_mask32 & OPT_F) || h->method == M_LZO1X_999) {
1046 h->flags |= F_ADLER32_D;
1047 if (option_mask32 & OPT_C)
1048 h->flags |= F_ADLER32_C;
1049 }
1050 write_header(h);
1051 return lzo_compress(h);
1052#undef h
1053}
1054
1055/**********************************************************************/
1056// decompress
1057/**********************************************************************/
1058static smallint do_lzo_decompress(void)
1059{
1060 header_t header;
Denys Vlasenko9038d6f2009-07-15 20:02:19 +02001061
Denis Vlasenko052ad9a2009-04-29 12:01:51 +00001062 check_magic();
1063 p_header(&header);
1064 return lzo_decompress(&header);
1065}
1066
Denys Vlasenko39a04f72010-05-31 14:18:57 +02001067static char* FAST_FUNC make_new_name_lzop(char *filename, const char *expected_ext UNUSED_PARAM)
Denis Vlasenko052ad9a2009-04-29 12:01:51 +00001068{
1069 if (option_mask32 & OPT_DECOMPRESS) {
1070 char *extension = strrchr(filename, '.');
1071 if (!extension || strcmp(extension + 1, "lzo") != 0)
1072 return xasprintf("%s.out", filename);
1073 *extension = '\0';
1074 return filename;
1075 }
1076 return xasprintf("%s.lzo", filename);
1077}
1078
Denys Vlasenko39a04f72010-05-31 14:18:57 +02001079static IF_DESKTOP(long long) int FAST_FUNC pack_lzop(unpack_info_t *info UNUSED_PARAM)
Denis Vlasenko052ad9a2009-04-29 12:01:51 +00001080{
1081 if (option_mask32 & OPT_DECOMPRESS)
1082 return do_lzo_decompress();
1083 return do_lzo_compress();
1084}
1085
1086int lzop_main(int argc, char **argv) MAIN_EXTERNALLY_VISIBLE;
1087int lzop_main(int argc UNUSED_PARAM, char **argv)
1088{
1089 getopt32(argv, OPTION_STRING);
1090 argv += optind;
1091 /* lzopcat? */
1092 if (applet_name[4] == 'c')
1093 option_mask32 |= (OPT_STDOUT | OPT_DECOMPRESS);
1094 /* unlzop? */
1095 if (applet_name[0] == 'u')
1096 option_mask32 |= OPT_DECOMPRESS;
1097
Denys Vlasenko9ce642f2010-10-27 15:26:45 +02001098 global_crc32_table = crc32_filltable(NULL, 0);
Denys Vlasenko39a04f72010-05-31 14:18:57 +02001099 return bbunpack(argv, pack_lzop, make_new_name_lzop, /*unused:*/ NULL);
Denis Vlasenko052ad9a2009-04-29 12:01:51 +00001100}