blob: 8eb5ca9aef43b5d728800e021ac64f3f5767d390 [file] [log] [blame]
Denis Vlasenko77f1ec12007-10-13 03:36:03 +00001/*
2 * Copyright (C) 2007 Denys Vlasenko <vda.linux@googlemail.com>
3 *
4 * This file uses bzip2 library code which is written
5 * by Julian Seward <jseward@bzip.org>.
6 * See README and LICENSE files in bz/ directory for more information
7 * about bzip2 library code.
8 */
9
10#include "libbb.h"
Denis Vlasenko1a9e9bd2008-11-01 12:54:56 +000011#include "unarchive.h"
Denis Vlasenko77f1ec12007-10-13 03:36:03 +000012
Denis Vlasenkoef3aabe2007-10-14 00:43:01 +000013#define CONFIG_BZIP2_FEATURE_SPEED 1
14
15/* Speed test:
16 * Compiled with gcc 4.2.1, run on Athlon 64 1800 MHz (512K L2 cache).
17 * Stock bzip2 is 26.4% slower than bbox bzip2 at SPEED 1
18 * (time to compress gcc-4.2.1.tar is 126.4% compared to bbox).
19 * At SPEED 5 difference is 32.7%.
20 *
21 * Test run of all CONFIG_BZIP2_FEATURE_SPEED values on a 11Mb text file:
22 * Size Time (3 runs)
23 * 0: 10828 4.145 4.146 4.148
24 * 1: 11097 3.845 3.860 3.861
25 * 2: 11392 3.763 3.767 3.768
26 * 3: 11892 3.722 3.724 3.727
27 * 4: 12740 3.637 3.640 3.644
28 * 5: 17273 3.497 3.509 3.509
29 */
30
31
32#define BZ_DEBUG 0
33/* Takes ~300 bytes, detects corruption caused by bad RAM etc */
34#define BZ_LIGHT_DEBUG 0
Denis Vlasenko77f1ec12007-10-13 03:36:03 +000035
36#include "bz/bzlib.h"
37
38#include "bz/bzlib_private.h"
39
40#include "bz/blocksort.c"
41#include "bz/bzlib.c"
42#include "bz/compress.c"
Denis Vlasenko77f1ec12007-10-13 03:36:03 +000043#include "bz/huffman.c"
Denis Vlasenko77f1ec12007-10-13 03:36:03 +000044
/* There is no reason to be shy and use a very small buffer here:
 * bzip2's internal buffers are much bigger anyway (hundreds of kbytes).
 * If iobuf is several pages long, malloc() may use mmap,
 * making iobuf page aligned and thus (maybe) saving one memcpy
 * if the kernel is clever enough.
 */
enum { IOBUF_SIZE = 8 * 1024 };

/* Compression level: set by bzip2_main() from the -1..-9 options
 * and handed to BZ2_bzCompressInit() by compressStream().
 */
static uint8_t level;
56
57/* NB: compressStream() has to return -1 on errors, not die.
58 * bbunpack() will correctly clean up in this case
59 * (delete incomplete .bz2 file)
60 */
61
Denis Vlasenko77f1ec12007-10-13 03:36:03 +000062/* Returns:
Denis Vlasenko31acd1b2007-10-17 10:14:11 +000063 * -1 on errors
64 * total written bytes so far otherwise
Denis Vlasenko77f1ec12007-10-13 03:36:03 +000065 */
66static
Denis Vlasenko31acd1b2007-10-17 10:14:11 +000067USE_DESKTOP(long long) int bz_write(bz_stream *strm, void* rbuf, ssize_t rlen, void *wbuf)
Denis Vlasenko77f1ec12007-10-13 03:36:03 +000068{
69 int n, n2, ret;
70
Denis Vlasenko77f1ec12007-10-13 03:36:03 +000071 strm->avail_in = rlen;
Denis Vlasenko31acd1b2007-10-17 10:14:11 +000072 strm->next_in = rbuf;
Denis Vlasenko77f1ec12007-10-13 03:36:03 +000073 while (1) {
74 strm->avail_out = IOBUF_SIZE;
75 strm->next_out = wbuf;
76
Denis Vlasenko31acd1b2007-10-17 10:14:11 +000077 ret = BZ2_bzCompress(strm, rlen ? BZ_RUN : BZ_FINISH);
78 if (ret != BZ_RUN_OK /* BZ_RUNning */
79 && ret != BZ_FINISH_OK /* BZ_FINISHing, but not done yet */
80 && ret != BZ_STREAM_END /* BZ_FINISHed */
81 ) {
Denis Vlasenko77f1ec12007-10-13 03:36:03 +000082 bb_error_msg_and_die("internal error %d", ret);
Denis Vlasenko77f1ec12007-10-13 03:36:03 +000083 }
84
Denis Vlasenko77f1ec12007-10-13 03:36:03 +000085 n = IOBUF_SIZE - strm->avail_out;
86 if (n) {
87 n2 = full_write(STDOUT_FILENO, wbuf, n);
Denis Vlasenko31acd1b2007-10-17 10:14:11 +000088 if (n2 != n) {
89 if (n2 >= 0)
90 errno = 0; /* prevent bogus error message */
91 bb_perror_msg(n2 >= 0 ? "short write" : "write error");
92 return -1;
93 }
Denis Vlasenko77f1ec12007-10-13 03:36:03 +000094 }
95
96 if (ret == BZ_STREAM_END)
97 break;
Denis Vlasenko31acd1b2007-10-17 10:14:11 +000098 if (rlen && strm->avail_in == 0)
99 break;
Denis Vlasenko77f1ec12007-10-13 03:36:03 +0000100 }
Denis Vlasenko31acd1b2007-10-17 10:14:11 +0000101 return 0 USE_DESKTOP( + strm->total_out );
Denis Vlasenko77f1ec12007-10-13 03:36:03 +0000102}
103
Denis Vlasenko77f1ec12007-10-13 03:36:03 +0000104static
Denis Vlasenko1a9e9bd2008-11-01 12:54:56 +0000105USE_DESKTOP(long long) int compressStream(unpack_info_t *info UNUSED_PARAM)
Denis Vlasenko77f1ec12007-10-13 03:36:03 +0000106{
107 USE_DESKTOP(long long) int total;
108 ssize_t count;
109 bz_stream bzs; /* it's small */
110#define strm (&bzs)
111 char *iobuf;
112#define rbuf iobuf
113#define wbuf (iobuf + IOBUF_SIZE)
114
115 iobuf = xmalloc(2 * IOBUF_SIZE);
Denis Vlasenkob6ccd322007-10-14 07:51:19 +0000116 BZ2_bzCompressInit(strm, level);
Denis Vlasenko77f1ec12007-10-13 03:36:03 +0000117
118 while (1) {
119 count = full_read(STDIN_FILENO, rbuf, IOBUF_SIZE);
Denis Vlasenko31acd1b2007-10-17 10:14:11 +0000120 if (count < 0) {
Denis Vlasenko77f1ec12007-10-13 03:36:03 +0000121 bb_perror_msg("read error");
Denis Vlasenko31acd1b2007-10-17 10:14:11 +0000122 total = -1;
Denis Vlasenko77f1ec12007-10-13 03:36:03 +0000123 break;
124 }
Denis Vlasenko31acd1b2007-10-17 10:14:11 +0000125 /* if count == 0, bz_write finalizes compression */
126 total = bz_write(strm, rbuf, count, wbuf);
127 if (count == 0 || total < 0)
128 break;
Denis Vlasenko77f1ec12007-10-13 03:36:03 +0000129 }
130
Denis Vlasenko31acd1b2007-10-17 10:14:11 +0000131#if ENABLE_FEATURE_CLEAN_UP
132 BZ2_bzCompressEnd(strm);
Denis Vlasenko77f1ec12007-10-13 03:36:03 +0000133 free(iobuf);
Denis Vlasenko31acd1b2007-10-17 10:14:11 +0000134#endif
135 return total;
Denis Vlasenko77f1ec12007-10-13 03:36:03 +0000136}
137
/* Name-builder callback for bbunpack(): returns the xasprintf() result
 * for filename with ".bz2" appended.
 */
static
char* make_new_name_bzip2(char *filename)
{
	char *new_name;

	new_name = xasprintf("%s.bz2", filename);
	return new_name;
}
143
144int bzip2_main(int argc, char **argv) MAIN_EXTERNALLY_VISIBLE;
Denis Vlasenkoa60f84e2008-07-05 09:18:54 +0000145int bzip2_main(int argc UNUSED_PARAM, char **argv)
Denis Vlasenko77f1ec12007-10-13 03:36:03 +0000146{
147 unsigned opt;
148
Denis Vlasenkob6ccd322007-10-14 07:51:19 +0000149 /* standard bzip2 flags
150 * -d --decompress force decompression
151 * -z --compress force compression
152 * -k --keep keep (don't delete) input files
153 * -f --force overwrite existing output files
154 * -t --test test compressed file integrity
155 * -c --stdout output to standard out
156 * -q --quiet suppress noncritical error messages
157 * -v --verbose be verbose (a 2nd -v gives more)
158 * -s --small use less memory (at most 2500k)
159 * -1 .. -9 set block size to 100k .. 900k
160 * --fast alias for -1
161 * --best alias for -9
162 */
163
Denis Vlasenko008eda22007-10-16 10:47:27 +0000164 opt_complementary = "s2"; /* -s means -2 (compatibility) */
Denis Vlasenko77f1ec12007-10-13 03:36:03 +0000165 /* Must match bbunzip's constants OPT_STDOUT, OPT_FORCE! */
Denis Vlasenko55da0be2008-06-27 21:52:41 +0000166 opt = getopt32(argv, "cfv" USE_BUNZIP2("dt") "123456789qzs");
Denis Vlasenko77f1ec12007-10-13 03:36:03 +0000167#if ENABLE_BUNZIP2 /* bunzip2_main may not be visible... */
Denis Vlasenko55da0be2008-06-27 21:52:41 +0000168 if (opt & 0x18) // -d and/or -t
Denis Vlasenko77f1ec12007-10-13 03:36:03 +0000169 return bunzip2_main(argc, argv);
Denis Vlasenko55da0be2008-06-27 21:52:41 +0000170 opt >>= 5;
Denis Vlasenkob6ccd322007-10-14 07:51:19 +0000171#else
172 opt >>= 3;
Denis Vlasenko77f1ec12007-10-13 03:36:03 +0000173#endif
Denis Vlasenkob6ccd322007-10-14 07:51:19 +0000174 opt = (uint8_t)opt; /* isolate bits for -1..-8 */
175 opt |= 0x100; /* if nothing else, assume -9 */
176 level = 1;
177 while (!(opt & 1)) {
178 level++;
179 opt >>= 1;
180 }
Denis Vlasenko77f1ec12007-10-13 03:36:03 +0000181
Denis Vlasenkob6ccd322007-10-14 07:51:19 +0000182 argv += optind;
183 option_mask32 &= 0x7; /* ignore all except -cfv */
Denis Vlasenko77f1ec12007-10-13 03:36:03 +0000184 return bbunpack(argv, make_new_name_bzip2, compressStream);
185}