blob: 3dd9bbf4934eb51ed23f2e7dadad784a66dc7f99 [file] [log] [blame]
/*
 * This file uses XZ Embedded library code which is written
 * by Lasse Collin <lasse.collin@tukaani.org>
 * and Igor Pavlov <http://7-zip.org/>
 *
 * See README file in unxz/ directory for more information.
 *
 * This file is:
 * Copyright (C) 2010 Denys Vlasenko <vda.linux@googlemail.com>
 * Licensed under GPLv2, see file LICENSE in this source tree.
 */
12#include "libbb.h"
Denys Vlasenkod184a722011-09-22 12:45:14 +020013#include "bb_archive.h"
Denys Vlasenkofb6c76c2010-05-30 03:47:40 +020014
Denys Vlasenkofb6c76c2010-05-30 03:47:40 +020015#define XZ_FUNC FAST_FUNC
16#define XZ_EXTERN static
17
Denys Vlasenkoba73cfd2010-06-20 02:40:56 +020018#define XZ_DEC_DYNALLOC
19
Denys Vlasenko716f3f62010-06-01 14:41:39 +020020/* Skip check (rather than fail) of unsupported hash functions */
21#define XZ_DEC_ANY_CHECK 1
22
23/* We use our own crc32 function */
24#define XZ_INTERNAL_CRC32 0
Denys Vlasenko716f3f62010-06-01 14:41:39 +020025static uint32_t xz_crc32(const uint8_t *buf, size_t size, uint32_t crc)
Denys Vlasenkofb6c76c2010-05-30 03:47:40 +020026{
Denys Vlasenko9ce642f2010-10-27 15:26:45 +020027 return ~crc32_block_endian0(~crc, buf, size, global_crc32_table);
Denys Vlasenkofb6c76c2010-05-30 03:47:40 +020028}
Denys Vlasenkofb6c76c2010-05-30 03:47:40 +020029
/* We use arch-optimized unaligned fixed-endian accessors.
 * They have been moved to libbb (they proved to be useful elsewhere as well);
 * here we just check that they are defined:
 */
34#if !defined(get_unaligned_le32) \
35 || !defined(get_unaligned_be32) \
36 || !defined(put_unaligned_le32) \
37 || !defined(put_unaligned_be32)
38# error get_unaligned_le32 accessors are not defined
39#endif
Denys Vlasenkofb6c76c2010-05-30 03:47:40 +020040
Denys Vlasenkofb6c76c2010-05-30 03:47:40 +020041#include "unxz/xz_dec_bcj.c"
42#include "unxz/xz_dec_lzma2.c"
43#include "unxz/xz_dec_stream.c"
Denys Vlasenkofb6c76c2010-05-30 03:47:40 +020044
45IF_DESKTOP(long long) int FAST_FUNC
Denys Vlasenkob4c11c12014-12-07 00:44:00 +010046unpack_xz_stream(transformer_state_t *xstate)
Denys Vlasenkofb6c76c2010-05-30 03:47:40 +020047{
Lasse Collin380c8a02013-02-27 17:26:40 +010048 enum xz_ret xz_result;
Denys Vlasenkofb6c76c2010-05-30 03:47:40 +020049 struct xz_buf iobuf;
50 struct xz_dec *state;
51 unsigned char *membuf;
52 IF_DESKTOP(long long) int total = 0;
Denys Vlasenkofb6c76c2010-05-30 03:47:40 +020053
Denys Vlasenko9ce642f2010-10-27 15:26:45 +020054 if (!global_crc32_table)
Denys Vlasenkoddacb032018-02-01 10:56:19 +010055 global_crc32_new_table_le();
Denys Vlasenko8376bfa2010-06-01 23:26:54 +020056
Denys Vlasenkofb6c76c2010-05-30 03:47:40 +020057 memset(&iobuf, 0, sizeof(iobuf));
Denys Vlasenko8a6a2f92012-03-06 16:27:48 +010058 membuf = xmalloc(2 * BUFSIZ);
Denys Vlasenkofb6c76c2010-05-30 03:47:40 +020059 iobuf.in = membuf;
Denys Vlasenkoba73cfd2010-06-20 02:40:56 +020060 iobuf.out = membuf + BUFSIZ;
61 iobuf.out_size = BUFSIZ;
Denys Vlasenkofb6c76c2010-05-30 03:47:40 +020062
Denys Vlasenko984b0a62016-06-20 11:06:42 +020063 if (!xstate || xstate->signature_skipped) {
Denys Vlasenko8a6a2f92012-03-06 16:27:48 +010064 /* Preload XZ file signature */
65 strcpy((char*)membuf, HEADER_MAGIC);
66 iobuf.in_size = HEADER_MAGIC_SIZE;
67 } /* else: let xz code read & check it */
68
Denys Vlasenkoba73cfd2010-06-20 02:40:56 +020069 /* Limit memory usage to about 64 MiB. */
70 state = xz_dec_init(XZ_DYNALLOC, 64*1024*1024);
Denys Vlasenkofb6c76c2010-05-30 03:47:40 +020071
Lasse Collin380c8a02013-02-27 17:26:40 +010072 xz_result = X_OK;
Denys Vlasenkofb6c76c2010-05-30 03:47:40 +020073 while (1) {
Denys Vlasenkoba73cfd2010-06-20 02:40:56 +020074 if (iobuf.in_pos == iobuf.in_size) {
Denys Vlasenkob4c11c12014-12-07 00:44:00 +010075 int rd = safe_read(xstate->src_fd, membuf, BUFSIZ);
Denys Vlasenkofb6c76c2010-05-30 03:47:40 +020076 if (rd < 0) {
James Byrne69374872019-07-02 11:35:03 +020077 bb_simple_error_msg(bb_msg_read_error);
Denys Vlasenkofb6c76c2010-05-30 03:47:40 +020078 total = -1;
79 break;
80 }
Lasse Collin380c8a02013-02-27 17:26:40 +010081 if (rd == 0 && xz_result == XZ_STREAM_END)
82 break;
Denys Vlasenkoba73cfd2010-06-20 02:40:56 +020083 iobuf.in_size = rd;
84 iobuf.in_pos = 0;
Denys Vlasenkofb6c76c2010-05-30 03:47:40 +020085 }
Lasse Collin380c8a02013-02-27 17:26:40 +010086 if (xz_result == XZ_STREAM_END) {
87 /*
88 * Try to start decoding next concatenated stream.
89 * Stream padding must always be a multiple of four
90 * bytes to preserve four-byte alignment. To keep the
91 * code slightly smaller, we aren't as strict here as
92 * the .xz spec requires. We just skip all zero-bytes
93 * without checking the alignment and thus can accept
94 * files that aren't valid, e.g. the XZ utils test
95 * files bad-0pad-empty.xz and bad-0catpad-empty.xz.
96 */
97 do {
98 if (membuf[iobuf.in_pos] != 0) {
Denys Vlasenko42f454b2019-10-11 14:11:44 +020099 /* There is more data, but is it XZ data?
100 * Example: dpkg-deb -f busybox_1.30.1-4_amd64.deb
101 * reads control.tar.xz "control" file
102 * inside the ar archive, but tar.xz
103 * extraction code reaches end of xz data,
104 * reached this code and reads the beginning
105 * of data.tar.xz's ar header, which isn't xz data,
106 * and prints "corrupted data".
107 * The correct solution is to not read
108 * past nested archive (to simulate EOF).
109 * This is a workaround:
110 */
111 if (membuf[iobuf.in_pos] != 0xfd) {
112 /* It's definitely not a xz signature
113 * (which is 0xfd,"7zXZ",0x00).
114 */
115 goto end;
116 }
Lasse Collin380c8a02013-02-27 17:26:40 +0100117 xz_dec_reset(state);
118 goto do_run;
119 }
120 iobuf.in_pos++;
121 } while (iobuf.in_pos < iobuf.in_size);
122 }
123 do_run:
Denys Vlasenkofb6c76c2010-05-30 03:47:40 +0200124// bb_error_msg(">in pos:%d size:%d out pos:%d size:%d",
125// iobuf.in_pos, iobuf.in_size, iobuf.out_pos, iobuf.out_size);
Lasse Collin380c8a02013-02-27 17:26:40 +0100126 xz_result = xz_dec_run(state, &iobuf);
Denys Vlasenkofb6c76c2010-05-30 03:47:40 +0200127// bb_error_msg("<in pos:%d size:%d out pos:%d size:%d r:%d",
Lasse Collin380c8a02013-02-27 17:26:40 +0100128// iobuf.in_pos, iobuf.in_size, iobuf.out_pos, iobuf.out_size, xz_result);
Denys Vlasenkoba73cfd2010-06-20 02:40:56 +0200129 if (iobuf.out_pos) {
Denys Vlasenkob4c11c12014-12-07 00:44:00 +0100130 xtransformer_write(xstate, iobuf.out, iobuf.out_pos);
Denys Vlasenkoba73cfd2010-06-20 02:40:56 +0200131 IF_DESKTOP(total += iobuf.out_pos;)
132 iobuf.out_pos = 0;
Denys Vlasenkofb6c76c2010-05-30 03:47:40 +0200133 }
Lasse Collin380c8a02013-02-27 17:26:40 +0100134 if (xz_result == XZ_STREAM_END) {
135 /*
136 * Can just "break;" here, if not for concatenated
137 * .xz streams.
138 * Checking for padding may require buffer
139 * replenishment. Can't do it here.
140 */
141 continue;
Denys Vlasenkofb6c76c2010-05-30 03:47:40 +0200142 }
Lasse Collin380c8a02013-02-27 17:26:40 +0100143 if (xz_result != XZ_OK && xz_result != XZ_UNSUPPORTED_CHECK) {
James Byrne69374872019-07-02 11:35:03 +0200144 bb_simple_error_msg("corrupted data");
Denys Vlasenkofb6c76c2010-05-30 03:47:40 +0200145 total = -1;
146 break;
147 }
Denys Vlasenkofb6c76c2010-05-30 03:47:40 +0200148 }
Denys Vlasenko42f454b2019-10-11 14:11:44 +0200149 end:
Denys Vlasenkofb6c76c2010-05-30 03:47:40 +0200150 xz_dec_end(state);
151 free(membuf);
152
153 return total;
154}