blob: 51025529dcaa2ec51beed88e317a768051074f21 [file] [log] [blame]
Glenn L McGrath87ac7022002-01-02 13:52:26 +00001/* vi: set sw=4 ts=4: */
2/*
3 * Mini unzip implementation for busybox
4 *
Paul Fox0840b762005-07-20 20:26:49 +00005 * Copyright (C) 2004 by Ed Clark
6 *
7 * Loosely based on original busybox unzip applet by Laurence Anderson.
8 * All options and features should work in this version.
Glenn L McGrath87ac7022002-01-02 13:52:26 +00009 *
Denys Vlasenko0ef64bd2010-08-16 20:14:46 +020010 * Licensed under GPLv2 or later, see file LICENSE in this source tree.
Glenn L McGrath87ac7022002-01-02 13:52:26 +000011 */
Glenn L McGrathf34b0e92004-06-06 10:22:43 +000012/* For reference see
Paul Fox0840b762005-07-20 20:26:49 +000013 * http://www.pkware.com/company/standards/appnote/
Glenn L McGrathf34b0e92004-06-06 10:22:43 +000014 * http://www.info-zip.org/pub/infozip/doc/appnote-iz-latest.zip
Denys Vlasenko66620fa2013-11-14 09:53:52 +010015 *
16 * TODO
Paul Fox0840b762005-07-20 20:26:49 +000017 * Zip64 + other methods
Paul Fox0840b762005-07-20 20:26:49 +000018 */
Denys Vlasenkof6beef62013-11-14 11:39:00 +010019//config:config UNZIP
20//config: bool "unzip"
21//config: default y
22//config: help
23//config: unzip will list or extract files from a ZIP archive,
24//config: commonly found on DOS/WIN systems. The default behavior
25//config: (with no options) is to extract the archive into the
Denys Vlasenkoe3c4db82017-01-05 11:43:53 +010026//config: current directory.
27//config:
28//config:config FEATURE_UNZIP_CDF
29//config: bool "Read and use Central Directory data"
30//config: default y
31//config: depends on UNZIP
32//config: help
33//config: If you know that you only need to deal with simple
Denys Vlasenkoecba2942017-01-05 11:47:28 +010034//config: ZIP files without deleted/updated files, SFX archives etc,
Denys Vlasenkoe3c4db82017-01-05 11:43:53 +010035//config: you can reduce code size by unselecting this option.
36//config: To support less trivial ZIPs, say Y.
Denys Vlasenko2a0867a2017-01-09 10:58:37 +010037//config:
38//config:config FEATURE_UNZIP_BZIP2
39//config: bool "Support compression method 12 (bzip2)"
40//config: default y
41//config: depends on FEATURE_UNZIP_CDF && DESKTOP
42// FEATURE_UNZIP_CDF is needed, otherwise we can't find start of next file
43// DESKTOP is needed to get back uncompressed length
44//config:
45//config:config FEATURE_UNZIP_LZMA
46//config: bool "Support compression method 14 (lzma)"
47//config: default y
48//config: depends on FEATURE_UNZIP_CDF && DESKTOP
Denys Vlasenko6b4f4b52017-01-09 11:12:01 +010049//config:
50//config:config FEATURE_UNZIP_XZ
51//config: bool "Support compression method 95 (xz)"
52//config: default y
53//config: depends on FEATURE_UNZIP_CDF && DESKTOP
Denys Vlasenkof6beef62013-11-14 11:39:00 +010054
Denys Vlasenkoac216872013-11-14 11:38:18 +010055//applet:IF_UNZIP(APPLET(unzip, BB_DIR_USR_BIN, BB_SUID_DROP))
Denys Vlasenko66620fa2013-11-14 09:53:52 +010056//kbuild:lib-$(CONFIG_UNZIP) += unzip.o
57
Pere Orga1f4447b2011-03-27 22:40:30 +020058//usage:#define unzip_trivial_usage
Denys Vlasenkoe3e0d2b2012-06-19 12:46:59 +020059//usage: "[-lnopq] FILE[.zip] [FILE]... [-x FILE...] [-d DIR]"
Pere Orga1f4447b2011-03-27 22:40:30 +020060//usage:#define unzip_full_usage "\n\n"
Denys Vlasenkoe3e0d2b2012-06-19 12:46:59 +020061//usage: "Extract FILEs from ZIP archive\n"
62//usage: "\n -l List contents (with -q for short form)"
Denys Vlasenkoc5b01012012-06-15 16:43:26 +020063//usage: "\n -n Never overwrite files (default: ask)"
Pere Orga1f4447b2011-03-27 22:40:30 +020064//usage: "\n -o Overwrite"
Denys Vlasenkoe3e0d2b2012-06-19 12:46:59 +020065//usage: "\n -p Print to stdout"
Pere Orga1f4447b2011-03-27 22:40:30 +020066//usage: "\n -q Quiet"
Denys Vlasenkoe3e0d2b2012-06-19 12:46:59 +020067//usage: "\n -x FILE Exclude FILEs"
68//usage: "\n -d DIR Extract into DIR"
Pere Orga1f4447b2011-03-27 22:40:30 +020069
Denis Vlasenkob6adbf12007-05-26 19:00:18 +000070#include "libbb.h"
Denys Vlasenkod184a722011-09-22 12:45:14 +020071#include "bb_archive.h"
Glenn L McGrath87ac7022002-01-02 13:52:26 +000072
Denys Vlasenko0ccf52a2016-04-17 21:05:34 +020073#if 0
74# define dbg(...) bb_error_msg(__VA_ARGS__)
75#else
76# define dbg(...) ((void)0)
77#endif
78
/*
 * Four-byte record signatures ('P' 'K' plus two type bytes).
 * Each value is spelled for the host byte order, so a signature read
 * straight from the archive into a uint32_t can be compared as-is.
 */
enum {
#if !BB_BIG_ENDIAN
	ZIP_FILEHEADER_MAGIC = 0x04034b50, /* local file header */
	ZIP_CDF_MAGIC        = 0x02014b50, /* CDF item */
	ZIP_CDE_MAGIC        = 0x06054b50, /* End of CDF */
	ZIP_DD_MAGIC         = 0x08074b50, /* data descriptor */
#else
	ZIP_FILEHEADER_MAGIC = 0x504b0304, /* local file header */
	ZIP_CDF_MAGIC        = 0x504b0102, /* CDF item */
	ZIP_CDE_MAGIC        = 0x504b0506, /* End of CDF */
	ZIP_DD_MAGIC         = 0x504b0708, /* data descriptor */
#endif
};
Glenn L McGrath7ca04f32002-09-25 02:47:48 +000092
Paul Foxcb981632007-11-05 23:09:03 +000093#define ZIP_HEADER_LEN 26
94
Paul Fox0840b762005-07-20 20:26:49 +000095typedef union {
Paul Foxcb981632007-11-05 23:09:03 +000096 uint8_t raw[ZIP_HEADER_LEN];
Paul Fox0840b762005-07-20 20:26:49 +000097 struct {
Denis Vlasenko006e8622008-09-21 01:01:46 +000098 uint16_t version; /* 0-1 */
Denys Vlasenkoe98884b2010-05-24 04:46:18 +020099 uint16_t zip_flags; /* 2-3 */
Denis Vlasenko006e8622008-09-21 01:01:46 +0000100 uint16_t method; /* 4-5 */
101 uint16_t modtime; /* 6-7 */
102 uint16_t moddate; /* 8-9 */
103 uint32_t crc32 PACKED; /* 10-13 */
104 uint32_t cmpsize PACKED; /* 14-17 */
105 uint32_t ucmpsize PACKED; /* 18-21 */
106 uint16_t filename_len; /* 22-23 */
107 uint16_t extra_len; /* 24-25 */
Denys Vlasenkoe3c4db82017-01-05 11:43:53 +0100108 /* filename follows (not NUL terminated) */
109 /* extra field follows */
110 /* data follows */
Denys Vlasenko0ffac1c2017-01-08 14:14:19 +0100111 } fmt PACKED;
Denis Vlasenkoa60f84e2008-07-05 09:18:54 +0000112} zip_header_t; /* PACKED - gcc 4.2.1 doesn't like it (spews warning) */
Paul Fox0840b762005-07-20 20:26:49 +0000113
/*
 * Convert fields of a freshly read zip_header_t from the on-disk
 * little-endian form to host byte order. Does nothing unless
 * BB_BIG_ENDIAN is nonzero.
 *
 * 'method' must be converted: unzip_extract() compares it with plain
 * host-order numbers (0, 8, 12, 14, 95), so leaving it raw made every
 * method check fail on big-endian hosts.
 * 'zip_flags' is intentionally left raw: its users test it against
 * SWAP_LE16(mask) instead.
 * NOTE(review): 'version', 'modtime' and 'moddate' are also left raw
 * here, unlike in FIX_ENDIANNESS_CDF - confirm whether any consumer
 * reads them in host order.
 */
#define FIX_ENDIANNESS_ZIP(zip) \
do { if (BB_BIG_ENDIAN) { \
	(zip).fmt.method        = SWAP_LE16((zip).fmt.method      ); \
	(zip).fmt.crc32         = SWAP_LE32((zip).fmt.crc32       ); \
	(zip).fmt.cmpsize       = SWAP_LE32((zip).fmt.cmpsize     ); \
	(zip).fmt.ucmpsize      = SWAP_LE32((zip).fmt.ucmpsize    ); \
	(zip).fmt.filename_len  = SWAP_LE16((zip).fmt.filename_len); \
	(zip).fmt.extra_len     = SWAP_LE16((zip).fmt.extra_len   ); \
}} while (0)
Denis Vlasenkobc7c5d02007-10-18 23:27:46 +0000122
Denys Vlasenko4e8ff732010-05-24 04:33:02 +0200123#define CDF_HEADER_LEN 42
Denis Vlasenko006e8622008-09-21 01:01:46 +0000124
125typedef union {
Denys Vlasenko4e8ff732010-05-24 04:33:02 +0200126 uint8_t raw[CDF_HEADER_LEN];
Denis Vlasenko006e8622008-09-21 01:01:46 +0000127 struct {
128 /* uint32_t signature; 50 4b 01 02 */
129 uint16_t version_made_by; /* 0-1 */
130 uint16_t version_needed; /* 2-3 */
Denys Vlasenko4e8ff732010-05-24 04:33:02 +0200131 uint16_t cdf_flags; /* 4-5 */
Denis Vlasenko006e8622008-09-21 01:01:46 +0000132 uint16_t method; /* 6-7 */
Denys Vlasenkoe3c4db82017-01-05 11:43:53 +0100133 uint16_t modtime; /* 8-9 */
134 uint16_t moddate; /* 10-11 */
Denis Vlasenko006e8622008-09-21 01:01:46 +0000135 uint32_t crc32; /* 12-15 */
136 uint32_t cmpsize; /* 16-19 */
137 uint32_t ucmpsize; /* 20-23 */
Denys Vlasenko0ffac1c2017-01-08 14:14:19 +0100138 uint16_t filename_len; /* 24-25 */
139 uint16_t extra_len; /* 26-27 */
Denis Vlasenko006e8622008-09-21 01:01:46 +0000140 uint16_t file_comment_length; /* 28-29 */
141 uint16_t disk_number_start; /* 30-31 */
Denys Vlasenko0ffac1c2017-01-08 14:14:19 +0100142 uint16_t internal_attributes; /* 32-33 */
143 uint32_t external_attributes PACKED; /* 34-37 */
Denis Vlasenko006e8622008-09-21 01:01:46 +0000144 uint32_t relative_offset_of_local_header PACKED; /* 38-41 */
Denys Vlasenkoe3c4db82017-01-05 11:43:53 +0100145 /* filename follows (not NUL terminated) */
146 /* extra field follows */
Denys Vlasenko0ffac1c2017-01-08 14:14:19 +0100147 /* file comment follows */
148 } fmt PACKED;
Denys Vlasenko4e8ff732010-05-24 04:33:02 +0200149} cdf_header_t;
Denis Vlasenko006e8622008-09-21 01:01:46 +0000150
/*
 * Convert fields of a freshly read cdf_header_t from the on-disk
 * little-endian form to host byte order. Does nothing unless
 * BB_BIG_ENDIAN is nonzero.
 * Not converted here: cdf_flags, disk_number_start, internal_attributes
 * and relative_offset_of_local_header.
 */
#define FIX_ENDIANNESS_CDF(cdf) \
do { if (BB_BIG_ENDIAN) { \
	(cdf).fmt.crc32                = SWAP_LE32((cdf).fmt.crc32); \
	(cdf).fmt.cmpsize              = SWAP_LE32((cdf).fmt.cmpsize); \
	(cdf).fmt.ucmpsize             = SWAP_LE32((cdf).fmt.ucmpsize); \
	(cdf).fmt.external_attributes  = SWAP_LE32((cdf).fmt.external_attributes); \
	(cdf).fmt.version_made_by      = SWAP_LE16((cdf).fmt.version_made_by); \
	(cdf).fmt.version_needed       = SWAP_LE16((cdf).fmt.version_needed); \
	(cdf).fmt.method               = SWAP_LE16((cdf).fmt.method); \
	(cdf).fmt.modtime              = SWAP_LE16((cdf).fmt.modtime); \
	(cdf).fmt.moddate              = SWAP_LE16((cdf).fmt.moddate); \
	(cdf).fmt.filename_len         = SWAP_LE16((cdf).fmt.filename_len); \
	(cdf).fmt.extra_len            = SWAP_LE16((cdf).fmt.extra_len); \
	(cdf).fmt.file_comment_length  = SWAP_LE16((cdf).fmt.file_comment_length); \
}} while (0)
Denis Vlasenko006e8622008-09-21 01:01:46 +0000166
Denys Vlasenko0ffac1c2017-01-08 14:14:19 +0100167#define CDE_LEN 16
Denis Vlasenko006e8622008-09-21 01:01:46 +0000168
169typedef union {
Denys Vlasenko0ffac1c2017-01-08 14:14:19 +0100170 uint8_t raw[CDE_LEN];
Denis Vlasenko006e8622008-09-21 01:01:46 +0000171 struct {
172 /* uint32_t signature; 50 4b 05 06 */
173 uint16_t this_disk_no;
Denys Vlasenko4e8ff732010-05-24 04:33:02 +0200174 uint16_t disk_with_cdf_no;
175 uint16_t cdf_entries_on_this_disk;
176 uint16_t cdf_entries_total;
177 uint32_t cdf_size;
178 uint32_t cdf_offset;
Denys Vlasenko0ffac1c2017-01-08 14:14:19 +0100179 /* uint16_t archive_comment_length; */
180 /* archive comment follows */
181 } fmt PACKED;
182} cde_t;
Denis Vlasenko006e8622008-09-21 01:01:46 +0000183
Denys Vlasenko0ffac1c2017-01-08 14:14:19 +0100184#define FIX_ENDIANNESS_CDE(cde) \
Denys Vlasenkoe3c4db82017-01-05 11:43:53 +0100185do { if (BB_BIG_ENDIAN) { \
Denys Vlasenko0ffac1c2017-01-08 14:14:19 +0100186 (cde).fmt.cdf_offset = SWAP_LE32((cde).fmt.cdf_offset); \
Denys Vlasenkoe3c4db82017-01-05 11:43:53 +0100187}} while (0)
188
189struct BUG {
190 /* Check the offset of the last element, not the length. This leniency
191 * allows for poor packing, whereby the overall struct may be too long,
192 * even though the elements are all in the right place.
193 */
194 char BUG_zip_header_must_be_26_bytes[
Denys Vlasenko0ffac1c2017-01-08 14:14:19 +0100195 offsetof(zip_header_t, fmt.extra_len) + 2
Denys Vlasenkoe3c4db82017-01-05 11:43:53 +0100196 == ZIP_HEADER_LEN ? 1 : -1];
197 char BUG_cdf_header_must_be_42_bytes[
Denys Vlasenko0ffac1c2017-01-08 14:14:19 +0100198 offsetof(cdf_header_t, fmt.relative_offset_of_local_header) + 4
Denys Vlasenkoe3c4db82017-01-05 11:43:53 +0100199 == CDF_HEADER_LEN ? 1 : -1];
Denys Vlasenko0ffac1c2017-01-08 14:14:19 +0100200 char BUG_cde_must_be_16_bytes[
201 sizeof(cde_t) == CDE_LEN ? 1 : -1];
Denis Vlasenko006e8622008-09-21 01:01:46 +0000202};
203
Denis Vlasenko006e8622008-09-21 01:01:46 +0000204
205enum { zip_fd = 3 };
206
207
Denys Vlasenkoe3c4db82017-01-05 11:43:53 +0100208/* This value means that we failed to find CDF */
209#define BAD_CDF_OFFSET ((uint32_t)0xffffffff)
Dan Fandrichb76f18d2010-06-17 21:39:44 -0700210
Denys Vlasenkoe3c4db82017-01-05 11:43:53 +0100211#if !ENABLE_FEATURE_UNZIP_CDF
212
213# define find_cdf_offset() BAD_CDF_OFFSET
214
215#else
Denys Vlasenko5e87e8a2013-07-20 15:20:46 +0200216/* Seen in the wild:
217 * Self-extracting PRO2K3XP_32.exe contains 19078464 byte zip archive,
218 * where CDE was nearly 48 kbytes before EOF.
219 * (Surprisingly, it also apparently has *another* CDE structure
220 * closer to the end, with bogus cdf_offset).
221 * To make extraction work, bumped PEEK_FROM_END from 16k to 64k.
222 */
223#define PEEK_FROM_END (64*1024)
Denis Vlasenko006e8622008-09-21 01:01:46 +0000224/* NB: does not preserve file position! */
Denys Vlasenko4e8ff732010-05-24 04:33:02 +0200225static uint32_t find_cdf_offset(void)
Glenn L McGrath7ca04f32002-09-25 02:47:48 +0000226{
Denys Vlasenko0ffac1c2017-01-08 14:14:19 +0100227 cde_t cde;
Denys Vlasenkoe3c4db82017-01-05 11:43:53 +0100228 unsigned char *buf;
Denis Vlasenko006e8622008-09-21 01:01:46 +0000229 unsigned char *p;
230 off_t end;
Denys Vlasenko0ccf52a2016-04-17 21:05:34 +0200231 uint32_t found;
Denis Vlasenko006e8622008-09-21 01:01:46 +0000232
Denys Vlasenkoe3c4db82017-01-05 11:43:53 +0100233 end = lseek(zip_fd, 0, SEEK_END);
234 if (end == (off_t) -1)
235 return BAD_CDF_OFFSET;
236
Dan Fandrichb76f18d2010-06-17 21:39:44 -0700237 end -= PEEK_FROM_END;
Denys Vlasenkofc2bb8f2010-05-24 13:07:55 +0200238 if (end < 0)
239 end = 0;
Denys Vlasenkoe3c4db82017-01-05 11:43:53 +0100240
Denys Vlasenko0ccf52a2016-04-17 21:05:34 +0200241 dbg("Looking for cdf_offset starting from 0x%"OFF_FMT"x", end);
Denys Vlasenko876c1212017-03-24 15:00:12 +0100242 xlseek(zip_fd, end, SEEK_SET);
Denys Vlasenkoe3c4db82017-01-05 11:43:53 +0100243 buf = xzalloc(PEEK_FROM_END);
Dan Fandrichb76f18d2010-06-17 21:39:44 -0700244 full_read(zip_fd, buf, PEEK_FROM_END);
Denis Vlasenko006e8622008-09-21 01:01:46 +0000245
Denys Vlasenko0ccf52a2016-04-17 21:05:34 +0200246 found = BAD_CDF_OFFSET;
Denis Vlasenko006e8622008-09-21 01:01:46 +0000247 p = buf;
Denys Vlasenko0ffac1c2017-01-08 14:14:19 +0100248 while (p <= buf + PEEK_FROM_END - CDE_LEN - 4) {
Denis Vlasenko006e8622008-09-21 01:01:46 +0000249 if (*p != 'P') {
250 p++;
251 continue;
252 }
253 if (*++p != 'K')
254 continue;
255 if (*++p != 5)
256 continue;
257 if (*++p != 6)
258 continue;
259 /* we found CDE! */
Denys Vlasenko0ffac1c2017-01-08 14:14:19 +0100260 memcpy(cde.raw, p + 1, CDE_LEN);
261 FIX_ENDIANNESS_CDE(cde);
Denys Vlasenko26cd90c2013-07-21 02:31:08 +0200262 /*
263 * I've seen .ZIP files with seemingly valid CDEs
264 * where cdf_offset points past EOF - ??
Denys Vlasenko0ccf52a2016-04-17 21:05:34 +0200265 * This check ignores such CDEs:
Denys Vlasenko26cd90c2013-07-21 02:31:08 +0200266 */
Denys Vlasenko0ffac1c2017-01-08 14:14:19 +0100267 if (cde.fmt.cdf_offset < end + (p - buf)) {
268 found = cde.fmt.cdf_offset;
Denys Vlasenko0ccf52a2016-04-17 21:05:34 +0200269 dbg("Possible cdf_offset:0x%x at 0x%"OFF_FMT"x",
270 (unsigned)found, end + (p-3 - buf));
271 dbg(" cdf_offset+cdf_size:0x%x",
Denys Vlasenko0ffac1c2017-01-08 14:14:19 +0100272 (unsigned)(found + SWAP_LE32(cde.fmt.cdf_size)));
Denys Vlasenko0ccf52a2016-04-17 21:05:34 +0200273 /*
274 * We do not "break" here because only the last CDE is valid.
275 * I've seen a .zip archive which contained a .zip file,
276 * uncompressed, and taking the first CDE was using
277 * the CDE inside that file!
278 */
279 }
Denis Vlasenko006e8622008-09-21 01:01:46 +0000280 }
Denys Vlasenko26cd90c2013-07-21 02:31:08 +0200281 free(buf);
Denys Vlasenko0ccf52a2016-04-17 21:05:34 +0200282 dbg("Found cdf_offset:0x%x", (unsigned)found);
283 return found;
Denis Vlasenko006e8622008-09-21 01:01:46 +0000284};
285
Denys Vlasenko0ffac1c2017-01-08 14:14:19 +0100286static uint32_t read_next_cdf(uint32_t cdf_offset, cdf_header_t *cdf)
Denis Vlasenko006e8622008-09-21 01:01:46 +0000287{
Denys Vlasenkoe3c4db82017-01-05 11:43:53 +0100288 uint32_t magic;
289
290 if (cdf_offset == BAD_CDF_OFFSET)
291 return cdf_offset;
Denis Vlasenko006e8622008-09-21 01:01:46 +0000292
Denys Vlasenkoe3c4db82017-01-05 11:43:53 +0100293 dbg("Reading CDF at 0x%x", (unsigned)cdf_offset);
294 xlseek(zip_fd, cdf_offset, SEEK_SET);
295 xread(zip_fd, &magic, 4);
Denys Vlasenko0ffac1c2017-01-08 14:14:19 +0100296 /* Central Directory End? Assume CDF has ended.
297 * (more correct method is to use cde.cdf_entries_total counter)
298 */
Denys Vlasenkoe3c4db82017-01-05 11:43:53 +0100299 if (magic == ZIP_CDE_MAGIC) {
300 dbg("got ZIP_CDE_MAGIC");
301 return 0; /* EOF */
Denys Vlasenko26cd90c2013-07-21 02:31:08 +0200302 }
Denys Vlasenko0ffac1c2017-01-08 14:14:19 +0100303 xread(zip_fd, cdf->raw, CDF_HEADER_LEN);
Denis Vlasenko006e8622008-09-21 01:01:46 +0000304
Denys Vlasenko0ffac1c2017-01-08 14:14:19 +0100305 FIX_ENDIANNESS_CDF(*cdf);
306 dbg(" filename_len:%u extra_len:%u file_comment_length:%u",
307 (unsigned)cdf->fmt.filename_len,
308 (unsigned)cdf->fmt.extra_len,
309 (unsigned)cdf->fmt.file_comment_length
Denys Vlasenkoe3c4db82017-01-05 11:43:53 +0100310 );
311 cdf_offset += 4 + CDF_HEADER_LEN
Denys Vlasenko0ffac1c2017-01-08 14:14:19 +0100312 + cdf->fmt.filename_len
313 + cdf->fmt.extra_len
314 + cdf->fmt.file_comment_length;
Denys Vlasenkoe3c4db82017-01-05 11:43:53 +0100315
Denys Vlasenko4e8ff732010-05-24 04:33:02 +0200316 return cdf_offset;
Denis Vlasenko006e8622008-09-21 01:01:46 +0000317};
318#endif
319
320static void unzip_skip(off_t skip)
321{
Denys Vlasenko26cd90c2013-07-21 02:31:08 +0200322 if (skip != 0)
323 if (lseek(zip_fd, skip, SEEK_CUR) == (off_t)-1)
324 bb_copyfd_exact_size(zip_fd, -1, skip);
Glenn L McGrath7ca04f32002-09-25 02:47:48 +0000325}
326
Denis Vlasenkobc7c5d02007-10-18 23:27:46 +0000327static void unzip_create_leading_dirs(const char *fn)
Paul Fox0840b762005-07-20 20:26:49 +0000328{
329 /* Create all leading directories */
Rob Landleyd921b2e2006-08-03 15:41:12 +0000330 char *name = xstrdup(fn);
Paul Fox0840b762005-07-20 20:26:49 +0000331 if (bb_make_directory(dirname(name), 0777, FILEUTILS_RECUR)) {
Denys Vlasenko831756b2011-09-09 17:30:55 +0200332 xfunc_die(); /* bb_make_directory is noisy */
Paul Fox0840b762005-07-20 20:26:49 +0000333 }
334 free(name);
335}
336
Denys Vlasenko0ffac1c2017-01-08 14:14:19 +0100337static void unzip_extract(zip_header_t *zip, int dst_fd)
Paul Fox0840b762005-07-20 20:26:49 +0000338{
Denys Vlasenko2a0867a2017-01-09 10:58:37 +0100339 transformer_state_t xstate;
340
Denys Vlasenko0ffac1c2017-01-08 14:14:19 +0100341 if (zip->fmt.method == 0) {
Paul Fox0840b762005-07-20 20:26:49 +0000342 /* Method 0 - stored (not compressed) */
Denys Vlasenko0ffac1c2017-01-08 14:14:19 +0100343 off_t size = zip->fmt.ucmpsize;
Denis Vlasenko714701c2006-12-22 00:21:07 +0000344 if (size)
Denis Vlasenko006e8622008-09-21 01:01:46 +0000345 bb_copyfd_exact_size(zip_fd, dst_fd, size);
Denys Vlasenko2a0867a2017-01-09 10:58:37 +0100346 return;
347 }
348
349 init_transformer_state(&xstate);
350 xstate.bytes_in = zip->fmt.cmpsize;
351 xstate.src_fd = zip_fd;
352 xstate.dst_fd = dst_fd;
353 if (zip->fmt.method == 8) {
Paul Fox0840b762005-07-20 20:26:49 +0000354 /* Method 8 - inflate */
Denys Vlasenkob4c11c12014-12-07 00:44:00 +0100355 if (inflate_unzip(&xstate) < 0)
Denis Vlasenkobc7c5d02007-10-18 23:27:46 +0000356 bb_error_msg_and_die("inflate error");
Paul Fox0840b762005-07-20 20:26:49 +0000357 /* Validate decompression - crc */
Denys Vlasenko0ffac1c2017-01-08 14:14:19 +0100358 if (zip->fmt.crc32 != (xstate.crc32 ^ 0xffffffffL)) {
Denis Vlasenkobc7c5d02007-10-18 23:27:46 +0000359 bb_error_msg_and_die("crc error");
Paul Fox0840b762005-07-20 20:26:49 +0000360 }
Paul Fox0840b762005-07-20 20:26:49 +0000361 }
Denys Vlasenko2a0867a2017-01-09 10:58:37 +0100362#if ENABLE_FEATURE_UNZIP_BZIP2
363 else if (zip->fmt.method == 12) {
364 /* Tested. Unpacker reads too much, but we use CDF
365 * and will seek to the correct beginning of next file.
366 */
367 xstate.bytes_out = unpack_bz2_stream(&xstate);
368 if (xstate.bytes_out < 0)
369 bb_error_msg_and_die("inflate error");
370 }
371#endif
372#if ENABLE_FEATURE_UNZIP_LZMA
373 else if (zip->fmt.method == 14) {
374 /* Not tested yet */
375 xstate.bytes_out = unpack_lzma_stream(&xstate);
376 if (xstate.bytes_out < 0)
377 bb_error_msg_and_die("inflate error");
378 }
379#endif
Denys Vlasenko6b4f4b52017-01-09 11:12:01 +0100380#if ENABLE_FEATURE_UNZIP_XZ
381 else if (zip->fmt.method == 95) {
382 /* Not tested yet */
383 xstate.bytes_out = unpack_xz_stream(&xstate);
384 if (xstate.bytes_out < 0)
385 bb_error_msg_and_die("inflate error");
386 }
387#endif
Denys Vlasenko2a0867a2017-01-09 10:58:37 +0100388 else {
389 bb_error_msg_and_die("unsupported method %u", zip->fmt.method);
390 }
391
392 /* Validate decompression - size */
393 if (zip->fmt.ucmpsize != xstate.bytes_out) {
394 /* Don't die. Who knows, maybe len calculation
395 * was botched somewhere. After all, crc matched! */
396 bb_error_msg("bad length");
397 }
Glenn L McGrath7ca04f32002-09-25 02:47:48 +0000398}
399
/*
 * Read one line of user input from stdin into buf80, which must have
 * room for 80 bytes. fflush_all() is called first; if fgets() returns
 * NULL the program dies with a perror-style message.
 */
static void my_fgets80(char *buf80)
{
	fflush_all();
	if (fgets(buf80, 80, stdin) != NULL)
		return;
	bb_perror_msg_and_die("can't read standard input");
}
407
Denis Vlasenko9b49a5e2007-10-11 10:05:36 +0000408int unzip_main(int argc, char **argv) MAIN_EXTERNALLY_VISIBLE;
Rob Landleydfba7412006-03-06 20:47:33 +0000409int unzip_main(int argc, char **argv)
Glenn L McGrath87ac7022002-01-02 13:52:26 +0000410{
Denis Vlasenkobc7c5d02007-10-18 23:27:46 +0000411 enum { O_PROMPT, O_NEVER, O_ALWAYS };
412
Denys Vlasenko386bc9f2009-09-06 16:52:50 +0200413 smallint quiet = 0;
Denys Vlasenkoe3c4db82017-01-05 11:43:53 +0100414 IF_NOT_FEATURE_UNZIP_CDF(const) smallint verbose = 0;
Paul Fox9382b382007-09-07 20:28:25 +0000415 smallint listing = 0;
Denis Vlasenkobc7c5d02007-10-18 23:27:46 +0000416 smallint overwrite = O_PROMPT;
Denys Vlasenkoc5b01012012-06-15 16:43:26 +0200417 smallint x_opt_seen;
Denys Vlasenko4e8ff732010-05-24 04:33:02 +0200418 uint32_t cdf_offset;
Denys Vlasenko386bc9f2009-09-06 16:52:50 +0200419 unsigned long total_usize;
420 unsigned long total_size;
Denis Vlasenkobc7c5d02007-10-18 23:27:46 +0000421 unsigned total_entries;
Denis Vlasenkobc7c5d02007-10-18 23:27:46 +0000422 int dst_fd = -1;
423 char *src_fn = NULL;
424 char *dst_fn = NULL;
Mike Frysinger69024552005-07-30 07:30:26 +0000425 llist_t *zaccept = NULL;
426 llist_t *zreject = NULL;
Glenn L McGrath7ca04f32002-09-25 02:47:48 +0000427 char *base_dir = NULL;
Denis Vlasenkobc7c5d02007-10-18 23:27:46 +0000428 int i, opt;
Denys Vlasenkobf998072013-01-22 11:16:08 +0100429 char key_buf[80]; /* must match size used by my_fgets80 */
Paul Fox0840b762005-07-20 20:26:49 +0000430 struct stat stat_buf;
Glenn L McGrath7ca04f32002-09-25 02:47:48 +0000431
Denys Vlasenko386bc9f2009-09-06 16:52:50 +0200432/* -q, -l and -v: UnZip 5.52 of 28 February 2005, by Info-ZIP:
433 *
434 * # /usr/bin/unzip -qq -v decompress_unlzma.i.zip
435 * 204372 Defl:N 35278 83% 09-06-09 14:23 0d056252 decompress_unlzma.i
436 * # /usr/bin/unzip -q -v decompress_unlzma.i.zip
437 * Length Method Size Ratio Date Time CRC-32 Name
438 * -------- ------ ------- ----- ---- ---- ------ ----
439 * 204372 Defl:N 35278 83% 09-06-09 14:23 0d056252 decompress_unlzma.i
440 * -------- ------- --- -------
441 * 204372 35278 83% 1 file
442 * # /usr/bin/unzip -v decompress_unlzma.i.zip
443 * Archive: decompress_unlzma.i.zip
444 * Length Method Size Ratio Date Time CRC-32 Name
445 * -------- ------ ------- ----- ---- ---- ------ ----
446 * 204372 Defl:N 35278 83% 09-06-09 14:23 0d056252 decompress_unlzma.i
447 * -------- ------- --- -------
448 * 204372 35278 83% 1 file
449 * # unzip -v decompress_unlzma.i.zip
450 * Archive: decompress_unlzma.i.zip
451 * Length Date Time Name
452 * -------- ---- ---- ----
453 * 204372 09-06-09 14:23 decompress_unlzma.i
454 * -------- -------
455 * 204372 1 files
456 * # /usr/bin/unzip -l -qq decompress_unlzma.i.zip
457 * 204372 09-06-09 14:23 decompress_unlzma.i
458 * # /usr/bin/unzip -l -q decompress_unlzma.i.zip
459 * Length Date Time Name
460 * -------- ---- ---- ----
461 * 204372 09-06-09 14:23 decompress_unlzma.i
462 * -------- -------
463 * 204372 1 file
464 * # /usr/bin/unzip -l decompress_unlzma.i.zip
465 * Archive: decompress_unlzma.i.zip
466 * Length Date Time Name
467 * -------- ---- ---- ----
468 * 204372 09-06-09 14:23 decompress_unlzma.i
469 * -------- -------
470 * 204372 1 file
471 */
472
Denys Vlasenkoc5b01012012-06-15 16:43:26 +0200473 x_opt_seen = 0;
Denis Vlasenkobc7c5d02007-10-18 23:27:46 +0000474 /* '-' makes getopt return 1 for non-options */
Denys Vlasenko386bc9f2009-09-06 16:52:50 +0200475 while ((opt = getopt(argc, argv, "-d:lnopqxv")) != -1) {
Denys Vlasenkoc5b01012012-06-15 16:43:26 +0200476 switch (opt) {
477 case 'd': /* Extract to base directory */
478 base_dir = optarg;
479 break;
Glenn L McGrath7ca04f32002-09-25 02:47:48 +0000480
Denys Vlasenkoc5b01012012-06-15 16:43:26 +0200481 case 'l': /* List */
482 listing = 1;
483 break;
Paul Fox0840b762005-07-20 20:26:49 +0000484
Denys Vlasenkoc5b01012012-06-15 16:43:26 +0200485 case 'n': /* Never overwrite existing files */
486 overwrite = O_NEVER;
487 break;
Paul Fox0840b762005-07-20 20:26:49 +0000488
Denys Vlasenkoc5b01012012-06-15 16:43:26 +0200489 case 'o': /* Always overwrite existing files */
490 overwrite = O_ALWAYS;
491 break;
Paul Fox0840b762005-07-20 20:26:49 +0000492
Denys Vlasenkoc5b01012012-06-15 16:43:26 +0200493 case 'p': /* Extract files to stdout and fall through to set verbosity */
494 dst_fd = STDOUT_FILENO;
Denys Vlasenko386bc9f2009-09-06 16:52:50 +0200495
Denys Vlasenkoc5b01012012-06-15 16:43:26 +0200496 case 'q': /* Be quiet */
497 quiet++;
498 break;
Paul Fox0840b762005-07-20 20:26:49 +0000499
Denys Vlasenkoc5b01012012-06-15 16:43:26 +0200500 case 'v': /* Verbose list */
Denys Vlasenkoe3c4db82017-01-05 11:43:53 +0100501 IF_FEATURE_UNZIP_CDF(verbose++;)
Denys Vlasenkoc5b01012012-06-15 16:43:26 +0200502 listing = 1;
503 break;
504
505 case 'x':
506 x_opt_seen = 1;
507 break;
508
509 case 1:
510 if (!src_fn) {
511 /* The zip file */
Denis Vlasenkobc7c5d02007-10-18 23:27:46 +0000512 /* +5: space for ".zip" and NUL */
513 src_fn = xmalloc(strlen(optarg) + 5);
Denis Vlasenko666c40c2007-03-31 10:17:24 +0000514 strcpy(src_fn, optarg);
Denys Vlasenkoc5b01012012-06-15 16:43:26 +0200515 } else if (!x_opt_seen) {
516 /* Include files */
517 llist_add_to(&zaccept, optarg);
518 } else {
519 /* Exclude files */
520 llist_add_to(&zreject, optarg);
Paul Fox0840b762005-07-20 20:26:49 +0000521 }
522 break;
523
Paul Fox0840b762005-07-20 20:26:49 +0000524 default:
525 bb_show_usage();
Glenn L McGrath87ac7022002-01-02 13:52:26 +0000526 }
527 }
528
Denys Vlasenkoc5b01012012-06-15 16:43:26 +0200529#ifndef __GLIBC__
530 /*
531 * This code is needed for non-GNU getopt
532 * which doesn't understand "-" in option string.
533 * The -x option won't work properly in this case:
534 * "unzip a.zip q -x w e" will be interpreted as
535 * "unzip a.zip q w e -x" = "unzip a.zip q w e"
536 */
537 argv += optind;
538 if (argv[0]) {
539 /* +5: space for ".zip" and NUL */
540 src_fn = xmalloc(strlen(argv[0]) + 5);
541 strcpy(src_fn, argv[0]);
542 while (*++argv)
543 llist_add_to(&zaccept, *argv);
544 }
545#endif
546
547 if (!src_fn) {
Manuel Novoa III cad53642003-03-19 09:13:01 +0000548 bb_show_usage();
Glenn L McGrath87ac7022002-01-02 13:52:26 +0000549 }
550
Paul Fox0840b762005-07-20 20:26:49 +0000551 /* Open input file */
Denis Vlasenko9f739442006-12-16 23:49:13 +0000552 if (LONE_DASH(src_fn)) {
Denis Vlasenko006e8622008-09-21 01:01:46 +0000553 xdup2(STDIN_FILENO, zip_fd);
Paul Fox0840b762005-07-20 20:26:49 +0000554 /* Cannot use prompt mode since zip data is arriving on STDIN */
Denis Vlasenkobc7c5d02007-10-18 23:27:46 +0000555 if (overwrite == O_PROMPT)
556 overwrite = O_NEVER;
Glenn L McGrath237ae422002-11-03 14:05:15 +0000557 } else {
Denys Vlasenko3e134eb2016-04-22 18:09:21 +0200558 static const char extn[][5] ALIGN1 = { ".zip", ".ZIP" };
Denys Vlasenkoc5b01012012-06-15 16:43:26 +0200559 char *ext = src_fn + strlen(src_fn);
560 int src_fd;
Denis Vlasenkobc7c5d02007-10-18 23:27:46 +0000561
Denys Vlasenkoc5b01012012-06-15 16:43:26 +0200562 i = 0;
563 for (;;) {
Paul Fox0840b762005-07-20 20:26:49 +0000564 src_fd = open(src_fn, O_RDONLY);
Denys Vlasenkoc5b01012012-06-15 16:43:26 +0200565 if (src_fd >= 0)
566 break;
567 if (++i > 2) {
568 *ext = '\0';
569 bb_error_msg_and_die("can't open %s[.zip]", src_fn);
570 }
571 strcpy(ext, extn[i - 1]);
Paul Fox0840b762005-07-20 20:26:49 +0000572 }
Denis Vlasenko006e8622008-09-21 01:01:46 +0000573 xmove_fd(src_fd, zip_fd);
Glenn L McGrath237ae422002-11-03 14:05:15 +0000574 }
Glenn L McGrath7ca04f32002-09-25 02:47:48 +0000575
Paul Fox0840b762005-07-20 20:26:49 +0000576 /* Change dir if necessary */
Bernhard Reutner-Fischerd9cf7ac2006-04-12 18:39:58 +0000577 if (base_dir)
Rob Landleyd921b2e2006-08-03 15:41:12 +0000578 xchdir(base_dir);
Glenn L McGrath87ac7022002-01-02 13:52:26 +0000579
Denys Vlasenko386bc9f2009-09-06 16:52:50 +0200580 if (quiet <= 1) { /* not -qq */
581 if (quiet == 0)
582 printf("Archive: %s\n", src_fn);
583 if (listing) {
584 puts(verbose ?
Denys Vlasenko07bd9792016-04-18 01:43:24 +0200585 " Length Method Size Cmpr Date Time CRC-32 Name\n"
586 "-------- ------ ------- ---- ---------- ----- -------- ----"
Denys Vlasenko386bc9f2009-09-06 16:52:50 +0200587 :
Denys Vlasenko07bd9792016-04-18 01:43:24 +0200588 " Length Date Time Name\n"
589 "--------- ---------- ----- ----"
Denys Vlasenko386bc9f2009-09-06 16:52:50 +0200590 );
Denis Vlasenkobc7c5d02007-10-18 23:27:46 +0000591 }
592 }
Glenn L McGrath87ac7022002-01-02 13:52:26 +0000593
Denys Vlasenko4e8ff732010-05-24 04:33:02 +0200594/* Example of an archive with one 0-byte long file named 'z'
595 * created by Zip 2.31 on Unix:
596 * 0000 [50 4b]03 04 0a 00 00 00 00 00 42 1a b8 3c 00 00 |PK........B..<..|
597 * sig........ vneed flags compr mtime mdate crc32>
598 * 0010 00 00 00 00 00 00 00 00 00 00 01 00 15 00 7a 55 |..............zU|
599 * >..... csize...... usize...... fnlen exlen fn ex>
600 * 0020 54 09 00 03 cc d3 f9 4b cc d3 f9 4b 55 78 04 00 |T......K...KUx..|
601 * >tra_field......................................
602 * 0030 00 00 00 00[50 4b]01 02 17 03 0a 00 00 00 00 00 |....PK..........|
603 * ........... sig........ vmade vneed flags compr
604 * 0040 42 1a b8 3c 00 00 00 00 00 00 00 00 00 00 00 00 |B..<............|
605 * mtime mdate crc32...... csize...... usize......
606 * 0050 01 00 0d 00 00 00 00 00 00 00 00 00 a4 81 00 00 |................|
607 * fnlen exlen clen. dnum. iattr eattr...... relofs> (eattr = rw-r--r--)
608 * 0060 00 00 7a 55 54 05 00 03 cc d3 f9 4b 55 78 00 00 |..zUT......KUx..|
609 * >..... fn extra_field...........................
610 * 0070 [50 4b]05 06 00 00 00 00 01 00 01 00 3c 00 00 00 |PK..........<...|
611 * 0080 34 00 00 00 00 00 |4.....|
612 */
Denys Vlasenko386bc9f2009-09-06 16:52:50 +0200613 total_usize = 0;
Denis Vlasenkobc7c5d02007-10-18 23:27:46 +0000614 total_size = 0;
615 total_entries = 0;
Denys Vlasenkoe3c4db82017-01-05 11:43:53 +0100616 cdf_offset = find_cdf_offset(); /* try to seek to the end, find CDE and CDF start */
Glenn L McGrath7ca04f32002-09-25 02:47:48 +0000617 while (1) {
Denys Vlasenko0ffac1c2017-01-08 14:14:19 +0100618 zip_header_t zip;
Denys Vlasenko4e8ff732010-05-24 04:33:02 +0200619 mode_t dir_mode = 0777;
Denys Vlasenkoe3c4db82017-01-05 11:43:53 +0100620#if ENABLE_FEATURE_UNZIP_CDF
Denys Vlasenko4e8ff732010-05-24 04:33:02 +0200621 mode_t file_mode = 0666;
622#endif
Glenn L McGrath7ca04f32002-09-25 02:47:48 +0000623
Denys Vlasenkoe3c4db82017-01-05 11:43:53 +0100624 if (!ENABLE_FEATURE_UNZIP_CDF || cdf_offset == BAD_CDF_OFFSET) {
625 /* Normally happens when input is unseekable.
626 *
627 * Valid ZIP file has Central Directory at the end
628 * with central directory file headers (CDFs).
629 * After it, there is a Central Directory End structure.
630 * CDFs identify what files are in the ZIP and where
631 * they are located. This allows ZIP readers to load
632 * the list of files without reading the entire ZIP archive.
633 * ZIP files may be appended to, only files specified in
634 * the CD are valid. Scanning for local file headers is
635 * not a correct algorithm.
636 *
637 * We try to do the above, and resort to "linear" reading
638 * of ZIP file only if seek failed or CDE wasn't found.
639 */
640 uint32_t magic;
Glenn L McGrath7ca04f32002-09-25 02:47:48 +0000641
Denys Vlasenkoe3c4db82017-01-05 11:43:53 +0100642 /* Check magic number */
643 xread(zip_fd, &magic, 4);
Denys Vlasenko0ffac1c2017-01-08 14:14:19 +0100644 /* CDF item? Assume there are no more files, exit */
Denys Vlasenkoe3c4db82017-01-05 11:43:53 +0100645 if (magic == ZIP_CDF_MAGIC) {
646 dbg("got ZIP_CDF_MAGIC");
647 break;
648 }
649 /* Data descriptor? It was a streaming file, go on */
650 if (magic == ZIP_DD_MAGIC) {
651 dbg("got ZIP_DD_MAGIC");
652 /* skip over duplicate crc32, cmpsize and ucmpsize */
653 unzip_skip(3 * 4);
654 continue;
655 }
656 if (magic != ZIP_FILEHEADER_MAGIC)
657 bb_error_msg_and_die("invalid zip magic %08X", (int)magic);
658 dbg("got ZIP_FILEHEADER_MAGIC");
Denys Vlasenko4e8ff732010-05-24 04:33:02 +0200659
Denys Vlasenko0ffac1c2017-01-08 14:14:19 +0100660 xread(zip_fd, zip.raw, ZIP_HEADER_LEN);
661 FIX_ENDIANNESS_ZIP(zip);
Denys Vlasenko8c1d8572017-01-09 13:10:10 +0100662 if (zip.fmt.zip_flags & SWAP_LE16(0x0008)) {
663 bb_error_msg_and_die("zip flag %s is not supported",
664 "8 (streaming)");
Denys Vlasenkoe3c4db82017-01-05 11:43:53 +0100665 }
666 }
667#if ENABLE_FEATURE_UNZIP_CDF
668 else {
669 /* cdf_offset is valid (and we know the file is seekable) */
Denys Vlasenko0ffac1c2017-01-08 14:14:19 +0100670 cdf_header_t cdf;
671 cdf_offset = read_next_cdf(cdf_offset, &cdf);
Denys Vlasenkoe3c4db82017-01-05 11:43:53 +0100672 if (cdf_offset == 0) /* EOF? */
673 break;
Denys Vlasenko0ffac1c2017-01-08 14:14:19 +0100674# if 1
Denys Vlasenkoe3c4db82017-01-05 11:43:53 +0100675 xlseek(zip_fd,
Denys Vlasenko0ffac1c2017-01-08 14:14:19 +0100676 SWAP_LE32(cdf.fmt.relative_offset_of_local_header) + 4,
Denys Vlasenkoe3c4db82017-01-05 11:43:53 +0100677 SEEK_SET);
Denys Vlasenko0ffac1c2017-01-08 14:14:19 +0100678 xread(zip_fd, zip.raw, ZIP_HEADER_LEN);
679 FIX_ENDIANNESS_ZIP(zip);
680 if (zip.fmt.zip_flags & SWAP_LE16(0x0008)) {
Denys Vlasenko4e8ff732010-05-24 04:33:02 +0200681 /* 0x0008 - streaming. [u]cmpsize can be reliably gotten
Denys Vlasenkoe3c4db82017-01-05 11:43:53 +0100682 * only from Central Directory.
Denys Vlasenko26cd90c2013-07-21 02:31:08 +0200683 */
Denys Vlasenko0ffac1c2017-01-08 14:14:19 +0100684 zip.fmt.crc32 = cdf.fmt.crc32;
685 zip.fmt.cmpsize = cdf.fmt.cmpsize;
686 zip.fmt.ucmpsize = cdf.fmt.ucmpsize;
Denys Vlasenko4e8ff732010-05-24 04:33:02 +0200687 }
Denys Vlasenkoe3c4db82017-01-05 11:43:53 +0100688# else
Denys Vlasenko0ffac1c2017-01-08 14:14:19 +0100689 /* CDF has the same data as local header, no need to read the latter...
690 * ...not really. An archive was seen with cdf.extra_len == 6 but
691 * zip.extra_len == 0.
692 */
693 memcpy(&zip.fmt.version,
694 &cdf.fmt.version_needed, ZIP_HEADER_LEN);
Denys Vlasenkoe3c4db82017-01-05 11:43:53 +0100695 xlseek(zip_fd,
Denys Vlasenko0ffac1c2017-01-08 14:14:19 +0100696 SWAP_LE32(cdf.fmt.relative_offset_of_local_header) + 4 + ZIP_HEADER_LEN,
Denys Vlasenkoe3c4db82017-01-05 11:43:53 +0100697 SEEK_SET);
698# endif
Denys Vlasenko0ffac1c2017-01-08 14:14:19 +0100699 if ((cdf.fmt.version_made_by >> 8) == 3) {
Denys Vlasenko26cd90c2013-07-21 02:31:08 +0200700 /* This archive is created on Unix */
Denys Vlasenko0ffac1c2017-01-08 14:14:19 +0100701 dir_mode = file_mode = (cdf.fmt.external_attributes >> 16);
Denys Vlasenko4e8ff732010-05-24 04:33:02 +0200702 }
Denis Vlasenko48a99712008-07-26 17:32:41 +0000703 }
Denis Vlasenko006e8622008-09-21 01:01:46 +0000704#endif
Denys Vlasenkoe3c4db82017-01-05 11:43:53 +0100705
Denys Vlasenko0ffac1c2017-01-08 14:14:19 +0100706 if (zip.fmt.zip_flags & SWAP_LE16(0x0001)) {
Denys Vlasenkoe3c4db82017-01-05 11:43:53 +0100707 /* 0x0001 - encrypted */
Denys Vlasenko8c1d8572017-01-09 13:10:10 +0100708 bb_error_msg_and_die("zip flag %s is not supported",
709 "1 (encryption)");
Denys Vlasenkoe3c4db82017-01-05 11:43:53 +0100710 }
Denys Vlasenkobca4dee2016-04-18 01:14:05 +0200711 dbg("File cmpsize:0x%x extra_len:0x%x ucmpsize:0x%x",
Denys Vlasenko0ffac1c2017-01-08 14:14:19 +0100712 (unsigned)zip.fmt.cmpsize,
713 (unsigned)zip.fmt.extra_len,
714 (unsigned)zip.fmt.ucmpsize
Denys Vlasenkobca4dee2016-04-18 01:14:05 +0200715 );
Glenn L McGrath7ca04f32002-09-25 02:47:48 +0000716
717 /* Read filename */
Paul Fox0840b762005-07-20 20:26:49 +0000718 free(dst_fn);
Denys Vlasenko0ffac1c2017-01-08 14:14:19 +0100719 dst_fn = xzalloc(zip.fmt.filename_len + 1);
720 xread(zip_fd, dst_fn, zip.fmt.filename_len);
Glenn L McGrath7ca04f32002-09-25 02:47:48 +0000721
Paul Fox0840b762005-07-20 20:26:49 +0000722 /* Skip extra header bytes */
Denys Vlasenko0ffac1c2017-01-08 14:14:19 +0100723 unzip_skip(zip.fmt.extra_len);
Glenn L McGrath7ca04f32002-09-25 02:47:48 +0000724
Denys Vlasenko8c06bc62015-02-10 01:30:43 +0100725 /* Guard against "/abspath", "/../" and similar attacks */
726 overlapping_strcpy(dst_fn, strip_unsafe_prefix(dst_fn));
727
Paul Fox0840b762005-07-20 20:26:49 +0000728 /* Filter zip entries */
Denis Vlasenkobc7c5d02007-10-18 23:27:46 +0000729 if (find_list_entry(zreject, dst_fn)
730 || (zaccept && !find_list_entry(zaccept, dst_fn))
731 ) { /* Skip entry */
Denys Vlasenko8c1d8572017-01-09 13:10:10 +0100732 goto skip_cmpsize;
Glenn L McGrath7ca04f32002-09-25 02:47:48 +0000733 }
734
Denys Vlasenko8c1d8572017-01-09 13:10:10 +0100735 if (listing) {
736 /* List entry */
737 char dtbuf[sizeof("mm-dd-yyyy hh:mm")];
738 sprintf(dtbuf, "%02u-%02u-%04u %02u:%02u",
739 (zip.fmt.moddate >> 5) & 0xf, // mm: 0x01e0
740 (zip.fmt.moddate) & 0x1f, // dd: 0x001f
741 (zip.fmt.moddate >> 9) + 1980, // yy: 0xfe00
742 (zip.fmt.modtime >> 11), // hh: 0xf800
743 (zip.fmt.modtime >> 5) & 0x3f // mm: 0x07e0
744 // seconds/2 not shown, encoded in -- 0x001f
745 );
746 if (!verbose) {
747 // " Length Date Time Name\n"
748 // "--------- ---------- ----- ----"
749 printf( "%9u " "%s " "%s\n",
750 (unsigned)zip.fmt.ucmpsize,
751 dtbuf,
752 dst_fn);
753 } else {
754 char method6[7];
755 unsigned long percents;
756
757 sprintf(method6, "%6u", zip.fmt.method);
758 if (zip.fmt.method == 0) {
759 strcpy(method6, "Stored");
760 }
761 if (zip.fmt.method == 8) {
762 strcpy(method6, "Defl:N");
763 /* normal, maximum, fast, superfast */
764 IF_DESKTOP(method6[5] = "NXFS"[(zip.fmt.zip_flags >> 1) & 3];)
765 }
766 percents = zip.fmt.ucmpsize - zip.fmt.cmpsize;
767 if ((int32_t)percents < 0)
768 percents = 0; /* happens if ucmpsize < cmpsize */
769 percents = percents * 100;
770 if (zip.fmt.ucmpsize)
771 percents /= zip.fmt.ucmpsize;
772 // " Length Method Size Cmpr Date Time CRC-32 Name\n"
773 // "-------- ------ ------- ---- ---------- ----- -------- ----"
774 printf( "%8u %s" "%9u%4u%% " "%s " "%08x " "%s\n",
775 (unsigned)zip.fmt.ucmpsize,
776 method6,
777 (unsigned)zip.fmt.cmpsize,
778 (unsigned)percents,
779 dtbuf,
780 zip.fmt.crc32,
781 dst_fn);
782 total_size += zip.fmt.cmpsize;
783 }
784 total_usize += zip.fmt.ucmpsize;
785 goto skip_cmpsize;
786 }
787
788 if (dst_fd == STDOUT_FILENO) {
789 /* Extracting to STDOUT */
790 goto do_extract;
791 }
792 if (last_char_is(dst_fn, '/')) {
793 /* Extract directory */
794 if (stat(dst_fn, &stat_buf) == -1) {
795 if (errno != ENOENT) {
796 bb_perror_msg_and_die("can't stat '%s'", dst_fn);
797 }
798 if (!quiet) {
799 printf(" creating: %s\n", dst_fn);
800 }
801 unzip_create_leading_dirs(dst_fn);
802 if (bb_make_directory(dst_fn, dir_mode, FILEUTILS_IGNORE_CHMOD_ERR)) {
803 xfunc_die();
804 }
805 } else {
806 if (!S_ISDIR(stat_buf.st_mode)) {
807 bb_error_msg_and_die("'%s' exists but is not a %s",
808 dst_fn, "directory");
809 }
810 }
811 goto skip_cmpsize;
812 }
813 check_file:
814 /* Extract file */
815 if (stat(dst_fn, &stat_buf) == -1) {
816 /* File does not exist */
817 if (errno != ENOENT) {
818 bb_perror_msg_and_die("can't stat '%s'", dst_fn);
819 }
820 goto do_open_and_extract;
821 }
822 /* File already exists */
823 if (overwrite == O_NEVER) {
824 goto skip_cmpsize;
825 }
826 if (!S_ISREG(stat_buf.st_mode)) {
827 /* File is not regular file */
828 bb_error_msg_and_die("'%s' exists but is not a %s",
829 dst_fn, "regular file");
830 }
831 /* File is regular file */
832 if (overwrite == O_ALWAYS)
833 goto do_open_and_extract;
834 printf("replace %s? [y]es, [n]o, [A]ll, [N]one, [r]ename: ", dst_fn);
835 my_fgets80(key_buf);
836
837 switch (key_buf[0]) {
Paul Fox0840b762005-07-20 20:26:49 +0000838 case 'A':
Denis Vlasenkobc7c5d02007-10-18 23:27:46 +0000839 overwrite = O_ALWAYS;
Paul Fox0840b762005-07-20 20:26:49 +0000840 case 'y': /* Open file and fall into unzip */
Denys Vlasenko8c1d8572017-01-09 13:10:10 +0100841 do_open_and_extract:
Paul Fox0840b762005-07-20 20:26:49 +0000842 unzip_create_leading_dirs(dst_fn);
Denys Vlasenkoe3c4db82017-01-05 11:43:53 +0100843#if ENABLE_FEATURE_UNZIP_CDF
Denys Vlasenko4e8ff732010-05-24 04:33:02 +0200844 dst_fd = xopen3(dst_fn, O_WRONLY | O_CREAT | O_TRUNC, file_mode);
845#else
Bernhard Reutner-Fischer64d7e932006-09-11 16:01:40 +0000846 dst_fd = xopen(dst_fn, O_WRONLY | O_CREAT | O_TRUNC);
Denys Vlasenko4e8ff732010-05-24 04:33:02 +0200847#endif
Denys Vlasenko8c1d8572017-01-09 13:10:10 +0100848 do_extract:
Denys Vlasenko386bc9f2009-09-06 16:52:50 +0200849 if (!quiet) {
Denys Vlasenko0ffac1c2017-01-08 14:14:19 +0100850 printf(/* zip.fmt.method == 0
851 ? " extracting: %s\n"
852 : */ " inflating: %s\n", dst_fn);
Paul Fox0840b762005-07-20 20:26:49 +0000853 }
Denys Vlasenko0ffac1c2017-01-08 14:14:19 +0100854 unzip_extract(&zip, dst_fd);
Paul Fox0840b762005-07-20 20:26:49 +0000855 if (dst_fd != STDOUT_FILENO) {
856 /* closing STDOUT is potentially bad for future business */
857 close(dst_fd);
858 }
859 break;
Glenn L McGrath7ca04f32002-09-25 02:47:48 +0000860
Paul Fox0840b762005-07-20 20:26:49 +0000861 case 'N':
Denis Vlasenkobc7c5d02007-10-18 23:27:46 +0000862 overwrite = O_NEVER;
Denys Vlasenko8c1d8572017-01-09 13:10:10 +0100863 case 'n': /* Skip entry data */
864 skip_cmpsize:
Denys Vlasenko0ffac1c2017-01-08 14:14:19 +0100865 unzip_skip(zip.fmt.cmpsize);
Paul Fox0840b762005-07-20 20:26:49 +0000866 break;
867
868 case 'r':
869 /* Prompt for new name */
870 printf("new name: ");
Denys Vlasenkobf998072013-01-22 11:16:08 +0100871 my_fgets80(key_buf);
Paul Fox0840b762005-07-20 20:26:49 +0000872 free(dst_fn);
Rob Landleyd921b2e2006-08-03 15:41:12 +0000873 dst_fn = xstrdup(key_buf);
Paul Fox0840b762005-07-20 20:26:49 +0000874 chomp(dst_fn);
Denis Vlasenko48a99712008-07-26 17:32:41 +0000875 goto check_file;
Paul Fox0840b762005-07-20 20:26:49 +0000876
877 default:
Denys Vlasenko8c1d8572017-01-09 13:10:10 +0100878 printf("error: invalid response [%c]\n", (char)key_buf[0]);
Denis Vlasenko48a99712008-07-26 17:32:41 +0000879 goto check_file;
Paul Fox0840b762005-07-20 20:26:49 +0000880 }
Glenn L McGrath7ca04f32002-09-25 02:47:48 +0000881
Denis Vlasenko006e8622008-09-21 01:01:46 +0000882 total_entries++;
Glenn L McGrath7ca04f32002-09-25 02:47:48 +0000883 }
Glenn L McGrath7ca04f32002-09-25 02:47:48 +0000884
Denys Vlasenko386bc9f2009-09-06 16:52:50 +0200885 if (listing && quiet <= 1) {
886 if (!verbose) {
Denys Vlasenko07bd9792016-04-18 01:43:24 +0200887 // " Length Date Time Name\n"
888 // "--------- ---------- ----- ----"
889 printf( " --------%21s" "-------\n"
890 "%9lu%21s" "%u files\n",
891 "",
892 total_usize, "", total_entries);
Denys Vlasenko386bc9f2009-09-06 16:52:50 +0200893 } else {
894 unsigned long percents = total_usize - total_size;
Denys Vlasenko07bd9792016-04-18 01:43:24 +0200895 if ((long)percents < 0)
896 percents = 0; /* happens if usize < size */
Denys Vlasenko386bc9f2009-09-06 16:52:50 +0200897 percents = percents * 100;
898 if (total_usize)
899 percents /= total_usize;
Denys Vlasenko07bd9792016-04-18 01:43:24 +0200900 // " Length Method Size Cmpr Date Time CRC-32 Name\n"
901 // "-------- ------ ------- ---- ---------- ----- -------- ----"
902 printf( "-------- ------- ----%28s" "----\n"
903 "%8lu" "%17lu%4u%%%28s" "%u files\n",
904 "",
905 total_usize, total_size, (unsigned)percents, "",
Denys Vlasenko386bc9f2009-09-06 16:52:50 +0200906 total_entries);
907 }
Glenn L McGrath7ca04f32002-09-25 02:47:48 +0000908 }
909
Denis Vlasenkobc7c5d02007-10-18 23:27:46 +0000910 return 0;
Glenn L McGrath87ac7022002-01-02 13:52:26 +0000911}