blob: 4e357d65670e5f09b716dcd864e5f2e036db366a [file] [log] [blame]
Glenn L McGrath87ac7022002-01-02 13:52:26 +00001/* vi: set sw=4 ts=4: */
2/*
3 * Mini unzip implementation for busybox
4 *
5 * Copyright (C) 2001 by Laurence Anderson
6 *
7 * This program is free software; you can redistribute it and/or modify
8 * it under the terms of the GNU General Public License as published by
9 * the Free Software Foundation; either version 2 of the License, or
10 * (at your option) any later version.
11 *
12 * This program is distributed in the hope that it will be useful,
13 * but WITHOUT ANY WARRANTY; without even the implied warranty of
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
15 * General Public License for more details.
16 *
17 * You should have received a copy of the GNU General Public License
18 * along with this program; if not, write to the Free Software
19 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
20 *
21 */
22
/* For a reference to the ZIP file format, see http://www.pkware.com/support/appnote.html */

/* TODO: endian issues; exclude list; should we accept input from stdin? */
26
Glenn L McGrath87ac7022002-01-02 13:52:26 +000027#include <fcntl.h>
28#include <getopt.h>
29#include <stdlib.h>
30#include <string.h>
31#include <unistd.h>
32#include "unarchive.h"
33#include "busybox.h"
34
/*
 * 4-byte record signatures of the ZIP format.  unzip_main() compares them
 * against a 32-bit value read verbatim from the archive, i.e. in host byte
 * order.
 */
#define ZIP_FILEHEADER_MAGIC	0x04034b50	/* local file header */
#define ZIP_CDS_MAGIC		0x02014b50	/* central directory file header */
#define ZIP_CDS_END_MAGIC	0x06054b50	/* end of central directory record */
#define ZIP_DD_MAGIC		0x08074b50	/* data descriptor */

/*
 * Defined outside this file.  unzip_main() reads them after inflate_unzip()
 * to check the CRC and the byte count of the entry just inflated.
 */
extern unsigned int gunzip_crc;
extern unsigned int gunzip_bytes_out;
42
43static void header_list_unzip(const file_header_t *file_header)
44{
45 printf(" inflating: %s\n", file_header->name);
46}
47
48static void header_verbose_list_unzip(const file_header_t *file_header)
49{
50 unsigned int dostime = (unsigned int) file_header->mtime;
51
52 /* can printf arguments cut of the decade component ? */
53 unsigned short year = 1980 + ((dostime & 0xfe000000) >> 25);
54 while (year >= 100) {
55 year -= 100;
56 }
57
58 printf("%9u %02u-%02u-%02u %02u:%02u %s\n",
59 (unsigned int) file_header->size,
60 (dostime & 0x01e00000) >> 21,
61 (dostime & 0x001f0000) >> 16,
62 year,
63 (dostime & 0x0000f800) >> 11,
64 (dostime & 0x000007e0) >> 5,
65 file_header->name);
66}
67
Glenn L McGrath87ac7022002-01-02 13:52:26 +000068extern int unzip_main(int argc, char **argv)
69{
Glenn L McGrath7ca04f32002-09-25 02:47:48 +000070 union {
71 unsigned char raw[26];
72 struct {
73 unsigned short version; /* 0-1 */
74 unsigned short flags; /* 2-3 */
75 unsigned short method; /* 4-5 */
76 unsigned short modtime; /* 6-7 */
77 unsigned short moddate; /* 8-9 */
78 unsigned int crc32 __attribute__ ((packed)); /* 10-13 */
79 unsigned int cmpsize __attribute__ ((packed));; /* 14-17 */
80 unsigned int ucmpsize __attribute__ ((packed));; /* 18-21 */
81 unsigned short filename_len; /* 22-23 */
82 unsigned short extra_len; /* 24-25 */
83 } formated __attribute__ ((packed));
84 } zip_header;
Glenn L McGrath87ac7022002-01-02 13:52:26 +000085
Glenn L McGrath7ca04f32002-09-25 02:47:48 +000086 archive_handle_t *archive_handle;
87 unsigned int total_size = 0;
88 unsigned int total_entries = 0;
89 char *base_dir = NULL;
90 int opt = 0;
91
92 /* Initialise */
93 archive_handle = init_handle();
94 archive_handle->action_data = NULL;
95 archive_handle->action_header = header_list_unzip;
96
97 while ((opt = getopt(argc, argv, "lnopqd:")) != -1) {
Glenn L McGrath87ac7022002-01-02 13:52:26 +000098 switch (opt) {
Glenn L McGrath7ca04f32002-09-25 02:47:48 +000099 case 'l': /* list */
100 archive_handle->action_header = header_verbose_list_unzip;
101 archive_handle->action_data = data_skip;
Glenn L McGrath87ac7022002-01-02 13:52:26 +0000102 break;
Glenn L McGrath7ca04f32002-09-25 02:47:48 +0000103 case 'n': /* never overwright existing files */
Glenn L McGrath87ac7022002-01-02 13:52:26 +0000104 break;
105 case 'o':
Glenn L McGrath7ca04f32002-09-25 02:47:48 +0000106 archive_handle->flags = ARCHIVE_EXTRACT_UNCONDITIONAL;
Glenn L McGrath87ac7022002-01-02 13:52:26 +0000107 break;
Glenn L McGrath7ca04f32002-09-25 02:47:48 +0000108 case 'p': /* extract files to stdout */
109 archive_handle->action_data = data_extract_to_stdout;
Glenn L McGrath87ac7022002-01-02 13:52:26 +0000110 break;
Glenn L McGrath7ca04f32002-09-25 02:47:48 +0000111 case 'q': /* Extract files quietly */
112 archive_handle->action_header = header_skip;
Glenn L McGrath87ac7022002-01-02 13:52:26 +0000113 break;
Glenn L McGrath7ca04f32002-09-25 02:47:48 +0000114 case 'd': /* Extract files to specified base directory*/
115 base_dir = optarg;
Glenn L McGrath87ac7022002-01-02 13:52:26 +0000116 break;
Glenn L McGrath7ca04f32002-09-25 02:47:48 +0000117#if 0
118 case 'x': /* Exclude the specified files */
119 archive_handle->filter = filter_accept_reject_list;
120 break;
121#endif
122 default:
Manuel Novoa III cad53642003-03-19 09:13:01 +0000123 bb_show_usage();
Glenn L McGrath87ac7022002-01-02 13:52:26 +0000124 }
125 }
126
Glenn L McGrath7ca04f32002-09-25 02:47:48 +0000127 if (argc == optind) {
Manuel Novoa III cad53642003-03-19 09:13:01 +0000128 bb_show_usage();
Glenn L McGrath87ac7022002-01-02 13:52:26 +0000129 }
130
Glenn L McGrath7ca04f32002-09-25 02:47:48 +0000131 printf("Archive: %s\n", argv[optind]);
132 if (archive_handle->action_header == header_verbose_list_unzip) {
133 printf(" Length Date Time Name\n");
134 printf(" -------- ---- ---- ----\n");
135 }
136
137 if (*argv[optind] == '-') {
Eric Andersen70060d22004-03-27 10:02:48 +0000138 archive_handle->src_fd = STDIN_FILENO;
Glenn L McGrath237ae422002-11-03 14:05:15 +0000139 archive_handle->seek = seek_by_char;
140 } else {
Manuel Novoa III cad53642003-03-19 09:13:01 +0000141 archive_handle->src_fd = bb_xopen(argv[optind++], O_RDONLY);
Glenn L McGrath237ae422002-11-03 14:05:15 +0000142 }
Glenn L McGrath7ca04f32002-09-25 02:47:48 +0000143
144 if ((base_dir) && (chdir(base_dir))) {
Manuel Novoa III cad53642003-03-19 09:13:01 +0000145 bb_perror_msg_and_die("Couldnt chdir");
Glenn L McGrath237ae422002-11-03 14:05:15 +0000146 }
Glenn L McGrath87ac7022002-01-02 13:52:26 +0000147
148 while (optind < argc) {
Glenn L McGrath7ca04f32002-09-25 02:47:48 +0000149 archive_handle->filter = filter_accept_list;
Glenn L McGrath66125c82002-12-08 00:54:33 +0000150 archive_handle->accept = llist_add_to(archive_handle->accept, argv[optind]);
Glenn L McGrath87ac7022002-01-02 13:52:26 +0000151 optind++;
152 }
153
Glenn L McGrath7ca04f32002-09-25 02:47:48 +0000154 while (1) {
155 unsigned int magic;
156 int dst_fd;
157
158 /* TODO Endian issues */
Glenn L McGrath237ae422002-11-03 14:05:15 +0000159 archive_xread_all(archive_handle, &magic, 4);
Glenn L McGrath7ca04f32002-09-25 02:47:48 +0000160 archive_handle->offset += 4;
161
162 if (magic == ZIP_CDS_MAGIC) {
163 break;
164 }
165 else if (magic != ZIP_FILEHEADER_MAGIC) {
Manuel Novoa III cad53642003-03-19 09:13:01 +0000166 bb_error_msg_and_die("Invlaide zip magic");
Glenn L McGrath7ca04f32002-09-25 02:47:48 +0000167 }
168
169 /* Read the file header */
Glenn L McGrath237ae422002-11-03 14:05:15 +0000170 archive_xread_all(archive_handle, zip_header.raw, 26);
Glenn L McGrath7ca04f32002-09-25 02:47:48 +0000171 archive_handle->offset += 26;
172 archive_handle->file_header->mode = S_IFREG | 0777;
173
174 if (zip_header.formated.method != 8) {
Manuel Novoa III cad53642003-03-19 09:13:01 +0000175 bb_error_msg_and_die("Unsupported compression method %d\n", zip_header.formated.method);
Glenn L McGrath7ca04f32002-09-25 02:47:48 +0000176 }
177
178 /* Read filename */
179 archive_handle->file_header->name = xmalloc(zip_header.formated.filename_len + 1);
Glenn L McGrath237ae422002-11-03 14:05:15 +0000180 archive_xread_all(archive_handle, archive_handle->file_header->name, zip_header.formated.filename_len);
Glenn L McGrath7ca04f32002-09-25 02:47:48 +0000181 archive_handle->offset += zip_header.formated.filename_len;
182 archive_handle->file_header->name[zip_header.formated.filename_len] = '\0';
183
184 /* Skip extra header bits */
185 archive_handle->file_header->size = zip_header.formated.extra_len;
186 data_skip(archive_handle);
187 archive_handle->offset += zip_header.formated.extra_len;
188
189 /* Handle directories */
190 archive_handle->file_header->mode = S_IFREG | 0777;
191 if (last_char_is(archive_handle->file_header->name, '/')) {
192 archive_handle->file_header->mode ^= S_IFREG;
193 archive_handle->file_header->mode |= S_IFDIR;
194 }
195
196 /* Data section */
197 archive_handle->file_header->size = zip_header.formated.cmpsize;
198 if (archive_handle->action_data) {
199 archive_handle->action_data(archive_handle);
200 } else {
Manuel Novoa III cad53642003-03-19 09:13:01 +0000201 dst_fd = bb_xopen(archive_handle->file_header->name, O_WRONLY | O_CREAT);
Glenn L McGrath5699b852003-11-15 23:19:05 +0000202 inflate_init(zip_header.formated.cmpsize);
203 inflate_unzip(archive_handle->src_fd, dst_fd);
Glenn L McGrath7ca04f32002-09-25 02:47:48 +0000204 close(dst_fd);
205 chmod(archive_handle->file_header->name, archive_handle->file_header->mode);
206
207 /* Validate decompression - crc */
208 if (zip_header.formated.crc32 != (gunzip_crc ^ 0xffffffffL)) {
Manuel Novoa III cad53642003-03-19 09:13:01 +0000209 bb_error_msg("Invalid compressed data--crc error");
Glenn L McGrath7ca04f32002-09-25 02:47:48 +0000210 }
211
212 /* Validate decompression - size */
213 if (gunzip_bytes_out != zip_header.formated.ucmpsize) {
Manuel Novoa III cad53642003-03-19 09:13:01 +0000214 bb_error_msg("Invalid compressed data--length error");
Glenn L McGrath7ca04f32002-09-25 02:47:48 +0000215 }
216 }
217
218 /* local file descriptor section */
219 archive_handle->offset += zip_header.formated.cmpsize;
220 /* This ISNT unix time */
221 archive_handle->file_header->mtime = zip_header.formated.modtime | (zip_header.formated.moddate << 16);
222 archive_handle->file_header->size = zip_header.formated.ucmpsize;
223 total_size += archive_handle->file_header->size;
224 total_entries++;
225
226 archive_handle->action_header(archive_handle->file_header);
227
228 /* Data descriptor section */
229 if (zip_header.formated.flags & 4) {
230 /* skip over duplicate crc, compressed size and uncompressed size */
Glenn L McGrath5699b852003-11-15 23:19:05 +0000231 unsigned char data_description[12];
232 archive_xread_all(archive_handle, data_description, 12);
Glenn L McGrath7ca04f32002-09-25 02:47:48 +0000233 archive_handle->offset += 12;
234 }
235 }
236 /* Central directory section */
237
238 if (archive_handle->action_header == header_verbose_list_unzip) {
239 printf(" -------- -------\n");
240 printf("%9d %d files\n", total_size, total_entries);
241 }
242
243 return(EXIT_SUCCESS);
Glenn L McGrath87ac7022002-01-02 13:52:26 +0000244}