blob: b139dc5be6957a6f340fa190458029356c86f809 [file] [log] [blame]
Bernhard Reutner-Fischer9457e702006-04-02 20:12:31 +00001/* vi: set sw=4 ts=4: */
Denis Vlasenkof81e8db2009-04-09 12:35:13 +00002#ifndef UNARCHIVE_H
3#define UNARCHIVE_H 1
Glenn L McGrathe9fc7812001-10-25 14:57:14 +00004
Denis Vlasenkof81e8db2009-04-09 12:35:13 +00005PUSH_AND_SET_FUNCTION_VISIBILITY_TO_HIDDEN
Denis Vlasenko98636eb2008-05-09 17:59:34 +00006
/* Leading signature bytes of the supported compressed formats, expressed
 * as host-endian integers (presumably so they can be compared directly
 * against the first bytes of a file loaded into a native integer).
 */
enum {
#if BB_BIG_ENDIAN
	COMPRESS_MAGIC = 0x1f9d,
	GZIP_MAGIC  = 0x1f8b,
	BZIP2_MAGIC = 256 * 'B' + 'Z',
	/* .xz signature: 0xfd, '7', 'z', 'X', 'Z', 0x00 */
	/* More info at: http://tukaani.org/xz/xz-file-format.txt */
	XZ_MAGIC1   = 256 * 0xfd + '7',
	XZ_MAGIC2   = 256 * (256 * (256 * 'z' + 'X') + 'Z') + 0,
	/* Different form: 32 bits, then 16 bits: */
	/* The value is 0xfd377a58, which does not fit in a signed int:
	 * the (unsigned) cast keeps the multiplication from overflowing. */
	XZ_MAGIC1a  = 256 * (unsigned)(256 * (256 * 0xfd + '7') + 'z') + 'X',
	XZ_MAGIC2a  = 256 * 'Z' + 0,
#else
	COMPRESS_MAGIC = 0x9d1f,
	GZIP_MAGIC  = 0x8b1f,
	BZIP2_MAGIC = 'B' + 'Z' * 256,
	/* .xz signature: 0xfd, '7', 'z', 'X', 'Z', 0x00 */
	XZ_MAGIC1   = 0xfd + '7' * 256,
	XZ_MAGIC2   = 'z' + ('X' + ('Z' + 0 * 256) * 256) * 256,
	/* Different form: 32 bits, then 16 bits: */
	XZ_MAGIC1a  = 0xfd + ('7' + ('z' + 'X' * 256) * 256) * 256,
	XZ_MAGIC2a  = 'Z' + 0 * 256,
#endif
};

/* Metadata describing a single archive member. */
typedef struct file_header_t {
	char *name;
	char *link_target;
#if ENABLE_FEATURE_TAR_UNAME_GNAME
	/* tar only: owner/group names (numeric ids are in uid/gid below) */
	char *tar__uname;
	char *tar__gname;
#endif
	off_t size;
	uid_t uid;
	gid_t gid;
	mode_t mode;
	time_t mtime;
	dev_t device;
} file_header_t;

Denys Vlasenkoaa4977d2010-01-06 10:53:17 +010045struct hardlinks_t;
46
Denis Vlasenko75103842007-06-20 14:49:47 +000047typedef struct archive_handle_t {
Denys Vlasenkoaa4977d2010-01-06 10:53:17 +010048 /* Flags. 1st since it is most used member */
49 unsigned ah_flags;
50
51 /* The raw stream as read from disk or stdin */
52 int src_fd;
53
Denis Vlasenkoa60936d2008-06-28 05:04:09 +000054 /* Define if the header and data component should be processed */
Denis Vlasenkodefc1ea2008-06-27 02:52:20 +000055 char FAST_FUNC (*filter)(struct archive_handle_t *);
Denys Vlasenkoaa4977d2010-01-06 10:53:17 +010056 /* List of files that have been accepted */
Glenn L McGrath66125c82002-12-08 00:54:33 +000057 llist_t *accept;
Bernhard Reutner-Fischer9457e702006-04-02 20:12:31 +000058 /* List of files that have been rejected */
Glenn L McGrath66125c82002-12-08 00:54:33 +000059 llist_t *reject;
Bernhard Reutner-Fischer9457e702006-04-02 20:12:31 +000060 /* List of files that have successfully been worked on */
61 llist_t *passed;
Glenn L McGrathe9fc7812001-10-25 14:57:14 +000062
Denys Vlasenkoaa4977d2010-01-06 10:53:17 +010063 /* Currently processed file's header */
Glenn L McGrath7ca04f32002-09-25 02:47:48 +000064 file_header_t *file_header;
Glenn L McGrathe9fc7812001-10-25 14:57:14 +000065
Denis Vlasenkoa60936d2008-06-28 05:04:09 +000066 /* Process the header component, e.g. tar -t */
Denis Vlasenkodefc1ea2008-06-27 02:52:20 +000067 void FAST_FUNC (*action_header)(const file_header_t *);
Glenn L McGrathe9fc7812001-10-25 14:57:14 +000068
Denis Vlasenkoa60936d2008-06-28 05:04:09 +000069 /* Process the data component, e.g. extract to filesystem */
Denis Vlasenkodefc1ea2008-06-27 02:52:20 +000070 void FAST_FUNC (*action_data)(struct archive_handle_t *);
Eric Andersenc7bda1c2004-03-15 08:29:22 +000071
Denys Vlasenko0a130d52009-08-28 21:09:51 +020072 /* Function that skips data */
73 void FAST_FUNC (*seek)(int fd, off_t amount);
Glenn L McGrath237ae422002-11-03 14:05:15 +000074
Denys Vlasenkoaa4977d2010-01-06 10:53:17 +010075 /* Count processed bytes */
76 off_t offset;
77
78 /* Archiver specific. Can make it a union if it ever gets big */
Denys Vlasenko6b01b712010-01-24 22:52:21 +010079#if ENABLE_TAR || ENABLE_DPKG || ENABLE_DPKG_DEB
Denys Vlasenkoaa4977d2010-01-06 10:53:17 +010080 smallint tar__end;
81# if ENABLE_FEATURE_TAR_GNU_EXTENSIONS
82 char* tar__longname;
83 char* tar__linkname;
84# endif
Ladislav Michl2b46fd42010-06-25 01:33:00 +020085#if ENABLE_FEATURE_TAR_TO_COMMAND
86 char* tar__to_command;
Denys Vlasenko681efe22011-03-08 21:00:36 +010087 const char* tar__to_command_shell;
Ladislav Michl2b46fd42010-06-25 01:33:00 +020088#endif
J. Tang77a2c512010-03-19 14:48:51 +010089# if ENABLE_FEATURE_TAR_SELINUX
90 char* tar__global_sctx;
91 char* tar__next_file_sctx;
92# endif
Denys Vlasenkoaa4977d2010-01-06 10:53:17 +010093#endif
Denys Vlasenko6b01b712010-01-24 22:52:21 +010094#if ENABLE_CPIO || ENABLE_RPM2CPIO || ENABLE_RPM
Denys Vlasenkoaa4977d2010-01-06 10:53:17 +010095 uoff_t cpio__blocks;
96 struct hardlinks_t *cpio__hardlinks_to_create;
97 struct hardlinks_t *cpio__created_hardlinks;
98#endif
99#if ENABLE_DPKG || ENABLE_DPKG_DEB
Glenn L McGrathf235d052003-10-29 03:37:54 +0000100 /* Temporary storage */
Denys Vlasenkoaa4977d2010-01-06 10:53:17 +0100101 char *dpkg__buffer;
102 /* How to process any sub archive, e.g. get_header_tar_gz */
103 char FAST_FUNC (*dpkg__action_data_subarchive)(struct archive_handle_t *);
104 /* Contains the handle to a sub archive */
105 struct archive_handle_t *dpkg__sub_archive;
106#endif
Alexander Shishkin535584c2010-03-15 15:38:09 +0100107#if ENABLE_FEATURE_AR_CREATE
108 const char *ar__name;
109 struct archive_handle_t *ar__out;
110#endif
Glenn L McGrath7ca04f32002-09-25 02:47:48 +0000111} archive_handle_t;
/* bits in ah_flags (each flag is a distinct single bit, so they can be OR-ed) */
#define ARCHIVE_RESTORE_DATE        (1 << 0)
#define ARCHIVE_CREATE_LEADING_DIRS (1 << 1)
#define ARCHIVE_UNLINK_OLD          (1 << 2)
#define ARCHIVE_EXTRACT_QUIET       (1 << 3)
#define ARCHIVE_EXTRACT_NEWER       (1 << 4)
#define ARCHIVE_DONT_RESTORE_OWNER  (1 << 5)
#define ARCHIVE_DONT_RESTORE_PERM   (1 << 6)
#define ARCHIVE_NUMERIC_OWNER       (1 << 7)
#define ARCHIVE_O_TRUNC             (1 << 8)


/* POSIX tar Header Block, from POSIX 1003.1-1990 */
#define TAR_BLOCK_SIZE 512
#define NAME_SIZE      100
/* NAME_SIZE spelled as a string literal; must be kept in sync with NAME_SIZE */
#define NAME_SIZE_STR "100"
typedef struct tar_header_t {     /* byte offset */
	char name[NAME_SIZE];     /*   0-99 */
	char mode[8];             /* 100-107 */
	char uid[8];              /* 108-115 */
	char gid[8];              /* 116-123 */
	char size[12];            /* 124-135 */
	char mtime[12];           /* 136-147 */
	char chksum[8];           /* 148-155 */
	char typeflag;            /* 156-156 */
	char linkname[NAME_SIZE]; /* 157-256 */
	/* POSIX:   "ustar" NUL "00" */
	/* GNU tar: "ustar  " NUL */
	/* Normally it's defined as magic[6] followed by
	 * version[2], but we put them together to save code.
	 */
	char magic[8];            /* 257-264 */
	char uname[32];           /* 265-296 */
	char gname[32];           /* 297-328 */
	char devmajor[8];         /* 329-336 */
	char devminor[8];         /* 337-344 */
	char prefix[155];         /* 345-499 */
	char padding[12];         /* 500-511 (pad to exactly TAR_BLOCK_SIZE) */
} tar_header_t;
/* Compile-time check: the array size becomes -1 (a compile error)
 * if tar_header_t is not exactly TAR_BLOCK_SIZE bytes.
 */
struct BUG_tar_header {
	char c[sizeof(tar_header_t) == TAR_BLOCK_SIZE ? 1 : -1];
};



/* Info struct unpackers can fill out to inform users of things like
 * timestamps of unpacked files */
typedef struct unpack_info_t {
	time_t mtime;
} unpack_info_t;

Denys Vlasenkob80acf52011-03-02 01:21:02 +0100163archive_handle_t *init_handle(void) FAST_FUNC;
Glenn L McGrath7ca04f32002-09-25 02:47:48 +0000164
Denys Vlasenkob80acf52011-03-02 01:21:02 +0100165char filter_accept_all(archive_handle_t *archive_handle) FAST_FUNC;
166char filter_accept_list(archive_handle_t *archive_handle) FAST_FUNC;
167char filter_accept_list_reassign(archive_handle_t *archive_handle) FAST_FUNC;
168char filter_accept_reject_list(archive_handle_t *archive_handle) FAST_FUNC;
Glenn L McGrath7ca04f32002-09-25 02:47:48 +0000169
Denys Vlasenkob80acf52011-03-02 01:21:02 +0100170void unpack_ar_archive(archive_handle_t *ar_archive) FAST_FUNC;
Glenn L McGrath7ca04f32002-09-25 02:47:48 +0000171
Denys Vlasenkob80acf52011-03-02 01:21:02 +0100172void data_skip(archive_handle_t *archive_handle) FAST_FUNC;
173void data_extract_all(archive_handle_t *archive_handle) FAST_FUNC;
174void data_extract_to_stdout(archive_handle_t *archive_handle) FAST_FUNC;
175void data_extract_to_command(archive_handle_t *archive_handle) FAST_FUNC;
Glenn L McGrath7ca04f32002-09-25 02:47:48 +0000176
Denys Vlasenkob80acf52011-03-02 01:21:02 +0100177void header_skip(const file_header_t *file_header) FAST_FUNC;
178void header_list(const file_header_t *file_header) FAST_FUNC;
179void header_verbose_list(const file_header_t *file_header) FAST_FUNC;
Glenn L McGrath7ca04f32002-09-25 02:47:48 +0000180
Denys Vlasenkob80acf52011-03-02 01:21:02 +0100181char get_header_ar(archive_handle_t *archive_handle) FAST_FUNC;
182char get_header_cpio(archive_handle_t *archive_handle) FAST_FUNC;
183char get_header_tar(archive_handle_t *archive_handle) FAST_FUNC;
184char get_header_tar_gz(archive_handle_t *archive_handle) FAST_FUNC;
185char get_header_tar_bz2(archive_handle_t *archive_handle) FAST_FUNC;
186char get_header_tar_lzma(archive_handle_t *archive_handle) FAST_FUNC;
Glenn L McGrath7ca04f32002-09-25 02:47:48 +0000187
Denys Vlasenkob80acf52011-03-02 01:21:02 +0100188void seek_by_jump(int fd, off_t amount) FAST_FUNC;
189void seek_by_read(int fd, off_t amount) FAST_FUNC;
Glenn L McGrath60bce492002-11-03 07:28:38 +0000190
Denys Vlasenkob80acf52011-03-02 01:21:02 +0100191const char *strip_unsafe_prefix(const char *str) FAST_FUNC;
192
193void data_align(archive_handle_t *archive_handle, unsigned boundary) FAST_FUNC;
194const llist_t *find_list_entry(const llist_t *list, const char *filename) FAST_FUNC;
195const llist_t *find_list_entry2(const llist_t *list, const char *filename) FAST_FUNC;
Glenn L McGrath237ae422002-11-03 14:05:15 +0000196
Denis Vlasenkoc6758a02007-04-10 21:40:19 +0000197/* A bit of bunzip2 internals are exposed for compressed help support: */
198typedef struct bunzip_data bunzip_data;
Denys Vlasenkocaddfc82010-10-28 23:08:53 +0200199int start_bunzip(bunzip_data **bdp, int in_fd, const void *inbuf, int len) FAST_FUNC;
Denys Vlasenko1014a9a2010-10-29 19:01:58 +0200200/* NB: read_bunzip returns < 0 on error, or the number of *unfilled* bytes
201 * in outbuf. IOW: on EOF returns len ("all bytes are not filled"), not 0: */
Denis Vlasenkodefc1ea2008-06-27 02:52:20 +0000202int read_bunzip(bunzip_data *bd, char *outbuf, int len) FAST_FUNC;
203void dealloc_bunzip(bunzip_data *bd) FAST_FUNC;
Denis Vlasenkocd42cb82007-01-05 23:56:53 +0000204
/* Output of inflate_unzip(): byte count and CRC.
 * NOTE(review): presumably the decompressed size and its CRC-32 - confirm
 * against the inflate_unzip() implementation. */
typedef struct inflate_unzip_result {
	off_t bytes_out;
	uint32_t crc;
} inflate_unzip_result;

Denis Vlasenko5e34ff22009-04-21 11:09:40 +0000210IF_DESKTOP(long long) int inflate_unzip(inflate_unzip_result *res, off_t compr_size, int src_fd, int dst_fd) FAST_FUNC;
Denys Vlasenko45f66162010-07-01 05:12:28 +0200211/* xz unpacker takes .xz stream from offset 6 */
Denys Vlasenko6948f212010-05-30 04:18:13 +0200212IF_DESKTOP(long long) int unpack_xz_stream(int src_fd, int dst_fd) FAST_FUNC;
Denis Vlasenkoe9ad84d2008-08-05 13:10:34 +0000213/* lzma unpacker takes .lzma stream from offset 0 */
Denis Vlasenko5e34ff22009-04-21 11:09:40 +0000214IF_DESKTOP(long long) int unpack_lzma_stream(int src_fd, int dst_fd) FAST_FUNC;
Denis Vlasenkoe9ad84d2008-08-05 13:10:34 +0000215/* the rest wants 2 first bytes already skipped by the caller */
Denis Vlasenko5e34ff22009-04-21 11:09:40 +0000216IF_DESKTOP(long long) int unpack_bz2_stream(int src_fd, int dst_fd) FAST_FUNC;
217IF_DESKTOP(long long) int unpack_gz_stream(int src_fd, int dst_fd) FAST_FUNC;
218IF_DESKTOP(long long) int unpack_gz_stream_with_info(int src_fd, int dst_fd, unpack_info_t *info) FAST_FUNC;
Denys Vlasenko6948f212010-05-30 04:18:13 +0200219IF_DESKTOP(long long) int unpack_Z_stream(int src_fd, int dst_fd) FAST_FUNC;
Denis Vlasenkoe9ad84d2008-08-05 13:10:34 +0000220/* wrapper which checks first two bytes to be "BZ" */
Denis Vlasenko5e34ff22009-04-21 11:09:40 +0000221IF_DESKTOP(long long) int unpack_bz2_stream_prime(int src_fd, int dst_fd) FAST_FUNC;
Glenn L McGrath237ae422002-11-03 14:05:15 +0000222
Denys Vlasenko39a04f72010-05-31 14:18:57 +0200223char* append_ext(char *filename, const char *expected_ext) FAST_FUNC;
Denis Vlasenko1a9e9bd2008-11-01 12:54:56 +0000224int bbunpack(char **argv,
Denys Vlasenko39a04f72010-05-31 14:18:57 +0200225 IF_DESKTOP(long long) int FAST_FUNC (*unpacker)(unpack_info_t *info),
226 char* FAST_FUNC (*make_new_name)(char *filename, const char *expected_ext),
227 const char *expected_ext
228) FAST_FUNC;
Denis Vlasenko1a9e9bd2008-11-01 12:54:56 +0000229
Denis Vlasenko211f7f82007-09-05 11:48:32 +0000230#if BB_MMU
Denis Vlasenkoe9ad84d2008-08-05 13:10:34 +0000231void open_transformer(int fd,
Denis Vlasenko5e34ff22009-04-21 11:09:40 +0000232 IF_DESKTOP(long long) int FAST_FUNC (*transformer)(int src_fd, int dst_fd)) FAST_FUNC;
Denis Vlasenkob6052722008-07-10 17:43:01 +0000233#define open_transformer(fd, transformer, transform_prog) open_transformer(fd, transformer)
Denis Vlasenko211f7f82007-09-05 11:48:32 +0000234#else
Denis Vlasenkoe9ad84d2008-08-05 13:10:34 +0000235void open_transformer(int src_fd, const char *transform_prog) FAST_FUNC;
Denis Vlasenkob6052722008-07-10 17:43:01 +0000236#define open_transformer(fd, transformer, transform_prog) open_transformer(fd, transform_prog)
Denis Vlasenko211f7f82007-09-05 11:48:32 +0000237#endif
Glenn L McGrath5699b852003-11-15 23:19:05 +0000238
Denis Vlasenkof81e8db2009-04-09 12:35:13 +0000239POP_SAVED_FUNCTION_VISIBILITY
Denis Vlasenko98636eb2008-05-09 17:59:34 +0000240
Glenn L McGrath7ca04f32002-09-25 02:47:48 +0000241#endif