blob: 2ab3c04b8c4334eef09cc2dfd7b8486db3b69fd3 [file] [log] [blame]
"Robert P. J. Day"63fc1a92006-07-02 19:47:05 +00001/* vi: set sw=4 ts=4: */
/*
 * Licensed under GPLv2 or later, see file LICENSE in this source tree.
 *
 * FIXME:
 * In privileged mode, if uname and gname map to a uid and gid, then use the
 * mapped values instead of the uid/gid values in the tar header.
 *
 * References:
 * GNU tar and star man pages,
 * Opengroup's ustar interchange format,
 * http://www.opengroup.org/onlinepubs/007904975/utilities/pax.html
 */
Glenn L McGrath95ebf612001-10-25 14:18:08 +000014#include "libbb.h"
Denys Vlasenkod184a722011-09-22 12:45:14 +020015#include "bb_archive.h"
Glenn L McGrath95ebf612001-10-25 14:18:08 +000016
Denys Vlasenko98a4c7c2010-02-04 15:00:15 +010017typedef uint32_t aliased_uint32_t FIX_ALIASING;
18typedef off_t aliased_off_t FIX_ALIASING;
19
/*
 * Decode one numeric tar header field.
 *
 * str - start of the field; str[0..len] must be writable
 * len - size of the field in bytes (must be >= 1)
 *
 * The field is normally an octal number terminated by space or NUL.
 * If it is not, and the first byte has its top bit set, the field is
 * decoded as GNU "base-256" (big-endian binary, see below).
 * Anything else terminates the program with an error message.
 *
 * Returns the decoded value; negative base-256 values come back
 * sign-extended to the full width of unsigned long long.
 *
 * NB: _DESTROYS_ str[len] character!
 */
static unsigned long long getOctal(char *str, int len)
{
	unsigned long long v;
	char *end;
	/* NB: leading spaces are allowed. Using strtoull to handle that.
	 * The downside is that we accept e.g. "-123" too :(
	 */
	str[len] = '\0';
	v = strtoull(str, &end, 8);
	/* std: "Each numeric field is terminated by one or more
	 * <space> or NUL characters". We must support ' '! */
	if (*end != '\0' && *end != ' ') {
		uint8_t first = str[0];
		if (!(first & 0x80))
			bb_simple_error_msg_and_die("corrupted octal value in tar header");
		/*
		 * GNU tar uses "base-256 encoding" for very large numbers.
		 * Encoding is binary, with highest bit always set as a marker
		 * and sign in next-highest bit:
		 * 80 00 .. 00 - zero
		 * bf ff .. ff - largest positive number
		 * ff ff .. ff - minus 1
		 * c0 00 .. 00 - smallest negative number
		 *
		 * Example of tar file with 8914993153 (0x213600001) byte file.
		 * Field starts at offset 7c:
		 * 00070  30 30 30 00 30 30 30 30  30 30 30 00 80 00 00 00  |000.0000000.....|
		 * 00080  00 00 00 02 13 60 00 01  31 31 31 32 30 33 33 36  |.....`..11120336|
		 *
		 * NB: tarballs with NEGATIVE unix times encoded that way were seen!
		 */
		/* Sign-extend 7bit 'first' to 64bit 'v' (that is, using 6th bit
		 * as sign). Done with unsigned masks only: left-shifting a
		 * negative signed value is undefined behavior, and narrowing /
		 * right-shifting one is implementation-defined.
		 */
		if (first & 0x40)
			v = ~0xffULL | first; /* negative: bits 7 and up all set */
		else
			v = first & 0x3f; /* non-negative: drop the marker bit */
		while (--len != 0)
			v = (v << 8) + (uint8_t) *++str;
	}
	return v;
}
#define GET_OCTAL(a) getOctal((a), sizeof(a))
Denis Vlasenko376ce1e2006-11-24 14:51:01 +000062
Denys Vlasenko015db582016-06-19 18:15:33 +020063#define TAR_EXTD (ENABLE_FEATURE_TAR_GNU_EXTENSIONS || ENABLE_FEATURE_TAR_SELINUX)
64#if !TAR_EXTD
65#define process_pax_hdr(archive_handle, sz, global) \
66 process_pax_hdr(archive_handle, sz)
67#endif
Denys Vlasenko6111f962012-02-23 13:45:18 +010068/* "global" is 0 or 1 */
69static void process_pax_hdr(archive_handle_t *archive_handle, unsigned sz, int global)
J. Tang77a2c512010-03-19 14:48:51 +010070{
Denys Vlasenko015db582016-06-19 18:15:33 +020071#if !TAR_EXTD
72 unsigned blk_sz = (sz + 511) & (~511);
73 seek_by_read(archive_handle->src_fd, blk_sz);
74#else
75 unsigned blk_sz = (sz + 511) & (~511);
J. Tang77a2c512010-03-19 14:48:51 +010076 char *buf, *p;
J. Tang77a2c512010-03-19 14:48:51 +010077
Denys Vlasenko6111f962012-02-23 13:45:18 +010078 p = buf = xmalloc(blk_sz + 1);
79 xread(archive_handle->src_fd, buf, blk_sz);
80 archive_handle->offset += blk_sz;
81
J. Tang77a2c512010-03-19 14:48:51 +010082 /* prevent bb_strtou from running off the buffer */
83 buf[sz] = '\0';
J. Tang77a2c512010-03-19 14:48:51 +010084
J. Tang77a2c512010-03-19 14:48:51 +010085 while (sz != 0) {
86 char *end, *value;
87 unsigned len;
88
89 /* Every record has this format: "LEN NAME=VALUE\n" */
90 len = bb_strtou(p, &end, 10);
91 /* expect errno to be EINVAL, because the character
92 * following the digits should be a space
93 */
94 p += len;
95 sz -= len;
Denys Vlasenko0f592d72014-01-10 18:02:38 +010096 if (
97 /** (int)sz < 0 - not good enough for huge malicious VALUE of 2^32-1 */
98 (int)(sz|len) < 0 /* this works */
J. Tang77a2c512010-03-19 14:48:51 +010099 || len == 0
100 || errno != EINVAL
101 || *end != ' '
102 ) {
James Byrne69374872019-07-02 11:35:03 +0200103 bb_simple_error_msg("malformed extended header, skipped");
J. Tang77a2c512010-03-19 14:48:51 +0100104 // More verbose version:
105 //bb_error_msg("malformed extended header at %"OFF_FMT"d, skipped",
106 // archive_handle->offset - (sz + len));
107 break;
108 }
109 /* overwrite the terminating newline with NUL
110 * (we do not bother to check that it *was* a newline)
111 */
112 p[-1] = '\0';
J. Tang77a2c512010-03-19 14:48:51 +0100113 value = end + 1;
Denys Vlasenko6111f962012-02-23 13:45:18 +0100114
Denys Vlasenko015db582016-06-19 18:15:33 +0200115# if ENABLE_FEATURE_TAR_GNU_EXTENSIONS
Denys Vlasenko9655f952016-11-11 17:56:45 +0100116 if (!global) {
117 if (is_prefixed_with(value, "path=")) {
118 value += sizeof("path=") - 1;
119 free(archive_handle->tar__longname);
120 archive_handle->tar__longname = xstrdup(value);
121 continue;
122 }
123 if (is_prefixed_with(value, "linkpath=")) {
124 value += sizeof("linkpath=") - 1;
125 free(archive_handle->tar__linkname);
126 archive_handle->tar__linkname = xstrdup(value);
127 continue;
128 }
Denys Vlasenko6111f962012-02-23 13:45:18 +0100129 }
Denys Vlasenko015db582016-06-19 18:15:33 +0200130# endif
Denys Vlasenko6111f962012-02-23 13:45:18 +0100131
Denys Vlasenko015db582016-06-19 18:15:33 +0200132# if ENABLE_FEATURE_TAR_SELINUX
Denys Vlasenko6111f962012-02-23 13:45:18 +0100133 /* Scan for SELinux contexts, via "RHT.security.selinux" keyword.
134 * This is what Red Hat's patched version of tar uses.
135 */
Denys Vlasenko015db582016-06-19 18:15:33 +0200136# define SELINUX_CONTEXT_KEYWORD "RHT.security.selinux"
Denys Vlasenko8dff01d2015-03-12 17:48:34 +0100137 if (is_prefixed_with(value, SELINUX_CONTEXT_KEYWORD"=")) {
J. Tang77a2c512010-03-19 14:48:51 +0100138 value += sizeof(SELINUX_CONTEXT_KEYWORD"=") - 1;
Denys Vlasenko6111f962012-02-23 13:45:18 +0100139 free(archive_handle->tar__sctx[global]);
140 archive_handle->tar__sctx[global] = xstrdup(value);
141 continue;
J. Tang77a2c512010-03-19 14:48:51 +0100142 }
Denys Vlasenko015db582016-06-19 18:15:33 +0200143# endif
J. Tang77a2c512010-03-19 14:48:51 +0100144 }
145
146 free(buf);
Denys Vlasenko015db582016-06-19 18:15:33 +0200147#endif
J. Tang77a2c512010-03-19 14:48:51 +0100148}
J. Tang77a2c512010-03-19 14:48:51 +0100149
Denis Vlasenkodefc1ea2008-06-27 02:52:20 +0000150char FAST_FUNC get_header_tar(archive_handle_t *archive_handle)
Glenn L McGrath95ebf612001-10-25 14:18:08 +0000151{
Denis Vlasenko376ce1e2006-11-24 14:51:01 +0000152 file_header_t *file_header = archive_handle->file_header;
Denys Vlasenko52827e32010-06-26 18:21:36 +0200153 struct tar_header_t tar;
Denis Vlasenko376ce1e2006-11-24 14:51:01 +0000154 char *cp;
Denys Vlasenkobb373db2018-01-27 19:04:08 +0100155 int tar_typeflag; /* can be "char", "int" seems give smaller code */
Denis Vlasenkoa80b4a02007-06-21 12:41:59 +0000156 int i, sum_u, sum;
157#if ENABLE_FEATURE_TAR_OLDSUN_COMPATIBILITY
158 int sum_s;
159#endif
Denis Vlasenkod6772502006-11-24 17:21:44 +0000160 int parse_names;
Denis Vlasenko376ce1e2006-11-24 14:51:01 +0000161
Denis Vlasenkoa60936d2008-06-28 05:04:09 +0000162 /* Our "private data" */
Denis Vlasenkoa60936d2008-06-28 05:04:09 +0000163#if ENABLE_FEATURE_TAR_GNU_EXTENSIONS
Denys Vlasenkoaa4977d2010-01-06 10:53:17 +0100164# define p_longname (archive_handle->tar__longname)
165# define p_linkname (archive_handle->tar__linkname)
Denis Vlasenkoa60936d2008-06-28 05:04:09 +0000166#else
Denys Vlasenkoaa4977d2010-01-06 10:53:17 +0100167# define p_longname 0
168# define p_linkname 0
Denis Vlasenkoa60936d2008-06-28 05:04:09 +0000169#endif
Denis Vlasenkoa60936d2008-06-28 05:04:09 +0000170
J. Tang77a2c512010-03-19 14:48:51 +0100171#if ENABLE_FEATURE_TAR_GNU_EXTENSIONS || ENABLE_FEATURE_TAR_SELINUX
Denis Vlasenko666da5e2006-12-26 18:17:42 +0000172 again:
173#endif
Glenn L McGrath7ca04f32002-09-25 02:47:48 +0000174 /* Align header */
Glenn L McGrath237ae422002-11-03 14:05:15 +0000175 data_align(archive_handle, 512);
Glenn L McGrath95ebf612001-10-25 14:18:08 +0000176
Denis Vlasenkob5963352006-11-26 01:46:59 +0000177 again_after_align:
178
Denis Vlasenko1f0b95f2009-03-13 14:26:44 +0000179#if ENABLE_DESKTOP || ENABLE_FEATURE_TAR_AUTODETECT
Denis Vlasenko0381d422008-07-10 23:06:00 +0000180 /* to prevent misdetection of bz2 sig */
Denys Vlasenko98a4c7c2010-02-04 15:00:15 +0100181 *(aliased_uint32_t*)&tar = 0;
Denis Vlasenko23ffb6a2008-02-13 17:52:42 +0000182 i = full_read(archive_handle->src_fd, &tar, 512);
Denis Vlasenkoa60936d2008-06-28 05:04:09 +0000183 /* If GNU tar sees EOF in above read, it says:
Denis Vlasenko23ffb6a2008-02-13 17:52:42 +0000184 * "tar: A lone zero block at N", where N = kilobyte
185 * where EOF was met (not EOF block, actual EOF!),
Denis Vlasenko0381d422008-07-10 23:06:00 +0000186 * and exits with EXIT_SUCCESS.
Bernhard Reutner-Fischer636a1f82008-05-19 09:29:47 +0000187 * We will mimic exit(EXIT_SUCCESS), although we will not mimic
Denis Vlasenko12c06222008-02-14 08:52:30 +0000188 * the message and we don't check whether we indeed
189 * saw zero block directly before this. */
Denis Vlasenko0381d422008-07-10 23:06:00 +0000190 if (i == 0) {
Denys Vlasenko9655f952016-11-11 17:56:45 +0100191 /* GNU tar 1.29 will be silent if tar archive ends abruptly
192 * (if there are no zero blocks at all, and last read returns zero,
193 * not short read 0 < len < 512). Complain only if
194 * the very first read fails. Grrr.
195 */
196 if (archive_handle->offset == 0)
James Byrne69374872019-07-02 11:35:03 +0200197 bb_simple_error_msg("short read");
Denys Vlasenkoebfa9b52013-11-19 14:44:04 +0100198 /* this merely signals end of archive, not exit(1): */
199 return EXIT_FAILURE;
Denis Vlasenko0381d422008-07-10 23:06:00 +0000200 }
201 if (i != 512) {
Denis Vlasenko5e34ff22009-04-21 11:09:40 +0000202 IF_FEATURE_TAR_AUTODETECT(goto autodetect;)
James Byrne69374872019-07-02 11:35:03 +0200203 bb_simple_error_msg_and_die("short read");
Denis Vlasenko0381d422008-07-10 23:06:00 +0000204 }
205
Denis Vlasenko12c06222008-02-14 08:52:30 +0000206#else
Denis Vlasenko0381d422008-07-10 23:06:00 +0000207 i = 512;
208 xread(archive_handle->src_fd, &tar, i);
Denis Vlasenko12c06222008-02-14 08:52:30 +0000209#endif
Denis Vlasenko0381d422008-07-10 23:06:00 +0000210 archive_handle->offset += i;
Glenn L McGrath7ca04f32002-09-25 02:47:48 +0000211
212 /* If there is no filename its an empty header */
Denys Vlasenko9655f952016-11-11 17:56:45 +0100213 if (tar.name[0] == 0 && tar.prefix[0] == 0
214 /* Have seen a tar archive with pax 'x' header supplying UTF8 filename,
215 * with actual file having all name fields NUL-filled. Check this: */
216 && !p_longname
217 ) {
Denys Vlasenkoaa4977d2010-01-06 10:53:17 +0100218 if (archive_handle->tar__end) {
Denis Vlasenkoa60936d2008-06-28 05:04:09 +0000219 /* Second consecutive empty header - end of archive.
Paul Fox94ff9f12005-07-20 19:24:13 +0000220 * Read until the end to empty the pipe from gz or bz2
221 */
Denis Vlasenko376ce1e2006-11-24 14:51:01 +0000222 while (full_read(archive_handle->src_fd, &tar, 512) == 512)
Denis Vlasenko431a7c92008-02-19 11:26:28 +0000223 continue;
Denys Vlasenkoebfa9b52013-11-19 14:44:04 +0100224 return EXIT_FAILURE; /* "end of archive" */
Paul Fox94ff9f12005-07-20 19:24:13 +0000225 }
Denys Vlasenkoaa4977d2010-01-06 10:53:17 +0100226 archive_handle->tar__end = 1;
Denys Vlasenkoebfa9b52013-11-19 14:44:04 +0100227 return EXIT_SUCCESS; /* "decoded one header" */
Glenn L McGrath7ca04f32002-09-25 02:47:48 +0000228 }
Denys Vlasenkoaa4977d2010-01-06 10:53:17 +0100229 archive_handle->tar__end = 0;
Glenn L McGrath95ebf612001-10-25 14:18:08 +0000230
Denis Vlasenko431a7c92008-02-19 11:26:28 +0000231 /* Check header has valid magic, "ustar" is for the proper tar,
232 * five NULs are for the old tar format */
Denys Vlasenko8dff01d2015-03-12 17:48:34 +0100233 if (!is_prefixed_with(tar.magic, "ustar")
Denis Vlasenko431a7c92008-02-19 11:26:28 +0000234 && (!ENABLE_FEATURE_TAR_OLDGNU_COMPATIBILITY
235 || memcmp(tar.magic, "\0\0\0\0", 5) != 0)
236 ) {
237#if ENABLE_FEATURE_TAR_AUTODETECT
Denis Vlasenko1f0b95f2009-03-13 14:26:44 +0000238 autodetect:
Denis Vlasenkoa60936d2008-06-28 05:04:09 +0000239 /* Two different causes for lseek() != 0:
240 * unseekable fd (would like to support that too, but...),
241 * or not first block (false positive, it's not .gz/.bz2!) */
Denis Vlasenko0381d422008-07-10 23:06:00 +0000242 if (lseek(archive_handle->src_fd, -i, SEEK_CUR) != 0)
Denis Vlasenko431a7c92008-02-19 11:26:28 +0000243 goto err;
Denys Vlasenko640ce3d2014-02-02 02:06:38 +0100244 if (setup_unzip_on_fd(archive_handle->src_fd, /*fail_if_not_compressed:*/ 0) != 0)
Denis Vlasenko431a7c92008-02-19 11:26:28 +0000245 err:
James Byrne69374872019-07-02 11:35:03 +0200246 bb_simple_error_msg_and_die("invalid tar magic");
Denys Vlasenko8a6a2f92012-03-06 16:27:48 +0100247 archive_handle->offset = 0;
248 goto again_after_align;
249#endif
James Byrne69374872019-07-02 11:35:03 +0200250 bb_simple_error_msg_and_die("invalid tar magic");
Glenn L McGrath95ebf612001-10-25 14:18:08 +0000251 }
Denis Vlasenkodcbd51d2007-03-03 20:06:59 +0000252
253 /* Do checksum on headers.
254 * POSIX says that checksum is done on unsigned bytes, but
Denis Vlasenko940494f2007-03-04 18:09:50 +0000255 * Sun and HP-UX gets it wrong... more details in
Denis Vlasenkodcbd51d2007-03-03 20:06:59 +0000256 * GNU tar source. */
Denis Vlasenkoa80b4a02007-06-21 12:41:59 +0000257 sum_u = ' ' * sizeof(tar.chksum);
Denys Vlasenkobb373db2018-01-27 19:04:08 +0100258#if ENABLE_FEATURE_TAR_OLDSUN_COMPATIBILITY
259 sum_s = sum_u;
260#endif
Denis Vlasenkob71c6682007-07-21 15:08:09 +0000261 for (i = 0; i < 148; i++) {
Denis Vlasenkodcbd51d2007-03-03 20:06:59 +0000262 sum_u += ((unsigned char*)&tar)[i];
Denis Vlasenkoa80b4a02007-06-21 12:41:59 +0000263#if ENABLE_FEATURE_TAR_OLDSUN_COMPATIBILITY
Denis Vlasenkodcbd51d2007-03-03 20:06:59 +0000264 sum_s += ((signed char*)&tar)[i];
Denis Vlasenkoa80b4a02007-06-21 12:41:59 +0000265#endif
Glenn L McGrath95ebf612001-10-25 14:18:08 +0000266 }
Denis Vlasenkob71c6682007-07-21 15:08:09 +0000267 for (i = 156; i < 512; i++) {
Denis Vlasenkodcbd51d2007-03-03 20:06:59 +0000268 sum_u += ((unsigned char*)&tar)[i];
Denis Vlasenkoa80b4a02007-06-21 12:41:59 +0000269#if ENABLE_FEATURE_TAR_OLDSUN_COMPATIBILITY
Denis Vlasenkodcbd51d2007-03-03 20:06:59 +0000270 sum_s += ((signed char*)&tar)[i];
Denis Vlasenkoa80b4a02007-06-21 12:41:59 +0000271#endif
Glenn L McGrath95ebf612001-10-25 14:18:08 +0000272 }
Denys Vlasenkobb373db2018-01-27 19:04:08 +0100273 /* Most tarfiles have tar.chksum NUL or space terminated, but
274 * github.com decided to be "special" and have unterminated field:
275 * 0090: 30343300 30303031 33323731 30000000 |043.000132710...|
276 * ^^^^^^^^|
277 * Need to use GET_OCTAL. This overwrites tar.typeflag ---+
278 * (the '0' char immediately after chksum in example above) with NUL.
279 */
280 tar_typeflag = (uint8_t)tar.typeflag; /* save it */
281 sum = GET_OCTAL(tar.chksum);
282 if (sum_u != sum
283 IF_FEATURE_TAR_OLDSUN_COMPATIBILITY(&& sum_s != sum)
284 ) {
James Byrne69374872019-07-02 11:35:03 +0200285 bb_simple_error_msg_and_die("invalid tar header checksum");
Denis Vlasenkoa80b4a02007-06-21 12:41:59 +0000286 }
Glenn L McGrath95ebf612001-10-25 14:18:08 +0000287
Denys Vlasenkobb373db2018-01-27 19:04:08 +0100288 /* GET_OCTAL trashes subsequent field, therefore we call it
Denis Vlasenko376ce1e2006-11-24 14:51:01 +0000289 * on fields in reverse order */
Denis Vlasenko376ce1e2006-11-24 14:51:01 +0000290 if (tar.devmajor[0]) {
Denis Vlasenkod93400b2008-04-29 03:54:16 +0000291 char t = tar.prefix[0];
292 /* we trash prefix[0] here, but we DO need it later! */
Denis Vlasenko376ce1e2006-11-24 14:51:01 +0000293 unsigned minor = GET_OCTAL(tar.devminor);
294 unsigned major = GET_OCTAL(tar.devmajor);
295 file_header->device = makedev(major, minor);
Denis Vlasenkod93400b2008-04-29 03:54:16 +0000296 tar.prefix[0] = t;
Denis Vlasenkocba9ef52006-10-10 21:00:47 +0000297 }
Denys Vlasenkobb373db2018-01-27 19:04:08 +0100298
299 /* 0 is reserved for high perf file, treat as normal file */
300 if (tar_typeflag == '\0') tar_typeflag = '0';
301 parse_names = (tar_typeflag >= '0' && tar_typeflag <= '7');
302
Denis Vlasenko75103842007-06-20 14:49:47 +0000303 file_header->link_target = NULL;
Denis Vlasenkoa60936d2008-06-28 05:04:09 +0000304 if (!p_linkname && parse_names && tar.linkname[0]) {
Denis Vlasenkobc1918a2008-04-15 01:17:50 +0000305 file_header->link_target = xstrndup(tar.linkname, sizeof(tar.linkname));
Denis Vlasenko75103842007-06-20 14:49:47 +0000306 /* FIXME: what if we have non-link object with link_target? */
307 /* Will link_target be free()ed? */
Denis Vlasenkod6772502006-11-24 17:21:44 +0000308 }
Denis Vlasenkoe00e5022008-02-14 20:37:54 +0000309#if ENABLE_FEATURE_TAR_UNAME_GNAME
Denys Vlasenkoaa4977d2010-01-06 10:53:17 +0100310 file_header->tar__uname = tar.uname[0] ? xstrndup(tar.uname, sizeof(tar.uname)) : NULL;
311 file_header->tar__gname = tar.gname[0] ? xstrndup(tar.gname, sizeof(tar.gname)) : NULL;
Denis Vlasenkoe00e5022008-02-14 20:37:54 +0000312#endif
Denys Vlasenko7b48eb42010-05-06 20:08:14 +0200313 file_header->mtime = GET_OCTAL(tar.mtime);
314 file_header->size = GET_OCTAL(tar.size);
Denis Vlasenko376ce1e2006-11-24 14:51:01 +0000315 file_header->gid = GET_OCTAL(tar.gid);
316 file_header->uid = GET_OCTAL(tar.uid);
Glenn L McGrath916ba532004-02-20 02:34:42 +0000317 /* Set bits 0-11 of the files mode */
Denis Vlasenko376ce1e2006-11-24 14:51:01 +0000318 file_header->mode = 07777 & GET_OCTAL(tar.mode);
Glenn L McGrath916ba532004-02-20 02:34:42 +0000319
Denis Vlasenkob5963352006-11-26 01:46:59 +0000320 file_header->name = NULL;
Denis Vlasenkoa60936d2008-06-28 05:04:09 +0000321 if (!p_longname && parse_names) {
Denis Vlasenkod6772502006-11-24 17:21:44 +0000322 /* we trash mode[0] here, it's ok */
Denis Vlasenkobc1918a2008-04-15 01:17:50 +0000323 //tar.name[sizeof(tar.name)] = '\0'; - gcc 4.3.0 would complain
324 tar.mode[0] = '\0';
Denis Vlasenko87cd4a82006-11-25 23:47:32 +0000325 if (tar.prefix[0]) {
326 /* and padding[0] */
Denis Vlasenkobc1918a2008-04-15 01:17:50 +0000327 //tar.prefix[sizeof(tar.prefix)] = '\0'; - gcc 4.3.0 would complain
328 tar.padding[0] = '\0';
Denis Vlasenkocf30cc82006-11-24 14:53:18 +0000329 file_header->name = concat_path_file(tar.prefix, tar.name);
Denis Vlasenko87cd4a82006-11-25 23:47:32 +0000330 } else
Denis Vlasenkocf30cc82006-11-24 14:53:18 +0000331 file_header->name = xstrdup(tar.name);
332 }
333
Glenn L McGrath916ba532004-02-20 02:34:42 +0000334 /* Set bits 12-15 of the files mode */
Denis Vlasenkod6772502006-11-24 17:21:44 +0000335 /* (typeflag was not trashed because chksum does not use getOctal) */
Denys Vlasenkobb373db2018-01-27 19:04:08 +0100336 switch (tar_typeflag) {
Ian Wienand954dbd32011-07-29 08:33:47 +0200337 case '1': /* hardlink */
338 /* we mark hardlinks as regular files with zero size and a link name */
Glenn L McGrath916ba532004-02-20 02:34:42 +0000339 file_header->mode |= S_IFREG;
Ian Wienand954dbd32011-07-29 08:33:47 +0200340 /* on size of link fields from star(4)
341 * ... For tar archives written by pre POSIX.1-1988
342 * implementations, the size field usually contains the size of
343 * the file and needs to be ignored as no data may follow this
344 * header type. For POSIX.1- 1988 compliant archives, the size
345 * field needs to be 0. For POSIX.1-2001 compliant archives,
346 * the size field may be non zero, indicating that file data is
347 * included in the archive.
348 * i.e; always assume this is zero for safety.
349 */
350 goto size0;
Glenn L McGrathc9f1fce2004-02-20 02:25:18 +0000351 case '7':
Denis Vlasenkob5963352006-11-26 01:46:59 +0000352 /* case 0: */
Glenn L McGrath21110a02003-01-28 01:45:48 +0000353 case '0':
Denis Vlasenkod6772502006-11-24 17:21:44 +0000354#if ENABLE_FEATURE_TAR_OLDGNU_COMPATIBILITY
Denys Vlasenko16e82c62020-10-02 18:30:53 +0200355 if (file_header->name && last_char_is(file_header->name, '/')) {
Denis Vlasenkoadc772a2008-07-20 17:10:43 +0000356 goto set_dir;
357 }
Glenn L McGrathc9f1fce2004-02-20 02:25:18 +0000358#endif
Denis Vlasenko376ce1e2006-11-24 14:51:01 +0000359 file_header->mode |= S_IFREG;
Glenn L McGrath99b12542002-08-22 17:47:09 +0000360 break;
Glenn L McGrath21110a02003-01-28 01:45:48 +0000361 case '2':
Glenn L McGrath7ca04f32002-09-25 02:47:48 +0000362 file_header->mode |= S_IFLNK;
Denis Vlasenkoadc772a2008-07-20 17:10:43 +0000363 /* have seen tarballs with size field containing
364 * the size of the link target's name */
365 size0:
366 file_header->size = 0;
Glenn L McGrath99b12542002-08-22 17:47:09 +0000367 break;
Glenn L McGrath21110a02003-01-28 01:45:48 +0000368 case '3':
Glenn L McGrath7ca04f32002-09-25 02:47:48 +0000369 file_header->mode |= S_IFCHR;
Denis Vlasenkoadc772a2008-07-20 17:10:43 +0000370 goto size0; /* paranoia */
Glenn L McGrath21110a02003-01-28 01:45:48 +0000371 case '4':
Glenn L McGrath7ca04f32002-09-25 02:47:48 +0000372 file_header->mode |= S_IFBLK;
Denis Vlasenkoadc772a2008-07-20 17:10:43 +0000373 goto size0;
Glenn L McGrath21110a02003-01-28 01:45:48 +0000374 case '5':
Denis Vlasenko5e34ff22009-04-21 11:09:40 +0000375 IF_FEATURE_TAR_OLDGNU_COMPATIBILITY(set_dir:)
Glenn L McGrath7ca04f32002-09-25 02:47:48 +0000376 file_header->mode |= S_IFDIR;
Denis Vlasenkoadc772a2008-07-20 17:10:43 +0000377 goto size0;
Glenn L McGrath21110a02003-01-28 01:45:48 +0000378 case '6':
Glenn L McGrath7ca04f32002-09-25 02:47:48 +0000379 file_header->mode |= S_IFIFO;
Denis Vlasenkoadc772a2008-07-20 17:10:43 +0000380 goto size0;
Denys Vlasenkobdb540e2015-05-11 16:55:16 +0200381 case 'g': /* pax global header */
382 case 'x': { /* pax extended header */
383 if ((uoff_t)file_header->size > 0xfffff) /* paranoia */
384 goto skip_ext_hdr;
Denys Vlasenkobb373db2018-01-27 19:04:08 +0100385 process_pax_hdr(archive_handle, file_header->size, (tar_typeflag == 'g'));
Denys Vlasenkobdb540e2015-05-11 16:55:16 +0200386 goto again_after_align;
Denis Vlasenkod6772502006-11-24 17:21:44 +0000387#if ENABLE_FEATURE_TAR_GNU_EXTENSIONS
Denys Vlasenkobdb540e2015-05-11 16:55:16 +0200388/* See http://www.gnu.org/software/tar/manual/html_node/Extensions.html */
Denis Vlasenko376ce1e2006-11-24 14:51:01 +0000389 case 'L':
Denis Vlasenkob5963352006-11-26 01:46:59 +0000390 /* free: paranoia: tar with several consecutive longnames */
Denis Vlasenkoa60936d2008-06-28 05:04:09 +0000391 free(p_longname);
Denis Vlasenkob5963352006-11-26 01:46:59 +0000392 /* For paranoia reasons we allocate extra NUL char */
Denis Vlasenkoa60936d2008-06-28 05:04:09 +0000393 p_longname = xzalloc(file_header->size + 1);
Denis Vlasenkob5963352006-11-26 01:46:59 +0000394 /* We read ASCIZ string, including NUL */
Denis Vlasenkoa60936d2008-06-28 05:04:09 +0000395 xread(archive_handle->src_fd, p_longname, file_header->size);
Denis Vlasenko376ce1e2006-11-24 14:51:01 +0000396 archive_handle->offset += file_header->size;
Denis Vlasenkob5963352006-11-26 01:46:59 +0000397 /* return get_header_tar(archive_handle); */
398 /* gcc 4.1.1 didn't optimize it into jump */
399 /* so we will do it ourself, this also saves stack */
400 goto again;
Denis Vlasenko376ce1e2006-11-24 14:51:01 +0000401 case 'K':
Denis Vlasenkoa60936d2008-06-28 05:04:09 +0000402 free(p_linkname);
403 p_linkname = xzalloc(file_header->size + 1);
404 xread(archive_handle->src_fd, p_linkname, file_header->size);
Denis Vlasenko376ce1e2006-11-24 14:51:01 +0000405 archive_handle->offset += file_header->size;
Denis Vlasenkob5963352006-11-26 01:46:59 +0000406 /* return get_header_tar(archive_handle); */
407 goto again;
Denys Vlasenkobdb540e2015-05-11 16:55:16 +0200408/*
409 * case 'S': // Sparse file
410 * Was seen in the wild. Not supported (yet?).
411 * See https://www.gnu.org/software/tar/manual/html_section/tar_92.html
412 * for the format. (An "Old GNU Format" was seen, not PAX formats).
413 */
414// case 'D': /* GNU dump dir */
415// case 'M': /* Continuation of multi volume archive */
416// case 'N': /* Old GNU for names > 100 characters */
Denys Vlasenko403d2572018-11-27 12:09:01 +0100417 case 'V': /* Volume header */
418 ; /* Fall through to skip it */
Glenn L McGrath6aa52232004-02-17 11:55:06 +0000419#endif
Denys Vlasenko6111f962012-02-23 13:45:18 +0100420 }
J. Tang77a2c512010-03-19 14:48:51 +0100421 skip_ext_hdr:
J. Tang77a2c512010-03-19 14:48:51 +0100422 {
Denis Vlasenkob5963352006-11-26 01:46:59 +0000423 off_t sz;
Denys Vlasenkobb373db2018-01-27 19:04:08 +0100424 bb_error_msg("warning: skipping header '%c'", tar_typeflag);
Denis Vlasenkob5963352006-11-26 01:46:59 +0000425 sz = (file_header->size + 511) & ~(off_t)511;
426 archive_handle->offset += sz;
427 sz >>= 9; /* sz /= 512 but w/o contortions for signed div */
428 while (sz--)
429 xread(archive_handle->src_fd, &tar, 512);
430 /* return get_header_tar(archive_handle); */
431 goto again_after_align;
432 }
Glenn L McGrathb0e163a2004-02-19 08:48:30 +0000433 default:
Denys Vlasenkobb373db2018-01-27 19:04:08 +0100434 bb_error_msg_and_die("unknown typeflag: 0x%x", tar_typeflag);
Glenn L McGrath6aa52232004-02-17 11:55:06 +0000435 }
Denis Vlasenko376ce1e2006-11-24 14:51:01 +0000436
Denis Vlasenkod6772502006-11-24 17:21:44 +0000437#if ENABLE_FEATURE_TAR_GNU_EXTENSIONS
Denis Vlasenkoa60936d2008-06-28 05:04:09 +0000438 if (p_longname) {
439 file_header->name = p_longname;
440 p_longname = NULL;
Denis Vlasenkod6772502006-11-24 17:21:44 +0000441 }
Denis Vlasenkoa60936d2008-06-28 05:04:09 +0000442 if (p_linkname) {
443 file_header->link_target = p_linkname;
444 p_linkname = NULL;
Denis Vlasenkod6772502006-11-24 17:21:44 +0000445 }
446#endif
Denys Vlasenko5e29e262011-03-01 17:21:07 +0100447
448 /* Everything up to and including last ".." component is stripped */
Denys Vlasenkob80acf52011-03-02 01:21:02 +0100449 overlapping_strcpy(file_header->name, strip_unsafe_prefix(file_header->name));
Denys Vlasenko6c563e32015-10-22 01:07:13 +0200450//TODO: do the same for file_header->link_target?
Denis Vlasenkod6772502006-11-24 17:21:44 +0000451
Denis Vlasenko376ce1e2006-11-24 14:51:01 +0000452 /* Strip trailing '/' in directories */
Denis Vlasenko714701c2006-12-22 00:21:07 +0000453 /* Must be done after mode is set as '/' is used to check if it's a directory */
Denis Vlasenko376ce1e2006-11-24 14:51:01 +0000454 cp = last_char_is(file_header->name, '/');
Glenn L McGrath3d5828f2003-08-14 02:55:15 +0000455
Glenn L McGrath8e940982002-11-04 23:47:31 +0000456 if (archive_handle->filter(archive_handle) == EXIT_SUCCESS) {
Denis Vlasenko0381d422008-07-10 23:06:00 +0000457 archive_handle->action_header(/*archive_handle->*/ file_header);
Denis Vlasenkocf30cc82006-11-24 14:53:18 +0000458 /* Note that we kill the '/' only after action_header() */
459 /* (like GNU tar 1.15.1: verbose mode outputs "dir/dir/") */
Denys Vlasenko02365a62010-04-09 10:52:52 +0200460 if (cp)
461 *cp = '\0';
Glenn L McGrath7ca04f32002-09-25 02:47:48 +0000462 archive_handle->action_data(archive_handle);
Denys Vlasenko440a5092012-06-22 16:27:21 +0200463 if (archive_handle->accept || archive_handle->reject
464 || (archive_handle->ah_flags & ARCHIVE_REMEMBER_NAMES)
465 ) {
Denys Vlasenkob768aeb2010-06-26 18:22:41 +0200466 llist_add_to(&archive_handle->passed, file_header->name);
Denys Vlasenko440a5092012-06-22 16:27:21 +0200467 } else /* Caller isn't interested in list of unpacked files */
Denys Vlasenkob768aeb2010-06-26 18:22:41 +0200468 free(file_header->name);
Glenn L McGrath7ca04f32002-09-25 02:47:48 +0000469 } else {
Eric Andersenc7bda1c2004-03-15 08:29:22 +0000470 data_skip(archive_handle);
Denis Vlasenkob5963352006-11-26 01:46:59 +0000471 free(file_header->name);
Glenn L McGrath7ca04f32002-09-25 02:47:48 +0000472 }
473 archive_handle->offset += file_header->size;
474
Denis Vlasenko75103842007-06-20 14:49:47 +0000475 free(file_header->link_target);
Denys Vlasenkob768aeb2010-06-26 18:22:41 +0200476 /* Do not free(file_header->name)!
477 * It might be inserted in archive_handle->passed - see above */
Denis Vlasenkoe00e5022008-02-14 20:37:54 +0000478#if ENABLE_FEATURE_TAR_UNAME_GNAME
Denys Vlasenkoaa4977d2010-01-06 10:53:17 +0100479 free(file_header->tar__uname);
480 free(file_header->tar__gname);
Denis Vlasenkoe00e5022008-02-14 20:37:54 +0000481#endif
Denys Vlasenkoebfa9b52013-11-19 14:44:04 +0100482 return EXIT_SUCCESS; /* "decoded one header" */
Eric Andersen2276d832002-07-11 11:11:56 +0000483}