blob: 8159497673225c0eda81fbaa345e57c83ef80738 [file] [log] [blame]
Erik Andersene49d5ec2000-02-08 19:58:47 +00001/* vi: set sw=4 ts=4: */
Eric Andersencc8ed391999-10-05 16:24:54 +00002/*
Erik Andersen68a9ea42000-04-04 18:39:50 +00003 * Mini tar implementation for busybox
Erik Andersen6acaa402000-03-26 14:03:20 +00004 *
Glenn L McGrath2e772ed2001-10-05 02:58:48 +00005 * Modified to use common extraction code used by ar, cpio, dpkg-deb, dpkg
6 * Glenn McGrath <bug1@optushome.com.au>
7 *
Erik Andersen61677fe2000-04-13 01:18:56 +00008 * Note, that as of BusyBox-0.43, tar has been completely rewritten from the
9 * ground up. It still has remnants of the old code lying about, but it is
Eric Andersen77d92682001-05-23 20:32:09 +000010 * very different now (i.e., cleaner, less global variables, etc.)
Eric Andersenc4996011999-10-20 22:08:37 +000011 *
Eric Andersenbdfd0d72001-10-24 05:00:29 +000012 * Copyright (C) 1999,2000 by Lineo, inc. and Erik Andersen
13 * Copyright (C) 1999,2000,2001 by Erik Andersen <andersee@debian.org>
Eric Andersen96bcfd31999-11-12 01:30:18 +000014 *
Erik Andersen6acaa402000-03-26 14:03:20 +000015 * Based in part on the tar implementation in sash
16 * Copyright (c) 1999 by David I. Bell
17 * Permission is granted to use, distribute, or modify this source,
18 * provided that this copyright notice remains intact.
19 * Permission to distribute sash derived code under the GPL has been granted.
20 *
Erik Andersen68a9ea42000-04-04 18:39:50 +000021 * Based in part on the tar implementation from busybox-0.28
Erik Andersen6acaa402000-03-26 14:03:20 +000022 * Copyright (C) 1995 Bruce Perens
23 * This is free software under the GNU General Public License.
24 *
Eric Andersenc4996011999-10-20 22:08:37 +000025 * This program is free software; you can redistribute it and/or modify
26 * it under the terms of the GNU General Public License as published by
27 * the Free Software Foundation; either version 2 of the License, or
28 * (at your option) any later version.
29 *
30 * This program is distributed in the hope that it will be useful,
31 * but WITHOUT ANY WARRANTY; without even the implied warranty of
32 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
33 * General Public License for more details.
34 *
35 * You should have received a copy of the GNU General Public License
36 * along with this program; if not, write to the Free Software
37 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
38 *
Eric Andersencc8ed391999-10-05 16:24:54 +000039 */
40
Eric Andersencc8ed391999-10-05 16:24:54 +000041#include <fcntl.h>
Matt Kraai43c8c382000-09-04 16:51:55 +000042#include <getopt.h>
Glenn L McGrath2e772ed2001-10-05 02:58:48 +000043#include <search.h>
44#include <stdio.h>
Eric Andersened3ef502001-01-27 08:24:39 +000045#include <stdlib.h>
46#include <unistd.h>
Glenn L McGrath2e772ed2001-10-05 02:58:48 +000047#include <fnmatch.h>
48#include <string.h>
49#include <errno.h>
Glenn L McGrathef0eab52001-10-25 14:49:48 +000050#include "unarchive.h"
Eric Andersencbe31da2001-02-20 06:14:08 +000051#include "busybox.h"
Eric Andersencc8ed391999-10-05 16:24:54 +000052
Eric Andersenbdfd0d72001-10-24 05:00:29 +000053#ifdef CONFIG_FEATURE_TAR_CREATE
Eric Andersencc8ed391999-10-05 16:24:54 +000054
/* Constants describing the on-disk tar format written by this applet. */

/* Magic string stored in the header; the literal's implicit NUL is the
 * sixth byte of the magic field. */
# define TAR_MAGIC "ustar"
/* Version bytes that follow the magic (kept GNU tar compatible).
 * NOTE(review): GNU tar's old-format signature is "ustar" followed by two
 * spaces and a NUL -- confirm this literal has not lost a space. */
# define TAR_VERSION " "

/* Fallback device-number splitters, used only when the system headers
 * did not already provide MAJOR (MINOR is assumed to come with it). */
# ifndef MAJOR
#  define MAJOR(dev) (((dev)>>8)&0xff)
#  define MINOR(dev) ((dev)&0xff)
# endif

/* Size in bytes of one tar block; headers and file data are padded to it. */
static const int TAR_BLOCK_SIZE = 512;
/* Width of the header's magic field (including the NUL). */
static const int TAR_MAGIC_LEN = 6;
/* Width of the header's version field. */
static const int TAR_VERSION_LEN = 2;
Eric Andersencc8ed391999-10-05 16:24:54 +000067
/*
 * POSIX tar header block, from POSIX 1003.1-1990.
 *
 * Every field is a fixed-width character array; the struct is laid out so
 * that it occupies exactly one 512-byte tar block.
 */
enum { NAME_SIZE = 100 }; /* because gcc won't let me use 'static const int' */

typedef struct TarHeader
{                                   /* byte offset */
	char name[NAME_SIZE];           /*   0-99  member name */
	char mode[8];                   /* 100-107 */
	char uid[8];                    /* 108-115 */
	char gid[8];                    /* 116-123 */
	char size[12];                  /* 124-135 */
	char mtime[12];                 /* 136-147 */
	char chksum[8];                 /* 148-155 */
	char typeflag;                  /* 156-156 */
	char linkname[NAME_SIZE];       /* 157-256 link target */
	char magic[6];                  /* 257-262 */
	char version[2];                /* 263-264 */
	char uname[32];                 /* 265-296 */
	char gname[32];                 /* 297-328 */
	char devmajor[8];               /* 329-336 */
	char devminor[8];               /* 337-344 */
	char prefix[155];               /* 345-499 */
	char padding[12];               /* 500-511 (pad to exactly the TAR_BLOCK_SIZE) */
} TarHeader;
Eric Andersencc8ed391999-10-05 16:24:54 +000091
/*
** One node of the singly linked list used to recognise hard links while an
** archive is being created.
**
** writeTarFile(), writeFileToTarball(), and writeTarHeader() are the only
** functions that deal with this structure, and even they go through the
** xxxHardLinkInfo() helpers.
*/
typedef struct HardLinkInfo HardLinkInfo;
struct HardLinkInfo
{
	HardLinkInfo *next;     /* Next entry in list */
	dev_t dev;              /* Device number */
	ino_t ino;              /* Inode number */
	short linkCount;        /* (Hard) Link Count */
	char name[1];           /* Start of filename (must be last); the node is
	                           over-allocated so the whole name fits here */
};
106
Erik Andersen68a9ea42000-04-04 18:39:50 +0000107/* Some info to be carried along when creating a new tarball */
108struct TarBallInfo
109{
110 char* fileName; /* File name of the tarball */
111 int tarFd; /* Open-for-write file descriptor
112 for the tarball */
113 struct stat statBuf; /* Stat info for the tarball, letting
114 us know the inode and device that the
115 tarball lives, so we can avoid trying
116 to include the tarball into itself */
117 int verboseFlag; /* Whether to print extra stuff or not */
Erik Andersenecd51242000-04-08 03:08:21 +0000118 char** excludeList; /* List of files to not include */
Eric Andersen3d957c82000-12-07 00:34:58 +0000119 HardLinkInfo *hlInfoHead; /* Hard Link Tracking Information */
120 HardLinkInfo *hlInfo; /* Hard Link Info for the current file */
Erik Andersen68a9ea42000-04-04 18:39:50 +0000121};
122typedef struct TarBallInfo TarBallInfo;
123
/* Values of the header's typeflag byte, one per kind of archive member. */
typedef enum TarFileType
{
	REGTYPE0    = '\0',     /* regular file (ancient bug compat)*/
	REGTYPE     = '0',      /* regular file */
	LNKTYPE     = '1',      /* hard link */
	SYMTYPE     = '2',      /* symbolic link */
	CHRTYPE     = '3',      /* character special */
	BLKTYPE     = '4',      /* block special */
	DIRTYPE     = '5',      /* directory */
	FIFOTYPE    = '6',      /* FIFO special */
	CONTTYPE    = '7',      /* reserved */
	GNULONGLINK = 'K',      /* GNU long (>100 chars) link name */
	GNULONGNAME = 'L'       /* GNU long (>100 chars) file name */
} TarFileType;
Erik Andersen68a9ea42000-04-04 18:39:50 +0000140
Eric Andersen3d957c82000-12-07 00:34:58 +0000141/* Might be faster (and bigger) if the dev/ino were stored in numeric order;) */
142static void
143addHardLinkInfo (HardLinkInfo **hlInfoHeadPtr, dev_t dev, ino_t ino,
144 short linkCount, const char *name)
145{
146 /* Note: hlInfoHeadPtr can never be NULL! */
147 HardLinkInfo *hlInfo;
148
149 hlInfo = (HardLinkInfo *)xmalloc(sizeof(HardLinkInfo)+strlen(name)+1);
150 if (hlInfo) {
151 hlInfo->next = *hlInfoHeadPtr;
152 *hlInfoHeadPtr = hlInfo;
153 hlInfo->dev = dev;
154 hlInfo->ino = ino;
155 hlInfo->linkCount = linkCount;
156 strcpy(hlInfo->name, name);
157 }
158 return;
159}
160
161static void
162freeHardLinkInfo (HardLinkInfo **hlInfoHeadPtr)
163{
164 HardLinkInfo *hlInfo = NULL;
165 HardLinkInfo *hlInfoNext = NULL;
166
167 if (hlInfoHeadPtr) {
168 hlInfo = *hlInfoHeadPtr;
169 while (hlInfo) {
170 hlInfoNext = hlInfo->next;
171 free(hlInfo);
172 hlInfo = hlInfoNext;
173 }
174 *hlInfoHeadPtr = NULL;
175 }
176 return;
177}
178
179/* Might be faster (and bigger) if the dev/ino were stored in numeric order;) */
180static HardLinkInfo *
181findHardLinkInfo (HardLinkInfo *hlInfo, dev_t dev, ino_t ino)
182{
183 while(hlInfo) {
184 if ((ino == hlInfo->ino) && (dev == hlInfo->dev))
185 break;
186 hlInfo = hlInfo->next;
187 }
188 return(hlInfo);
189}
190
Erik Andersen6acaa402000-03-26 14:03:20 +0000191/* Put an octal string into the specified buffer.
192 * The number is zero and space padded and possibly null padded.
193 * Returns TRUE if successful. */
194static int putOctal (char *cp, int len, long value)
195{
196 int tempLength;
Erik Andersen6acaa402000-03-26 14:03:20 +0000197 char tempBuffer[32];
Erik Andersen5661fe02000-04-05 01:00:52 +0000198 char *tempString = tempBuffer;
Erik Andersen6acaa402000-03-26 14:03:20 +0000199
200 /* Create a string of the specified length with an initial space,
201 * leading zeroes and the octal number, and a trailing null. */
Erik Andersen5661fe02000-04-05 01:00:52 +0000202 sprintf (tempString, "%0*lo", len - 1, value);
Erik Andersen6acaa402000-03-26 14:03:20 +0000203
204 /* If the string is too large, suppress the leading space. */
Erik Andersen5661fe02000-04-05 01:00:52 +0000205 tempLength = strlen (tempString) + 1;
Erik Andersen6acaa402000-03-26 14:03:20 +0000206 if (tempLength > len) {
207 tempLength--;
208 tempString++;
209 }
210
211 /* If the string is still too large, suppress the trailing null. */
212 if (tempLength > len)
213 tempLength--;
214
215 /* If the string is still too large, fail. */
216 if (tempLength > len)
217 return FALSE;
218
219 /* Copy the string to the field. */
220 memcpy (cp, tempString, len);
221
222 return TRUE;
223}
224
Erik Andersen68a9ea42000-04-04 18:39:50 +0000225/* Write out a tar header for the specified file/directory/whatever */
Erik Andersen3364d782000-03-28 00:58:14 +0000226static int
Matt Kraaie80a2632000-12-19 20:45:49 +0000227writeTarHeader(struct TarBallInfo *tbInfo, const char *header_name,
228 const char *real_name, struct stat *statbuf)
Erik Andersen6acaa402000-03-26 14:03:20 +0000229{
Erik Andersen5661fe02000-04-05 01:00:52 +0000230 long chksum=0;
231 struct TarHeader header;
232 const unsigned char *cp = (const unsigned char *) &header;
233 ssize_t size = sizeof(struct TarHeader);
Eric Andersenfdd51032000-08-02 18:48:26 +0000234
Erik Andersen5661fe02000-04-05 01:00:52 +0000235 memset( &header, 0, size);
Erik Andersen3364d782000-03-28 00:58:14 +0000236
Matt Kraaie80a2632000-12-19 20:45:49 +0000237 strncpy(header.name, header_name, sizeof(header.name));
Erik Andersenecd51242000-04-08 03:08:21 +0000238
Erik Andersen5661fe02000-04-05 01:00:52 +0000239 putOctal(header.mode, sizeof(header.mode), statbuf->st_mode);
240 putOctal(header.uid, sizeof(header.uid), statbuf->st_uid);
241 putOctal(header.gid, sizeof(header.gid), statbuf->st_gid);
242 putOctal(header.size, sizeof(header.size), 0); /* Regular file size is handled later */
243 putOctal(header.mtime, sizeof(header.mtime), statbuf->st_mtime);
244 strncpy(header.magic, TAR_MAGIC TAR_VERSION,
245 TAR_MAGIC_LEN + TAR_VERSION_LEN );
Erik Andersen68a9ea42000-04-04 18:39:50 +0000246
Erik Andersen84e09e42000-04-08 20:58:35 +0000247 /* Enter the user and group names (default to root if it fails) */
Erik Andersen5661fe02000-04-05 01:00:52 +0000248 my_getpwuid(header.uname, statbuf->st_uid);
Erik Andersen5661fe02000-04-05 01:00:52 +0000249 if (! *header.uname)
Erik Andersen84e09e42000-04-08 20:58:35 +0000250 strcpy(header.uname, "root");
Erik Andersen5661fe02000-04-05 01:00:52 +0000251 my_getgrgid(header.gname, statbuf->st_gid);
252 if (! *header.uname)
Erik Andersen84e09e42000-04-08 20:58:35 +0000253 strcpy(header.uname, "root");
Erik Andersen5661fe02000-04-05 01:00:52 +0000254
Eric Andersen3d957c82000-12-07 00:34:58 +0000255 if (tbInfo->hlInfo) {
256 /* This is a hard link */
257 header.typeflag = LNKTYPE;
258 strncpy(header.linkname, tbInfo->hlInfo->name, sizeof(header.linkname));
259 } else if (S_ISLNK(statbuf->st_mode)) {
Mark Whitley8a633262001-04-30 18:17:00 +0000260 char *lpath = xreadlink(real_name);
Eric Andersen28355a32001-05-07 17:48:28 +0000261 if (!lpath) /* Already printed err msg inside xreadlink() */
262 return ( FALSE);
Erik Andersen5661fe02000-04-05 01:00:52 +0000263 header.typeflag = SYMTYPE;
Mark Whitley8a633262001-04-30 18:17:00 +0000264 strncpy(header.linkname, lpath, sizeof(header.linkname));
265 free(lpath);
Erik Andersen68a9ea42000-04-04 18:39:50 +0000266 } else if (S_ISDIR(statbuf->st_mode)) {
Erik Andersen5661fe02000-04-05 01:00:52 +0000267 header.typeflag = DIRTYPE;
268 strncat(header.name, "/", sizeof(header.name));
Erik Andersen68a9ea42000-04-04 18:39:50 +0000269 } else if (S_ISCHR(statbuf->st_mode)) {
Erik Andersen5661fe02000-04-05 01:00:52 +0000270 header.typeflag = CHRTYPE;
271 putOctal(header.devmajor, sizeof(header.devmajor), MAJOR(statbuf->st_rdev));
272 putOctal(header.devminor, sizeof(header.devminor), MINOR(statbuf->st_rdev));
Erik Andersen68a9ea42000-04-04 18:39:50 +0000273 } else if (S_ISBLK(statbuf->st_mode)) {
Erik Andersen5661fe02000-04-05 01:00:52 +0000274 header.typeflag = BLKTYPE;
275 putOctal(header.devmajor, sizeof(header.devmajor), MAJOR(statbuf->st_rdev));
276 putOctal(header.devminor, sizeof(header.devminor), MINOR(statbuf->st_rdev));
Erik Andersen68a9ea42000-04-04 18:39:50 +0000277 } else if (S_ISFIFO(statbuf->st_mode)) {
Erik Andersen5661fe02000-04-05 01:00:52 +0000278 header.typeflag = FIFOTYPE;
279 } else if (S_ISREG(statbuf->st_mode)) {
280 header.typeflag = REGTYPE;
281 putOctal(header.size, sizeof(header.size), statbuf->st_size);
Erik Andersen68a9ea42000-04-04 18:39:50 +0000282 } else {
Matt Kraaidd19c692001-01-31 19:00:21 +0000283 error_msg("%s: Unknown file type", real_name);
Erik Andersen68a9ea42000-04-04 18:39:50 +0000284 return ( FALSE);
285 }
Erik Andersen68a9ea42000-04-04 18:39:50 +0000286
Eric Andersen77d92682001-05-23 20:32:09 +0000287 /* Calculate and store the checksum (i.e., the sum of all of the bytes of
Erik Andersen5661fe02000-04-05 01:00:52 +0000288 * the header). The checksum field must be filled with blanks for the
289 * calculation. The checksum field is formatted differently from the
290 * other fields: it has [6] digits, a null, then a space -- rather than
291 * digits, followed by a null like the other fields... */
292 memset(header.chksum, ' ', sizeof(header.chksum));
293 cp = (const unsigned char *) &header;
294 while (size-- > 0)
295 chksum += *cp++;
296 putOctal(header.chksum, 7, chksum);
297
298 /* Now write the header out to disk */
Mark Whitleyf57c9442000-12-07 19:56:48 +0000299 if ((size=full_write(tbInfo->tarFd, (char*)&header, sizeof(struct TarHeader))) < 0) {
Matt Kraaie80a2632000-12-19 20:45:49 +0000300 error_msg(io_error, real_name, strerror(errno));
Erik Andersen5661fe02000-04-05 01:00:52 +0000301 return ( FALSE);
302 }
303 /* Pad the header up to the tar block size */
304 for (; size<TAR_BLOCK_SIZE; size++) {
305 write(tbInfo->tarFd, "\0", 1);
306 }
307 /* Now do the verbose thing (or not) */
Eric Andersenfdd51032000-08-02 18:48:26 +0000308 if (tbInfo->verboseFlag==TRUE) {
309 FILE *vbFd = stdout;
310 if (tbInfo->tarFd == fileno(stdout)) // If the archive goes to stdout, verbose to stderr
311 vbFd = stderr;
312 fprintf(vbFd, "%s\n", header.name);
313 }
Erik Andersen3364d782000-03-28 00:58:14 +0000314
315 return ( TRUE);
316}
317
Eric Andersenc265b172001-10-27 03:20:00 +0000318# if defined CONFIG_FEATURE_TAR_EXCLUDE
/*
 * Decide whether `file' is matched by any pattern of the NULL-terminated
 * array `excluded_files'. Returns 1 if it is, 0 otherwise (also when the
 * array itself is NULL).
 *
 * A pattern starting with '/' is matched against the whole name only. Any
 * other pattern is tried at the start of every path component of `file'.
 * Both cases use FNM_PATHNAME | FNM_LEADING_DIR.
 */
static int exclude_file(char **excluded_files, const char *file)
{
	const int match_flags = FNM_PATHNAME | FNM_LEADING_DIR;
	char **pattern;

	if (!excluded_files)
		return 0;

	for (pattern = excluded_files; *pattern != NULL; pattern++) {
		const char *component;

		if ((*pattern)[0] == '/') {
			/* Anchored pattern: one attempt against the full name */
			if (fnmatch(*pattern, file, match_flags) == 0)
				return 1;
			continue;
		}

		for (component = file; *component != '\0'; component++) {
			/* Only positions that begin a path component qualify */
			int at_start = (component == file || component[-1] == '/');

			if (!at_start || *component == '/')
				continue;
			if (fnmatch(*pattern, component, match_flags) == 0)
				return 1;
		}
	}

	return 0;
}
Eric Andersenc265b172001-10-27 03:20:00 +0000345#endif
Erik Andersen3364d782000-03-28 00:58:14 +0000346
Erik Andersen68a9ea42000-04-04 18:39:50 +0000347static int writeFileToTarball(const char *fileName, struct stat *statbuf, void* userData)
Erik Andersen3364d782000-03-28 00:58:14 +0000348{
Erik Andersen68a9ea42000-04-04 18:39:50 +0000349 struct TarBallInfo *tbInfo = (struct TarBallInfo *)userData;
Matt Kraaie80a2632000-12-19 20:45:49 +0000350 const char *header_name;
Erik Andersen68a9ea42000-04-04 18:39:50 +0000351
Eric Andersen3d957c82000-12-07 00:34:58 +0000352 /*
353 ** Check to see if we are dealing with a hard link.
354 ** If so -
355 ** Treat the first occurance of a given dev/inode as a file while
356 ** treating any additional occurances as hard links. This is done
357 ** by adding the file information to the HardLinkInfo linked list.
358 */
359 tbInfo->hlInfo = NULL;
360 if (statbuf->st_nlink > 1) {
361 tbInfo->hlInfo = findHardLinkInfo(tbInfo->hlInfoHead, statbuf->st_dev,
362 statbuf->st_ino);
363 if (tbInfo->hlInfo == NULL)
364 addHardLinkInfo (&tbInfo->hlInfoHead, statbuf->st_dev,
365 statbuf->st_ino, statbuf->st_nlink, fileName);
366 }
367
Erik Andersen68a9ea42000-04-04 18:39:50 +0000368 /* It is against the rules to archive a socket */
369 if (S_ISSOCK(statbuf->st_mode)) {
Matt Kraaidd19c692001-01-31 19:00:21 +0000370 error_msg("%s: socket ignored", fileName);
Erik Andersen68a9ea42000-04-04 18:39:50 +0000371 return( TRUE);
372 }
373
374 /* It is a bad idea to store the archive we are in the process of creating,
375 * so check the device and inode to be sure that this particular file isn't
376 * the new tarball */
377 if (tbInfo->statBuf.st_dev == statbuf->st_dev &&
378 tbInfo->statBuf.st_ino == statbuf->st_ino) {
Matt Kraaidd19c692001-01-31 19:00:21 +0000379 error_msg("%s: file is the archive; skipping", fileName);
Erik Andersen68a9ea42000-04-04 18:39:50 +0000380 return( TRUE);
381 }
382
Matt Kraaie80a2632000-12-19 20:45:49 +0000383 header_name = fileName;
384 while (header_name[0] == '/') {
Matt Kraaia1f97752000-12-19 06:24:08 +0000385 static int alreadyWarned=FALSE;
386 if (alreadyWarned==FALSE) {
Matt Kraaidd19c692001-01-31 19:00:21 +0000387 error_msg("Removing leading '/' from member names");
Matt Kraaia1f97752000-12-19 06:24:08 +0000388 alreadyWarned=TRUE;
389 }
Matt Kraaie80a2632000-12-19 20:45:49 +0000390 header_name++;
Matt Kraaia1f97752000-12-19 06:24:08 +0000391 }
392
Eric Andersen1b1cfde2000-09-24 00:54:37 +0000393 if (strlen(fileName) >= NAME_SIZE) {
Mark Whitleyf57c9442000-12-07 19:56:48 +0000394 error_msg(name_longer_than_foo, NAME_SIZE);
Eric Andersen1b1cfde2000-09-24 00:54:37 +0000395 return ( TRUE);
396 }
397
Matt Kraaie80a2632000-12-19 20:45:49 +0000398 if (header_name[0] == '\0')
Matt Kraaia1f97752000-12-19 06:24:08 +0000399 return TRUE;
400
Eric Andersenbdfd0d72001-10-24 05:00:29 +0000401# if defined CONFIG_FEATURE_TAR_EXCLUDE
Matt Kraaibe7499c2001-01-03 17:22:10 +0000402 if (exclude_file(tbInfo->excludeList, header_name)) {
403 return SKIP;
Matt Kraaia1f97752000-12-19 06:24:08 +0000404 }
Eric Andersenbdfd0d72001-10-24 05:00:29 +0000405# endif //CONFIG_FEATURE_TAR_EXCLUDE
Matt Kraaia1f97752000-12-19 06:24:08 +0000406
Matt Kraaie80a2632000-12-19 20:45:49 +0000407 if (writeTarHeader(tbInfo, header_name, fileName, statbuf)==FALSE) {
Erik Andersen5661fe02000-04-05 01:00:52 +0000408 return( FALSE);
Erik Andersen68a9ea42000-04-04 18:39:50 +0000409 }
Erik Andersen5661fe02000-04-05 01:00:52 +0000410
411 /* Now, if the file is a regular file, copy it out to the tarball */
Eric Andersen3d957c82000-12-07 00:34:58 +0000412 if ((tbInfo->hlInfo == NULL)
413 && (S_ISREG(statbuf->st_mode))) {
Erik Andersen5661fe02000-04-05 01:00:52 +0000414 int inputFileFd;
415 char buffer[BUFSIZ];
416 ssize_t size=0, readSize=0;
417
418 /* open the file we want to archive, and make sure all is well */
419 if ((inputFileFd = open(fileName, O_RDONLY)) < 0) {
Matt Kraaidd19c692001-01-31 19:00:21 +0000420 error_msg("%s: Cannot open: %s", fileName, strerror(errno));
Erik Andersen5661fe02000-04-05 01:00:52 +0000421 return( FALSE);
422 }
423
424 /* write the file to the archive */
Mark Whitleyf57c9442000-12-07 19:56:48 +0000425 while ( (size = full_read(inputFileFd, buffer, sizeof(buffer))) > 0 ) {
426 if (full_write(tbInfo->tarFd, buffer, size) != size ) {
Erik Andersen5661fe02000-04-05 01:00:52 +0000427 /* Output file seems to have a problem */
Mark Whitleyf57c9442000-12-07 19:56:48 +0000428 error_msg(io_error, fileName, strerror(errno));
Erik Andersen5661fe02000-04-05 01:00:52 +0000429 return( FALSE);
430 }
431 readSize+=size;
432 }
433 if (size == -1) {
Mark Whitleyf57c9442000-12-07 19:56:48 +0000434 error_msg(io_error, fileName, strerror(errno));
Erik Andersen5661fe02000-04-05 01:00:52 +0000435 return( FALSE);
436 }
437 /* Pad the file up to the tar block size */
438 for (; (readSize%TAR_BLOCK_SIZE) != 0; readSize++) {
439 write(tbInfo->tarFd, "\0", 1);
440 }
441 close( inputFileFd);
442 }
Erik Andersen68a9ea42000-04-04 18:39:50 +0000443
444 return( TRUE);
Erik Andersen6acaa402000-03-26 14:03:20 +0000445}
446
Matt Kraaid8ad76c2000-11-08 02:35:47 +0000447static int writeTarFile(const char* tarName, int verboseFlag, char **argv,
448 char** excludeList)
Erik Andersen6acaa402000-03-26 14:03:20 +0000449{
Erik Andersen3364d782000-03-28 00:58:14 +0000450 int tarFd=-1;
Erik Andersen68a9ea42000-04-04 18:39:50 +0000451 int errorFlag=FALSE;
Erik Andersen5661fe02000-04-05 01:00:52 +0000452 ssize_t size;
Erik Andersen68a9ea42000-04-04 18:39:50 +0000453 struct TarBallInfo tbInfo;
454 tbInfo.verboseFlag = verboseFlag;
Eric Andersen3d957c82000-12-07 00:34:58 +0000455 tbInfo.hlInfoHead = NULL;
Erik Andersen3364d782000-03-28 00:58:14 +0000456
457 /* Make sure there is at least one file to tar up. */
Matt Kraaid8ad76c2000-11-08 02:35:47 +0000458 if (*argv == NULL)
Matt Kraaidd19c692001-01-31 19:00:21 +0000459 error_msg_and_die("Cowardly refusing to create an empty archive");
Erik Andersen6acaa402000-03-26 14:03:20 +0000460
461 /* Open the tar file for writing. */
Matt Kraaid8ad76c2000-11-08 02:35:47 +0000462 if (!strcmp(tarName, "-"))
Erik Andersen68a9ea42000-04-04 18:39:50 +0000463 tbInfo.tarFd = fileno(stdout);
Erik Andersen6acaa402000-03-26 14:03:20 +0000464 else
Erik Andersen68a9ea42000-04-04 18:39:50 +0000465 tbInfo.tarFd = open (tarName, O_WRONLY | O_CREAT | O_TRUNC, 0644);
466 if (tbInfo.tarFd < 0) {
Matt Kraai1fa1ade2000-12-18 03:57:16 +0000467 perror_msg( "Error opening '%s'", tarName);
Eric Andersen3d957c82000-12-07 00:34:58 +0000468 freeHardLinkInfo(&tbInfo.hlInfoHead);
Erik Andersen6acaa402000-03-26 14:03:20 +0000469 return ( FALSE);
470 }
Erik Andersenecd51242000-04-08 03:08:21 +0000471 tbInfo.excludeList=excludeList;
Erik Andersen68a9ea42000-04-04 18:39:50 +0000472 /* Store the stat info for the tarball's file, so
473 * can avoid including the tarball into itself.... */
474 if (fstat(tbInfo.tarFd, &tbInfo.statBuf) < 0)
Mark Whitleyf57c9442000-12-07 19:56:48 +0000475 error_msg_and_die(io_error, tarName, strerror(errno));
Erik Andersen6acaa402000-03-26 14:03:20 +0000476
Erik Andersen6acaa402000-03-26 14:03:20 +0000477 /* Read the directory/files and iterate over them one at a time */
Matt Kraaid8ad76c2000-11-08 02:35:47 +0000478 while (*argv != NULL) {
Mark Whitleyf57c9442000-12-07 19:56:48 +0000479 if (recursive_action(*argv++, TRUE, FALSE, FALSE,
Erik Andersen68a9ea42000-04-04 18:39:50 +0000480 writeFileToTarball, writeFileToTarball,
481 (void*) &tbInfo) == FALSE) {
482 errorFlag = TRUE;
Erik Andersen3364d782000-03-28 00:58:14 +0000483 }
Erik Andersen6acaa402000-03-26 14:03:20 +0000484 }
Erik Andersen5661fe02000-04-05 01:00:52 +0000485 /* Write two empty blocks to the end of the archive */
486 for (size=0; size<(2*TAR_BLOCK_SIZE); size++) {
487 write(tbInfo.tarFd, "\0", 1);
488 }
Erik Andersen0817d132000-04-09 15:17:40 +0000489
490 /* To be pedantically correct, we would check if the tarball
Eric Andersen3c5ee9a2000-11-14 22:15:48 +0000491 * is smaller than 20 tar blocks, and pad it if it was smaller,
Erik Andersen0817d132000-04-09 15:17:40 +0000492 * but that isn't necessary for GNU tar interoperability, and
493 * so is considered a waste of space */
494
Erik Andersen68a9ea42000-04-04 18:39:50 +0000495 /* Hang up the tools, close up shop, head home */
Erik Andersen6acaa402000-03-26 14:03:20 +0000496 close(tarFd);
Erik Andersen68a9ea42000-04-04 18:39:50 +0000497 if (errorFlag == TRUE) {
Matt Kraaidd19c692001-01-31 19:00:21 +0000498 error_msg("Error exit delayed from previous errors");
Eric Andersen3d957c82000-12-07 00:34:58 +0000499 freeHardLinkInfo(&tbInfo.hlInfoHead);
Erik Andersen68a9ea42000-04-04 18:39:50 +0000500 return(FALSE);
501 }
Eric Andersen3d957c82000-12-07 00:34:58 +0000502 freeHardLinkInfo(&tbInfo.hlInfoHead);
Erik Andersen6acaa402000-03-26 14:03:20 +0000503 return( TRUE);
504}
Glenn L McGrath2e772ed2001-10-05 02:58:48 +0000505#endif //tar_create
Erik Andersen6acaa402000-03-26 14:03:20 +0000506
/*
 * Append a copy of `new_name' to the NULL-terminated string array *list.
 *
 * new_name   - string to add (duplicated with xstrdup)
 * list       - address of the array; may point to NULL for an empty list,
 *              and is updated when the array is moved by realloc
 * list_count - address of the number of entries, incremented on return
 *
 * Dies if the array cannot be grown.
 */
void append_file_to_list(const char *new_name, char ***list, int *list_count)
{
	char **grown;

	/* One slot for the new entry and one for the terminating NULL */
	grown = realloc(*list, sizeof(char *) * (*list_count + 2));
	if (grown == NULL)
		error_msg_and_die("Memory exhausted");
	*list = grown;

	grown[*list_count] = xstrdup(new_name);
	(*list_count)++;
	grown[*list_count] = NULL;
}
514
/*
 * Read `filename' line by line and append every line, with its trailing
 * newline removed, to the string array *name_list via
 * append_file_to_list(). *num_of_entries is updated accordingly.
 */
void append_file_list_to_list(char *filename, char ***name_list, int *num_of_entries)
{
	FILE *list_file = xfopen(filename, "r");

	for (;;) {
		char *newline;
		char *entry = get_line_from_file(list_file);

		if (entry == NULL)
			break;

		/* Chop the line terminator, if the line has one */
		newline = last_char_is(entry, '\n');
		if (newline)
			*newline = '\0';

		/* The list keeps its own copy, so the line can be released */
		append_file_to_list(entry, name_list, num_of_entries);
		free(entry);
	}
	fclose(list_file);
}
Erik Andersen6acaa402000-03-26 14:03:20 +0000532
Eric Andersenbdfd0d72001-10-24 05:00:29 +0000533#ifdef CONFIG_FEATURE_TAR_EXCLUDE
/*
 * Create a list of names that are in the include list AND NOT in the exclude lists
 *
 * include_list - NULL-terminated array of heap-allocated strings, or NULL
 * exclude_list - NULL-terminated array of strings, or NULL for "exclude
 *                nothing"
 *
 * Returns a newly allocated NULL-terminated array (possibly holding only
 * the terminator) that takes over the pointers of the kept names. Names
 * that are excluded are free()d. The include_list array itself is neither
 * freed nor modified. Returns NULL when include_list is NULL or when the
 * new array cannot be allocated (nothing is freed in that case).
 */
char **list_and_not_list(char **include_list, char **exclude_list)
{
	char **new_include_list;
	int new_include_count = 0;
	int include_total = 0;
	int include_count;

	if (include_list == NULL) {
		return(NULL);
	}

	/* Size the result once: it can never hold more than the input */
	while (include_list[include_total] != NULL) {
		include_total++;
	}
	new_include_list = malloc(sizeof(char *) * (include_total + 1));
	if (new_include_list == NULL) {
		return(NULL);
	}

	for (include_count = 0; include_count < include_total; include_count++) {
		int found = 0;
		int exclude_count;

		if (exclude_list != NULL) {
			for (exclude_count = 0; exclude_list[exclude_count] != NULL; exclude_count++) {
				if (strcmp(include_list[include_count], exclude_list[exclude_count]) == 0) {
					found = 1;
					break;
				}
			}
		}

		if (found) {
			free(include_list[include_count]);
		} else {
			new_include_list[new_include_count] = include_list[include_count];
			new_include_count++;
		}
	}
	new_include_list[new_include_count] = NULL;
	return(new_include_list);
}
Erik Andersen6acaa402000-03-26 14:03:20 +0000571#endif
572
Glenn L McGrath2e772ed2001-10-05 02:58:48 +0000573int tar_main(int argc, char **argv)
574{
575 enum untar_funct_e {
576 /* These are optional */
577 untar_from_file = 1,
578 untar_from_stdin = 2,
579 untar_unzip = 4,
580 /* Require one and only one of these */
581 untar_list = 8,
582 untar_create = 16,
583 untar_extract = 32
584 };
585
Glenn L McGrath2e772ed2001-10-05 02:58:48 +0000586 FILE *src_stream = NULL;
587 FILE *uncompressed_stream = NULL;
588 char **include_list = NULL;
Glenn L McGrath4bef7b42001-10-13 19:43:46 +0000589 char **exclude_list = NULL;
Glenn L McGrath2e772ed2001-10-05 02:58:48 +0000590 char *src_filename = NULL;
591 char *dst_prefix = NULL;
592 char *file_list_name = NULL;
593 int opt;
594 unsigned short untar_funct = 0;
595 unsigned short untar_funct_required = 0;
596 unsigned short extract_function = 0;
Glenn L McGrath0e766182001-10-13 05:03:29 +0000597 int include_list_count = 0;
Glenn L McGrath4bef7b42001-10-13 19:43:46 +0000598 int exclude_list_count = 0;
Glenn L McGrath2e772ed2001-10-05 02:58:48 +0000599 int gunzip_pid;
600 int gz_fd = 0;
601
602 if (argc < 2) {
603 show_usage();
604 }
605
606 /* Prepend '-' to the first argument if required */
607 if (argv[1][0] != '-') {
608 char *tmp = xmalloc(strlen(argv[1]) + 2);
609 tmp[0] = '-';
610 strcpy(tmp + 1, argv[1]);
611 argv[1] = tmp;
612 }
613
614 while ((opt = getopt(argc, argv, "ctxT:X:C:f:Opvz")) != -1) {
615 switch (opt) {
616
617 /* One and only one of these is required */
618 case 'c':
619 untar_funct_required |= untar_create;
620 break;
621 case 't':
622 untar_funct_required |= untar_list;
623 extract_function |= extract_list |extract_unconditional;
624 break;
625 case 'x':
626 untar_funct_required |= untar_extract;
627 extract_function |= (extract_all_to_fs | extract_unconditional | extract_create_leading_dirs);
628 break;
629
630 /* These are optional */
631 /* Exclude or Include files listed in <filename>*/
Eric Andersenbdfd0d72001-10-24 05:00:29 +0000632#ifdef CONFIG_FEATURE_TAR_EXCLUDE
Glenn L McGrath2e772ed2001-10-05 02:58:48 +0000633 case 'X':
Glenn L McGrathd642a672001-10-13 06:54:45 +0000634 append_file_list_to_list(optarg, &exclude_list, &exclude_list_count);
Glenn L McGrath2e772ed2001-10-05 02:58:48 +0000635 break;
636#endif
637 case 'T':
638 // by default a list is an include list
Glenn L McGrathd642a672001-10-13 06:54:45 +0000639 append_file_list_to_list(optarg, &include_list, &include_list_count);
Glenn L McGrath2e772ed2001-10-05 02:58:48 +0000640 break;
641
642 case 'C': // Change to dir <optarg>
643 /* Make sure dst_prefix ends in a '/' */
644 dst_prefix = concat_path_file(optarg, "/");
645 break;
646 case 'f': // archive filename
647 if (strcmp(optarg, "-") == 0) {
648 // Untar from stdin to stdout
649 untar_funct |= untar_from_stdin;
650 } else {
651 untar_funct |= untar_from_file;
652 src_filename = xstrdup(optarg);
653 }
654 break;
655 case 'O':
656 extract_function |= extract_to_stdout;
657 break;
658 case 'p':
659 break;
660 case 'v':
661 if (extract_function & extract_list) {
662 extract_function |= extract_verbose_list;
663 }
664 extract_function |= extract_list;
665 break;
Eric Andersenbdfd0d72001-10-24 05:00:29 +0000666#ifdef CONFIG_FEATURE_TAR_GZIP
Glenn L McGrath2e772ed2001-10-05 02:58:48 +0000667 case 'z':
668 untar_funct |= untar_unzip;
669 break;
670#endif
671 default:
672 show_usage();
673 }
674 }
675
676 /* Make sure the valid arguments were passed */
677 if (untar_funct_required == 0) {
678 error_msg_and_die("You must specify one of the `-ctx' options");
679 }
680 if ((untar_funct_required != untar_create) &&
681 (untar_funct_required != untar_extract) &&
682 (untar_funct_required != untar_list)) {
683 error_msg_and_die("You may not specify more than one `ctx' option.");
684 }
685 untar_funct |= untar_funct_required;
686
687 /* Setup an array of filenames to work with */
688 while (optind < argc) {
Glenn L McGrathd642a672001-10-13 06:54:45 +0000689 append_file_to_list(argv[optind], &include_list, &include_list_count);
Glenn L McGrath2e772ed2001-10-05 02:58:48 +0000690 optind++;
Glenn L McGrath2e772ed2001-10-05 02:58:48 +0000691 }
692
Glenn L McGrath2e772ed2001-10-05 02:58:48 +0000693 if (extract_function & (extract_list | extract_all_to_fs)) {
694 if (dst_prefix == NULL) {
695 dst_prefix = xstrdup("./");
696 }
697
698 /* Setup the source of the tar data */
699 if (untar_funct & untar_from_file) {
700 src_stream = xfopen(src_filename, "r");
701 } else {
702 src_stream = stdin;
703 }
Eric Andersenbdfd0d72001-10-24 05:00:29 +0000704#ifdef CONFIG_FEATURE_TAR_GZIP
Glenn L McGrath2e772ed2001-10-05 02:58:48 +0000705 /* Get a binary tree of all the tar file headers */
706 if (untar_funct & untar_unzip) {
707 uncompressed_stream = gz_open(src_stream, &gunzip_pid);
708 } else
Eric Andersenbdfd0d72001-10-24 05:00:29 +0000709#endif // CONFIG_FEATURE_TAR_GZIP
Glenn L McGrath2e772ed2001-10-05 02:58:48 +0000710 uncompressed_stream = src_stream;
711
712 /* extract or list archive */
Glenn L McGrath4bef7b42001-10-13 19:43:46 +0000713 unarchive(uncompressed_stream, stdout, &get_header_tar, extract_function, dst_prefix, include_list, exclude_list);
Glenn L McGrath2e772ed2001-10-05 02:58:48 +0000714 fclose(uncompressed_stream);
715 }
Eric Andersenbdfd0d72001-10-24 05:00:29 +0000716#ifdef CONFIG_FEATURE_TAR_CREATE
Glenn L McGrath2e772ed2001-10-05 02:58:48 +0000717 /* create an archive */
718 else if (untar_funct & untar_create) {
719 int verboseFlag = FALSE;
720
Eric Andersenbdfd0d72001-10-24 05:00:29 +0000721#ifdef CONFIG_FEATURE_TAR_GZIP
Glenn L McGrath2e772ed2001-10-05 02:58:48 +0000722 if (untar_funct && untar_unzip) {
723 error_msg_and_die("Creation of compressed tarfile not internally support by tar, pipe to busybox gunzip");
724 }
Eric Andersenbdfd0d72001-10-24 05:00:29 +0000725#endif // CONFIG_FEATURE_TAR_GZIP
Glenn L McGrath2e772ed2001-10-05 02:58:48 +0000726 if (extract_function & extract_verbose_list) {
727 verboseFlag = TRUE;
728 }
Glenn L McGrath4bef7b42001-10-13 19:43:46 +0000729 writeTarFile(src_filename, verboseFlag, &argv[argc - 1], include_list);
Glenn L McGrath2e772ed2001-10-05 02:58:48 +0000730 }
Eric Andersenbdfd0d72001-10-24 05:00:29 +0000731#endif // CONFIG_FEATURE_TAR_CREATE
Glenn L McGrath2e772ed2001-10-05 02:58:48 +0000732
733 /* Cleanups */
Eric Andersenbdfd0d72001-10-24 05:00:29 +0000734#ifdef CONFIG_FEATURE_TAR_GZIP
Glenn L McGrath2e772ed2001-10-05 02:58:48 +0000735 if (untar_funct & untar_unzip) {
736 fclose(src_stream);
737 close(gz_fd);
738 gz_close(gunzip_pid);
739 }
Eric Andersenbdfd0d72001-10-24 05:00:29 +0000740#endif // CONFIG_FEATURE_TAR_GZIP
Glenn L McGrath2e772ed2001-10-05 02:58:48 +0000741 if (src_filename) {
742 free(src_filename);
743 }
744 if (file_list_name) {
745 free(file_list_name);
746 }
747 return(EXIT_SUCCESS);
748}