123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747 |
- /* Extract files from a tar archive.
- Copyright (C) 1988 Free Software Foundation
- This file is part of GNU Tar.
- GNU Tar is free software; you can redistribute it and/or modify
- it under the terms of the GNU General Public License as published by
- the Free Software Foundation; either version 2, or (at your option)
- any later version.
- GNU Tar is distributed in the hope that it will be useful,
- but WITHOUT ANY WARRANTY; without even the implied warranty of
- MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
- GNU General Public License for more details.
- You should have received a copy of the GNU General Public License
- along with GNU Tar; see the file COPYING. If not, write to
- the Free Software Foundation, 675 Mass Ave, Cambridge, MA 02139, USA. */
- /*
- * Extract files from a tar archive.
- *
- * Written 19 Nov 1985 by John Gilmore, ihnp4!hoptoad!gnu.
- */
- #include <stdio.h>
- #include <errno.h>
- #ifndef STDC_HEADERS
- extern int errno;
- #endif
- #include <sys/types.h>
- #include <time.h>
- time_t time();
- #ifdef BSD42
- #include <sys/file.h>
- #else
- #ifndef V7
- #include <fcntl.h>
- #endif
- #endif
- #if defined(POSIX)
- #include <utime.h>
- #endif
- #ifdef NO_OPEN3
- /* We need the #define's even though we don't use them. */
- #include "open3.h"
- #endif
- #ifdef EMUL_OPEN3
- /* Simulated 3-argument open for systems that don't have it */
- #include "open3.h"
- #endif
- #include "tar.h"
- #include "port.h"
- extern FILE *msg_file;
- extern union record *head; /* Points to current tape header */
- extern struct stat hstat; /* Stat struct corresponding */
- extern int head_standard; /* Tape header is in ANSI format */
- extern char *save_name;
- extern long save_totsize;
- extern long save_sizeleft;
- int confirm();
- void decode_header();
- void extract_mangle();
- void extract_sparse_file();
- long from_oct();
- void gnu_restore();
- extern void print_header();
- extern void skip_file();
- extern void skip_extended_headers();
- extern void pr_mkdir();
- void saverec();
- int make_dirs(); /* Makes required directories */
- static time_t now = 0; /* Current time */
- static we_are_root = 0; /* True if our effective uid == 0 */
- static int notumask = ~0; /* Masks out bits user doesn't want */
- /*
- * "Scratch" space to store the information about a sparse file before
- * writing the info into the header or extended header
- */
- /*struct sp_array *sparsearray;*/
- /* number of elts storable in the sparsearray */
- /*int sp_array_size = 10;*/
- /*
- * Set up to extract files.
- */
- void
- extr_init()
- {
- int ourmask;
- now = time((time_t *)0);
- if (geteuid() == 0)
- we_are_root = 1;
- /*
- * We need to know our umask. But if f_use_protection is set,
- * leave our kernel umask at 0, and our "notumask" at ~0.
- */
- ourmask = umask(0); /* Read it */
- if (!f_use_protection) {
- (void) umask (ourmask); /* Set it back how it was */
- notumask = ~ourmask; /* Make umask override permissions */
- }
- }
- /*
- * Extract a file from the archive.
- */
- void
- extract_archive()
- {
- register char *data;
- int fd, check, namelen, written, openflag;
- long size;
- time_t acc_upd_times[2];
- register int skipcrud;
- register int i;
- /* int sparse_ind = 0;*/
- union record *exhdr;
- /* int end_nulls; */
-
- saverec(&head); /* Make sure it sticks around */
- userec(head); /* And go past it in the archive */
- decode_header(head, &hstat, &head_standard, 1); /* Snarf fields */
- if(f_confirm && !confirm("extract",head->header.name)) {
- if (head->header.isextended)
- skip_extended_headers();
- skip_file((long)hstat.st_size);
- saverec((union record **)0);
- return;
- }
- /* Print the record from 'head' and 'hstat' */
- if (f_verbose)
- print_header();
- /*
- * Check for fully specified pathnames and other atrocities.
- *
- * Note, we can't just make a pointer to the new file name,
- * since saverec() might move the header and adjust "head".
- * We have to start from "head" every time we want to touch
- * the header record.
- */
- skipcrud = 0;
- while (!f_absolute_paths && '/' == head->header.name[skipcrud]) {
- static int warned_once = 0;
- skipcrud++; /* Force relative path */
- if (!warned_once++) {
- msg("Removing leading / from absolute path names in the archive.");
- }
- }
- switch (head->header.linkflag) {
- default:
- msg("Unknown file type '%c' for %s, extracted as normal file",
- head->header.linkflag, skipcrud+head->header.name);
- /* FALL THRU */
- /*
- * JK - What we want to do if the file is sparse is loop through
- * the array of sparse structures in the header and read in
- * and translate the character strings representing 1) the offset
- * at which to write and 2) how many bytes to write into numbers,
- * which we store into the scratch array, "sparsearray". This
- * array makes our life easier the same way it did in creating
- * the tar file that had to deal with a sparse file.
- *
- * After we read in the first five (at most) sparse structures,
- * we check to see if the file has an extended header, i.e.,
- * if more sparse structures are needed to describe the contents
- * of the new file. If so, we read in the extended headers
- * and continue to store their contents into the sparsearray.
- */
- case LF_SPARSE:
- sp_array_size = 10;
- sparsearray = (struct sp_array *) malloc(sp_array_size * sizeof(struct sp_array));
- for (i = 0; i < SPARSE_IN_HDR; i++) {
- sparsearray[i].offset =
- from_oct(1+12, head->header.sp[i].offset);
- sparsearray[i].numbytes =
- from_oct(1+12, head->header.sp[i].numbytes);
- if (!sparsearray[i].numbytes)
- break;
- }
-
- /* end_nulls = from_oct(1+12, head->header.ending_blanks);*/
-
- if (head->header.isextended) {
- /* read in the list of extended headers
- and translate them into the sparsearray
- as before */
- /* static */ int ind = SPARSE_IN_HDR;
-
- for (;;) {
-
- exhdr = findrec();
- for (i = 0; i < SPARSE_EXT_HDR; i++) {
-
- if (i+ind > sp_array_size-1) {
- /*
- * realloc the scratch area
- * since we've run out of room --
- */
- sparsearray = (struct sp_array *)
- realloc(sparsearray,
- 2 * sp_array_size * (sizeof(struct sp_array)));
- sp_array_size *= 2;
- }
- if (!exhdr->ext_hdr.sp[i].numbytes)
- break;
- sparsearray[i+ind].offset =
- from_oct(1+12, exhdr->ext_hdr.sp[i].offset);
- sparsearray[i+ind].numbytes =
- from_oct(1+12, exhdr->ext_hdr.sp[i].numbytes);
- }
- if (!exhdr->ext_hdr.isextended)
- break;
- else {
- ind += SPARSE_EXT_HDR;
- userec(exhdr);
- }
- }
- userec(exhdr);
- }
-
- /* FALL THRU */
- case LF_OLDNORMAL:
- case LF_NORMAL:
- case LF_CONTIG:
- /*
- * Appears to be a file.
- * See if it's really a directory.
- */
- namelen = strlen(skipcrud+head->header.name)-1;
- if (head->header.name[skipcrud+namelen] == '/')
- goto really_dir;
- /* FIXME, deal with protection issues */
- again_file:
- openflag = (f_keep?
- O_BINARY|O_NDELAY|O_WRONLY|O_CREAT|O_EXCL:
- O_BINARY|O_NDELAY|O_WRONLY|O_CREAT|O_TRUNC)
- | ((head->header.linkflag == LF_SPARSE) ? 0 : O_APPEND);
- /*
- * JK - The last | is a kludge to solve the problem
- * the O_APPEND flag causes with files we are
- * trying to make sparse: when a file is opened
- * with O_APPEND, it writes to the last place
- * that something was written, thereby ignoring
- * any lseeks that we have done. We add this
- * extra condition to make it able to lseek when
- * a file is sparse, i.e., we don't open the new
- * file with this flag. (Grump -- this bug caused
- * me to waste a good deal of time, I might add)
- */
- if(f_exstdout) {
- fd = 1;
- goto extract_file;
- }
- #ifdef O_CTG
- /*
- * Contiguous files (on the Masscomp) have to specify
- * the size in the open call that creates them.
- */
- if (head->header.linkflag == LF_CONTIG)
- fd = open(skipcrud+head->header.name, openflag | O_CTG,
- hstat.st_mode, hstat.st_size);
- else
- #endif
- {
- #ifdef NO_OPEN3
- /*
- * On raw V7 we won't let them specify -k (f_keep), but
- * we just bull ahead and create the files.
- */
- fd = creat(skipcrud+head->header.name,
- hstat.st_mode);
- #else
- /*
- * With 3-arg open(), we can do this up right.
- */
- fd = open(skipcrud+head->header.name, openflag,
- hstat.st_mode);
- #endif
- }
- if (fd < 0) {
- if (make_dirs(skipcrud+head->header.name))
- goto again_file;
- msg_perror("Could not create file %s",skipcrud+head->header.name);
- if (head->header.isextended)
- skip_extended_headers();
- skip_file((long)hstat.st_size);
- goto quit;
- }
- extract_file:
- if (head->header.linkflag == LF_SPARSE) {
- char *name;
- int namelen;
- /*
- * Kludge alert. NAME is assigned to header.name
- * because during the extraction, the space that
- * contains the header will get scribbled on, and
- * the name will get munged, so any error messages
- * that happen to contain the filename will look
- * REAL interesting unless we do this.
- */
- namelen = strlen(skipcrud+head->header.name);
- name = (char *) malloc((sizeof(char)) * namelen);
- bcopy(skipcrud+head->header.name, name, namelen);
- size = hstat.st_size;
- extract_sparse_file(fd, &size, hstat.st_size,
- name);
- }
- else
- for (size = hstat.st_size;
- size > 0;
- size -= written) {
- /* long offset,
- numbytes;*/
- if(f_multivol) {
- save_name=head->header.name;
- save_totsize=hstat.st_size;
- save_sizeleft=size;
- }
-
- /*
- * Locate data, determine max length
- * writeable, write it, record that
- * we have used the data, then check
- * if the write worked.
- */
- data = findrec()->charptr;
- if (data == NULL) { /* Check it... */
- msg("Unexpected EOF on archive file");
- break;
- }
- /*
- * JK - If the file is sparse, use the sparsearray
- * that we created before to lseek into the new
- * file the proper amount, and to see how many
- * bytes we want to write at that position.
- */
- /* if (head->header.linkflag == LF_SPARSE) {
- off_t pos;
-
- pos = lseek(fd, (off_t) sparsearray[sparse_ind].offset, 0);
- printf("%d at %d\n", (int) pos, sparse_ind);
- written = sparsearray[sparse_ind++].numbytes;
- } else*/
- written = endofrecs()->charptr - data;
- if (written > size)
- written = size;
- errno = 0;
- check = write(fd, data, written);
- /*
- * The following is in violation of strict
- * typing, since the arg to userec
- * should be a struct rec *. FIXME.
- */
- userec((union record *)(data + written - 1));
- if (check == written) continue;
- /*
- * Error in writing to file.
- * Print it, skip to next file in archive.
- */
- if(check<0)
- msg_perror("couldn't write to file %s",skipcrud+head->header.name);
- else
- msg("could only write %d of %d bytes to file %s",written,check,skipcrud+head->header.name);
- skip_file((long)(size - written));
- break; /* Still do the close, mod time, chmod, etc */
- }
- if(f_multivol)
- save_name = 0;
- /* If writing to stdout, don't try to do anything
- to the filename; it doesn't exist, or we don't
- want to touch it anyway */
- if(f_exstdout)
- break;
-
- /* if (head->header.isextended) {
- register union record *exhdr;
- register int i;
-
- for (i = 0; i < 21; i++) {
- long offset;
-
- if (!exhdr->ext_hdr.sp[i].numbytes)
- break;
- offset = from_oct(1+12,
- exhdr->ext_hdr.sp[i].offset);
- written = from_oct(1+12,
- exhdr->ext_hdr.sp[i].numbytes);
- lseek(fd, offset, 0);
- check = write(fd, data, written);
- if (check == written) continue;
- }
-
- }*/
- check = close(fd);
- if (check < 0) {
- msg_perror("Error while closing %s",skipcrud+head->header.name);
- }
-
- set_filestat:
- /*
- * If we are root, set the owner and group of the extracted
- * file. This does what is wanted both on real Unix and on
- * System V. If we are running as a user, we extract as that
- * user; if running as root, we extract as the original owner.
- */
- if (we_are_root || f_do_chown) {
- if (chown(skipcrud+head->header.name, hstat.st_uid,
- hstat.st_gid) < 0) {
- msg_perror("cannot chown file %s to uid %d gid %d",skipcrud+head->header.name,hstat.st_uid,hstat.st_gid);
- }
- }
- /*
- * Set the modified time of the file.
- *
- * Note that we set the accessed time to "now", which
- * is really "the time we started extracting files".
- * unless f_gnudump is used, in which case .st_atime is used
- */
- if (!f_modified) {
- /* fixme if f_gnudump should set ctime too, but how? */
- if(f_gnudump)
- acc_upd_times[0]=hstat.st_atime;
- else acc_upd_times[0] = now; /* Accessed now */
- acc_upd_times[1] = hstat.st_mtime; /* Mod'd */
- if (utime(skipcrud+head->header.name,
- acc_upd_times) < 0) {
- msg_perror("couldn't change access and modification times of %s",skipcrud+head->header.name);
- }
- }
- /* We do the utime before the chmod because some versions of
- utime are broken and trash the modes of the file. Since
- we then change the mode anyway, we don't care. . . */
- /*
- * If '-k' is not set, open() or creat() could have saved
- * the permission bits from a previously created file,
- * ignoring the ones we specified.
- * Even if -k is set, if the file has abnormal
- * mode bits, we must chmod since writing or chown() has
- * probably reset them.
- *
- * If -k is set, we know *we* created this file, so the mode
- * bits were set by our open(). If the file is "normal", we
- * skip the chmod. This works because we did umask(0) if -p
- * is set, so umask will have left the specified mode alone.
- */
- if ((!f_keep)
- || (hstat.st_mode & (S_ISUID|S_ISGID|S_ISVTX))) {
- if (chmod(skipcrud+head->header.name,
- notumask & (int)hstat.st_mode) < 0) {
- msg_perror("cannot change mode of file %s to %ld",skipcrud+head->header.name,notumask & (int)hstat.st_mode);
- }
- }
- quit:
- break;
- case LF_LINK:
- again_link:
- {
- struct stat st1,st2;
- check = link (head->header.linkname,
- skipcrud+head->header.name);
- if (check == 0)
- break;
- if (make_dirs(skipcrud+head->header.name))
- goto again_link;
- if(f_gnudump && errno==EEXIST)
- break;
- if( stat(head->header.linkname, &st1) == 0
- && stat(skipcrud+head->header.name, &st2)==0
- && st1.st_dev==st2.st_dev
- && st1.st_ino==st2.st_ino)
- break;
- msg_perror("Could not link %s to %s",
- skipcrud+head->header.name,head->header.linkname);
- }
- break;
- #ifdef S_ISLNK
- case LF_SYMLINK:
- again_symlink:
- check = symlink(head->header.linkname,
- skipcrud+head->header.name);
- /* FIXME, don't worry uid, gid, etc... */
- if (check == 0)
- break;
- if (make_dirs(skipcrud+head->header.name))
- goto again_symlink;
- msg_perror("Could not create symlink to %s",head->header.linkname);
- break;
- #endif
- #ifdef S_IFCHR
- case LF_CHR:
- hstat.st_mode |= S_IFCHR;
- goto make_node;
- #endif
- #ifdef S_IFBLK
- case LF_BLK:
- hstat.st_mode |= S_IFBLK;
- #endif
- #if defined(S_IFCHR) || defined(S_IFBLK)
- make_node:
- check = mknod(skipcrud+head->header.name,
- (int) hstat.st_mode, (int) hstat.st_rdev);
- if (check != 0) {
- if (make_dirs(skipcrud+head->header.name))
- goto make_node;
- msg_perror("Could not make %s",skipcrud+head->header.name);
- break;
- };
- goto set_filestat;
- #endif
- #ifdef S_ISFIFO
- /* If local system doesn't support FIFOs, use default case */
- case LF_FIFO:
- make_fifo:
- check = mkfifo(skipcrud+head->header.name,
- (int) hstat.st_mode);
- if (check != 0) {
- if (make_dirs(skipcrud+head->header.name))
- goto make_fifo;
- msg_perror("Could not make %s",skipcrud+head->header.name);
- break;
- };
- goto set_filestat;
- #endif
- case LF_DIR:
- case LF_DUMPDIR:
- namelen = strlen(skipcrud+head->header.name)-1;
- really_dir:
- /* Check for trailing /, and zap as many as we find. */
- while (namelen && head->header.name[skipcrud+namelen] == '/')
- head->header.name[skipcrud+namelen--] = '\0';
- if(f_gnudump) { /* Read the entry and delete files
- that aren't listed in the archive */
- gnu_restore(skipcrud);
-
- } else if(head->header.linkflag==LF_DUMPDIR)
- skip_file((long)(hstat.st_size));
-
- again_dir:
- check = mkdir(skipcrud+head->header.name,
- (we_are_root ? 0 : 0300) | (int)hstat.st_mode);
- if (check != 0) {
- struct stat st1;
- if (make_dirs(skipcrud+head->header.name))
- goto again_dir;
- /* If we're trying to create '.', let it be. */
- if (head->header.name[skipcrud+namelen] == '.' &&
- (namelen==0 ||
- head->header.name[skipcrud+namelen-1]=='/'))
- goto check_perms;
- if( errno==EEXIST
- && stat(skipcrud+head->header.name,&st1)==0
- && (S_ISDIR(st1.st_mode)))
- break;
- msg_perror("Could not create directory %s",skipcrud+head->header.name);
- break;
- }
-
- check_perms:
- if (!we_are_root && 0300 != (0300 & (int) hstat.st_mode)) {
- hstat.st_mode |= 0300;
- msg("Added write and execute permission to directory %s",
- skipcrud+head->header.name);
- }
- goto set_filestat;
- /* FIXME, Remember timestamps for after files created? */
- /* FIXME, change mode after files created (if was R/O dir) */
- case LF_VOLHDR:
- if(f_verbose) {
- printf("Reading %s\n",head->header.name);
- }
- break;
- case LF_NAMES:
- extract_mangle(head);
- break;
- case LF_MULTIVOL:
- msg("Can't extract '%s'--file is continued from another volume\n",head->header.name);
- skip_file((long)hstat.st_size);
- break;
- }
- /* We don't need to save it any longer. */
- saverec((union record **) 0); /* Unsave it */
- }
- /*
- * After a file/link/symlink/dir creation has failed, see if
- * it's because some required directory was not present, and if
- * so, create all required dirs.
- */
- int
- make_dirs(pathname)
- char *pathname;
- {
- char *p; /* Points into path */
- int madeone = 0; /* Did we do anything yet? */
- int save_errno = errno; /* Remember caller's errno */
- int check;
- if (errno != ENOENT)
- return 0; /* Not our problem */
- for (p = index(pathname, '/'); p != NULL; p = index(p+1, '/')) {
- /* Avoid mkdir of empty string, if leading or double '/' */
- if (p == pathname || p[-1] == '/')
- continue;
- /* Avoid mkdir where last part of path is '.' */
- if (p[-1] == '.' && (p == pathname+1 || p[-2] == '/'))
- continue;
- *p = 0; /* Truncate the path there */
- check = mkdir (pathname, 0777); /* Try to create it as a dir */
- if (check == 0) {
- /* Fix ownership */
- if (we_are_root) {
- if (chown(pathname, hstat.st_uid,
- hstat.st_gid) < 0) {
- msg_perror("cannot change owner of %s to uid %d gid %d",pathname,hstat.st_uid,hstat.st_gid);
- }
- }
- pr_mkdir(pathname, p-pathname, notumask&0777);
- madeone++; /* Remember if we made one */
- *p = '/';
- continue;
- }
- *p = '/';
- if (errno == EEXIST) /* Directory already exists */
- continue;
- /*
- * Some other error in the mkdir. We return to the caller.
- */
- break;
- }
- errno = save_errno; /* Restore caller's errno */
- return madeone; /* Tell them to retry if we made one */
- }
- void
- extract_sparse_file(fd, sizeleft, totalsize, name)
- int fd;
- long *sizeleft,
- totalsize;
- char *name;
- {
- /* register char *data;*/
- union record *datarec;
- int sparse_ind = 0;
- int written,
- count;
-
- /* assuming sizeleft is initially totalsize */
- while (*sizeleft > 0) {
- datarec = findrec();
- if (datarec == NULL) {
- msg("Unexpected EOF on archive file");
- return;
- }
- lseek(fd, sparsearray[sparse_ind].offset, 0);
- written = sparsearray[sparse_ind++].numbytes;
- while (written > RECORDSIZE) {
- count = write(fd, datarec->charptr, RECORDSIZE);
- if (count < 0)
- msg_perror("couldn't write to file %s", name);
- written -= count;
- *sizeleft -= count;
- userec(datarec);
- datarec = findrec();
- }
- count = write(fd, datarec->charptr, written);
-
- if (count < 0) {
- msg_perror("couldn't write to file %s", name);
- } else if (count != written) {
- msg("could only write %d of %d bytes to file %s", totalsize - *sizeleft, totalsize, name);
- skip_file((long) (*sizeleft));
- }
- written -= count;
- *sizeleft -= count;
- userec(datarec);
- }
- free(sparsearray);
- /* if (end_nulls) {
- register int i;
- printf("%d\n", (int) end_nulls);
- for (i = 0; i < end_nulls; i++)
- write(fd, "\000", 1);
- }*/
- userec(datarec);
- }
|