12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
712781279128012811282128312841285128612871288128912901291129212931294129512961297129812991300130113021303130413051306130713081309131013111312131313141315131613171318131913201321132213231324132513261327132813291330133113321333133413351336133713381339134013411342134313441345134613471348134913501351135213531354135513561357135813591360136113621363136413651366136713681369137013711372137313741375137613771378137913801381138213831384138513861387138813891390139113921393139413951396139713981399140014011402140314041405140614071408140914101411141214131414141514161417141814191420142114221423142414251426142714281429143014311432143314341435143614371438143914401441144214431444144514461447144814491450145114521453145414551456145714581459146014611462146314641465146614671468146914701471147214731474147514761477147814791480148114821483148414851486148714881489149014911492149314941495149614971498149915001501150215031504 |
- /* Create a tar archive.
- Copyright 1985, 92, 93, 94, 96, 97, 1999 Free Software Foundation, Inc.
- Written by John Gilmore, on 1985-08-25.
- This program is free software; you can redistribute it and/or modify it
- under the terms of the GNU General Public License as published by the
- Free Software Foundation; either version 2, or (at your option) any later
- version.
- This program is distributed in the hope that it will be useful, but
- WITHOUT ANY WARRANTY; without even the implied warranty of
- MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General
- Public License for more details.
- You should have received a copy of the GNU General Public License along
- with this program; if not, write to the Free Software Foundation, Inc.,
- 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. */
- #include "system.h"
- #if !MSDOS
- # include <pwd.h>
- # include <grp.h>
- #endif
- #if HAVE_UTIME_H
- # include <utime.h>
- #else
- struct utimbuf
- {
- long actime;
- long modtime;
- };
- #endif
- #include "common.h"
- #ifndef MSDOS
- extern dev_t ar_dev;
- extern ino_t ar_ino;
- #endif
- extern struct name *gnu_list_name;
/* Bookkeeping for files that have several hard links.  This module is
   the only one that cares about `struct link's.  */

struct link
  {
    struct link *next;          /* following node in the list, if any */
    dev_t dev;                  /* device number of the recorded file */
    ino_t ino;                  /* inode number of the recorded file */
    short linkcount;            /* NOTE(review): never assigned in the part
                                   of this file visible here -- confirm use */
    char name[1];               /* name of the recorded file; dump_file
                                   over-allocates the node so that the whole
                                   NUL-terminated name fits */
  };

/* Head of the list; new nodes are pushed at the front.  */
struct link *linklist = NULL;
- /*------------------------------------------------------------------------.
- | Convert VALUE into a size-SIZE field at WHERE, including a |
- | trailing space. For example, 3 for SIZE means two digits and a space. |
- | |
- | We assume the trailing NUL is already there and don't fill it in. This |
- | fact is used by start_header and finish_header, so don't change it! |
- `------------------------------------------------------------------------*/
- /* This should be equivalent to: sprintf (WHERE, "%*lo ", SIZE - 1, VALUE);
- except that we don't assume VALUE fits in an unsigned long, and
- except that sprintf fills in the trailing NUL and we don't. */
- static void
- to_oct (uintmax_t value, char *where, size_t size, const char *type)
- {
- uintmax_t v = value;
- size_t i = size;
- where[--i] = ' '; /* put in the space, though */
- /* Produce the digits -- at least one. */
- do
- {
- where[--i] = '0' + (int) (v & 7); /* one octal digit */
- v >>= 3;
- }
- while (i != 0 && v != 0);
- /* Leading spaces, if necessary. */
- while (i != 0)
- where[--i] = ' ';
- if (v != 0)
- {
- char buf[UINTMAX_STRSIZE_BOUND];
- ERROR ((0, 0, _("%s value %s is too large to fit in a %u-bit field"),
- type, STRINGIFY_BIGINT (value, buf),
- (unsigned) ((size - 1) * 3)));
- }
- }
- void
- gid_to_oct (gid_t v, char *p, size_t s)
- {
- to_oct ((uintmax_t) v, p, s, "gid_t");
- }
- void
- major_to_oct (major_t v, char *p, size_t s)
- {
- to_oct ((uintmax_t) v, p, s, "major_t");
- }
- void
- minor_to_oct (minor_t v, char *p, size_t s)
- {
- to_oct ((uintmax_t) v, p, s, "minor_t");
- }
- void
- mode_to_oct (mode_t v, char *p, size_t s)
- {
- to_oct ((uintmax_t) v, p, s, "mode_t");
- }
- void
- off_to_oct (off_t v, char *p, size_t s)
- {
- to_oct ((uintmax_t) v, p, s, "off_t");
- }
- void
- size_to_oct (size_t v, char *p, size_t s)
- {
- to_oct ((uintmax_t) v, p, s, "size_t");
- }
- void
- time_to_oct (time_t v, char *p, size_t s)
- {
- to_oct ((uintmax_t) v, p, s, "time_t");
- }
- void
- uid_to_oct (uid_t v, char *p, size_t s)
- {
- to_oct ((uintmax_t) v, p, s, "uid_t");
- }
- void
- uintmax_to_oct (uintmax_t v, char *p, size_t s)
- {
- to_oct (v, p, s, "uintmax_t");
- }
- /* Writing routines. */
- /*-----------------------------------------------------------------------.
- | Just zeroes out the buffer so we don't confuse ourselves with leftover |
- | data. |
- `-----------------------------------------------------------------------*/
- static void
- clear_buffer (char *buffer)
- {
- memset (buffer, 0, BLOCKSIZE);
- }
- /*-------------------------------------------------------------------------.
- | Write the EOT block(s). We actually zero at least one block, through |
- | the end of the record. Old tar, as previous versions of GNU tar, writes |
- | garbage after two zeroed blocks. |
- `-------------------------------------------------------------------------*/
- void
- write_eot (void)
- {
- union block *pointer = find_next_block ();
- if (pointer)
- {
- size_t space = available_space_after (pointer);
- memset (pointer->buffer, 0, space);
- set_next_block_after (pointer);
- }
- }
- /*-----------------------------------------------------.
- | Write a GNUTYPE_LONGLINK or GNUTYPE_LONGNAME block. |
- `-----------------------------------------------------*/
- /* FIXME: Cross recursion between start_header and write_long! */
- static union block *start_header PARAMS ((const char *, struct stat *));
- static void
- write_long (const char *p, char type)
- {
- size_t size = strlen (p) + 1;
- size_t bufsize;
- union block *header;
- struct stat foo;
- memset (&foo, 0, sizeof foo);
- foo.st_size = size;
- header = start_header ("././@LongLink", &foo);
- header->header.typeflag = type;
- finish_header (header);
- header = find_next_block ();
- bufsize = available_space_after (header);
- while (bufsize < size)
- {
- memcpy (header->buffer, p, bufsize);
- p += bufsize;
- size -= bufsize;
- set_next_block_after (header + (bufsize - 1) / BLOCKSIZE);
- header = find_next_block ();
- bufsize = available_space_after (header);
- }
- memcpy (header->buffer, p, size);
- memset (header->buffer + size, 0, bufsize - size);
- set_next_block_after (header + (size - 1) / BLOCKSIZE);
- }
- /* Header handling. */
- /*---------------------------------------------------------------------.
- | Make a header block for the file name whose stat info is st. Return |
- | header pointer for success, NULL if the name is too long. |
- `---------------------------------------------------------------------*/
- static union block *
- start_header (const char *name, struct stat *st)
- {
- union block *header;
- if (!absolute_names_option)
- {
- static int warned_once = 0;
- #if MSDOS
- if (name[1] == ':')
- {
- name += 2;
- if (!warned_once)
- {
- warned_once = 1;
- WARN ((0, 0, _("Removing drive spec from names in the archive")));
- }
- }
- #endif
- while (*name == '/')
- {
- name++; /* force relative path */
- if (!warned_once)
- {
- warned_once = 1;
- WARN ((0, 0, _("\
- Removing leading `/' from absolute path names in the archive")));
- }
- }
- }
- /* Check the file name and put it in the block. */
- if (strlen (name) >= (size_t) NAME_FIELD_SIZE)
- write_long (name, GNUTYPE_LONGNAME);
- header = find_next_block ();
- memset (header->buffer, 0, sizeof (union block));
- assign_string (¤t_file_name, name);
- strncpy (header->header.name, name, NAME_FIELD_SIZE);
- header->header.name[NAME_FIELD_SIZE - 1] = '\0';
- /* Override some stat fields, if requested to do so. */
- if (owner_option != (uid_t) -1)
- st->st_uid = owner_option;
- if (group_option != (gid_t) -1)
- st->st_gid = group_option;
- if (mode_option)
- st->st_mode = ((st->st_mode & S_IFMT)
- | mode_adjust (st->st_mode, mode_option));
- /* Paul Eggert tried the trivial test ($WRITER cf a b; $READER tvf a)
- for a few tars and came up with the following interoperability
- matrix:
- WRITER
- 1 2 3 4 5 6 7 8 9 READER
- . . . . . . . . . 1 = SunOS 4.2 tar
- # . . # # . . # # 2 = NEC SVR4.0.2 tar
- . . . # # . . # . 3 = Solaris 2.1 tar
- . . . . . . . . . 4 = GNU tar 1.11.1
- . . . . . . . . . 5 = HP-UX 8.07 tar
- . . . . . . . . . 6 = Ultrix 4.1
- . . . . . . . . . 7 = AIX 3.2
- . . . . . . . . . 8 = Hitachi HI-UX 1.03
- . . . . . . . . . 9 = Omron UNIOS-B 4.3BSD 1.60Beta
- . = works
- # = ``impossible file type''
- The following mask for old archive removes the `#'s in column 4
- above, thus making GNU tar both a universal donor and a universal
- acceptor for Paul's test. */
- if (archive_format == V7_FORMAT)
- MODE_TO_OCT (st->st_mode & 07777, header->header.mode);
- else
- MODE_TO_OCT (st->st_mode, header->header.mode);
- UID_TO_OCT (st->st_uid, header->header.uid);
- GID_TO_OCT (st->st_gid, header->header.gid);
- OFF_TO_OCT (st->st_size, header->header.size);
- TIME_TO_OCT (st->st_mtime, header->header.mtime);
- if (incremental_option)
- if (archive_format == OLDGNU_FORMAT)
- {
- TIME_TO_OCT (st->st_atime, header->oldgnu_header.atime);
- TIME_TO_OCT (st->st_ctime, header->oldgnu_header.ctime);
- }
- header->header.typeflag = archive_format == V7_FORMAT ? AREGTYPE : REGTYPE;
- switch (archive_format)
- {
- case DEFAULT_FORMAT:
- case V7_FORMAT:
- break;
- case OLDGNU_FORMAT:
- /* Overwrite header->header.magic and header.version in one blow. */
- strcpy (header->header.magic, OLDGNU_MAGIC);
- break;
- case POSIX_FORMAT:
- case GNU_FORMAT:
- strncpy (header->header.magic, TMAGIC, TMAGLEN);
- strncpy (header->header.version, TVERSION, TVERSLEN);
- break;
- }
- if (archive_format == V7_FORMAT || numeric_owner_option)
- {
- /* header->header.[ug]name are left as the empty string. */
- }
- else
- {
- uid_to_uname (st->st_uid, header->header.uname);
- gid_to_gname (st->st_gid, header->header.gname);
- }
- return header;
- }
- /*-------------------------------------------------------------------------.
- | Finish off a filled-in header block and write it out. We also print the |
- | file name and/or full info if verbose is on. |
- `-------------------------------------------------------------------------*/
- void
- finish_header (union block *header)
- {
- size_t i;
- int sum;
- char *p;
- memcpy (header->header.chksum, CHKBLANKS, sizeof (header->header.chksum));
- sum = 0;
- p = header->buffer;
- for (i = sizeof (*header); i-- != 0; )
- /* We can't use unsigned char here because of old compilers, e.g. V7. */
- sum += 0xFF & *p++;
- /* Fill in the checksum field. It's formatted differently from the
- other fields: it has [6] digits, a null, then a space -- rather than
- digits, a space, then a null. We use to_oct then write the null in
- over to_oct's space. The final space is already there, from
- checksumming, and to_oct doesn't modify it.
- This is a fast way to do:
- sprintf(header->header.chksum, "%6o", sum); */
- UINTMAX_TO_OCT ((uintmax_t) sum, header->header.chksum);
- header->header.chksum[6] = '\0'; /* zap the space */
- set_next_block_after (header);
- if (verbose_option
- && header->header.typeflag != GNUTYPE_LONGLINK
- && header->header.typeflag != GNUTYPE_LONGNAME)
- {
- /* These globals are parameters to print_header, sigh. */
- current_header = header;
- /* current_stat is already set up. */
- current_format = archive_format;
- print_header ();
- }
- }
- /* Sparse file processing. */
- /*-------------------------------------------------------------------------.
- | Takes a blockful of data and basically cruises through it to see if it's |
- | made *entirely* of zeros, returning a 0 the instant it finds something |
- | that is a nonzero, i.e., useful data. |
- `-------------------------------------------------------------------------*/
- static int
- zero_block_p (char *buffer)
- {
- int counter;
- for (counter = 0; counter < BLOCKSIZE; counter++)
- if (buffer[counter] != '\0')
- return 0;
- return 1;
- }
- /*---.
- | ? |
- `---*/
- static void
- init_sparsearray (void)
- {
- int counter;
- sp_array_size = 10;
- /* Make room for our scratch space -- initially is 10 elts long. */
- sparsearray = (struct sp_array *)
- xmalloc (sp_array_size * sizeof (struct sp_array));
- for (counter = 0; counter < sp_array_size; counter++)
- {
- sparsearray[counter].offset = 0;
- sparsearray[counter].numbytes = 0;
- }
- }
- /*---.
- | ? |
- `---*/
- static void
- find_new_file_size (off_t *filesize, int highest_index)
- {
- int counter;
- *filesize = 0;
- for (counter = 0;
- sparsearray[counter].numbytes && counter <= highest_index;
- counter++)
- *filesize += sparsearray[counter].numbytes;
- }
- /*-----------------------------------------------------------------------.
- | Make one pass over the file NAME, studying where any non-zero data is, |
- | that is, how far into the file each instance of data is, and how many |
- | bytes are there. Save this information in the sparsearray, which will |
- | later be translated into header information. |
- `-----------------------------------------------------------------------*/
- /* There is little point in trimming small amounts of null data at the head
- and tail of blocks, only avoid dumping full null blocks. */
- /* FIXME: this routine might accept bits of algorithmic cleanup, it is
- too kludgey for my taste... */
- static int
- deal_with_sparse (char *name, union block *header)
- {
- size_t numbytes = 0;
- off_t offset = 0;
- int file;
- int sparse_index = 0;
- ssize_t count;
- char buffer[BLOCKSIZE];
- if (archive_format == OLDGNU_FORMAT)
- header->oldgnu_header.isextended = 0;
- if (file = open (name, O_RDONLY), file < 0)
- /* This problem will be caught later on, so just return. */
- return 0;
- init_sparsearray ();
- clear_buffer (buffer);
- while (count = read (file, buffer, sizeof buffer), count != 0)
- {
- /* Realloc the scratch area as necessary. FIXME: should reallocate
- only at beginning of a new instance of non-zero data. */
- if (sparse_index > sp_array_size - 1)
- {
- sparsearray = (struct sp_array *)
- xrealloc (sparsearray,
- 2 * sp_array_size * sizeof (struct sp_array));
- sp_array_size *= 2;
- }
- /* Process one block. */
- if (count == sizeof buffer)
- if (zero_block_p (buffer))
- {
- if (numbytes)
- {
- sparsearray[sparse_index++].numbytes = numbytes;
- numbytes = 0;
- }
- }
- else
- {
- if (!numbytes)
- sparsearray[sparse_index].offset = offset;
- numbytes += count;
- }
- else
- /* Since count < sizeof buffer, we have the last bit of the file. */
- if (!zero_block_p (buffer))
- {
- if (!numbytes)
- sparsearray[sparse_index].offset = offset;
- numbytes += count;
- }
- else
- /* The next two lines are suggested by Andreas Degert, who says
- they are required for trailing full blocks to be written to the
- archive, when all zeroed. Yet, it seems to me that the case
- does not apply. Further, at restore time, the file is not as
- sparse as it should. So, some serious cleanup is *also* needed
- in this area. Just one more... :-(. FIXME. */
- if (numbytes)
- numbytes += count;
- /* Prepare for next block. */
- offset += count;
- /* FIXME: do not clear unless necessary. */
- clear_buffer (buffer);
- }
- if (numbytes)
- sparsearray[sparse_index++].numbytes = numbytes;
- else
- {
- sparsearray[sparse_index].offset = offset - 1;
- sparsearray[sparse_index++].numbytes = 1;
- }
- close (file);
- return sparse_index - 1;
- }
- /*---.
- | ? |
- `---*/
- static int
- finish_sparse_file (int file, off_t *sizeleft, off_t fullsize, char *name)
- {
- union block *start;
- size_t bufsize;
- int sparse_index = 0;
- ssize_t count;
- while (*sizeleft > 0)
- {
- start = find_next_block ();
- memset (start->buffer, 0, BLOCKSIZE);
- bufsize = sparsearray[sparse_index].numbytes;
- if (!bufsize)
- {
- /* We blew it, maybe. */
- char buf1[UINTMAX_STRSIZE_BOUND];
- char buf2[UINTMAX_STRSIZE_BOUND];
- ERROR ((0, 0, _("Wrote %s of %s bytes to file %s"),
- STRINGIFY_BIGINT (fullsize - *sizeleft, buf1),
- STRINGIFY_BIGINT (fullsize, buf2),
- name));
- break;
- }
- if (lseek (file, sparsearray[sparse_index++].offset, 0) < 0)
- {
- char buf[UINTMAX_STRSIZE_BOUND];
- ERROR ((0, errno, _("lseek error at byte %s in file %s"),
- STRINGIFY_BIGINT (sparsearray[sparse_index - 1].offset, buf),
- name));
- break;
- }
- /* If the number of bytes to be written here exceeds the size of
- the temporary buffer, do it in steps. */
- while (bufsize > BLOCKSIZE)
- {
- #if 0
- if (amount_read)
- {
- count = read (file, start->buffer + amount_read,
- BLOCKSIZE - amount_read);
- bufsize -= BLOCKSIZE - amount_read;
- amount_read = 0;
- set_next_block_after (start);
- start = find_next_block ();
- memset (start->buffer, 0, BLOCKSIZE);
- }
- #endif
- /* Store the data. */
- count = read (file, start->buffer, BLOCKSIZE);
- if (count < 0)
- {
- char buf[UINTMAX_STRSIZE_BOUND];
- ERROR ((0, errno, _("\
- Read error at byte %s, reading %lu bytes, in file %s"),
- STRINGIFY_BIGINT (fullsize - *sizeleft, buf),
- (unsigned long) bufsize, name));
- return 1;
- }
- bufsize -= count;
- *sizeleft -= count;
- set_next_block_after (start);
- start = find_next_block ();
- memset (start->buffer, 0, BLOCKSIZE);
- }
- {
- char buffer[BLOCKSIZE];
- clear_buffer (buffer);
- count = read (file, buffer, bufsize);
- memcpy (start->buffer, buffer, BLOCKSIZE);
- }
- if (count < 0)
- {
- char buf[UINTMAX_STRSIZE_BOUND];
-
- ERROR ((0, errno,
- _("Read error at byte %s, reading %lu bytes, in file %s"),
- STRINGIFY_BIGINT (fullsize - *sizeleft, buf),
- (unsigned long) bufsize, name));
- return 1;
- }
- #if 0
- if (amount_read >= BLOCKSIZE)
- {
- amount_read = 0;
- set_next_block_after (start + (count - 1) / BLOCKSIZE);
- if (count != bufsize)
- {
- ERROR ((0, 0,
- _("File %s shrunk, padding with zeros"),
- name));
- return 1;
- }
- start = find_next_block ();
- }
- else
- amount_read += bufsize;
- #endif
- *sizeleft -= count;
- set_next_block_after (start);
- }
- free (sparsearray);
- #if 0
- set_next_block_after (start + (count - 1) / BLOCKSIZE);
- #endif
- return 0;
- }
- /* Main functions of this module. */
- /*---.
- | ? |
- `---*/
- void
- create_archive (void)
- {
- char *p;
- open_archive (ACCESS_WRITE);
- if (incremental_option)
- {
- char *buffer = xmalloc (PATH_MAX);
- const char *q;
- char *bufp;
- collect_and_sort_names ();
- while (p = name_from_list (), p)
- dump_file (p, (dev_t) -1, 1);
- blank_name_list ();
- while (p = name_from_list (), p)
- {
- strcpy (buffer, p);
- if (p[strlen (p) - 1] != '/')
- strcat (buffer, "/");
- bufp = buffer + strlen (buffer);
- for (q = gnu_list_name->dir_contents;
- q && *q;
- q += strlen (q) + 1)
- {
- if (*q == 'Y')
- {
- strcpy (bufp, q + 1);
- dump_file (buffer, (dev_t) -1, 1);
- }
- }
- }
- free (buffer);
- }
- else
- {
- while (p = name_next (1), p)
- dump_file (p, (dev_t) -1, 1);
- }
- write_eot ();
- close_archive ();
- if (listed_incremental_option)
- write_dir_file ();
- }
- /*----------------------------------------------------------------------.
- | Dump a single file. Recurse on directories. Result is nonzero for |
- | success. P is file name to dump. PARENT_DEVICE is device our parent |
- | directory was on. TOP_LEVEL tells whether we are a toplevel call. |
- | |
- | Sets global CURRENT_STAT to stat output for this file. |
- `----------------------------------------------------------------------*/
- /* FIXME: One should make sure that for *every* path leading to setting
- exit_status to failure, a clear diagnostic has been issued. */
- void
- dump_file (char *p, dev_t parent_device, int top_level)
- {
- union block *header;
- char type;
- union block *exhdr;
- char save_typeflag;
- struct utimbuf restore_times;
- /* FIXME: `header' and `upperbound' might be used uninitialized in this
- function. Reported by Bruno Haible. */
- if (interactive_option && !confirm ("add", p))
- return;
- /* Use stat if following (rather than dumping) 4.2BSD's symbolic links.
- Otherwise, use lstat (which falls back to stat if no symbolic links). */
- if (dereference_option != 0
- #ifdef STX_HIDDEN /* AIX */
- ? statx (p, ¤t_stat, STATSIZE, STX_HIDDEN)
- : statx (p, ¤t_stat, STATSIZE, STX_HIDDEN | STX_LINK)
- #else
- ? stat (p, ¤t_stat) : lstat (p, ¤t_stat)
- #endif
- )
- {
- WARN ((0, errno, _("Cannot add file %s"), p));
- if (!ignore_failed_read_option)
- exit_status = TAREXIT_FAILURE;
- return;
- }
- restore_times.actime = current_stat.st_atime;
- restore_times.modtime = current_stat.st_mtime;
- #ifdef S_ISHIDDEN
- if (S_ISHIDDEN (current_stat.st_mode))
- {
- char *new = (char *) alloca (strlen (p) + 2);
- if (new)
- {
- strcpy (new, p);
- strcat (new, "@");
- p = new;
- }
- }
- #endif
- /* See if we only want new files, and check if this one is too old to
- put in the archive. */
- if (!incremental_option && !S_ISDIR (current_stat.st_mode)
- && current_stat.st_mtime < newer_mtime_option
- && (!after_date_option || current_stat.st_ctime < newer_ctime_option))
- {
- if (parent_device == (dev_t) -1)
- WARN ((0, 0, _("%s: is unchanged; not dumped"), p));
- /* FIXME: recheck this return. */
- return;
- }
- #if !MSDOS
- /* See if we are trying to dump the archive. */
- if (ar_dev && current_stat.st_dev == ar_dev && current_stat.st_ino == ar_ino)
- {
- WARN ((0, 0, _("%s is the archive; not dumped"), p));
- return;
- }
- #endif
- /* Check for multiple links.
- We maintain a list of all such files that we've written so far. Any
- time we see another, we check the list and avoid dumping the data
- again if we've done it once already. */
- if (current_stat.st_nlink > 1
- && (S_ISREG (current_stat.st_mode)
- #ifdef S_ISCTG
- || S_ISCTG (current_stat.st_mode)
- #endif
- #ifdef S_ISCHR
- || S_ISCHR (current_stat.st_mode)
- #endif
- #ifdef S_ISBLK
- || S_ISBLK (current_stat.st_mode)
- #endif
- #ifdef S_ISFIFO
- || S_ISFIFO (current_stat.st_mode)
- #endif
- ))
- {
- struct link *lp;
- /* FIXME: First quick and dirty. Hashing, etc later. */
- for (lp = linklist; lp; lp = lp->next)
- if (lp->ino == current_stat.st_ino && lp->dev == current_stat.st_dev)
- {
- char *link_name = lp->name;
- /* We found a link. */
- while (!absolute_names_option && *link_name == '/')
- {
- static int warned_once = 0;
- if (!warned_once)
- {
- warned_once = 1;
- WARN ((0, 0, _("\
- Removing leading `/' from absolute links")));
- }
- link_name++;
- }
- if (strlen (link_name) >= NAME_FIELD_SIZE)
- write_long (link_name, GNUTYPE_LONGLINK);
- assign_string (¤t_link_name, link_name);
- current_stat.st_size = 0;
- header = start_header (p, ¤t_stat);
- if (header == NULL)
- {
- exit_status = TAREXIT_FAILURE;
- return;
- }
- strncpy (header->header.linkname,
- link_name, NAME_FIELD_SIZE);
- /* Force null truncated. */
- header->header.linkname[NAME_FIELD_SIZE - 1] = 0;
- header->header.typeflag = LNKTYPE;
- finish_header (header);
- /* FIXME: Maybe remove from list after all links found? */
- if (remove_files_option)
- if (unlink (p) == -1)
- ERROR ((0, errno, _("Cannot remove %s"), p));
- /* We dumped it. */
- return;
- }
- /* Not found. Add it to the list of possible links. */
- lp = (struct link *)
- xmalloc ((size_t) (sizeof (struct link) + strlen (p)));
- lp->ino = current_stat.st_ino;
- lp->dev = current_stat.st_dev;
- strcpy (lp->name, p);
- lp->next = linklist;
- linklist = lp;
- }
- /* This is not a link to a previously dumped file, so dump it. */
- if (S_ISREG (current_stat.st_mode)
- #ifdef S_ISCTG
- || S_ISCTG (current_stat.st_mode)
- #endif
- )
- {
- int f; /* file descriptor */
- size_t bufsize;
- ssize_t count;
- off_t sizeleft;
- union block *start;
- int header_moved;
- char isextended = 0;
- int upperbound;
- #if 0
- static int cried_once = 0;
- #endif
- header_moved = 0;
- if (sparse_option)
- {
- /* Check the size of the file against the number of blocks
- allocated for it, counting both data and indirect blocks.
- If there is a smaller number of blocks that would be
- necessary to accommodate a file of this size, this is safe
- to say that we have a sparse file: at least one of those
- blocks in the file is just a useless hole. For sparse
- files not having more hole blocks than indirect blocks, the
- sparseness will go undetected. */
- /* Bruno Haible sent me these statistics for Linux. It seems
- that some filesystems count indirect blocks in st_blocks,
- while others do not seem to:
- minix-fs tar: size=7205, st_blocks=18 and ST_NBLOCKS=18
- extfs tar: size=7205, st_blocks=18 and ST_NBLOCKS=18
- ext2fs tar: size=7205, st_blocks=16 and ST_NBLOCKS=16
- msdos-fs tar: size=7205, st_blocks=16 and ST_NBLOCKS=16
- Dick Streefland reports the previous numbers as misleading,
- because ext2fs use 12 direct blocks, while minix-fs uses only
- 6 direct blocks. Dick gets:
- ext2 size=20480 ls listed blocks=21
- minix size=20480 ls listed blocks=21
- msdos size=20480 ls listed blocks=20
- It seems that indirect blocks *are* included in st_blocks.
- The minix filesystem does not account for phantom blocks in
- st_blocks, so `du' and `ls -s' give wrong results. So, the
- --sparse option would not work on a minix filesystem. */
- if (ST_NBLOCKS (current_stat)
- < (current_stat.st_size / ST_NBLOCKSIZE
- + (current_stat.st_size % ST_NBLOCKSIZE != 0)))
- {
- off_t filesize = current_stat.st_size;
- int counter;
- header = start_header (p, ¤t_stat);
- if (header == NULL)
- {
- exit_status = TAREXIT_FAILURE;
- return;
- }
- header->header.typeflag = GNUTYPE_SPARSE;
- header_moved = 1;
- /* Call the routine that figures out the layout of the
- sparse file in question. UPPERBOUND is the index of the
- last element of the "sparsearray," i.e., the number of
- elements it needed to describe the file. */
- upperbound = deal_with_sparse (p, header);
- /* See if we'll need an extended header later. */
- if (upperbound > SPARSES_IN_OLDGNU_HEADER - 1)
- header->oldgnu_header.isextended = 1;
- /* We store the "real" file size so we can show that in
- case someone wants to list the archive, i.e., tar tvf
- <file>. It might be kind of disconcerting if the
- shrunken file size was the one that showed up. */
- OFF_TO_OCT (current_stat.st_size,
- header->oldgnu_header.realsize);
- /* This will be the new "size" of the file, i.e., the size
- of the file minus the blocks of holes that we're
- skipping over. */
- find_new_file_size (&filesize, upperbound);
- current_stat.st_size = filesize;
- OFF_TO_OCT (filesize, header->header.size);
- for (counter = 0; counter < SPARSES_IN_OLDGNU_HEADER; counter++)
- {
- if (!sparsearray[counter].numbytes)
- break;
- OFF_TO_OCT (sparsearray[counter].offset,
- header->oldgnu_header.sp[counter].offset);
- SIZE_TO_OCT (sparsearray[counter].numbytes,
- header->oldgnu_header.sp[counter].numbytes);
- }
- }
- }
- else
- upperbound = SPARSES_IN_OLDGNU_HEADER - 1;
- sizeleft = current_stat.st_size;
- /* Don't bother opening empty, world readable files. Also do not open
- files when archive is meant for /dev/null. */
- if (dev_null_output
- || (sizeleft == 0 && 0444 == (0444 & current_stat.st_mode)))
- f = -1;
- else
- {
- f = open (p, O_RDONLY | O_BINARY);
- if (f < 0)
- {
- WARN ((0, errno, _("Cannot add file %s"), p));
- if (!ignore_failed_read_option)
- exit_status = TAREXIT_FAILURE;
- return;
- }
- }
- /* If the file is sparse, we've already taken care of this. */
- if (!header_moved)
- {
- header = start_header (p, ¤t_stat);
- if (header == NULL)
- {
- if (f >= 0)
- close (f);
- exit_status = TAREXIT_FAILURE;
- return;
- }
- }
- #ifdef S_ISCTG
- /* Mark contiguous files, if we support them. */
- if (archive_format != V7_FORMAT && S_ISCTG (current_stat.st_mode))
- header->header.typeflag = CONTTYPE;
- #endif
- isextended = header->oldgnu_header.isextended;
- save_typeflag = header->header.typeflag;
- finish_header (header);
- if (isextended)
- {
- #if 0
- int sum = 0;
- #endif
- int counter;
- #if 0
- union block *exhdr;
- int arraybound = SPARSES_IN_SPARSE_HEADER;
- #endif
- /* static */ int index_offset = SPARSES_IN_OLDGNU_HEADER;
- extend:
- exhdr = find_next_block ();
- if (exhdr == NULL)
- {
- exit_status = TAREXIT_FAILURE;
- return;
- }
- memset (exhdr->buffer, 0, BLOCKSIZE);
- for (counter = 0; counter < SPARSES_IN_SPARSE_HEADER; counter++)
- {
- if (counter + index_offset > upperbound)
- break;
- SIZE_TO_OCT (sparsearray[counter + index_offset].numbytes,
- exhdr->sparse_header.sp[counter].numbytes);
- OFF_TO_OCT (sparsearray[counter + index_offset].offset,
- exhdr->sparse_header.sp[counter].offset);
- }
- set_next_block_after (exhdr);
- #if 0
- sum += counter;
- if (sum < upperbound)
- goto extend;
- #endif
- if (index_offset + counter <= upperbound)
- {
- index_offset += counter;
- exhdr->sparse_header.isextended = 1;
- goto extend;
- }
- }
- if (save_typeflag == GNUTYPE_SPARSE)
- {
- if (finish_sparse_file (f, &sizeleft, current_stat.st_size, p))
- goto padit;
- }
- else
- while (sizeleft > 0)
- {
- if (multi_volume_option)
- {
- assign_string (&save_name, p);
- save_sizeleft = sizeleft;
- save_totsize = current_stat.st_size;
- }
- start = find_next_block ();
- bufsize = available_space_after (start);
- if (sizeleft < bufsize)
- {
- /* Last read -- zero out area beyond. */
- bufsize = sizeleft;
- count = bufsize % BLOCKSIZE;
- if (count)
- memset (start->buffer + sizeleft, 0,
- (size_t) (BLOCKSIZE - count));
- }
- if (f < 0)
- count = bufsize;
- else
- count = read (f, start->buffer, bufsize);
- if (count < 0)
- {
- char buf[UINTMAX_STRSIZE_BOUND];
- ERROR ((0, errno, _("\
- Read error at byte %s, reading %lu bytes, in file %s"),
- STRINGIFY_BIGINT (current_stat.st_size - sizeleft,
- buf),
- (unsigned long) bufsize, p));
- goto padit;
- }
- sizeleft -= count;
- /* This is nonportable (the type of set_next_block_after's arg). */
- set_next_block_after (start + (count - 1) / BLOCKSIZE);
- if (count == bufsize)
- continue;
- else
- {
- char buf[UINTMAX_STRSIZE_BOUND];
- ERROR ((0, 0,
- _("File %s shrunk by %s bytes, padding with zeros"),
- p, STRINGIFY_BIGINT (sizeleft, buf)));
- goto padit; /* short read */
- }
- }
- if (multi_volume_option)
- assign_string (&save_name, NULL);
- if (f >= 0)
- {
- close (f);
- if (atime_preserve_option)
- utime (p, &restore_times);
- }
- if (remove_files_option)
- {
- if (unlink (p) == -1)
- ERROR ((0, errno, _("Cannot remove %s"), p));
- }
- return;
- /* File shrunk or gave error, pad out tape to match the size we
- specified in the header. */
- padit:
- while (sizeleft > 0)
- {
- save_sizeleft = sizeleft;
- start = find_next_block ();
- memset (start->buffer, 0, BLOCKSIZE);
- set_next_block_after (start);
- sizeleft -= BLOCKSIZE;
- }
- if (multi_volume_option)
- assign_string (&save_name, NULL);
- if (f >= 0)
- {
- close (f);
- if (atime_preserve_option)
- utime (p, &restore_times);
- }
- return;
- }
- #ifdef S_ISLNK
- else if (S_ISLNK (current_stat.st_mode))
- {
- int size;
- char *buffer = (char *) alloca (PATH_MAX + 1);
- size = readlink (p, buffer, PATH_MAX + 1);
- if (size < 0)
- {
- WARN ((0, errno, _("Cannot add file %s"), p));
- if (!ignore_failed_read_option)
- exit_status = TAREXIT_FAILURE;
- return;
- }
- buffer[size] = '\0';
- if (size >= NAME_FIELD_SIZE)
- write_long (buffer, GNUTYPE_LONGLINK);
- assign_string (¤t_link_name, buffer);
- current_stat.st_size = 0; /* force 0 size on symlink */
- header = start_header (p, ¤t_stat);
- if (header == NULL)
- {
- exit_status = TAREXIT_FAILURE;
- return;
- }
- strncpy (header->header.linkname, buffer, NAME_FIELD_SIZE);
- header->header.linkname[NAME_FIELD_SIZE - 1] = '\0';
- header->header.typeflag = SYMTYPE;
- finish_header (header); /* nothing more to do to it */
- if (remove_files_option)
- {
- if (unlink (p) == -1)
- ERROR ((0, errno, _("Cannot remove %s"), p));
- }
- return;
- }
- #endif /* S_ISLNK */
- else if (S_ISDIR (current_stat.st_mode))
- {
- DIR *directory;
- struct dirent *entry;
- char *namebuf;
- size_t buflen;
- size_t len;
- dev_t our_device = current_stat.st_dev;
- /* If this tar program is installed suid root, like for Amanda, the
- access might look like denied, while it is not really.
- FIXME: I have the feeling this test is done too early. Couldn't it
- just be bundled in later actions? I guess that the proper support
- of --ignore-failed-read is the key of the current writing. */
- if (access (p, R_OK) == -1 && geteuid () != 0)
- {
- WARN ((0, errno, _("Cannot add directory %s"), p));
- if (!ignore_failed_read_option)
- exit_status = TAREXIT_FAILURE;
- return;
- }
- /* Build new prototype name. Ensure exactly one trailing slash. */
- len = strlen (p);
- buflen = len + NAME_FIELD_SIZE;
- namebuf = xmalloc (buflen + 1);
- strncpy (namebuf, p, buflen);
- while (len >= 1 && namebuf[len - 1] == '/')
- len--;
- namebuf[len++] = '/';
- namebuf[len] = '\0';
- if (1)
- {
- /* The "1" above used to be "archive_format != V7_FORMAT", GNU tar
- was just not writing directory blocks at all. Daniel Trinkle
- writes: ``All old versions of tar I have ever seen have
- correctly archived an empty directory. The really old ones I
- checked included HP-UX 7 and Mt. Xinu More/BSD. There may be
- some subtle reason for the exclusion that I don't know, but the
- current behavior is broken.'' I do not know those subtle
- reasons either, so until these are reported (anew?), just allow
- directory blocks to be written even with old archives. */
- current_stat.st_size = 0; /* force 0 size on dir */
- /* FIXME: If people could really read standard archives, this
- should be:
- header
- = start_header (standard_option ? p : namebuf, &current_stat);
- but since they'd interpret DIRTYPE blocks as regular
- files, we'd better put the / on the name. */
- header = start_header (namebuf, ¤t_stat);
- if (header == NULL)
- {
- exit_status = TAREXIT_FAILURE;
- return; /* eg name too long */
- }
- if (incremental_option)
- header->header.typeflag = GNUTYPE_DUMPDIR;
- else /* if (standard_option) */
- header->header.typeflag = DIRTYPE;
- /* If we're gnudumping, we aren't done yet so don't close it. */
- if (!incremental_option)
- finish_header (header); /* done with directory header */
- }
- if (incremental_option && gnu_list_name->dir_contents)
- {
- off_t sizeleft;
- off_t totsize;
- size_t bufsize;
- union block *start;
- ssize_t count;
- const char *buffer, *p_buffer;
- buffer = gnu_list_name->dir_contents; /* FOO */
- totsize = 0;
- for (p_buffer = buffer; p_buffer && *p_buffer;)
- {
- size_t tmp;
- tmp = strlen (p_buffer) + 1;
- totsize += tmp;
- p_buffer += tmp;
- }
- totsize++;
- OFF_TO_OCT (totsize, header->header.size);
- finish_header (header);
- p_buffer = buffer;
- sizeleft = totsize;
- while (sizeleft > 0)
- {
- if (multi_volume_option)
- {
- assign_string (&save_name, p);
- save_sizeleft = sizeleft;
- save_totsize = totsize;
- }
- start = find_next_block ();
- bufsize = available_space_after (start);
- if (sizeleft < bufsize)
- {
- bufsize = sizeleft;
- count = bufsize % BLOCKSIZE;
- if (count)
- memset (start->buffer + sizeleft, 0,
- (size_t) (BLOCKSIZE - count));
- }
- memcpy (start->buffer, p_buffer, bufsize);
- sizeleft -= bufsize;
- p_buffer += bufsize;
- set_next_block_after (start + (bufsize - 1) / BLOCKSIZE);
- }
- if (multi_volume_option)
- assign_string (&save_name, NULL);
- if (atime_preserve_option)
- utime (p, &restore_times);
- return;
- }
- /* See if we are about to recurse into a directory, and avoid doing
- so if the user wants that we do not descend into directories. */
- if (no_recurse_option)
- return;
- /* See if we are crossing from one file system to another, and
- avoid doing so if the user only wants to dump one file system. */
- if (one_file_system_option && !top_level
- && parent_device != current_stat.st_dev)
- {
- if (verbose_option)
- WARN ((0, 0, _("%s: On a different filesystem; not dumped"), p));
- return;
- }
- /* Now output all the files in the directory. */
- errno = 0; /* FIXME: errno should be read-only */
- directory = opendir (p);
- if (!directory)
- {
- ERROR ((0, errno, _("Cannot open directory %s"), p));
- return;
- }
- /* Hack to remove "./" from the front of all the file names. */
- if (len == 2 && namebuf[0] == '.' && namebuf[1] == '/')
- len = 0;
- /* FIXME: Should speed this up by cd-ing into the dir. */
- while (entry = readdir (directory), entry)
- {
- /* Skip `.' and `..'. */
- if (is_dot_or_dotdot (entry->d_name))
- continue;
- if ((int) NAMLEN (entry) + len >= buflen)
- {
- buflen = len + NAMLEN (entry);
- namebuf = (char *) xrealloc (namebuf, buflen + 1);
- #if 0
- namebuf[len] = '\0';
- ERROR ((0, 0, _("File name %s%s too long"),
- namebuf, entry->d_name));
- continue;
- #endif
- }
- strcpy (namebuf + len, entry->d_name);
- if (exclude_option && check_exclude (namebuf))
- continue;
- dump_file (namebuf, our_device, 0);
- }
- closedir (directory);
- free (namebuf);
- if (atime_preserve_option)
- utime (p, &restore_times);
- return;
- }
- #ifdef S_ISCHR
- else if (S_ISCHR (current_stat.st_mode))
- type = CHRTYPE;
- #endif
- #ifdef S_ISBLK
- else if (S_ISBLK (current_stat.st_mode))
- type = BLKTYPE;
- #endif
- /* Avoid screwy apollo lossage where S_IFIFO == S_IFSOCK. */
- #if (_ISP__M68K == 0) && (_ISP__A88K == 0) && defined(S_ISFIFO)
- else if (S_ISFIFO (current_stat.st_mode))
- type = FIFOTYPE;
- #endif
- #ifdef S_ISSOCK
- else if (S_ISSOCK (current_stat.st_mode))
- type = FIFOTYPE;
- #endif
- else
- goto unknown;
- if (archive_format == V7_FORMAT)
- goto unknown;
- current_stat.st_size = 0; /* force 0 size */
- header = start_header (p, ¤t_stat);
- if (header == NULL)
- {
- exit_status = TAREXIT_FAILURE;
- return; /* eg name too long */
- }
- header->header.typeflag = type;
- #if defined(S_IFBLK) || defined(S_IFCHR)
- if (type != FIFOTYPE)
- {
- MAJOR_TO_OCT (major (current_stat.st_rdev), header->header.devmajor);
- MINOR_TO_OCT (minor (current_stat.st_rdev), header->header.devminor);
- }
- #endif
- finish_header (header);
- if (remove_files_option)
- {
- if (unlink (p) == -1)
- ERROR ((0, errno, _("Cannot remove %s"), p));
- }
- return;
- unknown:
- ERROR ((0, 0, _("%s: Unknown file type; file ignored"), p));
- }
|