386BSD 0.1 development
[unix-history] / usr / src / usr.bin / tar / create.c
/* Create a tar archive.
Copyright (C) 1988 Free Software Foundation
This file is part of GNU Tar.
GNU Tar is free software; you can redistribute it and/or modify
it under the terms of the GNU General Public License as published by
the Free Software Foundation; either version 1, or (at your option)
any later version.
GNU Tar is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
GNU General Public License for more details.
You should have received a copy of the GNU General Public License
along with GNU Tar; see the file COPYING. If not, write to
the Free Software Foundation, 675 Mass Ave, Cambridge, MA 02139, USA. */
/*
* Create a tar archive.
*
* Written 25 Aug 1985 by John Gilmore, ihnp4!hoptoad!gnu.
*
* @(#)create.c 1.36 11/6/87 - gnu
*/
#include <sys/types.h>
#include <sys/stat.h>
#include <stdio.h>
#ifndef V7
#include <fcntl.h>
#endif
#ifndef __MSDOS__
#include <sys/file.h>
#include <sys/param.h> /* for MAXPATHLEN */
#include <pwd.h>
#include <grp.h>
#endif
#ifdef BSD42
#include <sys/dir.h>
#else
#ifdef __MSDOS__
#include "msd_dir.h"
#else
#ifdef USG
#ifdef NDIR
#include <ndir.h>
#else
#include <dirent.h>
#endif
#ifndef DIRECT
#define direct dirent
#endif
#define DP_NAMELEN(x) strlen((x)->d_name)
#else
/*
* FIXME: On other systems there is no standard place for the header file
* for the portable directory access routines. Change the #include line
* below to bring it in from wherever it is.
*/
#include "ndir.h"
#endif
#endif
#endif
#ifndef DP_NAMELEN
#define DP_NAMELEN(x) (x)->d_namlen
#endif
#ifdef USG
#include <sys/sysmacros.h> /* major() and minor() defined here */
#endif
/*
* V7 doesn't have a #define for this.
*/
#ifndef O_RDONLY
#define O_RDONLY 0
#endif
/*
* Most people don't have a #define for this.
*/
#ifndef O_BINARY
#define O_BINARY 0
#endif
#ifndef MAXPATHLEN
#define MAXPATHLEN 1024
#endif
#include "tar.h"
#include "port.h"
extern struct stat hstat; /* Stat struct corresponding */
#ifndef __MSDOS__
extern dev_t ar_dev;
extern ino_t ar_ino;
#endif
/* JF */
extern struct name *gnu_list_name;
/*
* If there are no symbolic links, there is no lstat(). Use stat().
*/
#ifndef S_IFLNK
#define lstat stat
#endif
extern char *malloc();
extern char *strcpy();
extern char *strncpy();
extern void bzero();
extern void bcopy();
extern int errno;
extern void print_header();
union record *start_header();
void finish_header();
void finduname();
void findgname();
char *name_next();
void to_oct();
void dump_file();
/* This code moved from tar.h since create.c is the only file that cares
about 'struct link's. This means that other files might not have to
include sys/types.h any more.
*/
struct link {
struct link *next;
dev_t dev;
ino_t ino;
short linkcount;
char name[1];
};
struct link *linklist; /* Points to first link in list */
static nolinks; /* Gets set if we run out of RAM */
/*
* "Scratch" space to store the information about a sparse file before
* writing the info into the header or extended header
*/
/* struct sp_array *sparsearray;*/
/* number of elts storable in the sparsearray */
/*int sparse_array_size = 10;*/
void
create_archive()
{
register char *p;
char *name_from_list();
open_archive(0); /* Open for writing */
if(f_gnudump) {
char buf[MAXNAMLEN],*q,*bufp;
collect_and_sort_names();
while(p=name_from_list())
dump_file(p,-1);
/* if(!f_dironly) { */
blank_name_list();
while(p=name_from_list()) {
strcpy(buf,p);
if(p[strlen(p)-1]!='/')
strcat(buf,"/");
bufp=buf+strlen(buf);
for(q=gnu_list_name->dir_contents;q && *q;q+=strlen(q)+1) {
if(*q=='Y') {
strcpy(bufp,q+1);
dump_file(buf,-1);
}
}
}
/* } */
} else {
p = name_next(1);
if(!p)
dump_file(".", -1);
else {
do dump_file(p, -1);
while (p = name_next(1));
}
}
write_mangled();
write_eot();
close_archive();
if(f_gnudump)
write_dir_file();
name_close();
}
/*
* Dump a single file. If it's a directory, recurse.
* Result is 1 for success, 0 for failure.
* Sets global "hstat" to stat() output for this file.
*/
void
dump_file (p, curdev)
char *p; /* File name to dump */
int curdev; /* Device our parent dir was on */
{
union record *header;
char type;
extern char *save_name; /* JF for multi-volume support */
extern long save_totsize;
extern long save_sizeleft;
union record *exhdr;
char save_linkflag;
extern time_t new_time;
int sparse_ind = 0;
if(f_confirm && !confirm("add",p))
return;
/*
* Use stat if following (rather than dumping) 4.2BSD's
* symbolic links. Otherwise, use lstat (which, on non-4.2
* systems, is #define'd to stat anyway.
*/
#ifdef AIX
if (0 != f_follow_links ?
statx (p, &hstat, STATSIZE, STX_HIDDEN):
statx (p, &hstat, STATSIZE, STX_HIDDEN|STX_LINK))
#else
if (0 != f_follow_links? stat(p, &hstat): lstat(p, &hstat))
#endif /* AIX */
{
badperror:
msg_perror("can't add file %s",p);
badfile:
errors++;
return;
}
#ifdef AIX
if (S_ISHIDDEN (hstat.st_mode)) {
char *new = (char *)allocate (strlen (p) + 2);
if (new) {
strcpy (new, p);
strcat (new, "@");
p = new;
}
}
#endif /* AIX */
/* See if we only want new files, and check if this one is too old to
put in the archive. */
if( f_new_files
&& !f_gnudump
&& new_time>hstat.st_mtime
&& (hstat.st_mode&S_IFMT)!=S_IFDIR
&& (f_new_files>1 || new_time>hstat.st_ctime)) {
if(curdev<0) {
msg("%s: is unchanged; not dumped",p);
}
return;
}
#ifndef __MSDOS__
/* See if we are trying to dump the archive */
if(ar_dev && hstat.st_dev==ar_dev && hstat.st_ino==ar_ino) {
msg("%s is the archive; not dumped",p);
return;
}
#endif
/*
* Check for multiple links.
*
* We maintain a list of all such files that we've written so
* far. Any time we see another, we check the list and
* avoid dumping the data again if we've done it once already.
*/
if (hstat.st_nlink > 1) switch (hstat.st_mode & S_IFMT) {
register struct link *lp;
case S_IFREG: /* Regular file */
#ifdef S_IFCTG
case S_IFCTG: /* Contigous file */
#endif
#ifdef S_IFCHR
case S_IFCHR: /* Character special file */
#endif
#ifdef S_IFBLK
case S_IFBLK: /* Block special file */
#endif
#ifdef S_IFIFO
case S_IFIFO: /* Fifo special file */
#endif
/* First quick and dirty. Hashing, etc later FIXME */
for (lp = linklist; lp; lp = lp->next) {
if (lp->ino == hstat.st_ino &&
lp->dev == hstat.st_dev) {
char *link_name = lp->name;
/* We found a link. */
hstat.st_size = 0;
header = start_header(p, &hstat);
if (header == NULL) goto badfile;
while(!f_absolute_paths && *link_name == '/') {
static int link_warn = 0;
if (!link_warn) {
msg("Removing leading / from absolute links");
link_warn++;
}
link_name++;
}
strncpy(header->header.linkname,
link_name,NAMSIZ);
if(header->header.linkname[NAMSIZ-1]) {
char *mangled;
extern char *find_mangled();
mangled=find_mangled(link_name);
msg("%s: link name too long: mangled to %s",link_name,mangled);
strncpy(header->header.linkname,mangled,NAMSIZ);
}
header->header.linkflag = LF_LINK;
finish_header(header);
/* FIXME: Maybe remove from list after all links found? */
return; /* We dumped it */
}
}
/* Not found. Add it to the list of possible links. */
lp = (struct link *)malloc((unsigned)(sizeof(struct link)+strlen(p)));
if (!lp) {
if (!nolinks) {
msg(
"no memory for links, they will be dumped as separate files");
nolinks++;
}
}
lp->ino = hstat.st_ino;
lp->dev = hstat.st_dev;
strcpy(lp->name, p);
lp->next = linklist;
linklist = lp;
}
/*
* This is not a link to a previously dumped file, so dump it.
*/
switch (hstat.st_mode & S_IFMT) {
case S_IFREG: /* Regular file */
#ifdef S_IFCTG
case S_IFCTG: /* Contiguous file */
#endif
{
int f; /* File descriptor */
long bufsize, count;
long sizeleft;
register union record *start;
int header_moved;
char isextended = 0;
int upperbound;
int end_nulls = 0;
header_moved = 0;
#ifdef BSD42
if (f_sparse_files) {
/*
* JK - This is the test for sparseness: whether the
* "size" of the file matches the number of blocks
* allocated for it. If there is a smaller number
* of blocks that would be necessary to accommodate
* a file of this size, we have a sparse file, i.e.,
* at least one of those records in the file is just
* a useless hole.
*/
#ifdef hpux /* Nice of HPUX to gratuitiously change it, huh? - mib */
if (hstat.st_size - (hstat.st_blocks * 1024) > 1024 ) {
#else
if (hstat.st_size - (hstat.st_blocks * RECORDSIZE) > RECORDSIZE) {
#endif
int filesize = hstat.st_size;
register int i;
header = start_header(p, &hstat);
if (header == NULL)
goto badfile;
header->header.linkflag = LF_SPARSE;
header_moved++;
/*
* Call the routine that figures out the
* layout of the sparse file in question.
* UPPERBOUND is the index of the last
* element of the "sparsearray," i.e.,
* the number of elements it needed to
* describe the file.
*/
upperbound = deal_with_sparse(p, header);
/*
* See if we'll need an extended header
* later
*/
if (upperbound > SPARSE_IN_HDR-1)
header->header.isextended++;
/*
* We store the "real" file size so
* we can show that in case someone wants
* to list the archive, i.e., tar tvf <file>.
* It might be kind of disconcerting if the
* shrunken file size was the one that showed
* up.
*/
to_oct((long) hstat.st_size, 1+12,
header->header.realsize);
/*
* This will be the new "size" of the
* file, i.e., the size of the file
* minus the records of holes that we're
* skipping over.
*/
find_new_file_size(&filesize, upperbound);
hstat.st_size = filesize;
to_oct((long) filesize, 1+12,
header->header.size);
/* to_oct((long) end_nulls, 1+12,
header->header.ending_blanks);*/
for (i = 0; i < SPARSE_IN_HDR; i++) {
if (!sparsearray[i].numbytes)
break;
to_oct(sparsearray[i].offset, 1+12,
header->header.sp[i].offset);
to_oct(sparsearray[i].numbytes, 1+12,
header->header.sp[i].numbytes);
}
}
}
#else
upperbound=SPARSE_IN_HDR-1;
#endif
sizeleft = hstat.st_size;
/* Don't bother opening empty, world readable files. */
if (sizeleft > 0 || 0444 != (0444 & hstat.st_mode)) {
f = open(p, O_RDONLY|O_BINARY);
if (f < 0) goto badperror;
} else {
f = -1;
}
/* If the file is sparse, we've already taken care of this */
if (!header_moved) {
header = start_header(p, &hstat);
if (header == NULL) {
if(f>=0)
(void)close(f);
goto badfile;
}
}
#ifdef S_IFCTG
/* Mark contiguous files, if we support them */
if (f_standard && (hstat.st_mode & S_IFMT) == S_IFCTG) {
header->header.linkflag = LF_CONTIG;
}
#endif
isextended = header->header.isextended;
save_linkflag = header->header.linkflag;
finish_header(header);
if (isextended) {
int sum = 0;
register int i;
/* register union record *exhdr;*/
int arraybound = SPARSE_EXT_HDR;
/* static */ int index_offset = SPARSE_IN_HDR;
extend: exhdr = findrec();
if (exhdr == NULL) goto badfile;
bzero(exhdr->charptr, RECORDSIZE);
for (i = 0; i < SPARSE_EXT_HDR; i++) {
if (i+index_offset > upperbound)
break;
to_oct((long) sparsearray[i+index_offset].numbytes,
1+12,
exhdr->ext_hdr.sp[i].numbytes);
to_oct((long) sparsearray[i+index_offset].offset,
1+12,
exhdr->ext_hdr.sp[i].offset);
}
userec(exhdr);
/* sum += i;
if (sum < upperbound)
goto extend;*/
if (index_offset+i < upperbound) {
index_offset += i;
exhdr->ext_hdr.isextended++;
goto extend;
}
}
if (save_linkflag == LF_SPARSE) {
if (finish_sparse_file(f, &sizeleft, hstat.st_size, p))
goto padit;
}
else
while (sizeleft > 0) {
if(f_multivol) {
save_name = p;
save_sizeleft = sizeleft;
save_totsize = hstat.st_size;
}
start = findrec();
bufsize = endofrecs()->charptr - start->charptr;
if (sizeleft < bufsize) {
/* Last read -- zero out area beyond */
bufsize = (int)sizeleft;
count = bufsize % RECORDSIZE;
if (count)
bzero(start->charptr + sizeleft,
(int)(RECORDSIZE - count));
}
count = read(f, start->charptr, bufsize);
if (count < 0) {
msg_perror("read error at byte %ld, reading\
%d bytes, in file %s", hstat.st_size - sizeleft, bufsize,p);
goto padit;
}
sizeleft -= count;
/* This is nonportable (the type of userec's arg). */
userec(start+(count-1)/RECORDSIZE);
if (count == bufsize) continue;
msg( "file %s shrunk by %d bytes, padding with zeros.", p, sizeleft);
goto padit; /* Short read */
}
if(f_multivol)
save_name = 0;
if (f >= 0)
(void)close(f);
break;
/*
* File shrunk or gave error, pad out tape to match
* the size we specified in the header.
*/
padit:
while(sizeleft>0) {
save_sizeleft=sizeleft;
start=findrec();
bzero(start->charptr,RECORDSIZE);
userec(start);
sizeleft-=RECORDSIZE;
}
if(f_multivol)
save_name=0;
if(f>=0)
(void)close(f);
break;
/* abort(); */
}
#ifdef S_IFLNK
case S_IFLNK: /* Symbolic link */
{
int size;
hstat.st_size = 0; /* Force 0 size on symlink */
header = start_header(p, &hstat);
if (header == NULL) goto badfile;
size = readlink(p, header->header.linkname, NAMSIZ);
if (size < 0) goto badperror;
if (size == NAMSIZ) {
char buf[MAXPATHLEN];
readlink(p,buf,MAXPATHLEN);
/* next_mangle(header->header.linkname); */
add_symlink_mangle(buf,p,header->header.linkname);
msg("symbolic link %s too long: mangling to %s",p, header->header.linkname);
/* size=strlen(header->header.linkname); */
} else
header->header.linkname[size] = '\0';
header->header.linkflag = LF_SYMLINK;
finish_header(header); /* Nothing more to do to it */
}
break;
#endif
case S_IFDIR: /* Directory */
{
register DIR *dirp;
register struct direct *d;
char *namebuf;
int buflen;
register int len;
int our_device = hstat.st_dev;
extern char *ck_malloc(),*ck_realloc();
/* Build new prototype name */
len = strlen(p);
buflen=len+NAMSIZ;
namebuf=ck_malloc(buflen+1);
strncpy(namebuf, p, buflen);
while (len >= 1 && '/' == namebuf[len-1])
len--; /* Delete trailing slashes */
namebuf[len++] = '/'; /* Now add exactly one back */
namebuf[len] = '\0'; /* Make sure null-terminated */
/*
* Output directory header record with permissions
* FIXME, do this AFTER files, to avoid R/O dir problems?
* If old archive format, don't write record at all.
*/
if (!f_oldarch) {
hstat.st_size = 0; /* Force 0 size on dir */
/*
* If people could really read standard archives,
* this should be: (FIXME)
header = start_header(f_standard? p: namebuf, &hstat);
* but since they'd interpret LF_DIR records as
* regular files, we'd better put the / on the name.
*/
header = start_header(namebuf, &hstat);
if (header == NULL)
goto badfile; /* eg name too long */
if (f_gnudump)
header->header.linkflag = LF_DUMPDIR;
else if (f_standard)
header->header.linkflag = LF_DIR;
/* If we're gnudumping, we aren't done yet so don't close it. */
if(!f_gnudump)
finish_header(header); /* Done with directory header */
}
if(f_gnudump) {
int sizeleft;
int totsize;
int bufsize;
union record *start;
int count;
char *buf,*p_buf;
buf=gnu_list_name->dir_contents; /* FOO */
totsize=0;
for(p_buf=buf;p_buf && *p_buf;) {
int tmp;
tmp=strlen(p_buf)+1;
totsize+=tmp;
p_buf+=tmp;
}
totsize++;
to_oct((long)totsize,1+12,header->header.size);
finish_header(header);
p_buf=buf;
sizeleft=totsize;
while(sizeleft>0) {
if(f_multivol) {
save_name=p;
save_sizeleft=sizeleft;
save_totsize=totsize;
}
start=findrec();
bufsize=endofrecs()->charptr - start->charptr;
if(sizeleft<bufsize) {
bufsize=sizeleft;
count=bufsize%RECORDSIZE;
if(count)
bzero(start->charptr+sizeleft,RECORDSIZE-count);
}
bcopy(p_buf,start->charptr,bufsize);
sizeleft-=bufsize;
p_buf+=bufsize;
userec(start+(bufsize-1)/RECORDSIZE);
}
if(f_multivol)
save_name = 0;
break;
}
/* Now output all the files in the directory */
/* if (f_dironly)
break; /* Unless the cmdline said not to */
/*
* See if we are crossing from one file system to another,
* and avoid doing so if the user only wants to dump one file system.
*/
if (f_local_filesys && curdev >= 0 && curdev != hstat.st_dev) {
if(f_verbose)
msg("%s: is on a different filesystem; not dumped",p);
break;
}
errno = 0;
dirp = opendir(p);
if (!dirp) {
if (errno) {
msg_perror ("can't open directory %s",p);
} else {
msg("error opening directory %s",
p);
}
break;
}
/* Hack to remove "./" from the front of all the file names */
if (len == 2 && namebuf[0] == '.' && namebuf[1]=='/')
len = 0;
/* Should speed this up by cd-ing into the dir, FIXME */
while (NULL != (d=readdir(dirp))) {
/* Skip . and .. */
if(is_dot_or_dotdot(d->d_name))
continue;
if (DP_NAMELEN(d) + len >= buflen) {
buflen=len+DP_NAMELEN(d);
namebuf=ck_realloc(namebuf,buflen+1);
/* namebuf[len]='\0';
msg("file name %s%s too long",
namebuf, d->d_name);
continue; */
}
strcpy(namebuf+len, d->d_name);
if(f_exclude && check_exclude(namebuf))
continue;
dump_file(namebuf, our_device);
}
closedir(dirp);
free(namebuf);
}
break;
#ifdef S_IFCHR
case S_IFCHR: /* Character special file */
type = LF_CHR;
goto easy;
#endif
#ifdef S_IFBLK
case S_IFBLK: /* Block special file */
type = LF_BLK;
goto easy;
#endif
/* Avoid screwy apollo lossage where S_IFIFO == S_IFSOCK */
#if ((_ISP__M68K == 0) && (_ISP__A88K == 0))
#ifdef S_IFIFO
case S_IFIFO: /* Fifo special file */
type = LF_FIFO;
goto easy;
#endif
#endif
#ifdef S_IFSOCK
case S_IFSOCK: /* Socket pretend its a fifo? */
type = LF_FIFO;
goto easy;
#endif
easy:
if (!f_standard) goto unknown;
hstat.st_size = 0; /* Force 0 size */
header = start_header(p, &hstat);
if (header == NULL) goto badfile; /* eg name too long */
header->header.linkflag = type;
if (type != LF_FIFO) {
to_oct((long) major(hstat.st_rdev), 8,
header->header.devmajor);
to_oct((long) minor(hstat.st_rdev), 8,
header->header.devminor);
}
finish_header(header);
break;
default:
unknown:
msg("%s: Unknown file type; file ignored.", p);
break;
}
}
int
finish_sparse_file(fd, sizeleft, fullsize, name)
int fd;
long *sizeleft,
fullsize;
char *name;
{
union record *start;
char tempbuf[RECORDSIZE];
int bufsize,
sparse_ind = 0,
count;
long pos;
long nwritten = 0;
while (*sizeleft > 0) {
start = findrec();
bzero(start->charptr, RECORDSIZE);
bufsize = sparsearray[sparse_ind].numbytes;
if (!bufsize) { /* we blew it, maybe */
msg("Wrote %ld of %ld bytes to file %s",
fullsize - *sizeleft, fullsize, name);
break;
}
pos = lseek(fd, sparsearray[sparse_ind++].offset, 0);
/*
* If the number of bytes to be written here exceeds
* the size of the temporary buffer, do it in steps.
*/
while (bufsize > RECORDSIZE) {
/* if (amt_read) {
count = read(fd, start->charptr+amt_read, RECORDSIZE-amt_read);
bufsize -= RECORDSIZE - amt_read;
amt_read = 0;
userec(start);
start = findrec();
bzero(start->charptr, RECORDSIZE);
}*/
/* store the data */
count = read(fd, start->charptr, RECORDSIZE);
if (count < 0) {
msg_perror("read error at byte %ld, reading %d bytes, in file %s",
fullsize - *sizeleft, bufsize, name);
return 1;
}
bufsize -= count;
*sizeleft -= count;
userec(start);
nwritten += RECORDSIZE; /* XXX */
start = findrec();
bzero(start->charptr, RECORDSIZE);
}
clear_buffer(tempbuf);
count = read(fd, tempbuf, bufsize);
bcopy(tempbuf, start->charptr, RECORDSIZE);
if (count < 0) {
msg_perror("read error at byte %ld, reading %d bytes, in file %s",
fullsize - *sizeleft, bufsize, name);
return 1;
}
/* if (amt_read >= RECORDSIZE) {
amt_read = 0;
userec(start+(count-1)/RECORDSIZE);
if (count != bufsize) {
msg("file %s shrunk by %d bytes, padding with zeros.", name, sizeleft);
return 1;
}
start = findrec();
} else
amt_read += bufsize;*/
nwritten += count; /* XXX */
*sizeleft -= count;
userec(start);
}
free(sparsearray);
printf ("Amount actually written is (I hope) %d.\n", nwritten);
/* userec(start+(count-1)/RECORDSIZE);*/
return 0;
}
init_sparsearray()
{
register int i;
sp_array_size = 10;
/*
* Make room for our scratch space -- initially is 10 elts long
*/
sparsearray = (struct sp_array *) malloc(sp_array_size * sizeof(struct sp_array));
for (i = 0; i < sp_array_size; i++) {
sparsearray[i].offset = 0;
sparsearray[i].numbytes = 0;
}
}
/*
* Okay, we've got a sparse file on our hands -- now, what we need to do is
* make a pass through the file and carefully note where any data is, i.e.,
* we want to find how far into the file each instance of data is, and how
* many bytes are there. We store this information in the sparsearray,
* which will later be translated into header information. For now, we use
* the sparsearray as convenient storage.
*
* As a side note, this routine is a mess. If I could have found a cleaner
* way to do it, I would have. If anyone wants to find a nicer way to do
* this, feel free.
*/
/* There is little point in trimming small amounts of null data at the */
/* head and tail of blocks -- it's ok if we only avoid dumping blocks */
/* of complete null data */
int
deal_with_sparse(name, header, nulls_at_end)
char *name;
union record *header;
{
long numbytes = 0;
long offset = 0;
long save_offset;
int fd;
int current_size = hstat.st_size;
int sparse_ind = 0,
cc;
char buf[RECORDSIZE];
int read_last_data = 0; /* did we just read the last record? */
int amidst_data = 0;
header->header.isextended = 0;
/*
* Can't open the file -- this problem will be caught later on,
* so just return.
*/
if ((fd = open(name, O_RDONLY)) < 0)
return 0;
init_sparsearray();
clear_buffer(buf);
while ((cc = read(fd, buf, sizeof buf)) != 0) {
if (sparse_ind > sp_array_size-1) {
/*
* realloc the scratch area, since we've run out of room --
*/
sparsearray = (struct sp_array *)
realloc(sparsearray,
2 * sp_array_size * (sizeof(struct sp_array)));
sp_array_size *= 2;
}
if (cc == sizeof buf) {
if (zero_record(buf)) {
if (amidst_data) {
sparsearray[sparse_ind++].numbytes
= numbytes;
amidst_data = 0;
}
} else { /* !zero_record(buf) */
if (amidst_data)
numbytes += cc;
else {
amidst_data = 1;
numbytes = cc;
sparsearray[sparse_ind].offset
= offset;
}
}
} else if (cc < sizeof buf) {
/* This has to be the last bit of the file, so this */
/* is somewhat shorter than the above. */
if (!zero_record(buf)) {
if (!amidst_data) {
amidst_data = 1;
numbytes = cc;
sparsearray[sparse_ind].offset
= offset;
} else
numbytes += cc;
}
}
offset += cc;
clear_buffer(buf);
}
if (amidst_data)
sparsearray[sparse_ind++].numbytes = numbytes;
close(fd);
return sparse_ind - 1;
}
/*
* Just zeroes out the buffer so we don't confuse ourselves with leftover
* data.
*/
clear_buffer(buf)
char *buf;
{
register int i;
for (i = 0; i < RECORDSIZE; i++)
buf[i] = '\0';
}
#if 0 /* I'm leaving this as a monument to Joy Kendall, who wrote it */
/*
* JK -
* This routine takes a character array, and tells where within that array
* the data can be found. It skips over any zeros, and sets the first
* non-zero point in the array to be the "start", and continues until it
* finds non-data again, which is marked as the "end." This routine is
* mainly for 1) seeing how far into a file we must lseek to data, given
* that we have a sparse file, and 2) determining the "real size" of the
* file, i.e., the number of bytes in the sparse file that are data, as
* opposed to the zeros we are trying to skip.
*/
where_is_data(from, to, buffer)
int *from,
*to;
char *buffer;
{
register int i = 0;
register int save_to = *to;
int amidst_data = 0;
while (!buffer[i])
i++;
*from = i;
if (*from < 16) /* don't bother */
*from = 0;
/* keep going to make sure there isn't more real
data in this record */
while (i < RECORDSIZE) {
if (!buffer[i]) {
if (amidst_data) {
save_to = i;
amidst_data = 0;
}
i++;
}
else if (buffer[i]) {
if (!amidst_data)
amidst_data = 1;
i++;
}
}
if (i == RECORDSIZE)
*to = i;
else
*to = save_to;
}
#endif
/* Note that this routine is only called if zero_record returned true */
#if 0 /* But we actually don't need it at all. */
where_is_data (from, to, buffer)
int *from, *to;
char *buffer;
{
char *fp, *tp;
for (fp = buffer; ! *fp; fp++)
;
for (tp = buffer + RECORDSIZE - 1; ! *tp; tp--)
;
*from = fp - buffer;
*to = tp - buffer + 1;
}
#endif
/*
* Takes a recordful of data and basically cruises through it to see if
* it's made *entirely* of zeros, returning a 0 the instant it finds
* something that is a non-zero, i.e., useful data.
*/
zero_record(buffer)
char *buffer;
{
register int i;
for (i = 0; i < RECORDSIZE; i++)
if (buffer[i] != '\000')
return 0;
return 1;
}
find_new_file_size(filesize, highest_index)
int *filesize;
int highest_index;
{
register int i;
*filesize = 0;
for (i = 0; sparsearray[i].numbytes && i <= highest_index; i++)
*filesize += sparsearray[i].numbytes;
}
/*
* Make a header block for the file name whose stat info is st .
* Return header pointer for success, NULL if the name is too long.
*/
union record *
start_header(name, st)
char *name;
register struct stat *st;
{
register union record *header;
header = (union record *) findrec();
bzero(header->charptr, sizeof(*header)); /* XXX speed up */
/*
* Check the file name and put it in the record.
*/
if(!f_absolute_paths) {
static int warned_once = 0;
#ifdef __MSDOS__
if(name[1]==':') {
name+=2;
if(!warned_once++)
msg("Removing drive spec from names in the archive");
}
#endif
while ('/' == *name) {
name++; /* Force relative path */
if (!warned_once++)
msg("Removing leading / from absolute path names in the archive.");
}
}
strncpy(header->header.name, name, NAMSIZ);
if (header->header.name[NAMSIZ-1]) {
char *mangled;
/* next_mangle(header->header.name); */
add_mangle(name,header->header.name);
msg("%s: is too long: mangling to %s", name, header->header.name);
}
to_oct((long) (st->st_mode & ~S_IFMT),
8, header->header.mode);
to_oct((long) st->st_uid, 8, header->header.uid);
to_oct((long) st->st_gid, 8, header->header.gid);
to_oct((long) st->st_size, 1+12, header->header.size);
to_oct((long) st->st_mtime, 1+12, header->header.mtime);
/* header->header.linkflag is left as null */
if(f_gnudump) {
to_oct((long) st->st_atime, 1+12, header->header.atime);
to_oct((long) st->st_ctime, 1+12, header->header.ctime);
}
#ifndef NONAMES
/* Fill in new Unix Standard fields if desired. */
if (f_standard) {
header->header.linkflag = LF_NORMAL; /* New default */
strcpy(header->header.magic, TMAGIC); /* Mark as Unix Std */
finduname(header->header.uname, st->st_uid);
findgname(header->header.gname, st->st_gid);
}
#endif
return header;
}
/*
* Finish off a filled-in header block and write it out.
* We also print the file name and/or full info if verbose is on.
*/
void
finish_header(header)
register union record *header;
{
register int i, sum;
register char *p;
void bcopy();
bcopy(CHKBLANKS, header->header.chksum, sizeof(header->header.chksum));
sum = 0;
p = header->charptr;
for (i = sizeof(*header); --i >= 0; ) {
/*
* We can't use unsigned char here because of old compilers,
* e.g. V7.
*/
sum += 0xFF & *p++;
}
/*
* Fill in the checksum field. It's formatted differently
* from the other fields: it has [6] digits, a null, then a
* space -- rather than digits, a space, then a null.
* We use to_oct then write the null in over to_oct's space.
* The final space is already there, from checksumming, and
* to_oct doesn't modify it.
*
* This is a fast way to do:
* (void) sprintf(header->header.chksum, "%6o", sum);
*/
to_oct((long) sum, 8, header->header.chksum);
header->header.chksum[6] = '\0'; /* Zap the space */
userec(header);
if (f_verbose) {
extern union record *head; /* Points to current tape header */
extern int head_standard; /* Tape header is in ANSI format */
/* These globals are parameters to print_header, sigh */
head = header;
/* hstat is already set up */
head_standard = f_standard;
print_header();
}
return;
}
/*
* Quick and dirty octal conversion.
* Converts long "value" into a "digs"-digit field at "where",
* including a trailing space and room for a null. "digs"==3 means
* 1 digit, a space, and room for a null.
*
* We assume the trailing null is already there and don't fill it in.
* This fact is used by start_header and finish_header, so don't change it!
*
* This should be equivalent to:
* (void) sprintf(where, "%*lo ", digs-2, value);
* except that sprintf fills in the trailing null and we don't.
*/
void
to_oct(value, digs, where)
register long value;
register int digs;
register char *where;
{
--digs; /* Trailing null slot is left alone */
where[--digs] = ' '; /* Put in the space, though */
/* Produce the digits -- at least one */
do {
where[--digs] = '0' + (char)(value & 7); /* one octal digit */
value >>= 3;
} while (digs > 0 && value != 0);
/* Leading spaces, if necessary */
while (digs > 0)
where[--digs] = ' ';
}
/*
* Write the EOT record(s).
* We actually zero at least one record, through the end of the block.
* Old tar writes garbage after two zeroed records -- and PDtar used to.
*/
write_eot()
{
union record *p;
int bufsize;
void bzero();
p = findrec();
if (p)
{
bufsize = endofrecs()->charptr - p->charptr;
bzero(p->charptr, bufsize);
userec(p);
}
}