diff options
Diffstat (limited to 'gnu/usr.bin/tar/diffarch.c')
| -rw-r--r-- | gnu/usr.bin/tar/diffarch.c | 759 | 
1 files changed, 759 insertions, 0 deletions
| diff --git a/gnu/usr.bin/tar/diffarch.c b/gnu/usr.bin/tar/diffarch.c new file mode 100644 index 000000000000..ce47d9d6cab5 --- /dev/null +++ b/gnu/usr.bin/tar/diffarch.c @@ -0,0 +1,759 @@ +/* Diff files from a tar archive. +   Copyright (C) 1988, 1992, 1993 Free Software Foundation + +This file is part of GNU Tar. + +GNU Tar is free software; you can redistribute it and/or modify +it under the terms of the GNU General Public License as published by +the Free Software Foundation; either version 2, or (at your option) +any later version. + +GNU Tar is distributed in the hope that it will be useful, +but WITHOUT ANY WARRANTY; without even the implied warranty of +MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the +GNU General Public License for more details. + +You should have received a copy of the GNU General Public License +along with GNU Tar; see the file COPYING.  If not, write to +the Free Software Foundation, 675 Mass Ave, Cambridge, MA 02139, USA.  */ + +/* + * Diff files from a tar archive. + * + * Written 30 April 1987 by John Gilmore, ihnp4!hoptoad!gnu. + */ + +#include <stdio.h> +#include <errno.h> +#ifndef STDC_HEADERS +extern int errno; +#endif +#include <sys/types.h> + +#ifdef BSD42 +#include <sys/file.h> +#else +#ifndef V7 +#include <fcntl.h> +#endif +#endif + +#ifdef HAVE_SYS_MTIO_H +#include <sys/ioctl.h> +#include <sys/mtio.h> +#endif + +#include "tar.h" +#include "port.h" +#include "rmt.h" + +#ifndef S_ISLNK +#define lstat stat +#endif + +extern void *valloc (); + +extern union record *head;	/* Points to current tape header */ +extern struct stat hstat;	/* Stat struct corresponding */ +extern int head_standard;	/* Tape header is in ANSI format */ + +void decode_header (); +void diff_sparse_files (); +void fill_in_sparse_array (); +void fl_read (); +long from_oct (); +int do_stat (); +extern void print_header (); +int read_header (); +void saverec (); +void sigh (); +extern void skip_file (); +extern void skip_extended_headers (); +int wantbytes (); + +extern FILE *msg_file; + +int now_verifying = 0;		/* Are we verifying at the moment? */ + +int diff_fd;			/* Descriptor of file we're diffing */ + +char *diff_buf = 0;		/* Pointer to area for reading +					   file contents into */ + +char *diff_dir;			/* Directory contents for LF_DUMPDIR */ + +int different = 0; + +/*struct sp_array *sparsearray; +int 		sp_ar_size = 10;*/ +/* + * Initialize for a diff operation + */ +void +diff_init () +{ +  /*NOSTRICT*/ +  diff_buf = (char *) valloc ((unsigned) blocksize); +  if (!diff_buf) +    { +      msg ("could not allocate memory for diff buffer of %d bytes", +	   blocksize); +      exit (EX_ARGSBAD); +    } +} + +/* + * Diff a file against the archive. + */ +void +diff_archive () +{ +  register char *data; +  int check, namelen; +  int err; +  long offset; +  struct stat filestat; +  int compare_chunk (); +  int compare_dir (); +  int no_op (); +#ifndef __MSDOS__ +  dev_t dev; +  ino_t ino; +#endif +  char *get_dir_contents (); +  long from_oct (); + +  errno = EPIPE;		/* FIXME, remove perrors */ + +  saverec (&head);		/* Make sure it sticks around */ +  userec (head);		/* And go past it in the archive */ +  decode_header (head, &hstat, &head_standard, 1);	/* Snarf fields */ + +  /* Print the record from 'head' and 'hstat' */ +  if (f_verbose) +    { +      if (now_verifying) +	fprintf (msg_file, "Verify "); +      print_header (); +    } + +  switch (head->header.linkflag) +    { + +    default: +      msg ("Unknown file type '%c' for %s, diffed as normal file", +	   head->header.linkflag, current_file_name); +      /* FALL THRU */ + +    case LF_OLDNORMAL: +    case LF_NORMAL: +    case LF_SPARSE: +    case LF_CONTIG: +      /* +		 * Appears to be a file. +		 * See if it's really a directory. +		 */ +      namelen = strlen (current_file_name) - 1; +      if (current_file_name[namelen] == '/') +	goto really_dir; + + +      if (do_stat (&filestat)) +	{ +	  if (head->header.isextended) +	    skip_extended_headers (); +	  skip_file ((long) hstat.st_size); +	  different++; +	  goto quit; +	} + +      if (!S_ISREG (filestat.st_mode)) +	{ +	  fprintf (msg_file, "%s: not a regular file\n", +		   current_file_name); +	  skip_file ((long) hstat.st_size); +	  different++; +	  goto quit; +	} + +      filestat.st_mode &= 07777; +      if (filestat.st_mode != hstat.st_mode) +	sigh ("mode"); +      if (filestat.st_uid != hstat.st_uid) +	sigh ("uid"); +      if (filestat.st_gid != hstat.st_gid) +	sigh ("gid"); +      if (filestat.st_mtime != hstat.st_mtime) +	sigh ("mod time"); +      if (head->header.linkflag != LF_SPARSE && +	  filestat.st_size != hstat.st_size) +	{ +	  sigh ("size"); +	  skip_file ((long) hstat.st_size); +	  goto quit; +	} + +      diff_fd = open (current_file_name, O_NDELAY | O_RDONLY | O_BINARY); + +      if (diff_fd < 0 && !f_absolute_paths) +	{ +	  char tmpbuf[NAMSIZ + 2]; + +	  tmpbuf[0] = '/'; +	  strcpy (&tmpbuf[1], current_file_name); +	  diff_fd = open (tmpbuf, O_NDELAY | O_RDONLY); +	} +      if (diff_fd < 0) +	{ +	  msg_perror ("cannot open %s", current_file_name); +	  if (head->header.isextended) +	    skip_extended_headers (); +	  skip_file ((long) hstat.st_size); +	  different++; +	  goto quit; +	} +      /* +		 * Need to treat sparse files completely differently here. +		 */ +      if (head->header.linkflag == LF_SPARSE) +	diff_sparse_files (hstat.st_size); +      else +	wantbytes ((long) (hstat.st_size), compare_chunk); + +      check = close (diff_fd); +      if (check < 0) +	msg_perror ("Error while closing %s", current_file_name); + +    quit: +      break; + +#ifndef __MSDOS__ +    case LF_LINK: +      if (do_stat (&filestat)) +	break; +      dev = filestat.st_dev; +      ino = filestat.st_ino; +      err = stat (current_link_name, &filestat); +      if (err < 0) +	{ +	  if (errno == ENOENT) +	    { +	      fprintf (msg_file, "%s: does not exist\n", current_file_name); +	    } +	  else +	    { +	      msg_perror ("cannot stat file %s", current_file_name); +	    } +	  different++; +	  break; +	} +      if (filestat.st_dev != dev || filestat.st_ino != ino) +	{ +	  fprintf (msg_file, "%s not linked to %s\n", current_file_name, current_link_name); +	  break; +	} +      break; +#endif + +#ifdef S_ISLNK +    case LF_SYMLINK: +      { +	char linkbuf[NAMSIZ + 3]; +	check = readlink (current_file_name, linkbuf, +			  (sizeof linkbuf) - 1); + +	if (check < 0) +	  { +	    if (errno == ENOENT) +	      { +		fprintf (msg_file, +			 "%s: no such file or directory\n", +			 current_file_name); +	      } +	    else +	      { +		msg_perror ("cannot read link %s", current_file_name); +	      } +	    different++; +	    break; +	  } + +	linkbuf[check] = '\0';	/* Null-terminate it */ +	if (strncmp (current_link_name, linkbuf, check) != 0) +	  { +	    fprintf (msg_file, "%s: symlink differs\n", +		     current_link_name); +	    different++; +	  } +      } +      break; +#endif + +#ifdef S_IFCHR +    case LF_CHR: +      hstat.st_mode |= S_IFCHR; +      goto check_node; +#endif + +#ifdef S_IFBLK +      /* If local system doesn't support block devices, use default case */ +    case LF_BLK: +      hstat.st_mode |= S_IFBLK; +      goto check_node; +#endif + +#ifdef S_ISFIFO +      /* If local system doesn't support FIFOs, use default case */ +    case LF_FIFO: +#ifdef S_IFIFO +      hstat.st_mode |= S_IFIFO; +#endif +      hstat.st_rdev = 0;	/* FIXME, do we need this? */ +      goto check_node; +#endif + +    check_node: +      /* FIXME, deal with umask */ +      if (do_stat (&filestat)) +	break; +      if (hstat.st_rdev != filestat.st_rdev) +	{ +	  fprintf (msg_file, "%s: device numbers changed\n", current_file_name); +	  different++; +	  break; +	} +#ifdef S_IFMT +      if (hstat.st_mode != filestat.st_mode) +#else /* POSIX lossage */ +      if ((hstat.st_mode & 07777) != (filestat.st_mode & 07777)) +#endif +	{ +	  fprintf (msg_file, "%s: mode or device-type changed\n", current_file_name); +	  different++; +	  break; +	} +      break; + +    case LF_DUMPDIR: +      data = diff_dir = get_dir_contents (current_file_name, 0); +      if (data) +	{ +	  wantbytes ((long) (hstat.st_size), compare_dir); +	  free (data); +	} +      else +	wantbytes ((long) (hstat.st_size), no_op); +      /* FALL THROUGH */ + +    case LF_DIR: +      /* Check for trailing / */ +      namelen = strlen (current_file_name) - 1; +    really_dir: +      while (namelen && current_file_name[namelen] == '/') +	current_file_name[namelen--] = '\0';	/* Zap / */ + +      if (do_stat (&filestat)) +	break; +      if (!S_ISDIR (filestat.st_mode)) +	{ +	  fprintf (msg_file, "%s is no longer a directory\n", current_file_name); +	  different++; +	  break; +	} +      if ((filestat.st_mode & 07777) != (hstat.st_mode & 07777)) +	sigh ("mode"); +      break; + +    case LF_VOLHDR: +      break; + +    case LF_MULTIVOL: +      namelen = strlen (current_file_name) - 1; +      if (current_file_name[namelen] == '/') +	goto really_dir; + +      if (do_stat (&filestat)) +	break; + +      if (!S_ISREG (filestat.st_mode)) +	{ +	  fprintf (msg_file, "%s: not a regular file\n", +		   current_file_name); +	  skip_file ((long) hstat.st_size); +	  different++; +	  break; +	} + +      filestat.st_mode &= 07777; +      offset = from_oct (1 + 12, head->header.offset); +      if (filestat.st_size != hstat.st_size + offset) +	{ +	  sigh ("size"); +	  skip_file ((long) hstat.st_size); +	  different++; +	  break; +	} + +      diff_fd = open (current_file_name, O_NDELAY | O_RDONLY | O_BINARY); + +      if (diff_fd < 0) +	{ +	  msg_perror ("cannot open file %s", current_file_name); +	  skip_file ((long) hstat.st_size); +	  different++; +	  break; +	} +      err = lseek (diff_fd, offset, 0); +      if (err != offset) +	{ +	  msg_perror ("cannot seek to %ld in file %s", offset, current_file_name); +	  different++; +	  break; +	} + +      wantbytes ((long) (hstat.st_size), compare_chunk); + +      check = close (diff_fd); +      if (check < 0) +	{ +	  msg_perror ("Error while closing %s", current_file_name); +	} +      break; + +    } + +  /* We don't need to save it any longer. */ +  saverec ((union record **) 0);/* Unsave it */ +} + +int +compare_chunk (bytes, buffer) +     long bytes; +     char *buffer; +{ +  int err; + +  err = read (diff_fd, diff_buf, bytes); +  if (err != bytes) +    { +      if (err < 0) +	{ +	  msg_perror ("can't read %s", current_file_name); +	} +      else +	{ +	  fprintf (msg_file, "%s: could only read %d of %d bytes\n", current_file_name, err, bytes); +	} +      different++; +      return -1; +    } +  if (bcmp (buffer, diff_buf, bytes)) +    { +      fprintf (msg_file, "%s: data differs\n", current_file_name); +      different++; +      return -1; +    } +  return 0; +} + +int +compare_dir (bytes, buffer) +     long bytes; +     char *buffer; +{ +  if (bcmp (buffer, diff_dir, bytes)) +    { +      fprintf (msg_file, "%s: data differs\n", current_file_name); +      different++; +      return -1; +    } +  diff_dir += bytes; +  return 0; +} + +/* + * Sigh about something that differs. + */ +void +sigh (what) +     char *what; +{ + +  fprintf (msg_file, "%s: %s differs\n", +	   current_file_name, what); +} + +void +verify_volume () +{ +  int status; +#ifdef MTIOCTOP +  struct mtop t; +  int er; +#endif + +  if (!diff_buf) +    diff_init (); +#ifdef MTIOCTOP +  t.mt_op = MTBSF; +  t.mt_count = 1; +  if ((er = rmtioctl (archive, MTIOCTOP, &t)) < 0) +    { +      if (errno != EIO || (er = rmtioctl (archive, MTIOCTOP, &t)) < 0) +	{ +#endif +	  if (rmtlseek (archive, 0L, 0) != 0) +	    { +	      /* Lseek failed.  Try a different method */ +	      msg_perror ("Couldn't rewind archive file for verify"); +	      return; +	    } +#ifdef MTIOCTOP +	} +    } +#endif +  ar_reading = 1; +  now_verifying = 1; +  fl_read (); +  for (;;) +    { +      status = read_header (); +      if (status == 0) +	{ +	  unsigned n; + +	  n = 0; +	  do +	    { +	      n++; +	      status = read_header (); +	    } +	  while (status == 0); +	  msg ("VERIFY FAILURE: %d invalid header%s detected!", n, n == 1 ? "" : "s"); +	} +      if (status == 2 || status == EOF) +	break; +      diff_archive (); +    } +  ar_reading = 0; +  now_verifying = 0; + +} + +int +do_stat (statp) +     struct stat *statp; +{ +  int err; + +  err = f_follow_links ? stat (current_file_name, statp) : lstat (current_file_name, statp); +  if (err < 0) +    { +      if (errno == ENOENT) +	{ +	  fprintf (msg_file, "%s: does not exist\n", current_file_name); +	} +      else +	msg_perror ("can't stat file %s", current_file_name); +      /*		skip_file((long)hstat.st_size); +		different++;*/ +      return 1; +    } +  else +    return 0; +} + +/* + * JK + * Diff'ing a sparse file with its counterpart on the tar file is a + * bit of a different story than a normal file.  First, we must know + * what areas of the file to skip through, i.e., we need to contruct + * a sparsearray, which will hold all the information we need.  We must + * compare small amounts of data at a time as we find it. + */ + +void +diff_sparse_files (filesize) +     int filesize; + +{ +  int sparse_ind = 0; +  char *buf; +  int buf_size = RECORDSIZE; +  union record *datarec; +  int err; +  long numbytes; +  /*	int		amt_read = 0;*/ +  int size = filesize; + +  buf = (char *) ck_malloc (buf_size * sizeof (char)); + +  fill_in_sparse_array (); + + +  while (size > 0) +    { +      datarec = findrec (); +      if (!sparsearray[sparse_ind].numbytes) +	break; + +      /* +		 * 'numbytes' is nicer to write than +		 * 'sparsearray[sparse_ind].numbytes' all the time ... +		 */ +      numbytes = sparsearray[sparse_ind].numbytes; + +      lseek (diff_fd, sparsearray[sparse_ind].offset, 0); +      /* +		 * take care to not run out of room in our buffer +		 */ +      while (buf_size < numbytes) +	{ +	  buf = (char *) ck_realloc (buf, buf_size * 2 * sizeof (char)); +	  buf_size *= 2; +	} +      while (numbytes > RECORDSIZE) +	{ +	  if ((err = read (diff_fd, buf, RECORDSIZE)) != RECORDSIZE) +	    { +	      if (err < 0) +		msg_perror ("can't read %s", current_file_name); +	      else +		fprintf (msg_file, "%s: could only read %d of %d bytes\n", +			 current_file_name, err, numbytes); +	      break; +	    } +	  if (bcmp (buf, datarec->charptr, RECORDSIZE)) +	    { +	      different++; +	      break; +	    } +	  numbytes -= err; +	  size -= err; +	  userec (datarec); +	  datarec = findrec (); +	} +      if ((err = read (diff_fd, buf, numbytes)) != numbytes) +	{ +	  if (err < 0) +	    msg_perror ("can't read %s", current_file_name); +	  else +	    fprintf (msg_file, "%s: could only read %d of %d bytes\n", +		     current_file_name, err, numbytes); +	  break; +	} + +      if (bcmp (buf, datarec->charptr, numbytes)) +	{ +	  different++; +	  break; +	} +      /*		amt_read += numbytes; +		if (amt_read >= RECORDSIZE) { +			amt_read = 0; +			userec(datarec); +			datarec = findrec(); +		}*/ +      userec (datarec); +      sparse_ind++; +      size -= numbytes; +    } +  /* +	 * if the number of bytes read isn't the +	 * number of bytes supposedly in the file, +	 * they're different +	 */ +  /*	if (amt_read != filesize) +		different++;*/ +  userec (datarec); +  free (sparsearray); +  if (different) +    fprintf (msg_file, "%s: data differs\n", current_file_name); + +} + +/* + * JK + * This routine should be used more often than it is ... look into + * that.  Anyhow, what it does is translate the sparse information + * on the header, and in any subsequent extended headers, into an + * array of structures with true numbers, as opposed to character + * strings.  It simply makes our life much easier, doing so many + * comparisong and such. + */ +void +fill_in_sparse_array () +{ +  int ind; + +  /* +	 * allocate space for our scratch space; it's initially +	 * 10 elements long, but can change in this routine if +	 * necessary +	 */ +  sp_array_size = 10; +  sparsearray = (struct sp_array *) ck_malloc (sp_array_size * sizeof (struct sp_array)); + +  /* +	 * there are at most five of these structures in the header +	 * itself; read these in first +	 */ +  for (ind = 0; ind < SPARSE_IN_HDR; ind++) +    { +      if (!head->header.sp[ind].numbytes) +	break; +      sparsearray[ind].offset = +	from_oct (1 + 12, head->header.sp[ind].offset); +      sparsearray[ind].numbytes = +	from_oct (1 + 12, head->header.sp[ind].numbytes); +    } +  /* +	 * if the header's extended, we gotta read in exhdr's till +	 * we're done +	 */ +  if (head->header.isextended) +    { +      /* how far into the sparsearray we are 'so far' */ +      static int so_far_ind = SPARSE_IN_HDR; +      union record *exhdr; + +      for (;;) +	{ +	  exhdr = findrec (); +	  for (ind = 0; ind < SPARSE_EXT_HDR; ind++) +	    { +	      if (ind + so_far_ind > sp_array_size - 1) +		{ +		  /* + 				 * we just ran out of room in our +				 *  scratch area - realloc it + 				 */ +		  sparsearray = (struct sp_array *) +		    ck_realloc (sparsearray, +			     sp_array_size * 2 * sizeof (struct sp_array)); +		  sp_array_size *= 2; +		} +	      /* +			 * convert the character strings into longs +			 */ +	      sparsearray[ind + so_far_ind].offset = +		from_oct (1 + 12, exhdr->ext_hdr.sp[ind].offset); +	      sparsearray[ind + so_far_ind].numbytes = +		from_oct (1 + 12, exhdr->ext_hdr.sp[ind].numbytes); +	    } +	  /* +		 * if this is the last extended header for this +		 * file, we can stop +		 */ +	  if (!exhdr->ext_hdr.isextended) +	    break; +	  else +	    { +	      so_far_ind += SPARSE_EXT_HDR; +	      userec (exhdr); +	    } +	} +      /* be sure to skip past the last one  */ +      userec (exhdr); +    } +} | 
