328 lines
		
	
	
		
			8.1 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
			
		
		
	
	
			328 lines
		
	
	
		
			8.1 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
/* treecmp - compare two trees		Author: Andy Tanenbaum */
 | 
						|
 | 
						|
/* This program recursively compares two trees and reports on differences.
 | 
						|
 * It can be used, for example, when a project consists of a large number
 | 
						|
 * of files and directories.  When a new release (i.e., a new tree) has been
 | 
						|
 * prepared, the old and new tree can be compared to give a list of what has
 | 
						|
 * changed.  The algorithm used is that the second tree is recursively
 | 
						|
 * descended and for each file or directory found, the corresponding one in
 | 
						|
 * the other tree checked.  The two arguments are not completely symmetric
 | 
						|
 * because the second tree is descended, not the first one, but reversing
 | 
						|
 * the arguments will still detect all the differences, only they will be
 | 
						|
 * printed in a different order.  The program needs lots of stack space
 | 
						|
 * because routines with local arrays are called recursively. The call is
 | 
						|
 *    treecmp [-cv] old_dir new_dir
 | 
						|
 * The -v flag (verbose) prints the directory names as they are processed.
 | 
						|
 * The -c flag (changes) just prints the names of changed and new files.
 | 
						|
 */
 | 
						|
 | 
						|
#include <sys/types.h>
 | 
						|
#include <sys/stat.h>
 | 
						|
#include <fcntl.h>
 | 
						|
#include <string.h>
 | 
						|
#include <unistd.h>
 | 
						|
#include <stdlib.h>
 | 
						|
#include <stdio.h>
 | 
						|
 | 
						|
#define BUFSIZE 4096		/* size of file buffers */
 | 
						|
#define MAXPATH 128		/* longest acceptable path */
 | 
						|
#define DIRENTLEN 14		/* number of characters in a file name */
 | 
						|
 | 
						|
struct dirstruct {		/* layout of a directory entry */
 | 
						|
  ino_t inum;
 | 
						|
  char fname[DIRENTLEN];
 | 
						|
};
 | 
						|
 | 
						|
struct stat stat1, stat2;	/* stat buffers */
 | 
						|
 | 
						|
char buf1[BUFSIZE];		/* used for comparing bufs */
 | 
						|
char buf2[BUFSIZE];		/* used for comparing bufs */
 | 
						|
 | 
						|
int changes;			/* set on -c flag */
 | 
						|
int verbose;			/* set on -v flag */
 | 
						|
 | 
						|
_PROTOTYPE(int main, (int argc, char **argv));
 | 
						|
_PROTOTYPE(void compare, (char *old, char *new));
 | 
						|
_PROTOTYPE(void regular, (char *old, char *new));
 | 
						|
_PROTOTYPE(void directory, (char *old, char *new));
 | 
						|
_PROTOTYPE(void check, (char *s, struct dirstruct *dp1, int ent1, char *new));
 | 
						|
_PROTOTYPE(void usage, (void));
 | 
						|
 | 
						|
int main(argc, argv)
 | 
						|
int argc;
 | 
						|
char *argv[];
 | 
						|
{
 | 
						|
  char *p;
 | 
						|
 | 
						|
  if (argc < 3 || argc > 4) usage();
 | 
						|
  p = argv[1];
 | 
						|
  if (argc == 4) {
 | 
						|
	if (*p != '-') usage();
 | 
						|
	p++;
 | 
						|
	if (*p == '\0') usage();
 | 
						|
	while (*p) {
 | 
						|
		if (*p == 'c') changes++;
 | 
						|
		if (*p == 'v') verbose++;
 | 
						|
		if (*p != 'c' && *p != 'v') usage();
 | 
						|
		p++;
 | 
						|
	}
 | 
						|
  }
 | 
						|
  if (argc == 3)
 | 
						|
	compare(argv[1], argv[2]);
 | 
						|
  else
 | 
						|
	compare(argv[2], argv[3]);
 | 
						|
 | 
						|
  return(0);
 | 
						|
}
 | 
						|
 | 
						|
void compare(old, new)
 | 
						|
char *old, *new;
 | 
						|
{
 | 
						|
/* This is the main comparision routine.  It gets two path names as arguments
 | 
						|
 * and stats them both.  Depending on the results, it calls other routines
 | 
						|
 * to compare directories or files.
 | 
						|
 */
 | 
						|
 | 
						|
  int type1, type2;
 | 
						|
 | 
						|
  if (stat(new, &stat1) < 0) {
 | 
						|
	/* The new file does not exist. */
 | 
						|
	if (changes == 0)
 | 
						|
		fprintf(stderr, "Cannot stat: %s\n", new);
 | 
						|
	else
 | 
						|
		printf("%s\n", new);
 | 
						|
	return;
 | 
						|
  }
 | 
						|
  if (stat(old, &stat2) < 0) {
 | 
						|
	/* The old file does not exist. */
 | 
						|
	if (changes == 0) 
 | 
						|
		fprintf(stderr, "Missing file: %s\n", old);
 | 
						|
	else
 | 
						|
		printf("%s\n", new);
 | 
						|
	return;
 | 
						|
  }
 | 
						|
 | 
						|
  /* Examine the types of the files. */
 | 
						|
  type1 = stat1.st_mode & S_IFMT;
 | 
						|
  type2 = stat2.st_mode & S_IFMT;
 | 
						|
  if (type1 != type2) {
 | 
						|
	fprintf(stderr, "Type diff: %s and %s\n", new, old);
 | 
						|
	return;
 | 
						|
  }
 | 
						|
 | 
						|
  /* The types are the same. */
 | 
						|
  switch (type1) {
 | 
						|
      case S_IFREG:	regular(old, new);	break;
 | 
						|
      case S_IFDIR:	directory(old, new);	break;
 | 
						|
      case S_IFCHR:	break;
 | 
						|
      case S_IFBLK:	break;
 | 
						|
      default:		fprintf(stderr, "Unknown file type %o\n", type1);
 | 
						|
  }
 | 
						|
  return;
 | 
						|
}
 | 
						|
 | 
						|
void regular(old, new)
 | 
						|
char *old, *new;
 | 
						|
{
 | 
						|
/* Compare to regular files.  If they are different, complain. */
 | 
						|
 | 
						|
  int fd1, fd2, n1, n2;
 | 
						|
  unsigned bytes;
 | 
						|
  long count;
 | 
						|
 | 
						|
  if (stat1.st_size != stat2.st_size) {
 | 
						|
	if (changes == 0)
 | 
						|
		printf("Size diff: %s and %s\n", new, old);
 | 
						|
	else
 | 
						|
		printf("%s\n", new);
 | 
						|
	return;
 | 
						|
  }
 | 
						|
 | 
						|
  /* The sizes are the same.  We actually have to read the files now. */
 | 
						|
  fd1 = open(new, O_RDONLY);
 | 
						|
  if (fd1 < 0) {
 | 
						|
	fprintf(stderr, "Cannot open %s for reading\n", new);
 | 
						|
	return;
 | 
						|
  }
 | 
						|
  fd2 = open(old, O_RDONLY);
 | 
						|
  if (fd2 < 0) {
 | 
						|
	fprintf(stderr, "Cannot open %s for reading\n", old);
 | 
						|
	return;
 | 
						|
  }
 | 
						|
  count = stat1.st_size;
 | 
						|
  while (count > 0L) {
 | 
						|
	bytes = (unsigned) (count > BUFSIZE ? BUFSIZE : count);	/* rd count */
 | 
						|
	n1 = read(fd1, buf1, bytes);
 | 
						|
	n2 = read(fd2, buf2, bytes);
 | 
						|
	if (n1 != n2) {
 | 
						|
		if (changes == 0)
 | 
						|
			printf("Length diff: %s and %s\n", new, old);
 | 
						|
		else
 | 
						|
			printf("%s\n", new);
 | 
						|
		close(fd1);
 | 
						|
		close(fd2);
 | 
						|
		return;
 | 
						|
	}
 | 
						|
 | 
						|
	/* Compare the buffers. */
 | 
						|
	if (memcmp((void *) buf1, (void *) buf2, (size_t) n1) != 0) {
 | 
						|
		if (changes == 0)
 | 
						|
			printf("File diff: %s and %s\n", new, old);
 | 
						|
		else
 | 
						|
			printf("%s\n", new);
 | 
						|
		close(fd1);
 | 
						|
		close(fd2);
 | 
						|
		return;
 | 
						|
	}
 | 
						|
	count -= n1;
 | 
						|
  }
 | 
						|
  close(fd1);
 | 
						|
  close(fd2);
 | 
						|
}
 | 
						|
 | 
						|
void directory(old, new)
 | 
						|
char *old, *new;
 | 
						|
{
 | 
						|
/* Recursively compare two directories by reading them and comparing their
 | 
						|
 * contents.  The order of the entries need not be the same.
 | 
						|
 */
 | 
						|
 | 
						|
  int fd1, fd2, n1, n2, ent1, ent2, i, used1 = 0, used2 = 0;
 | 
						|
  char *dir1buf, *dir2buf;
 | 
						|
  char name1buf[MAXPATH], name2buf[MAXPATH];
 | 
						|
  struct dirstruct *dp1, *dp2;
 | 
						|
  unsigned dir1bytes, dir2bytes;
 | 
						|
 | 
						|
  /* Allocate space to read in the directories */
 | 
						|
  dir1bytes = (unsigned) stat1.st_size;
 | 
						|
  dir1buf = (char *)malloc((size_t)dir1bytes);
 | 
						|
  if (dir1buf == 0) {
 | 
						|
	fprintf(stderr, "Cannot process directory %s: out of memory\n", new);
 | 
						|
	return;
 | 
						|
  }
 | 
						|
  dir2bytes = (unsigned) stat2.st_size;
 | 
						|
  dir2buf = (char *)malloc((size_t)dir2bytes);
 | 
						|
  if (dir2buf == 0) {
 | 
						|
	fprintf(stderr, "Cannot process directory %s: out of memory\n", old);
 | 
						|
	free(dir1buf);
 | 
						|
	return;
 | 
						|
  }
 | 
						|
 | 
						|
  /* Read in the directories. */
 | 
						|
  fd1 = open(new, O_RDONLY);
 | 
						|
  if (fd1 > 0) n1 = read(fd1, dir1buf, dir1bytes);
 | 
						|
  if (fd1 < 0 || n1 != dir1bytes) {
 | 
						|
	fprintf(stderr, "Cannot read directory %s\n", new);
 | 
						|
	free(dir1buf);
 | 
						|
	free(dir2buf);
 | 
						|
	if (fd1 > 0) close(fd1);
 | 
						|
	return;
 | 
						|
  }
 | 
						|
  close(fd1);
 | 
						|
 | 
						|
  fd2 = open(old, O_RDONLY);
 | 
						|
  if (fd2 > 0) n2 = read(fd2, dir2buf, dir2bytes);
 | 
						|
  if (fd2 < 0 || n2 != dir2bytes) {
 | 
						|
	fprintf(stderr, "Cannot read directory %s\n", old);
 | 
						|
	free(dir1buf);
 | 
						|
	free(dir2buf);
 | 
						|
	close(fd1);
 | 
						|
	if (fd2 > 0) close(fd2);
 | 
						|
	return;
 | 
						|
  }
 | 
						|
  close(fd2);
 | 
						|
 | 
						|
  /* Linearly search directories */
 | 
						|
  ent1 = dir1bytes / sizeof(struct dirstruct);
 | 
						|
  dp1 = (struct dirstruct *) dir1buf;
 | 
						|
  for (i = 0; i < ent1; i++) {
 | 
						|
	if (dp1->inum != 0) used1++;
 | 
						|
	dp1++;
 | 
						|
  }
 | 
						|
 | 
						|
  ent2 = dir2bytes / sizeof(struct dirstruct);
 | 
						|
  dp2 = (struct dirstruct *) dir2buf;
 | 
						|
  for (i = 0; i < ent2; i++) {
 | 
						|
	if (dp2->inum != 0) used2++;
 | 
						|
	dp2++;
 | 
						|
  }
 | 
						|
 | 
						|
  if (verbose) printf("Directory %s: %d entries\n", new, used1);
 | 
						|
 | 
						|
  /* Check to see if any entries in dir2 are missing from dir1. */
 | 
						|
  dp1 = (struct dirstruct *) dir1buf;
 | 
						|
  dp2 = (struct dirstruct *) dir2buf;
 | 
						|
  for (i = 0; i < ent2; i++) {
 | 
						|
	if (dp2->inum == 0 || strcmp(dp2->fname, ".") == 0 ||
 | 
						|
					    strcmp(dp2->fname, "..") == 0) {
 | 
						|
		dp2++;
 | 
						|
		continue;
 | 
						|
	}
 | 
						|
	check(dp2->fname, dp1, ent1, new);
 | 
						|
	dp2++;
 | 
						|
  }
 | 
						|
 | 
						|
  /* Recursively process all the entries in dir1. */
 | 
						|
  dp1 = (struct dirstruct *) dir1buf;
 | 
						|
  for (i = 0; i < ent1; i++) {
 | 
						|
	if (dp1->inum == 0 || strcmp(dp1->fname, ".") == 0 ||
 | 
						|
	    strcmp(dp1->fname, "..") == 0) {
 | 
						|
		dp1++;
 | 
						|
		continue;
 | 
						|
	}
 | 
						|
	if (strlen(new) + DIRENTLEN >= MAXPATH) {
 | 
						|
		fprintf(stderr, "Path too long: %s\n", new);
 | 
						|
		free(dir1buf);
 | 
						|
		free(dir2buf);
 | 
						|
		return;
 | 
						|
	}
 | 
						|
	if (strlen(old) + DIRENTLEN >= MAXPATH) {
 | 
						|
		fprintf(stderr, "Path too long: %s\n", old);
 | 
						|
		free(dir1buf);
 | 
						|
		free(dir2buf);
 | 
						|
		return;
 | 
						|
	}
 | 
						|
	strcpy(name1buf, old);
 | 
						|
	strcat(name1buf, "/");
 | 
						|
	strncat(name1buf, dp1->fname, (size_t)DIRENTLEN);
 | 
						|
	strcpy(name2buf, new);
 | 
						|
	strcat(name2buf, "/");
 | 
						|
	strncat(name2buf, dp1->fname, (size_t)DIRENTLEN);
 | 
						|
 | 
						|
	/* Here is the recursive call to process an entry. */
 | 
						|
	compare(name1buf, name2buf);	/* recursive call */
 | 
						|
	dp1++;
 | 
						|
  }
 | 
						|
 | 
						|
  free(dir1buf);
 | 
						|
  free(dir2buf);
 | 
						|
}
 | 
						|
 | 
						|
void check(s, dp1, ent1, new)
 | 
						|
char *s;
 | 
						|
struct dirstruct *dp1;
 | 
						|
int ent1;
 | 
						|
char *new;
 | 
						|
{
 | 
						|
/* See if the file name 's' is present in the directory 'dirbuf'. */
 | 
						|
  int i;
 | 
						|
  char file[DIRENTLEN+1];
 | 
						|
 | 
						|
  for (i = 0; i < ent1; i++) {
 | 
						|
	if (strncmp(dp1->fname, s, (size_t)DIRENTLEN) == 0) return;
 | 
						|
	dp1++;
 | 
						|
  }
 | 
						|
  if (changes == 0) {
 | 
						|
	strncpy(file, s, DIRENTLEN);
 | 
						|
	file[DIRENTLEN] = '\0';
 | 
						|
	printf("Missing file: %s/%s\n", new, file);
 | 
						|
  }
 | 
						|
	
 | 
						|
}
 | 
						|
 | 
						|
void usage()
 | 
						|
{
 | 
						|
  printf("Usage: treecmp [-cv] old_dir new_dir\n");
 | 
						|
  exit(1);
 | 
						|
}
 |