[comp.os.minix] Reposting of diff.c

ast@botter.UUCP (05/20/87)

Based on some recent postings and some mail to me, I have the impression that
a lot of people did not see Erik Baalbergen's posting of diff.c a while back.
Perhaps there was a foul-up in the news delivery.  Here it is again.

Andy Tanenbaum

----------------------------------------- cut here ----------------------
/* diff(1)  --  author Erik Baalbergen */

/* Straight forward implementation of diff(1); no options available.
   It tends to give more output than other diffs but it's faster.
*/
#include <stdio.h>

#define LINELEN 256
#define stop(n)	exit(n)

/* the main program */
char *prog;
int diffs = 0;

main(argc, argv)
	char **argv;
{
	FILE *fp1 = NULL, *fp2 = NULL;

	prog = *argv++;
	if (argc != 3) {
		fprintf(stderr, "use: %s file1 file2\n", prog);
		stop(2);
	}
	if (strcmp(argv[0], "-") == 0)
		fp1 = stdin;
	else
	if (strcmp(argv[1], "-") == 0)
		fp2 = stdin;
	if (fp1 == NULL && (fp1 = fopen(argv[0], "r")) == NULL)
		open_failed(argv[0]);
	if (fp2 == NULL && (fp2 = fopen(argv[1], "r")) == NULL)
		open_failed(argv[1]);
	diff(fp1, fp2);
	stop(diffs > 0);
}

open_failed(s)
	char *s;
{
	fprintf(stderr, "%s: can't read %s\n", prog, s);
	stop(2);
}

/* the line module */
char *malloc();
char *fgets();

struct line {
	struct line *l_next;
	char l_text[LINELEN];
};

struct line *freelist = 0;

struct line *
new_line()
{
	register struct line *l;

	if (l = freelist) {
		freelist = freelist->l_next;
		return l;
	}
	if ((l = (struct line *)malloc(sizeof(struct line))) == 0) {
		fprintf(stderr, "out of memory\n");
		stop(2);
	}
	return l;
}

free_line(l)
	register struct line *l;
{
	l->l_next = freelist;
	freelist = l;
}

equal_line(l1, l2)
	struct line *l1, *l2;
{
	return strcmp(l1->l_text, l2->l_text) == 0;
}

struct line *
read_line(fp)
	FILE *fp;
{
	register struct line *l = new_line();

	if (fgets(l->l_text, LINELEN, fp) == NULL) {
		free_line(l);
		return 0;
	}
	l->l_next = 0;
	return l;
}

/* file window handler */
struct f {
	struct line *f_bwin, *f_ewin;
	struct line *f_aside;
	int f_linecnt;	/* line number in file of last advanced line */
	FILE *f_fp;
};

advance(f)
	register struct f *f;
{
	register struct line *l;
	
	if (l = f->f_bwin) {
		if (f->f_ewin == l)
			f->f_bwin = f->f_ewin = 0;
		else
			f->f_bwin = l->l_next;
		free_line(l);
		(f->f_linecnt)++;
	}
}

aside(f, l)
	struct f *f;
	struct line *l;
{
	register struct line *ll;

	if (ll = l->l_next) {
		while (ll->l_next)
			ll = ll->l_next;
		ll->l_next = f->f_aside;
		f->f_aside = l->l_next;
		l->l_next = 0;
		f->f_ewin = l;
	}
}

struct line *
next(f)
	register struct f *f;
{
	register struct line *l;

	if (l = f->f_aside) {
		f->f_aside = l->l_next;
		l->l_next = 0;
	}
	else
		l = read_line(f->f_fp);
	if (l) {
		if (f->f_bwin == 0)
			f->f_bwin = f->f_ewin = l;
		else {
			f->f_ewin->l_next = l;
			f->f_ewin = l;
		}
	}
	return l;
}

init_f(f, fp)
	register struct f *f;
	FILE *fp;
{
	f->f_bwin = f->f_ewin =  f->f_aside = 0;
	f->f_linecnt = 0;
	f->f_fp = fp;
}

update(f, s)
	register struct f *f;
	char *s;
{
	while (f->f_bwin && f->f_bwin != f->f_ewin) {
		printf("%s%s", s, f->f_bwin->l_text);
		advance(f);
	}
}
	
/* diff procedure */
diff(fp1, fp2)
	FILE *fp1, *fp2;
{
	struct f f1, f2;
	struct line *l1, *s1, *l2, *s2;
	register struct line *ll;

	init_f(&f1, fp1);
	init_f(&f2, fp2);

	l1 = next(&f1);
	l2 = next(&f2);
	while (l1 && l2) {
		if (equal_line(l1, l2)) {
equal:
			advance(&f1);
			advance(&f2);
			l1 = next(&f1);
			l2 = next(&f2);
			continue;
		}
		s1 = l1;
		s2 = l2;
		/* start searching */
search:
		if ((l2 = next(&f2)) == 0)
			continue;
		ll = s1;
		do {
			if (equal_line(ll, l2)) {
				aside(&f1, ll);
				differ(&f1, &f2);
				goto equal;
			}
		} while (ll = ll->l_next);
		if ((l1 = next(&f1)) == 0)
			continue;
		ll = s2;
		do {
			if (equal_line(ll, l1)) {
				aside(&f2, ll);
				differ(&f1, &f2);
				goto equal;
			}
		} while (ll = ll->l_next);
		goto search;
	}
	/* arrived here: one of the files reached EOF */
	if (l1) /* eof on 2 */
		while (next(&f1)) {}
	if (l2)
		while (next(&f2)) {}
	f1.f_ewin = 0;
	f2.f_ewin = 0;
	differ(&f1, &f2);
}

differ(f1, f2)
	register struct f *f1, *f2;
{
	int cnt1 = f1->f_linecnt, len1 = wlen(f1), cnt2 = f2->f_linecnt,
		len2 = wlen(f2);

	if (len1 == 0) {
		if (len2 == 0)
			return;
		if (len2 == 1)
			printf("%da%d\n", cnt1, cnt2 + 1);
		else
			printf("%da%d,%d\n", cnt1, cnt2 + 1, cnt2 + len2);
	}
	else
	if (len2 == 0) {
		if (len1 == 1)
			printf("%dd%d\n", cnt1 + 1, cnt2);
		else
			printf("%d,%dd%d\n", cnt1 + 1, cnt1 + len1, cnt2);
	}
	else {
		if (len1 == 1)
			printf("%dc", cnt1 + 1);
		else
			printf("%d,%dc", cnt1 + 1, cnt1 + len1);
		if (len2 == 1)
			printf("%d\n", cnt2 + 1);
		else
			printf("%d,%d\n", cnt2 + 1, cnt2 + len2);
	}
	if (len1)
		update(f1, "< ");
	if (len1 && len2)
		printf("---\n");
	if (len2)
		update(f2, "> ");
	diffs++;
}

wlen(f)
	struct f *f;
{
	register cnt = 0;
	register struct line *l = f->f_bwin, *e = f->f_ewin;

	while (l && l != e) {
		cnt++;
		l = l->l_next;
	}
	return cnt;
}

erikb@cs.vu.nl (Erik Baalbergen) (05/21/87)

Please ignore my previous version of diff, which has been posted to this news
group. It contained a few bugs which are fixed in the following one.
Because there is still no 'patch' program widely available, I post the full
source.

Erik Baalbergen

--8<--8<--8<--8<--8<--8<--8<--8<--8<--8<--8<--8<--8<--8<--8<--8<--8<--8<--8<--
/* diff  --  author Erik Baalbergen */

/* Poor man's implementation of diff(1)
 - no options available
 - may give more output than other diffs, due to the straight-forward algorithm
 - runs out of memory if the differing chunks become too large
 - input line length should not exceed LINELEN; longer lines are truncated,
   while only the first LINELEN characters are compared
 
 Please report bugs and suggestions to erikb@cs.vu.nl
*/
#include <stdio.h>

#define LINELEN 128

char *prog;
int diffs = 0;

main(argc, argv)
	char **argv;
{
	FILE *fp1 = NULL, *fp2 = NULL;

	prog = *argv++;
	if (argc != 3)
		fatal("use: %s file1 file2", prog);
	if (strcmp(argv[0], "-") == 0)
		fp1 = stdin;
	else
	if (strcmp(argv[1], "-") == 0)
		fp2 = stdin;
	if (fp1 == NULL && (fp1 = fopen(argv[0], "r")) == NULL)
		fatal("can't read %s", argv[0]);
	if (fp2 == NULL && (fp2 = fopen(argv[1], "r")) == NULL)
		fatal("can't read %s", argv[1]);
	diff(fp1, fp2);
	exit(diffs > 0);
}

fatal(fmt, s)
	char *fmt, *s;
{
	fprintf(stderr, "%s: ", prog);
	fprintf(stderr, fmt, s);
	fprintf(stderr, "\n");
	exit(2);
}

/* the line module */
char *malloc();
char *fgets();

struct line {
	struct line *l_next;
	char l_text[LINELEN + 2];
};

struct line *freelist = 0;

struct line *
new_line()
{
	register struct line *l;

	if (l = freelist)
		freelist = freelist->l_next;
	else
	if ((l = (struct line *)malloc(sizeof(struct line))) == 0)
		fatal("out of memory");
	return l;
}

free_line(l)
	register struct line *l;
{
	l->l_next = freelist;
	freelist = l;
}

#define equal_line(l1, l2) (strcmp((l1)->l_text, (l2)->l_text) == 0)

struct line *
read_line(fp)
	FILE *fp;
{
	register struct line *l = new_line();
	register char *p;
	register int c;

	(p = &(l->l_text[LINELEN]))[1] = '\377';
	if (fgets(l->l_text, LINELEN + 2, fp) == NULL) {
		free_line(l);
		return 0;
	}
	if (p[1] != '\377' && *p != '\n') {
		while ((c = fgetc(fp)) != '\n' && c != EOF) {}
		*p++ = '\n';
		*p = '\0';
	}
	l->l_next = 0;
	return l;
}

/* file window handler */
struct f {
	struct line *f_bwin, *f_ewin;
	struct line *f_aside;
	int f_linecnt;	/* line number in file of last advanced line */
	FILE *f_fp;
};

advance(f)
	register struct f *f;
{
	register struct line *l;
	
	if (l = f->f_bwin) {
		if (f->f_ewin == l)
			f->f_bwin = f->f_ewin = 0;
		else
			f->f_bwin = l->l_next;
		free_line(l);
		(f->f_linecnt)++;
	}
}

aside(f, l)
	struct f *f;
	struct line *l;
{
	register struct line *ll;

	if (ll = l->l_next) {
		while (ll->l_next)
			ll = ll->l_next;
		ll->l_next = f->f_aside;
		f->f_aside = l->l_next;
		l->l_next = 0;
		f->f_ewin = l;
	}
}

struct line *
next(f)
	register struct f *f;
{
	register struct line *l;

	if (l = f->f_aside) {
		f->f_aside = l->l_next;
		l->l_next = 0;
	}
	else
		l = read_line(f->f_fp);
	if (l) {
		if (f->f_bwin == 0)
			f->f_bwin = f->f_ewin = l;
		else {
			f->f_ewin->l_next = l;
			f->f_ewin = l;
		}
	}
	return l;
}

init_f(f, fp)
	register struct f *f;
	FILE *fp;
{
	f->f_bwin = f->f_ewin =  f->f_aside = 0;
	f->f_linecnt = 0;
	f->f_fp = fp;
}

update(f, s)
	register struct f *f;
	char *s;
{
	register char c;

	while (f->f_bwin && f->f_bwin != f->f_ewin) {
		printf("%s%s", s, f->f_bwin->l_text);
		advance(f);
	}
}
	
/* diff procedure */
diff(fp1, fp2)
	FILE *fp1, *fp2;
{
	struct f f1, f2;
	struct line *l1, *s1, *l2, *s2;
	register struct line *ll;

	init_f(&f1, fp1);
	init_f(&f2, fp2);
	l1 = next(&f1);
	l2 = next(&f2);
	while (l1 && l2) {
		if (equal_line(l1, l2)) {
equal:
			advance(&f1);
			advance(&f2);
			l1 = next(&f1);
			l2 = next(&f2);
			continue;
		}
		s1 = l1;
		s2 = l2;
		/* start searching */
search:
		if ((l2 = next(&f2)) == 0)
			continue;
		ll = s1;
		do {
			if (equal_line(ll, l2)) {
				aside(&f1, ll);
				differ(&f1, &f2);
				goto equal;
			}
		} while (ll = ll->l_next);
		if ((l1 = next(&f1)) == 0)
			continue;
		ll = s2;
		do {
			if (equal_line(ll, l1)) {
				aside(&f2, ll);
				differ(&f1, &f2);
				goto equal;
			}
		} while (ll = ll->l_next);
		goto search;
	}
	/* one of the files reached EOF */
	if (l1) /* eof on 2 */
		while (next(&f1)) {}
	if (l2)
		while (next(&f2)) {}
	f1.f_ewin = 0;
	f2.f_ewin = 0;
	differ(&f1, &f2);
}

differ(f1, f2)
	register struct f *f1, *f2;
{
	int cnt1 = f1->f_linecnt, len1 = wlen(f1), cnt2 = f2->f_linecnt,
		len2 = wlen(f2);

	if ((len1 = wlen(f1)) || (len2 = wlen(f2))) {
		if (len1 == 0) {
			printf("%da", cnt1);
			range(cnt2 + 1, cnt2 + len2);
		}
		else
		if (len2 == 0) {
			range(cnt1 + 1, cnt1 + len1);
			printf("d%d", cnt2);
		}
		else {
			range(cnt1 + 1, cnt1 + len1);
			putchar('c');
			range(cnt2 + 1, cnt2 + len2);
		}
		putchar('\n');
		if (len1)
			update(f1, "< ");
		if (len1 && len2)
			printf("---\n");
		if (len2)
			update(f2, "> ");
		diffs++;
	}
}

wlen(f)
	struct f *f;
{
	register cnt = 0;
	register struct line *l = f->f_bwin, *e = f->f_ewin;

	while (l && l != e) {
		cnt++;
		l = l->l_next;
	}
	return cnt;
}

range(a, b)
{
	printf(((a == b) ? "%d" : "%d,%d"), a, b);
}