#include <u.h> #include <libc.h> #include <bio.h> #include <ctype.h> #include "diff.h" struct line { int serial; int value; }; extern struct line *file[2]; extern int len[2]; extern long *ixold, *ixnew; extern int *J; static Biobuf *input[2]; static char *file1, *file2; static int firstchange; #define MAXLINELEN 4096 #define MIN(x, y) ((x) < (y) ? (x): (y)) static int readline(Biobuf *bp, char *buf) { int c; char *p, *e; p = buf; e = p + MAXLINELEN-1; do { c = Bgetc(bp); if (c < 0) { if (p == buf) return -1; break; } if (c == '\n') break; *p++ = c; } while (p < e); *p = 0; if (c != '\n' && c >= 0) { do c = Bgetc(bp); while (c >= 0 && c != '\n'); } return p - buf; } #define HALFLONG 16 #define low(x) (x&((1L<<HALFLONG)-1)) #define high(x) (x>>HALFLONG) /* * hashing has the effect of * arranging line in 7-bit bytes and then * summing 1-s complement in 16-bit hunks */ static int readhash(Biobuf *bp, char *buf) { long sum; unsigned shift; char *p; int len, space; sum = 1; shift = 0; if ((len = readline(bp, buf)) == -1) return 0; p = buf; switch(bflag) /* various types of white space handling */ { case 0: while (len--) { sum += (long)*p++ << (shift &= (HALFLONG-1)); shift += 7; } break; case 1: /* * coalesce multiple white-space */ for (space = 0; len--; p++) { if (isspace((uchar)*p)) { space++; continue; } if (space) { shift += 7; space = 0; } sum += (long)*p << (shift &= (HALFLONG-1)); shift += 7; } break; default: /* * strip all white-space */ while (len--) { if (isspace((uchar)*p)) { p++; continue; } sum += (long)*p++ << (shift &= (HALFLONG-1)); shift += 7; } break; } sum = low(sum) + high(sum); return ((short)low(sum) + (short)high(sum)); } Biobuf * prepare(int i, char *arg) { struct line *p; int j, h; Biobuf *bp; char *cp, buf[MAXLINELEN]; int nbytes; Rune r; bp = Bopen(arg, OREAD); if (!bp) { panic(mflag ? 0: 2, "cannot open %s: %r\n", arg); return 0; } if (binary) return bp; nbytes = Bread(bp, buf, MIN(1024, MAXLINELEN)); if (nbytes > 0) { cp = buf; while (cp < buf+nbytes-UTFmax) { /* * heuristic for a binary file in the * brave new UNICODE world */ cp += chartorune(&r, cp); if (r == 0 || (r > 0x7f && r <= 0xa0)) { binary++; return bp; } } Bseek(bp, 0, 0); } p = MALLOC(struct line, 3); for (j = 0; h = readhash(bp, buf); p[j].value = h) p = REALLOC(p, struct line, (++j+3)); len[i] = j; file[i] = p; input[i] = bp; /*fix*/ if (i == 0) { /*fix*/ file1 = arg; firstchange = 0; } else file2 = arg; return bp; } static int squishspace(char *buf) { char *p, *q; int space; for (space = 0, q = p = buf; *q; q++) { if (isspace((uchar)*q)) { space++; continue; } if (space && bflag == 1) { *p++ = ' '; space = 0; } *p++ = *q; } *p = 0; return p - buf; } /* * need to fix up for unexpected EOF's */ void check(Biobuf *bf, Biobuf *bt) { int f, t, flen, tlen; char fbuf[MAXLINELEN], tbuf[MAXLINELEN]; ixold[0] = ixnew[0] = 0; for (f = t = 1; f < len[0]; f++) { flen = readline(bf, fbuf); ixold[f] = ixold[f-1] + flen + 1; /* ftell(bf) */ if (J[f] == 0) continue; do { tlen = readline(bt, tbuf); ixnew[t] = ixnew[t-1] + tlen + 1; /* ftell(bt) */ } while (t++ < J[f]); if (bflag) { flen = squishspace(fbuf); tlen = squishspace(tbuf); } if (flen != tlen || strcmp(fbuf, tbuf)) J[f] = 0; } while (t < len[1]) { tlen = readline(bt, tbuf); ixnew[t] = ixnew[t-1] + tlen + 1; /* fseek(bt) */ t++; } } static void range(int a, int b, char *separator) { Bprint(&stdout, "%d", a > b ? b: a); if (a < b) Bprint(&stdout, "%s%d", separator, b); } static void fetch(long *f, int a, int b, Biobuf *bp, char *s) { char buf[MAXLINELEN]; int maxb; if(a <= 1) a = 1; if(bp == input[0]) maxb = len[0]; else maxb = len[1]; if(b > maxb) b = maxb; if(a > maxb) return; Bseek(bp, f[a-1], 0); while (a++ <= b) { readline(bp, buf); Bprint(&stdout, "%s%s\n", s, buf); } } typedef struct Change Change; struct Change { int a; int b; int c; int d; }; Change *changes; int nchanges; void change(int a, int b, int c, int d) { char verb; char buf[4]; Change *ch; if (a > b && c > d) return; anychange = 1; if (mflag && firstchange == 0) { if(mode) { buf[0] = '-'; buf[1] = mode; buf[2] = ' '; buf[3] = '\0'; } else { buf[0] = '\0'; } Bprint(&stdout, "diff %s%s %s\n", buf, file1, file2); firstchange = 1; } verb = a > b ? 'a': c > d ? 'd': 'c'; switch(mode) { case 'e': range(a, b, ","); Bputc(&stdout, verb); break; case 0: range(a, b, ","); Bputc(&stdout, verb); range(c, d, ","); break; case 'n': Bprint(&stdout, "%s:", file1); range(a, b, ","); Bprint(&stdout, " %c ", verb); Bprint(&stdout, "%s:", file2); range(c, d, ","); break; case 'f': Bputc(&stdout, verb); range(a, b, " "); break; case 'c': case 'a': if(nchanges%1024 == 0) changes = erealloc(changes, (nchanges+1024)*sizeof(changes[0])); ch = &changes[nchanges++]; ch->a = a; ch->b = b; ch->c = c; ch->d = d; return; } Bputc(&stdout, '\n'); if (mode == 0 || mode == 'n') { fetch(ixold, a, b, input[0], "< "); if (a <= b && c <= d) Bprint(&stdout, "---\n"); } fetch(ixnew, c, d, input[1], mode == 0 || mode == 'n' ? "> ": ""); if (mode != 0 && mode != 'n' && c <= d) Bprint(&stdout, ".\n"); } enum { Lines = 3, /* number of lines of context shown */ }; int changeset(int i) { while(i<nchanges && changes[i].b+1+2*Lines > changes[i+1].a) i++; if(i<nchanges) return i+1; return nchanges; } void flushchanges(void) { int a, b, c, d, at; int i, j; if(nchanges == 0) return; for(i=0; i<nchanges; ){ j = changeset(i); a = changes[i].a-Lines; b = changes[j-1].b+Lines; c = changes[i].c-Lines; d = changes[j-1].d+Lines; if(a < 1) a = 1; if(c < 1) c = 1; if(b > len[0]) b = len[0]; if(d > len[1]) d = len[1]; if(mode == 'a'){ a = 1; b = len[0]; c = 1; d = len[1]; j = nchanges; } Bprint(&stdout, "%s:", file1); range(a, b, ","); Bprint(&stdout, " - "); Bprint(&stdout, "%s:", file2); range(c, d, ","); Bputc(&stdout, '\n'); at = a; for(; i<j; i++){ fetch(ixold, at, changes[i].a-1, input[0], " "); fetch(ixold, changes[i].a, changes[i].b, input[0], "- "); fetch(ixnew, changes[i].c, changes[i].d, input[1], "+ "); at = changes[i].b+1; } fetch(ixold, at, b, input[0], " "); } nchanges = 0; }