1 /* $OpenBSD: diff3prog.c,v 1.11 2009/10/27 23:59:37 deraadt Exp $ */
4 * Copyright (C) Caldera International Inc. 2001-2002.
7 * Redistribution and use in source and binary forms, with or without
8 * modification, are permitted provided that the following conditions
10 * 1. Redistributions of source code and documentation must retain the above
11 * copyright notice, this list of conditions and the following disclaimer.
12 * 2. Redistributions in binary form must reproduce the above copyright
13 * notice, this list of conditions and the following disclaimer in the
14 * documentation and/or other materials provided with the distribution.
15 * 3. All advertising materials mentioning features or use of this software
16 * must display the following acknowledgement:
17 * This product includes software developed or owned by Caldera
19 * 4. Neither the name of Caldera International, Inc. nor the names of other
20 * contributors may be used to endorse or promote products derived from
21 * this software without specific prior written permission.
23 * USE OF THE SOFTWARE PROVIDED FOR UNDER THIS LICENSE BY CALDERA
24 * INTERNATIONAL, INC. AND CONTRIBUTORS ``AS IS'' AND ANY EXPRESS OR
25 * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
26 * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
27 * IN NO EVENT SHALL CALDERA INTERNATIONAL, INC. BE LIABLE FOR ANY DIRECT,
28 * INDIRECT INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
29 * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
30 * SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
31 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT,
32 * STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING
33 * IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
34 * POSSIBILITY OF SUCH DAMAGE.
37 * Copyright (c) 1991, 1993
38 * The Regents of the University of California. All rights reserved.
40 * Redistribution and use in source and binary forms, with or without
41 * modification, are permitted provided that the following conditions
43 * 1. Redistributions of source code must retain the above copyright
44 * notice, this list of conditions and the following disclaimer.
45 * 2. Redistributions in binary form must reproduce the above copyright
46 * notice, this list of conditions and the following disclaimer in the
47 * documentation and/or other materials provided with the distribution.
48 * 3. Neither the name of the University nor the names of its contributors
49 * may be used to endorse or promote products derived from this software
50 * without specific prior written permission.
52 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
53 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
54 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
55 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
56 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
57 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
58 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
59 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
60 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
61 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
64 * @(#)diff3.c 8.1 (Berkeley) 6/6/93
69 static char sccsid[] = "@(#)diff3.c 8.1 (Berkeley) 6/6/93";
72 #include <sys/cdefs.h>
73 __FBSDID("$FreeBSD$");
75 #include <sys/capsicum.h>
76 #include <sys/procdesc.h>
77 #include <sys/types.h>
78 #include <sys/event.h>
81 #include <capsicum_helpers.h>
94 * "from" is first in range of changed lines; "to" is last+1
95 * from=to=line after point of insertion for added lines.
110 /* Ranges as lines */
116 #define EFLAG_OVERLAP 1
117 #define EFLAG_NOOVERLAP 2
118 #define EFLAG_UNMERGED 3
120 static size_t szchanges;
122 static struct diff *d13;
123 static struct diff *d23;
125 * "de" is used to gather editing scripts. These are later spewed out in
126 * reverse order. Its first element must be all zero. The "old" and "new"
127 * components of "de" contain line positions. The "overlap" array indicates which
128 * sections in "de" correspond to lines that are different in all three files.
130 static struct diff *de;
131 static char *overlap;
132 static int overlapcnt;
134 static int cline[3]; /* # of the last-read line in each file (0-2) */
136 * The latest known correspondence between line numbers of the 3 files
137 * is stored in last[1-3].
140 static int Aflag, eflag, iflag, mflag, Tflag;
141 static int oflag; /* indicates whether to mark overlaps (-E or -X) */
143 static char *f1mark, *f2mark, *f3mark;
144 static const char *oldmark = "<<<<<<<";
145 static const char *orgmark = "|||||||";
146 static const char *newmark = ">>>>>>>";
148 static bool duplicate(struct range *, struct range *);
149 static int edit(struct diff *, bool, int, int);
150 static char *getchange(FILE *);
151 static char *get_line(FILE *, size_t *);
152 static int readin(int fd, struct diff **);
153 static int skip(int, int, const char *);
154 static void change(int, struct range *, bool);
155 static void keep(int, struct range *);
156 static void merge(int, int);
157 static void prange(struct range *, bool);
158 static void repos(int);
159 static void edscript(int) __dead2;
160 static void Ascript(int) __dead2;
161 static void mergescript(int) __dead2;
162 static void increase(void);
163 static void usage(void);
164 static void printrange(FILE *, struct range *);
166 static const char diff3_version[] = "FreeBSD diff3 20220517";
175 #define DIFF_PATH "/usr/bin/diff"
177 #define OPTIONS "3aAeEiL:mTxX"
178 static struct option longopts[] = {
179 { "ed", no_argument, NULL, 'e' },
180 { "show-overlap", no_argument, NULL, 'E' },
181 { "overlap-only", no_argument, NULL, 'x' },
182 { "initial-tab", no_argument, NULL, 'T' },
183 { "text", no_argument, NULL, 'a' },
184 { "strip-trailing-cr", no_argument, NULL, STRIPCR_OPT },
185 { "show-all", no_argument, NULL, 'A' },
186 { "easy-only", no_argument, NULL, '3' },
187 { "merge", no_argument, NULL, 'm' },
188 { "label", required_argument, NULL, 'L' },
189 { "diff-program", required_argument, NULL, DIFFPROG_OPT },
190 { "help", no_argument, NULL, HELP_OPT},
191 { "version", no_argument, NULL, VERSION_OPT}
197 fprintf(stderr, "usage: diff3 [-3aAeEimTxX] [-L label1] [-L label2] "
198 "[-L label3] file1 file2 file3\n");
202 readin(int fd, struct diff **dd)
212 for (i = 0; (p = getchange(f)); i++) {
214 (*dd)[i].line = strdup(p);
217 if (i >= szchanges - 1)
219 a = b = (int)strtoimax(p, &p, 10);
222 b = (int)strtoimax(p, &p, 10);
225 c = d = (int)strtoimax(p, &p, 10);
228 d = (int)strtoimax(p, &p, 10);
236 (*dd)[i].old.from = a;
238 (*dd)[i].new.from = c;
242 (*dd)[i].old.from = (*dd)[i - 1].old.to;
243 (*dd)[i].new.from = (*dd)[i - 1].new.to;
250 diffexec(const char *diffprog, char **diffargv, int fd[])
254 switch (pdfork(&pd, PD_CLOEXEC)) {
257 if (dup2(fd[1], STDOUT_FILENO) == -1)
258 err(2, "child could not duplicate descriptor");
260 execvp(diffprog, diffargv);
261 err(2, "could not execute diff: %s", diffprog);
264 err(2, "could not fork");
276 while ((line = get_line(b, NULL))) {
277 if (isdigit((unsigned char)line[0]))
285 get_line(FILE *b, size_t *n)
288 static char *buf = NULL;
289 static size_t bufsize = 0;
291 if ((len = getline(&buf, &bufsize, b)) < 0)
294 if (strip_cr && len >= 2 && strcmp("\r\n", &(buf[len - 2])) == 0) {
307 merge(int m1, int m2)
309 struct diff *d1, *d2, *d3;
317 while (t1 = d1 < d13 + m1, t2 = d2 < d23 + m2, t1 || t2) {
318 /* first file is different from the others */
319 if (!t2 || (t1 && d1->new.to < d2->new.from)) {
320 /* stuff peculiar to 1st file */
321 if (eflag == EFLAG_NONE) {
323 change(1, &d1->old, false);
325 change(3, &d1->new, false);
330 /* second file is different from others */
331 if (!t1 || (t2 && d2->new.to < d1->new.from)) {
332 if (eflag == EFLAG_NONE) {
335 change(3, &d2->new, false);
336 change(2, &d2->old, false);
337 } else if (Aflag || mflag) {
338 // XXX-THJ: What does it mean for the second file to differ?
339 j = edit(d2, dup, j, DIFF_TYPE2);
345 * Merge overlapping changes in first file;
346 * this happens after extension (see below).
348 if (d1 + 1 < d13 + m1 && d1->new.to >= d1[1].new.from) {
349 d1[1].old.from = d1->old.from;
350 d1[1].new.from = d1->new.from;
355 /* merge overlapping changes in second */
356 if (d2 + 1 < d23 + m2 && d2->new.to >= d2[1].new.from) {
357 d2[1].old.from = d2->old.from;
358 d2[1].new.from = d2->new.from;
362 /* stuff peculiar to third file or different in all */
363 if (d1->new.from == d2->new.from && d1->new.to == d2->new.to) {
364 dup = duplicate(&d1->old, &d2->old);
366 * dup = 0 means all files differ
367 * dup = 1 means files 1 and 2 identical
369 if (eflag == EFLAG_NONE) {
370 printf("====%s\n", dup ? "3" : "");
371 change(1, &d1->old, dup);
372 change(2, &d2->old, false);
373 d3 = d1->old.to > d1->old.from ? d1 : d2;
374 change(3, &d3->new, false);
376 j = edit(d1, dup, j, DIFF_TYPE3);
384 * Overlapping changes from file 1 and 2; extend changes
385 * appropriately to make them coincide.
387 if (d1->new.from < d2->new.from) {
388 d2->old.from -= d2->new.from - d1->new.from;
389 d2->new.from = d1->new.from;
390 } else if (d2->new.from < d1->new.from) {
391 d1->old.from -= d1->new.from - d2->new.from;
392 d1->new.from = d2->new.from;
394 if (d1->new.to > d2->new.to) {
395 d2->old.to += d1->new.to - d2->new.to;
396 d2->new.to = d1->new.to;
397 } else if (d2->new.to > d1->new.to) {
398 d1->old.to += d2->new.to - d1->new.to;
399 d1->new.to = d2->new.to;
412 * The range of lines rold.from thru rold.to in file i is to be changed.
413 * It is to be printed only if it does not duplicate something to be
417 change(int i, struct range *rold, bool dup)
426 skip(i, rold->from, NULL);
427 skip(i, rold->to, " ");
431 * Print the range of line numbers, rold.from thru rold.to, as n1,n2 or
435 prange(struct range *rold, bool delete)
438 if (rold->to <= rold->from)
439 printf("%da\n", rold->from - 1);
441 printf("%d", rold->from);
442 if (rold->to > rold->from + 1)
443 printf(",%d", rold->to - 1);
452 * No difference was reported by diff between file 1 (or 2) and file 3,
453 * and an artificial dummy difference (trange) must be ginned up to
454 * correspond to the change reported in the other file.
457 keep(int i, struct range *rnew)
462 delta = last[3] - last[i];
463 trange.from = rnew->from - delta;
464 trange.to = rnew->to - delta;
465 change(i, &trange, true);
469 * Skip to just before line number "from" in file "i". If "pr" is non-NULL,
470 * print all skipped stuff with string "pr" as a prefix.
473 skip(int i, int from, const char *pr)
478 for (n = 0; cline[i] < from - 1; n += j) {
479 if ((line = get_line(fp[i], &j)) == NULL)
480 errx(EXIT_FAILURE, "logic error");
482 printf("%s%s", Tflag == 1 ? "\t" : pr, line);
489 * Return 1 or 0 according to whether the old range (in file 1) contains exactly
490 * the same data as the new range (in file 2).
493 duplicate(struct range *r1, struct range *r2)
499 if (r1->to-r1->from != r2->to-r2->from)
501 skip(0, r1->from, NULL);
502 skip(1, r2->from, NULL);
504 for (nline = 0; nline < r1->to - r1->from; nline++) {
508 if (c == -1 && d == -1)
510 if (c == -1 || d == -1)
511 errx(EXIT_FAILURE, "logic error");
528 for (i = 0; i < 2; i++)
529 (void)fseek(fp[i], (long)-nchar, SEEK_CUR);
533 * collect an editing script for later regurgitation
536 edit(struct diff *diff, bool dup, int j, int difftype)
538 if (!(eflag == EFLAG_UNMERGED ||
539 (!dup && eflag == EFLAG_OVERLAP ) ||
540 (dup && eflag == EFLAG_NOOVERLAP))) {
548 de[j].type = difftype;
550 de[j].line = strdup(diff->line);
553 de[j].old.from = diff->old.from;
554 de[j].old.to = diff->old.to;
555 de[j].new.from = diff->new.from;
556 de[j].new.to = diff->new.to;
561 printrange(FILE *p, struct range *r)
568 /* We haven't been asked to print anything */
569 if (r->from == r->to)
573 errx(EXIT_FAILURE, "invalid print range");
576 * XXX-THJ: We read through all of the file for each range printed.
577 * This duplicates work and will probably impact performance on large
578 * files with lots of ranges.
580 fseek(p, 0L, SEEK_SET);
581 while ((rlen = getline(&line, &len, p)) > 0) {
597 delete = (de[n].new.from == de[n].new.to);
598 if (!oflag || !overlap[n]) {
599 prange(&de[n].old, delete);
601 printf("%da\n", de[n].old.to - 1);
604 printrange(fp[2], &de[n].new);
605 if (!oflag || !overlap[n]) {
609 printf("%s %s\n.\n", newmark, f3mark);
610 printf("%da\n%s %s\n.\n", de[n].old.from - 1,
617 exit(eflag == EFLAG_NONE ? overlapcnt : 0);
621 * Output an edit script to turn mine into yours. When there is a conflict
622 * between the 3 files, bracket the changes. Regurgitate the diffs in reverse
623 * order to allow the ed script to track down where the lines are as changes
635 deletenew = (de[n].new.from == de[n].new.to);
636 deleteold = (de[n].old.from == de[n].old.to);
637 startmark = de[n].old.from + (de[n].old.to - de[n].old.from) - 1;
639 if (de[n].type == DIFF_TYPE2) {
640 if (!oflag || !overlap[n]) {
641 prange(&de[n].old, deletenew);
642 printrange(fp[2], &de[n].new);
644 startmark = de[n].new.from +
645 (de[n].new.to - de[n].new.from);
650 printf("%da\n", startmark);
651 printf("%s %s\n", newmark, f3mark);
655 printf("%da\n", startmark -
656 (de[n].new.to - de[n].new.from));
657 printf("%s %s\n", oldmark, f2mark);
659 printrange(fp[1], &de[n].old);
660 printf("=======\n.\n");
663 } else if (de[n].type == DIFF_TYPE3) {
664 if (!oflag || !overlap[n]) {
665 prange(&de[n].old, deletenew);
666 printrange(fp[2], &de[n].new);
668 printf("%da\n", startmark);
669 printf("%s %s\n", orgmark, f2mark);
673 r.from = de[n].old.from-1;
675 printrange(fp[1], &r);
677 printrange(fp[1], &de[n].old);
680 printrange(fp[2], &de[n].new);
683 if (!oflag || !overlap[n]) {
687 printf("%s %s\n.\n", newmark, f3mark);
690 * Go to the start of the conflict in original
691 * file and append lines
693 printf("%da\n%s %s\n.\n",
694 startmark - (de[n].old.to - de[n].old.from),
702 exit(overlapcnt > 0);
706 * Output the merged file directly (don't generate an ed script). When
707 * regurgitating diffs we need to walk forward through the file and print any
719 for (n = 1; n < i+1; n++) {
720 /* print any lines leading up to here */
721 r.to = de[n].old.from;
722 printrange(fp[0], &r);
724 if (de[n].type == DIFF_TYPE2) {
725 printf("%s %s\n", oldmark, f2mark);
726 printrange(fp[1], &de[n].old);
728 printrange(fp[2], &de[n].new);
729 printf("%s %s\n", newmark, f3mark);
730 } else if (de[n].type == DIFF_TYPE3) {
731 if (!oflag || !overlap[n]) {
732 printrange(fp[2], &de[n].new);
735 printf("%s %s\n", oldmark, f1mark);
736 printrange(fp[0], &de[n].old);
738 printf("%s %s\n", orgmark, f2mark);
739 if (de[n].old.from == de[n].old.to) {
741 or.from = de[n].old.from -1;
742 or.to = de[n].new.to;
743 printrange(fp[1], &or);
745 printrange(fp[1], &de[n].old);
749 printrange(fp[2], &de[n].new);
750 printf("%s %s\n", newmark, f3mark);
754 if (de[n].old.from == de[n].old.to)
755 r.from = de[n].new.to;
757 r.from = de[n].old.to;
760 * Print from the final range to the end of 'myfile'. Any deletions or
761 * additions to this file should have been handled by now.
763 * If the ranges are the same we need to rewind a line.
764 * If the new range is 0 length (from == to), we need to use the old
767 if ((de[n-1].old.from == de[n-1].new.from) &&
768 (de[n-1].old.to == de[n-1].new.to))
770 else if (de[n-1].new.from == de[n-1].new.to)
771 r.from = de[n-1].old.from;
774 * If the range is a 3 way merge then we need to skip a line in the
777 if (de[n-1].type == DIFF_TYPE3)
781 printrange(fp[0], &r);
782 exit(overlapcnt > 0);
792 /* are the memset(3) calls needed? */
793 newsz = szchanges == 0 ? 64 : 2 * szchanges;
794 incr = newsz - szchanges;
796 p = reallocarray(d13, newsz, sizeof(struct diff));
799 memset(p + szchanges, 0, incr * sizeof(struct diff));
801 p = reallocarray(d23, newsz, sizeof(struct diff));
804 memset(p + szchanges, 0, incr * sizeof(struct diff));
806 p = reallocarray(de, newsz, sizeof(struct diff));
809 memset(p + szchanges, 0, incr * sizeof(struct diff));
811 q = reallocarray(overlap, newsz, sizeof(char));
814 memset(q + szchanges, 0, incr * sizeof(char));
821 main(int argc, char **argv)
823 int ch, nblabels, status, m, n, kq, nke, nleft, i;
824 char *labels[] = { NULL, NULL, NULL };
825 const char *diffprog = DIFF_PATH;
826 char *file1, *file2, *file3;
829 int fd13[2], fd23[2];
831 cap_rights_t rights_ro;
837 diffargv[diffargc++] = __DECONST(char *, diffprog);
838 while ((ch = getopt_long(argc, argv, OPTIONS, longopts, NULL)) != -1) {
841 eflag = EFLAG_NOOVERLAP;
844 diffargv[diffargc++] = __DECONST(char *, "-a");
850 eflag = EFLAG_UNMERGED;
853 eflag = EFLAG_UNMERGED;
862 errx(2, "too many file label options");
863 labels[nblabels++] = optarg;
874 eflag = EFLAG_OVERLAP;
878 eflag = EFLAG_OVERLAP;
885 diffargv[diffargc++] = __DECONST(char *, "--strip-trailing-cr");
891 printf("%s\n", diff3_version);
899 eflag = EFLAG_UNMERGED;
908 if (caph_limit_stdio() == -1)
909 err(2, "unable to limit stdio");
911 cap_rights_init(&rights_ro, CAP_READ, CAP_FSTAT, CAP_SEEK);
917 e = malloc(2 * sizeof(struct kevent));
927 asprintf(&f1mark, "%s",
928 labels[0] != NULL ? labels[0] : file1);
931 asprintf(&f2mark, "%s",
932 labels[1] != NULL ? labels[1] : file2);
935 asprintf(&f3mark, "%s",
936 labels[2] != NULL ? labels[2] : file3);
940 fp[0] = fopen(file1, "r");
942 err(2, "Can't open %s", file1);
943 if (caph_rights_limit(fileno(fp[0]), &rights_ro) < 0)
944 err(2, "unable to limit rights on: %s", file1);
946 fp[1] = fopen(file2, "r");
948 err(2, "Can't open %s", file2);
949 if (caph_rights_limit(fileno(fp[1]), &rights_ro) < 0)
950 err(2, "unable to limit rights on: %s", file2);
952 fp[2] = fopen(file3, "r");
954 err(2, "Can't open %s", file3);
955 if (caph_rights_limit(fileno(fp[2]), &rights_ro) < 0)
956 err(2, "unable to limit rights on: %s", file3);
963 diffargv[diffargc] = file1;
964 diffargv[diffargc + 1] = file3;
965 diffargv[diffargc + 2] = NULL;
968 pd13 = diffexec(diffprog, diffargv, fd13);
969 EV_SET(e + nleft , pd13, EVFILT_PROCDESC, EV_ADD, NOTE_EXIT, 0, NULL);
970 if (kevent(kq, e + nleft, 1, NULL, 0, NULL) == -1)
974 diffargv[diffargc] = file2;
975 pd23 = diffexec(diffprog, diffargv, fd23);
976 EV_SET(e + nleft , pd23, EVFILT_PROCDESC, EV_ADD, NOTE_EXIT, 0, NULL);
977 if (kevent(kq, e + nleft, 1, NULL, 0, NULL) == -1)
981 caph_cache_catpages();
982 if (caph_enter() < 0)
983 err(2, "unable to enter capability mode");
987 m = readin(fd13[0], &d13);
988 n = readin(fd23[0], &d23);
990 /* wait for the diff children to exit: a waitpid() equivalent built on pdfork() descriptors and kevent() */
992 nke = kevent(kq, NULL, 0, e, nleft, NULL);
995 for (i = 0; i < nke; i++) {
997 if (WIFEXITED(status) && WEXITSTATUS(status) >= 2)
998 errx(2, "diff exited abnormally");
999 else if (WIFSIGNALED(status))
1000 errx(2, "diff killed by signal %d",
1007 return (EXIT_SUCCESS);