1 /* $OpenBSD: diff3.c,v 1.41 2016/10/18 21:06:52 millert Exp $ */
4 * Copyright (C) Caldera International Inc. 2001-2002.
7 * Redistribution and use in source and binary forms, with or without
8 * modification, are permitted provided that the following conditions
10 * 1. Redistributions of source code and documentation must retain the above
11 * copyright notice, this list of conditions and the following disclaimer.
12 * 2. Redistributions in binary form must reproduce the above copyright
13 * notice, this list of conditions and the following disclaimer in the
14 * documentation and/or other materials provided with the distribution.
15 * 3. All advertising materials mentioning features or use of this software
16 * must display the following acknowledgement:
17 * This product includes software developed or owned by Caldera
19 * 4. Neither the name of Caldera International, Inc. nor the names of other
20 * contributors may be used to endorse or promote products derived from
21 * this software without specific prior written permission.
23 * USE OF THE SOFTWARE PROVIDED FOR UNDER THIS LICENSE BY CALDERA
24 * INTERNATIONAL, INC. AND CONTRIBUTORS ``AS IS'' AND ANY EXPRESS OR
25 * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
26 * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
27 * IN NO EVENT SHALL CALDERA INTERNATIONAL, INC. BE LIABLE FOR ANY DIRECT,
28 * INDIRECT INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
29 * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
30 * SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
31 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT,
32 * STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING
33 * IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
34 * POSSIBILITY OF SUCH DAMAGE.
37 * Copyright (c) 1991, 1993
38 * The Regents of the University of California. All rights reserved.
40 * Redistribution and use in source and binary forms, with or without
41 * modification, are permitted provided that the following conditions
43 * 1. Redistributions of source code must retain the above copyright
44 * notice, this list of conditions and the following disclaimer.
45 * 2. Redistributions in binary form must reproduce the above copyright
46 * notice, this list of conditions and the following disclaimer in the
47 * documentation and/or other materials provided with the distribution.
48 * 3. Neither the name of the University nor the names of its contributors
49 * may be used to endorse or promote products derived from this software
50 * without specific prior written permission.
52 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
53 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
54 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
55 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
56 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
57 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
58 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
59 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
60 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
61 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
64 * @(#)diff3.c 8.1 (Berkeley) 6/6/93
68 #include <sys/queue.h>
79 #include "got_error.h"
80 #include "got_opentemp.h"
81 #include "got_object.h"
85 #include "got_lib_diff.h"
89 #define nitems(_a) (sizeof(_a) / sizeof((_a)[0]))
92 /* flags shared between merge(1) and rcsmerge(1) */
93 #define MERGE_EFLAG (1<<16)
94 #define MERGE_OFLAG (1<<17)
96 /* diff3 - 3-way differential file comparison */
98 /* diff3 [-ex3EX] d13 d23 f1 f2 f3 [m1 m3]
100 * d13 = diff report on f1 vs f3
101 * d23 = diff report on f2 vs f3
102 * f1, f2, f3 the 3 files
103 * if changes in f1 overlap with changes in f3, m1 and m3 are used
104 * to mark the overlaps; otherwise, the file names f1 and f3 are used
105 * (only for options E and X).
109 * "from" is first in range of changed lines; "to" is last+1
110 * from=to=line after point of insertion for added lines.
129 * "de" is used to gather editing scripts. These are later spewed out
130 * in reverse order. Its first element must be all zero. The "new"
131 * component of "de" contains line positions or byte positions
132 * depending on when you look (!?). Array overlap indicates which
133 * sections in "de" correspond to lines that are different in all
140 int cline[3]; /* # of the last-read line in each file (0-2) */
143 * the latest known correspondence between line numbers of the 3 files
144 * is stored in last[1-3];
150 char f1mark[PATH_MAX], f3mark[PATH_MAX]; /* markers for -E and -X */
158 static int duplicate(struct range *, struct range *, struct diff3_state *);
159 static int edit(struct diff *, int, int, struct diff3_state *);
160 static char *getchange(FILE *, struct diff3_state *);
161 static char *get_line(FILE *, size_t *, struct diff3_state *);
162 static int number(char **);
163 static const struct got_error *readin(size_t *, char *, struct diff **,
164 struct diff3_state *);
165 static int ed_patch_lines(struct rcs_lines *, struct rcs_lines *);
166 static int skip(int, int, char *, struct diff3_state *);
167 static int edscript(int, struct diff3_state *);
168 static int merge(size_t, size_t, struct diff3_state *);
169 static void change(int, struct range *, int, struct diff3_state *);
170 static void keep(int, struct range *, struct diff3_state *);
171 static void prange(struct range *);
172 static void repos(int, struct diff3_state *);
173 static void separate(const char *);
174 static const struct got_error *increase(struct diff3_state *);
175 static const struct got_error *diff3_internal(char *, char *, char *,
176 char *, char *, const char *, const char *, struct diff3_state *);
178 int diff3_conflicts = 0;
180 static const struct got_error *
181 diff_output(const char *fmt, ...)
189 i = vasprintf(&str, fmt, vap);
192 return got_error_from_errno();
194 buf_append(&newsize, diffbuf, str, strlen(str));
201 static const struct got_error*
202 diffreg(BUF **d, const char *path1, const char *path2)
204 const struct got_error *err = NULL;
205 FILE *f1 = NULL, *f2 = NULL, *outfile = NULL;
206 char *outpath = NULL;
207 struct got_diff_state ds;
208 struct got_diff_args args;
213 f1 = fopen(path1, "r");
215 err = got_error_from_errno();
218 f2 = fopen(path2, "r");
220 err = got_error_from_errno();
224 err = got_opentemp_named(&outpath, &outfile, "/tmp/got-diff");
228 memset(&ds, 0, sizeof(ds));
229 /* XXX should stat buffers be passed in args instead of ds? */
230 if (stat(path1, &ds.stb1) == -1) {
231 err = got_error_from_errno();
234 if (stat(path2, &ds.stb2) == -1) {
235 err = got_error_from_errno();
239 memset(&args, 0, sizeof(args));
240 args.diff_format = D_NORMAL;
243 args.diff_context = 0;
245 err = got_diffreg(&res, f1, f2, D_FORCEASCII, &args, &ds,
250 *d = buf_load(outpath);
252 err = got_error_from_errno();
267 const struct got_error *
268 merge_diff3(BUF **buf, char *p1, char *p2, char *p3, int flags)
270 const struct got_error *err = NULL;
271 char *dp13, *dp23, *path1, *path2, *path3;
272 BUF *b1, *b2, *b3, *d1, *d2, *diffb;
273 u_char *data, *patch;
275 struct wklhead temp_files;
276 struct diff3_state *d3s;
281 d3s = calloc(1, sizeof(*d3s));
283 return got_error_from_errno();
284 d3s->eflag = 3; /* default -E for compatibility with former RCS */
285 d3s->oflag = 1; /* default -E for compatibility with former RCS */
287 b1 = b2 = b3 = d1 = d2 = diffb = NULL;
288 dp13 = dp23 = path1 = path2 = path3 = NULL;
291 if ((flags & MERGE_EFLAG) && !(flags & MERGE_OFLAG))
294 if ((b1 = buf_load(p1)) == NULL)
296 if ((b2 = buf_load(p2)) == NULL)
298 if ((b3 = buf_load(p3)) == NULL)
301 diffb = buf_alloc(128);
303 if (asprintf(&path1, "/tmp/got-diff1.XXXXXXXX") == -1) {
304 err = got_error_from_errno();
307 if (asprintf(&path2, "/tmp/got-diff2.XXXXXXXX") == -1) {
308 err = got_error_from_errno();
311 if (asprintf(&path3, "/tmp/got-diff3.XXXXXXXX") == -1) {
312 err = got_error_from_errno();
316 err = buf_write_stmp(b1, path1, &temp_files);
319 err = buf_write_stmp(b2, path2, &temp_files);
322 err = buf_write_stmp(b3, path3, &temp_files);
329 err = diffreg(&d1, path1, path3);
336 err = diffreg(&d2, path2, path3);
343 if (asprintf(&dp13, "/tmp/got-d13.XXXXXXXXXX") == -1) {
344 err = got_error_from_errno();
347 err = buf_write_stmp(d1, dp13, &temp_files);
354 if (asprintf(&dp23, "/tmp/got-d23.XXXXXXXXXX") == -1) {
355 err = got_error_from_errno();
358 err = buf_write_stmp(d2, dp23, &temp_files);
366 err = diff3_internal(dp13, dp23, path1, path2, path3, p1, p3,
374 plen = buf_len(diffb);
375 patch = buf_release(diffb);
377 data = buf_release(b1);
379 if ((diffb = rcs_patchfile(data, dlen, patch, plen, ed_patch_lines)) == NULL)
401 worklist_clean(&temp_files, worklist_unlink);
403 for (i = 0; i < nitems(d3s->fp); i++) {
413 static const struct got_error *
414 diff3_internal(char *dp13, char *dp23, char *path1, char *path2, char *path3,
415 const char *fmark, const char *rmark, struct diff3_state *d3s)
417 const struct got_error *err = NULL;
421 i = snprintf(d3s->f1mark, sizeof(d3s->f1mark), "<<<<<<< %s", fmark);
422 if (i < 0 || i >= (int)sizeof(d3s->f1mark))
423 return got_error(GOT_ERR_NO_SPACE);
425 i = snprintf(d3s->f3mark, sizeof(d3s->f3mark), ">>>>>>> %s", rmark);
426 if (i < 0 || i >= (int)sizeof(d3s->f3mark))
427 return got_error(GOT_ERR_NO_SPACE);
433 err = readin(&m, dp13, &d3s->d13, d3s);
436 err = readin(&n, dp23, &d3s->d23, d3s);
440 if ((d3s->fp[0] = fopen(path1, "r")) == NULL)
441 return got_error_from_errno();
442 if ((d3s->fp[1] = fopen(path2, "r")) == NULL)
443 return got_error_from_errno();
444 if ((d3s->fp[2] = fopen(path3, "r")) == NULL)
445 return got_error_from_errno();
447 if (merge(m, n, d3s) < 0)
448 return got_error_from_errno();
453 ed_patch_lines(struct rcs_lines *dlines, struct rcs_lines *plines)
456 struct rcs_line *sort, *lp, *dlp, *ndlp, *insert_after;
457 int start, end, i, lineno;
460 dlp = TAILQ_FIRST(&(dlines->l_lines));
461 lp = TAILQ_FIRST(&(plines->l_lines));
464 for (lp = TAILQ_NEXT(lp, l_list); lp != NULL;
465 lp = TAILQ_NEXT(lp, l_list)) {
466 /* Skip blank lines */
470 /* NUL-terminate line buffer for strtol() safety. */
471 tmp = lp->l_line[lp->l_len - 1];
472 lp->l_line[lp->l_len - 1] = '\0';
474 /* len - 1 is NUL terminator so we use len - 2 for 'op' */
475 op = lp->l_line[lp->l_len - 2];
476 start = (int)strtol(lp->l_line, &ep, 10);
478 /* Restore the last byte of the buffer */
479 lp->l_line[lp->l_len - 1] = tmp;
482 if (start > dlines->l_nblines ||
483 start < 0 || *ep != 'a')
485 } else if (op == 'c') {
486 if (start > dlines->l_nblines ||
487 start < 0 || (*ep != ',' && *ep != 'c'))
492 end = (int)strtol(ep, &ep, 10);
493 if (end < 0 || *ep != 'c')
504 if (dlp->l_lineno == start)
506 if (dlp->l_lineno > start) {
507 dlp = TAILQ_PREV(dlp, tqh, l_list);
508 } else if (dlp->l_lineno < start) {
509 ndlp = TAILQ_NEXT(dlp, l_list);
510 if (ndlp->l_lineno > start)
521 insert_after = TAILQ_PREV(dlp, tqh, l_list);
522 for (i = 0; i <= (end - start); i++) {
523 ndlp = TAILQ_NEXT(dlp, l_list);
524 TAILQ_REMOVE(&(dlines->l_lines), dlp, l_list);
530 if (op == 'a' || op == 'c') {
533 lp = TAILQ_NEXT(lp, l_list);
537 if (!memcmp(lp->l_line, ".", 1))
540 TAILQ_REMOVE(&(plines->l_lines), lp, l_list);
541 TAILQ_INSERT_AFTER(&(dlines->l_lines), dlp,
545 lp->l_lineno = start;
551 * Always re-sort (renumber) the lines, as the markers might have been
552 * put at the same line as the one where we first started editing.
555 TAILQ_FOREACH(sort, &(dlines->l_lines), l_list)
556 sort->l_lineno = lineno++;
557 dlines->l_nblines = lineno - 1;
564 * Pick up the line numbers of all changes from one change file.
565 * (This puts the numbers in a vector, which is not strictly necessary,
566 * since the vector is processed in one sequential pass.
567 * The vector could be optimized out of existence)
569 static const struct got_error *
570 readin(size_t *n, char *name, struct diff **dd, struct diff3_state *d3s)
572 const struct got_error *err = NULL;
577 d3s->fp[0] = fopen(name, "r");
578 if (d3s->fp[0] == NULL)
579 return got_error_from_errno();
580 for (i = 0; (p = getchange(d3s->fp[0], d3s)); i++) {
581 if (i >= d3s->szchanges - 1) {
603 (*dd)[i].old.from = a;
605 (*dd)[i].new.from = c;
610 (*dd)[i].old.from = (*dd)[i-1].old.to;
611 (*dd)[i].new.from = (*dd)[i-1].new.to;
614 (void)fclose(d3s->fp[0]);
625 while (isdigit((unsigned char)(**lc)))
626 nn = nn*10 + *(*lc)++ - '0';
632 getchange(FILE *b, struct diff3_state *d3s)
636 while ((line = get_line(b, NULL, d3s))) {
637 if (isdigit((unsigned char)line[0]))
645 get_line(FILE *b, size_t *n, struct diff3_state *d3s)
651 if ((cp = fgetln(b, &len)) == NULL)
654 if (cp[len - 1] != '\n')
656 if (len + 1 > d3s->bufsize) {
658 d3s->bufsize += 1024;
659 } while (len + 1 > d3s->bufsize);
660 new = reallocarray(d3s->buf, 1, d3s->bufsize);
665 memcpy(d3s->buf, cp, len - 1);
666 d3s->buf[len - 1] = '\n';
667 d3s->buf[len] = '\0';
675 merge(size_t m1, size_t m2, struct diff3_state *d3s)
677 struct diff *d1, *d2, *d3;
684 t1 = (d1 < d3s->d13 + m1);
685 t2 = (d2 < d3s->d23 + m2);
690 printf("%d,%d=%d,%d %d,%d=%d,%d\n",
691 d1->old.from, d1->old.to,
692 d1->new.from, d1->new.to,
693 d2->old.from, d2->old.to,
694 d2->new.from, d2->new.to);
697 /* first file is different from others */
698 if (!t2 || (t1 && d1->new.to < d2->new.from)) {
699 /* stuff peculiar to 1st file */
700 if (d3s->eflag == 0) {
702 change(1, &d1->old, 0, d3s);
703 keep(2, &d1->new, d3s);
704 change(3, &d1->new, 0, d3s);
710 /* second file is different from others */
711 if (!t1 || (t2 && d2->new.to < d1->new.from)) {
712 if (d3s->eflag == 0) {
714 keep(1, &d2->new, d3s);
715 change(2, &d2->old, 0, d3s);
716 change(3, &d2->new, 0, d3s);
723 * Merge overlapping changes in the first file;
724 * this happens after extension (see below).
726 if (d1 + 1 < d3s->d13 + m1 && d1->new.to >= d1[1].new.from) {
727 d1[1].old.from = d1->old.from;
728 d1[1].new.from = d1->new.from;
733 /* merge overlapping changes in second */
734 if (d2 + 1 < d3s->d23 + m2 && d2->new.to >= d2[1].new.from) {
735 d2[1].old.from = d2->old.from;
736 d2[1].new.from = d2->new.from;
740 /* stuff peculiar to third file or different in all */
741 if (d1->new.from == d2->new.from && d1->new.to == d2->new.to) {
742 dpl = duplicate(&d1->old, &d2->old, d3s);
747 * dpl = 0 means all files differ
748 * dpl = 1 means files 1 and 2 identical
750 if (d3s->eflag == 0) {
751 separate(dpl ? "3" : "");
752 change(1, &d1->old, dpl, d3s);
753 change(2, &d2->old, 0, d3s);
754 d3 = d1->old.to > d1->old.from ? d1 : d2;
755 change(3, &d3->new, 0, d3s);
757 j = edit(d1, dpl, j, d3s);
764 * Overlapping changes from file 1 and 2; extend changes
765 * appropriately to make them coincide.
767 if (d1->new.from < d2->new.from) {
768 d2->old.from -= d2->new.from-d1->new.from;
769 d2->new.from = d1->new.from;
770 } else if (d2->new.from < d1->new.from) {
771 d1->old.from -= d1->new.from-d2->new.from;
772 d1->new.from = d2->new.from;
774 if (d1->new.to > d2->new.to) {
775 d2->old.to += d1->new.to - d2->new.to;
776 d2->new.to = d1->new.to;
777 } else if (d2->new.to > d1->new.to) {
778 d1->old.to += d2->new.to - d1->new.to;
779 d1->new.to = d2->new.to;
783 return (edscript(j, d3s));
787 separate(const char *s)
789 diff_output("====%s\n", s);
793 * The range of lines rold.from thru rold.to in file i is to be changed.
794 * It is to be printed only if it does not duplicate something to be
798 change(int i, struct range *rold, int fdup, struct diff3_state *d3s)
800 diff_output("%d:", i);
801 d3s->last[i] = rold->to;
803 if (fdup || d3s->debug)
806 (void)skip(i, rold->from, NULL, d3s);
807 (void)skip(i, rold->to, " ", d3s);
811 * print the range of line numbers, rold.from thru rold.to, as n1,n2 or n1
814 prange(struct range *rold)
816 if (rold->to <= rold->from)
817 diff_output("%da\n", rold->from - 1);
819 diff_output("%d", rold->from);
820 if (rold->to > rold->from+1)
821 diff_output(",%d", rold->to - 1);
827 * No difference was reported by diff between file 1 (or 2) and file 3,
828 * and an artificial dummy difference (trange) must be ginned up to
829 * correspond to the change reported in the other file.
832 keep(int i, struct range *rnew, struct diff3_state *d3s)
837 delta = d3s->last[3] - d3s->last[i];
838 trange.from = rnew->from - delta;
839 trange.to = rnew->to - delta;
840 change(i, &trange, 1, d3s);
844 * Skip to just before line number "from" in file "i". If "pr" is non-NULL,
845 * print all skipped lines with the string "pr" as a prefix.
848 skip(int i, int from, char *pr, struct diff3_state *d3s)
853 for (n = 0; d3s->cline[i] < from - 1; n += j) {
854 if ((line = get_line(d3s->fp[i], &j, d3s)) == NULL)
857 diff_output("%s%s", pr, line);
864 * Return 1 if the old range (in file 1) contains exactly the same data
865 * as the new range (in file 2), and 0 otherwise.
868 duplicate(struct range *r1, struct range *r2, struct diff3_state *d3s)
874 if (r1->to-r1->from != r2->to-r2->from)
876 (void)skip(0, r1->from, NULL, d3s);
877 (void)skip(1, r2->from, NULL, d3s);
879 for (nline=0; nline < r1->to - r1->from; nline++) {
881 c = getc(d3s->fp[0]);
882 d = getc(d3s->fp[1]);
883 if (c == -1 || d== -1)
897 repos(int nchar, struct diff3_state *d3s)
901 for (i = 0; i < 2; i++)
902 (void)fseek(d3s->fp[i], (long)-nchar, SEEK_CUR);
906 * collect an editing script for later regurgitation
909 edit(struct diff *diff, int fdup, int j, struct diff3_state *d3s)
911 if (((fdup + 1) & d3s->eflag) == 0)
914 d3s->overlap[j] = !fdup;
917 d3s->de[j].old.from = diff->old.from;
918 d3s->de[j].old.to = diff->old.to;
919 d3s->de[j].new.from =
920 d3s->de[j-1].new.to + skip(2, diff->new.from, NULL, d3s);
922 d3s->de[j].new.from + skip(2, diff->new.to, NULL, d3s);
928 edscript(int n, struct diff3_state *d3s)
931 char block[BUFSIZ+1];
934 if (!d3s->oflag || !d3s->overlap[n])
935 prange(&d3s->de[n].old);
937 diff_output("%da\n=======\n", d3s->de[n].old.to -1);
938 (void)fseek(d3s->fp[2], (long)d3s->de[n].new.from, SEEK_SET);
939 k = d3s->de[n].new.to - d3s->de[n].new.from;
940 for (; k > 0; k-= j) {
941 j = k > BUFSIZ ? BUFSIZ : k;
942 if (fread(block, 1, j, d3s->fp[2]) != (size_t)j)
945 diff_output("%s", block);
948 if (!d3s->oflag || !d3s->overlap[n])
951 diff_output("%s\n.\n", d3s->f3mark);
952 diff_output("%da\n%s\n.\n", d3s->de[n].old.from - 1,
957 return (d3s->overlapcnt);
960 static const struct got_error *
961 increase(struct diff3_state *d3s)
967 /* are the memset(3) calls needed? */
968 newsz = d3s->szchanges == 0 ? 64 : 2 * d3s->szchanges;
969 incr = newsz - d3s->szchanges;
971 d = reallocarray(d3s->d13, newsz, sizeof(*d3s->d13));
973 return got_error_from_errno();
975 memset(d3s->d13 + d3s->szchanges, 0, incr * sizeof(*d3s->d13));
977 d = reallocarray(d3s->d23, newsz, sizeof(*d3s->d23));
979 return got_error_from_errno();
981 memset(d3s->d23 + d3s->szchanges, 0, incr * sizeof(*d3s->d23));
983 d = reallocarray(d3s->de, newsz, sizeof(*d3s->de));
985 return got_error_from_errno();
987 memset(d3s->de + d3s->szchanges, 0, incr * sizeof(*d3s->de));
989 s = reallocarray(d3s->overlap, newsz, sizeof(*d3s->overlap));
991 return got_error_from_errno();
993 memset(d3s->overlap + d3s->szchanges, 0, incr * sizeof(*d3s->overlap));
994 d3s->szchanges = newsz;