2 * LibXDiff by Davide Libenzi ( File Differential Library )
3 * Copyright (C) 2003-2006 Davide Libenzi, Johannes E. Schindelin
5 * This library is free software; you can redistribute it and/or
6 * modify it under the terms of the GNU Lesser General Public
7 * License as published by the Free Software Foundation; either
8 * version 2.1 of the License, or (at your option) any later version.
10 * This library is distributed in the hope that it will be useful,
11 * but WITHOUT ANY WARRANTY; without even the implied warranty of
12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
13 * Lesser General Public License for more details.
15 * You should have received a copy of the GNU Lesser General Public
16 * License along with this library; if not, write to the Free Software
17 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
19 * Davide Libenzi <davidel@xmailserver.org>
/*
 * List node type used throughout this file as xdmerge_t. The only member
 * declaration visible here is next, which links to the following node.
 * Other code in this file also reads and writes members named mode,
 * i0/chg0, i1/chg1 and i2/chg2 through this type.
 * NOTE(review): those member declarations, the comment delimiters around the
 * text fragments below, and the closing of the typedef are not present in
 * this copy of the file.
 */
25 typedef struct s_xdmerge
{
26 struct s_xdmerge
*next
;
/* The next three fragments describe values 1, 2 and 3 of a field; presumably mode -- TODO confirm. */
29 * 1 = no conflict, take first,
30 * 2 = no conflict, take second.
31 * 3 = no conflict, take both.
35 * These point at the respective postimages. E.g. <i1,chg1> is
36 * how side #1 wants to change the common ancestor; if there is no
37 * overlap, lines before i1 in the postimage of side #1 appear
38 * in the merge result as a region touched by neither side.
43 * These point at the preimage; of course there is just one
44 * preimage, that is from the shared common ancestor.
/*
 * Records one change in the list reached through *merge.
 *
 * If *merge is non-NULL and the new range starts at or before the end of
 * that entry on either side (i1 <= m->i1 + m->chg1, or the same test for
 * i2/chg2), the existing entry is widened: chg0, chg1 and chg2 are
 * recomputed so the entry ends where the new range ends.
 * Otherwise a node is obtained from xdl_malloc.
 *
 * NOTE(review): the declarations of i0, chg0, i1, chg1, i2, chg2, any use of
 * mode, the else keyword, the initialization of the new node and the return
 * statements are not present in this copy. Callers in this file treat a
 * nonzero return as failure.
 */
50 static int xdl_append_merge(xdmerge_t
**merge
, int mode
,
55 xdmerge_t
*m
= *merge
;
/* Overlap or adjacency test against the current entry, on either side. */
56 if (m
&& (i1
<= m
->i1
+ m
->chg1
|| i2
<= m
->i2
+ m
->chg2
)) {
/* Extend the existing entry so that it covers the new range as well. */
59 m
->chg0
= i0
+ chg0
- m
->i0
;
60 m
->chg1
= i1
+ chg1
- m
->i1
;
61 m
->chg2
= i2
+ chg2
- m
->i2
;
/* No overlap: a fresh node is allocated. */
63 m
= xdl_malloc(sizeof(xdmerge_t
));
/*
 * Walks the list that starts at c; each iteration continues with next_c.
 * xdl_do_merge calls this on its error paths and returns its result on the
 * normal path.
 * NOTE(review): the loop body, the declaration of next_c and the return are
 * not present in this copy. Given the comment below it presumably counts
 * conflicts and releases the nodes -- TODO confirm.
 */
81 static int xdl_cleanup_merge(xdmerge_t
*c
)
86 /* were there conflicts? */
87 for (; c
; c
= next_c
) {
/*
 * Compares line_count consecutive records taken from xe1->xdf2.recs starting
 * at index i1 with the records taken from xe2->xdf2.recs starting at index
 * i2. Each pair is passed to xdl_recmatch together with flags.
 * NOTE(review): the declaration of i, the handling of result and the return
 * statements are not present in this copy; xdl_do_merge uses the return
 * value as a truth value inside a condition.
 */
96 static int xdl_merge_cmp_lines(xdfenv_t
*xe1
, int i1
, xdfenv_t
*xe2
, int i2
,
97 int line_count
, long flags
)
/* rec1 and rec2 point at the first record to compare on each side. */
100 xrecord_t
**rec1
= xe1
->xdf2
.recs
+ i1
;
101 xrecord_t
**rec2
= xe2
->xdf2
.recs
+ i2
;
103 for (i
= 0; i
< line_count
; i
++) {
104 int result
= xdl_recmatch(rec1
[i
]->ptr
, rec1
[i
]->size
,
105 rec2
[i
]->ptr
, rec2
[i
]->size
, flags
);
/*
 * Shared worker behind xdl_recs_copy and xdl_orig_copy.
 *
 * Selects xe->xdf1.recs when use_orig is nonzero and xe->xdf2.recs
 * otherwise, then works on count records starting at index i. The loop adds
 * each record size to size and copies the record bytes to dest + size.
 * After the loop the last record is inspected: the visible test is true when
 * that record is empty or does not end in a newline character.
 *
 * NOTE(review): callers pass NULL for dest when only measuring, so a guard
 * around the memcpy presumably exists on a line that is missing here. The
 * use of needs_cr and add_nl, the declarations of recs and size, and the
 * return are likewise not present in this copy.
 */
112 static int xdl_recs_copy_0(int use_orig
, xdfenv_t
*xe
, int i
, int count
, int needs_cr
, int add_nl
, char *dest
)
117 recs
= (use_orig
? xe
->xdf1
.recs
: xe
->xdf2
.recs
) + i
;
/* i is reused as the loop counter; size accumulates the bytes seen so far. */
122 for (i
= 0; i
< count
; size
+= recs
[i
++]->size
)
124 memcpy(dest
+ size
, recs
[i
]->ptr
, recs
[i
]->size
);
/* i now holds the byte length of the last record. */
126 i
= recs
[count
- 1]->size
;
127 if (i
== 0 || recs
[count
- 1]->ptr
[i
- 1] != '\n') {
142 static int xdl_recs_copy(xdfenv_t
*xe
, int i
, int count
, int needs_cr
, int add_nl
, char *dest
)
144 return xdl_recs_copy_0(0, xe
, i
, count
, needs_cr
, add_nl
, dest
);
147 static int xdl_orig_copy(xdfenv_t
*xe
, int i
, int count
, int needs_cr
, int add_nl
, char *dest
)
149 return xdl_recs_copy_0(1, xe
, i
, count
, needs_cr
, add_nl
, dest
);
153 * Returns 1 if the i'th line ends in CR/LF (if it is the last line and
154 * has no eol, the preceding line, if any), 0 if it ends in LF-only, and
155 * -1 if the line ending cannot be determined.
/*
 * Inspects the end of record i of file to classify its line ending.
 *
 * For any record before the last one (i < file->nrec - 1) the result is true
 * when the record is longer than one byte and the byte before the final one
 * is a carriage return. For the last record the visible code first checks
 * whether it ends in a newline, and otherwise falls back to the same
 * carriage-return test on record i - 1.
 *
 * NOTE(review): the declaration of size, the returns for the empty-file and
 * single-line cases, and the return keyword in front of the expression on
 * the fragment numbered 172 are not present in this copy.
 */
157 static int is_eol_crlf(xdfile_t
*file
, int i
)
161 if (i
< file
->nrec
- 1)
162 /* All lines before the last *must* end in LF */
163 return (size
= file
->recs
[i
]->size
) > 1 &&
164 file
->recs
[i
]->ptr
[size
- 2] == '\r';
166 /* Cannot determine eol style from empty file */
168 if ((size
= file
->recs
[i
]->size
) &&
169 file
->recs
[i
]->ptr
[size
- 1] == '\n')
170 /* Last line; ends in LF; Is it CR/LF? */
172 file
->recs
[i
]->ptr
[size
- 2] == '\r';
174 /* The only line has no eol */
176 /* Determine eol from second-to-last line */
177 return (size
= file
->recs
[i
- 1]->size
) > 1 &&
178 file
->recs
[i
- 1]->ptr
[size
- 2] == '\r';
/*
 * Decides whether generated lines for hunk m should carry a carriage return.
 *
 * Candidates are tried in this order: the record before m->i1 (or record 0)
 * in xe1->xdf2, the record before m->i2 (or record 0) in xe2->xdf2, and
 * record 0 of xe1->xdf1. A negative value left in needs_cr at the end is
 * mapped to 0; any other value is returned unchanged.
 *
 * NOTE(review): the declaration of needs_cr and the conditions that decide
 * whether the second and third probes run are not present in this copy.
 */
181 static int is_cr_needed(xdfenv_t
*xe1
, xdfenv_t
*xe2
, xdmerge_t
*m
)
185 /* Match post-images' preceding, or first, lines' end-of-line style */
186 needs_cr
= is_eol_crlf(&xe1
->xdf2
, m
->i1
? m
->i1
- 1 : 0);
188 needs_cr
= is_eol_crlf(&xe2
->xdf2
, m
->i2
? m
->i2
- 1 : 0);
189 /* Look at pre-image's first line, unless we already settled on LF */
191 needs_cr
= is_eol_crlf(&xe1
->xdf1
, 0);
192 /* If still undecided, use LF-only */
193 return needs_cr
< 0 ? 0 : needs_cr
;
/*
 * Emits (or measures) one conflict hunk for m, with size used as the running
 * output offset. Visible steps, in order:
 *   1. records of side 1 from index i up to m->i1 (text before the hunk);
 *   2. an opening marker of marker_size less-than characters, followed by
 *      name1 when it is non-NULL;
 *   3. the side 1 postimage (m->i1, m->chg1);
 *   4. only when style == XDL_MERGE_DIFF3: a marker of vertical bars,
 *      followed by name3 when non-NULL, then the preimage (m->i0, m->chg0)
 *      read through xdl_orig_copy;
 *   5. a separator marker of equals signs;
 *   6. the side 2 postimage (m->i2, m->chg2);
 *   7. a closing marker of greater-than characters, followed by name2 when
 *      it is non-NULL.
 * Each markerN_size is strlen(nameN) + 1, or 0 for a NULL name. A
 * marker_size <= 0 is replaced by DEFAULT_CONFLICT_MARKER_SIZE.
 *
 * NOTE(review): the declaration of name3, the branches that separate the
 * measuring case (dest == NULL) from the writing case, the writes of the
 * separator and end-of-line bytes, and the return are not present in this
 * copy.
 */
196 static int fill_conflict_hunk(xdfenv_t
*xe1
, const char *name1
,
197 xdfenv_t
*xe2
, const char *name2
,
199 int size
, int i
, int style
,
200 xdmerge_t
*m
, char *dest
, int marker_size
)
202 int marker1_size
= (name1
? strlen(name1
) + 1 : 0);
203 int marker2_size
= (name2
? strlen(name2
) + 1 : 0);
204 int marker3_size
= (name3
? strlen(name3
) + 1 : 0);
205 int needs_cr
= is_cr_needed(xe1
, xe2
, m
);
207 if (marker_size
<= 0)
208 marker_size
= DEFAULT_CONFLICT_MARKER_SIZE
;
210 /* Before conflicting part */
211 size
+= xdl_recs_copy(xe1
, i
, m
->i1
- i
, 0, 0,
212 dest
? dest
+ size
: NULL
);
/* Opening marker: marker bytes, one more byte, optional CR, optional name. */
215 size
+= marker_size
+ 1 + needs_cr
+ marker1_size
;
217 memset(dest
+ size
, '<', marker_size
);
221 memcpy(dest
+ size
+ 1, name1
, marker1_size
- 1);
222 size
+= marker1_size
;
229 /* Postimage from side #1 */
230 size
+= xdl_recs_copy(xe1
, m
->i1
, m
->chg1
, needs_cr
, 1,
231 dest
? dest
+ size
: NULL
);
233 if (style
== XDL_MERGE_DIFF3
) {
234 /* Shared preimage */
236 size
+= marker_size
+ 1 + needs_cr
+ marker3_size
;
238 memset(dest
+ size
, '|', marker_size
);
242 memcpy(dest
+ size
+ 1, name3
, marker3_size
- 1);
243 size
+= marker3_size
;
249 size
+= xdl_orig_copy(xe1
, m
->i0
, m
->chg0
, needs_cr
, 1,
250 dest
? dest
+ size
: NULL
);
/* Separator marker between the two sides; it carries no name. */
254 size
+= marker_size
+ 1 + needs_cr
;
256 memset(dest
+ size
, '=', marker_size
);
263 /* Postimage from side #2 */
264 size
+= xdl_recs_copy(xe2
, m
->i2
, m
->chg2
, needs_cr
, 1,
265 dest
? dest
+ size
: NULL
);
/* Closing marker, laid out like the opening one but labelled with name2. */
267 size
+= marker_size
+ 1 + needs_cr
+ marker2_size
;
269 memset(dest
+ size
, '>', marker_size
);
273 memcpy(dest
+ size
+ 1, name2
, marker2_size
- 1);
274 size
+= marker2_size
;
/*
 * Renders the hunk list m into dest, or only measures it when dest is NULL
 * (every copy call passes NULL in that case). size is the running output
 * offset and starts at 0 together with i.
 *
 * Per hunk the visible code does one of:
 *   - call fill_conflict_hunk and take its return value as the new size;
 *   - for hunks with (m->mode & 3) nonzero: copy side 1 records from i up to
 *     m->i1, then the side 1 postimage and the side 2 postimage.
 * After the loop the remaining side 1 records from i to xe1->xdf2.nrec are
 * copied.
 *
 * NOTE(review): the declarations of favor, marker_size, size and i, the
 * statement controlled by the favor test, the individual mode-bit tests
 * around the two postimage copies, the update of i and the return are not
 * present in this copy.
 */
283 static int xdl_fill_merge_buffer(xdfenv_t
*xe1
, const char *name1
,
284 xdfenv_t
*xe2
, const char *name2
,
285 const char *ancestor_name
,
287 xdmerge_t
*m
, char *dest
, int style
,
292 for (size
= i
= 0; m
; m
= m
->next
) {
/* Applies when a favor setting is given and the hunk has mode 0. */
293 if (favor
&& !m
->mode
)
297 size
= fill_conflict_hunk(xe1
, name1
, xe2
, name2
,
299 size
, i
, style
, m
, dest
,
301 else if (m
->mode
& 3) {
302 /* Before conflicting part */
303 size
+= xdl_recs_copy(xe1
, i
, m
->i1
- i
, 0, 0,
304 dest
? dest
+ size
: NULL
);
305 /* Postimage from side #1 */
307 int needs_cr
= is_cr_needed(xe1
, xe2
, m
);
/* add_nl is set for the side 1 copy only when mode bit 2 is also set. */
309 size
+= xdl_recs_copy(xe1
, m
->i1
, m
->chg1
, needs_cr
, (m
->mode
& 2),
310 dest
? dest
+ size
: NULL
);
312 /* Postimage from side #2 */
314 size
+= xdl_recs_copy(xe2
, m
->i2
, m
->chg2
, 0, 0,
315 dest
? dest
+ size
: NULL
);
/* Tail: everything on side 1 after the last hunk. */
320 size
+= xdl_recs_copy(xe1
, i
, xe1
->xdf2
.nrec
- i
, 0, 0,
321 dest
? dest
+ size
: NULL
);
326 * Sometimes, changes are not quite identical, but differ in only a few
327 * lines. Try hard to show only these few lines as conflicting.
/*
 * For each entry of the list m, diffs the side 1 postimage text of the hunk
 * against the side 2 postimage text and uses the resulting edit script to
 * narrow the hunk.
 *
 * t1 and t2 are set up to span from the first byte of the first record of
 * the hunk to the end of its last record on each side. After xdl_do_diff,
 * two xdl_change_compact passes and xdl_build_script, the entry is rewritten
 * from the script: i1/i2 become the script offsets plus the original hunk
 * start, chg1/chg2 are taken from the script. A second node m2 is allocated
 * with xdl_malloc for further script entries.
 *
 * NOTE(review): the declarations of t1, t2 and xe, the filter that skips
 * non-conflict entries, all error returns and cleanup, the loop over the
 * script and the linking of m2 are not present in this copy. The span
 * computation assumes the records of a hunk are contiguous in memory, as the
 * comment fragment below warns.
 */
329 static int xdl_refine_conflicts(xdfenv_t
*xe1
, xdfenv_t
*xe2
, xdmerge_t
*m
,
330 xpparam_t
const *xpp
)
332 for (; m
; m
= m
->next
) {
335 xdchange_t
*xscr
, *x
;
/* Remember the hunk start; script offsets are relative to it. */
336 int i1
= m
->i1
, i2
= m
->i2
;
338 /* let's handle just the conflicts */
342 /* no sense refining a conflict when one side is empty */
343 if (m
->chg1
== 0 || m
->chg2
== 0)
347 * This probably does not work outside git, since
348 * we have a very simple mmfile structure.
350 t1
.ptr
= (char *)xe1
->xdf2
.recs
[m
->i1
]->ptr
;
351 t1
.size
= xe1
->xdf2
.recs
[m
->i1
+ m
->chg1
- 1]->ptr
352 + xe1
->xdf2
.recs
[m
->i1
+ m
->chg1
- 1]->size
- t1
.ptr
;
353 t2
.ptr
= (char *)xe2
->xdf2
.recs
[m
->i2
]->ptr
;
354 t2
.size
= xe2
->xdf2
.recs
[m
->i2
+ m
->chg2
- 1]->ptr
355 + xe2
->xdf2
.recs
[m
->i2
+ m
->chg2
- 1]->size
- t2
.ptr
;
356 if (xdl_do_diff(&t1
, &t2
, xpp
, &xe
) < 0)
358 if (xdl_change_compact(&xe
.xdf1
, &xe
.xdf2
, xpp
->flags
) < 0 ||
359 xdl_change_compact(&xe
.xdf2
, &xe
.xdf1
, xpp
->flags
) < 0 ||
360 xdl_build_script(&xe
, &xscr
) < 0) {
365 /* If this happens, the changes are identical. */
371 m
->i1
= xscr
->i1
+ i1
;
372 m
->chg1
= xscr
->chg1
;
373 m
->i2
= xscr
->i2
+ i2
;
374 m
->chg2
= xscr
->chg2
;
376 xdmerge_t
*m2
= xdl_malloc(sizeof(xdmerge_t
));
387 m
->i1
= xscr
->i1
+ i1
;
388 m
->chg1
= xscr
->chg1
;
389 m
->i2
= xscr
->i2
+ i2
;
390 m
->chg2
= xscr
->chg2
;
/*
 * Tests bytes starting at ptr with isalnum; each byte is converted to
 * unsigned char first, which keeps the isalnum argument in its valid range.
 * NOTE(review): the loop over size and both return statements are not
 * present in this copy; lines_contain_alnum uses the result as a truth
 * value.
 */
398 static int line_contains_alnum(const char *ptr
, long size
)
401 if (isalnum((unsigned char)*(ptr
++)))
/*
 * Runs line_contains_alnum over chg consecutive records of xe->xdf2.recs,
 * starting at index i. chg counts down while i counts up.
 * NOTE(review): the statements executed when a record matches and after the
 * loop are not present in this copy; xdl_simplify_non_conflicts uses the
 * result as a truth value.
 */
406 static int lines_contain_alnum(xdfenv_t
*xe
, int i
, int chg
)
408 for (; chg
; chg
--, i
++)
409 if (line_contains_alnum(xe
->xdf2
.recs
[i
]->ptr
,
410 xe
->xdf2
.recs
[i
]->size
))
416 * This function merges m and m->next, marking everything between those hunks
417 * as conflicting, too.
/*
 * Folds m->next into m: chg1 and chg2 of m are stretched so that m ends
 * where the next entry ends on each side, and m->next is then unlinked from
 * the list by pointing m->next at its successor.
 * NOTE(review): m->next must be non-NULL on entry since it is dereferenced
 * unconditionally. The line numbered 425 is not present in this copy, so
 * whether the unlinked node is released here cannot be confirmed.
 */
419 static void xdl_merge_two_conflicts(xdmerge_t
*m
)
421 xdmerge_t
*next_m
= m
->next
;
422 m
->chg1
= next_m
->i1
+ next_m
->chg1
- m
->i1
;
423 m
->chg2
= next_m
->i2
+ next_m
->chg2
- m
->i2
;
424 m
->next
= next_m
->next
;
429 * If there are fewer than 3 non-conflicting lines between conflicts,
430 * it appears simpler -- because it takes up fewer (or as many) lines --
431 * if the lines are moved into the conflicts.
/*
 * Looks at m and its successor next_m and, depending on the visible test,
 * joins them with xdl_merge_two_conflicts.
 *
 * begin is the first side 1 line after m (m->i1 + m->chg1). The visible
 * condition is true when either entry has a nonzero mode, or when a further
 * sub-condition (partly missing) holds in which simplify_if_no_alnum being
 * zero, or lines_contain_alnum reporting a match between begin and end, is
 * one of the terms.
 *
 * NOTE(review): the surrounding loop, the declarations of begin and end, the
 * computation of end, the middle term of the condition, the statement the
 * condition controls and the return are not present in this copy.
 */
433 static int xdl_simplify_non_conflicts(xdfenv_t
*xe1
, xdmerge_t
*m
,
434 int simplify_if_no_alnum
)
441 xdmerge_t
*next_m
= m
->next
;
447 begin
= m
->i1
+ m
->chg1
;
450 if (m
->mode
!= 0 || next_m
->mode
!= 0 ||
452 (!simplify_if_no_alnum
||
453 lines_contain_alnum(xe1
, begin
, end
- begin
)))) {
457 xdl_merge_two_conflicts(m
);
463 * level == 0: mark all overlapping changes as conflict
464 * level == 1: mark overlapping changes as conflict only if not identical
465 * level == 2: analyze non-identical changes for minimal conflict set
466 * level == 3: analyze non-identical changes for minimal conflict set, but
467 * treat hunks not containing any letter or number as conflicting
469 * returns < 0 on error, == 0 for no conflicts, else number of conflicts
/*
 * Combines two edit scripts, xscr1 belonging to xe1 and xscr2 belonging to
 * xe2, into a list of hunks, and renders the merged text into result.
 *
 * Visible outline:
 *   - level, style and favor are read from xmp; for XDL_MERGE_DIFF3 style
 *     the level is capped at XDL_MERGE_EAGER.
 *   - While both scripts have entries: an xscr1 entry ending before the
 *     xscr2 entry starts is appended with mode 1; the mirrored case is
 *     appended with mode 2; otherwise, when level is XDL_MERGE_MINIMAL or
 *     the two entries differ in position, length or content, a hunk is
 *     appended with mode 0.
 *   - Further appends with mode 1 and mode 2 follow, mapping indices to the
 *     other side through the difference of its record counts.
 *   - From level XDL_MERGE_ZEALOUS upward, xdl_refine_conflicts and
 *     xdl_simplify_non_conflicts run on the list.
 *   - xdl_fill_merge_buffer is called once with a NULL destination to obtain
 *     the size, result->ptr is allocated with xdl_malloc(size), and a second
 *     call fills it.
 *   - The return value is that of xdl_cleanup_merge(changes).
 * Every failed xdl_append_merge is followed by xdl_cleanup_merge(changes).
 *
 * NOTE(review): many lines are missing from this copy, among them the
 * initialization of changes and c, most assignments to i0/chg0/chg1/chg2,
 * the advancing of xscr1 and xscr2, the loops around the trailing appends,
 * the use of off and ffo, the check of the xdl_malloc result and the error
 * returns. Statement order matters here, so nothing is restructured.
 */
471 static int xdl_do_merge(xdfenv_t
*xe1
, xdchange_t
*xscr1
,
472 xdfenv_t
*xe2
, xdchange_t
*xscr2
,
473 xmparam_t
const *xmp
, mmbuffer_t
*result
)
475 xdmerge_t
*changes
, *c
;
476 xpparam_t
const *xpp
= &xmp
->xpp
;
477 const char *const ancestor_name
= xmp
->ancestor
;
478 const char *const name1
= xmp
->file1
;
479 const char *const name2
= xmp
->file2
;
480 int i0
, i1
, i2
, chg0
, chg1
, chg2
;
481 int level
= xmp
->level
;
482 int style
= xmp
->style
;
483 int favor
= xmp
->favor
;
485 if (style
== XDL_MERGE_DIFF3
) {
487 * "diff3 -m" output does not make sense for anything
488 * more aggressive than XDL_MERGE_EAGER.
490 if (XDL_MERGE_EAGER
< level
)
491 level
= XDL_MERGE_EAGER
;
496 while (xscr1
&& xscr2
) {
/* Case: the side 1 change ends before the side 2 change begins. */
499 if (xscr1
->i1
+ xscr1
->chg1
< xscr2
->i1
) {
502 i2
= xscr2
->i2
- xscr2
->i1
+ xscr1
->i1
;
506 if (xdl_append_merge(&c
, 1,
507 i0
, chg0
, i1
, chg1
, i2
, chg2
)) {
508 xdl_cleanup_merge(changes
);
/* Case: the side 2 change ends before the side 1 change begins. */
514 if (xscr2
->i1
+ xscr2
->chg1
< xscr1
->i1
) {
516 i1
= xscr1
->i2
- xscr1
->i1
+ xscr2
->i1
;
521 if (xdl_append_merge(&c
, 2,
522 i0
, chg0
, i1
, chg1
, i2
, chg2
)) {
523 xdl_cleanup_merge(changes
);
/* Overlapping changes: a mode 0 hunk unless both sides made the same change. */
529 if (level
== XDL_MERGE_MINIMAL
|| xscr1
->i1
!= xscr2
->i1
||
530 xscr1
->chg1
!= xscr2
->chg1
||
531 xscr1
->chg2
!= xscr2
->chg2
||
532 xdl_merge_cmp_lines(xe1
, xscr1
->i2
,
534 xscr1
->chg2
, xpp
->flags
)) {
536 int off
= xscr1
->i1
- xscr2
->i1
;
537 int ffo
= off
+ xscr1
->chg1
- xscr2
->chg1
;
548 chg0
= xscr1
->i1
+ xscr1
->chg1
- i0
;
549 chg1
= xscr1
->i2
+ xscr1
->chg2
- i1
;
550 chg2
= xscr2
->i2
+ xscr2
->chg2
- i2
;
556 if (xdl_append_merge(&c
, 0,
557 i0
, chg0
, i1
, chg1
, i2
, chg2
)) {
558 xdl_cleanup_merge(changes
);
563 i1
= xscr1
->i1
+ xscr1
->chg1
;
564 i2
= xscr2
->i1
+ xscr2
->chg1
;
/* Side 1 only entry: the side 2 index is derived from the record count difference of xe2. */
576 i2
= xscr1
->i1
+ xe2
->xdf2
.nrec
- xe2
->xdf1
.nrec
;
580 if (xdl_append_merge(&c
, 1,
581 i0
, chg0
, i1
, chg1
, i2
, chg2
)) {
582 xdl_cleanup_merge(changes
);
/* Side 2 only entry: the side 1 index is derived from the record count difference of xe1. */
591 i1
= xscr2
->i1
+ xe1
->xdf2
.nrec
- xe1
->xdf1
.nrec
;
596 if (xdl_append_merge(&c
, 2,
597 i0
, chg0
, i1
, chg1
, i2
, chg2
)) {
598 xdl_cleanup_merge(changes
);
605 /* refine conflicts */
606 if (XDL_MERGE_ZEALOUS
<= level
&&
607 (xdl_refine_conflicts(xe1
, xe2
, changes
, xpp
) < 0 ||
608 xdl_simplify_non_conflicts(xe1
, changes
,
609 XDL_MERGE_ZEALOUS
< level
) < 0)) {
610 xdl_cleanup_merge(changes
);
615 int marker_size
= xmp
->marker_size
;
/* First pass with a NULL destination only computes the output size. */
616 int size
= xdl_fill_merge_buffer(xe1
, name1
, xe2
, name2
,
618 favor
, changes
, NULL
, style
,
620 result
->ptr
= xdl_malloc(size
);
622 xdl_cleanup_merge(changes
);
/* Second pass writes the merged text into the allocated buffer. */
626 xdl_fill_merge_buffer(xe1
, name1
, xe2
, name2
,
627 ancestor_name
, favor
, changes
,
628 result
->ptr
, style
, marker_size
);
630 return xdl_cleanup_merge(changes
);
/*
 * Non-static entry point of this file.
 *
 * Visible outline: orig is diffed against mf1 into xe1 and against mf2 into
 * xe2 with xdl_do_diff. Each environment goes through two
 * xdl_change_compact passes and xdl_build_script, producing xscr1 and xscr2;
 * if the second group fails, xscr1 is released with xdl_free_script. The
 * result is then produced in one of three ways: a byte copy of mf2, a byte
 * copy of mf1, or a call to xdl_do_merge whose return value is stored in
 * status. Both scripts are released with xdl_free_script at the end.
 *
 * NOTE(review): the declarations of xe1, xe2 and status, the conditions that
 * select between the three result paths, the remaining error handling, the
 * release of xe1 and xe2 and the return are not present in this copy. In the
 * visible lines the pointer returned by xdl_malloc is handed to memcpy
 * directly -- confirm whether xdl_malloc can return NULL in this build.
 */
633 int xdl_merge(mmfile_t
*orig
, mmfile_t
*mf1
, mmfile_t
*mf2
,
634 xmparam_t
const *xmp
, mmbuffer_t
*result
)
636 xdchange_t
*xscr1
, *xscr2
;
639 xpparam_t
const *xpp
= &xmp
->xpp
;
644 if (xdl_do_diff(orig
, mf1
, xpp
, &xe1
) < 0) {
647 if (xdl_do_diff(orig
, mf2
, xpp
, &xe2
) < 0) {
651 if (xdl_change_compact(&xe1
.xdf1
, &xe1
.xdf2
, xpp
->flags
) < 0 ||
652 xdl_change_compact(&xe1
.xdf2
, &xe1
.xdf1
, xpp
->flags
) < 0 ||
653 xdl_build_script(&xe1
, &xscr1
) < 0) {
657 if (xdl_change_compact(&xe2
.xdf1
, &xe2
.xdf2
, xpp
->flags
) < 0 ||
658 xdl_change_compact(&xe2
.xdf2
, &xe2
.xdf1
, xpp
->flags
) < 0 ||
659 xdl_build_script(&xe2
, &xscr2
) < 0) {
660 xdl_free_script(xscr1
);
/* Result path: the output is a verbatim copy of mf2. */
667 result
->ptr
= xdl_malloc(mf2
->size
);
668 memcpy(result
->ptr
, mf2
->ptr
, mf2
->size
);
669 result
->size
= mf2
->size
;
/* Result path: the output is a verbatim copy of mf1. */
671 result
->ptr
= xdl_malloc(mf1
->size
);
672 memcpy(result
->ptr
, mf1
->ptr
, mf1
->size
);
673 result
->size
= mf1
->size
;
/* Result path: a real three-way merge. */
675 status
= xdl_do_merge(&xe1
, xscr1
,
679 xdl_free_script(xscr1
);
680 xdl_free_script(xscr2
);