7 #include "xdiff-interface.h"
10 static int uninteresting(struct diff_filepair
*p
)
12 if (diff_unmodified_pair(p
))
17 static struct combine_diff_path
*intersect_paths(struct combine_diff_path
*curr
, int n
, int num_parent
)
19 struct diff_queue_struct
*q
= &diff_queued_diff
;
20 struct combine_diff_path
*p
;
24 struct combine_diff_path
*list
= NULL
, **tail
= &list
;
25 for (i
= 0; i
< q
->nr
; i
++) {
28 if (uninteresting(q
->queue
[i
]))
30 path
= q
->queue
[i
]->two
->path
;
32 p
= xmalloc(combine_diff_path_size(num_parent
, len
));
33 p
->path
= (char*) &(p
->parent
[num_parent
]);
34 memcpy(p
->path
, path
, len
);
39 sizeof(p
->parent
[0]) * num_parent
);
41 memcpy(p
->sha1
, q
->queue
[i
]->two
->sha1
, 20);
42 p
->mode
= q
->queue
[i
]->two
->mode
;
43 memcpy(p
->parent
[n
].sha1
, q
->queue
[i
]->one
->sha1
, 20);
44 p
->parent
[n
].mode
= q
->queue
[i
]->one
->mode
;
45 p
->parent
[n
].status
= q
->queue
[i
]->status
;
52 for (p
= curr
; p
; p
= p
->next
) {
56 for (i
= 0; i
< q
->nr
; i
++) {
60 if (uninteresting(q
->queue
[i
]))
62 path
= q
->queue
[i
]->two
->path
;
64 if (len
== p
->len
&& !memcmp(path
, p
->path
, len
)) {
66 memcpy(p
->parent
[n
].sha1
,
67 q
->queue
[i
]->one
->sha1
, 20);
68 p
->parent
[n
].mode
= q
->queue
[i
]->one
->mode
;
69 p
->parent
[n
].status
= q
->queue
[i
]->status
;
79 /* Lines lost from parent */
83 unsigned long parent_map
;
84 char line
[FLEX_ARRAY
];
87 /* Lines surviving in the merge result */
89 struct lline
*lost_head
, **lost_tail
;
92 /* bit 0 up to (N-1) are on if the parent has this line (i.e.
93 * we did not change it).
94 * bit N is used for "interesting" lines, including context.
100 static char *grab_blob(const unsigned char *sha1
, unsigned long *size
)
104 if (!memcmp(sha1
, null_sha1
, 20)) {
107 return xcalloc(1, 1);
109 blob
= read_sha1_file(sha1
, type
, size
);
110 if (strcmp(type
, blob_type
))
111 die("object '%s' is not a blob!", sha1_to_hex(sha1
));
115 static void append_lost(struct sline
*sline
, int n
, const char *line
, int len
)
118 unsigned long this_mask
= (1UL<<n
);
119 if (line
[len
-1] == '\n')
122 /* Check to see if we can squash things */
123 if (sline
->lost_head
) {
124 struct lline
*last_one
= NULL
;
125 /* We cannot squash it with earlier one */
126 for (lline
= sline
->lost_head
;
129 if (lline
->parent_map
& this_mask
)
131 lline
= last_one
? last_one
->next
: sline
->lost_head
;
133 if (lline
->len
== len
&&
134 !memcmp(lline
->line
, line
, len
)) {
135 lline
->parent_map
|= this_mask
;
142 lline
= xmalloc(sizeof(*lline
) + len
+ 1);
145 lline
->parent_map
= this_mask
;
146 memcpy(lline
->line
, line
, len
);
147 lline
->line
[len
] = 0;
148 *sline
->lost_tail
= lline
;
149 sline
->lost_tail
= &lline
->next
;
152 struct combine_diff_state
{
153 struct xdiff_emit_state xm
;
161 struct sline
*lost_bucket
;
164 static void consume_line(void *state_
, char *line
, unsigned long len
)
166 struct combine_diff_state
*state
= state_
;
167 if (5 < len
&& !memcmp("@@ -", line
, 4)) {
168 if (parse_hunk_header(line
, len
,
169 &state
->ob
, &state
->on
,
170 &state
->nb
, &state
->nn
))
172 state
->lno
= state
->nb
;
174 /* @@ -1,2 +0,0 @@ to remove the
179 /* @@ -X,Y +N,0 @@ removed Y lines
180 * that would have come *after* line N
181 * in the result. Our lost buckets hang
182 * to the line after the removed lines,
184 state
->lost_bucket
= &state
->sline
[state
->nb
];
186 state
->lost_bucket
= &state
->sline
[state
->nb
-1];
187 if (!state
->sline
[state
->nb
-1].p_lno
)
188 state
->sline
[state
->nb
-1].p_lno
=
189 xcalloc(state
->num_parent
,
190 sizeof(unsigned long));
191 state
->sline
[state
->nb
-1].p_lno
[state
->n
] = state
->ob
;
194 if (!state
->lost_bucket
)
195 return; /* not in any hunk yet */
198 append_lost(state
->lost_bucket
, state
->n
, line
+1, len
-1);
201 state
->sline
[state
->lno
-1].flag
|= state
->nmask
;
207 static void combine_diff(const unsigned char *parent
, mmfile_t
*result_file
,
208 struct sline
*sline
, int cnt
, int n
, int num_parent
)
210 unsigned int p_lno
, lno
;
211 unsigned long nmask
= (1UL << n
);
214 mmfile_t parent_file
;
216 struct combine_diff_state state
;
220 return; /* result deleted */
222 parent_file
.ptr
= grab_blob(parent
, &sz
);
223 parent_file
.size
= sz
;
224 xpp
.flags
= XDF_NEED_MINIMAL
;
227 ecb
.outf
= xdiff_outf
;
229 memset(&state
, 0, sizeof(state
));
230 state
.xm
.consume
= consume_line
;
234 state
.num_parent
= num_parent
;
237 xdl_diff(&parent_file
, result_file
, &xpp
, &xecfg
, &ecb
);
238 free(parent_file
.ptr
);
240 /* Assign line numbers for this parent.
242 * sline[lno].p_lno[n] records the first line number
243 * (counting from 1) for parent N if the final hunk display
244 * started by showing sline[lno] (possibly showing the lost
245 * lines attached to it first).
247 for (lno
= 0, p_lno
= 1; lno
<= cnt
; lno
++) {
249 sline
[lno
].p_lno
[n
] = p_lno
;
251 /* How many lines would this sline advance the p_lno? */
252 ll
= sline
[lno
].lost_head
;
254 if (ll
->parent_map
& nmask
)
255 p_lno
++; /* '-' means parent had it */
258 if (lno
< cnt
&& !(sline
[lno
].flag
& nmask
))
259 p_lno
++; /* no '+' means parent had it */
261 sline
[lno
].p_lno
[n
] = p_lno
; /* trailer */
264 static unsigned long context
= 3;
265 static char combine_marker
= '@';
267 static int interesting(struct sline
*sline
, unsigned long all_mask
)
269 /* If some parents lost lines here, or if we have added to
270 * some parent, it is interesting.
272 return ((sline
->flag
& all_mask
) || sline
->lost_head
);
275 static unsigned long adjust_hunk_tail(struct sline
*sline
,
276 unsigned long all_mask
,
277 unsigned long hunk_begin
,
280 /* i points at the first uninteresting line. If the last line
281 * of the hunk was interesting only because it has some
282 * deletion, then it is not all that interesting for the
283 * purpose of giving trailing context lines. This is because
284 * we output '-' line and then unmodified sline[i-1] itself in
285 * that case which gives us one extra context line.
287 if ((hunk_begin
+ 1 <= i
) && !(sline
[i
-1].flag
& all_mask
))
292 static unsigned long find_next(struct sline
*sline
,
298 /* We have examined up to i-1 and are about to look at i.
299 * Find next interesting or uninteresting line. Here,
300 * "interesting" does not mean interesting(), but marked by
301 * the give_context() function below (i.e. it includes context
302 * lines that are not interesting to interesting() function
303 * that are surrounded by interesting() ones).
307 ? !(sline
[i
].flag
& mark
)
308 : (sline
[i
].flag
& mark
))
315 static int give_context(struct sline
*sline
, unsigned long cnt
, int num_parent
)
317 unsigned long all_mask
= (1UL<<num_parent
) - 1;
318 unsigned long mark
= (1UL<<num_parent
);
321 /* Two groups of interesting lines may have a short gap of
322 * uninteresting lines. Connect such groups to give them a
325 * We first start from what the interesting() function says,
326 * and mark them with "mark", and paint context lines with the
327 * mark. So interesting() would still say false for such context
328 * lines but they are treated as "interesting" in the end.
330 i
= find_next(sline
, mark
, 0, cnt
, 0);
335 unsigned long j
= (context
< i
) ? (i
- context
) : 0;
338 /* Paint a few lines before the first interesting line. */
340 sline
[j
++].flag
|= mark
;
343 /* we know up to i is to be included. where does the
344 * next uninteresting one start?
346 j
= find_next(sline
, mark
, i
, cnt
, 1);
348 break; /* the rest are all interesting */
350 /* lookahead context lines */
351 k
= find_next(sline
, mark
, j
, cnt
, 0);
352 j
= adjust_hunk_tail(sline
, all_mask
, i
, j
);
354 if (k
< j
+ context
) {
355 /* k is interesting and [j,k) are not, but
356 * paint them interesting because the gap is small.
359 sline
[j
++].flag
|= mark
;
364 /* j is the first uninteresting line and there is
365 * no overlap beyond it within context lines. Paint
366 * the trailing edge a bit.
369 k
= (j
+ context
< cnt
+1) ? j
+ context
: cnt
+1;
371 sline
[j
++].flag
|= mark
;
376 static int make_hunks(struct sline
*sline
, unsigned long cnt
,
377 int num_parent
, int dense
)
379 unsigned long all_mask
= (1UL<<num_parent
) - 1;
380 unsigned long mark
= (1UL<<num_parent
);
382 int has_interesting
= 0;
384 for (i
= 0; i
<= cnt
; i
++) {
385 if (interesting(&sline
[i
], all_mask
))
386 sline
[i
].flag
|= mark
;
388 sline
[i
].flag
&= ~mark
;
391 return give_context(sline
, cnt
, num_parent
);
393 /* Look at each hunk, and if we have changes from only one
394 * parent, or the changes are the same from all but one
395 * parent, mark that uninteresting.
399 unsigned long j
, hunk_begin
, hunk_end
;
400 unsigned long same_diff
;
401 while (i
<= cnt
&& !(sline
[i
].flag
& mark
))
404 break; /* No more interesting hunks */
406 for (j
= i
+ 1; j
<= cnt
; j
++) {
407 if (!(sline
[j
].flag
& mark
)) {
408 /* Look beyond the end to see if there
409 * is an interesting line after this
410 * hunk within context span.
412 unsigned long la
; /* lookahead */
414 la
= adjust_hunk_tail(sline
, all_mask
,
416 la
= (la
+ context
< cnt
+ 1) ?
417 (la
+ context
) : cnt
+ 1;
419 if (sline
[la
].flag
& mark
) {
431 /* [i..hunk_end) are interesting. Now is it really
432 * interesting? We check if there are only two versions
433 * and the result matches one of them. That is, we look
435 * (+) line, which records lines added to which parents;
436 * this line appears in the result.
437 * (-) line, which records from what parents the line
438 * was removed; this line does not appear in the result.
439 * then check the set of parents the result has difference
440 * from, from all lines. If there are lines that have
441 * different set of parents that the result has differences
442 * from, that means we have more than two versions.
444 * Even when we have only two versions, if the result does
445 * not match any of the parents, then it should be considered
446 * interesting. In such a case, we would have all '+' line.
447 * After passing the above "two versions" test, that would
448 * appear as "the same set of parents" to be "all parents".
452 for (j
= i
; j
< hunk_end
&& !has_interesting
; j
++) {
453 unsigned long this_diff
= sline
[j
].flag
& all_mask
;
454 struct lline
*ll
= sline
[j
].lost_head
;
456 /* This has some changes. Is it the
460 same_diff
= this_diff
;
461 else if (same_diff
!= this_diff
) {
466 while (ll
&& !has_interesting
) {
467 /* Lost this line from these parents;
468 * who are they? Are they the same?
470 this_diff
= ll
->parent_map
;
472 same_diff
= this_diff
;
473 else if (same_diff
!= this_diff
) {
480 if (!has_interesting
&& same_diff
!= all_mask
) {
481 /* This hunk is not that interesting after all */
482 for (j
= hunk_begin
; j
< hunk_end
; j
++)
483 sline
[j
].flag
&= ~mark
;
488 has_interesting
= give_context(sline
, cnt
, num_parent
);
489 return has_interesting
;
492 static void show_parent_lno(struct sline
*sline
, unsigned long l0
, unsigned long l1
, unsigned long cnt
, int n
)
494 l0
= sline
[l0
].p_lno
[n
];
495 l1
= sline
[l1
].p_lno
[n
];
496 printf(" -%lu,%lu", l0
, l1
-l0
);
499 static void dump_sline(struct sline
*sline
, unsigned long cnt
, int num_parent
)
501 unsigned long mark
= (1UL<<num_parent
);
503 unsigned long lno
= 0;
506 return; /* result deleted */
509 struct sline
*sl
= &sline
[lno
];
510 unsigned long hunk_end
;
511 unsigned long rlines
;
512 while (lno
<= cnt
&& !(sline
[lno
].flag
& mark
))
517 for (hunk_end
= lno
+ 1; hunk_end
<= cnt
; hunk_end
++)
518 if (!(sline
[hunk_end
].flag
& mark
))
521 rlines
= hunk_end
- lno
;
523 rlines
--; /* pointing at the last delete hunk */
524 for (i
= 0; i
<= num_parent
; i
++) putchar(combine_marker
);
525 for (i
= 0; i
< num_parent
; i
++)
526 show_parent_lno(sline
, lno
, hunk_end
, cnt
, i
);
527 printf(" +%lu,%lu ", lno
+1, rlines
);
528 for (i
= 0; i
<= num_parent
; i
++) putchar(combine_marker
);
530 while (lno
< hunk_end
) {
533 unsigned long p_mask
;
537 for (j
= 0; j
< num_parent
; j
++) {
538 if (ll
->parent_map
& (1UL<<j
))
549 for (j
= 0; j
< num_parent
; j
++) {
550 if (p_mask
& sl
->flag
)
556 printf("%.*s\n", sl
->len
, sl
->bol
);
561 static void reuse_combine_diff(struct sline
*sline
, unsigned long cnt
,
564 /* We have already examined parent j and we know parent i
565 * and parent j are the same, so reuse the combined result
566 * of parent j for parent i.
568 unsigned long lno
, imask
, jmask
;
572 for (lno
= 0; lno
<= cnt
; lno
++) {
573 struct lline
*ll
= sline
->lost_head
;
574 sline
->p_lno
[i
] = sline
->p_lno
[j
];
576 if (ll
->parent_map
& jmask
)
577 ll
->parent_map
|= imask
;
580 if (sline
->flag
& jmask
)
581 sline
->flag
|= imask
;
584 /* the overall size of the file (sline[cnt]) */
585 sline
->p_lno
[i
] = sline
->p_lno
[j
];
588 static int show_patch_diff(struct combine_diff_path
*elem
, int num_parent
,
589 int dense
, struct rev_info
*rev
)
591 struct diff_options
*opt
= &rev
->diffopt
;
592 unsigned long result_size
, cnt
, lno
;
593 char *result
, *cp
, *ep
;
594 struct sline
*sline
; /* survived lines */
595 int mode_differs
= 0;
596 int i
, show_hunks
, shown_header
= 0;
597 int working_tree_file
= !memcmp(elem
->sha1
, null_sha1
, 20);
598 int abbrev
= opt
->full_index
? 40 : DEFAULT_ABBREV
;
599 mmfile_t result_file
;
601 /* Read the result of merge first */
602 if (!working_tree_file
)
603 result
= grab_blob(elem
->sha1
, &result_size
);
605 /* Used by diff-tree to read from the working tree */
608 if (0 <= (fd
= open(elem
->path
, O_RDONLY
)) &&
610 int len
= st
.st_size
;
613 elem
->mode
= canon_mode(st
.st_mode
);
615 result
= xmalloc(len
+ 1);
617 int done
= xread(fd
, result
+cnt
, len
-cnt
);
621 die("read error '%s'", elem
->path
);
637 for (cnt
= 0, cp
= result
; cp
- result
< result_size
; cp
++) {
641 if (result_size
&& result
[result_size
-1] != '\n')
642 cnt
++; /* incomplete line */
644 sline
= xcalloc(cnt
+2, sizeof(*sline
));
646 sline
[0].bol
= result
;
647 for (lno
= 0; lno
<= cnt
+ 1; lno
++) {
648 sline
[lno
].lost_tail
= &sline
[lno
].lost_head
;
651 for (lno
= 0, cp
= result
; cp
- result
< result_size
; cp
++) {
653 sline
[lno
].len
= cp
- sline
[lno
].bol
;
656 sline
[lno
].bol
= cp
+ 1;
659 if (result_size
&& result
[result_size
-1] != '\n')
660 sline
[cnt
-1].len
= result_size
- (sline
[cnt
-1].bol
- result
);
662 result_file
.ptr
= result
;
663 result_file
.size
= result_size
;
665 /* Even p_lno[cnt+1] is valid -- that is for the end line number
666 * for deletion hunk at the end.
668 sline
[0].p_lno
= xcalloc((cnt
+2) * num_parent
, sizeof(unsigned long));
669 for (lno
= 0; lno
<= cnt
; lno
++)
670 sline
[lno
+1].p_lno
= sline
[lno
].p_lno
+ num_parent
;
672 for (i
= 0; i
< num_parent
; i
++) {
674 for (j
= 0; j
< i
; j
++) {
675 if (!memcmp(elem
->parent
[i
].sha1
,
676 elem
->parent
[j
].sha1
, 20)) {
677 reuse_combine_diff(sline
, cnt
, i
, j
);
682 combine_diff(elem
->parent
[i
].sha1
, &result_file
, sline
,
684 if (elem
->parent
[i
].mode
!= elem
->mode
)
688 show_hunks
= make_hunks(sline
, cnt
, num_parent
, dense
);
690 if (show_hunks
|| mode_differs
|| working_tree_file
) {
694 show_log(rev
, rev
->loginfo
, "\n");
695 printf("diff --%s ", dense
? "cc" : "combined");
696 if (quote_c_style(elem
->path
, NULL
, NULL
, 0))
697 quote_c_style(elem
->path
, NULL
, stdout
, 0);
699 printf("%s", elem
->path
);
702 for (i
= 0; i
< num_parent
; i
++) {
703 abb
= find_unique_abbrev(elem
->parent
[i
].sha1
,
705 printf("%s%s", i
? "," : "", abb
);
707 abb
= find_unique_abbrev(elem
->sha1
, abbrev
);
708 printf("..%s\n", abb
);
711 int added
= !!elem
->mode
;
712 for (i
= 0; added
&& i
< num_parent
; i
++)
713 if (elem
->parent
[i
].status
!=
717 printf("new file mode %06o", elem
->mode
);
720 printf("deleted file ");
722 for (i
= 0; i
< num_parent
; i
++) {
723 printf("%s%06o", i
? "," : "",
724 elem
->parent
[i
].mode
);
727 printf("..%06o", elem
->mode
);
731 dump_sline(sline
, cnt
, num_parent
);
735 for (i
= 0; i
< cnt
; i
++) {
736 if (sline
[i
].lost_head
) {
737 struct lline
*ll
= sline
[i
].lost_head
;
739 struct lline
*tmp
= ll
;
745 free(sline
[0].p_lno
);
750 #define COLONS "::::::::::::::::::::::::::::::::"
752 static void show_raw_diff(struct combine_diff_path
*p
, int num_parent
, struct rev_info
*rev
)
754 struct diff_options
*opt
= &rev
->diffopt
;
755 int i
, offset
, mod_type
= 'A';
757 int line_termination
, inter_name_termination
;
759 line_termination
= opt
->line_termination
;
760 inter_name_termination
= '\t';
761 if (!line_termination
)
762 inter_name_termination
= 0;
765 show_log(rev
, rev
->loginfo
, "\n");
767 for (i
= 0; i
< num_parent
; i
++) {
768 if (p
->parent
[i
].mode
)
774 if (opt
->output_format
== DIFF_FORMAT_RAW
) {
775 offset
= strlen(COLONS
) - num_parent
;
778 prefix
= COLONS
+ offset
;
781 for (i
= 0; i
< num_parent
; i
++) {
782 printf("%s%06o", prefix
, p
->parent
[i
].mode
);
785 printf("%s%06o", prefix
, p
->mode
);
788 for (i
= 0; i
< num_parent
; i
++)
789 printf(" %s", diff_unique_abbrev(p
->parent
[i
].sha1
,
791 printf(" %s ", diff_unique_abbrev(p
->sha1
, opt
->abbrev
));
794 if (opt
->output_format
== DIFF_FORMAT_RAW
||
795 opt
->output_format
== DIFF_FORMAT_NAME_STATUS
) {
796 for (i
= 0; i
< num_parent
; i
++)
797 putchar(p
->parent
[i
].status
);
798 putchar(inter_name_termination
);
801 if (line_termination
) {
802 if (quote_c_style(p
->path
, NULL
, NULL
, 0))
803 quote_c_style(p
->path
, NULL
, stdout
, 0);
805 printf("%s", p
->path
);
806 putchar(line_termination
);
809 printf("%s%c", p
->path
, line_termination
);
813 void show_combined_diff(struct combine_diff_path
*p
,
816 struct rev_info
*rev
)
818 struct diff_options
*opt
= &rev
->diffopt
;
821 switch (opt
->output_format
) {
822 case DIFF_FORMAT_RAW
:
823 case DIFF_FORMAT_NAME_STATUS
:
824 case DIFF_FORMAT_NAME
:
825 show_raw_diff(p
, num_parent
, rev
);
829 case DIFF_FORMAT_PATCH
:
830 show_patch_diff(p
, num_parent
, dense
, rev
);
834 void diff_tree_combined_merge(const unsigned char *sha1
,
835 int dense
, struct rev_info
*rev
)
837 struct diff_options
*opt
= &rev
->diffopt
;
838 struct commit
*commit
= lookup_commit(sha1
);
839 struct diff_options diffopts
;
840 struct commit_list
*parents
;
841 struct combine_diff_path
*p
, *paths
= NULL
;
842 int num_parent
, i
, num_paths
;
845 diffopts
.output_format
= DIFF_FORMAT_NO_OUTPUT
;
846 diffopts
.with_raw
= 0;
847 diffopts
.recursive
= 1;
850 for (parents
= commit
->parents
, num_parent
= 0;
852 parents
= parents
->next
, num_parent
++)
855 /* find set of paths that everybody touches */
856 for (parents
= commit
->parents
, i
= 0;
858 parents
= parents
->next
, i
++) {
859 struct commit
*parent
= parents
->item
;
860 diff_tree_sha1(parent
->object
.sha1
, commit
->object
.sha1
, "",
862 diffcore_std(&diffopts
);
863 paths
= intersect_paths(paths
, i
, num_parent
);
864 diff_flush(&diffopts
);
867 /* find out surviving paths */
868 for (num_paths
= 0, p
= paths
; p
; p
= p
->next
) {
874 int saved_format
= opt
->output_format
;
875 opt
->output_format
= DIFF_FORMAT_RAW
;
876 for (p
= paths
; p
; p
= p
->next
) {
877 show_combined_diff(p
, num_parent
, dense
, rev
);
879 opt
->output_format
= saved_format
;
880 putchar(opt
->line_termination
);
882 for (p
= paths
; p
; p
= p
->next
) {
883 show_combined_diff(p
, num_parent
, dense
, rev
);
887 /* Clean things up */
889 struct combine_diff_path
*tmp
= paths
;