2 #include "object-store.h"
8 #include "xdiff-interface.h"
9 #include "xdiff/xmacros.h"
13 #include "oid-array.h"
16 static int compare_paths(const struct combine_diff_path
*one
,
17 const struct diff_filespec
*two
)
19 if (!S_ISDIR(one
->mode
) && !S_ISDIR(two
->mode
))
20 return strcmp(one
->path
, two
->path
);
22 return base_name_compare(one
->path
, strlen(one
->path
), one
->mode
,
23 two
->path
, strlen(two
->path
), two
->mode
);
/*
 * Report whether a per-parent diff status letter is one of the two
 * for which a separate parent-side path is kept: 'R' or 'C'
 * (NOTE(review): presumably rename and copy; confirm against the
 * status definitions).
 *
 * Returns 1 for 'R' or 'C', 0 for every other value.
 */
static int filename_changed(char status)
{
	switch (status) {
	case 'R':
	case 'C':
		return 1;
	default:
		return 0;
	}
}
31 static struct combine_diff_path
*intersect_paths(
32 struct combine_diff_path
*curr
,
35 int combined_all_paths
)
37 struct diff_queue_struct
*q
= &diff_queued_diff
;
38 struct combine_diff_path
*p
, **tail
= &curr
;
42 for (i
= 0; i
< q
->nr
; i
++) {
45 if (diff_unmodified_pair(q
->queue
[i
]))
47 path
= q
->queue
[i
]->two
->path
;
49 p
= xmalloc(combine_diff_path_size(num_parent
, len
));
50 p
->path
= (char *) &(p
->parent
[num_parent
]);
51 memcpy(p
->path
, path
, len
);
55 sizeof(p
->parent
[0]) * num_parent
);
57 oidcpy(&p
->oid
, &q
->queue
[i
]->two
->oid
);
58 p
->mode
= q
->queue
[i
]->two
->mode
;
59 oidcpy(&p
->parent
[n
].oid
, &q
->queue
[i
]->one
->oid
);
60 p
->parent
[n
].mode
= q
->queue
[i
]->one
->mode
;
61 p
->parent
[n
].status
= q
->queue
[i
]->status
;
63 if (combined_all_paths
&&
64 filename_changed(p
->parent
[n
].status
)) {
65 strbuf_init(&p
->parent
[n
].path
, 0);
66 strbuf_addstr(&p
->parent
[n
].path
,
67 q
->queue
[i
]->one
->path
);
76 * paths in curr (linked list) and q->queue[] (array) are
77 * both sorted in the tree order.
80 while ((p
= *tail
) != NULL
) {
82 ? -1 : compare_paths(p
, q
->queue
[i
]->two
));
85 /* p->path not in q->queue[]; drop it */
87 for (j
= 0; j
< num_parent
; j
++)
88 if (combined_all_paths
&&
89 filename_changed(p
->parent
[j
].status
))
90 strbuf_release(&p
->parent
[j
].path
);
96 /* q->queue[i] not in p->path; skip it */
101 oidcpy(&p
->parent
[n
].oid
, &q
->queue
[i
]->one
->oid
);
102 p
->parent
[n
].mode
= q
->queue
[i
]->one
->mode
;
103 p
->parent
[n
].status
= q
->queue
[i
]->status
;
104 if (combined_all_paths
&&
105 filename_changed(p
->parent
[n
].status
))
106 strbuf_addstr(&p
->parent
[n
].path
,
107 q
->queue
[i
]->one
->path
);
115 /* Lines lost from parent */
117 struct lline
*next
, *prev
;
119 unsigned long parent_map
;
120 char line
[FLEX_ARRAY
];
123 /* Lines lost from current parent (before coalescing) */
125 struct lline
*lost_head
, *lost_tail
;
129 /* Lines surviving in the merge result */
131 /* Accumulated and coalesced lost lines */
137 /* bit 0 up to (N-1) are on if the parent has this line (i.e.
138 * we did not change it).
139 * bit N is used for "interesting" lines, including context.
140 * bit (N+1) is used for "do not show deletion before this".
143 unsigned long *p_lno
;
146 static int match_string_spaces(const char *line1
, int len1
,
147 const char *line2
, int len2
,
150 if (flags
& XDF_WHITESPACE_FLAGS
) {
151 for (; len1
> 0 && XDL_ISSPACE(line1
[len1
- 1]); len1
--);
152 for (; len2
> 0 && XDL_ISSPACE(line2
[len2
- 1]); len2
--);
155 if (!(flags
& (XDF_IGNORE_WHITESPACE
| XDF_IGNORE_WHITESPACE_CHANGE
)))
156 return (len1
== len2
&& !memcmp(line1
, line2
, len1
));
158 while (len1
> 0 && len2
> 0) {
161 if (XDL_ISSPACE(line1
[len1
]) || XDL_ISSPACE(line2
[len2
])) {
162 if ((flags
& XDF_IGNORE_WHITESPACE_CHANGE
) &&
163 (!XDL_ISSPACE(line1
[len1
]) || !XDL_ISSPACE(line2
[len2
])))
166 for (; len1
> 0 && XDL_ISSPACE(line1
[len1
]); len1
--);
167 for (; len2
> 0 && XDL_ISSPACE(line2
[len2
]); len2
--);
169 if (line1
[len1
] != line2
[len2
])
173 if (flags
& XDF_IGNORE_WHITESPACE
) {
174 /* Consume remaining spaces */
175 for (; len1
> 0 && XDL_ISSPACE(line1
[len1
- 1]); len1
--);
176 for (; len2
> 0 && XDL_ISSPACE(line2
[len2
- 1]); len2
--);
179 /* We matched full line1 and line2 */
/*
 * Step recorded in each cell of the table that coalesce_lines() fills
 * in and later reads back in reverse.
 */
enum coalesce_direction {
	MATCH,	/* base and new line match: consume both */
	BASE,	/* consume a line from the base list only */
	NEW	/* take a line from the new list */
};
188 /* Coalesce new lines into base by finding LCS */
189 static struct lline
*coalesce_lines(struct lline
*base
, int *lenbase
,
190 struct lline
*newline
, int lennew
,
191 unsigned long parent
, long flags
)
194 enum coalesce_direction
**directions
;
195 struct lline
*baseend
, *newend
= NULL
;
196 int i
, j
, origbaselen
= *lenbase
;
207 * Coalesce new lines into base by finding the LCS
208 * - Create the table to run dynamic programming
210 * - Then reverse read the direction structure:
211 * - If we have MATCH, assign parent to base flag, and consume
212 * both baseend and newend
213 * - Else if we have BASE, consume baseend
214 * - Else if we have NEW, insert newend lline into base and
217 CALLOC_ARRAY(lcs
, st_add(origbaselen
, 1));
218 CALLOC_ARRAY(directions
, st_add(origbaselen
, 1));
219 for (i
= 0; i
< origbaselen
+ 1; i
++) {
220 CALLOC_ARRAY(lcs
[i
], st_add(lennew
, 1));
221 CALLOC_ARRAY(directions
[i
], st_add(lennew
, 1));
222 directions
[i
][0] = BASE
;
224 for (j
= 1; j
< lennew
+ 1; j
++)
225 directions
[0][j
] = NEW
;
227 for (i
= 1, baseend
= base
; i
< origbaselen
+ 1; i
++) {
228 for (j
= 1, newend
= newline
; j
< lennew
+ 1; j
++) {
229 if (match_string_spaces(baseend
->line
, baseend
->len
,
230 newend
->line
, newend
->len
, flags
)) {
231 lcs
[i
][j
] = lcs
[i
- 1][j
- 1] + 1;
232 directions
[i
][j
] = MATCH
;
233 } else if (lcs
[i
][j
- 1] >= lcs
[i
- 1][j
]) {
234 lcs
[i
][j
] = lcs
[i
][j
- 1];
235 directions
[i
][j
] = NEW
;
237 lcs
[i
][j
] = lcs
[i
- 1][j
];
238 directions
[i
][j
] = BASE
;
241 newend
= newend
->next
;
244 baseend
= baseend
->next
;
247 for (i
= 0; i
< origbaselen
+ 1; i
++)
251 /* At this point, baseend and newend point to the end of each lists */
254 while (i
!= 0 || j
!= 0) {
255 if (directions
[i
][j
] == MATCH
) {
256 baseend
->parent_map
|= 1<<parent
;
257 baseend
= baseend
->prev
;
258 newend
= newend
->prev
;
261 } else if (directions
[i
][j
] == NEW
) {
265 /* Remove lline from new list and update newend */
267 lline
->prev
->next
= lline
->next
;
269 newline
= lline
->next
;
271 lline
->next
->prev
= lline
->prev
;
273 newend
= lline
->prev
;
276 /* Add lline to base list */
278 lline
->next
= baseend
->next
;
279 lline
->prev
= baseend
;
281 lline
->prev
->next
= lline
;
290 lline
->next
->prev
= lline
;
293 baseend
= baseend
->prev
;
300 struct lline
*lline
= newend
;
301 newend
= newend
->next
;
305 for (i
= 0; i
< origbaselen
+ 1; i
++)
312 static char *grab_blob(struct repository
*r
,
313 const struct object_id
*oid
, unsigned int mode
,
314 unsigned long *size
, struct userdiff_driver
*textconv
,
318 enum object_type type
;
320 if (S_ISGITLINK(mode
)) {
321 struct strbuf buf
= STRBUF_INIT
;
322 strbuf_addf(&buf
, "Subproject commit %s\n", oid_to_hex(oid
));
324 blob
= strbuf_detach(&buf
, NULL
);
325 } else if (is_null_oid(oid
)) {
328 return xcalloc(1, 1);
329 } else if (textconv
) {
330 struct diff_filespec
*df
= alloc_filespec(path
);
331 fill_filespec(df
, oid
, 1, mode
);
332 *size
= fill_textconv(r
, textconv
, df
, &blob
);
335 blob
= read_object_file(oid
, &type
, size
);
336 if (type
!= OBJ_BLOB
)
337 die("object '%s' is not a blob!", oid_to_hex(oid
));
342 static void append_lost(struct sline
*sline
, int n
, const char *line
, int len
)
345 unsigned long this_mask
= (1UL<<n
);
346 if (line
[len
-1] == '\n')
349 FLEX_ALLOC_MEM(lline
, line
, line
, len
);
352 lline
->prev
= sline
->plost
.lost_tail
;
354 lline
->prev
->next
= lline
;
356 sline
->plost
.lost_head
= lline
;
357 sline
->plost
.lost_tail
= lline
;
359 lline
->parent_map
= this_mask
;
362 struct combine_diff_state
{
369 struct sline
*lost_bucket
;
372 static void consume_hunk(void *state_
,
375 const char *funcline
, long funclen
)
377 struct combine_diff_state
*state
= state_
;
383 state
->lno
= state
->nb
;
384 if (state
->nn
== 0) {
385 /* @@ -X,Y +N,0 @@ removed Y lines
386 * that would have come *after* line N
387 * in the result. Our lost buckets hang
388 * to the line after the removed lines,
390 * Note that this is correct even when N == 0,
391 * in which case the hunk removes the first
394 state
->lost_bucket
= &state
->sline
[state
->nb
];
398 state
->lost_bucket
= &state
->sline
[state
->nb
-1];
400 if (!state
->sline
[state
->nb
-1].p_lno
)
401 CALLOC_ARRAY(state
->sline
[state
->nb
- 1].p_lno
,
403 state
->sline
[state
->nb
-1].p_lno
[state
->n
] = state
->ob
;
406 static int consume_line(void *state_
, char *line
, unsigned long len
)
408 struct combine_diff_state
*state
= state_
;
409 if (!state
->lost_bucket
)
410 return 0; /* not in any hunk yet */
413 append_lost(state
->lost_bucket
, state
->n
, line
+1, len
-1);
416 state
->sline
[state
->lno
-1].flag
|= state
->nmask
;
423 static void combine_diff(struct repository
*r
,
424 const struct object_id
*parent
, unsigned int mode
,
425 mmfile_t
*result_file
,
426 struct sline
*sline
, unsigned int cnt
, int n
,
427 int num_parent
, int result_deleted
,
428 struct userdiff_driver
*textconv
,
429 const char *path
, long flags
)
431 unsigned int p_lno
, lno
;
432 unsigned long nmask
= (1UL << n
);
435 mmfile_t parent_file
;
436 struct combine_diff_state state
;
440 return; /* result deleted */
442 parent_file
.ptr
= grab_blob(r
, parent
, mode
, &sz
, textconv
, path
);
443 parent_file
.size
= sz
;
444 memset(&xpp
, 0, sizeof(xpp
));
446 memset(&xecfg
, 0, sizeof(xecfg
));
447 memset(&state
, 0, sizeof(state
));
451 state
.num_parent
= num_parent
;
454 if (xdi_diff_outf(&parent_file
, result_file
, consume_hunk
,
455 consume_line
, &state
, &xpp
, &xecfg
))
456 die("unable to generate combined diff for %s",
458 free(parent_file
.ptr
);
460 /* Assign line numbers for this parent.
462 * sline[lno].p_lno[n] records the first line number
463 * (counting from 1) for parent N if the final hunk display
464 * started by showing sline[lno] (possibly showing the lost
465 * lines attached to it first).
467 for (lno
= 0, p_lno
= 1; lno
<= cnt
; lno
++) {
469 sline
[lno
].p_lno
[n
] = p_lno
;
471 /* Coalesce new lines */
472 if (sline
[lno
].plost
.lost_head
) {
473 struct sline
*sl
= &sline
[lno
];
474 sl
->lost
= coalesce_lines(sl
->lost
, &sl
->lenlost
,
476 sl
->plost
.len
, n
, flags
);
477 sl
->plost
.lost_head
= sl
->plost
.lost_tail
= NULL
;
481 /* How many lines would this sline advance the p_lno? */
482 ll
= sline
[lno
].lost
;
484 if (ll
->parent_map
& nmask
)
485 p_lno
++; /* '-' means parent had it */
488 if (lno
< cnt
&& !(sline
[lno
].flag
& nmask
))
489 p_lno
++; /* no '+' means parent had it */
491 sline
[lno
].p_lno
[n
] = p_lno
; /* trailer */
494 static unsigned long context
= 3;
495 static char combine_marker
= '@';
497 static int interesting(struct sline
*sline
, unsigned long all_mask
)
499 /* If some parents lost lines here, or if we have added to
500 * some parent, it is interesting.
502 return ((sline
->flag
& all_mask
) || sline
->lost
);
505 static unsigned long adjust_hunk_tail(struct sline
*sline
,
506 unsigned long all_mask
,
507 unsigned long hunk_begin
,
510 /* i points at the first uninteresting line. If the last line
511 * of the hunk was interesting only because it has some
512 * deletion, then it is not all that interesting for the
513 * purpose of giving trailing context lines. This is because
514 * we output '-' line and then unmodified sline[i-1] itself in
515 * that case which gives us one extra context line.
517 if ((hunk_begin
+ 1 <= i
) && !(sline
[i
-1].flag
& all_mask
))
522 static unsigned long find_next(struct sline
*sline
,
526 int look_for_uninteresting
)
528 /* We have examined up to i-1 and are about to look at i.
529 * Find next interesting or uninteresting line. Here,
530 * "interesting" does not mean interesting(), but marked by
531 * the give_context() function below (i.e. it includes context
532 * lines that are not interesting to interesting() function
533 * that are surrounded by interesting() ones).
536 if (look_for_uninteresting
537 ? !(sline
[i
].flag
& mark
)
538 : (sline
[i
].flag
& mark
))
545 static int give_context(struct sline
*sline
, unsigned long cnt
, int num_parent
)
547 unsigned long all_mask
= (1UL<<num_parent
) - 1;
548 unsigned long mark
= (1UL<<num_parent
);
549 unsigned long no_pre_delete
= (2UL<<num_parent
);
552 /* Two groups of interesting lines may have a short gap of
553 * uninteresting lines. Connect such groups to give them a
556 * We first start from what the interesting() function says,
557 * and mark them with "mark", and paint context lines with the
558 * mark. So interesting() would still say false for such context
559 * lines but they are treated as "interesting" in the end.
561 i
= find_next(sline
, mark
, 0, cnt
, 0);
566 unsigned long j
= (context
< i
) ? (i
- context
) : 0;
569 /* Paint a few lines before the first interesting line. */
571 if (!(sline
[j
].flag
& mark
))
572 sline
[j
].flag
|= no_pre_delete
;
573 sline
[j
++].flag
|= mark
;
577 /* we know up to i is to be included. where does the
578 * next uninteresting one start?
580 j
= find_next(sline
, mark
, i
, cnt
, 1);
582 break; /* the rest are all interesting */
584 /* lookahead context lines */
585 k
= find_next(sline
, mark
, j
, cnt
, 0);
586 j
= adjust_hunk_tail(sline
, all_mask
, i
, j
);
588 if (k
< j
+ context
) {
589 /* k is interesting and [j,k) are not, but
590 * paint them interesting because the gap is small.
593 sline
[j
++].flag
|= mark
;
598 /* j is the first uninteresting line and there is
599 * no overlap beyond it within context lines. Paint
600 * the trailing edge a bit.
603 k
= (j
+ context
< cnt
+1) ? j
+ context
: cnt
+1;
605 sline
[j
++].flag
|= mark
;
610 static int make_hunks(struct sline
*sline
, unsigned long cnt
,
611 int num_parent
, int dense
)
613 unsigned long all_mask
= (1UL<<num_parent
) - 1;
614 unsigned long mark
= (1UL<<num_parent
);
616 int has_interesting
= 0;
618 for (i
= 0; i
<= cnt
; i
++) {
619 if (interesting(&sline
[i
], all_mask
))
620 sline
[i
].flag
|= mark
;
622 sline
[i
].flag
&= ~mark
;
625 return give_context(sline
, cnt
, num_parent
);
627 /* Look at each hunk, and if we have changes from only one
628 * parent, or the changes are the same from all but one
629 * parent, mark that uninteresting.
633 unsigned long j
, hunk_begin
, hunk_end
;
634 unsigned long same_diff
;
635 while (i
<= cnt
&& !(sline
[i
].flag
& mark
))
638 break; /* No more interesting hunks */
640 for (j
= i
+ 1; j
<= cnt
; j
++) {
641 if (!(sline
[j
].flag
& mark
)) {
642 /* Look beyond the end to see if there
643 * is an interesting line after this
644 * hunk within context span.
646 unsigned long la
; /* lookahead */
648 la
= adjust_hunk_tail(sline
, all_mask
,
650 la
= (la
+ context
< cnt
+ 1) ?
651 (la
+ context
) : cnt
+ 1;
652 while (la
&& j
<= --la
) {
653 if (sline
[la
].flag
& mark
) {
665 /* [i..hunk_end) are interesting. Now is it really
666 * interesting? We check if there are only two versions
667 * and the result matches one of them. That is, we look
669 * (+) line, which records lines added to which parents;
670 * this line appears in the result.
671 * (-) line, which records from what parents the line
672 * was removed; this line does not appear in the result.
673 * then check the set of parents the result has difference
674 * from, from all lines. If there are lines that have a
675 * different set of parents that the result has differences
676 * from, that means we have more than two versions.
678 * Even when we have only two versions, if the result does
679 * not match any of the parents, then it should be considered
680 * interesting. In such a case, we would have all '+' line.
681 * After passing the above "two versions" test, that would
682 * appear as "the same set of parents" to be "all parents".
686 for (j
= i
; j
< hunk_end
&& !has_interesting
; j
++) {
687 unsigned long this_diff
= sline
[j
].flag
& all_mask
;
688 struct lline
*ll
= sline
[j
].lost
;
690 /* This has some changes. Is it the
694 same_diff
= this_diff
;
695 else if (same_diff
!= this_diff
) {
700 while (ll
&& !has_interesting
) {
701 /* Lost this line from these parents;
702 * who are they? Are they the same?
704 this_diff
= ll
->parent_map
;
706 same_diff
= this_diff
;
707 else if (same_diff
!= this_diff
) {
714 if (!has_interesting
&& same_diff
!= all_mask
) {
715 /* This hunk is not that interesting after all */
716 for (j
= hunk_begin
; j
< hunk_end
; j
++)
717 sline
[j
].flag
&= ~mark
;
722 has_interesting
= give_context(sline
, cnt
, num_parent
);
723 return has_interesting
;
726 static void show_parent_lno(struct sline
*sline
, unsigned long l0
, unsigned long l1
, int n
, unsigned long null_context
)
728 l0
= sline
[l0
].p_lno
[n
];
729 l1
= sline
[l1
].p_lno
[n
];
730 printf(" -%lu,%lu", l0
, l1
-l0
-null_context
);
733 static int hunk_comment_line(const char *bol
)
740 return (isalpha(ch
) || ch
== '_' || ch
== '$');
743 static void show_line_to_eol(const char *line
, int len
, const char *reset
)
745 int saw_cr_at_eol
= 0;
748 saw_cr_at_eol
= (len
&& line
[len
-1] == '\r');
750 printf("%.*s%s%s\n", len
- saw_cr_at_eol
, line
,
752 saw_cr_at_eol
? "\r" : "");
755 static void dump_sline(struct sline
*sline
, const char *line_prefix
,
756 unsigned long cnt
, int num_parent
,
757 int use_color
, int result_deleted
)
759 unsigned long mark
= (1UL<<num_parent
);
760 unsigned long no_pre_delete
= (2UL<<num_parent
);
762 unsigned long lno
= 0;
763 const char *c_frag
= diff_get_color(use_color
, DIFF_FRAGINFO
);
764 const char *c_func
= diff_get_color(use_color
, DIFF_FUNCINFO
);
765 const char *c_new
= diff_get_color(use_color
, DIFF_FILE_NEW
);
766 const char *c_old
= diff_get_color(use_color
, DIFF_FILE_OLD
);
767 const char *c_context
= diff_get_color(use_color
, DIFF_CONTEXT
);
768 const char *c_reset
= diff_get_color(use_color
, DIFF_RESET
);
771 return; /* result deleted */
774 unsigned long hunk_end
;
775 unsigned long rlines
;
776 const char *hunk_comment
= NULL
;
777 unsigned long null_context
= 0;
779 while (lno
<= cnt
&& !(sline
[lno
].flag
& mark
)) {
780 if (hunk_comment_line(sline
[lno
].bol
))
781 hunk_comment
= sline
[lno
].bol
;
787 for (hunk_end
= lno
+ 1; hunk_end
<= cnt
; hunk_end
++)
788 if (!(sline
[hunk_end
].flag
& mark
))
791 rlines
= hunk_end
- lno
;
793 rlines
--; /* pointing at the last delete hunk */
797 * Even when running with --unified=0, all
798 * lines in the hunk needs to be processed in
799 * the loop below in order to show the
800 * deletion recorded in lost_head. However,
801 * we do not want to show the resulting line
802 * with all blank context markers in such a
806 for (j
= lno
; j
< hunk_end
; j
++)
807 if (!(sline
[j
].flag
& (mark
-1)))
809 rlines
-= null_context
;
812 printf("%s%s", line_prefix
, c_frag
);
813 for (i
= 0; i
<= num_parent
; i
++) putchar(combine_marker
);
814 for (i
= 0; i
< num_parent
; i
++)
815 show_parent_lno(sline
, lno
, hunk_end
, i
, null_context
);
816 printf(" +%lu,%lu ", lno
+1, rlines
);
817 for (i
= 0; i
<= num_parent
; i
++) putchar(combine_marker
);
821 for (i
= 0; i
< 40; i
++) {
822 int ch
= hunk_comment
[i
] & 0xff;
823 if (!ch
|| ch
== '\n')
829 printf("%s%s %s%s", c_reset
,
832 for (i
= 0; i
< comment_end
; i
++)
833 putchar(hunk_comment
[i
]);
836 printf("%s\n", c_reset
);
837 while (lno
< hunk_end
) {
840 unsigned long p_mask
;
841 struct sline
*sl
= &sline
[lno
++];
842 ll
= (sl
->flag
& no_pre_delete
) ? NULL
: sl
->lost
;
844 printf("%s%s", line_prefix
, c_old
);
845 for (j
= 0; j
< num_parent
; j
++) {
846 if (ll
->parent_map
& (1UL<<j
))
851 show_line_to_eol(ll
->line
, -1, c_reset
);
857 fputs(line_prefix
, stdout
);
858 if (!(sl
->flag
& (mark
-1))) {
860 * This sline was here to hang the
861 * lost lines in front of it.
865 fputs(c_context
, stdout
);
868 fputs(c_new
, stdout
);
869 for (j
= 0; j
< num_parent
; j
++) {
870 if (p_mask
& sl
->flag
)
876 show_line_to_eol(sl
->bol
, sl
->len
, c_reset
);
881 static void reuse_combine_diff(struct sline
*sline
, unsigned long cnt
,
884 /* We have already examined parent j and we know parent i
885 * and parent j are the same, so reuse the combined result
886 * of parent j for parent i.
888 unsigned long lno
, imask
, jmask
;
892 for (lno
= 0; lno
<= cnt
; lno
++) {
893 struct lline
*ll
= sline
->lost
;
894 sline
->p_lno
[i
] = sline
->p_lno
[j
];
896 if (ll
->parent_map
& jmask
)
897 ll
->parent_map
|= imask
;
900 if (sline
->flag
& jmask
)
901 sline
->flag
|= imask
;
904 /* the overall size of the file (sline[cnt]) */
905 sline
->p_lno
[i
] = sline
->p_lno
[j
];
908 static void dump_quoted_path(const char *head
,
911 const char *line_prefix
,
912 const char *c_meta
, const char *c_reset
)
914 static struct strbuf buf
= STRBUF_INIT
;
917 strbuf_addstr(&buf
, line_prefix
);
918 strbuf_addstr(&buf
, c_meta
);
919 strbuf_addstr(&buf
, head
);
920 quote_two_c_style(&buf
, prefix
, path
, 0);
921 strbuf_addstr(&buf
, c_reset
);
925 static void show_combined_header(struct combine_diff_path
*elem
,
927 struct rev_info
*rev
,
928 const char *line_prefix
,
930 int show_file_header
)
932 struct diff_options
*opt
= &rev
->diffopt
;
933 int abbrev
= opt
->flags
.full_index
? the_hash_algo
->hexsz
: DEFAULT_ABBREV
;
934 const char *a_prefix
= opt
->a_prefix
? opt
->a_prefix
: "a/";
935 const char *b_prefix
= opt
->b_prefix
? opt
->b_prefix
: "b/";
936 const char *c_meta
= diff_get_color_opt(opt
, DIFF_METAINFO
);
937 const char *c_reset
= diff_get_color_opt(opt
, DIFF_RESET
);
942 int dense
= rev
->dense_combined_merges
;
944 if (rev
->loginfo
&& !rev
->no_commit_id
)
947 dump_quoted_path(dense
? "diff --cc " : "diff --combined ",
948 "", elem
->path
, line_prefix
, c_meta
, c_reset
);
949 printf("%s%sindex ", line_prefix
, c_meta
);
950 for (i
= 0; i
< num_parent
; i
++) {
951 abb
= find_unique_abbrev(&elem
->parent
[i
].oid
,
953 printf("%s%s", i
? "," : "", abb
);
955 abb
= find_unique_abbrev(&elem
->oid
, abbrev
);
956 printf("..%s%s\n", abb
, c_reset
);
959 deleted
= !elem
->mode
;
961 /* We say it was added if nobody had it */
963 for (i
= 0; added
&& i
< num_parent
; i
++)
964 if (elem
->parent
[i
].status
!=
968 printf("%s%snew file mode %06o",
969 line_prefix
, c_meta
, elem
->mode
);
972 printf("%s%sdeleted file ",
973 line_prefix
, c_meta
);
975 for (i
= 0; i
< num_parent
; i
++) {
976 printf("%s%06o", i
? "," : "",
977 elem
->parent
[i
].mode
);
980 printf("..%06o", elem
->mode
);
982 printf("%s\n", c_reset
);
985 if (!show_file_header
)
988 if (rev
->combined_all_paths
) {
989 for (i
= 0; i
< num_parent
; i
++) {
990 char *path
= filename_changed(elem
->parent
[i
].status
)
991 ? elem
->parent
[i
].path
.buf
: elem
->path
;
992 if (elem
->parent
[i
].status
== DIFF_STATUS_ADDED
)
993 dump_quoted_path("--- ", "", "/dev/null",
994 line_prefix
, c_meta
, c_reset
);
996 dump_quoted_path("--- ", a_prefix
, path
,
997 line_prefix
, c_meta
, c_reset
);
1001 dump_quoted_path("--- ", "", "/dev/null",
1002 line_prefix
, c_meta
, c_reset
);
1004 dump_quoted_path("--- ", a_prefix
, elem
->path
,
1005 line_prefix
, c_meta
, c_reset
);
1008 dump_quoted_path("+++ ", "", "/dev/null",
1009 line_prefix
, c_meta
, c_reset
);
1011 dump_quoted_path("+++ ", b_prefix
, elem
->path
,
1012 line_prefix
, c_meta
, c_reset
);
1015 static void show_patch_diff(struct combine_diff_path
*elem
, int num_parent
,
1016 int working_tree_file
,
1017 struct rev_info
*rev
)
1019 struct diff_options
*opt
= &rev
->diffopt
;
1020 unsigned long result_size
, cnt
, lno
;
1021 int result_deleted
= 0;
1023 struct sline
*sline
; /* survived lines */
1024 int mode_differs
= 0;
1026 mmfile_t result_file
;
1027 struct userdiff_driver
*userdiff
;
1028 struct userdiff_driver
*textconv
= NULL
;
1030 const char *line_prefix
= diff_line_prefix(opt
);
1032 context
= opt
->context
;
1033 userdiff
= userdiff_find_by_path(opt
->repo
->index
, elem
->path
);
1035 userdiff
= userdiff_find_by_name("default");
1036 if (opt
->flags
.allow_textconv
)
1037 textconv
= userdiff_get_textconv(opt
->repo
, userdiff
);
1039 /* Read the result of merge first */
1040 if (!working_tree_file
)
1041 result
= grab_blob(opt
->repo
, &elem
->oid
, elem
->mode
, &result_size
,
1042 textconv
, elem
->path
);
1044 /* Used by diff-tree to read from the working tree */
1048 if (lstat(elem
->path
, &st
) < 0)
1051 if (S_ISLNK(st
.st_mode
)) {
1052 struct strbuf buf
= STRBUF_INIT
;
1054 if (strbuf_readlink(&buf
, elem
->path
, st
.st_size
) < 0) {
1055 error_errno("readlink(%s)", elem
->path
);
1058 result_size
= buf
.len
;
1059 result
= strbuf_detach(&buf
, NULL
);
1060 elem
->mode
= canon_mode(st
.st_mode
);
1061 } else if (S_ISDIR(st
.st_mode
)) {
1062 struct object_id oid
;
1063 if (resolve_gitlink_ref(elem
->path
, "HEAD", &oid
) < 0)
1064 result
= grab_blob(opt
->repo
, &elem
->oid
,
1065 elem
->mode
, &result_size
,
1068 result
= grab_blob(opt
->repo
, &oid
, elem
->mode
,
1069 &result_size
, NULL
, NULL
);
1070 } else if (textconv
) {
1071 struct diff_filespec
*df
= alloc_filespec(elem
->path
);
1072 fill_filespec(df
, null_oid(), 0, st
.st_mode
);
1073 result_size
= fill_textconv(opt
->repo
, textconv
, df
, &result
);
1075 } else if (0 <= (fd
= open(elem
->path
, O_RDONLY
))) {
1076 size_t len
= xsize_t(st
.st_size
);
1080 elem
->mode
= canon_mode(st
.st_mode
);
1081 /* if symlinks don't work, assume symlink if all parents
1084 is_file
= has_symlinks
;
1085 for (i
= 0; !is_file
&& i
< num_parent
; i
++)
1086 is_file
= !S_ISLNK(elem
->parent
[i
].mode
);
1088 elem
->mode
= canon_mode(S_IFLNK
);
1091 result
= xmallocz(len
);
1093 done
= read_in_full(fd
, result
, len
);
1095 die_errno("read error '%s'", elem
->path
);
1096 else if (done
< len
)
1097 die("early EOF '%s'", elem
->path
);
1099 /* If not a fake symlink, apply filters, e.g. autocrlf */
1101 struct strbuf buf
= STRBUF_INIT
;
1103 if (convert_to_git(rev
->diffopt
.repo
->index
,
1104 elem
->path
, result
, len
, &buf
, global_conv_flags_eol
)) {
1106 result
= strbuf_detach(&buf
, &len
);
1116 result
= xcalloc(1, 1);
1123 for (i
= 0; i
< num_parent
; i
++) {
1124 if (elem
->parent
[i
].mode
!= elem
->mode
) {
1132 else if (userdiff
->binary
!= -1)
1133 is_binary
= userdiff
->binary
;
1135 is_binary
= buffer_is_binary(result
, result_size
);
1136 for (i
= 0; !is_binary
&& i
< num_parent
; i
++) {
1139 buf
= grab_blob(opt
->repo
,
1140 &elem
->parent
[i
].oid
,
1141 elem
->parent
[i
].mode
,
1143 if (buffer_is_binary(buf
, size
))
1149 show_combined_header(elem
, num_parent
, rev
,
1150 line_prefix
, mode_differs
, 0);
1151 printf("Binary files differ\n");
1156 for (cnt
= 0, cp
= result
; cp
< result
+ result_size
; cp
++) {
1160 if (result_size
&& result
[result_size
-1] != '\n')
1161 cnt
++; /* incomplete line */
1163 CALLOC_ARRAY(sline
, st_add(cnt
, 2));
1164 sline
[0].bol
= result
;
1165 for (lno
= 0, cp
= result
; cp
< result
+ result_size
; cp
++) {
1167 sline
[lno
].len
= cp
- sline
[lno
].bol
;
1170 sline
[lno
].bol
= cp
+ 1;
1173 if (result_size
&& result
[result_size
-1] != '\n')
1174 sline
[cnt
-1].len
= result_size
- (sline
[cnt
-1].bol
- result
);
1176 result_file
.ptr
= result
;
1177 result_file
.size
= result_size
;
1179 /* Even p_lno[cnt+1] is valid -- that is for the end line number
1180 * for deletion hunk at the end.
1182 CALLOC_ARRAY(sline
[0].p_lno
, st_mult(st_add(cnt
, 2), num_parent
));
1183 for (lno
= 0; lno
<= cnt
; lno
++)
1184 sline
[lno
+1].p_lno
= sline
[lno
].p_lno
+ num_parent
;
1186 for (i
= 0; i
< num_parent
; i
++) {
1188 for (j
= 0; j
< i
; j
++) {
1189 if (oideq(&elem
->parent
[i
].oid
,
1190 &elem
->parent
[j
].oid
)) {
1191 reuse_combine_diff(sline
, cnt
, i
, j
);
1196 combine_diff(opt
->repo
,
1197 &elem
->parent
[i
].oid
,
1198 elem
->parent
[i
].mode
,
1199 &result_file
, sline
,
1200 cnt
, i
, num_parent
, result_deleted
,
1201 textconv
, elem
->path
, opt
->xdl_opts
);
1204 show_hunks
= make_hunks(sline
, cnt
, num_parent
, rev
->dense_combined_merges
);
1206 if (show_hunks
|| mode_differs
|| working_tree_file
) {
1207 show_combined_header(elem
, num_parent
, rev
,
1208 line_prefix
, mode_differs
, 1);
1209 dump_sline(sline
, line_prefix
, cnt
, num_parent
,
1210 opt
->use_color
, result_deleted
);
1214 for (lno
= 0; lno
< cnt
; lno
++) {
1215 if (sline
[lno
].lost
) {
1216 struct lline
*ll
= sline
[lno
].lost
;
1218 struct lline
*tmp
= ll
;
1224 free(sline
[0].p_lno
);
1228 static void show_raw_diff(struct combine_diff_path
*p
, int num_parent
, struct rev_info
*rev
)
1230 struct diff_options
*opt
= &rev
->diffopt
;
1231 int line_termination
, inter_name_termination
, i
;
1232 const char *line_prefix
= diff_line_prefix(opt
);
1234 line_termination
= opt
->line_termination
;
1235 inter_name_termination
= '\t';
1236 if (!line_termination
)
1237 inter_name_termination
= 0;
1239 if (rev
->loginfo
&& !rev
->no_commit_id
)
1243 if (opt
->output_format
& DIFF_FORMAT_RAW
) {
1244 printf("%s", line_prefix
);
1246 /* As many colons as there are parents */
1247 for (i
= 0; i
< num_parent
; i
++)
1250 /* Show the modes */
1251 for (i
= 0; i
< num_parent
; i
++)
1252 printf("%06o ", p
->parent
[i
].mode
);
1253 printf("%06o", p
->mode
);
1256 for (i
= 0; i
< num_parent
; i
++)
1257 printf(" %s", diff_aligned_abbrev(&p
->parent
[i
].oid
,
1259 printf(" %s ", diff_aligned_abbrev(&p
->oid
, opt
->abbrev
));
1262 if (opt
->output_format
& (DIFF_FORMAT_RAW
| DIFF_FORMAT_NAME_STATUS
)) {
1263 for (i
= 0; i
< num_parent
; i
++)
1264 putchar(p
->parent
[i
].status
);
1265 putchar(inter_name_termination
);
1268 for (i
= 0; i
< num_parent
; i
++)
1269 if (rev
->combined_all_paths
) {
1270 if (filename_changed(p
->parent
[i
].status
))
1271 write_name_quoted(p
->parent
[i
].path
.buf
, stdout
,
1272 inter_name_termination
);
1274 write_name_quoted(p
->path
, stdout
,
1275 inter_name_termination
);
1277 write_name_quoted(p
->path
, stdout
, line_termination
);
1281 * The result (p->elem) is from the working tree and their
1282 * parents are typically from multiple stages during a merge
1283 * (i.e. diff-files) or the state in HEAD and in the index
1284 * (i.e. diff-index).
1286 void show_combined_diff(struct combine_diff_path
*p
,
1288 struct rev_info
*rev
)
1290 struct diff_options
*opt
= &rev
->diffopt
;
1292 if (opt
->output_format
& (DIFF_FORMAT_RAW
|
1294 DIFF_FORMAT_NAME_STATUS
))
1295 show_raw_diff(p
, num_parent
, rev
);
1296 else if (opt
->output_format
& DIFF_FORMAT_PATCH
)
1297 show_patch_diff(p
, num_parent
, 1, rev
);
1300 static void free_combined_pair(struct diff_filepair
*pair
)
1307 * A combine_diff_path expresses N parents on the LHS against 1 merge
1308 * result. Synthesize a diff_filepair that has N entries on the "one"
1309 * side and 1 entry on the "two" side.
1311 * In the future, we might want to add more data to combine_diff_path
1312 * so that we can fill fields we are ignoring (most notably, size) here,
1313 * but currently nobody uses it, so this should suffice for now.
1315 static struct diff_filepair
*combined_pair(struct combine_diff_path
*p
,
1319 struct diff_filepair
*pair
;
1320 struct diff_filespec
*pool
;
1322 pair
= xmalloc(sizeof(*pair
));
1323 CALLOC_ARRAY(pool
, st_add(num_parent
, 1));
1324 pair
->one
= pool
+ 1;
1327 for (i
= 0; i
< num_parent
; i
++) {
1328 pair
->one
[i
].path
= p
->path
;
1329 pair
->one
[i
].mode
= p
->parent
[i
].mode
;
1330 oidcpy(&pair
->one
[i
].oid
, &p
->parent
[i
].oid
);
1331 pair
->one
[i
].oid_valid
= !is_null_oid(&p
->parent
[i
].oid
);
1332 pair
->one
[i
].has_more_entries
= 1;
1334 pair
->one
[num_parent
- 1].has_more_entries
= 0;
1336 pair
->two
->path
= p
->path
;
1337 pair
->two
->mode
= p
->mode
;
1338 oidcpy(&pair
->two
->oid
, &p
->oid
);
1339 pair
->two
->oid_valid
= !is_null_oid(&p
->oid
);
/*
 * Feed the combined-diff result to opt->format_callback.
 *
 * A temporary diff_queue_struct is filled with one pair per entry of the
 * `paths` list (built by combined_pair()), passed to the callback along
 * with opt->format_callback_data, and each pair is released afterwards
 * with free_combined_pair().
 *
 * NOTE(review): some lines of this function are missing from this
 * extract (e.g. any assignment of q.nr and the release of q.queue are
 * not visible) - confirm against the full source.
 */
1343 static void handle_combined_callback(struct diff_options
*opt
,
1344 struct combine_diff_path
*paths
,
1348 struct combine_diff_path
*p
;
1349 struct diff_queue_struct q
;
1352 CALLOC_ARRAY(q
.queue
, num_paths
);
1353 q
.alloc
= num_paths
;
/*
 * The fill loop stops at the end of the list, not at num_paths, so the
 * caller must pass a num_paths that matches the list length.
 */
1355 for (i
= 0, p
= paths
; p
; p
= p
->next
)
1356 q
.queue
[i
++] = combined_pair(p
, num_parent
);
1357 opt
->format_callback(&q
, opt
, opt
->format_callback_data
);
1358 for (i
= 0; i
< num_paths
; i
++)
1359 free_combined_pair(q
.queue
[i
]);
/*
 * Callback handed to order_objects() by diff_tree_combined(); `obj` is
 * treated as a struct combine_diff_path.
 *
 * NOTE(review): the return statement is not visible in this extract;
 * presumably it yields the entry's path string - confirm.
 */
1363 static const char *path_path(void *obj
)
1365 struct combine_diff_path
*path
= (struct combine_diff_path
*)obj
;
1371 * Diff stat formats which we always compute solely against the first parent.
/*
 * Union of the NUMSTAT, SHORTSTAT, SUMMARY, DIRSTAT and DIFFSTAT
 * output-format bits.  find_paths_generic() and diff_tree_combined()
 * AND it with output_format to pick out the requested stat formats.
 */
1373 #define STAT_FORMAT_MASK (DIFF_FORMAT_NUMSTAT \
1374 | DIFF_FORMAT_SHORTSTAT \
1375 | DIFF_FORMAT_SUMMARY \
1376 | DIFF_FORMAT_DIRSTAT \
1377 | DIFF_FORMAT_DIFFSTAT)
1379 /* find set of paths that every parent touches */
/*
 * Compute the combined path list by diffing `oid` against each entry of
 * `parents` in turn (diff_tree_oid) and folding every per-parent result
 * into `paths` with intersect_paths().
 *
 * opt->output_format and opt->orderfile are saved on entry, overridden
 * while the per-parent diffs run, and restored before the function ends:
 *   - orderfile is cleared so the tree diff emits paths in tree order;
 *   - output is suppressed, except that for the first parent the
 *     requested stat formats (STAT_FORMAT_MASK) are left enabled.
 *
 * combined_all_paths is passed through to intersect_paths() unchanged.
 *
 * NOTE(review): several lines of this function are missing from this
 * extract (among them whatever processes/flushes the diff queue after
 * each parent and the return statement) - confirm against the full
 * source before relying on this description.
 */
1380 static struct combine_diff_path
*find_paths_generic(const struct object_id
*oid
,
1381 const struct oid_array
*parents
,
1382 struct diff_options
*opt
,
1383 int combined_all_paths
)
1385 struct combine_diff_path
*paths
= NULL
;
1386 int i
, num_parent
= parents
->nr
;
/* remember the caller's settings; they are put back at the end */
1388 int output_format
= opt
->output_format
;
1389 const char *orderfile
= opt
->orderfile
;
1391 opt
->output_format
= DIFF_FORMAT_NO_OUTPUT
;
1392 /* tell diff_tree to emit paths in sorted (=tree) order */
1393 opt
->orderfile
= NULL
;
1395 /* D(A,P1...Pn) = D(A,P1) ^ ... ^ D(A,Pn) (wrt paths) */
1396 for (i
= 0; i
< num_parent
; i
++) {
1398 * show stat against the first parent even when doing
1401 int stat_opt
= output_format
& STAT_FORMAT_MASK
;
1402 if (i
== 0 && stat_opt
)
1403 opt
->output_format
= stat_opt
;
1405 opt
->output_format
= DIFF_FORMAT_NO_OUTPUT
;
1406 diff_tree_oid(&parents
->oid
[i
], oid
, "", opt
);
1408 paths
= intersect_paths(paths
, i
, num_parent
,
1409 combined_all_paths
);
1411 /* if showing diff, show it in requested order */
1412 if (opt
->output_format
!= DIFF_FORMAT_NO_OUTPUT
&&
1414 diffcore_order(orderfile
);
1420 opt
->output_format
= output_format
;
1421 opt
->orderfile
= orderfile
;
1427 * find set of paths that everybody touches, assuming diff is run without
1428 * rename/copy detection, etc, comparing all trees simultaneously (= faster).
/*
 * Compute the combined path list with a single diff_tree_paths() call
 * over all parents.
 *
 * diff_tree_paths() is given an array of pointers to the parent oids, so
 * a temporary array of nparent pointers into parents->oid[] is built
 * first.  Results are collected behind a dummy list head on the stack;
 * the function returns whatever ends up in paths_head.next.
 *
 * NOTE(review): the declaration of `base` and any release of
 * parents_oid are on lines missing from this extract - confirm against
 * the full source.
 */
1430 static struct combine_diff_path
*find_paths_multitree(
1431 const struct object_id
*oid
, const struct oid_array
*parents
,
1432 struct diff_options
*opt
)
1434 int i
, nparent
= parents
->nr
;
1435 const struct object_id
**parents_oid
;
1436 struct combine_diff_path paths_head
;
1439 ALLOC_ARRAY(parents_oid
, nparent
);
1440 for (i
= 0; i
< nparent
; i
++)
1441 parents_oid
[i
] = &parents
->oid
[i
];
1443 /* fake list head, so worker can assume it is non-NULL */
1444 paths_head
.next
= NULL
;
1446 strbuf_init(&base
, PATH_MAX
);
1447 diff_tree_paths(&paths_head
, oid
, parents_oid
, nparent
, &base
, opt
);
1449 strbuf_release(&base
);
1451 return paths_head
.next
;
/*
 * Test `path` against the object set `set`: first the merge result's oid,
 * then the oid recorded for each of the num_parent parents, using
 * oidset_contains().
 *
 * NOTE(review): the return statements are not visible in this extract.
 * combined_objfind() uses the result as a truth value, so presumably a
 * hit on any of the oids yields non-zero and no hit yields 0 - confirm.
 */
1454 static int match_objfind(struct combine_diff_path
*path
,
1456 const struct oidset
*set
)
1459 if (oidset_contains(set
, &path
->oid
))
1461 for (i
= 0; i
< num_parent
; i
++) {
1462 if (oidset_contains(set
, &path
->parent
[i
].oid
))
/*
 * Filter the `paths` list with match_objfind(), using opt->objfind as
 * the object set.  A result list is assembled through `ret` / `tail`;
 * each entry's successor is read into `next` before the entry is
 * examined.
 *
 * NOTE(review): the loop header, both branches of the match test and the
 * return statement are on lines missing from this extract, so what
 * happens to matching and non-matching entries cannot be confirmed from
 * here - check the full source.
 */
1468 static struct combine_diff_path
*combined_objfind(struct diff_options
*opt
,
1469 struct combine_diff_path
*paths
,
1472 struct combine_diff_path
*ret
= NULL
, **tail
= &ret
;
1473 struct combine_diff_path
*p
= paths
;
1476 struct combine_diff_path
*next
= p
->next
;
1478 if (match_objfind(p
, num_parent
, opt
->objfind
)) {
/*
 * Produce a combined diff of the tree `oid` against all trees listed in
 * `parents`, driven by the options in rev->diffopt.
 *
 * Visible flow:
 *   1. Optionally emit a separator line (line prefix + line terminator)
 *      after the log message when a verbose header is shown and some
 *      output format other than NO_OUTPUT is requested.
 *   2. Prepare a private diff_options (`diffopts`) with its own copy of
 *      the pathspec, recursion enabled and external diff disabled.
 *   3. Decide whether the slower generic path scan is required
 *      (need_generic_pathscan) and collect `paths` either with
 *      find_paths_generic() or with find_paths_multitree(); in the
 *      latter case the list is additionally filtered by
 *      combined_objfind() when an object-find pickaxe is active, and the
 *      stat formats are produced by diffing against the first parent
 *      only.
 *   4. Count the surviving paths and, when an orderfile is set, relink
 *      the list in the order produced by order_objects().
 *   5. Emit output: raw/name-status via show_raw_diff(), callback via
 *      handle_combined_callback(), patch via show_patch_diff().
 *   6. Release the path list (including per-parent path strbufs when
 *      rev->combined_all_paths is set and the status is a rename/copy)
 *      and the copied pathspec.
 *
 * NOTE(review): many lines of this function are missing from this
 * extract (early return for zero parents, initialisation of `diffopts`,
 * else/while headers, some conditions, the frees in the cleanup loop).
 * The branch structure described above is inferred from the order of the
 * visible statements - confirm against the full source.
 */
1491 void diff_tree_combined(const struct object_id
*oid
,
1492 const struct oid_array
*parents
,
1493 struct rev_info
*rev
)
1495 struct diff_options
*opt
= &rev
->diffopt
;
1496 struct diff_options diffopts
;
1497 struct combine_diff_path
*p
, *paths
;
1498 int i
, num_paths
, needsep
, show_log_first
, num_parent
= parents
->nr
;
1499 int need_generic_pathscan
;
1501 /* nothing to do, if no parents */
1505 show_log_first
= !!rev
->loginfo
&& !rev
->no_commit_id
;
1507 if (show_log_first
) {
1510 if (rev
->verbose_header
&& opt
->output_format
&&
1511 opt
->output_format
!= DIFF_FORMAT_NO_OUTPUT
&&
1512 !commit_format_is_empty(rev
->commit_format
))
1513 printf("%s%c", diff_line_prefix(opt
),
1514 opt
->line_termination
);
/* diffopts owns this pathspec copy; it is cleared at the very end */
1518 copy_pathspec(&diffopts
.pathspec
, &opt
->pathspec
);
1519 diffopts
.flags
.recursive
= 1;
1520 diffopts
.flags
.allow_external
= 0;
1522 /* find set of paths that everybody touches
1526 * Diffcore transformations are bound to diff_filespec and logic
1527 * comparing two entries - i.e. they do not apply directly to combine
1530 * If some of such transformations is requested - we launch generic
1531 * path scanning, which works significantly slower compared to
1532 * simultaneous all-trees-in-one-go scan in find_paths_multitree().
1534 * TODO some of the filters could be ported to work on
1535 * combine_diff_paths - i.e. all functionality that skips paths, so in
1536 * theory, we could end up having only multitree path scanning.
1538 * NOTE please keep this semantically in sync with diffcore_std()
1540 need_generic_pathscan
= opt
->skip_stat_unmatch
||
1541 opt
->flags
.follow_renames
||
1542 opt
->break_opt
!= -1 ||
1543 opt
->detect_rename
||
1544 (opt
->pickaxe_opts
&
1545 (DIFF_PICKAXE_KINDS_MASK
& ~DIFF_PICKAXE_KIND_OBJFIND
)) ||
1548 if (need_generic_pathscan
) {
1550 * NOTE generic case also handles --stat, as it computes
1551 * diff(sha1,parent_i) for all i to do the job, specifically
1554 paths
= find_paths_generic(oid
, parents
, &diffopts
,
1555 rev
->combined_all_paths
);
1559 paths
= find_paths_multitree(oid
, parents
, &diffopts
);
1561 if (opt
->pickaxe_opts
& DIFF_PICKAXE_KIND_OBJFIND
)
1562 paths
= combined_objfind(opt
, paths
, num_parent
);
1565 * show stat against the first parent even
1566 * when doing combined diff.
1568 stat_opt
= opt
->output_format
& STAT_FORMAT_MASK
;
1570 diffopts
.output_format
= stat_opt
;
1572 diff_tree_oid(&parents
->oid
[0], oid
, "", &diffopts
);
1573 diffcore_std(&diffopts
);
1575 diffcore_order(opt
->orderfile
);
1576 diff_flush(&diffopts
);
1580 /* find out number of surviving paths */
1581 for (num_paths
= 0, p
= paths
; p
; p
= p
->next
)
1584 /* order paths according to diffcore_order */
1585 if (opt
->orderfile
&& num_paths
) {
1586 struct obj_order
*o
;
1588 ALLOC_ARRAY(o
, num_paths
);
1589 for (i
= 0, p
= paths
; p
; p
= p
->next
, i
++)
1591 order_objects(opt
->orderfile
, path_path
, o
, num_paths
);
/* relink the list so that it follows the order now held in o[] */
1592 for (i
= 0; i
< num_paths
- 1; i
++) {
1594 p
->next
= o
[i
+1].obj
;
1597 p
= o
[num_paths
-1].obj
;
1605 if (opt
->output_format
& (DIFF_FORMAT_RAW
|
1607 DIFF_FORMAT_NAME_STATUS
)) {
1608 for (p
= paths
; p
; p
= p
->next
)
1609 show_raw_diff(p
, num_parent
, rev
);
1612 else if (opt
->output_format
& STAT_FORMAT_MASK
)
1614 else if (opt
->output_format
& DIFF_FORMAT_CALLBACK
)
1615 handle_combined_callback(opt
, paths
, num_parent
, num_paths
);
1617 if (opt
->output_format
& DIFF_FORMAT_PATCH
) {
1619 printf("%s%c", diff_line_prefix(opt
),
1620 opt
->line_termination
);
1621 for (p
= paths
; p
; p
= p
->next
)
1622 show_patch_diff(p
, num_parent
, 0, rev
);
1626 /* Clean things up */
1628 struct combine_diff_path
*tmp
= paths
;
1629 paths
= paths
->next
;
/*
 * The release below is guarded by the same two conditions under which
 * intersect_paths() initialises parent[].path.
 */
1630 for (i
= 0; i
< num_parent
; i
++)
1631 if (rev
->combined_all_paths
&&
1632 filename_changed(tmp
->parent
[i
].status
))
1633 strbuf_release(&tmp
->parent
[i
].path
);
/* drop the pathspec copy made by copy_pathspec() near the top */
1637 clear_pathspec(&diffopts
.pathspec
);
/*
 * Convenience wrapper around diff_tree_combined() for a commit object.
 *
 * The parent list comes from get_saved_parents(rev, commit); the oid of
 * each parent is appended to a temporary oid_array, diff_tree_combined()
 * is run for the commit's own oid against that array, and the array is
 * cleared afterwards.
 *
 * NOTE(review): the loop header that walks the parent list is on a line
 * missing from this extract - confirm against the full source.
 */
1640 void diff_tree_combined_merge(const struct commit
*commit
,
1641 struct rev_info
*rev
)
1643 struct commit_list
*parent
= get_saved_parents(rev
, commit
);
1644 struct oid_array parents
= OID_ARRAY_INIT
;
1647 oid_array_append(&parents
, &parent
->item
->object
.oid
);
1648 parent
= parent
->next
;
1650 diff_tree_combined(&commit
->object
.oid
, &parents
, rev
);
1651 oid_array_clear(&parents
);