2 * Copyright (C) 2005 Junio C Hamano
11 #include "xdiff-interface.h"
13 static int use_size_cache
;
15 int diff_rename_limit_default
= -1;
17 int git_diff_config(const char *var
, const char *value
)
19 if (!strcmp(var
, "diff.renamelimit")) {
20 diff_rename_limit_default
= git_config_int(var
, value
);
24 return git_default_config(var
, value
);
27 static char *quote_one(const char *str
)
34 needlen
= quote_c_style(str
, NULL
, NULL
, 0);
37 xp
= xmalloc(needlen
+ 1);
38 quote_c_style(str
, xp
, NULL
, 0);
/*
 * Concatenate two path fragments into a newly allocated string.
 *
 * If quote_c_style() reports a non-zero length for either fragment,
 * the result is both fragments run through quote_c_style() and wrapped
 * in a single pair of double quotes.  Otherwise the result is the
 * plain concatenation of the two strings.
 *
 * The buffer comes from xmalloc(); the caller owns it.
 *
 * NOTE(review): this relies on quote_c_style() returning 0 when the
 * input needs no quoting and, with its last argument set to 1, not
 * emitting the surrounding double quotes itself -- confirm against
 * its definition.
 */
static char *quote_two(const char *one, const char *two)
{
	int need_one = quote_c_style(one, NULL, NULL, 1);
	int need_two = quote_c_style(two, NULL, NULL, 1);
	char *xp;

	if (need_one + need_two) {
		/*
		 * A fragment that reported 0 is copied through as-is, so
		 * it occupies strlen() bytes in the output.  Each length
		 * must be fixed up independently: the second fix-up used
		 * to overwrite need_one, which undersized the buffer and
		 * misplaced both the second fragment and the closing
		 * quote whenever only the first fragment needed quoting.
		 */
		if (!need_one)
			need_one = strlen(one);
		if (!need_two)
			need_two = strlen(two);

		/* opening quote + both fragments + closing quote + NUL */
		xp = xmalloc(need_one + need_two + 3);
		xp[0] = '"';
		quote_c_style(one, xp + 1, NULL, 1);
		quote_c_style(two, xp + need_one + 1, NULL, 1);
		strcpy(xp + need_one + need_two + 1, "\"");
		return xp;
	}

	/* Neither fragment needs quoting: plain concatenation. */
	need_one = strlen(one);
	need_two = strlen(two);
	xp = xmalloc(need_one + need_two + 1);
	strcpy(xp, one);
	strcpy(xp + need_one, two);
	return xp;
}
67 static const char *external_diff(void)
69 static const char *external_diff_cmd
= NULL
;
70 static int done_preparing
= 0;
73 return external_diff_cmd
;
74 external_diff_cmd
= getenv("GIT_EXTERNAL_DIFF");
76 return external_diff_cmd
;
79 #define TEMPFILE_PATH_LEN 50
81 static struct diff_tempfile
{
82 const char *name
; /* filename external diff should read from */
85 char tmp_path
[TEMPFILE_PATH_LEN
];
88 static int count_lines(const char *data
, int size
)
90 int count
, ch
, completely_empty
= 1, nl_just_seen
= 0;
101 completely_empty
= 0;
104 if (completely_empty
)
107 count
++; /* no trailing newline */
111 static void print_line_count(int count
)
121 printf("1,%d", count
);
126 static void copy_file(int prefix
, const char *data
, int size
)
128 int ch
, nl_just_seen
= 1;
140 printf("\n\\ No newline at end of file\n");
143 static void emit_rewrite_diff(const char *name_a
,
145 struct diff_filespec
*one
,
146 struct diff_filespec
*two
)
149 diff_populate_filespec(one
, 0);
150 diff_populate_filespec(two
, 0);
151 lc_a
= count_lines(one
->data
, one
->size
);
152 lc_b
= count_lines(two
->data
, two
->size
);
153 printf("--- %s\n+++ %s\n@@ -", name_a
, name_b
);
154 print_line_count(lc_a
);
156 print_line_count(lc_b
);
159 copy_file('-', one
->data
, one
->size
);
161 copy_file('+', two
->data
, two
->size
);
164 static int fill_mmfile(mmfile_t
*mf
, struct diff_filespec
*one
)
166 if (!DIFF_FILE_VALID(one
)) {
167 mf
->ptr
= ""; /* does not matter */
171 else if (diff_populate_filespec(one
, 0))
174 mf
->size
= one
->size
;
178 struct emit_callback
{
179 const char **label_path
;
182 static int fn_out(void *priv
, mmbuffer_t
*mb
, int nbuf
)
185 struct emit_callback
*ecbdata
= priv
;
187 if (ecbdata
->label_path
[0]) {
188 printf("--- %s\n", ecbdata
->label_path
[0]);
189 printf("+++ %s\n", ecbdata
->label_path
[1]);
190 ecbdata
->label_path
[0] = ecbdata
->label_path
[1] = NULL
;
192 for (i
= 0; i
< nbuf
; i
++)
193 if (!fwrite(mb
[i
].ptr
, mb
[i
].size
, 1, stdout
))
199 struct xdiff_emit_state xm
;
203 struct diffstat_file
{
205 unsigned is_unmerged
:1;
206 unsigned is_binary
:1;
207 unsigned int added
, deleted
;
211 static struct diffstat_file
*diffstat_add(struct diffstat_t
*diffstat
,
214 struct diffstat_file
*x
;
215 x
= xcalloc(sizeof (*x
), 1);
216 if (diffstat
->nr
== diffstat
->alloc
) {
217 diffstat
->alloc
= alloc_nr(diffstat
->alloc
);
218 diffstat
->files
= xrealloc(diffstat
->files
,
219 diffstat
->alloc
* sizeof(x
));
221 diffstat
->files
[diffstat
->nr
++] = x
;
222 x
->name
= strdup(name
);
226 static void diffstat_consume(void *priv
, char *line
, unsigned long len
)
228 struct diffstat_t
*diffstat
= priv
;
229 struct diffstat_file
*x
= diffstat
->files
[diffstat
->nr
- 1];
233 else if (line
[0] == '-')
237 static const char pluses
[] = "++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++";
238 static const char minuses
[]= "----------------------------------------------------------------------";
240 static void show_stats(struct diffstat_t
* data
)
243 int i
, len
, add
, del
, total
, adds
= 0, dels
= 0;
244 int max
, max_change
= 0, max_len
= 0;
245 int total_files
= data
->nr
;
250 for (i
= 0; i
< data
->nr
; i
++) {
251 struct diffstat_file
*file
= data
->files
[i
];
253 len
= strlen(file
->name
);
257 if (file
->is_binary
|| file
->is_unmerged
)
259 if (max_change
< file
->added
+ file
->deleted
)
260 max_change
= file
->added
+ file
->deleted
;
263 for (i
= 0; i
< data
->nr
; i
++) {
264 char *name
= data
->files
[i
]->name
;
265 int added
= data
->files
[i
]->added
;
266 int deleted
= data
->files
[i
]->deleted
;
268 if (0 < (len
= quote_c_style(name
, NULL
, NULL
, 0))) {
269 char *qname
= xmalloc(len
+ 1);
270 quote_c_style(name
, qname
, NULL
, 0);
272 data
->files
[i
]->name
= name
= qname
;
276 * "scale" the filename
287 slash
= strchr(name
, '/');
294 * scale the add/delete
300 if (data
->files
[i
]->is_binary
) {
301 printf(" %s%-*s | Bin\n", prefix
, len
, name
);
302 goto free_diffstat_file
;
304 else if (data
->files
[i
]->is_unmerged
) {
305 printf(" %s%-*s | Unmerged\n", prefix
, len
, name
);
306 goto free_diffstat_file
;
308 else if (added
+ deleted
== 0) {
310 goto free_diffstat_file
;
319 if (max_change
> 0) {
320 total
= (total
* max
+ max_change
/ 2) / max_change
;
321 add
= (add
* max
+ max_change
/ 2) / max_change
;
324 printf(" %s%-*s |%5d %.*s%.*s\n", prefix
,
325 len
, name
, added
+ deleted
,
326 add
, pluses
, del
, minuses
);
328 free(data
->files
[i
]->name
);
329 free(data
->files
[i
]);
332 printf(" %d files changed, %d insertions(+), %d deletions(-)\n",
333 total_files
, adds
, dels
);
336 #define FIRST_FEW_BYTES 8000
337 static int mmfile_is_binary(mmfile_t
*mf
)
340 if (FIRST_FEW_BYTES
< sz
)
341 sz
= FIRST_FEW_BYTES
;
342 if (memchr(mf
->ptr
, 0, sz
))
347 static void builtin_diff(const char *name_a
,
349 struct diff_filespec
*one
,
350 struct diff_filespec
*two
,
351 const char *xfrm_msg
,
352 int complete_rewrite
)
358 a_one
= quote_two("a/", name_a
);
359 b_two
= quote_two("b/", name_b
);
360 lbl
[0] = DIFF_FILE_VALID(one
) ? a_one
: "/dev/null";
361 lbl
[1] = DIFF_FILE_VALID(two
) ? b_two
: "/dev/null";
362 printf("diff --git %s %s\n", a_one
, b_two
);
363 if (lbl
[0][0] == '/') {
365 printf("new file mode %06o\n", two
->mode
);
366 if (xfrm_msg
&& xfrm_msg
[0])
369 else if (lbl
[1][0] == '/') {
370 printf("deleted file mode %06o\n", one
->mode
);
371 if (xfrm_msg
&& xfrm_msg
[0])
375 if (one
->mode
!= two
->mode
) {
376 printf("old mode %06o\n", one
->mode
);
377 printf("new mode %06o\n", two
->mode
);
379 if (xfrm_msg
&& xfrm_msg
[0])
382 * we do not run diff between different kind
385 if ((one
->mode
^ two
->mode
) & S_IFMT
)
386 goto free_ab_and_return
;
387 if (complete_rewrite
) {
388 emit_rewrite_diff(name_a
, name_b
, one
, two
);
389 goto free_ab_and_return
;
393 if (fill_mmfile(&mf1
, one
) < 0 || fill_mmfile(&mf2
, two
) < 0)
394 die("unable to read files to diff");
396 if (mmfile_is_binary(&mf1
) || mmfile_is_binary(&mf2
))
397 printf("Binary files %s and %s differ\n", lbl
[0], lbl
[1]);
399 /* Crazy xdl interfaces.. */
400 const char *diffopts
= getenv("GIT_DIFF_OPTS");
404 struct emit_callback ecbdata
;
406 ecbdata
.label_path
= lbl
;
407 xpp
.flags
= XDF_NEED_MINIMAL
;
409 xecfg
.flags
= XDL_EMIT_FUNCNAMES
;
412 else if (!strncmp(diffopts
, "--unified=", 10))
413 xecfg
.ctxlen
= strtoul(diffopts
+ 10, NULL
, 10);
414 else if (!strncmp(diffopts
, "-u", 2))
415 xecfg
.ctxlen
= strtoul(diffopts
+ 2, NULL
, 10);
418 xdl_diff(&mf1
, &mf2
, &xpp
, &xecfg
, &ecb
);
427 static void builtin_diffstat(const char *name_a
, const char *name_b
,
428 struct diff_filespec
*one
, struct diff_filespec
*two
,
429 struct diffstat_t
*diffstat
)
432 struct diffstat_file
*data
;
434 data
= diffstat_add(diffstat
, name_a
? name_a
: name_b
);
437 data
->is_unmerged
= 1;
441 if (fill_mmfile(&mf1
, one
) < 0 || fill_mmfile(&mf2
, two
) < 0)
442 die("unable to read files to diff");
444 if (mmfile_is_binary(&mf1
) || mmfile_is_binary(&mf2
))
447 /* Crazy xdl interfaces.. */
452 xpp
.flags
= XDF_NEED_MINIMAL
;
455 ecb
.outf
= xdiff_outf
;
457 xdl_diff(&mf1
, &mf2
, &xpp
, &xecfg
, &ecb
);
461 struct diff_filespec
*alloc_filespec(const char *path
)
463 int namelen
= strlen(path
);
464 struct diff_filespec
*spec
= xmalloc(sizeof(*spec
) + namelen
+ 1);
466 memset(spec
, 0, sizeof(*spec
));
467 spec
->path
= (char *)(spec
+ 1);
468 memcpy(spec
->path
, path
, namelen
+1);
472 void fill_filespec(struct diff_filespec
*spec
, const unsigned char *sha1
,
476 spec
->mode
= canon_mode(mode
);
477 memcpy(spec
->sha1
, sha1
, 20);
478 spec
->sha1_valid
= !!memcmp(sha1
, null_sha1
, 20);
483 * Given a name and sha1 pair, if the dircache tells us the file in
484 * the work tree has that object contents, return true, so that
485 * prepare_temp_file() does not have to inflate and extract.
487 static int work_tree_matches(const char *name
, const unsigned char *sha1
)
489 struct cache_entry
*ce
;
493 /* We do not read the cache ourselves here, because the
494 * benchmark with my previous version that always reads cache
495 * shows that it makes things worse for diff-tree comparing
496 * two linux-2.6 kernel trees in an already checked out work
497 * tree. This is because most diff-tree comparisons deal with
498 * only a small number of files, while reading the cache is
499 * expensive for a large project, and its cost outweighs the
500 * savings we get by not inflating the object to a temporary
501 * file. Practically, this code only helps when we are used
502 * by diff-cache --cached, which does read the cache before
509 pos
= cache_name_pos(name
, len
);
512 ce
= active_cache
[pos
];
513 if ((lstat(name
, &st
) < 0) ||
514 !S_ISREG(st
.st_mode
) || /* careful! */
515 ce_match_stat(ce
, &st
, 0) ||
516 memcmp(sha1
, ce
->sha1
, 20))
518 /* we return 1 only when we can stat, it is a regular file,
519 * stat information matches, and sha1 recorded in the cache
520 * matches. I.e. we know the file in the work tree really is
521 * the same as the <name, sha1> pair.
526 static struct sha1_size_cache
{
527 unsigned char sha1
[20];
530 static int sha1_size_cache_nr
, sha1_size_cache_alloc
;
532 static struct sha1_size_cache
*locate_size_cache(unsigned char *sha1
,
537 struct sha1_size_cache
*e
;
540 last
= sha1_size_cache_nr
;
541 while (last
> first
) {
542 int cmp
, next
= (last
+ first
) >> 1;
543 e
= sha1_size_cache
[next
];
544 cmp
= memcmp(e
->sha1
, sha1
, 20);
556 /* insert to make it at "first" */
557 if (sha1_size_cache_alloc
<= sha1_size_cache_nr
) {
558 sha1_size_cache_alloc
= alloc_nr(sha1_size_cache_alloc
);
559 sha1_size_cache
= xrealloc(sha1_size_cache
,
560 sha1_size_cache_alloc
*
561 sizeof(*sha1_size_cache
));
563 sha1_size_cache_nr
++;
564 if (first
< sha1_size_cache_nr
)
565 memmove(sha1_size_cache
+ first
+ 1, sha1_size_cache
+ first
,
566 (sha1_size_cache_nr
- first
- 1) *
567 sizeof(*sha1_size_cache
));
568 e
= xmalloc(sizeof(struct sha1_size_cache
));
569 sha1_size_cache
[first
] = e
;
570 memcpy(e
->sha1
, sha1
, 20);
576 * While doing rename detection and pickaxe operation, we may need to
577 * grab the data for the blob (or file) for our own in-core comparison.
578 * diff_filespec has data and size fields for this purpose.
580 int diff_populate_filespec(struct diff_filespec
*s
, int size_only
)
583 if (!DIFF_FILE_VALID(s
))
584 die("internal error: asking to populate invalid file.");
585 if (S_ISDIR(s
->mode
))
593 if (!s
->sha1_valid
||
594 work_tree_matches(s
->path
, s
->sha1
)) {
597 if (lstat(s
->path
, &st
) < 0) {
598 if (errno
== ENOENT
) {
607 s
->size
= st
.st_size
;
612 if (S_ISLNK(st
.st_mode
)) {
614 s
->data
= xmalloc(s
->size
);
616 ret
= readlink(s
->path
, s
->data
, s
->size
);
623 fd
= open(s
->path
, O_RDONLY
);
626 s
->data
= mmap(NULL
, s
->size
, PROT_READ
, MAP_PRIVATE
, fd
, 0);
628 if (s
->data
== MAP_FAILED
)
630 s
->should_munmap
= 1;
634 struct sha1_size_cache
*e
;
637 e
= locate_size_cache(s
->sha1
, 1, 0);
642 if (!sha1_object_info(s
->sha1
, type
, &s
->size
))
643 locate_size_cache(s
->sha1
, 0, s
->size
);
646 s
->data
= read_sha1_file(s
->sha1
, type
, &s
->size
);
653 void diff_free_filespec_data(struct diff_filespec
*s
)
657 else if (s
->should_munmap
)
658 munmap(s
->data
, s
->size
);
659 s
->should_free
= s
->should_munmap
= 0;
665 static void prep_temp_blob(struct diff_tempfile
*temp
,
668 const unsigned char *sha1
,
673 fd
= git_mkstemp(temp
->tmp_path
, TEMPFILE_PATH_LEN
, ".diff_XXXXXX");
675 die("unable to create temp-file");
676 if (write(fd
, blob
, size
) != size
)
677 die("unable to write temp-file");
679 temp
->name
= temp
->tmp_path
;
680 strcpy(temp
->hex
, sha1_to_hex(sha1
));
682 sprintf(temp
->mode
, "%06o", mode
);
685 static void prepare_temp_file(const char *name
,
686 struct diff_tempfile
*temp
,
687 struct diff_filespec
*one
)
689 if (!DIFF_FILE_VALID(one
)) {
691 /* A '-' entry produces this for file-2, and
692 * a '+' entry produces this for file-1.
694 temp
->name
= "/dev/null";
695 strcpy(temp
->hex
, ".");
696 strcpy(temp
->mode
, ".");
700 if (!one
->sha1_valid
||
701 work_tree_matches(name
, one
->sha1
)) {
703 if (lstat(name
, &st
) < 0) {
705 goto not_a_valid_file
;
706 die("stat(%s): %s", name
, strerror(errno
));
708 if (S_ISLNK(st
.st_mode
)) {
710 char buf
[PATH_MAX
+ 1]; /* ought to be SYMLINK_MAX */
711 if (sizeof(buf
) <= st
.st_size
)
712 die("symlink too long: %s", name
);
713 ret
= readlink(name
, buf
, st
.st_size
);
715 die("readlink(%s)", name
);
716 prep_temp_blob(temp
, buf
, st
.st_size
,
718 one
->sha1
: null_sha1
),
720 one
->mode
: S_IFLNK
));
723 /* we can borrow from the file in the work tree */
725 if (!one
->sha1_valid
)
726 strcpy(temp
->hex
, sha1_to_hex(null_sha1
));
728 strcpy(temp
->hex
, sha1_to_hex(one
->sha1
));
729 /* Even though we may sometimes borrow the
730 * contents from the work tree, we always want
731 * one->mode. mode is trustworthy even when
732 * !(one->sha1_valid), as long as
733 * DIFF_FILE_VALID(one).
735 sprintf(temp
->mode
, "%06o", one
->mode
);
740 if (diff_populate_filespec(one
, 0))
741 die("cannot read data blob for %s", one
->path
);
742 prep_temp_blob(temp
, one
->data
, one
->size
,
743 one
->sha1
, one
->mode
);
747 static void remove_tempfile(void)
751 for (i
= 0; i
< 2; i
++)
752 if (diff_temp
[i
].name
== diff_temp
[i
].tmp_path
) {
753 unlink(diff_temp
[i
].name
);
754 diff_temp
[i
].name
= NULL
;
758 static void remove_tempfile_on_signal(int signo
)
761 signal(SIGINT
, SIG_DFL
);
765 static int spawn_prog(const char *pgm
, const char **arg
)
773 die("unable to fork");
775 execvp(pgm
, (char *const*) arg
);
779 while (waitpid(pid
, &status
, 0) < 0) {
785 /* Earlier we did not check the exit status because
786 * diff exits non-zero if files are different, and
787 * we are not interested in knowing that. It was a
788 * mistake which made it harder to quit a diff-*
789 * session that uses the git-apply-patch-script as
790 * the GIT_EXTERNAL_DIFF. A custom GIT_EXTERNAL_DIFF
791 * should also exit non-zero only when it wants to
792 * abort the entire diff-* session.
794 if (WIFEXITED(status
) && !WEXITSTATUS(status
))
799 /* An external diff command takes:
801 * diff-cmd name infile1 infile1-sha1 infile1-mode \
802 * infile2 infile2-sha1 infile2-mode [ rename-to ]
805 static void run_external_diff(const char *pgm
,
808 struct diff_filespec
*one
,
809 struct diff_filespec
*two
,
810 const char *xfrm_msg
,
811 int complete_rewrite
)
813 const char *spawn_arg
[10];
814 struct diff_tempfile
*temp
= diff_temp
;
816 static int atexit_asked
= 0;
817 const char *othername
;
818 const char **arg
= &spawn_arg
[0];
820 othername
= (other
? other
: name
);
822 prepare_temp_file(name
, &temp
[0], one
);
823 prepare_temp_file(othername
, &temp
[1], two
);
824 if (! atexit_asked
&&
825 (temp
[0].name
== temp
[0].tmp_path
||
826 temp
[1].name
== temp
[1].tmp_path
)) {
828 atexit(remove_tempfile
);
830 signal(SIGINT
, remove_tempfile_on_signal
);
836 *arg
++ = temp
[0].name
;
837 *arg
++ = temp
[0].hex
;
838 *arg
++ = temp
[0].mode
;
839 *arg
++ = temp
[1].name
;
840 *arg
++ = temp
[1].hex
;
841 *arg
++ = temp
[1].mode
;
851 retval
= spawn_prog(pgm
, spawn_arg
);
854 fprintf(stderr
, "external diff died, stopping at %s.\n", name
);
859 static void run_diff_cmd(const char *pgm
,
862 struct diff_filespec
*one
,
863 struct diff_filespec
*two
,
864 const char *xfrm_msg
,
865 int complete_rewrite
)
868 run_external_diff(pgm
, name
, other
, one
, two
, xfrm_msg
,
873 builtin_diff(name
, other
? other
: name
,
874 one
, two
, xfrm_msg
, complete_rewrite
);
876 printf("* Unmerged path %s\n", name
);
879 static void diff_fill_sha1_info(struct diff_filespec
*one
)
881 if (DIFF_FILE_VALID(one
)) {
882 if (!one
->sha1_valid
) {
884 if (lstat(one
->path
, &st
) < 0)
885 die("stat %s", one
->path
);
886 if (index_path(one
->sha1
, one
->path
, &st
, 0))
887 die("cannot hash %s\n", one
->path
);
891 memset(one
->sha1
, 0, 20);
894 static void run_diff(struct diff_filepair
*p
, struct diff_options
*o
)
896 const char *pgm
= external_diff();
897 char msg
[PATH_MAX
*2+300], *xfrm_msg
;
898 struct diff_filespec
*one
;
899 struct diff_filespec
*two
;
902 char *name_munged
, *other_munged
;
903 int complete_rewrite
= 0;
906 if (DIFF_PAIR_UNMERGED(p
)) {
908 run_diff_cmd(pgm
, p
->one
->path
, NULL
, NULL
, NULL
, NULL
, 0);
913 other
= (strcmp(name
, p
->two
->path
) ? p
->two
->path
: NULL
);
914 name_munged
= quote_one(name
);
915 other_munged
= quote_one(other
);
916 one
= p
->one
; two
= p
->two
;
918 diff_fill_sha1_info(one
);
919 diff_fill_sha1_info(two
);
923 case DIFF_STATUS_COPIED
:
924 len
+= snprintf(msg
+ len
, sizeof(msg
) - len
,
925 "similarity index %d%%\n"
928 (int)(0.5 + p
->score
* 100.0/MAX_SCORE
),
929 name_munged
, other_munged
);
931 case DIFF_STATUS_RENAMED
:
932 len
+= snprintf(msg
+ len
, sizeof(msg
) - len
,
933 "similarity index %d%%\n"
936 (int)(0.5 + p
->score
* 100.0/MAX_SCORE
),
937 name_munged
, other_munged
);
939 case DIFF_STATUS_MODIFIED
:
941 len
+= snprintf(msg
+ len
, sizeof(msg
) - len
,
942 "dissimilarity index %d%%\n",
943 (int)(0.5 + p
->score
*
945 complete_rewrite
= 1;
954 if (memcmp(one
->sha1
, two
->sha1
, 20)) {
956 int abbrev
= o
->full_index
? 40 : DEFAULT_ABBREV
;
957 memcpy(one_sha1
, sha1_to_hex(one
->sha1
), 41);
959 len
+= snprintf(msg
+ len
, sizeof(msg
) - len
,
961 abbrev
, one_sha1
, abbrev
,
962 sha1_to_hex(two
->sha1
));
963 if (one
->mode
== two
->mode
)
964 len
+= snprintf(msg
+ len
, sizeof(msg
) - len
,
966 len
+= snprintf(msg
+ len
, sizeof(msg
) - len
, "\n");
971 xfrm_msg
= len
? msg
: NULL
;
974 DIFF_FILE_VALID(one
) && DIFF_FILE_VALID(two
) &&
975 (S_IFMT
& one
->mode
) != (S_IFMT
& two
->mode
)) {
976 /* a filepair that changes between file and symlink
977 * needs to be split into deletion and creation.
979 struct diff_filespec
*null
= alloc_filespec(two
->path
);
980 run_diff_cmd(NULL
, name
, other
, one
, null
, xfrm_msg
, 0);
982 null
= alloc_filespec(one
->path
);
983 run_diff_cmd(NULL
, name
, other
, null
, two
, xfrm_msg
, 0);
987 run_diff_cmd(pgm
, name
, other
, one
, two
, xfrm_msg
,
994 static void run_diffstat(struct diff_filepair
*p
, struct diff_options
*o
,
995 struct diffstat_t
*diffstat
)
1000 if (DIFF_PAIR_UNMERGED(p
)) {
1002 builtin_diffstat(p
->one
->path
, NULL
, NULL
, NULL
, diffstat
);
1006 name
= p
->one
->path
;
1007 other
= (strcmp(name
, p
->two
->path
) ? p
->two
->path
: NULL
);
1009 diff_fill_sha1_info(p
->one
);
1010 diff_fill_sha1_info(p
->two
);
1012 builtin_diffstat(name
, other
, p
->one
, p
->two
, diffstat
);
1015 void diff_setup(struct diff_options
*options
)
1017 memset(options
, 0, sizeof(*options
));
1018 options
->output_format
= DIFF_FORMAT_RAW
;
1019 options
->line_termination
= '\n';
1020 options
->break_opt
= -1;
1021 options
->rename_limit
= -1;
1023 options
->change
= diff_change
;
1024 options
->add_remove
= diff_addremove
;
1027 int diff_setup_done(struct diff_options
*options
)
1029 if ((options
->find_copies_harder
&&
1030 options
->detect_rename
!= DIFF_DETECT_COPY
) ||
1031 (0 <= options
->rename_limit
&& !options
->detect_rename
))
1035 * These cases always need recursive; we do not drop caller-supplied
1036 * recursive bits for other formats here.
1038 if ((options
->output_format
== DIFF_FORMAT_PATCH
) ||
1039 (options
->output_format
== DIFF_FORMAT_DIFFSTAT
))
1040 options
->recursive
= 1;
1042 if (options
->detect_rename
&& options
->rename_limit
< 0)
1043 options
->rename_limit
= diff_rename_limit_default
;
1044 if (options
->setup
& DIFF_SETUP_USE_CACHE
) {
1046 /* read-cache does not die even when it fails
1047 * so it is safe for us to do this here. Also
1048 * it does not smudge active_cache or active_nr
1049 * when it fails, so we do not have to worry about
1050 * cleaning it up ourselves either.
1054 if (options
->setup
& DIFF_SETUP_USE_SIZE_CACHE
)
1056 if (options
->abbrev
<= 0 || 40 < options
->abbrev
)
1057 options
->abbrev
= 40; /* full */
1062 int diff_opt_parse(struct diff_options
*options
, const char **av
, int ac
)
1064 const char *arg
= av
[0];
1065 if (!strcmp(arg
, "-p") || !strcmp(arg
, "-u"))
1066 options
->output_format
= DIFF_FORMAT_PATCH
;
1067 else if (!strcmp(arg
, "--patch-with-raw")) {
1068 options
->output_format
= DIFF_FORMAT_PATCH
;
1069 options
->with_raw
= 1;
1071 else if (!strcmp(arg
, "--stat"))
1072 options
->output_format
= DIFF_FORMAT_DIFFSTAT
;
1073 else if (!strcmp(arg
, "--patch-with-stat")) {
1074 options
->output_format
= DIFF_FORMAT_PATCH
;
1075 options
->with_stat
= 1;
1077 else if (!strcmp(arg
, "-z"))
1078 options
->line_termination
= 0;
1079 else if (!strncmp(arg
, "-l", 2))
1080 options
->rename_limit
= strtoul(arg
+2, NULL
, 10);
1081 else if (!strcmp(arg
, "--full-index"))
1082 options
->full_index
= 1;
1083 else if (!strcmp(arg
, "--name-only"))
1084 options
->output_format
= DIFF_FORMAT_NAME
;
1085 else if (!strcmp(arg
, "--name-status"))
1086 options
->output_format
= DIFF_FORMAT_NAME_STATUS
;
1087 else if (!strcmp(arg
, "-R"))
1088 options
->reverse_diff
= 1;
1089 else if (!strncmp(arg
, "-S", 2))
1090 options
->pickaxe
= arg
+ 2;
1091 else if (!strcmp(arg
, "-s"))
1092 options
->output_format
= DIFF_FORMAT_NO_OUTPUT
;
1093 else if (!strncmp(arg
, "-O", 2))
1094 options
->orderfile
= arg
+ 2;
1095 else if (!strncmp(arg
, "--diff-filter=", 14))
1096 options
->filter
= arg
+ 14;
1097 else if (!strcmp(arg
, "--pickaxe-all"))
1098 options
->pickaxe_opts
= DIFF_PICKAXE_ALL
;
1099 else if (!strcmp(arg
, "--pickaxe-regex"))
1100 options
->pickaxe_opts
= DIFF_PICKAXE_REGEX
;
1101 else if (!strncmp(arg
, "-B", 2)) {
1102 if ((options
->break_opt
=
1103 diff_scoreopt_parse(arg
)) == -1)
1106 else if (!strncmp(arg
, "-M", 2)) {
1107 if ((options
->rename_score
=
1108 diff_scoreopt_parse(arg
)) == -1)
1110 options
->detect_rename
= DIFF_DETECT_RENAME
;
1112 else if (!strncmp(arg
, "-C", 2)) {
1113 if ((options
->rename_score
=
1114 diff_scoreopt_parse(arg
)) == -1)
1116 options
->detect_rename
= DIFF_DETECT_COPY
;
1118 else if (!strcmp(arg
, "--find-copies-harder"))
1119 options
->find_copies_harder
= 1;
1120 else if (!strcmp(arg
, "--abbrev"))
1121 options
->abbrev
= DEFAULT_ABBREV
;
1122 else if (!strncmp(arg
, "--abbrev=", 9)) {
1123 options
->abbrev
= strtoul(arg
+ 9, NULL
, 10);
1124 if (options
->abbrev
< MINIMUM_ABBREV
)
1125 options
->abbrev
= MINIMUM_ABBREV
;
1126 else if (40 < options
->abbrev
)
1127 options
->abbrev
= 40;
1134 static int parse_num(const char **cp_p
)
1136 unsigned long num
, scale
;
1138 const char *cp
= *cp_p
;
1145 if ( !dot
&& ch
== '.' ) {
1148 } else if ( ch
== '%' ) {
1149 scale
= dot
? scale
*100 : 100;
1150 cp
++; /* % is always at the end */
1152 } else if ( ch
>= '0' && ch
<= '9' ) {
1153 if ( scale
< 100000 ) {
1155 num
= (num
*10) + (ch
-'0');
1164 /* user says num divided by scale and we say internally that
1165 * is MAX_SCORE * num / scale.
1167 return (num
>= scale
) ? MAX_SCORE
: (MAX_SCORE
* num
/ scale
);
1170 int diff_scoreopt_parse(const char *opt
)
1172 int opt1
, opt2
, cmd
;
1177 if (cmd
!= 'M' && cmd
!= 'C' && cmd
!= 'B')
1178 return -1; /* that is not a -M, -C nor -B option */
1180 opt1
= parse_num(&opt
);
1186 else if (*opt
!= '/')
1187 return -1; /* we expect -B80/99 or -B80 */
1190 opt2
= parse_num(&opt
);
1195 return opt1
| (opt2
<< 16);
1198 struct diff_queue_struct diff_queued_diff
;
1200 void diff_q(struct diff_queue_struct
*queue
, struct diff_filepair
*dp
)
1202 if (queue
->alloc
<= queue
->nr
) {
1203 queue
->alloc
= alloc_nr(queue
->alloc
);
1204 queue
->queue
= xrealloc(queue
->queue
,
1205 sizeof(dp
) * queue
->alloc
);
1207 queue
->queue
[queue
->nr
++] = dp
;
1210 struct diff_filepair
*diff_queue(struct diff_queue_struct
*queue
,
1211 struct diff_filespec
*one
,
1212 struct diff_filespec
*two
)
1214 struct diff_filepair
*dp
= xmalloc(sizeof(*dp
));
1219 dp
->source_stays
= 0;
1220 dp
->broken_pair
= 0;
1226 void diff_free_filepair(struct diff_filepair
*p
)
1228 diff_free_filespec_data(p
->one
);
1229 diff_free_filespec_data(p
->two
);
1235 /* This is different from find_unique_abbrev() in that
1236 * it stuffs the result with dots for alignment.
1238 const char *diff_unique_abbrev(const unsigned char *sha1
, int len
)
1243 return sha1_to_hex(sha1
);
1245 abbrev
= find_unique_abbrev(sha1
, len
);
1247 return sha1_to_hex(sha1
);
1248 abblen
= strlen(abbrev
);
1250 static char hex
[41];
1251 if (len
< abblen
&& abblen
<= len
+ 2)
1252 sprintf(hex
, "%s%.*s", abbrev
, len
+3-abblen
, "..");
1254 sprintf(hex
, "%s...", abbrev
);
1257 return sha1_to_hex(sha1
);
1260 static void diff_flush_raw(struct diff_filepair
*p
,
1261 int line_termination
,
1262 int inter_name_termination
,
1263 struct diff_options
*options
,
1268 int abbrev
= options
->abbrev
;
1269 const char *path_one
, *path_two
;
1271 path_one
= p
->one
->path
;
1272 path_two
= p
->two
->path
;
1273 if (line_termination
) {
1274 path_one
= quote_one(path_one
);
1275 path_two
= quote_one(path_two
);
1279 sprintf(status
, "%c%03d", p
->status
,
1280 (int)(0.5 + p
->score
* 100.0/MAX_SCORE
));
1282 status
[0] = p
->status
;
1285 switch (p
->status
) {
1286 case DIFF_STATUS_COPIED
:
1287 case DIFF_STATUS_RENAMED
:
1290 case DIFF_STATUS_ADDED
:
1291 case DIFF_STATUS_DELETED
:
1298 if (output_format
!= DIFF_FORMAT_NAME_STATUS
) {
1299 printf(":%06o %06o %s ",
1300 p
->one
->mode
, p
->two
->mode
,
1301 diff_unique_abbrev(p
->one
->sha1
, abbrev
));
1303 diff_unique_abbrev(p
->two
->sha1
, abbrev
));
1305 printf("%s%c%s", status
, inter_name_termination
, path_one
);
1307 printf("%c%s", inter_name_termination
, path_two
);
1308 putchar(line_termination
);
1309 if (path_one
!= p
->one
->path
)
1310 free((void*)path_one
);
1311 if (path_two
!= p
->two
->path
)
1312 free((void*)path_two
);
1315 static void diff_flush_name(struct diff_filepair
*p
,
1316 int inter_name_termination
,
1317 int line_termination
)
1319 char *path
= p
->two
->path
;
1321 if (line_termination
)
1322 path
= quote_one(p
->two
->path
);
1324 path
= p
->two
->path
;
1325 printf("%s%c", path
, line_termination
);
1326 if (p
->two
->path
!= path
)
1330 int diff_unmodified_pair(struct diff_filepair
*p
)
1332 /* This function is written stricter than necessary to support
1333 * the currently implemented transformers, but the idea is to
1334 * let transformers to produce diff_filepairs any way they want,
1335 * and filter and clean them up here before producing the output.
1337 struct diff_filespec
*one
, *two
;
1339 if (DIFF_PAIR_UNMERGED(p
))
1340 return 0; /* unmerged is interesting */
1345 /* deletion, addition, mode or type change
1346 * and rename are all interesting.
1348 if (DIFF_FILE_VALID(one
) != DIFF_FILE_VALID(two
) ||
1349 DIFF_PAIR_MODE_CHANGED(p
) ||
1350 strcmp(one
->path
, two
->path
))
1353 /* both are valid and point at the same path. that is, we are
1354 * dealing with a change.
1356 if (one
->sha1_valid
&& two
->sha1_valid
&&
1357 !memcmp(one
->sha1
, two
->sha1
, sizeof(one
->sha1
)))
1358 return 1; /* no change */
1359 if (!one
->sha1_valid
&& !two
->sha1_valid
)
1360 return 1; /* both look at the same file on the filesystem. */
1364 static void diff_flush_patch(struct diff_filepair
*p
, struct diff_options
*o
)
1366 if (diff_unmodified_pair(p
))
1369 if ((DIFF_FILE_VALID(p
->one
) && S_ISDIR(p
->one
->mode
)) ||
1370 (DIFF_FILE_VALID(p
->two
) && S_ISDIR(p
->two
->mode
)))
1371 return; /* no tree diffs in patch format */
1376 static void diff_flush_stat(struct diff_filepair
*p
, struct diff_options
*o
,
1377 struct diffstat_t
*diffstat
)
1379 if (diff_unmodified_pair(p
))
1382 if ((DIFF_FILE_VALID(p
->one
) && S_ISDIR(p
->one
->mode
)) ||
1383 (DIFF_FILE_VALID(p
->two
) && S_ISDIR(p
->two
->mode
)))
1384 return; /* no tree diffs in patch format */
1386 run_diffstat(p
, o
, diffstat
);
1389 int diff_queue_is_empty(void)
1391 struct diff_queue_struct
*q
= &diff_queued_diff
;
1393 for (i
= 0; i
< q
->nr
; i
++)
1394 if (!diff_unmodified_pair(q
->queue
[i
]))
1400 void diff_debug_filespec(struct diff_filespec
*s
, int x
, const char *one
)
1402 fprintf(stderr
, "queue[%d] %s (%s) %s %06o %s\n",
1405 DIFF_FILE_VALID(s
) ? "valid" : "invalid",
1407 s
->sha1_valid
? sha1_to_hex(s
->sha1
) : "");
1408 fprintf(stderr
, "queue[%d] %s size %lu flags %d\n",
1410 s
->size
, s
->xfrm_flags
);
1413 void diff_debug_filepair(const struct diff_filepair
*p
, int i
)
1415 diff_debug_filespec(p
->one
, i
, "one");
1416 diff_debug_filespec(p
->two
, i
, "two");
1417 fprintf(stderr
, "score %d, status %c stays %d broken %d\n",
1418 p
->score
, p
->status
? p
->status
: '?',
1419 p
->source_stays
, p
->broken_pair
);
1422 void diff_debug_queue(const char *msg
, struct diff_queue_struct
*q
)
1426 fprintf(stderr
, "%s\n", msg
);
1427 fprintf(stderr
, "q->nr = %d\n", q
->nr
);
1428 for (i
= 0; i
< q
->nr
; i
++) {
1429 struct diff_filepair
*p
= q
->queue
[i
];
1430 diff_debug_filepair(p
, i
);
1435 static void diff_resolve_rename_copy(void)
1438 struct diff_filepair
*p
, *pp
;
1439 struct diff_queue_struct
*q
= &diff_queued_diff
;
1441 diff_debug_queue("resolve-rename-copy", q
);
1443 for (i
= 0; i
< q
->nr
; i
++) {
1445 p
->status
= 0; /* undecided */
1446 if (DIFF_PAIR_UNMERGED(p
))
1447 p
->status
= DIFF_STATUS_UNMERGED
;
1448 else if (!DIFF_FILE_VALID(p
->one
))
1449 p
->status
= DIFF_STATUS_ADDED
;
1450 else if (!DIFF_FILE_VALID(p
->two
))
1451 p
->status
= DIFF_STATUS_DELETED
;
1452 else if (DIFF_PAIR_TYPE_CHANGED(p
))
1453 p
->status
= DIFF_STATUS_TYPE_CHANGED
;
1455 /* from this point on, we are dealing with a pair
1456 * whose both sides are valid and of the same type, i.e.
1457 * either in-place edit or rename/copy edit.
1459 else if (DIFF_PAIR_RENAME(p
)) {
1460 if (p
->source_stays
) {
1461 p
->status
= DIFF_STATUS_COPIED
;
1464 /* See if there is some other filepair that
1465 * copies from the same source as us. If so
1466 * we are a copy. Otherwise we are either a
1467 * copy if the path stays, or a rename if it
1468 * does not, but we already handled "stays" case.
1470 for (j
= i
+ 1; j
< q
->nr
; j
++) {
1472 if (strcmp(pp
->one
->path
, p
->one
->path
))
1473 continue; /* not us */
1474 if (!DIFF_PAIR_RENAME(pp
))
1475 continue; /* not a rename/copy */
1476 /* pp is a rename/copy from the same source */
1477 p
->status
= DIFF_STATUS_COPIED
;
1481 p
->status
= DIFF_STATUS_RENAMED
;
1483 else if (memcmp(p
->one
->sha1
, p
->two
->sha1
, 20) ||
1484 p
->one
->mode
!= p
->two
->mode
)
1485 p
->status
= DIFF_STATUS_MODIFIED
;
1487 /* This is a "no-change" entry and should not
1488 * happen anymore, but prepare for broken callers.
1490 error("feeding unmodified %s to diffcore",
1492 p
->status
= DIFF_STATUS_UNKNOWN
;
1495 diff_debug_queue("resolve-rename-copy done", q
);
1498 static void flush_one_pair(struct diff_filepair
*p
,
1499 int diff_output_format
,
1500 struct diff_options
*options
,
1501 struct diffstat_t
*diffstat
)
1503 int inter_name_termination
= '\t';
1504 int line_termination
= options
->line_termination
;
1505 if (!line_termination
)
1506 inter_name_termination
= 0;
1508 switch (p
->status
) {
1509 case DIFF_STATUS_UNKNOWN
:
1512 die("internal error in diff-resolve-rename-copy");
1515 switch (diff_output_format
) {
1516 case DIFF_FORMAT_DIFFSTAT
:
1517 diff_flush_stat(p
, options
, diffstat
);
1519 case DIFF_FORMAT_PATCH
:
1520 diff_flush_patch(p
, options
);
1522 case DIFF_FORMAT_RAW
:
1523 case DIFF_FORMAT_NAME_STATUS
:
1524 diff_flush_raw(p
, line_termination
,
1525 inter_name_termination
,
1526 options
, diff_output_format
);
1528 case DIFF_FORMAT_NAME
:
1530 inter_name_termination
,
1533 case DIFF_FORMAT_NO_OUTPUT
:
1539 void diff_flush(struct diff_options
*options
)
1541 struct diff_queue_struct
*q
= &diff_queued_diff
;
1543 int diff_output_format
= options
->output_format
;
1544 struct diffstat_t
*diffstat
= NULL
;
1546 if (diff_output_format
== DIFF_FORMAT_DIFFSTAT
|| options
->with_stat
) {
1547 diffstat
= xcalloc(sizeof (struct diffstat_t
), 1);
1548 diffstat
->xm
.consume
= diffstat_consume
;
1551 if (options
->with_raw
) {
1552 for (i
= 0; i
< q
->nr
; i
++) {
1553 struct diff_filepair
*p
= q
->queue
[i
];
1554 flush_one_pair(p
, DIFF_FORMAT_RAW
, options
, NULL
);
1556 putchar(options
->line_termination
);
1558 if (options
->with_stat
) {
1559 for (i
= 0; i
< q
->nr
; i
++) {
1560 struct diff_filepair
*p
= q
->queue
[i
];
1561 flush_one_pair(p
, DIFF_FORMAT_DIFFSTAT
, options
,
1564 show_stats(diffstat
);
1567 putchar(options
->line_termination
);
1569 for (i
= 0; i
< q
->nr
; i
++) {
1570 struct diff_filepair
*p
= q
->queue
[i
];
1571 flush_one_pair(p
, diff_output_format
, options
, diffstat
);
1572 diff_free_filepair(p
);
1576 show_stats(diffstat
);
1582 q
->nr
= q
->alloc
= 0;
1585 static void diffcore_apply_filter(const char *filter
)
1588 struct diff_queue_struct
*q
= &diff_queued_diff
;
1589 struct diff_queue_struct outq
;
1591 outq
.nr
= outq
.alloc
= 0;
1596 if (strchr(filter
, DIFF_STATUS_FILTER_AON
)) {
1598 for (i
= found
= 0; !found
&& i
< q
->nr
; i
++) {
1599 struct diff_filepair
*p
= q
->queue
[i
];
1600 if (((p
->status
== DIFF_STATUS_MODIFIED
) &&
1602 strchr(filter
, DIFF_STATUS_FILTER_BROKEN
)) ||
1604 strchr(filter
, DIFF_STATUS_MODIFIED
)))) ||
1605 ((p
->status
!= DIFF_STATUS_MODIFIED
) &&
1606 strchr(filter
, p
->status
)))
1612 /* otherwise we will clear the whole queue
1613 * by copying the empty outq at the end of this
1614 * function, but first clear the current entries
1617 for (i
= 0; i
< q
->nr
; i
++)
1618 diff_free_filepair(q
->queue
[i
]);
1621 /* Only the matching ones */
1622 for (i
= 0; i
< q
->nr
; i
++) {
1623 struct diff_filepair
*p
= q
->queue
[i
];
1625 if (((p
->status
== DIFF_STATUS_MODIFIED
) &&
1627 strchr(filter
, DIFF_STATUS_FILTER_BROKEN
)) ||
1629 strchr(filter
, DIFF_STATUS_MODIFIED
)))) ||
1630 ((p
->status
!= DIFF_STATUS_MODIFIED
) &&
1631 strchr(filter
, p
->status
)))
1634 diff_free_filepair(p
);
1641 void diffcore_std(struct diff_options
*options
)
1643 if (options
->break_opt
!= -1)
1644 diffcore_break(options
->break_opt
);
1645 if (options
->detect_rename
)
1646 diffcore_rename(options
);
1647 if (options
->break_opt
!= -1)
1648 diffcore_merge_broken();
1649 if (options
->pickaxe
)
1650 diffcore_pickaxe(options
->pickaxe
, options
->pickaxe_opts
);
1651 if (options
->orderfile
)
1652 diffcore_order(options
->orderfile
);
1653 diff_resolve_rename_copy();
1654 diffcore_apply_filter(options
->filter
);
1658 void diffcore_std_no_resolve(struct diff_options
*options
)
1660 if (options
->pickaxe
)
1661 diffcore_pickaxe(options
->pickaxe
, options
->pickaxe_opts
);
1662 if (options
->orderfile
)
1663 diffcore_order(options
->orderfile
);
1664 diffcore_apply_filter(options
->filter
);
1667 void diff_addremove(struct diff_options
*options
,
1668 int addremove
, unsigned mode
,
1669 const unsigned char *sha1
,
1670 const char *base
, const char *path
)
1672 char concatpath
[PATH_MAX
];
1673 struct diff_filespec
*one
, *two
;
1675 /* This may look odd, but it is a preparation for
1676 * feeding "there are unchanged files which should
1677 * not produce diffs, but when you are doing copy
1678 * detection you would need them, so here they are"
1679 * entries to the diff-core. They will be prefixed
1680 * with something like '=' or '*' (I haven't decided
1681 * which but should not make any difference).
1682 * Feeding the same new and old to diff_change()
1683 * also has the same effect.
1684 * Before the final output happens, they are pruned after
1685 * merged into rename/copy pairs as appropriate.
1687 if (options
->reverse_diff
)
1688 addremove
= (addremove
== '+' ? '-' :
1689 addremove
== '-' ? '+' : addremove
);
1691 if (!path
) path
= "";
1692 sprintf(concatpath
, "%s%s", base
, path
);
1693 one
= alloc_filespec(concatpath
);
1694 two
= alloc_filespec(concatpath
);
1696 if (addremove
!= '+')
1697 fill_filespec(one
, sha1
, mode
);
1698 if (addremove
!= '-')
1699 fill_filespec(two
, sha1
, mode
);
1701 diff_queue(&diff_queued_diff
, one
, two
);
1704 void diff_change(struct diff_options
*options
,
1705 unsigned old_mode
, unsigned new_mode
,
1706 const unsigned char *old_sha1
,
1707 const unsigned char *new_sha1
,
1708 const char *base
, const char *path
)
1710 char concatpath
[PATH_MAX
];
1711 struct diff_filespec
*one
, *two
;
1713 if (options
->reverse_diff
) {
1715 const unsigned char *tmp_c
;
1716 tmp
= old_mode
; old_mode
= new_mode
; new_mode
= tmp
;
1717 tmp_c
= old_sha1
; old_sha1
= new_sha1
; new_sha1
= tmp_c
;
1719 if (!path
) path
= "";
1720 sprintf(concatpath
, "%s%s", base
, path
);
1721 one
= alloc_filespec(concatpath
);
1722 two
= alloc_filespec(concatpath
);
1723 fill_filespec(one
, old_sha1
, old_mode
);
1724 fill_filespec(two
, new_sha1
, new_mode
);
1726 diff_queue(&diff_queued_diff
, one
, two
);
/*
 * Queue a filepair for `path` in diff_queued_diff.  Both sides are
 * freshly allocated with alloc_filespec(path); the visible code calls
 * fill_filespec() on neither side.
 * NOTE(review): part of the parameter list is not visible in this
 * excerpt -- `path` is presumably a const char * parameter; confirm
 * against the full file.
 */
1729 void diff_unmerge(struct diff_options
*options
,
1732 struct diff_filespec
*one
, *two
;
1733 one
= alloc_filespec(path
);
1734 two
= alloc_filespec(path
);
1735 diff_queue(&diff_queued_diff
, one
, two
);