2 * Copyright (C) 2005 Junio C Hamano
13 * The diff API is for programs that compare two sets of files (e.g. two trees,
14 * one tree and the index) and present the found difference in various ways.
15 * The calling program is responsible for feeding the API pairs of files, one
16 * from the "old" set and the corresponding one from "new" set, that are
18 * The library called through this API is called diffcore, and is responsible
21 * - finding total rewrites (`-B`), renames (`-M`) and copies (`-C`), and
22 * changes that touch a string (`-S`), as specified by the caller.
24 * - outputting the differences in various formats, as specified by the caller.
29 * - Prepare `struct diff_options` to record the set of diff options, and then
30 * call `repo_diff_setup()` to initialize this structure. This sets up the
33 * - Fill in the options structure to specify desired output format, rename
34 * detection, etc. `diff_opt_parse()` can be used to parse options given
35 * from the command line in a way consistent with existing git-diff family
38 * - Call `diff_setup_done()`; this inspects the options set up so far for
39 * internal consistency and makes any necessary tweaks to them (e.g. if textual
40 * patch output was asked for, recursive behaviour is turned on); the callback
41 * set_default in diff_options can be used to tweak this more.
43 * - As you find different pairs of files, call `diff_change()` to feed
44 * modified files, `diff_addremove()` to feed created or deleted files, or
45 * `diff_unmerge()` to feed a file whose state is 'unmerged' to the API.
46 * These are thin wrappers to a lower-level `diff_queue()` function that is
47 * flexible enough to record any of these kinds of changes.
49 * - Once you finish feeding the pairs of files, call `diffcore_std()`.
50 * This will tell the diffcore library to go ahead and do its work.
52 * - Calling `diff_flush()` will produce the output; it will call
53 * `diff_free()` to free any resources, e.g. those allocated in
56 * - Set `.no_free = 1` before calling `diff_flush()` to defer the
57 * freeing of allocated memory in diff_options. This is useful when
58 * `diff_flush()` is being called in a loop, rather than as a
59 * one-off. When setting `.no_free = 1` you must ensure that
60 * `diff_free()` is called at the end, either by flipping the flag
61 * before the last `diff_flush()` call, or by flipping it before
62 * calling `diff_free()` yourself.
/* Forward declarations for types that prototypes in this header refer to. */
struct combine_diff_path;
struct diff_queue_struct;
struct userdiff_driver;
/*
 * Callback that is handed the diff options and one combine_diff_path
 * entry and reports its result as an int.
 */
typedef int (*pathchange_fn_t)(struct diff_options *options,
			       struct combine_diff_path *path);
79 typedef void (*change_fn_t
)(struct diff_options
*options
,
80 unsigned old_mode
, unsigned new_mode
,
81 const struct object_id
*old_oid
,
82 const struct object_id
*new_oid
,
83 int old_oid_valid
, int new_oid_valid
,
85 unsigned old_dirty_submodule
, unsigned new_dirty_submodule
);
87 typedef void (*add_remove_fn_t
)(struct diff_options
*options
,
88 int addremove
, unsigned mode
,
89 const struct object_id
*oid
,
91 const char *fullpath
, unsigned dirty_submodule
);
/*
 * Callback that is handed a diff queue, the diff options and an opaque
 * `data` pointer; it returns nothing. struct diff_options stores one of
 * these as `format_callback`, next to a `format_callback_data` pointer.
 */
typedef void (*diff_format_fn_t)(struct diff_queue_struct *q,
				 struct diff_options *options,
				 void *data);
/*
 * Callback that is handed the diff options and an opaque `data` pointer
 * and returns a pointer to a strbuf. struct diff_options stores one of
 * these as `output_prefix`, next to an `output_prefix_data` pointer.
 */
typedef struct strbuf *(*diff_prefix_fn_t)(struct diff_options *opt,
					   void *data);
/* Output format bits; every format has a bit of its own. */
#define DIFF_FORMAT_RAW		(1 << 0)
#define DIFF_FORMAT_DIFFSTAT	(1 << 1)
#define DIFF_FORMAT_NUMSTAT	(1 << 2)
#define DIFF_FORMAT_SUMMARY	(1 << 3)
#define DIFF_FORMAT_PATCH	(1 << 4)
#define DIFF_FORMAT_SHORTSTAT	(1 << 5)
#define DIFF_FORMAT_DIRSTAT	(1 << 6)

/* These override all above */
#define DIFF_FORMAT_NAME	(1 << 8)
#define DIFF_FORMAT_NAME_STATUS	(1 << 9)
#define DIFF_FORMAT_CHECKDIFF	(1 << 10)

/*
 * Same as output_format = 0, but we know that the -s flag was given
 * and we should not give a default value to output_format.
 */
#define DIFF_FORMAT_NO_OUTPUT	(1 << 11)

#define DIFF_FORMAT_CALLBACK	(1 << 12)
/*
 * Brace initializer that zeroes the aggregate it is applied to
 * (presumably a struct diff_flags, going by the name).
 */
#define DIFF_FLAGS_INIT {0}
122 * Tells whether the tree traversal done by tree-diff should recursively descend
123 * into a pair of tree objects that differ between the preimage and postimage sets.
126 unsigned tree_in_recursive
;
128 /* Affects how a file that is seemingly binary is treated. */
133 * Tells the patch output format not to use abbreviated object names on the
138 /* Affects whether diff-files shows removed files. */
139 unsigned silent_on_remove
;
142 * Tells the diffcore library that the caller is feeding unchanged
143 * filepairs to allow copies from unmodified files to be detected.
145 unsigned find_copies_harder
;
147 unsigned follow_renames
;
148 unsigned rename_empty
;
150 /* Internal; used for optimization to see if there is any change. */
151 unsigned has_changes
;
156 * Tells diff-files that the input is not tracked files but files in random
157 * locations on the filesystem.
162 * Tells the output routine that it is OK to call a user-specified patch output
163 * routine. Plumbing disables this to ensure stable output.
165 unsigned allow_external
;
168 * For communication between the calling program and the options parser;
169 * tell the calling program to signal the presence of difference using
172 unsigned exit_with_status
;
175 * Tells the library that the calling program is feeding the filepairs
176 * reversed; `one` is two, and `two` is one.
178 unsigned reverse_diff
;
180 unsigned check_failed
;
181 unsigned relative_name
;
182 unsigned ignore_submodules
;
183 unsigned dirstat_cumulative
;
184 unsigned dirstat_by_file
;
185 unsigned allow_textconv
;
186 unsigned textconv_set_via_cmdline
;
187 unsigned diff_from_contents
;
188 unsigned dirty_submodules
;
189 unsigned ignore_untracked_in_submodules
;
190 unsigned ignore_submodule_set
;
191 unsigned ignore_dirty_submodules
;
192 unsigned override_submodule_config
;
193 unsigned dirstat_by_line
;
194 unsigned funccontext
;
195 unsigned default_follow_renames
;
196 unsigned stat_with_summary
;
197 unsigned suppress_diff_headers
;
198 unsigned dual_color_diffed_diffs
;
199 unsigned suppress_hunk_header_line_count
;
202 static inline void diff_flags_or(struct diff_flags
*a
,
203 const struct diff_flags
*b
)
205 char *tmp_a
= (char *)a
;
206 const char *tmp_b
= (const char *)b
;
209 for (i
= 0; i
< sizeof(struct diff_flags
); i
++)
210 tmp_a
[i
] |= tmp_b
[i
];
/*
 * Helpers for the XDF_* bits kept in `(opts)->xdl_opts`. `flag` is given
 * without its XDF_ prefix; the prefix is pasted on here.
 */

/* Non-zero when XDF_<flag> is set in xdl_opts. */
#define DIFF_XDL_TST(opts, flag) \
	((opts)->xdl_opts & XDF_##flag)

/* Turn XDF_<flag> on in xdl_opts. */
#define DIFF_XDL_SET(opts, flag) \
	((opts)->xdl_opts |= XDF_##flag)

/* Turn XDF_<flag> off in xdl_opts. */
#define DIFF_XDL_CLR(opts, flag) \
	((opts)->xdl_opts &= ~XDF_##flag)

/*
 * Value of xdl_opts with the XDF_DIFF_ALGORITHM_MASK bits cleared and
 * XDF_<flag> set instead; `opts` itself is left untouched.
 */
#define DIFF_WITH_ALG(opts, flag) \
	(((opts)->xdl_opts & ~XDF_DIFF_ALGORITHM_MASK) | XDF_##flag)
219 enum diff_words_type
{
221 DIFF_WORDS_PORCELAIN
,
226 enum diff_submodule_format
{
227 DIFF_SUBMODULE_SHORT
= 0,
229 DIFF_SUBMODULE_INLINE_DIFF
233 * The set of options with which the calling program wants to affect the
234 * operation of the diffcore library.
236 struct diff_options
{
237 const char *orderfile
;
240 * "--rotate-to=<file>" would start showing at <file> and when
241 * the output reaches the end, wrap around by default.
242 * Setting skip_instead_of_rotate to true stops the output at the
243 * end, effectively discarding the earlier part of the output
244 * before <file>'s diff (this is used to implement the
245 * "--skip-to=<file>" option).
247 * When rotate_to_strict is set, it is an error if there is no
248 * <file> in the diff. Otherwise, the output starts at the
249 * path that is the same as, or first path that sorts after,
250 * <file>. Because it is unreasonable to require the exact
251 * match for "git log -p --rotate-to=<file>" (i.e. not all
252 * commits would touch that single <file>), "git log" sets it
253 * to false. "git diff" sets it to true to detect an error
254 * in the command line option.
256 const char *rotate_to
;
257 int skip_instead_of_rotate
;
258 int rotate_to_strict
;
261 * A constant string (can and typically does contain newlines to look for
262 * a block of text, not just a single line) used to filter out the filepairs
263 * in the diff_queue that do not change the number of occurrences of the
264 * string between their preimage and postimage.
267 unsigned pickaxe_opts
;
270 regex_t
**ignore_regex
;
271 size_t ignore_regex_nr
, ignore_regex_alloc
;
273 const char *single_follow
;
274 const char *a_prefix
, *b_prefix
;
275 const char *line_prefix
;
276 size_t line_prefix_length
;
279 * A collection of boolean options that affect the operation; some of them
280 * do not have anything to do with the diffcore library.
282 struct diff_flags flags
;
284 /* diff-filter bits */
285 unsigned int filter
, filter_not
;
289 /* Number of context lines to generate in patch output. */
292 int interhunkcontext
;
294 /* Affects the way detection logic for complete rewrites, renames and
300 int irreversible_delete
;
301 int skip_stat_unmatch
;
302 int line_termination
;
304 /* The output format used when `diff_flush()` is run. */
307 /* Affects the way detection logic for complete rewrites, renames and
313 int needed_rename_limit
;
314 int degraded_cc_to_c
;
315 int show_rename_progress
;
316 int dirstat_permille
;
319 /* Number of hexdigits to abbreviate raw format output to. */
322 /* If non-zero, then stop computing after this many changes. */
325 int ita_invisible_in_index
;
326 /* white-space error highlighting */
327 #define WSEH_NEW (1<<12)
328 #define WSEH_CONTEXT (1<<13)
329 #define WSEH_OLD (1<<14)
330 unsigned ws_error_highlight
;
333 const char *stat_sep
;
335 int ignore_driver_algorithm
;
337 /* see Documentation/diff-options.txt */
339 size_t anchors_nr
, anchors_alloc
;
343 int stat_graph_width
;
345 const char *word_regex
;
346 enum diff_words_type word_diff
;
347 enum diff_submodule_format submodule_format
;
349 struct oidset
*objfind
;
351 /* this is set by diffcore for DIFF_FORMAT_PATCH */
354 /* to support internal diff recursion by the --follow hack */
357 /* Callback which allows tweaking the options in diff_setup_done(). */
358 void (*set_default
)(struct diff_options
*);
363 #define OUTPUT_INDICATOR_NEW 0
364 #define OUTPUT_INDICATOR_OLD 1
365 #define OUTPUT_INDICATOR_CONTEXT 2
366 char output_indicators
[3];
368 struct pathspec pathspec
;
369 pathchange_fn_t pathchange
;
371 add_remove_fn_t add_remove
;
372 void *change_fn_data
;
373 diff_format_fn_t format_callback
;
374 void *format_callback_data
;
375 diff_prefix_fn_t output_prefix
;
376 void *output_prefix_data
;
378 int diff_path_counter
;
380 struct emitted_diff_symbols
*emitted_symbols
;
383 COLOR_MOVED_PLAIN
= 1,
384 COLOR_MOVED_BLOCKS
= 2,
385 COLOR_MOVED_ZEBRA
= 3,
386 COLOR_MOVED_ZEBRA_DIM
= 4,
388 #define COLOR_MOVED_DEFAULT COLOR_MOVED_ZEBRA
389 #define COLOR_MOVED_MIN_ALNUM_COUNT 20
391 /* XDF_WHITESPACE_FLAGS regarding block detection are set at 2, 3, 4 */
392 #define COLOR_MOVED_WS_ALLOW_INDENTATION_CHANGE (1<<5)
393 #define COLOR_MOVED_WS_ERROR (1<<0)
394 unsigned color_moved_ws_handling
;
396 struct repository
*repo
;
397 struct strmap
*additional_path_headers
;
/*
 * Takes a status character and returns an unsigned value. Presumably
 * this maps one of the DIFF_STATUS_* letters to its bit in
 * diff_options.filter -- confirm against the definition.
 */
unsigned int diff_filter_bit(char status);
/*
 * Emitters for submodule-related diff output. Each one takes the diff
 * options `o` plus the text it is named after (a line, a path, a header
 * or an error message).
 */
void diff_emit_submodule_del(struct diff_options *o, const char *line);
void diff_emit_submodule_add(struct diff_options *o, const char *line);
void diff_emit_submodule_untracked(struct diff_options *o, const char *path);
void diff_emit_submodule_modified(struct diff_options *o, const char *path);
void diff_emit_submodule_header(struct diff_options *o, const char *header);
void diff_emit_submodule_error(struct diff_options *o, const char *err);

/* Also takes `len`, presumably the number of bytes of `line` to emit. */
void diff_emit_submodule_pipethrough(struct diff_options *o,
				     const char *line,
				     int len);
416 struct diffstat_file
{
420 const char *comments
;
421 unsigned is_unmerged
:1;
422 unsigned is_binary
:1;
423 unsigned is_renamed
:1;
424 unsigned is_interesting
:1;
425 uintmax_t added
, deleted
;
439 DIFF_FILE_OLD_MOVED
= 9,
440 DIFF_FILE_OLD_MOVED_ALT
= 10,
441 DIFF_FILE_OLD_MOVED_DIM
= 11,
442 DIFF_FILE_OLD_MOVED_ALT_DIM
= 12,
443 DIFF_FILE_NEW_MOVED
= 13,
444 DIFF_FILE_NEW_MOVED_ALT
= 14,
445 DIFF_FILE_NEW_MOVED_DIM
= 15,
446 DIFF_FILE_NEW_MOVED_ALT_DIM
= 16,
447 DIFF_CONTEXT_DIM
= 17,
448 DIFF_FILE_OLD_DIM
= 18,
449 DIFF_FILE_NEW_DIM
= 19,
450 DIFF_CONTEXT_BOLD
= 20,
451 DIFF_FILE_OLD_BOLD
= 21,
452 DIFF_FILE_NEW_BOLD
= 22,
/*
 * Returns a string for color slot `ix`. `diff_use_color` presumably
 * says whether coloring is enabled -- confirm against the definition.
 */
const char *diff_get_color(int diff_use_color,
			   enum color_diff ix);

/* Same lookup, with the use_color value read from the options `o`. */
#define diff_get_color_opt(o, ix) diff_get_color((o)->use_color, ix)
/*
 * Returns a string for the given diff options; presumably the prefix
 * to put in front of every output line (see diff_options.line_prefix).
 */
const char *diff_line_prefix(struct diff_options *);
/* Constant character array defined elsewhere; only declared here. */
extern const char mime_boundary_leader[];
/*
 * Takes a combine_diff_path `p`, an object ID, `parents_oid` with
 * `nparent` (presumably the number of entries in that array), a `base`
 * strbuf and the diff options; returns a combine_diff_path pointer.
 */
struct combine_diff_path *diff_tree_paths(struct combine_diff_path *p,
					  const struct object_id *oid,
					  const struct object_id **parents_oid,
					  int nparent,
					  struct strbuf *base,
					  struct diff_options *opt);
/*
 * Takes an old and a new object ID, a `base` string and the diff
 * options; presumably compares the two trees named by the IDs.
 */
void diff_tree_oid(const struct object_id *old_oid,
		   const struct object_id *new_oid,
		   const char *base,
		   struct diff_options *opt);
/*
 * Variant that is given only a new object ID, together with a `base`
 * string and the diff options.
 */
void diff_root_tree_oid(const struct object_id *new_oid,
			const char *base,
			struct diff_options *opt);
475 struct combine_diff_path
{
476 struct combine_diff_path
*next
;
479 struct object_id oid
;
480 struct combine_diff_parent
{
483 struct object_id oid
;
485 } parent
[FLEX_ARRAY
];
/*
 * Size of a combine_diff_path with `n` combine_diff_parent entries:
 * the struct itself, plus `l` bytes, plus one more byte, plus room for
 * the `n` entries. The sum and product go through st_add4()/st_mult().
 */
#define combine_diff_path_size(n, l) \
	st_add4(sizeof(struct combine_diff_path), \
		(l), \
		1, \
		st_mult(sizeof(struct combine_diff_parent), (n)))
491 void show_combined_diff(struct combine_diff_path
*elem
, int num_parent
,
/* Takes an object ID, an array of parent object IDs and a rev_info. */
void diff_tree_combined(const struct object_id *oid,
			const struct oid_array *parents,
			struct rev_info *rev);

/* Same family, but is given a commit instead of an ID and its parents. */
void diff_tree_combined_merge(const struct commit *commit,
			      struct rev_info *rev);
/*
 * Takes the diff options and two strings `a` and `b`; presumably these
 * end up in diff_options.a_prefix and diff_options.b_prefix.
 */
void diff_set_mnemonic_prefix(struct diff_options *options,
			      const char *a,
			      const char *b);
/* Takes the diff options and returns an int (presumably a boolean). */
int diff_can_quit_early(struct diff_options *);
502 void diff_addremove(struct diff_options
*,
505 const struct object_id
*oid
,
507 const char *fullpath
, unsigned dirty_submodule
);
/*
 * Feed one modified file to the diff API (see the calling sequence
 * described at the top of this file). The old and the new side are each
 * described by a mode, an object ID with a validity flag, and a
 * dirty-submodule value; `fullpath` names the file.
 */
void diff_change(struct diff_options *,
		 unsigned mode1,
		 unsigned mode2,
		 const struct object_id *old_oid,
		 const struct object_id *new_oid,
		 int old_oid_valid,
		 int new_oid_valid,
		 const char *fullpath,
		 unsigned dirty_submodule1,
		 unsigned dirty_submodule2);
/*
 * Feed a file whose state is 'unmerged' to the diff API (see the
 * calling sequence described at the top of this file). Returns a
 * diff_filepair pointer.
 */
struct diff_filepair *diff_unmerge(struct diff_options *,
				   const char *path);
/*
 * Takes the diff options, a diffstat_t and a diff queue; presumably
 * fills `diffstat` from the queue `q`.
 */
void compute_diffstat(struct diff_options *options,
		      struct diffstat_t *diffstat,
		      struct diff_queue_struct *q);

/* Counterpart that takes the same diffstat_t, presumably to release it. */
void free_diffstat_info(struct diffstat_t *diffstat);
/* Setup flag values. */
#define DIFF_SETUP_REVERSE		1
#define DIFF_SETUP_USE_SIZE_CACHE	4
/*
 * Poor man's alternative to parse-option, to allow both stuck form
 * (--option=value) and separate form (--option value).
 */
int parse_long_opt(const char *opt,
		   const char **argv,
		   const char **optarg);
/*
 * Configuration handlers. Each takes a variable name, its value and an
 * opaque `cb` pointer, and returns an int.
 */
int git_diff_basic_config(const char *var,
			  const char *value,
			  void *cb);
int git_diff_heuristic_config(const char *var,
			      const char *value,
			      void *cb);
int git_diff_ui_config(const char *var,
		       const char *value,
		       void *cb);

/* Takes no arguments; presumably resets the diff UI defaults. */
void init_diff_ui_defaults(void);
537 #ifndef NO_THE_REPOSITORY_COMPATIBILITY_MACROS
538 #define diff_setup(diffopts) repo_diff_setup(the_repository, diffopts)
/*
 * Option setup entry points; the calling sequence is described at the
 * top of this file.
 */

/* Initializes a struct diff_options for the given repository. */
void repo_diff_setup(struct repository *,
		     struct diff_options *);

/* Takes an option array and the diff options; returns an option array. */
struct option *add_diff_options(const struct option *,
				struct diff_options *);

/* Parses diff options given on the command line. */
int diff_opt_parse(struct diff_options *,
		   const char **,
		   int,
		   const char *);

/* Checks the options set up so far for consistency and tweaks them. */
void diff_setup_done(struct diff_options *);

/* Takes a configuration variable name and its value; returns an int. */
int git_config_rename(const char *var,
		      const char *value);
/* Detection modes. */
#define DIFF_DETECT_RENAME	1
#define DIFF_DETECT_COPY	2
/* Pickaxe option bits (presumably kept in diff_options.pickaxe_opts). */
#define DIFF_PICKAXE_ALL	1
#define DIFF_PICKAXE_REGEX	2

#define DIFF_PICKAXE_KIND_S	4 /* traditional plumbing counter */
#define DIFF_PICKAXE_KIND_G	8 /* grep in the patch */
#define DIFF_PICKAXE_KIND_OBJFIND	16 /* specific object IDs */

/* All of the "kind" bits together. */
#define DIFF_PICKAXE_KINDS_MASK (DIFF_PICKAXE_KIND_S | \
				 DIFF_PICKAXE_KIND_G | \
				 DIFF_PICKAXE_KIND_OBJFIND)
/*
 * The G kind combined with the regex bit. The second operand was
 * missing, which left a dangling line continuation that swallowed the
 * next #define.
 */
#define DIFF_PICKAXE_KINDS_G_REGEX_MASK (DIFF_PICKAXE_KIND_G | \
					 DIFF_PICKAXE_REGEX)
/* The "all" bit combined with the object-find kind. */
#define DIFF_PICKAXE_KINDS_ALL_OBJFIND_MASK (DIFF_PICKAXE_ALL | \
					     DIFF_PICKAXE_KIND_OBJFIND)

#define DIFF_PICKAXE_IGNORE_CASE	32
/*
 * Called once all pairs of files have been fed; tells the diffcore
 * library to go ahead and do its work.
 */
void diffcore_std(struct diff_options *);

/* Takes no arguments and returns nothing. */
void diffcore_fix_diff_index(void);
/*
 * Help text for the common diff options, written as adjacent string
 * literals (one per output line) that the compiler joins into a single
 * string.
 */
569 #define COMMON_DIFF_OPTIONS_HELP \
570 "\ncommon diff options:\n" \
571 " -z output diff-raw with lines terminated with NUL.\n" \
572 " -p output patch format.\n" \
573 " -u synonym for -p.\n" \
574 " --patch-with-raw\n" \
575 " output both a patch and the diff-raw format.\n" \
576 " --stat show diffstat instead of patch.\n" \
577 " --numstat show numeric diffstat instead of patch.\n" \
578 " --patch-with-stat\n" \
579 " output a patch and prepend its diffstat.\n" \
580 " --name-only show only names of changed files.\n" \
581 " --name-status show names and status of changed files.\n" \
582 " --full-index show full object name on index lines.\n" \
583 " --abbrev=<n> abbreviate object names in diff-tree header and diff-raw.\n" \
584 " -R swap input file pairs.\n" \
585 " -B detect complete rewrites.\n" \
586 " -M detect renames.\n" \
587 " -C detect copies.\n" \
588 " --find-copies-harder\n" \
589 " try unchanged files as candidate for copy detection.\n" \
590 " -l<n> limit rename attempts up to <n> paths.\n" \
591 " -O<file> reorder diffs according to the <file>.\n" \
592 " -S<string> find filepair whose only one side contains the string.\n" \
594 " show all files diff when -S is used and hit is found.\n" \
595 " -a --text treat all files as text.\n"
/* Takes the diff options and returns an int (presumably a boolean). */
int diff_queue_is_empty(struct diff_options *o);

/*
 * Produces the output. As described at the top of this file, it also
 * calls diff_free() unless `.no_free` was set beforehand.
 */
void diff_flush(struct diff_options *);

/* Frees resources held by the diff options. */
void diff_free(struct diff_options *);

/* Takes a variable name and two ints; returns nothing. */
void diff_warn_rename_limit(const char *varname,
			    int needed,
			    int degraded_cc);
/* diff-raw status letters */
#define DIFF_STATUS_ADDED		'A'
#define DIFF_STATUS_COPIED		'C'
#define DIFF_STATUS_DELETED		'D'
#define DIFF_STATUS_MODIFIED		'M'
#define DIFF_STATUS_RENAMED		'R'
#define DIFF_STATUS_TYPE_CHANGED	'T'
#define DIFF_STATUS_UNKNOWN		'X'
#define DIFF_STATUS_UNMERGED		'U'
/*
 * These are not diff-raw status letters proper, but are used by
 * diffcore-filter instructions to specify additional restrictions.
 */
#define DIFF_STATUS_FILTER_AON		'*'
#define DIFF_STATUS_FILTER_BROKEN	'B'
/*
 * This is different from find_unique_abbrev() in that
 * it stuffs the result with dots for alignment.
 */
const char *diff_aligned_abbrev(const struct object_id *sha1,
				int);
/*
 * Takes a read-only rev_info and an object ID `mb` that is not const;
 * presumably the merge base is written into `mb`.
 */
void diff_get_merge_base(const struct rev_info *revs,
			 struct object_id *mb);
/* do not report anything on removed paths */
#define DIFF_SILENT_ON_REMOVED	1
/* report racily-clean paths as modified */
#define DIFF_RACY_IS_MODIFIED	2

/* `option` presumably takes a combination of the two flags above. */
int run_diff_files(struct rev_info *revs,
		   unsigned int option);
#define DIFF_INDEX_CACHED	1
#define DIFF_INDEX_MERGE_BASE	2

/* `option` presumably takes a combination of the two flags above. */
int run_diff_index(struct rev_info *revs,
		   unsigned int option);
636 int do_diff_cache(const struct object_id
*, struct diff_options
*);
637 int diff_flush_patch_id(struct diff_options
*, struct object_id
*, int);
638 void flush_one_hunk(struct object_id
*result
, git_hash_ctx
*ctx
);
640 int diff_result_code(struct diff_options
*, int);
642 int diff_no_index(struct rev_info
*,
643 int implicit_no_index
, int, const char **);
/*
 * Takes a repository, a string `def`, a read-only set of diff flags
 * and an ita_invisible_in_index value; returns an int, presumably
 * non-zero when the index differs from `def`.
 */
int index_differs_from(struct repository *r,
		       const char *def,
		       const struct diff_flags *flags,
		       int ita_invisible_in_index);
/*
 * Emit an interdiff of two object IDs to 'diff_options.file', optionally
 * indented by 'indent' spaces.
 */
void show_interdiff(const struct object_id *,
		    const struct object_id *,
		    int indent,
		    struct diff_options *);
657 * Fill the contents of the filespec "df", respecting any textconv defined by
658 * its userdiff driver. The "driver" parameter must come from a
659 * previous call to get_textconv(), and therefore should either be NULL or have
662 * Note that the memory ownership of the resulting buffer depends on whether
663 * the driver field is NULL. If it is, then the memory belongs to the filespec
664 * struct. If it is non-NULL, then "outbuf" points to a newly allocated buffer
665 * that should be freed by the caller.
667 size_t fill_textconv(struct repository
*r
,
668 struct userdiff_driver
*driver
,
669 struct diff_filespec
*df
,
/*
 * Look up the userdiff driver for the given filespec, and return it if
 * and only if it has textconv enabled (otherwise return NULL). The result
 * can be passed to fill_textconv().
 */
struct userdiff_driver *get_textconv(struct repository *r,
				     struct diff_filespec *one);
681 * Prepare diff_filespec and convert it using diff textconv API
682 * if the textconv driver exists.
683 * Return 1 if the conversion succeeds, 0 otherwise.
685 int textconv_object(struct repository
*repo
,
688 const struct object_id
*oid
, int oid_valid
,
689 char **buf
, unsigned long *buf_size
);
/*
 * Takes a pointer to a string pointer and returns an int. The double
 * indirection suggests that `*cp_p` is advanced -- confirm.
 */
int parse_rename_score(const char **cp_p);

/* Takes a string value and returns a long. */
long parse_algorithm_value(const char *value);
/*
 * Takes an output stream `fp` and three counts: files, insertions and
 * deletions.
 */
void print_stat_summary(FILE *fp,
			int files,
			int insertions,
			int deletions);
/* Takes the diff options and returns nothing. */
void setup_diff_pager(struct diff_options *);