Merge branch 'jk/bundle-progress'
[git/debian.git] / rerere.c
bloba67abaab0776ee24c44d195e4d1a8f49acff5bdb
1 #include "git-compat-util.h"
2 #include "alloc.h"
3 #include "config.h"
4 #include "hex.h"
5 #include "lockfile.h"
6 #include "string-list.h"
7 #include "rerere.h"
8 #include "xdiff-interface.h"
9 #include "dir.h"
10 #include "resolve-undo.h"
11 #include "ll-merge.h"
12 #include "attr.h"
13 #include "pathspec.h"
14 #include "object-store.h"
15 #include "hash-lookup.h"
16 #include "strmap.h"
/* Classification of an index entry, as reported by check_one_conflict(). */
enum {
	RESOLVED = 0,		/* entry is at stage #0 */
	PUNTED = 1,		/* conflicted, but not a shape rerere handles */
	THREE_STAGED = 2	/* regular file with both stage #2 and #3 */
};

/*
 * Sentinel stored in a string_list item's util field by
 * rerere_remaining(); it points at itself so it cannot collide with a
 * real allocation.
 */
void *RERERE_RESOLVED = &RERERE_RESOLVED;

/* if rerere_enabled == -1, fall back to detection of .git/rr-cache */
static int rerere_enabled = -1;

/* automatically update cleanly resolved paths to the index */
static int rerere_autoupdate;

/* Bits kept per variant in rerere_dir.status[]. */
enum {
	RR_HAS_POSTIMAGE = 1,
	RR_HAS_PREIMAGE = 2
};
31 struct rerere_dir {
32 int status_alloc, status_nr;
33 unsigned char *status;
34 char name[FLEX_ARRAY];
37 static struct strmap rerere_dirs = STRMAP_INIT;
39 static void free_rerere_dirs(void)
41 struct hashmap_iter iter;
42 struct strmap_entry *ent;
44 strmap_for_each_entry(&rerere_dirs, &iter, ent) {
45 struct rerere_dir *rr_dir = ent->value;
46 free(rr_dir->status);
47 free(rr_dir);
49 strmap_clear(&rerere_dirs, 0);
52 static void free_rerere_id(struct string_list_item *item)
54 free(item->util);
57 static const char *rerere_id_hex(const struct rerere_id *id)
59 return id->collection->name;
62 static void fit_variant(struct rerere_dir *rr_dir, int variant)
64 variant++;
65 ALLOC_GROW(rr_dir->status, variant, rr_dir->status_alloc);
66 if (rr_dir->status_nr < variant) {
67 memset(rr_dir->status + rr_dir->status_nr,
68 '\0', variant - rr_dir->status_nr);
69 rr_dir->status_nr = variant;
73 static void assign_variant(struct rerere_id *id)
75 int variant;
76 struct rerere_dir *rr_dir = id->collection;
78 variant = id->variant;
79 if (variant < 0) {
80 for (variant = 0; variant < rr_dir->status_nr; variant++)
81 if (!rr_dir->status[variant])
82 break;
84 fit_variant(rr_dir, variant);
85 id->variant = variant;
88 const char *rerere_path(const struct rerere_id *id, const char *file)
90 if (!file)
91 return git_path("rr-cache/%s", rerere_id_hex(id));
93 if (id->variant <= 0)
94 return git_path("rr-cache/%s/%s", rerere_id_hex(id), file);
96 return git_path("rr-cache/%s/%s.%d",
97 rerere_id_hex(id), file, id->variant);
/*
 * Does "name" denote "filename" itself (variant 0) or "filename.<N>"
 * (variant N)?  Returns 1 and stores the variant on a match, 0 otherwise.
 *
 * <N> must consist of decimal digits only.  An empty suffix, a sign or
 * leading whitespace (all of which strtol() would accept) and values
 * that do not leave room for "variant + 1" in an int are rejected,
 * because callers use the variant as an array index.
 */
static int is_rr_file(const char *name, const char *filename, int *variant)
{
	size_t prefix_len = strlen(filename);
	const char *digits;
	char *ep;
	long value;

	if (!strcmp(name, filename)) {
		*variant = 0;
		return 1;
	}
	if (strncmp(name, filename, prefix_len) || name[prefix_len] != '.')
		return 0;

	digits = name + prefix_len + 1;
	if (*digits < '0' || '9' < *digits)
		return 0;

	errno = 0;
	value = strtol(digits, &ep, 10);
	if (errno || *ep || value >= INT_MAX)
		return 0;
	*variant = (int)value;
	return 1;
}
119 static void scan_rerere_dir(struct rerere_dir *rr_dir)
121 struct dirent *de;
122 DIR *dir = opendir(git_path("rr-cache/%s", rr_dir->name));
124 if (!dir)
125 return;
126 while ((de = readdir(dir)) != NULL) {
127 int variant;
129 if (is_rr_file(de->d_name, "postimage", &variant)) {
130 fit_variant(rr_dir, variant);
131 rr_dir->status[variant] |= RR_HAS_POSTIMAGE;
132 } else if (is_rr_file(de->d_name, "preimage", &variant)) {
133 fit_variant(rr_dir, variant);
134 rr_dir->status[variant] |= RR_HAS_PREIMAGE;
137 closedir(dir);
140 static struct rerere_dir *find_rerere_dir(const char *hex)
142 struct rerere_dir *rr_dir;
144 rr_dir = strmap_get(&rerere_dirs, hex);
145 if (!rr_dir) {
146 FLEX_ALLOC_STR(rr_dir, name, hex);
147 rr_dir->status = NULL;
148 rr_dir->status_nr = 0;
149 rr_dir->status_alloc = 0;
150 strmap_put(&rerere_dirs, hex, rr_dir);
152 scan_rerere_dir(rr_dir);
154 return rr_dir;
157 static int has_rerere_resolution(const struct rerere_id *id)
159 const int both = RR_HAS_POSTIMAGE|RR_HAS_PREIMAGE;
160 int variant = id->variant;
162 if (variant < 0)
163 return 0;
164 return ((id->collection->status[variant] & both) == both);
167 static struct rerere_id *new_rerere_id_hex(char *hex)
169 struct rerere_id *id = xmalloc(sizeof(*id));
170 id->collection = find_rerere_dir(hex);
171 id->variant = -1; /* not known yet */
172 return id;
/* Same as new_rerere_id_hex(), starting from a binary hash. */
static struct rerere_id *new_rerere_id(unsigned char *hash)
{
	char *hex = hash_to_hex(hash);

	return new_rerere_id_hex(hex);
}
181 * $GIT_DIR/MERGE_RR file is a collection of records, each of which is
182 * "conflict ID", a HT and pathname, terminated with a NUL, and is
183 * used to keep track of the set of paths that "rerere" may need to
184 * work on (i.e. what is left by the previous invocation of "git
185 * rerere" during the current conflict resolution session).
187 static void read_rr(struct repository *r, struct string_list *rr)
189 struct strbuf buf = STRBUF_INIT;
190 FILE *in = fopen_or_warn(git_path_merge_rr(r), "r");
192 if (!in)
193 return;
194 while (!strbuf_getwholeline(&buf, in, '\0')) {
195 char *path;
196 unsigned char hash[GIT_MAX_RAWSZ];
197 struct rerere_id *id;
198 int variant;
199 const unsigned hexsz = the_hash_algo->hexsz;
201 /* There has to be the hash, tab, path and then NUL */
202 if (buf.len < hexsz + 2 || get_sha1_hex(buf.buf, hash))
203 die(_("corrupt MERGE_RR"));
205 if (buf.buf[hexsz] != '.') {
206 variant = 0;
207 path = buf.buf + hexsz;
208 } else {
209 errno = 0;
210 variant = strtol(buf.buf + hexsz + 1, &path, 10);
211 if (errno)
212 die(_("corrupt MERGE_RR"));
214 if (*(path++) != '\t')
215 die(_("corrupt MERGE_RR"));
216 buf.buf[hexsz] = '\0';
217 id = new_rerere_id_hex(buf.buf);
218 id->variant = variant;
219 string_list_insert(rr, path)->util = id;
221 strbuf_release(&buf);
222 fclose(in);
225 static struct lock_file write_lock;
227 static int write_rr(struct string_list *rr, int out_fd)
229 int i;
230 for (i = 0; i < rr->nr; i++) {
231 struct strbuf buf = STRBUF_INIT;
232 struct rerere_id *id;
234 assert(rr->items[i].util != RERERE_RESOLVED);
236 id = rr->items[i].util;
237 if (!id)
238 continue;
239 assert(id->variant >= 0);
240 if (0 < id->variant)
241 strbuf_addf(&buf, "%s.%d\t%s%c",
242 rerere_id_hex(id), id->variant,
243 rr->items[i].string, 0);
244 else
245 strbuf_addf(&buf, "%s\t%s%c",
246 rerere_id_hex(id),
247 rr->items[i].string, 0);
249 if (write_in_full(out_fd, buf.buf, buf.len) < 0)
250 die(_("unable to write rerere record"));
252 strbuf_release(&buf);
254 if (commit_lock_file(&write_lock) != 0)
255 die(_("unable to write rerere record"));
256 return 0;
/*
 * "rerere" interacts with conflicted file contents using this I/O
 * abstraction.  It reads a conflicted contents from one place via
 * "getline()" method, and optionally can write it out after
 * normalizing the conflicted hunks to the "output".  Subclasses of
 * rerere_io embed this structure at the beginning of their own
 * rerere_io object, which is what allows the pointer casts in the
 * getline() implementations.
 */
struct rerere_io {
	/* Fetch the next line into the strbuf; non-zero ends the input. */
	int (*getline)(struct strbuf *, struct rerere_io *);
	/* Where normalized contents go; NULL means "do not write". */
	FILE *output;
	/* First errno seen while writing to output, 0 if none. */
	int wrerror;
	/* some more stuff */
};
/*
 * Write "count" bytes to fp unless an earlier error is already recorded
 * in *err or there is nothing to write; on failure store errno in *err.
 */
static void ferr_write(const void *p, size_t count, FILE *fp, int *err)
{
	if (*err || !count)
		return;
	if (fwrite(p, count, 1, fp) == 1)
		return;
	*err = errno;
}
/* ferr_write() for a NUL-terminated string (the NUL is not written). */
static inline void ferr_puts(const char *s, FILE *fp, int *err)
{
	size_t len = strlen(s);

	ferr_write(s, len, fp, err);
}
287 static void rerere_io_putstr(const char *str, struct rerere_io *io)
289 if (io->output)
290 ferr_puts(str, io->output, &io->wrerror);
293 static void rerere_io_putmem(const char *mem, size_t sz, struct rerere_io *io)
295 if (io->output)
296 ferr_write(mem, sz, io->output, &io->wrerror);
300 * Subclass of rerere_io that reads from an on-disk file
302 struct rerere_io_file {
303 struct rerere_io io;
304 FILE *input;
308 * ... and its getline() method implementation
310 static int rerere_file_getline(struct strbuf *sb, struct rerere_io *io_)
312 struct rerere_io_file *io = (struct rerere_io_file *)io_;
313 return strbuf_getwholeline(sb, io->input, '\n');
/*
 * Does "buf" start with a conflict marker?  That is exactly
 * marker_size copies of marker_char, no more, no less, followed by
 * whitespace (including LF).
 *
 * The beginning of our version and the end of their version always
 * are labeled like "<<<<< ours" or ">>>>> theirs", so for '<' and '>'
 * the character after the marker must be a SP.  The common ancestor
 * marker in diff3-style output is not always labelled ("||||| common"
 * and a bare "|||||" are both valid), so any whitespace will do there,
 * as it does for '='.
 */
static int is_cmarker(char *buf, int marker_char, int marker_size)
{
	const int needs_label = (marker_char == '<' || marker_char == '>');
	const char *p = buf;
	int remaining;

	for (remaining = marker_size; remaining; remaining--, p++) {
		if (*p != marker_char)
			return 0;
	}
	if (needs_label && *p != ' ')
		return 0;
	return isspace(*p);
}
343 static void rerere_strbuf_putconflict(struct strbuf *buf, int ch, size_t size)
345 strbuf_addchars(buf, ch, size);
346 strbuf_addch(buf, '\n');
349 static int handle_conflict(struct strbuf *out, struct rerere_io *io,
350 int marker_size, git_hash_ctx *ctx)
352 enum {
353 RR_SIDE_1 = 0, RR_SIDE_2, RR_ORIGINAL
354 } hunk = RR_SIDE_1;
355 struct strbuf one = STRBUF_INIT, two = STRBUF_INIT;
356 struct strbuf buf = STRBUF_INIT, conflict = STRBUF_INIT;
357 int has_conflicts = -1;
359 while (!io->getline(&buf, io)) {
360 if (is_cmarker(buf.buf, '<', marker_size)) {
361 if (handle_conflict(&conflict, io, marker_size, NULL) < 0)
362 break;
363 if (hunk == RR_SIDE_1)
364 strbuf_addbuf(&one, &conflict);
365 else
366 strbuf_addbuf(&two, &conflict);
367 strbuf_release(&conflict);
368 } else if (is_cmarker(buf.buf, '|', marker_size)) {
369 if (hunk != RR_SIDE_1)
370 break;
371 hunk = RR_ORIGINAL;
372 } else if (is_cmarker(buf.buf, '=', marker_size)) {
373 if (hunk != RR_SIDE_1 && hunk != RR_ORIGINAL)
374 break;
375 hunk = RR_SIDE_2;
376 } else if (is_cmarker(buf.buf, '>', marker_size)) {
377 if (hunk != RR_SIDE_2)
378 break;
379 if (strbuf_cmp(&one, &two) > 0)
380 strbuf_swap(&one, &two);
381 has_conflicts = 1;
382 rerere_strbuf_putconflict(out, '<', marker_size);
383 strbuf_addbuf(out, &one);
384 rerere_strbuf_putconflict(out, '=', marker_size);
385 strbuf_addbuf(out, &two);
386 rerere_strbuf_putconflict(out, '>', marker_size);
387 if (ctx) {
388 the_hash_algo->update_fn(ctx, one.buf ?
389 one.buf : "",
390 one.len + 1);
391 the_hash_algo->update_fn(ctx, two.buf ?
392 two.buf : "",
393 two.len + 1);
395 break;
396 } else if (hunk == RR_SIDE_1)
397 strbuf_addbuf(&one, &buf);
398 else if (hunk == RR_ORIGINAL)
399 ; /* discard */
400 else if (hunk == RR_SIDE_2)
401 strbuf_addbuf(&two, &buf);
403 strbuf_release(&one);
404 strbuf_release(&two);
405 strbuf_release(&buf);
407 return has_conflicts;
411 * Read contents a file with conflicts, normalize the conflicts
412 * by (1) discarding the common ancestor version in diff3-style,
413 * (2) reordering our side and their side so that whichever sorts
414 * alphabetically earlier comes before the other one, while
415 * computing the "conflict ID", which is just an SHA-1 hash of
416 * one side of the conflict, NUL, the other side of the conflict,
417 * and NUL concatenated together.
419 * Return 1 if conflict hunks are found, 0 if there are no conflict
420 * hunks and -1 if an error occurred.
422 static int handle_path(unsigned char *hash, struct rerere_io *io, int marker_size)
424 git_hash_ctx ctx;
425 struct strbuf buf = STRBUF_INIT, out = STRBUF_INIT;
426 int has_conflicts = 0;
427 if (hash)
428 the_hash_algo->init_fn(&ctx);
430 while (!io->getline(&buf, io)) {
431 if (is_cmarker(buf.buf, '<', marker_size)) {
432 has_conflicts = handle_conflict(&out, io, marker_size,
433 hash ? &ctx : NULL);
434 if (has_conflicts < 0)
435 break;
436 rerere_io_putmem(out.buf, out.len, io);
437 strbuf_reset(&out);
438 } else
439 rerere_io_putstr(buf.buf, io);
441 strbuf_release(&buf);
442 strbuf_release(&out);
444 if (hash)
445 the_hash_algo->final_fn(hash, &ctx);
447 return has_conflicts;
451 * Scan the path for conflicts, do the "handle_path()" thing above, and
452 * return the number of conflict hunks found.
454 static int handle_file(struct index_state *istate,
455 const char *path, unsigned char *hash, const char *output)
457 int has_conflicts = 0;
458 struct rerere_io_file io;
459 int marker_size = ll_merge_marker_size(istate, path);
461 memset(&io, 0, sizeof(io));
462 io.io.getline = rerere_file_getline;
463 io.input = fopen(path, "r");
464 io.io.wrerror = 0;
465 if (!io.input)
466 return error_errno(_("could not open '%s'"), path);
468 if (output) {
469 io.io.output = fopen(output, "w");
470 if (!io.io.output) {
471 error_errno(_("could not write '%s'"), output);
472 fclose(io.input);
473 return -1;
477 has_conflicts = handle_path(hash, (struct rerere_io *)&io, marker_size);
479 fclose(io.input);
480 if (io.io.wrerror)
481 error(_("there were errors while writing '%s' (%s)"),
482 path, strerror(io.io.wrerror));
483 if (io.io.output && fclose(io.io.output))
484 io.io.wrerror = error_errno(_("failed to flush '%s'"), path);
486 if (has_conflicts < 0) {
487 if (output)
488 unlink_or_warn(output);
489 return error(_("could not parse conflict hunks in '%s'"), path);
491 if (io.io.wrerror)
492 return -1;
493 return has_conflicts;
497 * Look at a cache entry at "i" and see if it is not conflicting,
498 * conflicting and we are willing to handle, or conflicting and
499 * we are unable to handle, and return the determination in *type.
500 * Return the cache index to be looked at next, by skipping the
501 * stages we have already looked at in this invocation of this
502 * function.
504 static int check_one_conflict(struct index_state *istate, int i, int *type)
506 const struct cache_entry *e = istate->cache[i];
508 if (!ce_stage(e)) {
509 *type = RESOLVED;
510 return i + 1;
513 *type = PUNTED;
514 while (i < istate->cache_nr && ce_stage(istate->cache[i]) == 1)
515 i++;
517 /* Only handle regular files with both stages #2 and #3 */
518 if (i + 1 < istate->cache_nr) {
519 const struct cache_entry *e2 = istate->cache[i];
520 const struct cache_entry *e3 = istate->cache[i + 1];
521 if (ce_stage(e2) == 2 &&
522 ce_stage(e3) == 3 &&
523 ce_same_name(e, e3) &&
524 S_ISREG(e2->ce_mode) &&
525 S_ISREG(e3->ce_mode))
526 *type = THREE_STAGED;
529 /* Skip the entries with the same name */
530 while (i < istate->cache_nr && ce_same_name(e, istate->cache[i]))
531 i++;
532 return i;
536 * Scan the index and find paths that have conflicts that rerere can
537 * handle, i.e. the ones that has both stages #2 and #3.
539 * NEEDSWORK: we do not record or replay a previous "resolve by
540 * deletion" for a delete-modify conflict, as that is inherently risky
541 * without knowing what modification is being discarded. The only
542 * safe case, i.e. both side doing the deletion and modification that
543 * are identical to the previous round, might want to be handled,
544 * though.
546 static int find_conflict(struct repository *r, struct string_list *conflict)
548 int i;
550 if (repo_read_index(r) < 0)
551 return error(_("index file corrupt"));
553 for (i = 0; i < r->index->cache_nr;) {
554 int conflict_type;
555 const struct cache_entry *e = r->index->cache[i];
556 i = check_one_conflict(r->index, i, &conflict_type);
557 if (conflict_type == THREE_STAGED)
558 string_list_insert(conflict, (const char *)e->name);
560 return 0;
564 * The merge_rr list is meant to hold outstanding conflicted paths
565 * that rerere could handle. Abuse the list by adding other types of
566 * entries to allow the caller to show "rerere remaining".
568 * - Conflicted paths that rerere does not handle are added
569 * - Conflicted paths that have been resolved are marked as such
570 * by storing RERERE_RESOLVED to .util field (where conflict ID
571 * is expected to be stored).
573 * Do *not* write MERGE_RR file out after calling this function.
575 * NEEDSWORK: we may want to fix the caller that implements "rerere
576 * remaining" to do this without abusing merge_rr.
578 int rerere_remaining(struct repository *r, struct string_list *merge_rr)
580 int i;
582 if (setup_rerere(r, merge_rr, RERERE_READONLY))
583 return 0;
584 if (repo_read_index(r) < 0)
585 return error(_("index file corrupt"));
587 for (i = 0; i < r->index->cache_nr;) {
588 int conflict_type;
589 const struct cache_entry *e = r->index->cache[i];
590 i = check_one_conflict(r->index, i, &conflict_type);
591 if (conflict_type == PUNTED)
592 string_list_insert(merge_rr, (const char *)e->name);
593 else if (conflict_type == RESOLVED) {
594 struct string_list_item *it;
595 it = string_list_lookup(merge_rr, (const char *)e->name);
596 if (it) {
597 free_rerere_id(it);
598 it->util = RERERE_RESOLVED;
602 return 0;
606 * Try using the given conflict resolution "ID" to see
607 * if that recorded conflict resolves cleanly what we
608 * got in the "cur".
610 static int try_merge(struct index_state *istate,
611 const struct rerere_id *id, const char *path,
612 mmfile_t *cur, mmbuffer_t *result)
614 enum ll_merge_result ret;
615 mmfile_t base = {NULL, 0}, other = {NULL, 0};
617 if (read_mmfile(&base, rerere_path(id, "preimage")) ||
618 read_mmfile(&other, rerere_path(id, "postimage"))) {
619 ret = LL_MERGE_CONFLICT;
620 } else {
622 * A three-way merge. Note that this honors user-customizable
623 * low-level merge driver settings.
625 ret = ll_merge(result, path, &base, NULL, cur, "", &other, "",
626 istate, NULL);
629 free(base.ptr);
630 free(other.ptr);
632 return ret;
636 * Find the conflict identified by "id"; the change between its
637 * "preimage" (i.e. a previous contents with conflict markers) and its
638 * "postimage" (i.e. the corresponding contents with conflicts
639 * resolved) may apply cleanly to the contents stored in "path", i.e.
640 * the conflict this time around.
642 * Returns 0 for successful replay of recorded resolution, or non-zero
643 * for failure.
645 static int merge(struct index_state *istate, const struct rerere_id *id, const char *path)
647 FILE *f;
648 int ret;
649 mmfile_t cur = {NULL, 0};
650 mmbuffer_t result = {NULL, 0};
653 * Normalize the conflicts in path and write it out to
654 * "thisimage" temporary file.
656 if ((handle_file(istate, path, NULL, rerere_path(id, "thisimage")) < 0) ||
657 read_mmfile(&cur, rerere_path(id, "thisimage"))) {
658 ret = 1;
659 goto out;
662 ret = try_merge(istate, id, path, &cur, &result);
663 if (ret)
664 goto out;
667 * A successful replay of recorded resolution.
668 * Mark that "postimage" was used to help gc.
670 if (utime(rerere_path(id, "postimage"), NULL) < 0)
671 warning_errno(_("failed utime() on '%s'"),
672 rerere_path(id, "postimage"));
674 /* Update "path" with the resolution */
675 f = fopen(path, "w");
676 if (!f)
677 return error_errno(_("could not open '%s'"), path);
678 if (fwrite(result.ptr, result.size, 1, f) != 1)
679 error_errno(_("could not write '%s'"), path);
680 if (fclose(f))
681 return error_errno(_("writing '%s' failed"), path);
683 out:
684 free(cur.ptr);
685 free(result.ptr);
687 return ret;
690 static void update_paths(struct repository *r, struct string_list *update)
692 struct lock_file index_lock = LOCK_INIT;
693 int i;
695 repo_hold_locked_index(r, &index_lock, LOCK_DIE_ON_ERROR);
697 for (i = 0; i < update->nr; i++) {
698 struct string_list_item *item = &update->items[i];
699 if (add_file_to_index(r->index, item->string, 0))
700 exit(128);
701 fprintf_ln(stderr, _("Staged '%s' using previous resolution."),
702 item->string);
705 if (write_locked_index(r->index, &index_lock,
706 COMMIT_LOCK | SKIP_IF_UNCHANGED))
707 die(_("unable to write new index file"));
710 static void remove_variant(struct rerere_id *id)
712 unlink_or_warn(rerere_path(id, "postimage"));
713 unlink_or_warn(rerere_path(id, "preimage"));
714 id->collection->status[id->variant] = 0;
718 * The path indicated by rr_item may still have conflict for which we
719 * have a recorded resolution, in which case replay it and optionally
720 * update it. Or it may have been resolved by the user and we may
721 * only have the preimage for that conflict, in which case the result
722 * needs to be recorded as a resolution in a postimage file.
724 static void do_rerere_one_path(struct index_state *istate,
725 struct string_list_item *rr_item,
726 struct string_list *update)
728 const char *path = rr_item->string;
729 struct rerere_id *id = rr_item->util;
730 struct rerere_dir *rr_dir = id->collection;
731 int variant;
733 variant = id->variant;
735 /* Has the user resolved it already? */
736 if (variant >= 0) {
737 if (!handle_file(istate, path, NULL, NULL)) {
738 copy_file(rerere_path(id, "postimage"), path, 0666);
739 id->collection->status[variant] |= RR_HAS_POSTIMAGE;
740 fprintf_ln(stderr, _("Recorded resolution for '%s'."), path);
741 free_rerere_id(rr_item);
742 rr_item->util = NULL;
743 return;
746 * There may be other variants that can cleanly
747 * replay. Try them and update the variant number for
748 * this one.
752 /* Does any existing resolution apply cleanly? */
753 for (variant = 0; variant < rr_dir->status_nr; variant++) {
754 const int both = RR_HAS_PREIMAGE | RR_HAS_POSTIMAGE;
755 struct rerere_id vid = *id;
757 if ((rr_dir->status[variant] & both) != both)
758 continue;
760 vid.variant = variant;
761 if (merge(istate, &vid, path))
762 continue; /* failed to replay */
765 * If there already is a different variant that applies
766 * cleanly, there is no point maintaining our own variant.
768 if (0 <= id->variant && id->variant != variant)
769 remove_variant(id);
771 if (rerere_autoupdate)
772 string_list_insert(update, path);
773 else
774 fprintf_ln(stderr,
775 _("Resolved '%s' using previous resolution."),
776 path);
777 free_rerere_id(rr_item);
778 rr_item->util = NULL;
779 return;
782 /* None of the existing one applies; we need a new variant */
783 assign_variant(id);
785 variant = id->variant;
786 handle_file(istate, path, NULL, rerere_path(id, "preimage"));
787 if (id->collection->status[variant] & RR_HAS_POSTIMAGE) {
788 const char *path = rerere_path(id, "postimage");
789 if (unlink(path))
790 die_errno(_("cannot unlink stray '%s'"), path);
791 id->collection->status[variant] &= ~RR_HAS_POSTIMAGE;
793 id->collection->status[variant] |= RR_HAS_PREIMAGE;
794 fprintf_ln(stderr, _("Recorded preimage for '%s'"), path);
797 static int do_plain_rerere(struct repository *r,
798 struct string_list *rr, int fd)
800 struct string_list conflict = STRING_LIST_INIT_DUP;
801 struct string_list update = STRING_LIST_INIT_DUP;
802 int i;
804 find_conflict(r, &conflict);
807 * MERGE_RR records paths with conflicts immediately after
808 * merge failed. Some of the conflicted paths might have been
809 * hand resolved in the working tree since then, but the
810 * initial run would catch all and register their preimages.
812 for (i = 0; i < conflict.nr; i++) {
813 struct rerere_id *id;
814 unsigned char hash[GIT_MAX_RAWSZ];
815 const char *path = conflict.items[i].string;
816 int ret;
819 * Ask handle_file() to scan and assign a
820 * conflict ID. No need to write anything out
821 * yet.
823 ret = handle_file(r->index, path, hash, NULL);
824 if (ret != 0 && string_list_has_string(rr, path)) {
825 remove_variant(string_list_lookup(rr, path)->util);
826 string_list_remove(rr, path, 1);
828 if (ret < 1)
829 continue;
831 id = new_rerere_id(hash);
832 string_list_insert(rr, path)->util = id;
834 /* Ensure that the directory exists. */
835 mkdir_in_gitdir(rerere_path(id, NULL));
838 for (i = 0; i < rr->nr; i++)
839 do_rerere_one_path(r->index, &rr->items[i], &update);
841 if (update.nr)
842 update_paths(r, &update);
844 return write_rr(rr, fd);
847 static void git_rerere_config(void)
849 git_config_get_bool("rerere.enabled", &rerere_enabled);
850 git_config_get_bool("rerere.autoupdate", &rerere_autoupdate);
851 git_config(git_default_config, NULL);
854 static GIT_PATH_FUNC(git_path_rr_cache, "rr-cache")
856 static int is_rerere_enabled(void)
858 int rr_cache_exists;
860 if (!rerere_enabled)
861 return 0;
863 rr_cache_exists = is_directory(git_path_rr_cache());
864 if (rerere_enabled < 0)
865 return rr_cache_exists;
867 if (!rr_cache_exists && mkdir_in_gitdir(git_path_rr_cache()))
868 die(_("could not create directory '%s'"), git_path_rr_cache());
869 return 1;
872 int setup_rerere(struct repository *r, struct string_list *merge_rr, int flags)
874 int fd;
876 git_rerere_config();
877 if (!is_rerere_enabled())
878 return -1;
880 if (flags & (RERERE_AUTOUPDATE|RERERE_NOAUTOUPDATE))
881 rerere_autoupdate = !!(flags & RERERE_AUTOUPDATE);
882 if (flags & RERERE_READONLY)
883 fd = 0;
884 else
885 fd = hold_lock_file_for_update(&write_lock,
886 git_path_merge_rr(r),
887 LOCK_DIE_ON_ERROR);
888 read_rr(r, merge_rr);
889 return fd;
893 * The main entry point that is called internally from codepaths that
894 * perform mergy operations, possibly leaving conflicted index entries
895 * and working tree files.
897 int repo_rerere(struct repository *r, int flags)
899 struct string_list merge_rr = STRING_LIST_INIT_DUP;
900 int fd, status;
902 fd = setup_rerere(r, &merge_rr, flags);
903 if (fd < 0)
904 return 0;
905 status = do_plain_rerere(r, &merge_rr, fd);
906 free_rerere_dirs();
907 return status;
911 * Subclass of rerere_io that reads from an in-core buffer that is a
912 * strbuf
914 struct rerere_io_mem {
915 struct rerere_io io;
916 struct strbuf input;
920 * ... and its getline() method implementation
922 static int rerere_mem_getline(struct strbuf *sb, struct rerere_io *io_)
924 struct rerere_io_mem *io = (struct rerere_io_mem *)io_;
925 char *ep;
926 size_t len;
928 strbuf_release(sb);
929 if (!io->input.len)
930 return -1;
931 ep = memchr(io->input.buf, '\n', io->input.len);
932 if (!ep)
933 ep = io->input.buf + io->input.len;
934 else if (*ep == '\n')
935 ep++;
936 len = ep - io->input.buf;
937 strbuf_add(sb, io->input.buf, len);
938 strbuf_remove(&io->input, 0, len);
939 return 0;
942 static int handle_cache(struct index_state *istate,
943 const char *path, unsigned char *hash, const char *output)
945 mmfile_t mmfile[3] = {{NULL}};
946 mmbuffer_t result = {NULL, 0};
947 const struct cache_entry *ce;
948 int pos, len, i, has_conflicts;
949 struct rerere_io_mem io;
950 int marker_size = ll_merge_marker_size(istate, path);
953 * Reproduce the conflicted merge in-core
955 len = strlen(path);
956 pos = index_name_pos(istate, path, len);
957 if (0 <= pos)
958 return -1;
959 pos = -pos - 1;
961 while (pos < istate->cache_nr) {
962 enum object_type type;
963 unsigned long size;
965 ce = istate->cache[pos++];
966 if (ce_namelen(ce) != len || memcmp(ce->name, path, len))
967 break;
968 i = ce_stage(ce) - 1;
969 if (!mmfile[i].ptr) {
970 mmfile[i].ptr = read_object_file(&ce->oid, &type,
971 &size);
972 mmfile[i].size = size;
975 for (i = 0; i < 3; i++)
976 if (!mmfile[i].ptr && !mmfile[i].size)
977 mmfile[i].ptr = xstrdup("");
980 * NEEDSWORK: handle conflicts from merges with
981 * merge.renormalize set, too?
983 ll_merge(&result, path, &mmfile[0], NULL,
984 &mmfile[1], "ours",
985 &mmfile[2], "theirs",
986 istate, NULL);
987 for (i = 0; i < 3; i++)
988 free(mmfile[i].ptr);
990 memset(&io, 0, sizeof(io));
991 io.io.getline = rerere_mem_getline;
992 if (output)
993 io.io.output = fopen(output, "w");
994 else
995 io.io.output = NULL;
996 strbuf_init(&io.input, 0);
997 strbuf_attach(&io.input, result.ptr, result.size, result.size);
1000 * Grab the conflict ID and optionally write the original
1001 * contents with conflict markers out.
1003 has_conflicts = handle_path(hash, (struct rerere_io *)&io, marker_size);
1004 strbuf_release(&io.input);
1005 if (io.io.output)
1006 fclose(io.io.output);
1007 return has_conflicts;
1010 static int rerere_forget_one_path(struct index_state *istate,
1011 const char *path,
1012 struct string_list *rr)
1014 const char *filename;
1015 struct rerere_id *id;
1016 unsigned char hash[GIT_MAX_RAWSZ];
1017 int ret;
1018 struct string_list_item *item;
1021 * Recreate the original conflict from the stages in the
1022 * index and compute the conflict ID
1024 ret = handle_cache(istate, path, hash, NULL);
1025 if (ret < 1)
1026 return error(_("could not parse conflict hunks in '%s'"), path);
1028 /* Nuke the recorded resolution for the conflict */
1029 id = new_rerere_id(hash);
1031 for (id->variant = 0;
1032 id->variant < id->collection->status_nr;
1033 id->variant++) {
1034 mmfile_t cur = { NULL, 0 };
1035 mmbuffer_t result = {NULL, 0};
1036 int cleanly_resolved;
1038 if (!has_rerere_resolution(id))
1039 continue;
1041 handle_cache(istate, path, hash, rerere_path(id, "thisimage"));
1042 if (read_mmfile(&cur, rerere_path(id, "thisimage"))) {
1043 free(cur.ptr);
1044 error(_("failed to update conflicted state in '%s'"), path);
1045 goto fail_exit;
1047 cleanly_resolved = !try_merge(istate, id, path, &cur, &result);
1048 free(result.ptr);
1049 free(cur.ptr);
1050 if (cleanly_resolved)
1051 break;
1054 if (id->collection->status_nr <= id->variant) {
1055 error(_("no remembered resolution for '%s'"), path);
1056 goto fail_exit;
1059 filename = rerere_path(id, "postimage");
1060 if (unlink(filename)) {
1061 if (errno == ENOENT)
1062 error(_("no remembered resolution for '%s'"), path);
1063 else
1064 error_errno(_("cannot unlink '%s'"), filename);
1065 goto fail_exit;
1069 * Update the preimage so that the user can resolve the
1070 * conflict in the working tree, run us again to record
1071 * the postimage.
1073 handle_cache(istate, path, hash, rerere_path(id, "preimage"));
1074 fprintf_ln(stderr, _("Updated preimage for '%s'"), path);
1077 * And remember that we can record resolution for this
1078 * conflict when the user is done.
1080 item = string_list_insert(rr, path);
1081 free_rerere_id(item);
1082 item->util = id;
1083 fprintf(stderr, _("Forgot resolution for '%s'\n"), path);
1084 return 0;
1086 fail_exit:
1087 free(id);
1088 return -1;
1091 int rerere_forget(struct repository *r, struct pathspec *pathspec)
1093 int i, fd;
1094 struct string_list conflict = STRING_LIST_INIT_DUP;
1095 struct string_list merge_rr = STRING_LIST_INIT_DUP;
1097 if (repo_read_index(r) < 0)
1098 return error(_("index file corrupt"));
1100 fd = setup_rerere(r, &merge_rr, RERERE_NOAUTOUPDATE);
1101 if (fd < 0)
1102 return 0;
1105 * The paths may have been resolved (incorrectly);
1106 * recover the original conflicted state and then
1107 * find the conflicted paths.
1109 unmerge_index(r->index, pathspec);
1110 find_conflict(r, &conflict);
1111 for (i = 0; i < conflict.nr; i++) {
1112 struct string_list_item *it = &conflict.items[i];
1113 if (!match_pathspec(r->index, pathspec, it->string,
1114 strlen(it->string), 0, NULL, 0))
1115 continue;
1116 rerere_forget_one_path(r->index, it->string, &merge_rr);
1118 return write_rr(&merge_rr, fd);
1122 * Garbage collection support
1125 static timestamp_t rerere_created_at(struct rerere_id *id)
1127 struct stat st;
1129 return stat(rerere_path(id, "preimage"), &st) ? (time_t) 0 : st.st_mtime;
1132 static timestamp_t rerere_last_used_at(struct rerere_id *id)
1134 struct stat st;
1136 return stat(rerere_path(id, "postimage"), &st) ? (time_t) 0 : st.st_mtime;
1140 * Remove the recorded resolution for a given conflict ID
1142 static void unlink_rr_item(struct rerere_id *id)
1144 unlink_or_warn(rerere_path(id, "thisimage"));
1145 remove_variant(id);
1146 id->collection->status[id->variant] = 0;
1149 static void prune_one(struct rerere_id *id,
1150 timestamp_t cutoff_resolve, timestamp_t cutoff_noresolve)
1152 timestamp_t then;
1153 timestamp_t cutoff;
1155 then = rerere_last_used_at(id);
1156 if (then)
1157 cutoff = cutoff_resolve;
1158 else {
1159 then = rerere_created_at(id);
1160 if (!then)
1161 return;
1162 cutoff = cutoff_noresolve;
1164 if (then < cutoff)
1165 unlink_rr_item(id);
1168 /* Does the basename in "path" look plausibly like an rr-cache entry? */
1169 static int is_rr_cache_dirname(const char *path)
1171 struct object_id oid;
1172 const char *end;
1173 return !parse_oid_hex(path, &oid, &end) && !*end;
1176 void rerere_gc(struct repository *r, struct string_list *rr)
1178 struct string_list to_remove = STRING_LIST_INIT_DUP;
1179 DIR *dir;
1180 struct dirent *e;
1181 int i;
1182 timestamp_t now = time(NULL);
1183 timestamp_t cutoff_noresolve = now - 15 * 86400;
1184 timestamp_t cutoff_resolve = now - 60 * 86400;
1186 if (setup_rerere(r, rr, 0) < 0)
1187 return;
1189 git_config_get_expiry_in_days("gc.rerereresolved", &cutoff_resolve, now);
1190 git_config_get_expiry_in_days("gc.rerereunresolved", &cutoff_noresolve, now);
1191 git_config(git_default_config, NULL);
1192 dir = opendir(git_path("rr-cache"));
1193 if (!dir)
1194 die_errno(_("unable to open rr-cache directory"));
1195 /* Collect stale conflict IDs ... */
1196 while ((e = readdir_skip_dot_and_dotdot(dir))) {
1197 struct rerere_dir *rr_dir;
1198 struct rerere_id id;
1199 int now_empty;
1201 if (!is_rr_cache_dirname(e->d_name))
1202 continue; /* or should we remove e->d_name? */
1204 rr_dir = find_rerere_dir(e->d_name);
1206 now_empty = 1;
1207 for (id.variant = 0, id.collection = rr_dir;
1208 id.variant < id.collection->status_nr;
1209 id.variant++) {
1210 prune_one(&id, cutoff_resolve, cutoff_noresolve);
1211 if (id.collection->status[id.variant])
1212 now_empty = 0;
1214 if (now_empty)
1215 string_list_append(&to_remove, e->d_name);
1217 closedir(dir);
1219 /* ... and then remove the empty directories */
1220 for (i = 0; i < to_remove.nr; i++)
1221 rmdir(git_path("rr-cache/%s", to_remove.items[i].string));
1222 string_list_clear(&to_remove, 0);
1223 rollback_lock_file(&write_lock);
1227 * During a conflict resolution, after "rerere" recorded the
1228 * preimages, abandon them if the user did not resolve them or
1229 * record their resolutions. And drop $GIT_DIR/MERGE_RR.
1231 * NEEDSWORK: shouldn't we be calling this from "reset --hard"?
1233 void rerere_clear(struct repository *r, struct string_list *merge_rr)
1235 int i;
1237 if (setup_rerere(r, merge_rr, 0) < 0)
1238 return;
1240 for (i = 0; i < merge_rr->nr; i++) {
1241 struct rerere_id *id = merge_rr->items[i].util;
1242 if (!has_rerere_resolution(id)) {
1243 unlink_rr_item(id);
1244 rmdir(rerere_path(id, NULL));
1247 unlink_or_warn(git_path_merge_rr(r));
1248 rollback_lock_file(&write_lock);