A few more fixes before -rc1
[alt-git.git] / reftable / stack.c
blob b64e55648aa8798054bb7b8a781376e7fa3bc2af
1 /*
2 Copyright 2020 Google LLC
4 Use of this source code is governed by a BSD-style
5 license that can be found in the LICENSE file or at
6 https://developers.google.com/open-source/licenses/bsd
7 */
9 #include "stack.h"
11 #include "../write-or-die.h"
12 #include "system.h"
13 #include "merged.h"
14 #include "reader.h"
15 #include "refname.h"
16 #include "reftable-error.h"
17 #include "reftable-record.h"
18 #include "reftable-merged.h"
19 #include "writer.h"
20 #include "tempfile.h"
/*
 * Forward declarations of file-local helpers that are referenced before
 * their definitions further down in this file.
 */
22 static int stack_try_add(struct reftable_stack *st,
23 int (*write_table)(struct reftable_writer *wr,
24 void *arg),
25 void *arg);
26 static int stack_write_compact(struct reftable_stack *st,
27 struct reftable_writer *wr,
28 size_t first, size_t last,
29 struct reftable_log_expiry_config *config);
30 static int stack_check_addition(struct reftable_stack *st,
31 const char *new_tab_name);
32 static void reftable_addition_close(struct reftable_addition *add);
33 static int reftable_stack_reload_maybe_reuse(struct reftable_stack *st,
34 int reuse_open);
36 static void stack_filename(struct strbuf *dest, struct reftable_stack *st,
37 const char *name)
39 strbuf_reset(dest);
40 strbuf_addstr(dest, st->reftable_dir);
41 strbuf_addstr(dest, "/");
42 strbuf_addstr(dest, name);
/*
 * Writer callback: `arg` points at an int file descriptor; write all of
 * `data` (`sz` bytes) to it via write_in_full() and return its result.
 */
static ssize_t reftable_fd_write(void *arg, const void *data, size_t sz)
{
	const int fd = *(int *)arg;

	return write_in_full(fd, data, sz);
}
51 static int reftable_fd_flush(void *arg)
53 int *fdp = (int *)arg;
55 return fsync_component(FSYNC_COMPONENT_REFERENCE, *fdp);
58 int reftable_new_stack(struct reftable_stack **dest, const char *dir,
59 struct reftable_write_options config)
61 struct reftable_stack *p = reftable_calloc(1, sizeof(*p));
62 struct strbuf list_file_name = STRBUF_INIT;
63 int err = 0;
65 if (config.hash_id == 0) {
66 config.hash_id = GIT_SHA1_FORMAT_ID;
69 *dest = NULL;
71 strbuf_reset(&list_file_name);
72 strbuf_addstr(&list_file_name, dir);
73 strbuf_addstr(&list_file_name, "/tables.list");
75 p->list_file = strbuf_detach(&list_file_name, NULL);
76 p->list_fd = -1;
77 p->reftable_dir = xstrdup(dir);
78 p->config = config;
80 err = reftable_stack_reload_maybe_reuse(p, 1);
81 if (err < 0) {
82 reftable_stack_destroy(p);
83 } else {
84 *dest = p;
86 return err;
89 static int fd_read_lines(int fd, char ***namesp)
91 off_t size = lseek(fd, 0, SEEK_END);
92 char *buf = NULL;
93 int err = 0;
94 if (size < 0) {
95 err = REFTABLE_IO_ERROR;
96 goto done;
98 err = lseek(fd, 0, SEEK_SET);
99 if (err < 0) {
100 err = REFTABLE_IO_ERROR;
101 goto done;
104 REFTABLE_ALLOC_ARRAY(buf, size + 1);
105 if (read_in_full(fd, buf, size) != size) {
106 err = REFTABLE_IO_ERROR;
107 goto done;
109 buf[size] = 0;
111 parse_names(buf, size, namesp);
113 done:
114 reftable_free(buf);
115 return err;
118 int read_lines(const char *filename, char ***namesp)
120 int fd = open(filename, O_RDONLY);
121 int err = 0;
122 if (fd < 0) {
123 if (errno == ENOENT) {
124 REFTABLE_CALLOC_ARRAY(*namesp, 1);
125 return 0;
128 return REFTABLE_IO_ERROR;
130 err = fd_read_lines(fd, namesp);
131 close(fd);
132 return err;
135 struct reftable_merged_table *
136 reftable_stack_merged_table(struct reftable_stack *st)
138 return st->merged;
/*
 * Return 1 when `name` occurs in the NULL-terminated array `names`,
 * 0 otherwise.
 */
static int has_name(char **names, const char *name)
{
	size_t idx;

	for (idx = 0; names[idx]; idx++) {
		if (strcmp(names[idx], name) == 0)
			return 1;
	}
	return 0;
}
151 /* Close and free the stack */
152 void reftable_stack_destroy(struct reftable_stack *st)
154 char **names = NULL;
155 int err = 0;
156 if (st->merged) {
157 reftable_merged_table_free(st->merged);
158 st->merged = NULL;
161 err = read_lines(st->list_file, &names);
162 if (err < 0) {
163 FREE_AND_NULL(names);
166 if (st->readers) {
167 int i = 0;
168 struct strbuf filename = STRBUF_INIT;
169 for (i = 0; i < st->readers_len; i++) {
170 const char *name = reader_name(st->readers[i]);
171 strbuf_reset(&filename);
172 if (names && !has_name(names, name)) {
173 stack_filename(&filename, st, name);
175 reftable_reader_free(st->readers[i]);
177 if (filename.len) {
178 /* On Windows, can only unlink after closing. */
179 unlink(filename.buf);
182 strbuf_release(&filename);
183 st->readers_len = 0;
184 FREE_AND_NULL(st->readers);
187 if (st->list_fd >= 0) {
188 close(st->list_fd);
189 st->list_fd = -1;
192 FREE_AND_NULL(st->list_file);
193 FREE_AND_NULL(st->reftable_dir);
194 reftable_free(st);
195 free_names(names);
198 static struct reftable_reader **stack_copy_readers(struct reftable_stack *st,
199 int cur_len)
201 struct reftable_reader **cur = reftable_calloc(cur_len, sizeof(*cur));
202 int i = 0;
203 for (i = 0; i < cur_len; i++) {
204 cur[i] = st->readers[i];
206 return cur;
209 static int reftable_stack_reload_once(struct reftable_stack *st, char **names,
210 int reuse_open)
212 size_t cur_len = !st->merged ? 0 : st->merged->stack_len;
213 struct reftable_reader **cur = stack_copy_readers(st, cur_len);
214 size_t names_len = names_length(names);
215 struct reftable_reader **new_readers =
216 reftable_calloc(names_len, sizeof(*new_readers));
217 struct reftable_table *new_tables =
218 reftable_calloc(names_len, sizeof(*new_tables));
219 size_t new_readers_len = 0;
220 struct reftable_merged_table *new_merged = NULL;
221 struct strbuf table_path = STRBUF_INIT;
222 int err = 0;
223 size_t i;
225 while (*names) {
226 struct reftable_reader *rd = NULL;
227 char *name = *names++;
229 /* this is linear; we assume compaction keeps the number of
230 tables under control so this is not quadratic. */
231 for (i = 0; reuse_open && i < cur_len; i++) {
232 if (cur[i] && 0 == strcmp(cur[i]->name, name)) {
233 rd = cur[i];
234 cur[i] = NULL;
235 break;
239 if (!rd) {
240 struct reftable_block_source src = { NULL };
241 stack_filename(&table_path, st, name);
243 err = reftable_block_source_from_file(&src,
244 table_path.buf);
245 if (err < 0)
246 goto done;
248 err = reftable_new_reader(&rd, &src, name);
249 if (err < 0)
250 goto done;
253 new_readers[new_readers_len] = rd;
254 reftable_table_from_reader(&new_tables[new_readers_len], rd);
255 new_readers_len++;
258 /* success! */
259 err = reftable_new_merged_table(&new_merged, new_tables,
260 new_readers_len, st->config.hash_id);
261 if (err < 0)
262 goto done;
264 new_tables = NULL;
265 st->readers_len = new_readers_len;
266 if (st->merged) {
267 merged_table_release(st->merged);
268 reftable_merged_table_free(st->merged);
270 if (st->readers) {
271 reftable_free(st->readers);
273 st->readers = new_readers;
274 new_readers = NULL;
275 new_readers_len = 0;
277 new_merged->suppress_deletions = 1;
278 st->merged = new_merged;
279 for (i = 0; i < cur_len; i++) {
280 if (cur[i]) {
281 const char *name = reader_name(cur[i]);
282 stack_filename(&table_path, st, name);
284 reader_close(cur[i]);
285 reftable_reader_free(cur[i]);
287 /* On Windows, can only unlink after closing. */
288 unlink(table_path.buf);
292 done:
293 for (i = 0; i < new_readers_len; i++) {
294 reader_close(new_readers[i]);
295 reftable_reader_free(new_readers[i]);
297 reftable_free(new_readers);
298 reftable_free(new_tables);
299 reftable_free(cur);
300 strbuf_release(&table_path);
301 return err;
/*
 * Compare two timestamps: return a negative value if `a` is before `b`,
 * zero if they are equal and a positive value if `a` is after `b`.
 *
 * The fields are compared directly instead of returning their difference,
 * because a time_t difference does not necessarily fit into an int.
 */
static int tv_cmp(struct timeval *a, struct timeval *b)
{
	if (a->tv_sec != b->tv_sec)
		return a->tv_sec < b->tv_sec ? -1 : 1;
	if (a->tv_usec != b->tv_usec)
		return a->tv_usec < b->tv_usec ? -1 : 1;
	return 0;
}
/*
 * Reload the stack from st->list_file, retrying while the list appears to
 * be changing underneath us.
 *
 * Each round opens the list (a missing file counts as an empty list), reads
 * the table names and calls reftable_stack_reload_once(). If that fails
 * with REFTABLE_NOT_EXIST_ERROR and the list has changed in the meantime,
 * the round is repeated after a randomized, growing sleep. The loop stops
 * retrying once more than three tries were made and a deadline of three
 * seconds after entry has passed.
 *
 * `reuse_open` is passed through to reftable_stack_reload_once().
 *
 * On success with an open list file, the descriptor and its fstat() data
 * are cached in st->list_fd / st->list_st, provided st_dev and st_ino are
 * both non-zero. Any previously cached descriptor is closed in all cases.
 */
316 static int reftable_stack_reload_maybe_reuse(struct reftable_stack *st,
317 int reuse_open)
319 char **names = NULL, **names_after = NULL;
320 struct timeval deadline;
321 int64_t delay = 0;
322 int tries = 0, err;
323 int fd = -1;
325 err = gettimeofday(&deadline, NULL);
326 if (err < 0)
327 goto out;
328 deadline.tv_sec += 3;
330 while (1) {
331 struct timeval now;
333 err = gettimeofday(&now, NULL);
334 if (err < 0)
335 goto out;
338 * Only look at deadlines after the first few times. This
339 * simplifies debugging in GDB.
/*
 * NOTE(review): when the deadline check below fires, `err` still holds the
 * 0 returned by gettimeofday() above, so giving up appears to be reported
 * as success even though no reload happened in this round. Confirm that
 * this is intended.
 */
341 tries++;
342 if (tries > 3 && tv_cmp(&now, &deadline) >= 0)
343 goto out;
345 fd = open(st->list_file, O_RDONLY);
346 if (fd < 0) {
347 if (errno != ENOENT) {
348 err = REFTABLE_IO_ERROR;
349 goto out;
/* A missing list file is treated as an empty list of names. */
352 REFTABLE_CALLOC_ARRAY(names, 1);
353 } else {
354 err = fd_read_lines(fd, &names);
355 if (err < 0)
356 goto out;
359 err = reftable_stack_reload_once(st, names, reuse_open);
360 if (!err)
361 break;
362 if (err != REFTABLE_NOT_EXIST_ERROR)
363 goto out;
366 * REFTABLE_NOT_EXIST_ERROR can be caused by a concurrent
367 * writer. Check if there was one by checking if the name list
368 * changed.
370 err = read_lines(st->list_file, &names_after);
371 if (err < 0)
372 goto out;
373 if (names_equal(names_after, names)) {
374 err = REFTABLE_NOT_EXIST_ERROR;
375 goto out;
/* The list changed: drop this round's state before trying again. */
378 free_names(names);
379 names = NULL;
380 free_names(names_after);
381 names_after = NULL;
382 close(fd);
383 fd = -1;
/* Each retry sleeps at least 1ms longer than the previous one. */
385 delay = delay + (delay * rand()) / RAND_MAX + 1;
386 sleep_millisec(delay);
389 out:
391 * Invalidate the stat cache. It is sufficient to only close the file
392 * descriptor and keep the cached stat info because we never use the
393 * latter when the former is negative.
395 if (st->list_fd >= 0) {
396 close(st->list_fd);
397 st->list_fd = -1;
401 * Cache stat information in case it provides a useful signal to us.
402 * According to POSIX, "The st_ino and st_dev fields taken together
403 * uniquely identify the file within the system." That being said,
404 * Windows is not POSIX compliant and we do not have these fields
405 * available. So the information we have there is insufficient to
406 * determine whether two file descriptors point to the same file.
408 * While we could fall back to using other signals like the file's
409 * mtime, those are not sufficient to avoid races. We thus refrain from
410 * using the stat cache on such systems and fall back to the secondary
411 * caching mechanism, which is to check whether contents of the file
412 * have changed.
414 * On other systems which are POSIX compliant we must keep the file
415 * descriptor open. This is to avoid a race condition where two
416 * processes access the reftable stack at the same point in time:
418 * 1. A reads the reftable stack and caches its stat info.
420 * 2. B updates the stack, appending a new table to "tables.list".
421 * This will both use a new inode and result in a different file
422 * size, thus invalidating A's cache in theory.
424 * 3. B decides to auto-compact the stack and merges two tables. The
425 * file size now matches what A has cached again. Furthermore, the
426 * filesystem may decide to recycle the inode number of the file
427 * we have replaced in (2) because it is not in use anymore.
429 * 4. A reloads the reftable stack. Neither the inode number nor the
430 * file size changed. If the timestamps did not change either then
431 * we think the cached copy of our stack is up-to-date.
433 * By keeping the file descriptor open the inode number cannot be
434 * recycled, mitigating the race.
/* Ownership of `fd` moves to the stack here; it is then not closed below. */
436 if (!err && fd >= 0 && !fstat(fd, &st->list_st) &&
437 st->list_st.st_dev && st->list_st.st_ino) {
438 st->list_fd = fd;
439 fd = -1;
442 if (fd >= 0)
443 close(fd);
444 free_names(names);
445 free_names(names_after);
446 return err;
449 /* -1 = error
450 0 = up to date
451 1 = changed. */
452 static int stack_uptodate(struct reftable_stack *st)
454 char **names = NULL;
455 int err;
456 int i = 0;
459 * When we have cached stat information available then we use it to
460 * verify whether the file has been rewritten.
462 * Note that we explicitly do not want to use `stat_validity_check()`
463 * and friends here because they may end up not comparing the `st_dev`
464 * and `st_ino` fields. These functions thus cannot guarantee that we
465 * indeed still have the same file.
467 if (st->list_fd >= 0) {
468 struct stat list_st;
470 if (stat(st->list_file, &list_st) < 0) {
472 * It's fine for "tables.list" to not exist. In that
473 * case, we have to refresh when the loaded stack has
474 * any readers.
476 if (errno == ENOENT)
477 return !!st->readers_len;
478 return REFTABLE_IO_ERROR;
482 * When "tables.list" refers to the same file we can assume
483 * that it didn't change. This is because we always use
484 * rename(3P) to update the file and never write to it
485 * directly.
487 if (st->list_st.st_dev == list_st.st_dev &&
488 st->list_st.st_ino == list_st.st_ino)
489 return 0;
492 err = read_lines(st->list_file, &names);
493 if (err < 0)
494 return err;
496 for (i = 0; i < st->readers_len; i++) {
497 if (!names[i]) {
498 err = 1;
499 goto done;
502 if (strcmp(st->readers[i]->name, names[i])) {
503 err = 1;
504 goto done;
508 if (names[st->merged->stack_len]) {
509 err = 1;
510 goto done;
513 done:
514 free_names(names);
515 return err;
/*
 * Reload the stack if "tables.list" changed. Returns 0 when the stack was
 * already up to date, a negative error from the check, or otherwise the
 * result of the reload.
 */
int reftable_stack_reload(struct reftable_stack *st)
{
	int status = stack_uptodate(st);

	if (status <= 0)
		return status;
	return reftable_stack_reload_maybe_reuse(st, 1);
}
526 int reftable_stack_add(struct reftable_stack *st,
527 int (*write)(struct reftable_writer *wr, void *arg),
528 void *arg)
530 int err = stack_try_add(st, write, arg);
531 if (err < 0) {
532 if (err == REFTABLE_LOCK_ERROR) {
533 /* Ignore error return, we want to propagate
534 REFTABLE_LOCK_ERROR.
536 reftable_stack_reload(st);
538 return err;
541 return 0;
/*
 * Replace the contents of `dest` with a table name built from the update
 * index range [`min`, `max`] and a 32-bit value taken from git_rand().
 */
static void format_name(struct strbuf *dest, uint64_t min, uint64_t max)
{
	char formatted[100];
	uint32_t suffix = (uint32_t)git_rand();

	snprintf(formatted, sizeof(formatted),
		 "0x%012" PRIx64 "-0x%012" PRIx64 "-%08x",
		 min, max, suffix);

	strbuf_reset(dest);
	strbuf_addstr(dest, formatted);
}
/*
 * State of one in-progress addition of tables to a stack.
 */
554 struct reftable_addition {
/* Tempfile created as "<list_file>.lock" by reftable_stack_init_addition(). */
555 struct tempfile *lock_file;
/* The stack that tables are being added to. */
556 struct reftable_stack *stack;
/*
 * Names of the tables appended by reftable_addition_add(), with length and
 * capacity. reftable_addition_close() unlinks and frees any that are left.
 */
558 char **new_tables;
559 size_t new_tables_len, new_tables_cap;
/* Set from reftable_stack_next_update_index() when the addition starts. */
560 uint64_t next_update_index;
/* Zero-initializer for a struct reftable_addition. */
563 #define REFTABLE_ADDITION_INIT {0}
565 static int reftable_stack_init_addition(struct reftable_addition *add,
566 struct reftable_stack *st)
568 struct strbuf lock_file_name = STRBUF_INIT;
569 int err = 0;
570 add->stack = st;
572 strbuf_addf(&lock_file_name, "%s.lock", st->list_file);
574 add->lock_file = create_tempfile(lock_file_name.buf);
575 if (!add->lock_file) {
576 if (errno == EEXIST) {
577 err = REFTABLE_LOCK_ERROR;
578 } else {
579 err = REFTABLE_IO_ERROR;
581 goto done;
583 if (st->config.default_permissions) {
584 if (chmod(add->lock_file->filename.buf, st->config.default_permissions) < 0) {
585 err = REFTABLE_IO_ERROR;
586 goto done;
590 err = stack_uptodate(st);
591 if (err < 0)
592 goto done;
594 if (err > 1) {
595 err = REFTABLE_LOCK_ERROR;
596 goto done;
599 add->next_update_index = reftable_stack_next_update_index(st);
600 done:
601 if (err) {
602 reftable_addition_close(add);
604 strbuf_release(&lock_file_name);
605 return err;
608 static void reftable_addition_close(struct reftable_addition *add)
610 struct strbuf nm = STRBUF_INIT;
611 size_t i;
613 for (i = 0; i < add->new_tables_len; i++) {
614 stack_filename(&nm, add->stack, add->new_tables[i]);
615 unlink(nm.buf);
616 reftable_free(add->new_tables[i]);
617 add->new_tables[i] = NULL;
619 reftable_free(add->new_tables);
620 add->new_tables = NULL;
621 add->new_tables_len = 0;
622 add->new_tables_cap = 0;
624 delete_tempfile(&add->lock_file);
625 strbuf_release(&nm);
/* Close and free an addition; a NULL `add` is accepted and ignored. */
void reftable_addition_destroy(struct reftable_addition *add)
{
	if (add) {
		reftable_addition_close(add);
		reftable_free(add);
	}
}
637 int reftable_addition_commit(struct reftable_addition *add)
639 struct strbuf table_list = STRBUF_INIT;
640 int lock_file_fd = get_tempfile_fd(add->lock_file);
641 int err = 0;
642 size_t i;
644 if (add->new_tables_len == 0)
645 goto done;
647 for (i = 0; i < add->stack->merged->stack_len; i++) {
648 strbuf_addstr(&table_list, add->stack->readers[i]->name);
649 strbuf_addstr(&table_list, "\n");
651 for (i = 0; i < add->new_tables_len; i++) {
652 strbuf_addstr(&table_list, add->new_tables[i]);
653 strbuf_addstr(&table_list, "\n");
656 err = write_in_full(lock_file_fd, table_list.buf, table_list.len);
657 strbuf_release(&table_list);
658 if (err < 0) {
659 err = REFTABLE_IO_ERROR;
660 goto done;
663 fsync_component_or_die(FSYNC_COMPONENT_REFERENCE, lock_file_fd,
664 get_tempfile_path(add->lock_file));
666 err = rename_tempfile(&add->lock_file, add->stack->list_file);
667 if (err < 0) {
668 err = REFTABLE_IO_ERROR;
669 goto done;
672 /* success, no more state to clean up. */
673 for (i = 0; i < add->new_tables_len; i++)
674 reftable_free(add->new_tables[i]);
675 reftable_free(add->new_tables);
676 add->new_tables = NULL;
677 add->new_tables_len = 0;
678 add->new_tables_cap = 0;
680 err = reftable_stack_reload_maybe_reuse(add->stack, 1);
681 if (err)
682 goto done;
684 if (!add->stack->disable_auto_compact)
685 err = reftable_stack_auto_compact(add->stack);
687 done:
688 reftable_addition_close(add);
689 return err;
692 int reftable_stack_new_addition(struct reftable_addition **dest,
693 struct reftable_stack *st)
695 int err = 0;
696 struct reftable_addition empty = REFTABLE_ADDITION_INIT;
697 REFTABLE_CALLOC_ARRAY(*dest, 1);
698 **dest = empty;
699 err = reftable_stack_init_addition(*dest, st);
700 if (err) {
701 reftable_free(*dest);
702 *dest = NULL;
704 return err;
707 static int stack_try_add(struct reftable_stack *st,
708 int (*write_table)(struct reftable_writer *wr,
709 void *arg),
710 void *arg)
712 struct reftable_addition add = REFTABLE_ADDITION_INIT;
713 int err = reftable_stack_init_addition(&add, st);
714 if (err < 0)
715 goto done;
716 if (err > 0) {
717 err = REFTABLE_LOCK_ERROR;
718 goto done;
721 err = reftable_addition_add(&add, write_table, arg);
722 if (err < 0)
723 goto done;
725 err = reftable_addition_commit(&add);
726 done:
727 reftable_addition_close(&add);
728 return err;
731 int reftable_addition_add(struct reftable_addition *add,
732 int (*write_table)(struct reftable_writer *wr,
733 void *arg),
734 void *arg)
736 struct strbuf temp_tab_file_name = STRBUF_INIT;
737 struct strbuf tab_file_name = STRBUF_INIT;
738 struct strbuf next_name = STRBUF_INIT;
739 struct reftable_writer *wr = NULL;
740 int err = 0;
741 int tab_fd = 0;
743 strbuf_reset(&next_name);
744 format_name(&next_name, add->next_update_index, add->next_update_index);
746 stack_filename(&temp_tab_file_name, add->stack, next_name.buf);
747 strbuf_addstr(&temp_tab_file_name, ".temp.XXXXXX");
749 tab_fd = mkstemp(temp_tab_file_name.buf);
750 if (tab_fd < 0) {
751 err = REFTABLE_IO_ERROR;
752 goto done;
754 if (add->stack->config.default_permissions) {
755 if (chmod(temp_tab_file_name.buf, add->stack->config.default_permissions)) {
756 err = REFTABLE_IO_ERROR;
757 goto done;
760 wr = reftable_new_writer(reftable_fd_write, reftable_fd_flush, &tab_fd,
761 &add->stack->config);
762 err = write_table(wr, arg);
763 if (err < 0)
764 goto done;
766 err = reftable_writer_close(wr);
767 if (err == REFTABLE_EMPTY_TABLE_ERROR) {
768 err = 0;
769 goto done;
771 if (err < 0)
772 goto done;
774 err = close(tab_fd);
775 tab_fd = 0;
776 if (err < 0) {
777 err = REFTABLE_IO_ERROR;
778 goto done;
781 err = stack_check_addition(add->stack, temp_tab_file_name.buf);
782 if (err < 0)
783 goto done;
785 if (wr->min_update_index < add->next_update_index) {
786 err = REFTABLE_API_ERROR;
787 goto done;
790 format_name(&next_name, wr->min_update_index, wr->max_update_index);
791 strbuf_addstr(&next_name, ".ref");
793 stack_filename(&tab_file_name, add->stack, next_name.buf);
796 On windows, this relies on rand() picking a unique destination name.
797 Maybe we should do retry loop as well?
799 err = rename(temp_tab_file_name.buf, tab_file_name.buf);
800 if (err < 0) {
801 err = REFTABLE_IO_ERROR;
802 goto done;
805 REFTABLE_ALLOC_GROW(add->new_tables, add->new_tables_len + 1,
806 add->new_tables_cap);
807 add->new_tables[add->new_tables_len++] = strbuf_detach(&next_name, NULL);
808 done:
809 if (tab_fd > 0) {
810 close(tab_fd);
811 tab_fd = 0;
813 if (temp_tab_file_name.len > 0) {
814 unlink(temp_tab_file_name.buf);
817 strbuf_release(&temp_tab_file_name);
818 strbuf_release(&tab_file_name);
819 strbuf_release(&next_name);
820 reftable_writer_free(wr);
821 return err;
824 uint64_t reftable_stack_next_update_index(struct reftable_stack *st)
826 int sz = st->merged->stack_len;
827 if (sz > 0)
828 return reftable_reader_max_update_index(st->readers[sz - 1]) +
830 return 1;
833 static int stack_compact_locked(struct reftable_stack *st,
834 size_t first, size_t last,
835 struct strbuf *temp_tab,
836 struct reftable_log_expiry_config *config)
838 struct strbuf next_name = STRBUF_INIT;
839 int tab_fd = -1;
840 struct reftable_writer *wr = NULL;
841 int err = 0;
843 format_name(&next_name,
844 reftable_reader_min_update_index(st->readers[first]),
845 reftable_reader_max_update_index(st->readers[last]));
847 stack_filename(temp_tab, st, next_name.buf);
848 strbuf_addstr(temp_tab, ".temp.XXXXXX");
850 tab_fd = mkstemp(temp_tab->buf);
851 if (st->config.default_permissions &&
852 chmod(temp_tab->buf, st->config.default_permissions) < 0) {
853 err = REFTABLE_IO_ERROR;
854 goto done;
857 wr = reftable_new_writer(reftable_fd_write, reftable_fd_flush, &tab_fd, &st->config);
859 err = stack_write_compact(st, wr, first, last, config);
860 if (err < 0)
861 goto done;
862 err = reftable_writer_close(wr);
863 if (err < 0)
864 goto done;
866 err = close(tab_fd);
867 tab_fd = 0;
869 done:
870 reftable_writer_free(wr);
871 if (tab_fd > 0) {
872 close(tab_fd);
873 tab_fd = 0;
875 if (err != 0 && temp_tab->len > 0) {
876 unlink(temp_tab->buf);
877 strbuf_release(temp_tab);
879 strbuf_release(&next_name);
880 return err;
/*
 * Write the merged contents of tables [first, last] of the stack to `wr`.
 *
 * All ref records are written first, then all log records. When
 * `first == 0`, deletion records are skipped. Log records are also skipped
 * when `config` is given and they are older than its min_update_index or
 * its time, as far as those are set.
 *
 * Adds the sizes of the input tables to st->stats.bytes and the number of
 * records written to st->stats.entries_written. Returns 0 on success or a
 * negative error.
 */
883 static int stack_write_compact(struct reftable_stack *st,
884 struct reftable_writer *wr,
885 size_t first, size_t last,
886 struct reftable_log_expiry_config *config)
888 size_t subtabs_len = last - first + 1;
889 struct reftable_table *subtabs = reftable_calloc(
890 last - first + 1, sizeof(*subtabs));
891 struct reftable_merged_table *mt = NULL;
892 struct reftable_iterator it = { NULL };
893 struct reftable_ref_record ref = { NULL };
894 struct reftable_log_record log = { NULL };
895 uint64_t entries = 0;
896 int err = 0;
898 for (size_t i = first, j = 0; i <= last; i++) {
899 struct reftable_reader *t = st->readers[i];
900 reftable_table_from_reader(&subtabs[j++], t);
901 st->stats.bytes += t->size;
/* The output table spans the update indices of the whole input range. */
903 reftable_writer_set_limits(wr, st->readers[first]->min_update_index,
904 st->readers[last]->max_update_index);
906 err = reftable_new_merged_table(&mt, subtabs, subtabs_len,
907 st->config.hash_id);
/*
 * `subtabs` is only freed here on failure; presumably the merged table
 * takes ownership of it otherwise -- TODO confirm.
 */
908 if (err < 0) {
909 reftable_free(subtabs);
910 goto done;
/* Seeking to "" starts the iteration at the first ref record. */
913 err = reftable_merged_table_seek_ref(mt, &it, "");
914 if (err < 0)
915 goto done;
917 while (1) {
918 err = reftable_iterator_next_ref(&it, &ref);
/* A positive result ends the iteration and is not an error. */
919 if (err > 0) {
920 err = 0;
921 break;
923 if (err < 0)
924 goto done;
/*
 * presumably deletions are only needed to shadow entries in tables below
 * `first`, of which there are none when first == 0 -- verify.
 */
926 if (first == 0 && reftable_ref_record_is_deletion(&ref)) {
927 continue;
930 err = reftable_writer_add_ref(wr, &ref);
931 if (err < 0)
932 goto done;
933 entries++;
/* The ref iterator is destroyed before `it` is reused for the logs. */
935 reftable_iterator_destroy(&it);
937 err = reftable_merged_table_seek_log(mt, &it, "");
938 if (err < 0)
939 goto done;
941 while (1) {
942 err = reftable_iterator_next_log(&it, &log);
943 if (err > 0) {
944 err = 0;
945 break;
947 if (err < 0)
948 goto done;
949 if (first == 0 && reftable_log_record_is_deletion(&log)) {
950 continue;
/* Expiry by update index. */
953 if (config && config->min_update_index > 0 &&
954 log.update_index < config->min_update_index) {
955 continue;
/* Expiry by timestamp. */
958 if (config && config->time > 0 &&
959 log.value.update.time < config->time) {
960 continue;
963 err = reftable_writer_add_log(wr, &log);
964 if (err < 0)
965 goto done;
966 entries++;
969 done:
970 reftable_iterator_destroy(&it);
971 if (mt) {
972 merged_table_release(mt);
973 reftable_merged_table_free(mt);
975 reftable_ref_record_release(&ref);
976 reftable_log_record_release(&log);
/* Records written before a failure are still counted. */
977 st->stats.entries_written += entries;
978 return err;
981 /* < 0: error. 0 == OK, > 0 attempt failed; could retry. */
982 static int stack_compact_range(struct reftable_stack *st,
983 size_t first, size_t last,
984 struct reftable_log_expiry_config *expiry)
986 char **delete_on_success = NULL, **subtable_locks = NULL, **listp = NULL;
987 struct strbuf temp_tab_file_name = STRBUF_INIT;
988 struct strbuf new_table_name = STRBUF_INIT;
989 struct strbuf lock_file_name = STRBUF_INIT;
990 struct strbuf ref_list_contents = STRBUF_INIT;
991 struct strbuf new_table_path = STRBUF_INIT;
992 size_t i, j, compact_count;
993 int err = 0;
994 int have_lock = 0;
995 int lock_file_fd = -1;
996 int is_empty_table = 0;
998 if (first > last || (!expiry && first == last)) {
999 err = 0;
1000 goto done;
1003 compact_count = last - first + 1;
1004 REFTABLE_CALLOC_ARRAY(delete_on_success, compact_count + 1);
1005 REFTABLE_CALLOC_ARRAY(subtable_locks, compact_count + 1);
1007 st->stats.attempts++;
1009 strbuf_reset(&lock_file_name);
1010 strbuf_addstr(&lock_file_name, st->list_file);
1011 strbuf_addstr(&lock_file_name, ".lock");
1013 lock_file_fd =
1014 open(lock_file_name.buf, O_EXCL | O_CREAT | O_WRONLY, 0666);
1015 if (lock_file_fd < 0) {
1016 if (errno == EEXIST) {
1017 err = 1;
1018 } else {
1019 err = REFTABLE_IO_ERROR;
1021 goto done;
1023 /* Don't want to write to the lock for now. */
1024 close(lock_file_fd);
1025 lock_file_fd = -1;
1027 have_lock = 1;
1028 err = stack_uptodate(st);
1029 if (err != 0)
1030 goto done;
1032 for (i = first, j = 0; i <= last; i++) {
1033 struct strbuf subtab_file_name = STRBUF_INIT;
1034 struct strbuf subtab_lock = STRBUF_INIT;
1035 int sublock_file_fd = -1;
1037 stack_filename(&subtab_file_name, st,
1038 reader_name(st->readers[i]));
1040 strbuf_reset(&subtab_lock);
1041 strbuf_addbuf(&subtab_lock, &subtab_file_name);
1042 strbuf_addstr(&subtab_lock, ".lock");
1044 sublock_file_fd = open(subtab_lock.buf,
1045 O_EXCL | O_CREAT | O_WRONLY, 0666);
1046 if (sublock_file_fd >= 0) {
1047 close(sublock_file_fd);
1048 } else if (sublock_file_fd < 0) {
1049 if (errno == EEXIST) {
1050 err = 1;
1051 } else {
1052 err = REFTABLE_IO_ERROR;
1056 subtable_locks[j] = subtab_lock.buf;
1057 delete_on_success[j] = subtab_file_name.buf;
1058 j++;
1060 if (err != 0)
1061 goto done;
1064 err = unlink(lock_file_name.buf);
1065 if (err < 0)
1066 goto done;
1067 have_lock = 0;
1069 err = stack_compact_locked(st, first, last, &temp_tab_file_name,
1070 expiry);
1071 /* Compaction + tombstones can create an empty table out of non-empty
1072 * tables. */
1073 is_empty_table = (err == REFTABLE_EMPTY_TABLE_ERROR);
1074 if (is_empty_table) {
1075 err = 0;
1077 if (err < 0)
1078 goto done;
1080 lock_file_fd =
1081 open(lock_file_name.buf, O_EXCL | O_CREAT | O_WRONLY, 0666);
1082 if (lock_file_fd < 0) {
1083 if (errno == EEXIST) {
1084 err = 1;
1085 } else {
1086 err = REFTABLE_IO_ERROR;
1088 goto done;
1090 have_lock = 1;
1091 if (st->config.default_permissions) {
1092 if (chmod(lock_file_name.buf, st->config.default_permissions) < 0) {
1093 err = REFTABLE_IO_ERROR;
1094 goto done;
1098 format_name(&new_table_name, st->readers[first]->min_update_index,
1099 st->readers[last]->max_update_index);
1100 strbuf_addstr(&new_table_name, ".ref");
1102 stack_filename(&new_table_path, st, new_table_name.buf);
1104 if (!is_empty_table) {
1105 /* retry? */
1106 err = rename(temp_tab_file_name.buf, new_table_path.buf);
1107 if (err < 0) {
1108 err = REFTABLE_IO_ERROR;
1109 goto done;
1113 for (i = 0; i < first; i++) {
1114 strbuf_addstr(&ref_list_contents, st->readers[i]->name);
1115 strbuf_addstr(&ref_list_contents, "\n");
1117 if (!is_empty_table) {
1118 strbuf_addbuf(&ref_list_contents, &new_table_name);
1119 strbuf_addstr(&ref_list_contents, "\n");
1121 for (i = last + 1; i < st->merged->stack_len; i++) {
1122 strbuf_addstr(&ref_list_contents, st->readers[i]->name);
1123 strbuf_addstr(&ref_list_contents, "\n");
1126 err = write_in_full(lock_file_fd, ref_list_contents.buf, ref_list_contents.len);
1127 if (err < 0) {
1128 err = REFTABLE_IO_ERROR;
1129 unlink(new_table_path.buf);
1130 goto done;
1133 err = fsync_component(FSYNC_COMPONENT_REFERENCE, lock_file_fd);
1134 if (err < 0) {
1135 err = REFTABLE_IO_ERROR;
1136 unlink(new_table_path.buf);
1137 goto done;
1140 err = close(lock_file_fd);
1141 lock_file_fd = -1;
1142 if (err < 0) {
1143 err = REFTABLE_IO_ERROR;
1144 unlink(new_table_path.buf);
1145 goto done;
1148 err = rename(lock_file_name.buf, st->list_file);
1149 if (err < 0) {
1150 err = REFTABLE_IO_ERROR;
1151 unlink(new_table_path.buf);
1152 goto done;
1154 have_lock = 0;
1156 /* Reload the stack before deleting. On windows, we can only delete the
1157 files after we closed them.
1159 err = reftable_stack_reload_maybe_reuse(st, first < last);
1161 listp = delete_on_success;
1162 while (*listp) {
1163 if (strcmp(*listp, new_table_path.buf)) {
1164 unlink(*listp);
1166 listp++;
1169 done:
1170 free_names(delete_on_success);
1172 if (subtable_locks) {
1173 listp = subtable_locks;
1174 while (*listp) {
1175 unlink(*listp);
1176 listp++;
1178 free_names(subtable_locks);
1180 if (lock_file_fd >= 0) {
1181 close(lock_file_fd);
1182 lock_file_fd = -1;
1184 if (have_lock) {
1185 unlink(lock_file_name.buf);
1187 strbuf_release(&new_table_name);
1188 strbuf_release(&new_table_path);
1189 strbuf_release(&ref_list_contents);
1190 strbuf_release(&temp_tab_file_name);
1191 strbuf_release(&lock_file_name);
1192 return err;
1195 int reftable_stack_compact_all(struct reftable_stack *st,
1196 struct reftable_log_expiry_config *config)
1198 return stack_compact_range(st, 0, st->merged->stack_len ?
1199 st->merged->stack_len - 1 : 0, config);
1202 static int stack_compact_range_stats(struct reftable_stack *st,
1203 size_t first, size_t last,
1204 struct reftable_log_expiry_config *config)
1206 int err = stack_compact_range(st, first, last, config);
1207 if (err > 0)
1208 st->stats.failures++;
1209 return err;
1212 static int segment_size(struct segment *s)
1214 return s->end - s->start;
/*
 * Integer base-2 logarithm, rounded down. By convention the result for 0
 * is 0.
 */
int fastlog2(uint64_t sz)
{
	int bits = 0;

	while (sz) {
		bits++;
		sz >>= 1;
	}
	return bits ? bits - 1 : 0;
}
1228 struct segment *sizes_to_segments(size_t *seglen, uint64_t *sizes, size_t n)
1230 struct segment *segs = reftable_calloc(n, sizeof(*segs));
1231 struct segment cur = { 0 };
1232 size_t next = 0, i;
1234 if (n == 0) {
1235 *seglen = 0;
1236 return segs;
1238 for (i = 0; i < n; i++) {
1239 int log = fastlog2(sizes[i]);
1240 if (cur.log != log && cur.bytes > 0) {
1241 struct segment fresh = {
1242 .start = i,
1245 segs[next++] = cur;
1246 cur = fresh;
1249 cur.log = log;
1250 cur.end = i + 1;
1251 cur.bytes += sizes[i];
1253 segs[next++] = cur;
1254 *seglen = next;
1255 return segs;
1258 struct segment suggest_compaction_segment(uint64_t *sizes, size_t n)
1260 struct segment min_seg = {
1261 .log = 64,
1263 struct segment *segs;
1264 size_t seglen = 0, i;
1266 segs = sizes_to_segments(&seglen, sizes, n);
1267 for (i = 0; i < seglen; i++) {
1268 if (segment_size(&segs[i]) == 1)
1269 continue;
1271 if (segs[i].log < min_seg.log)
1272 min_seg = segs[i];
1275 while (min_seg.start > 0) {
1276 size_t prev = min_seg.start - 1;
1277 if (fastlog2(min_seg.bytes) < fastlog2(sizes[prev]))
1278 break;
1280 min_seg.start = prev;
1281 min_seg.bytes += sizes[prev];
1284 reftable_free(segs);
1285 return min_seg;
1288 static uint64_t *stack_table_sizes_for_compaction(struct reftable_stack *st)
1290 uint64_t *sizes =
1291 reftable_calloc(st->merged->stack_len, sizeof(*sizes));
1292 int version = (st->config.hash_id == GIT_SHA1_FORMAT_ID) ? 1 : 2;
1293 int overhead = header_size(version) - 1;
1294 int i = 0;
1295 for (i = 0; i < st->merged->stack_len; i++) {
1296 sizes[i] = st->readers[i]->size - overhead;
1298 return sizes;
1301 int reftable_stack_auto_compact(struct reftable_stack *st)
1303 uint64_t *sizes = stack_table_sizes_for_compaction(st);
1304 struct segment seg =
1305 suggest_compaction_segment(sizes, st->merged->stack_len);
1306 reftable_free(sizes);
1307 if (segment_size(&seg) > 0)
1308 return stack_compact_range_stats(st, seg.start, seg.end - 1,
1309 NULL);
1311 return 0;
1314 struct reftable_compaction_stats *
1315 reftable_stack_compaction_stats(struct reftable_stack *st)
1317 return &st->stats;
1320 int reftable_stack_read_ref(struct reftable_stack *st, const char *refname,
1321 struct reftable_ref_record *ref)
1323 struct reftable_table tab = { NULL };
1324 reftable_table_from_merged_table(&tab, reftable_stack_merged_table(st));
1325 return reftable_table_read_ref(&tab, refname, ref);
1328 int reftable_stack_read_log(struct reftable_stack *st, const char *refname,
1329 struct reftable_log_record *log)
1331 struct reftable_iterator it = { NULL };
1332 struct reftable_merged_table *mt = reftable_stack_merged_table(st);
1333 int err = reftable_merged_table_seek_log(mt, &it, refname);
1334 if (err)
1335 goto done;
1337 err = reftable_iterator_next_log(&it, log);
1338 if (err)
1339 goto done;
1341 if (strcmp(log->refname, refname) ||
1342 reftable_log_record_is_deletion(log)) {
1343 err = 1;
1344 goto done;
1347 done:
1348 if (err) {
1349 reftable_log_record_release(log);
1351 reftable_iterator_destroy(&it);
1352 return err;
1355 static int stack_check_addition(struct reftable_stack *st,
1356 const char *new_tab_name)
1358 int err = 0;
1359 struct reftable_block_source src = { NULL };
1360 struct reftable_reader *rd = NULL;
1361 struct reftable_table tab = { NULL };
1362 struct reftable_ref_record *refs = NULL;
1363 struct reftable_iterator it = { NULL };
1364 int cap = 0;
1365 int len = 0;
1366 int i = 0;
1368 if (st->config.skip_name_check)
1369 return 0;
1371 err = reftable_block_source_from_file(&src, new_tab_name);
1372 if (err < 0)
1373 goto done;
1375 err = reftable_new_reader(&rd, &src, new_tab_name);
1376 if (err < 0)
1377 goto done;
1379 err = reftable_reader_seek_ref(rd, &it, "");
1380 if (err > 0) {
1381 err = 0;
1382 goto done;
1384 if (err < 0)
1385 goto done;
1387 while (1) {
1388 struct reftable_ref_record ref = { NULL };
1389 err = reftable_iterator_next_ref(&it, &ref);
1390 if (err > 0)
1391 break;
1392 if (err < 0)
1393 goto done;
1395 REFTABLE_ALLOC_GROW(refs, len + 1, cap);
1396 refs[len++] = ref;
1399 reftable_table_from_merged_table(&tab, reftable_stack_merged_table(st));
1401 err = validate_ref_record_addition(tab, refs, len);
1403 done:
1404 for (i = 0; i < len; i++) {
1405 reftable_ref_record_release(&refs[i]);
1408 free(refs);
1409 reftable_iterator_destroy(&it);
1410 reftable_reader_free(rd);
1411 return err;
/*
 * Return 1 when `s` ends in the extension ".ref" (that is, the text from
 * the last '.' onwards is exactly ".ref"), and 0 otherwise.
 */
static int is_table_name(const char *s)
{
	const char *dot = strrchr(s, '.');
	return dot && !strcmp(dot, ".ref");
}
1420 static void remove_maybe_stale_table(struct reftable_stack *st, uint64_t max,
1421 const char *name)
1423 int err = 0;
1424 uint64_t update_idx = 0;
1425 struct reftable_block_source src = { NULL };
1426 struct reftable_reader *rd = NULL;
1427 struct strbuf table_path = STRBUF_INIT;
1428 stack_filename(&table_path, st, name);
1430 err = reftable_block_source_from_file(&src, table_path.buf);
1431 if (err < 0)
1432 goto done;
1434 err = reftable_new_reader(&rd, &src, name);
1435 if (err < 0)
1436 goto done;
1438 update_idx = reftable_reader_max_update_index(rd);
1439 reftable_reader_free(rd);
1441 if (update_idx <= max) {
1442 unlink(table_path.buf);
1444 done:
1445 strbuf_release(&table_path);
1448 static int reftable_stack_clean_locked(struct reftable_stack *st)
1450 uint64_t max = reftable_merged_table_max_update_index(
1451 reftable_stack_merged_table(st));
1452 DIR *dir = opendir(st->reftable_dir);
1453 struct dirent *d = NULL;
1454 if (!dir) {
1455 return REFTABLE_IO_ERROR;
1458 while ((d = readdir(dir))) {
1459 int i = 0;
1460 int found = 0;
1461 if (!is_table_name(d->d_name))
1462 continue;
1464 for (i = 0; !found && i < st->readers_len; i++) {
1465 found = !strcmp(reader_name(st->readers[i]), d->d_name);
1467 if (found)
1468 continue;
1470 remove_maybe_stale_table(st, max, d->d_name);
1473 closedir(dir);
1474 return 0;
/*
 * Remove leftover table files from the stack directory.
 *
 * A new addition is started first, then the stack is reloaded and
 * reftable_stack_clean_locked() is run. The addition is destroyed on every
 * path before returning. Returns a negative error from any of these steps,
 * or the result of the clean itself.
 */
int reftable_stack_clean(struct reftable_stack *st)
{
	struct reftable_addition *add = NULL;
	int err = reftable_stack_new_addition(&add, st);
	if (err < 0) {
		goto done;
	}

	err = reftable_stack_reload(st);
	if (err < 0) {
		goto done;
	}

	err = reftable_stack_clean_locked(st);

done:
	reftable_addition_destroy(add);
	return err;
}
1497 int reftable_stack_print_directory(const char *stackdir, uint32_t hash_id)
1499 struct reftable_stack *stack = NULL;
1500 struct reftable_write_options cfg = { .hash_id = hash_id };
1501 struct reftable_merged_table *merged = NULL;
1502 struct reftable_table table = { NULL };
1504 int err = reftable_new_stack(&stack, stackdir, cfg);
1505 if (err < 0)
1506 goto done;
1508 merged = reftable_stack_merged_table(stack);
1509 reftable_table_from_merged_table(&table, merged);
1510 err = reftable_table_print(&table);
1511 done:
1512 if (stack)
1513 reftable_stack_destroy(stack);
1514 return err;