2 Copyright 2020 Google LLC
4 Use of this source code is governed by a BSD-style
5 license that can be found in the LICENSE file or at
6 https://developers.google.com/open-source/licenses/bsd
11 #include "constants.h"
16 #include "reftable-merged.h"
17 #include "reftable-error.h"
20 struct merged_subiter
{
21 struct reftable_iterator iter
;
22 struct reftable_record rec
;
26 struct merged_subiter
*subiters
;
27 struct merged_iter_pqueue pq
;
31 int suppress_deletions
;
32 ssize_t advance_index
;
35 static int merged_iter_init(struct merged_iter
*mi
)
37 for (size_t i
= 0; i
< mi
->stack_len
; i
++) {
40 .rec
= &mi
->subiters
[i
].rec
,
44 reftable_record_init(&mi
->subiters
[i
].rec
, mi
->typ
);
45 err
= iterator_next(&mi
->subiters
[i
].iter
,
46 &mi
->subiters
[i
].rec
);
52 merged_iter_pqueue_add(&mi
->pq
, &e
);
58 static void merged_iter_close(void *p
)
60 struct merged_iter
*mi
= p
;
62 merged_iter_pqueue_release(&mi
->pq
);
63 for (size_t i
= 0; i
< mi
->stack_len
; i
++) {
64 reftable_iterator_destroy(&mi
->subiters
[i
].iter
);
65 reftable_record_release(&mi
->subiters
[i
].rec
);
67 reftable_free(mi
->subiters
);
70 static int merged_iter_advance_subiter(struct merged_iter
*mi
, size_t idx
)
74 .rec
= &mi
->subiters
[idx
].rec
,
78 err
= iterator_next(&mi
->subiters
[idx
].iter
, &mi
->subiters
[idx
].rec
);
82 merged_iter_pqueue_add(&mi
->pq
, &e
);
86 static int merged_iter_next_entry(struct merged_iter
*mi
,
87 struct reftable_record
*rec
)
89 struct pq_entry entry
= { 0 };
92 if (mi
->advance_index
>= 0) {
93 err
= merged_iter_advance_subiter(mi
, mi
->advance_index
);
96 mi
->advance_index
= -1;
99 if (merged_iter_pqueue_is_empty(mi
->pq
))
102 entry
= merged_iter_pqueue_remove(&mi
->pq
);
105 One can also use reftable as datacenter-local storage, where the ref
106 database is maintained in globally consistent database (eg.
107 CockroachDB or Spanner). In this scenario, replication delays together
108 with compaction may cause newer tables to contain older entries. In
109 such a deployment, the loop below must be changed to collect all
110 entries for the same key, and return new the newest one.
112 while (!merged_iter_pqueue_is_empty(mi
->pq
)) {
113 struct pq_entry top
= merged_iter_pqueue_top(mi
->pq
);
116 cmp
= reftable_record_cmp(top
.rec
, entry
.rec
);
120 merged_iter_pqueue_remove(&mi
->pq
);
121 err
= merged_iter_advance_subiter(mi
, top
.index
);
126 mi
->advance_index
= entry
.index
;
127 SWAP(*rec
, *entry
.rec
);
131 static int merged_iter_next(struct merged_iter
*mi
, struct reftable_record
*rec
)
134 int err
= merged_iter_next_entry(mi
, rec
);
135 if (err
== 0 && mi
->suppress_deletions
&&
136 reftable_record_is_deletion(rec
)) {
144 static int merged_iter_next_void(void *p
, struct reftable_record
*rec
)
146 struct merged_iter
*mi
= p
;
147 if (merged_iter_pqueue_is_empty(mi
->pq
) && mi
->advance_index
< 0)
149 return merged_iter_next(mi
, rec
);
152 static struct reftable_iterator_vtable merged_iter_vtable
= {
153 .next
= &merged_iter_next_void
,
154 .close
= &merged_iter_close
,
157 static void iterator_from_merged_iter(struct reftable_iterator
*it
,
158 struct merged_iter
*mi
)
162 it
->ops
= &merged_iter_vtable
;
165 int reftable_new_merged_table(struct reftable_merged_table
**dest
,
166 struct reftable_table
*stack
, size_t n
,
169 struct reftable_merged_table
*m
= NULL
;
170 uint64_t last_max
= 0;
171 uint64_t first_min
= 0;
173 for (size_t i
= 0; i
< n
; i
++) {
174 uint64_t min
= reftable_table_min_update_index(&stack
[i
]);
175 uint64_t max
= reftable_table_max_update_index(&stack
[i
]);
177 if (reftable_table_hash_id(&stack
[i
]) != hash_id
) {
178 return REFTABLE_FORMAT_ERROR
;
180 if (i
== 0 || min
< first_min
) {
183 if (i
== 0 || max
> last_max
) {
188 REFTABLE_CALLOC_ARRAY(m
, 1);
193 m
->hash_id
= hash_id
;
198 /* clears the list of subtable, without affecting the readers themselves. */
199 void merged_table_release(struct reftable_merged_table
*mt
)
201 FREE_AND_NULL(mt
->stack
);
205 void reftable_merged_table_free(struct reftable_merged_table
*mt
)
210 merged_table_release(mt
);
215 reftable_merged_table_max_update_index(struct reftable_merged_table
*mt
)
221 reftable_merged_table_min_update_index(struct reftable_merged_table
*mt
)
226 static int reftable_table_seek_record(struct reftable_table
*tab
,
227 struct reftable_iterator
*it
,
228 struct reftable_record
*rec
)
230 return tab
->ops
->seek_record(tab
->table_arg
, it
, rec
);
233 static int merged_table_seek_record(struct reftable_merged_table
*mt
,
234 struct reftable_iterator
*it
,
235 struct reftable_record
*rec
)
237 struct merged_iter merged
= {
238 .typ
= reftable_record_type(rec
),
239 .hash_id
= mt
->hash_id
,
240 .suppress_deletions
= mt
->suppress_deletions
,
243 struct merged_iter
*p
;
246 REFTABLE_CALLOC_ARRAY(merged
.subiters
, mt
->stack_len
);
247 for (size_t i
= 0; i
< mt
->stack_len
; i
++) {
248 err
= reftable_table_seek_record(&mt
->stack
[i
],
249 &merged
.subiters
[merged
.stack_len
].iter
, rec
);
256 err
= merged_iter_init(&merged
);
260 p
= reftable_malloc(sizeof(struct merged_iter
));
262 iterator_from_merged_iter(it
, p
);
266 merged_iter_close(&merged
);
270 int reftable_merged_table_seek_ref(struct reftable_merged_table
*mt
,
271 struct reftable_iterator
*it
,
274 struct reftable_record rec
= {
275 .type
= BLOCK_TYPE_REF
,
277 .refname
= (char *)name
,
280 return merged_table_seek_record(mt
, it
, &rec
);
283 int reftable_merged_table_seek_log_at(struct reftable_merged_table
*mt
,
284 struct reftable_iterator
*it
,
285 const char *name
, uint64_t update_index
)
287 struct reftable_record rec
= { .type
= BLOCK_TYPE_LOG
,
289 .refname
= (char *)name
,
290 .update_index
= update_index
,
292 return merged_table_seek_record(mt
, it
, &rec
);
295 int reftable_merged_table_seek_log(struct reftable_merged_table
*mt
,
296 struct reftable_iterator
*it
,
299 uint64_t max
= ~((uint64_t)0);
300 return reftable_merged_table_seek_log_at(mt
, it
, name
, max
);
303 uint32_t reftable_merged_table_hash_id(struct reftable_merged_table
*mt
)
308 static int reftable_merged_table_seek_void(void *tab
,
309 struct reftable_iterator
*it
,
310 struct reftable_record
*rec
)
312 return merged_table_seek_record(tab
, it
, rec
);
315 static uint32_t reftable_merged_table_hash_id_void(void *tab
)
317 return reftable_merged_table_hash_id(tab
);
320 static uint64_t reftable_merged_table_min_update_index_void(void *tab
)
322 return reftable_merged_table_min_update_index(tab
);
325 static uint64_t reftable_merged_table_max_update_index_void(void *tab
)
327 return reftable_merged_table_max_update_index(tab
);
330 static struct reftable_table_vtable merged_table_vtable
= {
331 .seek_record
= reftable_merged_table_seek_void
,
332 .hash_id
= reftable_merged_table_hash_id_void
,
333 .min_update_index
= reftable_merged_table_min_update_index_void
,
334 .max_update_index
= reftable_merged_table_max_update_index_void
,
337 void reftable_table_from_merged_table(struct reftable_table
*tab
,
338 struct reftable_merged_table
*merged
)
341 tab
->ops
= &merged_table_vtable
;
342 tab
->table_arg
= merged
;