2 #include "bundle-uri.h"
5 #include "environment.h"
7 #include "object-store.h"
9 #include "run-command.h"
16 enum bundle_list_heuristic heuristic
;
18 } heuristics
[BUNDLE_HEURISTIC__COUNT
] = {
19 { BUNDLE_HEURISTIC_NONE
, ""},
20 { BUNDLE_HEURISTIC_CREATIONTOKEN
, "creationToken" },
23 static int compare_bundles(const void *hashmap_cmp_fn_data
,
24 const struct hashmap_entry
*he1
,
25 const struct hashmap_entry
*he2
,
28 const struct remote_bundle_info
*e1
=
29 container_of(he1
, const struct remote_bundle_info
, ent
);
30 const struct remote_bundle_info
*e2
=
31 container_of(he2
, const struct remote_bundle_info
, ent
);
33 return strcmp(e1
->id
, id
? (const char *)id
: e2
->id
);
36 void init_bundle_list(struct bundle_list
*list
)
38 memset(list
, 0, sizeof(*list
));
40 /* Implied defaults. */
41 list
->mode
= BUNDLE_MODE_ALL
;
44 hashmap_init(&list
->bundles
, compare_bundles
, NULL
, 0);
47 static int clear_remote_bundle_info(struct remote_bundle_info
*bundle
,
50 FREE_AND_NULL(bundle
->id
);
51 FREE_AND_NULL(bundle
->uri
);
52 FREE_AND_NULL(bundle
->file
);
53 bundle
->unbundled
= 0;
57 void clear_bundle_list(struct bundle_list
*list
)
62 for_all_bundles_in_list(list
, clear_remote_bundle_info
, NULL
);
63 hashmap_clear_and_free(&list
->bundles
, struct remote_bundle_info
, ent
);
67 int for_all_bundles_in_list(struct bundle_list
*list
,
71 struct remote_bundle_info
*info
;
72 struct hashmap_iter i
;
74 hashmap_for_each_entry(&list
->bundles
, &i
, info
, ent
) {
75 int result
= iter(info
, data
);
84 static int summarize_bundle(struct remote_bundle_info
*info
, void *data
)
87 fprintf(fp
, "[bundle \"%s\"]\n", info
->id
);
88 fprintf(fp
, "\turi = %s\n", info
->uri
);
90 if (info
->creationToken
)
91 fprintf(fp
, "\tcreationToken = %"PRIu64
"\n", info
->creationToken
);
95 void print_bundle_list(FILE *fp
, struct bundle_list
*list
)
100 case BUNDLE_MODE_ALL
:
104 case BUNDLE_MODE_ANY
:
108 case BUNDLE_MODE_NONE
:
113 fprintf(fp
, "[bundle]\n");
114 fprintf(fp
, "\tversion = %d\n", list
->version
);
115 fprintf(fp
, "\tmode = %s\n", mode
);
117 if (list
->heuristic
) {
119 for (i
= 0; i
< BUNDLE_HEURISTIC__COUNT
; i
++) {
120 if (heuristics
[i
].heuristic
== list
->heuristic
) {
121 printf("\theuristic = %s\n",
122 heuristics
[list
->heuristic
].name
);
128 for_all_bundles_in_list(list
, summarize_bundle
, fp
);
132 * Given a key-value pair, update the state of the given bundle list.
133 * Returns 0 if the key-value pair is understood. Returns -1 if the key
134 * is not understood or the value is malformed.
136 static int bundle_list_update(const char *key
, const char *value
,
137 struct bundle_list
*list
)
139 struct strbuf id
= STRBUF_INIT
;
140 struct remote_bundle_info lookup
= REMOTE_BUNDLE_INFO_INIT
;
141 struct remote_bundle_info
*bundle
;
142 const char *subsection
, *subkey
;
143 size_t subsection_len
;
145 if (parse_config_key(key
, "bundle", &subsection
, &subsection_len
, &subkey
))
148 if (!subsection_len
) {
149 if (!strcmp(subkey
, "version")) {
151 if (!git_parse_int(value
, &version
))
156 list
->version
= version
;
160 if (!strcmp(subkey
, "mode")) {
161 if (!strcmp(value
, "all"))
162 list
->mode
= BUNDLE_MODE_ALL
;
163 else if (!strcmp(value
, "any"))
164 list
->mode
= BUNDLE_MODE_ANY
;
170 if (!strcmp(subkey
, "heuristic")) {
172 for (i
= 0; i
< BUNDLE_HEURISTIC__COUNT
; i
++) {
173 if (heuristics
[i
].heuristic
&&
174 heuristics
[i
].name
&&
175 !strcmp(value
, heuristics
[i
].name
)) {
176 list
->heuristic
= heuristics
[i
].heuristic
;
181 /* Ignore unknown heuristics. */
185 /* Ignore other unknown global keys. */
189 strbuf_add(&id
, subsection
, subsection_len
);
192 * Check for an existing bundle with this <id>, or create one
196 hashmap_entry_init(&lookup
.ent
, strhash(lookup
.id
));
197 if (!(bundle
= hashmap_get_entry(&list
->bundles
, &lookup
, ent
, NULL
))) {
198 CALLOC_ARRAY(bundle
, 1);
199 bundle
->id
= strbuf_detach(&id
, NULL
);
200 hashmap_entry_init(&bundle
->ent
, strhash(bundle
->id
));
201 hashmap_add(&list
->bundles
, &bundle
->ent
);
205 if (!strcmp(subkey
, "uri")) {
208 bundle
->uri
= relative_url(list
->baseURI
, value
, NULL
);
212 if (!strcmp(subkey
, "creationtoken")) {
213 if (sscanf(value
, "%"PRIu64
, &bundle
->creationToken
) != 1)
214 warning(_("could not parse bundle list key %s with value '%s'"),
215 "creationToken", value
);
220 * At this point, we ignore any information that we don't
221 * understand, assuming it to be hints for a heuristic the client
222 * does not currently understand.
227 static int config_to_bundle_list(const char *key
, const char *value
, void *data
)
229 struct bundle_list
*list
= data
;
230 return bundle_list_update(key
, value
, list
);
233 int bundle_uri_parse_config_format(const char *uri
,
234 const char *filename
,
235 struct bundle_list
*list
)
238 struct config_options opts
= {
239 .error_action
= CONFIG_ERROR_ERROR
,
242 if (!list
->baseURI
) {
243 struct strbuf baseURI
= STRBUF_INIT
;
244 strbuf_addstr(&baseURI
, uri
);
247 * If the URI does not end with a trailing slash, then
248 * remove the filename portion of the path. This is
249 * important for relative URIs.
251 strbuf_strip_file_from_path(&baseURI
);
252 list
->baseURI
= strbuf_detach(&baseURI
, NULL
);
254 result
= git_config_from_file_with_options(config_to_bundle_list
,
258 if (!result
&& list
->mode
== BUNDLE_MODE_NONE
) {
259 warning(_("bundle list at '%s' has no mode"), uri
);
266 static char *find_temp_filename(void)
269 struct strbuf name
= STRBUF_INIT
;
271 * Find a temporary filename that is available. This is briefly
272 * racy, but unlikely to collide.
274 fd
= odb_mkstemp(&name
, "bundles/tmp_uri_XXXXXX");
276 warning(_("failed to create temporary file"));
282 return strbuf_detach(&name
, NULL
);
285 static int download_https_uri_to_file(const char *file
, const char *uri
)
288 struct child_process cp
= CHILD_PROCESS_INIT
;
289 FILE *child_in
= NULL
, *child_out
= NULL
;
290 struct strbuf line
= STRBUF_INIT
;
293 strvec_pushl(&cp
.args
, "git-remote-https", uri
, NULL
);
298 if (start_command(&cp
))
301 child_in
= fdopen(cp
.in
, "w");
307 child_out
= fdopen(cp
.out
, "r");
313 fprintf(child_in
, "capabilities\n");
316 while (!strbuf_getline(&line
, child_out
)) {
319 if (!strcmp(line
.buf
, "get"))
322 strbuf_release(&line
);
325 result
= error(_("insufficient capabilities"));
329 fprintf(child_in
, "get %s %s\n\n", uri
, file
);
334 if (finish_command(&cp
))
341 static int copy_uri_to_file(const char *filename
, const char *uri
)
345 if (starts_with(uri
, "https:") ||
346 starts_with(uri
, "http:"))
347 return download_https_uri_to_file(filename
, uri
);
349 if (skip_prefix(uri
, "file://", &out
))
353 return copy_file(filename
, uri
, 0);
356 static int unbundle_from_file(struct repository
*r
, const char *file
)
360 struct bundle_header header
= BUNDLE_HEADER_INIT
;
361 struct string_list_item
*refname
;
362 struct strbuf bundle_ref
= STRBUF_INIT
;
363 size_t bundle_prefix_len
;
365 if ((bundle_fd
= read_bundle_header(file
, &header
)) < 0)
369 * Skip the reachability walk here, since we will be adding
370 * a reachable ref pointing to the new tips, which will reach
371 * the prerequisite commits.
373 if ((result
= unbundle(r
, &header
, bundle_fd
, NULL
,
374 VERIFY_BUNDLE_QUIET
)))
378 * Convert all refs/heads/ from the bundle into refs/bundles/
379 * in the local repository.
381 strbuf_addstr(&bundle_ref
, "refs/bundles/");
382 bundle_prefix_len
= bundle_ref
.len
;
384 for_each_string_list_item(refname
, &header
.references
) {
385 struct object_id
*oid
= refname
->util
;
386 struct object_id old_oid
;
387 const char *branch_name
;
390 if (!skip_prefix(refname
->string
, "refs/heads/", &branch_name
))
393 strbuf_setlen(&bundle_ref
, bundle_prefix_len
);
394 strbuf_addstr(&bundle_ref
, branch_name
);
396 has_old
= !read_ref(bundle_ref
.buf
, &old_oid
);
397 update_ref("fetched bundle", bundle_ref
.buf
, oid
,
398 has_old
? &old_oid
: NULL
,
399 REF_SKIP_OID_VERIFICATION
,
400 UPDATE_REFS_MSG_ON_ERR
);
403 bundle_header_release(&header
);
407 struct bundle_list_context
{
408 struct repository
*r
;
409 struct bundle_list
*list
;
410 enum bundle_list_mode mode
;
416 * This early declaration is necessary because we use indirect recursion:
418 * While iterating through a bundle list that was downloaded as part
419 * of fetch_bundle_uri_internal(), iterator methods eventually call it
420 * again, but with depth + 1.
422 static int fetch_bundle_uri_internal(struct repository
*r
,
423 struct remote_bundle_info
*bundle
,
425 struct bundle_list
*list
);
427 static int download_bundle_to_file(struct remote_bundle_info
*bundle
, void *data
)
430 struct bundle_list_context
*ctx
= data
;
432 if (ctx
->mode
== BUNDLE_MODE_ANY
&& ctx
->count
)
435 res
= fetch_bundle_uri_internal(ctx
->r
, bundle
, ctx
->depth
+ 1, ctx
->list
);
438 * Only increment count if the download succeeded. If our mode is
439 * BUNDLE_MODE_ANY, then we will want to try other URIs in the
440 * list in case they work instead.
446 * To be as opportunistic as possible, we continue iterating and
447 * download as many bundles as we can, so we can apply the ones
448 * that work, even in BUNDLE_MODE_ALL mode.
453 struct bundles_for_sorting
{
454 struct remote_bundle_info
**items
;
459 static int append_bundle(struct remote_bundle_info
*bundle
, void *data
)
461 struct bundles_for_sorting
*list
= data
;
462 list
->items
[list
->nr
++] = bundle
;
467 * For use in QSORT() to get a list sorted by creationToken
468 * in decreasing order.
470 static int compare_creation_token_decreasing(const void *va
, const void *vb
)
472 const struct remote_bundle_info
* const *a
= va
;
473 const struct remote_bundle_info
* const *b
= vb
;
475 if ((*a
)->creationToken
> (*b
)->creationToken
)
477 if ((*a
)->creationToken
< (*b
)->creationToken
)
482 static int fetch_bundles_by_token(struct repository
*r
,
483 struct bundle_list
*list
)
486 int move_direction
= 0;
487 const char *creationTokenStr
;
488 uint64_t maxCreationToken
= 0, newMaxCreationToken
= 0;
489 struct bundle_list_context ctx
= {
494 struct bundles_for_sorting bundles
= {
495 .alloc
= hashmap_get_size(&list
->bundles
),
498 ALLOC_ARRAY(bundles
.items
, bundles
.alloc
);
500 for_all_bundles_in_list(list
, append_bundle
, &bundles
);
507 QSORT(bundles
.items
, bundles
.nr
, compare_creation_token_decreasing
);
510 * If fetch.bundleCreationToken exists, parses to a uint64_t, and
511 * is not strictly smaller than the maximum creation token in the
512 * bundle list, then do not download any bundles.
514 if (!repo_config_get_value(r
,
515 "fetch.bundlecreationtoken",
516 &creationTokenStr
) &&
517 sscanf(creationTokenStr
, "%"PRIu64
, &maxCreationToken
) == 1 &&
518 bundles
.items
[0]->creationToken
<= maxCreationToken
) {
524 * Attempt to download and unbundle the minimum number of bundles by
525 * creationToken in decreasing order. If we fail to unbundle (after
526 * a successful download) then move to the next non-downloaded bundle
527 * and attempt downloading. Once we succeed in applying a bundle,
528 * move to the previous unapplied bundle and attempt to unbundle it
531 * In the case of a fresh clone, we will likely download all of the
532 * bundles before successfully unbundling the oldest one, then the
533 * rest of the bundles unbundle successfully in increasing order
536 * If there are existing objects, then this process may terminate
537 * early when all required commits from "new" bundles exist in the
538 * repo's object store.
541 while (cur
>= 0 && cur
< bundles
.nr
) {
542 struct remote_bundle_info
*bundle
= bundles
.items
[cur
];
545 * If we need to dig into bundles below the previous
546 * creation token value, then likely we are in an erroneous
547 * state due to missing or invalid bundles. Halt the process
548 * instead of continuing to download extra data.
550 if (bundle
->creationToken
<= maxCreationToken
)
555 * Not downloaded yet. Try downloading.
557 * Note that bundle->file is non-NULL if a download
558 * was attempted, even if it failed to download.
560 if (fetch_bundle_uri_internal(ctx
.r
, bundle
, ctx
.depth
+ 1, ctx
.list
)) {
561 /* Mark as unbundled so we do not retry. */
562 bundle
->unbundled
= 1;
564 /* Try looking deeper in the list. */
569 /* We expect bundles when using creationTokens. */
570 if (!is_bundle(bundle
->file
, 1)) {
571 warning(_("file downloaded from '%s' is not a bundle"),
577 if (bundle
->file
&& !bundle
->unbundled
) {
579 * This was downloaded, but not successfully
580 * unbundled. Try unbundling again.
582 if (unbundle_from_file(ctx
.r
, bundle
->file
)) {
583 /* Try looking deeper in the list. */
587 * Succeeded in unbundle. Retry bundles
588 * that previously failed to unbundle.
591 bundle
->unbundled
= 1;
593 if (bundle
->creationToken
> newMaxCreationToken
)
594 newMaxCreationToken
= bundle
->creationToken
;
599 * Else case: downloaded and unbundled successfully.
600 * Skip this by moving in the same direction as the
605 /* Move in the specified direction and repeat. */
606 cur
+= move_direction
;
610 * We succeed if the loop terminates because 'cur' drops below
611 * zero. The other case is that we terminate because 'cur'
612 * reaches the end of the list, so we have a failure no matter
613 * which bundles we apply from the list.
616 struct strbuf value
= STRBUF_INIT
;
617 strbuf_addf(&value
, "%"PRIu64
"", newMaxCreationToken
);
618 if (repo_config_set_multivar_gently(ctx
.r
,
619 "fetch.bundleCreationToken",
621 warning(_("failed to store maximum creation token"));
623 strbuf_release(&value
);
630 static int download_bundle_list(struct repository
*r
,
631 struct bundle_list
*local_list
,
632 struct bundle_list
*global_list
,
635 struct bundle_list_context ctx
= {
639 .mode
= local_list
->mode
,
642 return for_all_bundles_in_list(local_list
, download_bundle_to_file
, &ctx
);
645 static int fetch_bundle_list_in_config_format(struct repository
*r
,
646 struct bundle_list
*global_list
,
647 struct remote_bundle_info
*bundle
,
651 struct bundle_list list_from_bundle
;
653 init_bundle_list(&list_from_bundle
);
655 if ((result
= bundle_uri_parse_config_format(bundle
->uri
,
660 if (list_from_bundle
.mode
== BUNDLE_MODE_NONE
) {
661 warning(_("unrecognized bundle mode from URI '%s'"),
668 * If this list uses the creationToken heuristic, then the URIs
669 * it advertises are expected to be bundles, not nested lists.
670 * We can drop 'global_list' and 'depth'.
672 if (list_from_bundle
.heuristic
== BUNDLE_HEURISTIC_CREATIONTOKEN
) {
673 result
= fetch_bundles_by_token(r
, &list_from_bundle
);
674 global_list
->heuristic
= BUNDLE_HEURISTIC_CREATIONTOKEN
;
675 } else if ((result
= download_bundle_list(r
, &list_from_bundle
,
676 global_list
, depth
)))
680 clear_bundle_list(&list_from_bundle
);
685 * This limits the recursion on fetch_bundle_uri_internal() when following
688 static int max_bundle_uri_depth
= 4;
691 * Recursively download all bundles advertised at the given URI
692 * to files. If the file is a bundle, then add it to the given
693 * 'list'. Otherwise, expect a bundle list and recurse on the
694 * URIs in that list according to the list mode (ANY or ALL).
696 static int fetch_bundle_uri_internal(struct repository
*r
,
697 struct remote_bundle_info
*bundle
,
699 struct bundle_list
*list
)
702 struct remote_bundle_info
*bcopy
;
704 if (depth
>= max_bundle_uri_depth
) {
705 warning(_("exceeded bundle URI recursion limit (%d)"),
706 max_bundle_uri_depth
);
711 !(bundle
->file
= find_temp_filename())) {
716 if ((result
= copy_uri_to_file(bundle
->file
, bundle
->uri
))) {
717 warning(_("failed to download bundle from URI '%s'"), bundle
->uri
);
721 if ((result
= !is_bundle(bundle
->file
, 1))) {
722 result
= fetch_bundle_list_in_config_format(
723 r
, list
, bundle
, depth
);
725 warning(_("file at URI '%s' is not a bundle or bundle list"),
730 /* Copy the bundle and insert it into the global list. */
731 CALLOC_ARRAY(bcopy
, 1);
732 bcopy
->id
= xstrdup(bundle
->id
);
733 bcopy
->file
= xstrdup(bundle
->file
);
734 hashmap_entry_init(&bcopy
->ent
, strhash(bcopy
->id
));
735 hashmap_add(&list
->bundles
, &bcopy
->ent
);
738 if (result
&& bundle
->file
)
739 unlink(bundle
->file
);
744 * This loop iterator breaks the loop with nonzero return code on the
745 * first successful unbundling of a bundle.
747 static int attempt_unbundle(struct remote_bundle_info
*info
, void *data
)
749 struct repository
*r
= data
;
751 if (!info
->file
|| info
->unbundled
)
754 if (!unbundle_from_file(r
, info
->file
)) {
762 static int unbundle_all_bundles(struct repository
*r
,
763 struct bundle_list
*list
)
766 * Iterate through all bundles looking for ones that can
767 * successfully unbundle. If any succeed, then perhaps another
768 * will succeed in the next attempt.
770 * Keep in mind that a non-zero result for the loop here means
771 * the loop terminated early on a successful unbundling, which
772 * signals that we can try again.
774 while (for_all_bundles_in_list(list
, attempt_unbundle
, r
)) ;
779 static int unlink_bundle(struct remote_bundle_info
*info
, void *data
)
782 unlink_or_warn(info
->file
);
786 int fetch_bundle_uri(struct repository
*r
, const char *uri
,
790 struct bundle_list list
;
791 struct remote_bundle_info bundle
= {
796 init_bundle_list(&list
);
798 /* If a bundle is added to this global list, then it is required. */
799 list
.mode
= BUNDLE_MODE_ALL
;
801 if ((result
= fetch_bundle_uri_internal(r
, &bundle
, 0, &list
)))
804 result
= unbundle_all_bundles(r
, &list
);
808 *has_heuristic
= (list
.heuristic
!= BUNDLE_HEURISTIC_NONE
);
809 for_all_bundles_in_list(&list
, unlink_bundle
, NULL
);
810 clear_bundle_list(&list
);
811 clear_remote_bundle_info(&bundle
, NULL
);
815 int fetch_bundle_list(struct repository
*r
, struct bundle_list
*list
)
818 struct bundle_list global_list
;
821 * If the creationToken heuristic is used, then the URIs
822 * advertised by 'list' are not nested lists and instead
823 * direct bundles. We do not need to use global_list.
825 if (list
->heuristic
== BUNDLE_HEURISTIC_CREATIONTOKEN
)
826 return fetch_bundles_by_token(r
, list
);
828 init_bundle_list(&global_list
);
830 /* If a bundle is added to this global list, then it is required. */
831 global_list
.mode
= BUNDLE_MODE_ALL
;
833 if ((result
= download_bundle_list(r
, list
, &global_list
, 0)))
836 if (list
->heuristic
== BUNDLE_HEURISTIC_CREATIONTOKEN
)
837 result
= fetch_bundles_by_token(r
, list
);
839 result
= unbundle_all_bundles(r
, &global_list
);
842 for_all_bundles_in_list(&global_list
, unlink_bundle
, NULL
);
843 clear_bundle_list(&global_list
);
851 int bundle_uri_advertise(struct repository
*r
, struct strbuf
*value UNUSED
)
853 static int advertise_bundle_uri
= -1;
855 if (advertise_bundle_uri
!= -1)
858 advertise_bundle_uri
= 0;
859 repo_config_get_maybe_bool(r
, "uploadpack.advertisebundleuris", &advertise_bundle_uri
);
862 return advertise_bundle_uri
;
865 static int config_to_packet_line(const char *key
, const char *value
, void *data
)
867 struct packet_reader
*writer
= data
;
869 if (starts_with(key
, "bundle."))
870 packet_write_fmt(writer
->fd
, "%s=%s", key
, value
);
875 int bundle_uri_command(struct repository
*r
,
876 struct packet_reader
*request
)
878 struct packet_writer writer
;
879 packet_writer_init(&writer
, 1);
881 while (packet_reader_read(request
) == PACKET_READ_NORMAL
)
882 die(_("bundle-uri: unexpected argument: '%s'"), request
->line
);
883 if (request
->status
!= PACKET_READ_FLUSH
)
884 die(_("bundle-uri: expected flush after arguments"));
887 * Read all "bundle.*" config lines to the client as key=value
890 repo_config(r
, config_to_packet_line
, &writer
);
892 packet_writer_flush(&writer
);
898 * General API for {transport,connect}.c etc.
900 int bundle_uri_parse_line(struct bundle_list
*list
, const char *line
)
904 struct strbuf key
= STRBUF_INIT
;
907 return error(_("bundle-uri: got an empty line"));
909 equals
= strchr(line
, '=');
912 return error(_("bundle-uri: line is not of the form 'key=value'"));
913 if (line
== equals
|| !*(equals
+ 1))
914 return error(_("bundle-uri: line has empty key or value"));
916 strbuf_add(&key
, line
, equals
- line
);
917 result
= bundle_list_update(key
.buf
, equals
+ 1, list
);
918 strbuf_release(&key
);