Merge branch 'ab/sequencer-unleak'
[git/debian.git] / submodule.c
blob3a0dfc417c05b627a5100f518768a1b32ee22339
2 #include "cache.h"
3 #include "repository.h"
4 #include "config.h"
5 #include "submodule-config.h"
6 #include "submodule.h"
7 #include "dir.h"
8 #include "diff.h"
9 #include "commit.h"
10 #include "revision.h"
11 #include "run-command.h"
12 #include "diffcore.h"
13 #include "refs.h"
14 #include "string-list.h"
15 #include "oid-array.h"
16 #include "strvec.h"
17 #include "blob.h"
18 #include "thread-utils.h"
19 #include "quote.h"
20 #include "remote.h"
21 #include "worktree.h"
22 #include "parse-options.h"
23 #include "object-store.h"
24 #include "commit-reach.h"
25 #include "shallow.h"
27 static int config_update_recurse_submodules = RECURSE_SUBMODULES_OFF;
28 static int initialized_fetch_ref_tips;
29 static struct oid_array ref_tips_before_fetch;
30 static struct oid_array ref_tips_after_fetch;
33 * Check if the .gitmodules file is unmerged. Parsing of the .gitmodules file
34 * will be disabled because we can't guess what might be configured in
35 * .gitmodules unless the user resolves the conflict.
37 int is_gitmodules_unmerged(struct index_state *istate)
39 int pos = index_name_pos(istate, GITMODULES_FILE, strlen(GITMODULES_FILE));
40 if (pos < 0) { /* .gitmodules not found or isn't merged */
41 pos = -1 - pos;
42 if (istate->cache_nr > pos) { /* there is a .gitmodules */
43 const struct cache_entry *ce = istate->cache[pos];
44 if (ce_namelen(ce) == strlen(GITMODULES_FILE) &&
45 !strcmp(ce->name, GITMODULES_FILE))
46 return 1;
50 return 0;
54 * Check if the .gitmodules file is safe to write.
56 * Writing to the .gitmodules file requires that the file exists in the
57 * working tree or, if it doesn't, that a brand new .gitmodules file is going
58 * to be created (i.e. it's neither in the index nor in the current branch).
60 * It is not safe to write to .gitmodules if it's not in the working tree but
61 * it is in the index or in the current branch, because writing new values
62 * (and staging them) would blindly overwrite ALL the old content.
64 int is_writing_gitmodules_ok(void)
66 struct object_id oid;
67 return file_exists(GITMODULES_FILE) ||
68 (get_oid(GITMODULES_INDEX, &oid) < 0 && get_oid(GITMODULES_HEAD, &oid) < 0);
72 * Check if the .gitmodules file has unstaged modifications. This must be
73 * checked before allowing modifications to the .gitmodules file with the
74 * intention to stage them later, because when continuing we would stage the
75 * modifications the user didn't stage herself too. That might change in a
76 * future version when we learn to stage the changes we do ourselves without
77 * staging any previous modifications.
79 int is_staging_gitmodules_ok(struct index_state *istate)
81 int pos = index_name_pos(istate, GITMODULES_FILE, strlen(GITMODULES_FILE));
83 if ((pos >= 0) && (pos < istate->cache_nr)) {
84 struct stat st;
85 if (lstat(GITMODULES_FILE, &st) == 0 &&
86 ie_modified(istate, istate->cache[pos], &st, 0) & DATA_CHANGED)
87 return 0;
90 return 1;
93 static int for_each_remote_ref_submodule(const char *submodule,
94 each_ref_fn fn, void *cb_data)
96 return refs_for_each_remote_ref(get_submodule_ref_store(submodule),
97 fn, cb_data);
101 * Try to update the "path" entry in the "submodule.<name>" section of the
102 * .gitmodules file. Return 0 only if a .gitmodules file was found, a section
103 * with the correct path=<oldpath> setting was found and we could update it.
105 int update_path_in_gitmodules(const char *oldpath, const char *newpath)
107 struct strbuf entry = STRBUF_INIT;
108 const struct submodule *submodule;
109 int ret;
111 if (!file_exists(GITMODULES_FILE)) /* Do nothing without .gitmodules */
112 return -1;
114 if (is_gitmodules_unmerged(the_repository->index))
115 die(_("Cannot change unmerged .gitmodules, resolve merge conflicts first"));
117 submodule = submodule_from_path(the_repository, null_oid(), oldpath);
118 if (!submodule || !submodule->name) {
119 warning(_("Could not find section in .gitmodules where path=%s"), oldpath);
120 return -1;
122 strbuf_addstr(&entry, "submodule.");
123 strbuf_addstr(&entry, submodule->name);
124 strbuf_addstr(&entry, ".path");
125 ret = config_set_in_gitmodules_file_gently(entry.buf, newpath);
126 strbuf_release(&entry);
127 return ret;
131 * Try to remove the "submodule.<name>" section from .gitmodules where the given
132 * path is configured. Return 0 only if a .gitmodules file was found, a section
133 * with the correct path=<path> setting was found and we could remove it.
135 int remove_path_from_gitmodules(const char *path)
137 struct strbuf sect = STRBUF_INIT;
138 const struct submodule *submodule;
140 if (!file_exists(GITMODULES_FILE)) /* Do nothing without .gitmodules */
141 return -1;
143 if (is_gitmodules_unmerged(the_repository->index))
144 die(_("Cannot change unmerged .gitmodules, resolve merge conflicts first"));
146 submodule = submodule_from_path(the_repository, null_oid(), path);
147 if (!submodule || !submodule->name) {
148 warning(_("Could not find section in .gitmodules where path=%s"), path);
149 return -1;
151 strbuf_addstr(&sect, "submodule.");
152 strbuf_addstr(&sect, submodule->name);
153 if (git_config_rename_section_in_file(GITMODULES_FILE, sect.buf, NULL) < 0) {
154 /* Maybe the user already did that, don't error out here */
155 warning(_("Could not remove .gitmodules entry for %s"), path);
156 strbuf_release(&sect);
157 return -1;
159 strbuf_release(&sect);
160 return 0;
163 void stage_updated_gitmodules(struct index_state *istate)
165 if (add_file_to_index(istate, GITMODULES_FILE, 0))
166 die(_("staging updated .gitmodules failed"));
169 static struct string_list added_submodule_odb_paths = STRING_LIST_INIT_NODUP;
171 void add_submodule_odb_by_path(const char *path)
173 string_list_insert(&added_submodule_odb_paths, xstrdup(path));
176 int register_all_submodule_odb_as_alternates(void)
178 int i;
179 int ret = added_submodule_odb_paths.nr;
181 for (i = 0; i < added_submodule_odb_paths.nr; i++)
182 add_to_alternates_memory(added_submodule_odb_paths.items[i].string);
183 if (ret) {
184 string_list_clear(&added_submodule_odb_paths, 0);
185 trace2_data_intmax("submodule", the_repository,
186 "register_all_submodule_odb_as_alternates/registered", ret);
187 if (git_env_bool("GIT_TEST_FATAL_REGISTER_SUBMODULE_ODB", 0))
188 BUG("register_all_submodule_odb_as_alternates() called");
190 return ret;
193 void set_diffopt_flags_from_submodule_config(struct diff_options *diffopt,
194 const char *path)
196 const struct submodule *submodule = submodule_from_path(the_repository,
197 null_oid(),
198 path);
199 if (submodule) {
200 const char *ignore;
201 char *key;
203 key = xstrfmt("submodule.%s.ignore", submodule->name);
204 if (repo_config_get_string_tmp(the_repository, key, &ignore))
205 ignore = submodule->ignore;
206 free(key);
208 if (ignore)
209 handle_ignore_submodules_arg(diffopt, ignore);
210 else if (is_gitmodules_unmerged(the_repository->index))
211 diffopt->flags.ignore_submodules = 1;
215 /* Cheap function that only determines if we're interested in submodules at all */
216 int git_default_submodule_config(const char *var, const char *value,
217 void *cb UNUSED)
219 if (!strcmp(var, "submodule.recurse")) {
220 int v = git_config_bool(var, value) ?
221 RECURSE_SUBMODULES_ON : RECURSE_SUBMODULES_OFF;
222 config_update_recurse_submodules = v;
224 return 0;
227 int option_parse_recurse_submodules_worktree_updater(const struct option *opt,
228 const char *arg, int unset)
230 if (unset) {
231 config_update_recurse_submodules = RECURSE_SUBMODULES_OFF;
232 return 0;
234 if (arg)
235 config_update_recurse_submodules =
236 parse_update_recurse_submodules_arg(opt->long_name,
237 arg);
238 else
239 config_update_recurse_submodules = RECURSE_SUBMODULES_ON;
241 return 0;
245 * Determine if a submodule has been initialized at a given 'path'
248 * NEEDSWORK: Emit a warning if submodule.active exists, but is valueless,
249 * ie, the config looks like: "[submodule] active\n".
250 * Since that is an invalid pathspec, we should inform the user.
252 int is_tree_submodule_active(struct repository *repo,
253 const struct object_id *treeish_name,
254 const char *path)
256 int ret = 0;
257 char *key = NULL;
258 char *value = NULL;
259 const struct string_list *sl;
260 const struct submodule *module;
262 module = submodule_from_path(repo, treeish_name, path);
264 /* early return if there isn't a path->module mapping */
265 if (!module)
266 return 0;
268 /* submodule.<name>.active is set */
269 key = xstrfmt("submodule.%s.active", module->name);
270 if (!repo_config_get_bool(repo, key, &ret)) {
271 free(key);
272 return ret;
274 free(key);
276 /* submodule.active is set */
277 sl = repo_config_get_value_multi(repo, "submodule.active");
278 if (sl) {
279 struct pathspec ps;
280 struct strvec args = STRVEC_INIT;
281 const struct string_list_item *item;
283 for_each_string_list_item(item, sl) {
284 strvec_push(&args, item->string);
287 parse_pathspec(&ps, 0, 0, NULL, args.v);
288 ret = match_pathspec(repo->index, &ps, path, strlen(path), 0, NULL, 1);
290 strvec_clear(&args);
291 clear_pathspec(&ps);
292 return ret;
295 /* fallback to checking if the URL is set */
296 key = xstrfmt("submodule.%s.url", module->name);
297 ret = !repo_config_get_string(repo, key, &value);
299 free(value);
300 free(key);
301 return ret;
/*
 * Convenience wrapper around is_tree_submodule_active() that passes
 * null_oid() as the treeish.
 */
int is_submodule_active(struct repository *repo, const char *path)
{
	const struct object_id *no_treeish = null_oid();

	return is_tree_submodule_active(repo, no_treeish, path);
}
/*
 * Check whether "<path>/.git" resolves to a git directory.
 *
 * 'return_error_code' is handed to resolve_gitdir_gently() unchanged.
 * Returns 1 if that call yields a non-NULL result, 0 otherwise.
 */
int is_submodule_populated_gently(const char *path, int *return_error_code)
{
	char *dotgit = xstrfmt("%s/.git", path);
	int populated = !!resolve_gitdir_gently(dotgit, return_error_code);

	free(dotgit);
	return populated;
}
322 * Dies if the provided 'prefix' corresponds to an unpopulated submodule
324 void die_in_unpopulated_submodule(struct index_state *istate,
325 const char *prefix)
327 int i, prefixlen;
329 if (!prefix)
330 return;
332 prefixlen = strlen(prefix);
334 for (i = 0; i < istate->cache_nr; i++) {
335 struct cache_entry *ce = istate->cache[i];
336 int ce_len = ce_namelen(ce);
338 if (!S_ISGITLINK(ce->ce_mode))
339 continue;
340 if (prefixlen <= ce_len)
341 continue;
342 if (strncmp(ce->name, prefix, ce_len))
343 continue;
344 if (prefix[ce_len] != '/')
345 continue;
347 die(_("in unpopulated submodule '%s'"), ce->name);
352 * Dies if any paths in the provided pathspec descends into a submodule
354 void die_path_inside_submodule(struct index_state *istate,
355 const struct pathspec *ps)
357 int i, j;
359 for (i = 0; i < istate->cache_nr; i++) {
360 struct cache_entry *ce = istate->cache[i];
361 int ce_len = ce_namelen(ce);
363 if (!S_ISGITLINK(ce->ce_mode))
364 continue;
366 for (j = 0; j < ps->nr ; j++) {
367 const struct pathspec_item *item = &ps->items[j];
369 if (item->len <= ce_len)
370 continue;
371 if (item->match[ce_len] != '/')
372 continue;
373 if (strncmp(ce->name, item->match, ce_len))
374 continue;
375 if (item->len == ce_len + 1)
376 continue;
378 die(_("Pathspec '%s' is in submodule '%.*s'"),
379 item->original, ce_len, ce->name);
384 enum submodule_update_type parse_submodule_update_type(const char *value)
386 if (!strcmp(value, "none"))
387 return SM_UPDATE_NONE;
388 else if (!strcmp(value, "checkout"))
389 return SM_UPDATE_CHECKOUT;
390 else if (!strcmp(value, "rebase"))
391 return SM_UPDATE_REBASE;
392 else if (!strcmp(value, "merge"))
393 return SM_UPDATE_MERGE;
394 else if (*value == '!')
395 return SM_UPDATE_COMMAND;
396 else
397 return SM_UPDATE_UNSPECIFIED;
400 int parse_submodule_update_strategy(const char *value,
401 struct submodule_update_strategy *dst)
403 enum submodule_update_type type;
405 free((void*)dst->command);
406 dst->command = NULL;
408 type = parse_submodule_update_type(value);
409 if (type == SM_UPDATE_UNSPECIFIED)
410 return -1;
412 dst->type = type;
413 if (type == SM_UPDATE_COMMAND)
414 dst->command = xstrdup(value + 1);
416 return 0;
419 const char *submodule_update_type_to_string(enum submodule_update_type type)
421 switch (type) {
422 case SM_UPDATE_CHECKOUT:
423 return "checkout";
424 case SM_UPDATE_MERGE:
425 return "merge";
426 case SM_UPDATE_REBASE:
427 return "rebase";
428 case SM_UPDATE_NONE:
429 return "none";
430 case SM_UPDATE_UNSPECIFIED:
431 case SM_UPDATE_COMMAND:
432 BUG("init_submodule() should handle type %d", type);
433 default:
434 BUG("unexpected update strategy type: %d", type);
438 void handle_ignore_submodules_arg(struct diff_options *diffopt,
439 const char *arg)
441 diffopt->flags.ignore_submodule_set = 1;
442 diffopt->flags.ignore_submodules = 0;
443 diffopt->flags.ignore_untracked_in_submodules = 0;
444 diffopt->flags.ignore_dirty_submodules = 0;
446 if (!strcmp(arg, "all"))
447 diffopt->flags.ignore_submodules = 1;
448 else if (!strcmp(arg, "untracked"))
449 diffopt->flags.ignore_untracked_in_submodules = 1;
450 else if (!strcmp(arg, "dirty"))
451 diffopt->flags.ignore_dirty_submodules = 1;
452 else if (strcmp(arg, "none"))
453 die(_("bad --ignore-submodules argument: %s"), arg);
455 * Please update _git_status() in git-completion.bash when you
456 * add new options
460 static int prepare_submodule_diff_summary(struct repository *r, struct rev_info *rev,
461 const char *path,
462 struct commit *left, struct commit *right,
463 struct commit_list *merge_bases)
465 struct commit_list *list;
467 repo_init_revisions(r, rev, NULL);
468 setup_revisions(0, NULL, rev, NULL);
469 rev->left_right = 1;
470 rev->first_parent_only = 1;
471 left->object.flags |= SYMMETRIC_LEFT;
472 add_pending_object(rev, &left->object, path);
473 add_pending_object(rev, &right->object, path);
474 for (list = merge_bases; list; list = list->next) {
475 list->item->object.flags |= UNINTERESTING;
476 add_pending_object(rev, &list->item->object,
477 oid_to_hex(&list->item->object.oid));
479 return prepare_revision_walk(rev);
482 static void print_submodule_diff_summary(struct repository *r, struct rev_info *rev, struct diff_options *o)
484 static const char format[] = " %m %s";
485 struct strbuf sb = STRBUF_INIT;
486 struct commit *commit;
488 while ((commit = get_revision(rev))) {
489 struct pretty_print_context ctx = {0};
490 ctx.date_mode = rev->date_mode;
491 ctx.output_encoding = get_log_output_encoding();
492 strbuf_setlen(&sb, 0);
493 repo_format_commit_message(r, commit, format, &sb,
494 &ctx);
495 strbuf_addch(&sb, '\n');
496 if (commit->object.flags & SYMMETRIC_LEFT)
497 diff_emit_submodule_del(o, sb.buf);
498 else
499 diff_emit_submodule_add(o, sb.buf);
501 strbuf_release(&sb);
504 void prepare_submodule_repo_env(struct strvec *out)
506 prepare_other_repo_env(out, DEFAULT_GIT_DIR_ENVIRONMENT);
/*
 * Like prepare_submodule_repo_env(), but passes "." as the second
 * argument of prepare_other_repo_env().
 */
static void prepare_submodule_repo_env_in_gitdir(struct strvec *out)
{
	const char *git_dir = ".";

	prepare_other_repo_env(out, git_dir);
}
515 * Initialize a repository struct for a submodule based on the provided 'path'.
517 * Returns the repository struct on success,
518 * NULL when the submodule is not present.
520 static struct repository *open_submodule(const char *path)
522 struct strbuf sb = STRBUF_INIT;
523 struct repository *out = xmalloc(sizeof(*out));
525 if (submodule_to_gitdir(&sb, path) || repo_init(out, sb.buf, NULL)) {
526 strbuf_release(&sb);
527 free(out);
528 return NULL;
531 /* Mark it as a submodule */
532 out->submodule_prefix = xstrdup(path);
534 strbuf_release(&sb);
535 return out;
539 * Helper function to display the submodule header line prior to the full
540 * summary output.
542 * If it can locate the submodule git directory it will create a repository
543 * handle for the submodule and lookup both the left and right commits and
544 * put them into the left and right pointers.
546 static void show_submodule_header(struct diff_options *o,
547 const char *path,
548 struct object_id *one, struct object_id *two,
549 unsigned dirty_submodule,
550 struct repository *sub,
551 struct commit **left, struct commit **right,
552 struct commit_list **merge_bases)
554 const char *message = NULL;
555 struct strbuf sb = STRBUF_INIT;
556 int fast_forward = 0, fast_backward = 0;
558 if (dirty_submodule & DIRTY_SUBMODULE_UNTRACKED)
559 diff_emit_submodule_untracked(o, path);
561 if (dirty_submodule & DIRTY_SUBMODULE_MODIFIED)
562 diff_emit_submodule_modified(o, path);
564 if (is_null_oid(one))
565 message = "(new submodule)";
566 else if (is_null_oid(two))
567 message = "(submodule deleted)";
569 if (!sub) {
570 if (!message)
571 message = "(commits not present)";
572 goto output_header;
576 * Attempt to lookup the commit references, and determine if this is
577 * a fast forward or fast backwards update.
579 *left = lookup_commit_reference(sub, one);
580 *right = lookup_commit_reference(sub, two);
583 * Warn about missing commits in the submodule project, but only if
584 * they aren't null.
586 if ((!is_null_oid(one) && !*left) ||
587 (!is_null_oid(two) && !*right))
588 message = "(commits not present)";
590 *merge_bases = repo_get_merge_bases(sub, *left, *right);
591 if (*merge_bases) {
592 if ((*merge_bases)->item == *left)
593 fast_forward = 1;
594 else if ((*merge_bases)->item == *right)
595 fast_backward = 1;
598 if (oideq(one, two)) {
599 strbuf_release(&sb);
600 return;
603 output_header:
604 strbuf_addf(&sb, "Submodule %s ", path);
605 strbuf_add_unique_abbrev(&sb, one, DEFAULT_ABBREV);
606 strbuf_addstr(&sb, (fast_backward || fast_forward) ? ".." : "...");
607 strbuf_add_unique_abbrev(&sb, two, DEFAULT_ABBREV);
608 if (message)
609 strbuf_addf(&sb, " %s\n", message);
610 else
611 strbuf_addf(&sb, "%s:\n", fast_backward ? " (rewind)" : "");
612 diff_emit_submodule_header(o, sb.buf);
614 strbuf_release(&sb);
617 void show_submodule_diff_summary(struct diff_options *o, const char *path,
618 struct object_id *one, struct object_id *two,
619 unsigned dirty_submodule)
621 struct rev_info rev = REV_INFO_INIT;
622 struct commit *left = NULL, *right = NULL;
623 struct commit_list *merge_bases = NULL;
624 struct repository *sub;
626 sub = open_submodule(path);
627 show_submodule_header(o, path, one, two, dirty_submodule,
628 sub, &left, &right, &merge_bases);
631 * If we don't have both a left and a right pointer, there is no
632 * reason to try and display a summary. The header line should contain
633 * all the information the user needs.
635 if (!left || !right || !sub)
636 goto out;
638 /* Treat revision walker failure the same as missing commits */
639 if (prepare_submodule_diff_summary(sub, &rev, path, left, right, merge_bases)) {
640 diff_emit_submodule_error(o, "(revision walker failed)\n");
641 goto out;
644 print_submodule_diff_summary(sub, &rev, o);
646 out:
647 free_commit_list(merge_bases);
648 release_revisions(&rev);
649 clear_commit_marks(left, ~0);
650 clear_commit_marks(right, ~0);
651 if (sub) {
652 repo_clear(sub);
653 free(sub);
657 void show_submodule_inline_diff(struct diff_options *o, const char *path,
658 struct object_id *one, struct object_id *two,
659 unsigned dirty_submodule)
661 const struct object_id *old_oid = the_hash_algo->empty_tree, *new_oid = the_hash_algo->empty_tree;
662 struct commit *left = NULL, *right = NULL;
663 struct commit_list *merge_bases = NULL;
664 struct child_process cp = CHILD_PROCESS_INIT;
665 struct strbuf sb = STRBUF_INIT;
666 struct repository *sub;
668 sub = open_submodule(path);
669 show_submodule_header(o, path, one, two, dirty_submodule,
670 sub, &left, &right, &merge_bases);
672 /* We need a valid left and right commit to display a difference */
673 if (!(left || is_null_oid(one)) ||
674 !(right || is_null_oid(two)))
675 goto done;
677 if (left)
678 old_oid = one;
679 if (right)
680 new_oid = two;
682 cp.git_cmd = 1;
683 cp.dir = path;
684 cp.out = -1;
685 cp.no_stdin = 1;
687 /* TODO: other options may need to be passed here. */
688 strvec_pushl(&cp.args, "diff", "--submodule=diff", NULL);
689 strvec_pushf(&cp.args, "--color=%s", want_color(o->use_color) ?
690 "always" : "never");
692 if (o->flags.reverse_diff) {
693 strvec_pushf(&cp.args, "--src-prefix=%s%s/",
694 o->b_prefix, path);
695 strvec_pushf(&cp.args, "--dst-prefix=%s%s/",
696 o->a_prefix, path);
697 } else {
698 strvec_pushf(&cp.args, "--src-prefix=%s%s/",
699 o->a_prefix, path);
700 strvec_pushf(&cp.args, "--dst-prefix=%s%s/",
701 o->b_prefix, path);
703 strvec_push(&cp.args, oid_to_hex(old_oid));
705 * If the submodule has modified content, we will diff against the
706 * work tree, under the assumption that the user has asked for the
707 * diff format and wishes to actually see all differences even if they
708 * haven't yet been committed to the submodule yet.
710 if (!(dirty_submodule & DIRTY_SUBMODULE_MODIFIED))
711 strvec_push(&cp.args, oid_to_hex(new_oid));
713 prepare_submodule_repo_env(&cp.env);
715 if (!is_directory(path)) {
716 /* fall back to absorbed git dir, if any */
717 if (!sub)
718 goto done;
719 cp.dir = sub->gitdir;
720 strvec_push(&cp.env, GIT_DIR_ENVIRONMENT "=.");
721 strvec_push(&cp.env, GIT_WORK_TREE_ENVIRONMENT "=.");
724 if (start_command(&cp)) {
725 diff_emit_submodule_error(o, "(diff failed)\n");
726 goto done;
729 while (strbuf_getwholeline_fd(&sb, cp.out, '\n') != EOF)
730 diff_emit_submodule_pipethrough(o, sb.buf, sb.len);
732 if (finish_command(&cp))
733 diff_emit_submodule_error(o, "(diff failed)\n");
735 done:
736 strbuf_release(&sb);
737 free_commit_list(merge_bases);
738 if (left)
739 clear_commit_marks(left, ~0);
740 if (right)
741 clear_commit_marks(right, ~0);
742 if (sub) {
743 repo_clear(sub);
744 free(sub);
748 int should_update_submodules(void)
750 return config_update_recurse_submodules == RECURSE_SUBMODULES_ON;
753 const struct submodule *submodule_from_ce(const struct cache_entry *ce)
755 if (!S_ISGITLINK(ce->ce_mode))
756 return NULL;
758 if (!should_update_submodules())
759 return NULL;
761 return submodule_from_path(the_repository, null_oid(), ce->name);
/* Callback payload handed to collect_changed_submodules_cb(). */
struct collect_changed_submodules_cb_data {
	/* Repository in which submodule names are looked up. */
	struct repository *repo;
	/* Result list, keyed by submodule name. */
	struct string_list *changed;
	/* Superproject commit whose diff is currently being processed. */
	const struct object_id *commit_oid;
};
772 * this would normally be two functions: default_name_from_path() and
773 * path_from_default_name(). Since the default name is the same as
774 * the submodule path we can get away with just one function which only
775 * checks whether there is a submodule in the working directory at that
776 * location.
778 static const char *default_name_or_path(const char *path_or_name)
780 int error_code;
782 if (!is_submodule_populated_gently(path_or_name, &error_code))
783 return NULL;
785 return path_or_name;
789 * Holds relevant information for a changed submodule. Used as the .util
790 * member of the changed submodule name string_list_item.
792 * (super_oid, path) allows the submodule config to be read from _some_
793 * .gitmodules file. We store this information the first time we find a
794 * superproject commit that points to the submodule, but this is
795 * arbitrary - we can choose any (super_oid, path) that matches the
796 * submodule's name.
798 * NEEDSWORK: Storing an arbitrary commit is undesirable because we can't
799 * guarantee that we're reading the commit that the user would expect. A better
800 * scheme would be to just fetch a submodule by its name. This requires two
801 * steps:
802 * - Create a function that behaves like repo_submodule_init(), but accepts a
803 * submodule name instead of treeish_name and path. This should be easy
804 * because repo_submodule_init() internally uses the submodule's name.
806 * - Replace most instances of 'struct submodule' (which is the .gitmodules
807 * config) with just the submodule name. This is OK because we expect
808 * submodule settings to be stored in .git/config (via "git submodule init"),
809 * not .gitmodules. This also lets us delete get_non_gitmodules_submodule(),
810 * which constructs a bogus 'struct submodule' for the sake of giving a
811 * placeholder name to a gitlink.
813 struct changed_submodule_data {
815 * The first superproject commit in the rev walk that points to
816 * the submodule.
818 const struct object_id *super_oid;
820 * Path to the submodule in the superproject commit referenced
821 * by 'super_oid'.
823 char *path;
824 /* The submodule commits that have changed in the rev walk. */
825 struct oid_array new_commits;
828 static void changed_submodule_data_clear(struct changed_submodule_data *cs_data)
830 oid_array_clear(&cs_data->new_commits);
831 free(cs_data->path);
834 static void collect_changed_submodules_cb(struct diff_queue_struct *q,
835 struct diff_options *options UNUSED,
836 void *data)
838 struct collect_changed_submodules_cb_data *me = data;
839 struct string_list *changed = me->changed;
840 const struct object_id *commit_oid = me->commit_oid;
841 int i;
843 for (i = 0; i < q->nr; i++) {
844 struct diff_filepair *p = q->queue[i];
845 const struct submodule *submodule;
846 const char *name;
847 struct string_list_item *item;
848 struct changed_submodule_data *cs_data;
850 if (!S_ISGITLINK(p->two->mode))
851 continue;
853 submodule = submodule_from_path(me->repo,
854 commit_oid, p->two->path);
855 if (submodule)
856 name = submodule->name;
857 else {
858 name = default_name_or_path(p->two->path);
859 /* make sure name does not collide with existing one */
860 if (name)
861 submodule = submodule_from_name(me->repo,
862 commit_oid, name);
863 if (submodule) {
864 warning(_("Submodule in commit %s at path: "
865 "'%s' collides with a submodule named "
866 "the same. Skipping it."),
867 oid_to_hex(commit_oid), p->two->path);
868 name = NULL;
872 if (!name)
873 continue;
875 item = string_list_insert(changed, name);
876 if (item->util)
877 cs_data = item->util;
878 else {
879 item->util = xcalloc(1, sizeof(struct changed_submodule_data));
880 cs_data = item->util;
881 cs_data->super_oid = commit_oid;
882 cs_data->path = xstrdup(p->two->path);
884 oid_array_append(&cs_data->new_commits, &p->two->oid);
889 * Collect the paths of submodules in 'changed' which have changed based on
890 * the revisions as specified in 'argv'. Each entry in 'changed' will also
891 * have a corresponding 'struct oid_array' (in the 'util' field) which lists
892 * what the submodule pointers were updated to during the change.
894 static void collect_changed_submodules(struct repository *r,
895 struct string_list *changed,
896 struct strvec *argv)
898 struct rev_info rev;
899 const struct commit *commit;
900 int save_warning;
901 struct setup_revision_opt s_r_opt = {
902 .assume_dashdash = 1,
905 save_warning = warn_on_object_refname_ambiguity;
906 warn_on_object_refname_ambiguity = 0;
907 repo_init_revisions(r, &rev, NULL);
908 setup_revisions(argv->nr, argv->v, &rev, &s_r_opt);
909 warn_on_object_refname_ambiguity = save_warning;
910 if (prepare_revision_walk(&rev))
911 die(_("revision walk setup failed"));
913 while ((commit = get_revision(&rev))) {
914 struct rev_info diff_rev;
915 struct collect_changed_submodules_cb_data data;
916 data.repo = r;
917 data.changed = changed;
918 data.commit_oid = &commit->object.oid;
920 repo_init_revisions(r, &diff_rev, NULL);
921 diff_rev.diffopt.output_format |= DIFF_FORMAT_CALLBACK;
922 diff_rev.diffopt.format_callback = collect_changed_submodules_cb;
923 diff_rev.diffopt.format_callback_data = &data;
924 diff_rev.dense_combined_merges = 1;
925 diff_tree_combined_merge(commit, &diff_rev);
926 release_revisions(&diff_rev);
929 reset_revision_walk();
930 release_revisions(&rev);
933 static void free_submodules_data(struct string_list *submodules)
935 struct string_list_item *item;
936 for_each_string_list_item(item, submodules)
937 changed_submodule_data_clear(item->util);
939 string_list_clear(submodules, 1);
942 static int has_remote(const char *refname UNUSED,
943 const struct object_id *oid UNUSED,
944 int flags UNUSED, void *cb_data UNUSED)
946 return 1;
/*
 * oid_array callback: push the hex form of 'oid' onto the strvec passed
 * as 'data'. Always returns 0.
 */
static int append_oid_to_argv(const struct object_id *oid, void *data)
{
	struct strvec *args = data;
	const char *hex = oid_to_hex(oid);

	strvec_push(args, hex);
	return 0;
}
/* State shared between submodule_has_commits() and check_has_commit(). */
struct has_commit_data {
	/* Superproject repository. */
	struct repository *repo;
	/* Starts out as 1; cleared once a commit is found to be missing. */
	int result;
	/* Path of the submodule within the superproject. */
	const char *path;
	/* Superproject commit used to locate the submodule. */
	const struct object_id *super_oid;
};
963 static int check_has_commit(const struct object_id *oid, void *data)
965 struct has_commit_data *cb = data;
966 struct repository subrepo;
967 enum object_type type;
969 if (repo_submodule_init(&subrepo, cb->repo, cb->path, cb->super_oid)) {
970 cb->result = 0;
971 /* subrepo failed to init, so don't clean it up. */
972 return 0;
975 type = oid_object_info(&subrepo, oid, NULL);
977 switch (type) {
978 case OBJ_COMMIT:
979 goto cleanup;
980 case OBJ_BAD:
982 * Object is missing or invalid. If invalid, an error message
983 * has already been printed.
985 cb->result = 0;
986 goto cleanup;
987 default:
988 die(_("submodule entry '%s' (%s) is a %s, not a commit"),
989 cb->path, oid_to_hex(oid), type_name(type));
991 cleanup:
992 repo_clear(&subrepo);
993 return 0;
996 static int submodule_has_commits(struct repository *r,
997 const char *path,
998 const struct object_id *super_oid,
999 struct oid_array *commits)
1001 struct has_commit_data has_commit = {
1002 .repo = r,
1003 .result = 1,
1004 .path = path,
1005 .super_oid = super_oid
1008 oid_array_for_each_unique(commits, check_has_commit, &has_commit);
1010 if (has_commit.result) {
1012 * Even if the submodule is checked out and the commit is
1013 * present, make sure it exists in the submodule's object store
1014 * and that it is reachable from a ref.
1016 struct child_process cp = CHILD_PROCESS_INIT;
1017 struct strbuf out = STRBUF_INIT;
1019 strvec_pushl(&cp.args, "rev-list", "-n", "1", NULL);
1020 oid_array_for_each_unique(commits, append_oid_to_argv, &cp.args);
1021 strvec_pushl(&cp.args, "--not", "--all", NULL);
1023 prepare_submodule_repo_env(&cp.env);
1024 cp.git_cmd = 1;
1025 cp.no_stdin = 1;
1026 cp.dir = path;
1028 if (capture_command(&cp, &out, GIT_MAX_HEXSZ + 1) || out.len)
1029 has_commit.result = 0;
1031 strbuf_release(&out);
1034 return has_commit.result;
1037 static int submodule_needs_pushing(struct repository *r,
1038 const char *path,
1039 struct oid_array *commits)
1041 if (!submodule_has_commits(r, path, null_oid(), commits))
1043 * NOTE: We do consider it safe to return "no" here. The
1044 * correct answer would be "We do not know" instead of
1045 * "No push needed", but it is quite hard to change
1046 * the submodule pointer without having the submodule
1047 * around. If a user did however change the submodules
1048 * without having the submodule around, this indicates
1049 * an expert who knows what they are doing or a
1050 * maintainer integrating work from other people. In
1051 * both cases it should be safe to skip this check.
1053 return 0;
1055 if (for_each_remote_ref_submodule(path, has_remote, NULL) > 0) {
1056 struct child_process cp = CHILD_PROCESS_INIT;
1057 struct strbuf buf = STRBUF_INIT;
1058 int needs_pushing = 0;
1060 strvec_push(&cp.args, "rev-list");
1061 oid_array_for_each_unique(commits, append_oid_to_argv, &cp.args);
1062 strvec_pushl(&cp.args, "--not", "--remotes", "-n", "1" , NULL);
1064 prepare_submodule_repo_env(&cp.env);
1065 cp.git_cmd = 1;
1066 cp.no_stdin = 1;
1067 cp.out = -1;
1068 cp.dir = path;
1069 if (start_command(&cp))
1070 die(_("Could not run 'git rev-list <commits> --not --remotes -n 1' command in submodule %s"),
1071 path);
1072 if (strbuf_read(&buf, cp.out, the_hash_algo->hexsz + 1))
1073 needs_pushing = 1;
1074 finish_command(&cp);
1075 close(cp.out);
1076 strbuf_release(&buf);
1077 return needs_pushing;
1080 return 0;
1083 int find_unpushed_submodules(struct repository *r,
1084 struct oid_array *commits,
1085 const char *remotes_name,
1086 struct string_list *needs_pushing)
1088 struct string_list submodules = STRING_LIST_INIT_DUP;
1089 struct string_list_item *name;
1090 struct strvec argv = STRVEC_INIT;
1092 /* argv.v[0] will be ignored by setup_revisions */
1093 strvec_push(&argv, "find_unpushed_submodules");
1094 oid_array_for_each_unique(commits, append_oid_to_argv, &argv);
1095 strvec_push(&argv, "--not");
1096 strvec_pushf(&argv, "--remotes=%s", remotes_name);
1098 collect_changed_submodules(r, &submodules, &argv);
1100 for_each_string_list_item(name, &submodules) {
1101 struct changed_submodule_data *cs_data = name->util;
1102 const struct submodule *submodule;
1103 const char *path = NULL;
1105 submodule = submodule_from_name(r, null_oid(), name->string);
1106 if (submodule)
1107 path = submodule->path;
1108 else
1109 path = default_name_or_path(name->string);
1111 if (!path)
1112 continue;
1114 if (submodule_needs_pushing(r, path, &cs_data->new_commits))
1115 string_list_insert(needs_pushing, path);
1118 free_submodules_data(&submodules);
1119 strvec_clear(&argv);
1121 return needs_pushing->nr;
1124 static int push_submodule(const char *path,
1125 const struct remote *remote,
1126 const struct refspec *rs,
1127 const struct string_list *push_options,
1128 int dry_run)
1130 if (for_each_remote_ref_submodule(path, has_remote, NULL) > 0) {
1131 struct child_process cp = CHILD_PROCESS_INIT;
1132 strvec_push(&cp.args, "push");
1134 * When recursing into a submodule, treat any "only" configurations as "on-
1135 * demand", since "only" would not work (we need all submodules to be pushed
1136 * in order to be able to push the superproject).
1138 strvec_push(&cp.args, "--recurse-submodules=only-is-on-demand");
1139 if (dry_run)
1140 strvec_push(&cp.args, "--dry-run");
1142 if (push_options && push_options->nr) {
1143 const struct string_list_item *item;
1144 for_each_string_list_item(item, push_options)
1145 strvec_pushf(&cp.args, "--push-option=%s",
1146 item->string);
1149 if (remote->origin != REMOTE_UNCONFIGURED) {
1150 int i;
1151 strvec_push(&cp.args, remote->name);
1152 for (i = 0; i < rs->raw_nr; i++)
1153 strvec_push(&cp.args, rs->raw[i]);
1156 prepare_submodule_repo_env(&cp.env);
1157 cp.git_cmd = 1;
1158 cp.no_stdin = 1;
1159 cp.dir = path;
1160 if (run_command(&cp))
1161 return 0;
1162 close(cp.out);
1165 return 1;
1169 * Perform a check in the submodule to see if the remote and refspec work.
1170 * Die if the submodule can't be pushed.
1172 static void submodule_push_check(const char *path, const char *head,
1173 const struct remote *remote,
1174 const struct refspec *rs)
1176 struct child_process cp = CHILD_PROCESS_INIT;
1177 int i;
1179 strvec_push(&cp.args, "submodule--helper");
1180 strvec_push(&cp.args, "push-check");
1181 strvec_push(&cp.args, head);
1182 strvec_push(&cp.args, remote->name);
1184 for (i = 0; i < rs->raw_nr; i++)
1185 strvec_push(&cp.args, rs->raw[i]);
1187 prepare_submodule_repo_env(&cp.env);
1188 cp.git_cmd = 1;
1189 cp.no_stdin = 1;
1190 cp.no_stdout = 1;
1191 cp.dir = path;
1194 * Simply indicate if 'submodule--helper push-check' failed.
1195 * More detailed error information will be provided by the
1196 * child process.
1198 if (run_command(&cp))
1199 die(_("process for submodule '%s' failed"), path);
1202 int push_unpushed_submodules(struct repository *r,
1203 struct oid_array *commits,
1204 const struct remote *remote,
1205 const struct refspec *rs,
1206 const struct string_list *push_options,
1207 int dry_run)
1209 int i, ret = 1;
1210 struct string_list needs_pushing = STRING_LIST_INIT_DUP;
1212 if (!find_unpushed_submodules(r, commits,
1213 remote->name, &needs_pushing))
1214 return 1;
1217 * Verify that the remote and refspec can be propagated to all
1218 * submodules. This check can be skipped if the remote and refspec
1219 * won't be propagated due to the remote being unconfigured (e.g. a URL
1220 * instead of a remote name).
1222 if (remote->origin != REMOTE_UNCONFIGURED) {
1223 char *head;
1224 struct object_id head_oid;
1226 head = resolve_refdup("HEAD", 0, &head_oid, NULL);
1227 if (!head)
1228 die(_("Failed to resolve HEAD as a valid ref."));
1230 for (i = 0; i < needs_pushing.nr; i++)
1231 submodule_push_check(needs_pushing.items[i].string,
1232 head, remote, rs);
1233 free(head);
1236 /* Actually push the submodules */
1237 for (i = 0; i < needs_pushing.nr; i++) {
1238 const char *path = needs_pushing.items[i].string;
1239 fprintf(stderr, _("Pushing submodule '%s'\n"), path);
1240 if (!push_submodule(path, remote, rs,
1241 push_options, dry_run)) {
1242 fprintf(stderr, _("Unable to push submodule '%s'\n"), path);
1243 ret = 0;
1247 string_list_clear(&needs_pushing, 0);
1249 return ret;
1252 static int append_oid_to_array(const char *ref UNUSED,
1253 const struct object_id *oid,
1254 int flags UNUSED, void *data)
1256 struct oid_array *array = data;
1257 oid_array_append(array, oid);
1258 return 0;
1261 void check_for_new_submodule_commits(struct object_id *oid)
1263 if (!initialized_fetch_ref_tips) {
1264 for_each_ref(append_oid_to_array, &ref_tips_before_fetch);
1265 initialized_fetch_ref_tips = 1;
1268 oid_array_append(&ref_tips_after_fetch, oid);
1272 * Returns 1 if there is at least one submodule gitdir in
1273 * $GIT_DIR/modules and 0 otherwise. This follows
1274 * submodule_name_to_gitdir(), which looks for submodules in
1275 * $GIT_DIR/modules, not $GIT_COMMON_DIR.
1277 * A submodule can be moved to $GIT_DIR/modules manually by running "git
1278 * submodule absorbgitdirs", or it may be initialized there by "git
1279 * submodule update".
1281 static int repo_has_absorbed_submodules(struct repository *r)
1283 int ret;
1284 struct strbuf buf = STRBUF_INIT;
1286 strbuf_repo_git_path(&buf, r, "modules/");
1287 ret = file_exists(buf.buf) && !is_empty_dir(buf.buf);
1288 strbuf_release(&buf);
1289 return ret;
1292 static void calculate_changed_submodule_paths(struct repository *r,
1293 struct string_list *changed_submodule_names)
1295 struct strvec argv = STRVEC_INIT;
1296 struct string_list_item *name;
1298 /* No need to check if no submodules would be fetched */
1299 if (!submodule_from_path(r, NULL, NULL) &&
1300 !repo_has_absorbed_submodules(r))
1301 return;
1303 strvec_push(&argv, "--"); /* argv[0] program name */
1304 oid_array_for_each_unique(&ref_tips_after_fetch,
1305 append_oid_to_argv, &argv);
1306 strvec_push(&argv, "--not");
1307 oid_array_for_each_unique(&ref_tips_before_fetch,
1308 append_oid_to_argv, &argv);
1311 * Collect all submodules (whether checked out or not) for which new
1312 * commits have been recorded upstream in "changed_submodule_names".
1314 collect_changed_submodules(r, changed_submodule_names, &argv);
1316 for_each_string_list_item(name, changed_submodule_names) {
1317 struct changed_submodule_data *cs_data = name->util;
1318 const struct submodule *submodule;
1319 const char *path = NULL;
1321 submodule = submodule_from_name(r, null_oid(), name->string);
1322 if (submodule)
1323 path = submodule->path;
1324 else
1325 path = default_name_or_path(name->string);
1327 if (!path)
1328 continue;
1330 if (submodule_has_commits(r, path, null_oid(), &cs_data->new_commits)) {
1331 changed_submodule_data_clear(cs_data);
1332 *name->string = '\0';
1336 string_list_remove_empty_items(changed_submodule_names, 1);
1338 strvec_clear(&argv);
1339 oid_array_clear(&ref_tips_before_fetch);
1340 oid_array_clear(&ref_tips_after_fetch);
1341 initialized_fetch_ref_tips = 0;
1344 int submodule_touches_in_range(struct repository *r,
1345 struct object_id *excl_oid,
1346 struct object_id *incl_oid)
1348 struct string_list subs = STRING_LIST_INIT_DUP;
1349 struct strvec args = STRVEC_INIT;
1350 int ret;
1352 /* No need to check if there are no submodules configured */
1353 if (!submodule_from_path(r, NULL, NULL))
1354 return 0;
1356 strvec_push(&args, "--"); /* args[0] program name */
1357 strvec_push(&args, oid_to_hex(incl_oid));
1358 if (!is_null_oid(excl_oid)) {
1359 strvec_push(&args, "--not");
1360 strvec_push(&args, oid_to_hex(excl_oid));
1363 collect_changed_submodules(r, &subs, &args);
1364 ret = subs.nr;
1366 strvec_clear(&args);
1368 free_submodules_data(&subs);
1369 return ret;
1372 struct submodule_parallel_fetch {
1374 * The index of the last index entry processed by
1375 * get_fetch_task_from_index().
1377 int index_count;
1379 * The index of the last string_list entry processed by
1380 * get_fetch_task_from_changed().
1382 int changed_count;
1383 struct strvec args;
1384 struct repository *r;
1385 const char *prefix;
1386 int command_line_option;
1387 int default_option;
1388 int quiet;
1389 int result;
1392 * Names of submodules that have new commits. Generated by
1393 * walking the newly fetched superproject commits.
1395 struct string_list changed_submodule_names;
1397 * Names of submodules that have already been processed. Lets us
1398 * avoid fetching the same submodule more than once.
1400 struct string_list seen_submodule_names;
1402 /* Pending fetches by OIDs */
1403 struct fetch_task **oid_fetch_tasks;
1404 int oid_fetch_tasks_nr, oid_fetch_tasks_alloc;
1406 struct strbuf submodules_with_errors;
1408 #define SPF_INIT { \
1409 .args = STRVEC_INIT, \
1410 .changed_submodule_names = STRING_LIST_INIT_DUP, \
1411 .seen_submodule_names = STRING_LIST_INIT_DUP, \
1412 .submodules_with_errors = STRBUF_INIT, \
1415 static int get_fetch_recurse_config(const struct submodule *submodule,
1416 struct submodule_parallel_fetch *spf)
1418 if (spf->command_line_option != RECURSE_SUBMODULES_DEFAULT)
1419 return spf->command_line_option;
1421 if (submodule) {
1422 char *key;
1423 const char *value;
1425 int fetch_recurse = submodule->fetch_recurse;
1426 key = xstrfmt("submodule.%s.fetchRecurseSubmodules", submodule->name);
1427 if (!repo_config_get_string_tmp(spf->r, key, &value)) {
1428 fetch_recurse = parse_fetch_recurse_submodules_arg(key, value);
1430 free(key);
1432 if (fetch_recurse != RECURSE_SUBMODULES_NONE)
1433 /* local config overrules everything except commandline */
1434 return fetch_recurse;
1437 return spf->default_option;
1441 * Fetch in progress (if callback data) or
1442 * pending (if in oid_fetch_tasks in struct submodule_parallel_fetch)
1444 struct fetch_task {
1445 struct repository *repo;
1446 const struct submodule *sub;
1447 unsigned free_sub : 1; /* Do we need to free the submodule? */
1448 const char *default_argv; /* The default fetch mode. */
1449 struct strvec git_args; /* Args for the child git process. */
1451 struct oid_array *commits; /* Ensure these commits are fetched */
1455 * When a submodule is not defined in .gitmodules, we cannot access it
1456 * via the regular submodule-config. Create a fake submodule, which we can
1457 * work on.
1459 static const struct submodule *get_non_gitmodules_submodule(const char *path)
1461 struct submodule *ret = NULL;
1462 const char *name = default_name_or_path(path);
1464 if (!name)
1465 return NULL;
1467 ret = xmalloc(sizeof(*ret));
1468 memset(ret, 0, sizeof(*ret));
1469 ret->path = name;
1470 ret->name = name;
1472 return (const struct submodule *) ret;
1475 static void fetch_task_release(struct fetch_task *p)
1477 if (p->free_sub)
1478 free((void*)p->sub);
1479 p->free_sub = 0;
1480 p->sub = NULL;
1482 if (p->repo)
1483 repo_clear(p->repo);
1484 FREE_AND_NULL(p->repo);
1486 strvec_clear(&p->git_args);
1489 static struct repository *get_submodule_repo_for(struct repository *r,
1490 const char *path,
1491 const struct object_id *treeish_name)
1493 struct repository *ret = xmalloc(sizeof(*ret));
1495 if (repo_submodule_init(ret, r, path, treeish_name)) {
1496 free(ret);
1497 return NULL;
1500 return ret;
1503 static struct fetch_task *fetch_task_create(struct submodule_parallel_fetch *spf,
1504 const char *path,
1505 const struct object_id *treeish_name)
1507 struct fetch_task *task = xmalloc(sizeof(*task));
1508 memset(task, 0, sizeof(*task));
1510 task->sub = submodule_from_path(spf->r, treeish_name, path);
1512 if (!task->sub) {
1514 * No entry in .gitmodules? Technically not a submodule,
1515 * but historically we supported repositories that happen to be
1516 * in-place where a gitlink is. Keep supporting them.
1518 task->sub = get_non_gitmodules_submodule(path);
1519 if (!task->sub)
1520 goto cleanup;
1522 task->free_sub = 1;
1525 if (string_list_lookup(&spf->seen_submodule_names, task->sub->name))
1526 goto cleanup;
1528 switch (get_fetch_recurse_config(task->sub, spf))
1530 default:
1531 case RECURSE_SUBMODULES_DEFAULT:
1532 case RECURSE_SUBMODULES_ON_DEMAND:
1533 if (!task->sub ||
1534 !string_list_lookup(
1535 &spf->changed_submodule_names,
1536 task->sub->name))
1537 goto cleanup;
1538 task->default_argv = "on-demand";
1539 break;
1540 case RECURSE_SUBMODULES_ON:
1541 task->default_argv = "yes";
1542 break;
1543 case RECURSE_SUBMODULES_OFF:
1544 goto cleanup;
1547 task->repo = get_submodule_repo_for(spf->r, path, treeish_name);
1549 return task;
1551 cleanup:
1552 fetch_task_release(task);
1553 free(task);
1554 return NULL;
1557 static struct fetch_task *
1558 get_fetch_task_from_index(struct submodule_parallel_fetch *spf,
1559 struct strbuf *err)
1561 for (; spf->index_count < spf->r->index->cache_nr; spf->index_count++) {
1562 const struct cache_entry *ce =
1563 spf->r->index->cache[spf->index_count];
1564 struct fetch_task *task;
1566 if (!S_ISGITLINK(ce->ce_mode))
1567 continue;
1569 task = fetch_task_create(spf, ce->name, null_oid());
1570 if (!task)
1571 continue;
1573 if (task->repo) {
1574 if (!spf->quiet)
1575 strbuf_addf(err, _("Fetching submodule %s%s\n"),
1576 spf->prefix, ce->name);
1578 spf->index_count++;
1579 return task;
1580 } else {
1581 struct strbuf empty_submodule_path = STRBUF_INIT;
1583 fetch_task_release(task);
1584 free(task);
1587 * An empty directory is normal,
1588 * the submodule is not initialized
1590 strbuf_addf(&empty_submodule_path, "%s/%s/",
1591 spf->r->worktree,
1592 ce->name);
1593 if (S_ISGITLINK(ce->ce_mode) &&
1594 !is_empty_dir(empty_submodule_path.buf)) {
1595 spf->result = 1;
1596 strbuf_addf(err,
1597 _("Could not access submodule '%s'\n"),
1598 ce->name);
1600 strbuf_release(&empty_submodule_path);
1603 return NULL;
1606 static struct fetch_task *
1607 get_fetch_task_from_changed(struct submodule_parallel_fetch *spf,
1608 struct strbuf *err)
1610 for (; spf->changed_count < spf->changed_submodule_names.nr;
1611 spf->changed_count++) {
1612 struct string_list_item item =
1613 spf->changed_submodule_names.items[spf->changed_count];
1614 struct changed_submodule_data *cs_data = item.util;
1615 struct fetch_task *task;
1617 if (!is_tree_submodule_active(spf->r, cs_data->super_oid,cs_data->path))
1618 continue;
1620 task = fetch_task_create(spf, cs_data->path,
1621 cs_data->super_oid);
1622 if (!task)
1623 continue;
1625 if (!task->repo) {
1626 strbuf_addf(err, _("Could not access submodule '%s' at commit %s\n"),
1627 cs_data->path,
1628 find_unique_abbrev(cs_data->super_oid, DEFAULT_ABBREV));
1630 fetch_task_release(task);
1631 free(task);
1632 continue;
1635 if (!spf->quiet)
1636 strbuf_addf(err,
1637 _("Fetching submodule %s%s at commit %s\n"),
1638 spf->prefix, task->sub->path,
1639 find_unique_abbrev(cs_data->super_oid,
1640 DEFAULT_ABBREV));
1642 spf->changed_count++;
1644 * NEEDSWORK: Submodules set/unset a value for
1645 * core.worktree when they are populated/unpopulated by
1646 * "git checkout" (and similar commands, see
1647 * submodule_move_head() and
1648 * connect_work_tree_and_git_dir()), but if the
1649 * submodule is unpopulated in another way (e.g. "git
1650 * rm", "rm -r"), core.worktree will still be set even
1651 * though the directory doesn't exist, and the child
1652 * process will crash while trying to chdir into the
1653 * nonexistent directory.
1655 * In this case, we know that the submodule has no
1656 * working tree, so we can work around this by
1657 * setting "--work-tree=." (--bare does not work because
1658 * worktree settings take precedence over bare-ness).
1659 * However, this is not necessarily true in other cases,
1660 * so a generalized solution is still necessary.
1662 * Possible solutions:
1663 * - teach "git [add|rm]" to unset core.worktree and
1664 * discourage users from removing submodules without
1665 * using a Git command.
1666 * - teach submodule child processes to ignore stale
1667 * core.worktree values.
1669 strvec_push(&task->git_args, "--work-tree=.");
1670 return task;
1672 return NULL;
1675 static int get_next_submodule(struct child_process *cp, struct strbuf *err,
1676 void *data, void **task_cb)
1678 struct submodule_parallel_fetch *spf = data;
1679 struct fetch_task *task =
1680 get_fetch_task_from_index(spf, err);
1681 if (!task)
1682 task = get_fetch_task_from_changed(spf, err);
1684 if (task) {
1685 struct strbuf submodule_prefix = STRBUF_INIT;
1687 child_process_init(cp);
1688 cp->dir = task->repo->gitdir;
1689 prepare_submodule_repo_env_in_gitdir(&cp->env);
1690 cp->git_cmd = 1;
1691 strvec_init(&cp->args);
1692 if (task->git_args.nr)
1693 strvec_pushv(&cp->args, task->git_args.v);
1694 strvec_pushv(&cp->args, spf->args.v);
1695 strvec_push(&cp->args, task->default_argv);
1696 strvec_push(&cp->args, "--submodule-prefix");
1698 strbuf_addf(&submodule_prefix, "%s%s/",
1699 spf->prefix,
1700 task->sub->path);
1701 strvec_push(&cp->args, submodule_prefix.buf);
1702 *task_cb = task;
1704 strbuf_release(&submodule_prefix);
1705 string_list_insert(&spf->seen_submodule_names, task->sub->name);
1706 return 1;
1709 if (spf->oid_fetch_tasks_nr) {
1710 struct fetch_task *task =
1711 spf->oid_fetch_tasks[spf->oid_fetch_tasks_nr - 1];
1712 struct strbuf submodule_prefix = STRBUF_INIT;
1713 spf->oid_fetch_tasks_nr--;
1715 strbuf_addf(&submodule_prefix, "%s%s/",
1716 spf->prefix, task->sub->path);
1718 child_process_init(cp);
1719 prepare_submodule_repo_env_in_gitdir(&cp->env);
1720 cp->git_cmd = 1;
1721 cp->dir = task->repo->gitdir;
1723 strvec_init(&cp->args);
1724 strvec_pushv(&cp->args, spf->args.v);
1725 strvec_push(&cp->args, "on-demand");
1726 strvec_push(&cp->args, "--submodule-prefix");
1727 strvec_push(&cp->args, submodule_prefix.buf);
1729 /* NEEDSWORK: have get_default_remote from submodule--helper */
1730 strvec_push(&cp->args, "origin");
1731 oid_array_for_each_unique(task->commits,
1732 append_oid_to_argv, &cp->args);
1734 *task_cb = task;
1735 strbuf_release(&submodule_prefix);
1736 return 1;
1739 return 0;
1742 static int fetch_start_failure(struct strbuf *err,
1743 void *cb, void *task_cb)
1745 struct submodule_parallel_fetch *spf = cb;
1746 struct fetch_task *task = task_cb;
1748 spf->result = 1;
1750 fetch_task_release(task);
1751 return 0;
1754 static int commit_missing_in_sub(const struct object_id *oid, void *data)
1756 struct repository *subrepo = data;
1758 enum object_type type = oid_object_info(subrepo, oid, NULL);
1760 return type != OBJ_COMMIT;
1763 static int fetch_finish(int retvalue, struct strbuf *err,
1764 void *cb, void *task_cb)
1766 struct submodule_parallel_fetch *spf = cb;
1767 struct fetch_task *task = task_cb;
1769 struct string_list_item *it;
1770 struct changed_submodule_data *cs_data;
1772 if (!task || !task->sub)
1773 BUG("callback cookie bogus");
1775 if (retvalue) {
1777 * NEEDSWORK: This indicates that the overall fetch
1778 * failed, even though there may be a subsequent fetch
1779 * by commit hash that might work. It may be a good
1780 * idea to not indicate failure in this case, and only
1781 * indicate failure if the subsequent fetch fails.
1783 spf->result = 1;
1785 strbuf_addf(&spf->submodules_with_errors, "\t%s\n",
1786 task->sub->name);
1789 /* Is this the second time we process this submodule? */
1790 if (task->commits)
1791 goto out;
1793 it = string_list_lookup(&spf->changed_submodule_names, task->sub->name);
1794 if (!it)
1795 /* Could be an unchanged submodule, not contained in the list */
1796 goto out;
1798 cs_data = it->util;
1799 oid_array_filter(&cs_data->new_commits,
1800 commit_missing_in_sub,
1801 task->repo);
1803 /* Are there commits we want, but do not exist? */
1804 if (cs_data->new_commits.nr) {
1805 task->commits = &cs_data->new_commits;
1806 ALLOC_GROW(spf->oid_fetch_tasks,
1807 spf->oid_fetch_tasks_nr + 1,
1808 spf->oid_fetch_tasks_alloc);
1809 spf->oid_fetch_tasks[spf->oid_fetch_tasks_nr] = task;
1810 spf->oid_fetch_tasks_nr++;
1811 return 0;
1814 out:
1815 fetch_task_release(task);
1817 return 0;
1820 int fetch_submodules(struct repository *r,
1821 const struct strvec *options,
1822 const char *prefix, int command_line_option,
1823 int default_option,
1824 int quiet, int max_parallel_jobs)
1826 int i;
1827 struct submodule_parallel_fetch spf = SPF_INIT;
1828 const struct run_process_parallel_opts opts = {
1829 .tr2_category = "submodule",
1830 .tr2_label = "parallel/fetch",
1832 .processes = max_parallel_jobs,
1834 .get_next_task = get_next_submodule,
1835 .start_failure = fetch_start_failure,
1836 .task_finished = fetch_finish,
1837 .data = &spf,
1840 spf.r = r;
1841 spf.command_line_option = command_line_option;
1842 spf.default_option = default_option;
1843 spf.quiet = quiet;
1844 spf.prefix = prefix;
1846 if (!r->worktree)
1847 goto out;
1849 if (repo_read_index(r) < 0)
1850 die(_("index file corrupt"));
1852 strvec_push(&spf.args, "fetch");
1853 for (i = 0; i < options->nr; i++)
1854 strvec_push(&spf.args, options->v[i]);
1855 strvec_push(&spf.args, "--recurse-submodules-default");
1856 /* default value, "--submodule-prefix" and its value are added later */
1858 calculate_changed_submodule_paths(r, &spf.changed_submodule_names);
1859 string_list_sort(&spf.changed_submodule_names);
1860 run_processes_parallel(&opts);
1862 if (spf.submodules_with_errors.len > 0)
1863 fprintf(stderr, _("Errors during submodule fetch:\n%s"),
1864 spf.submodules_with_errors.buf);
1867 strvec_clear(&spf.args);
1868 out:
1869 free_submodules_data(&spf.changed_submodule_names);
1870 return spf.result;
1873 unsigned is_submodule_modified(const char *path, int ignore_untracked)
1875 struct child_process cp = CHILD_PROCESS_INIT;
1876 struct strbuf buf = STRBUF_INIT;
1877 FILE *fp;
1878 unsigned dirty_submodule = 0;
1879 const char *git_dir;
1880 int ignore_cp_exit_code = 0;
1882 strbuf_addf(&buf, "%s/.git", path);
1883 git_dir = read_gitfile(buf.buf);
1884 if (!git_dir)
1885 git_dir = buf.buf;
1886 if (!is_git_directory(git_dir)) {
1887 if (is_directory(git_dir))
1888 die(_("'%s' not recognized as a git repository"), git_dir);
1889 strbuf_release(&buf);
1890 /* The submodule is not checked out, so it is not modified */
1891 return 0;
1893 strbuf_reset(&buf);
1895 strvec_pushl(&cp.args, "status", "--porcelain=2", NULL);
1896 if (ignore_untracked)
1897 strvec_push(&cp.args, "-uno");
1899 prepare_submodule_repo_env(&cp.env);
1900 cp.git_cmd = 1;
1901 cp.no_stdin = 1;
1902 cp.out = -1;
1903 cp.dir = path;
1904 if (start_command(&cp))
1905 die(_("Could not run 'git status --porcelain=2' in submodule %s"), path);
1907 fp = xfdopen(cp.out, "r");
1908 while (strbuf_getwholeline(&buf, fp, '\n') != EOF) {
1909 /* regular untracked files */
1910 if (buf.buf[0] == '?')
1911 dirty_submodule |= DIRTY_SUBMODULE_UNTRACKED;
1913 if (buf.buf[0] == 'u' ||
1914 buf.buf[0] == '1' ||
1915 buf.buf[0] == '2') {
1916 /* T = line type, XY = status, SSSS = submodule state */
1917 if (buf.len < strlen("T XY SSSS"))
1918 BUG("invalid status --porcelain=2 line %s",
1919 buf.buf);
1921 if (buf.buf[5] == 'S' && buf.buf[8] == 'U')
1922 /* nested untracked file */
1923 dirty_submodule |= DIRTY_SUBMODULE_UNTRACKED;
1925 if (buf.buf[0] == 'u' ||
1926 buf.buf[0] == '2' ||
1927 memcmp(buf.buf + 5, "S..U", 4))
1928 /* other change */
1929 dirty_submodule |= DIRTY_SUBMODULE_MODIFIED;
1932 if ((dirty_submodule & DIRTY_SUBMODULE_MODIFIED) &&
1933 ((dirty_submodule & DIRTY_SUBMODULE_UNTRACKED) ||
1934 ignore_untracked)) {
1936 * We're not interested in any further information from
1937 * the child any more, neither output nor its exit code.
1939 ignore_cp_exit_code = 1;
1940 break;
1943 fclose(fp);
1945 if (finish_command(&cp) && !ignore_cp_exit_code)
1946 die(_("'git status --porcelain=2' failed in submodule %s"), path);
1948 strbuf_release(&buf);
1949 return dirty_submodule;
1952 int submodule_uses_gitfile(const char *path)
1954 struct child_process cp = CHILD_PROCESS_INIT;
1955 struct strbuf buf = STRBUF_INIT;
1956 const char *git_dir;
1958 strbuf_addf(&buf, "%s/.git", path);
1959 git_dir = read_gitfile(buf.buf);
1960 if (!git_dir) {
1961 strbuf_release(&buf);
1962 return 0;
1964 strbuf_release(&buf);
1966 /* Now test that all nested submodules use a gitfile too */
1967 strvec_pushl(&cp.args,
1968 "submodule", "foreach", "--quiet", "--recursive",
1969 "test -f .git", NULL);
1971 prepare_submodule_repo_env(&cp.env);
1972 cp.git_cmd = 1;
1973 cp.no_stdin = 1;
1974 cp.no_stderr = 1;
1975 cp.no_stdout = 1;
1976 cp.dir = path;
1977 if (run_command(&cp))
1978 return 0;
1980 return 1;
1984 * Check if it is a bad idea to remove a submodule, i.e. if we'd lose data
1985 * when doing so.
1987 * Return 1 if we'd lose data, return 0 if the removal is fine,
1988 * and negative values for errors.
1990 int bad_to_remove_submodule(const char *path, unsigned flags)
1992 ssize_t len;
1993 struct child_process cp = CHILD_PROCESS_INIT;
1994 struct strbuf buf = STRBUF_INIT;
1995 int ret = 0;
1997 if (!file_exists(path) || is_empty_dir(path))
1998 return 0;
2000 if (!submodule_uses_gitfile(path))
2001 return 1;
2003 strvec_pushl(&cp.args, "status", "--porcelain",
2004 "--ignore-submodules=none", NULL);
2006 if (flags & SUBMODULE_REMOVAL_IGNORE_UNTRACKED)
2007 strvec_push(&cp.args, "-uno");
2008 else
2009 strvec_push(&cp.args, "-uall");
2011 if (!(flags & SUBMODULE_REMOVAL_IGNORE_IGNORED_UNTRACKED))
2012 strvec_push(&cp.args, "--ignored");
2014 prepare_submodule_repo_env(&cp.env);
2015 cp.git_cmd = 1;
2016 cp.no_stdin = 1;
2017 cp.out = -1;
2018 cp.dir = path;
2019 if (start_command(&cp)) {
2020 if (flags & SUBMODULE_REMOVAL_DIE_ON_ERROR)
2021 die(_("could not start 'git status' in submodule '%s'"),
2022 path);
2023 ret = -1;
2024 goto out;
2027 len = strbuf_read(&buf, cp.out, 1024);
2028 if (len > 2)
2029 ret = 1;
2030 close(cp.out);
2032 if (finish_command(&cp)) {
2033 if (flags & SUBMODULE_REMOVAL_DIE_ON_ERROR)
2034 die(_("could not run 'git status' in submodule '%s'"),
2035 path);
2036 ret = -1;
2038 out:
2039 strbuf_release(&buf);
2040 return ret;
2043 void submodule_unset_core_worktree(const struct submodule *sub)
2045 struct strbuf config_path = STRBUF_INIT;
2047 submodule_name_to_gitdir(&config_path, the_repository, sub->name);
2048 strbuf_addstr(&config_path, "/config");
2050 if (git_config_set_in_file_gently(config_path.buf, "core.worktree", NULL))
2051 warning(_("Could not unset core.worktree setting in submodule '%s'"),
2052 sub->path);
2054 strbuf_release(&config_path);
2057 static int submodule_has_dirty_index(const struct submodule *sub)
2059 struct child_process cp = CHILD_PROCESS_INIT;
2061 prepare_submodule_repo_env(&cp.env);
2063 cp.git_cmd = 1;
2064 strvec_pushl(&cp.args, "diff-index", "--quiet",
2065 "--cached", "HEAD", NULL);
2066 cp.no_stdin = 1;
2067 cp.no_stdout = 1;
2068 cp.dir = sub->path;
2069 if (start_command(&cp))
2070 die(_("could not recurse into submodule '%s'"), sub->path);
2072 return finish_command(&cp);
2075 static void submodule_reset_index(const char *path, const char *super_prefix)
2077 struct child_process cp = CHILD_PROCESS_INIT;
2078 prepare_submodule_repo_env(&cp.env);
2080 cp.git_cmd = 1;
2081 cp.no_stdin = 1;
2082 cp.dir = path;
2084 /* TODO: determine if this might overwright untracked files */
2085 strvec_pushl(&cp.args, "read-tree", "-u", "--reset", NULL);
2086 strvec_pushf(&cp.args, "--super-prefix=%s%s/",
2087 (super_prefix ? super_prefix : ""), path);
2089 strvec_push(&cp.args, empty_tree_oid_hex());
2091 if (run_command(&cp))
2092 die(_("could not reset submodule index"));
2096 * Moves a submodule at a given path from a given head to another new head.
2097 * For edge cases (a submodule coming into existence or removing a submodule)
2098 * pass NULL for old or new respectively.
2100 int submodule_move_head(const char *path, const char *super_prefix,
2101 const char *old_head, const char *new_head,
2102 unsigned flags)
2104 int ret = 0;
2105 struct child_process cp = CHILD_PROCESS_INIT;
2106 const struct submodule *sub;
2107 int *error_code_ptr, error_code;
2109 if (!is_submodule_active(the_repository, path))
2110 return 0;
2112 if (flags & SUBMODULE_MOVE_HEAD_FORCE)
2114 * Pass non NULL pointer to is_submodule_populated_gently
2115 * to prevent die()-ing. We'll use connect_work_tree_and_git_dir
2116 * to fixup the submodule in the force case later.
2118 error_code_ptr = &error_code;
2119 else
2120 error_code_ptr = NULL;
2122 if (old_head && !is_submodule_populated_gently(path, error_code_ptr))
2123 return 0;
2125 sub = submodule_from_path(the_repository, null_oid(), path);
2127 if (!sub)
2128 BUG("could not get submodule information for '%s'", path);
2130 if (old_head && !(flags & SUBMODULE_MOVE_HEAD_FORCE)) {
2131 /* Check if the submodule has a dirty index. */
2132 if (submodule_has_dirty_index(sub))
2133 return error(_("submodule '%s' has dirty index"), path);
2136 if (!(flags & SUBMODULE_MOVE_HEAD_DRY_RUN)) {
2137 if (old_head) {
2138 if (!submodule_uses_gitfile(path))
2139 absorb_git_dir_into_superproject(path,
2140 super_prefix);
2141 } else {
2142 struct strbuf gitdir = STRBUF_INIT;
2143 submodule_name_to_gitdir(&gitdir, the_repository,
2144 sub->name);
2145 connect_work_tree_and_git_dir(path, gitdir.buf, 0);
2146 strbuf_release(&gitdir);
2148 /* make sure the index is clean as well */
2149 submodule_reset_index(path, super_prefix);
2152 if (old_head && (flags & SUBMODULE_MOVE_HEAD_FORCE)) {
2153 struct strbuf gitdir = STRBUF_INIT;
2154 submodule_name_to_gitdir(&gitdir, the_repository,
2155 sub->name);
2156 connect_work_tree_and_git_dir(path, gitdir.buf, 1);
2157 strbuf_release(&gitdir);
2161 prepare_submodule_repo_env(&cp.env);
2163 cp.git_cmd = 1;
2164 cp.no_stdin = 1;
2165 cp.dir = path;
2167 strvec_pushl(&cp.args, "read-tree", "--recurse-submodules", NULL);
2168 strvec_pushf(&cp.args, "--super-prefix=%s%s/",
2169 (super_prefix ? super_prefix : ""), path);
2171 if (flags & SUBMODULE_MOVE_HEAD_DRY_RUN)
2172 strvec_push(&cp.args, "-n");
2173 else
2174 strvec_push(&cp.args, "-u");
2176 if (flags & SUBMODULE_MOVE_HEAD_FORCE)
2177 strvec_push(&cp.args, "--reset");
2178 else
2179 strvec_push(&cp.args, "-m");
2181 if (!(flags & SUBMODULE_MOVE_HEAD_FORCE))
2182 strvec_push(&cp.args, old_head ? old_head : empty_tree_oid_hex());
2184 strvec_push(&cp.args, new_head ? new_head : empty_tree_oid_hex());
2186 if (run_command(&cp)) {
2187 ret = error(_("Submodule '%s' could not be updated."), path);
2188 goto out;
2191 if (!(flags & SUBMODULE_MOVE_HEAD_DRY_RUN)) {
2192 if (new_head) {
2193 child_process_init(&cp);
2194 /* also set the HEAD accordingly */
2195 cp.git_cmd = 1;
2196 cp.no_stdin = 1;
2197 cp.dir = path;
2199 prepare_submodule_repo_env(&cp.env);
2200 strvec_pushl(&cp.args, "update-ref", "HEAD",
2201 "--no-deref", new_head, NULL);
2203 if (run_command(&cp)) {
2204 ret = -1;
2205 goto out;
2207 } else {
2208 struct strbuf sb = STRBUF_INIT;
2210 strbuf_addf(&sb, "%s/.git", path);
2211 unlink_or_warn(sb.buf);
2212 strbuf_release(&sb);
2214 if (is_empty_dir(path))
2215 rmdir_or_warn(path);
2217 submodule_unset_core_worktree(sub);
2220 out:
2221 return ret;
/*
 * Make sure the git directory "git_dir" of the submodule named
 * "submodule_name" is not nested inside another git directory.
 *
 * "git_dir" must end in "/<submodule_name>"; anything else is a BUG().
 * The buffer is modified temporarily while checking but is restored
 * before returning.
 *
 * Returns 0 if the directory is fine, and the (negative) result of
 * error() if a leading part of the name is itself a git directory.
 */
int validate_submodule_git_dir(char *git_dir, const char *submodule_name)
{
	const size_t dir_len = strlen(git_dir);
	const size_t name_len = strlen(submodule_name);
	char *cur = NULL;
	int mismatch = dir_len <= name_len;

	if (!mismatch) {
		cur = git_dir + dir_len - name_len;
		mismatch = cur[-1] != '/' || strcmp(cur, submodule_name) != 0;
	}
	if (mismatch)
		BUG("submodule name '%s' not a suffix of git dir '%s'",
		    submodule_name, git_dir);

	/*
	 * We prevent the contents of sibling submodules' git directories to
	 * clash.
	 *
	 * Example: having a submodule named `hippo` and another one named
	 * `hippo/hooks` would result in the git directories
	 * `.git/modules/hippo/` and `.git/modules/hippo/hooks/`,
	 * respectively, but the latter directory is already designated to
	 * contain the hooks of the former.
	 */
	while (*cur) {
		if (is_dir_sep(*cur)) {
			const char sep = *cur;
			int nested;

			/* cut the path at this separator just for the check */
			*cur = '\0';
			nested = is_git_directory(git_dir);
			*cur = sep;

			if (nested)
				return error(_("submodule git dir '%s' is "
					       "inside git dir '%.*s'"),
					     git_dir,
					     (int)(cur - git_dir), git_dir);
		}
		cur++;
	}

	return 0;
}
2266 * Embeds a single submodules git directory into the superprojects git dir,
2267 * non recursively.
2269 static void relocate_single_git_dir_into_superproject(const char *path,
2270 const char *super_prefix)
2272 char *old_git_dir = NULL, *real_old_git_dir = NULL, *real_new_git_dir = NULL;
2273 struct strbuf new_gitdir = STRBUF_INIT;
2274 const struct submodule *sub;
2276 if (submodule_uses_worktrees(path))
2277 die(_("relocate_gitdir for submodule '%s' with "
2278 "more than one worktree not supported"), path);
2280 old_git_dir = xstrfmt("%s/.git", path);
2281 if (read_gitfile(old_git_dir))
2282 /* If it is an actual gitfile, it doesn't need migration. */
2283 return;
2285 real_old_git_dir = real_pathdup(old_git_dir, 1);
2287 sub = submodule_from_path(the_repository, null_oid(), path);
2288 if (!sub)
2289 die(_("could not lookup name for submodule '%s'"), path);
2291 submodule_name_to_gitdir(&new_gitdir, the_repository, sub->name);
2292 if (validate_submodule_git_dir(new_gitdir.buf, sub->name) < 0)
2293 die(_("refusing to move '%s' into an existing git dir"),
2294 real_old_git_dir);
2295 if (safe_create_leading_directories_const(new_gitdir.buf) < 0)
2296 die(_("could not create directory '%s'"), new_gitdir.buf);
2297 real_new_git_dir = real_pathdup(new_gitdir.buf, 1);
2299 fprintf(stderr, _("Migrating git directory of '%s%s' from\n'%s' to\n'%s'\n"),
2300 super_prefix ? super_prefix : "", path,
2301 real_old_git_dir, real_new_git_dir);
2303 relocate_gitdir(path, real_old_git_dir, real_new_git_dir);
2305 free(old_git_dir);
2306 free(real_old_git_dir);
2307 free(real_new_git_dir);
2308 strbuf_release(&new_gitdir);
2311 static void absorb_git_dir_into_superproject_recurse(const char *path,
2312 const char *super_prefix)
2315 struct child_process cp = CHILD_PROCESS_INIT;
2317 cp.dir = path;
2318 cp.git_cmd = 1;
2319 cp.no_stdin = 1;
2320 strvec_pushl(&cp.args, "submodule--helper",
2321 "absorbgitdirs", NULL);
2322 strvec_pushf(&cp.args, "--super-prefix=%s%s/", super_prefix ?
2323 super_prefix : "", path);
2325 prepare_submodule_repo_env(&cp.env);
2326 if (run_command(&cp))
2327 die(_("could not recurse into submodule '%s'"), path);
2331 * Migrate the git directory of the submodule given by path from
2332 * having its git directory within the working tree to the git dir nested
2333 * in its superprojects git dir under modules/.
2335 void absorb_git_dir_into_superproject(const char *path,
2336 const char *super_prefix)
2338 int err_code;
2339 const char *sub_git_dir;
2340 struct strbuf gitdir = STRBUF_INIT;
2341 strbuf_addf(&gitdir, "%s/.git", path);
2342 sub_git_dir = resolve_gitdir_gently(gitdir.buf, &err_code);
2344 /* Not populated? */
2345 if (!sub_git_dir) {
2346 const struct submodule *sub;
2347 struct strbuf sub_gitdir = STRBUF_INIT;
2349 if (err_code == READ_GITFILE_ERR_STAT_FAILED) {
2350 /* unpopulated as expected */
2351 strbuf_release(&gitdir);
2352 return;
2355 if (err_code != READ_GITFILE_ERR_NOT_A_REPO)
2356 /* We don't know what broke here. */
2357 read_gitfile_error_die(err_code, path, NULL);
2360 * Maybe populated, but no git directory was found?
2361 * This can happen if the superproject is a submodule
2362 * itself and was just absorbed. The absorption of the
2363 * superproject did not rewrite the git file links yet,
2364 * fix it now.
2366 sub = submodule_from_path(the_repository, null_oid(), path);
2367 if (!sub)
2368 die(_("could not lookup name for submodule '%s'"), path);
2369 submodule_name_to_gitdir(&sub_gitdir, the_repository, sub->name);
2370 connect_work_tree_and_git_dir(path, sub_gitdir.buf, 0);
2371 strbuf_release(&sub_gitdir);
2372 } else {
2373 /* Is it already absorbed into the superprojects git dir? */
2374 char *real_sub_git_dir = real_pathdup(sub_git_dir, 1);
2375 char *real_common_git_dir = real_pathdup(get_git_common_dir(), 1);
2377 if (!starts_with(real_sub_git_dir, real_common_git_dir))
2378 relocate_single_git_dir_into_superproject(path, super_prefix);
2380 free(real_sub_git_dir);
2381 free(real_common_git_dir);
2383 strbuf_release(&gitdir);
2385 absorb_git_dir_into_superproject_recurse(path, super_prefix);
2388 int get_superproject_working_tree(struct strbuf *buf)
2390 struct child_process cp = CHILD_PROCESS_INIT;
2391 struct strbuf sb = STRBUF_INIT;
2392 struct strbuf one_up = STRBUF_INIT;
2393 char *cwd = xgetcwd();
2394 int ret = 0;
2395 const char *subpath;
2396 int code;
2397 ssize_t len;
2399 if (!is_inside_work_tree())
2401 * FIXME:
2402 * We might have a superproject, but it is harder
2403 * to determine.
2405 return 0;
2407 if (!strbuf_realpath(&one_up, "../", 0))
2408 return 0;
2410 subpath = relative_path(cwd, one_up.buf, &sb);
2411 strbuf_release(&one_up);
2413 prepare_submodule_repo_env(&cp.env);
2414 strvec_pop(&cp.env);
2416 strvec_pushl(&cp.args, "--literal-pathspecs", "-C", "..",
2417 "ls-files", "-z", "--stage", "--full-name", "--",
2418 subpath, NULL);
2419 strbuf_reset(&sb);
2421 cp.no_stdin = 1;
2422 cp.no_stderr = 1;
2423 cp.out = -1;
2424 cp.git_cmd = 1;
2426 if (start_command(&cp))
2427 die(_("could not start ls-files in .."));
2429 len = strbuf_read(&sb, cp.out, PATH_MAX);
2430 close(cp.out);
2432 if (starts_with(sb.buf, "160000")) {
2433 int super_sub_len;
2434 int cwd_len = strlen(cwd);
2435 char *super_sub, *super_wt;
2438 * There is a superproject having this repo as a submodule.
2439 * The format is <mode> SP <hash> SP <stage> TAB <full name> \0,
2440 * We're only interested in the name after the tab.
2442 super_sub = strchr(sb.buf, '\t') + 1;
2443 super_sub_len = strlen(super_sub);
2445 if (super_sub_len > cwd_len ||
2446 strcmp(&cwd[cwd_len - super_sub_len], super_sub))
2447 BUG("returned path string doesn't match cwd?");
2449 super_wt = xstrdup(cwd);
2450 super_wt[cwd_len - super_sub_len] = '\0';
2452 strbuf_realpath(buf, super_wt, 1);
2453 ret = 1;
2454 free(super_wt);
2456 free(cwd);
2457 strbuf_release(&sb);
2459 code = finish_command(&cp);
2461 if (code == 128)
2462 /* '../' is not a git repository */
2463 return 0;
2464 if (code == 0 && len == 0)
2465 /* There is an unrelated git repository at '../' */
2466 return 0;
2467 if (code)
2468 die(_("ls-tree returned unexpected return code %d"), code);
2470 return ret;
2474 * Put the gitdir for a submodule (given relative to the main
2475 * repository worktree) into `buf`, or return -1 on error.
2477 int submodule_to_gitdir(struct strbuf *buf, const char *submodule)
2479 const struct submodule *sub;
2480 const char *git_dir;
2481 int ret = 0;
2483 strbuf_reset(buf);
2484 strbuf_addstr(buf, submodule);
2485 strbuf_complete(buf, '/');
2486 strbuf_addstr(buf, ".git");
2488 git_dir = read_gitfile(buf->buf);
2489 if (git_dir) {
2490 strbuf_reset(buf);
2491 strbuf_addstr(buf, git_dir);
2493 if (!is_git_directory(buf->buf)) {
2494 sub = submodule_from_path(the_repository, null_oid(),
2495 submodule);
2496 if (!sub) {
2497 ret = -1;
2498 goto cleanup;
2500 strbuf_reset(buf);
2501 submodule_name_to_gitdir(buf, the_repository, sub->name);
2504 cleanup:
2505 return ret;
/*
 * Append to `buf` the git path "modules/" of repository `r`, followed
 * by `submodule_name`.
 */
void submodule_name_to_gitdir(struct strbuf *buf, struct repository *r,
			      const char *submodule_name)
{
	/*
	 * NEEDSWORK: Mapping a submodule's name straight to a location
	 * under .git/modules/ breaks down for some naming schemes. Two
	 * examples: one submodule named "foo" and another named
	 * "foo/bar" (even if they never appear in the same superproject
	 * commit -- it is enough that both commits were checked out at
	 * some point), or two names that differ only in case on a
	 * case-insensitive filesystem.
	 *
	 * Possible solutions include:
	 *  - encoding the path in some way;
	 *  - a submodule.<name>.gitdir config in .git/config (not
	 *    .gitmodules) that overrides the gitdir of a submodule,
	 *    with Git picking a non-clashing name and writing that
	 *    config automatically when it notices a clash;
	 *  - a submodule.<name>.gitdir config in .gitmodules that repo
	 *    administrators can set explicitly.
	 *
	 * Nothing has been decided, so for now just append the name at
	 * the end of the path.
	 */
	strbuf_repo_git_path(buf, r, "modules/");
	strbuf_addstr(buf, submodule_name);
}