]> git.ipfire.org Git - thirdparty/git.git/blob - submodule.c
ead3fb5dadca3a8689453df52ac0a414dd22df1e
[thirdparty/git.git] / submodule.c
1 #define USE_THE_REPOSITORY_VARIABLE
2 #define DISABLE_SIGN_COMPARE_WARNINGS
3
4 #include "git-compat-util.h"
5 #include "abspath.h"
6 #include "repository.h"
7 #include "config.h"
8 #include "submodule-config.h"
9 #include "submodule.h"
10 #include "dir.h"
11 #include "diff.h"
12 #include "commit.h"
13 #include "environment.h"
14 #include "gettext.h"
15 #include "hex.h"
16 #include "revision.h"
17 #include "run-command.h"
18 #include "diffcore.h"
19 #include "refs.h"
20 #include "string-list.h"
21 #include "oid-array.h"
22 #include "strvec.h"
23 #include "thread-utils.h"
24 #include "path.h"
25 #include "remote.h"
26 #include "worktree.h"
27 #include "parse-options.h"
28 #include "object-file.h"
29 #include "object-name.h"
30 #include "object-store.h"
31 #include "commit-reach.h"
32 #include "read-cache-ll.h"
33 #include "setup.h"
34 #include "trace2.h"
35
/*
 * File-wide "recurse into submodules" setting. It starts out disabled and is
 * changed by git_default_submodule_config() and
 * option_parse_recurse_submodules_worktree_updater(); it is queried through
 * should_update_submodules().
 */
static int config_update_recurse_submodules = RECURSE_SUBMODULES_OFF;
/*
 * Bookkeeping for ref tips around a fetch.
 * NOTE(review): the code that fills and reads these three variables is not
 * part of this section of the file; confirm their exact meaning there.
 */
static int initialized_fetch_ref_tips;
static struct oid_array ref_tips_before_fetch;
static struct oid_array ref_tips_after_fetch;
40
41 /*
42 * Check if the .gitmodules file is unmerged. Parsing of the .gitmodules file
43 * will be disabled because we can't guess what might be configured in
44 * .gitmodules unless the user resolves the conflict.
45 */
46 int is_gitmodules_unmerged(struct index_state *istate)
47 {
48 int pos = index_name_pos(istate, GITMODULES_FILE, strlen(GITMODULES_FILE));
49 if (pos < 0) { /* .gitmodules not found or isn't merged */
50 pos = -1 - pos;
51 if (istate->cache_nr > pos) { /* there is a .gitmodules */
52 const struct cache_entry *ce = istate->cache[pos];
53 if (ce_namelen(ce) == strlen(GITMODULES_FILE) &&
54 !strcmp(ce->name, GITMODULES_FILE))
55 return 1;
56 }
57 }
58
59 return 0;
60 }
61
62 /*
63 * Check if the .gitmodules file is safe to write.
64 *
65 * Writing to the .gitmodules file requires that the file exists in the
66 * working tree or, if it doesn't, that a brand new .gitmodules file is going
67 * to be created (i.e. it's neither in the index nor in the current branch).
68 *
69 * It is not safe to write to .gitmodules if it's not in the working tree but
70 * it is in the index or in the current branch, because writing new values
71 * (and staging them) would blindly overwrite ALL the old content.
72 */
73 int is_writing_gitmodules_ok(void)
74 {
75 struct object_id oid;
76 return file_exists(GITMODULES_FILE) ||
77 (repo_get_oid(the_repository, GITMODULES_INDEX, &oid) < 0 && repo_get_oid(the_repository, GITMODULES_HEAD, &oid) < 0);
78 }
79
80 /*
81 * Check if the .gitmodules file has unstaged modifications. This must be
82 * checked before allowing modifications to the .gitmodules file with the
83 * intention to stage them later, because when continuing we would stage the
84 * modifications the user didn't stage herself too. That might change in a
85 * future version when we learn to stage the changes we do ourselves without
86 * staging any previous modifications.
87 */
88 int is_staging_gitmodules_ok(struct index_state *istate)
89 {
90 int pos = index_name_pos(istate, GITMODULES_FILE, strlen(GITMODULES_FILE));
91
92 if ((pos >= 0) && (pos < istate->cache_nr)) {
93 struct stat st;
94 if (lstat(GITMODULES_FILE, &st) == 0 &&
95 ie_modified(istate, istate->cache[pos], &st, 0) & DATA_CHANGED)
96 return 0;
97 }
98
99 return 1;
100 }
101
/*
 * Forward to refs_for_each_remote_ref() using the ref store that
 * repo_get_submodule_ref_store() hands out for 'submodule' within
 * the_repository. 'fn' and 'cb_data' are passed through untouched and the
 * callee's return value is returned as is.
 */
static int for_each_remote_ref_submodule(const char *submodule,
					 each_ref_fn fn, void *cb_data)
{
	return refs_for_each_remote_ref(repo_get_submodule_ref_store(the_repository,
								    submodule),
					fn, cb_data);
}
109
110 /*
111 * Try to update the "path" entry in the "submodule.<name>" section of the
112 * .gitmodules file. Return 0 only if a .gitmodules file was found, a section
113 * with the correct path=<oldpath> setting was found and we could update it.
114 */
115 int update_path_in_gitmodules(const char *oldpath, const char *newpath)
116 {
117 struct strbuf entry = STRBUF_INIT;
118 const struct submodule *submodule;
119 int ret;
120
121 if (!file_exists(GITMODULES_FILE)) /* Do nothing without .gitmodules */
122 return -1;
123
124 if (is_gitmodules_unmerged(the_repository->index))
125 die(_("Cannot change unmerged .gitmodules, resolve merge conflicts first"));
126
127 submodule = submodule_from_path(the_repository, null_oid(the_hash_algo), oldpath);
128 if (!submodule || !submodule->name) {
129 warning(_("Could not find section in .gitmodules where path=%s"), oldpath);
130 return -1;
131 }
132 strbuf_addstr(&entry, "submodule.");
133 strbuf_addstr(&entry, submodule->name);
134 strbuf_addstr(&entry, ".path");
135 ret = config_set_in_gitmodules_file_gently(entry.buf, newpath);
136 strbuf_release(&entry);
137 return ret;
138 }
139
140 /*
141 * Try to remove the "submodule.<name>" section from .gitmodules where the given
142 * path is configured. Return 0 only if a .gitmodules file was found, a section
143 * with the correct path=<path> setting was found and we could remove it.
144 */
145 int remove_path_from_gitmodules(const char *path)
146 {
147 struct strbuf sect = STRBUF_INIT;
148 const struct submodule *submodule;
149
150 if (!file_exists(GITMODULES_FILE)) /* Do nothing without .gitmodules */
151 return -1;
152
153 if (is_gitmodules_unmerged(the_repository->index))
154 die(_("Cannot change unmerged .gitmodules, resolve merge conflicts first"));
155
156 submodule = submodule_from_path(the_repository, null_oid(the_hash_algo), path);
157 if (!submodule || !submodule->name) {
158 warning(_("Could not find section in .gitmodules where path=%s"), path);
159 return -1;
160 }
161 strbuf_addstr(&sect, "submodule.");
162 strbuf_addstr(&sect, submodule->name);
163 if (repo_config_rename_section_in_file(the_repository, GITMODULES_FILE, sect.buf, NULL) < 0) {
164 /* Maybe the user already did that, don't error out here */
165 warning(_("Could not remove .gitmodules entry for %s"), path);
166 strbuf_release(&sect);
167 return -1;
168 }
169 strbuf_release(&sect);
170 return 0;
171 }
172
173 void stage_updated_gitmodules(struct index_state *istate)
174 {
175 if (add_file_to_index(istate, GITMODULES_FILE, 0))
176 die(_("staging updated .gitmodules failed"));
177 }
178
/*
 * Paths queued by add_submodule_odb_by_path() and consumed (then cleared)
 * by register_all_submodule_odb_as_alternates(). The list duplicates the
 * strings it is given (STRING_LIST_INIT_DUP).
 */
static struct string_list added_submodule_odb_paths = STRING_LIST_INIT_DUP;

/*
 * Remember 'path' so that a later call to
 * register_all_submodule_odb_as_alternates() passes it to
 * add_to_alternates_memory().
 */
void add_submodule_odb_by_path(const char *path)
{
	string_list_insert(&added_submodule_odb_paths, path);
}
185
186 int register_all_submodule_odb_as_alternates(void)
187 {
188 int i;
189 int ret = added_submodule_odb_paths.nr;
190
191 for (i = 0; i < added_submodule_odb_paths.nr; i++)
192 add_to_alternates_memory(added_submodule_odb_paths.items[i].string);
193 if (ret) {
194 string_list_clear(&added_submodule_odb_paths, 0);
195 trace2_data_intmax("submodule", the_repository,
196 "register_all_submodule_odb_as_alternates/registered", ret);
197 if (git_env_bool("GIT_TEST_FATAL_REGISTER_SUBMODULE_ODB", 0))
198 BUG("register_all_submodule_odb_as_alternates() called");
199 }
200 return ret;
201 }
202
203 void set_diffopt_flags_from_submodule_config(struct diff_options *diffopt,
204 const char *path)
205 {
206 const struct submodule *submodule = submodule_from_path(the_repository,
207 null_oid(the_hash_algo),
208 path);
209 if (submodule) {
210 const char *ignore;
211 char *key;
212
213 key = xstrfmt("submodule.%s.ignore", submodule->name);
214 if (repo_config_get_string_tmp(the_repository, key, &ignore))
215 ignore = submodule->ignore;
216 free(key);
217
218 if (ignore)
219 handle_ignore_submodules_arg(diffopt, ignore);
220 else if (is_gitmodules_unmerged(the_repository->index))
221 diffopt->flags.ignore_submodules = 1;
222 }
223 }
224
225 /* Cheap function that only determines if we're interested in submodules at all */
226 int git_default_submodule_config(const char *var, const char *value,
227 void *cb UNUSED)
228 {
229 if (!strcmp(var, "submodule.recurse")) {
230 int v = git_config_bool(var, value) ?
231 RECURSE_SUBMODULES_ON : RECURSE_SUBMODULES_OFF;
232 config_update_recurse_submodules = v;
233 }
234 return 0;
235 }
236
237 int option_parse_recurse_submodules_worktree_updater(const struct option *opt,
238 const char *arg, int unset)
239 {
240 if (unset) {
241 config_update_recurse_submodules = RECURSE_SUBMODULES_OFF;
242 return 0;
243 }
244 if (arg)
245 config_update_recurse_submodules =
246 parse_update_recurse_submodules_arg(opt->long_name,
247 arg);
248 else
249 config_update_recurse_submodules = RECURSE_SUBMODULES_ON;
250
251 return 0;
252 }
253
254 /*
255 * Determine if a submodule has been initialized at a given 'path'
256 */
257 /*
258 * NEEDSWORK: Emit a warning if submodule.active exists, but is valueless,
259 * ie, the config looks like: "[submodule] active\n".
260 * Since that is an invalid pathspec, we should inform the user.
261 */
262 int is_tree_submodule_active(struct repository *repo,
263 const struct object_id *treeish_name,
264 const char *path)
265 {
266 int ret = 0;
267 char *key = NULL;
268 char *value = NULL;
269 const struct string_list *sl;
270 const struct submodule *module;
271
272 module = submodule_from_path(repo, treeish_name, path);
273
274 /* early return if there isn't a path->module mapping */
275 if (!module)
276 return 0;
277
278 /* submodule.<name>.active is set */
279 key = xstrfmt("submodule.%s.active", module->name);
280 if (!repo_config_get_bool(repo, key, &ret)) {
281 free(key);
282 return ret;
283 }
284 free(key);
285
286 /* submodule.active is set */
287 if (!repo_config_get_string_multi(repo, "submodule.active", &sl)) {
288 struct pathspec ps;
289 struct strvec args = STRVEC_INIT;
290 const struct string_list_item *item;
291
292 for_each_string_list_item(item, sl) {
293 strvec_push(&args, item->string);
294 }
295
296 parse_pathspec(&ps, 0, 0, NULL, args.v);
297 ret = match_pathspec(repo->index, &ps, path, strlen(path), 0, NULL, 1);
298
299 strvec_clear(&args);
300 clear_pathspec(&ps);
301 return ret;
302 }
303
304 /* fallback to checking if the URL is set */
305 key = xstrfmt("submodule.%s.url", module->name);
306 ret = !repo_config_get_string(repo, key, &value);
307
308 free(value);
309 free(key);
310 return ret;
311 }
312
313 int is_submodule_active(struct repository *repo, const char *path)
314 {
315 return is_tree_submodule_active(repo, null_oid(the_hash_algo), path);
316 }
317
/*
 * Check whether "<path>/.git" can be resolved by resolve_gitdir_gently().
 * 'return_error_code' is handed straight to that function.
 *
 * Returns 1 if it resolved, 0 otherwise.
 */
int is_submodule_populated_gently(const char *path, int *return_error_code)
{
	char *dotgit = xstrfmt("%s/.git", path);
	int populated = resolve_gitdir_gently(dotgit, return_error_code) ? 1 : 0;

	free(dotgit);
	return populated;
}
329
330 /*
331 * Dies if the provided 'prefix' corresponds to an unpopulated submodule
332 */
333 void die_in_unpopulated_submodule(struct index_state *istate,
334 const char *prefix)
335 {
336 int i, prefixlen;
337
338 if (!prefix)
339 return;
340
341 prefixlen = strlen(prefix);
342
343 for (i = 0; i < istate->cache_nr; i++) {
344 struct cache_entry *ce = istate->cache[i];
345 int ce_len = ce_namelen(ce);
346
347 if (!S_ISGITLINK(ce->ce_mode))
348 continue;
349 if (prefixlen <= ce_len)
350 continue;
351 if (strncmp(ce->name, prefix, ce_len))
352 continue;
353 if (prefix[ce_len] != '/')
354 continue;
355
356 die(_("in unpopulated submodule '%s'"), ce->name);
357 }
358 }
359
360 /*
361 * Dies if any paths in the provided pathspec descends into a submodule
362 */
363 void die_path_inside_submodule(struct index_state *istate,
364 const struct pathspec *ps)
365 {
366 int i, j;
367
368 for (i = 0; i < istate->cache_nr; i++) {
369 struct cache_entry *ce = istate->cache[i];
370 int ce_len = ce_namelen(ce);
371
372 if (!S_ISGITLINK(ce->ce_mode))
373 continue;
374
375 for (j = 0; j < ps->nr ; j++) {
376 const struct pathspec_item *item = &ps->items[j];
377
378 if (item->len <= ce_len)
379 continue;
380 if (item->match[ce_len] != '/')
381 continue;
382 if (strncmp(ce->name, item->match, ce_len))
383 continue;
384 if (item->len == ce_len + 1)
385 continue;
386
387 die(_("Pathspec '%s' is in submodule '%.*s'"),
388 item->original, ce_len, ce->name);
389 }
390 }
391 }
392
393 enum submodule_update_type parse_submodule_update_type(const char *value)
394 {
395 if (!strcmp(value, "none"))
396 return SM_UPDATE_NONE;
397 else if (!strcmp(value, "checkout"))
398 return SM_UPDATE_CHECKOUT;
399 else if (!strcmp(value, "rebase"))
400 return SM_UPDATE_REBASE;
401 else if (!strcmp(value, "merge"))
402 return SM_UPDATE_MERGE;
403 else if (*value == '!')
404 return SM_UPDATE_COMMAND;
405 else
406 return SM_UPDATE_UNSPECIFIED;
407 }
408
409 int parse_submodule_update_strategy(const char *value,
410 struct submodule_update_strategy *dst)
411 {
412 enum submodule_update_type type;
413
414 free((void*)dst->command);
415 dst->command = NULL;
416
417 type = parse_submodule_update_type(value);
418 if (type == SM_UPDATE_UNSPECIFIED)
419 return -1;
420
421 dst->type = type;
422 if (type == SM_UPDATE_COMMAND)
423 dst->command = xstrdup(value + 1);
424
425 return 0;
426 }
427
428 void submodule_update_strategy_release(struct submodule_update_strategy *strategy)
429 {
430 free((char *) strategy->command);
431 }
432
433 const char *submodule_update_type_to_string(enum submodule_update_type type)
434 {
435 switch (type) {
436 case SM_UPDATE_CHECKOUT:
437 return "checkout";
438 case SM_UPDATE_MERGE:
439 return "merge";
440 case SM_UPDATE_REBASE:
441 return "rebase";
442 case SM_UPDATE_NONE:
443 return "none";
444 case SM_UPDATE_UNSPECIFIED:
445 case SM_UPDATE_COMMAND:
446 BUG("init_submodule() should handle type %d", type);
447 default:
448 BUG("unexpected update strategy type: %d", type);
449 }
450 }
451
452 void handle_ignore_submodules_arg(struct diff_options *diffopt,
453 const char *arg)
454 {
455 diffopt->flags.ignore_submodule_set = 1;
456 diffopt->flags.ignore_submodules = 0;
457 diffopt->flags.ignore_untracked_in_submodules = 0;
458 diffopt->flags.ignore_dirty_submodules = 0;
459
460 if (!strcmp(arg, "all"))
461 diffopt->flags.ignore_submodules = 1;
462 else if (!strcmp(arg, "untracked"))
463 diffopt->flags.ignore_untracked_in_submodules = 1;
464 else if (!strcmp(arg, "dirty"))
465 diffopt->flags.ignore_dirty_submodules = 1;
466 else if (strcmp(arg, "none"))
467 die(_("bad --ignore-submodules argument: %s"), arg);
468 /*
469 * Please update _git_status() in git-completion.bash when you
470 * add new options
471 */
472 }
473
474 static int prepare_submodule_diff_summary(struct repository *r, struct rev_info *rev,
475 const char *path,
476 struct commit *left, struct commit *right,
477 struct commit_list *merge_bases)
478 {
479 struct commit_list *list;
480
481 repo_init_revisions(r, rev, NULL);
482 setup_revisions(0, NULL, rev, NULL);
483 rev->left_right = 1;
484 rev->first_parent_only = 1;
485 left->object.flags |= SYMMETRIC_LEFT;
486 add_pending_object(rev, &left->object, path);
487 add_pending_object(rev, &right->object, path);
488 for (list = merge_bases; list; list = list->next) {
489 list->item->object.flags |= UNINTERESTING;
490 add_pending_object(rev, &list->item->object,
491 oid_to_hex(&list->item->object.oid));
492 }
493 return prepare_revision_walk(rev);
494 }
495
496 static void print_submodule_diff_summary(struct repository *r, struct rev_info *rev, struct diff_options *o)
497 {
498 static const char format[] = " %m %s";
499 struct strbuf sb = STRBUF_INIT;
500 struct commit *commit;
501
502 while ((commit = get_revision(rev))) {
503 struct pretty_print_context ctx = {0};
504 ctx.date_mode = rev->date_mode;
505 ctx.output_encoding = get_log_output_encoding();
506 strbuf_setlen(&sb, 0);
507 repo_format_commit_message(r, commit, format, &sb,
508 &ctx);
509 strbuf_addch(&sb, '\n');
510 if (commit->object.flags & SYMMETRIC_LEFT)
511 diff_emit_submodule_del(o, sb.buf);
512 else
513 diff_emit_submodule_add(o, sb.buf);
514 }
515 strbuf_release(&sb);
516 }
517
/*
 * Fill 'out' via prepare_other_repo_env(), passing
 * DEFAULT_GIT_DIR_ENVIRONMENT as the second argument.
 */
void prepare_submodule_repo_env(struct strvec *out)
{
	prepare_other_repo_env(out, DEFAULT_GIT_DIR_ENVIRONMENT);
}
522
/*
 * Like prepare_submodule_repo_env(), but passes "." as the second argument
 * to prepare_other_repo_env() -- presumably for commands that are run from
 * inside the submodule's git directory (TODO confirm against callers).
 */
static void prepare_submodule_repo_env_in_gitdir(struct strvec *out)
{
	prepare_other_repo_env(out, ".");
}
527
528 /*
529 * Initialize a repository struct for a submodule based on the provided 'path'.
530 *
531 * Returns the repository struct on success,
532 * NULL when the submodule is not present.
533 */
534 static struct repository *open_submodule(const char *path)
535 {
536 struct strbuf sb = STRBUF_INIT;
537 struct repository *out = xmalloc(sizeof(*out));
538
539 if (submodule_to_gitdir(the_repository, &sb, path) ||
540 repo_init(out, sb.buf, NULL)) {
541 strbuf_release(&sb);
542 free(out);
543 return NULL;
544 }
545
546 /* Mark it as a submodule */
547 out->submodule_prefix = xstrdup(path);
548
549 strbuf_release(&sb);
550 return out;
551 }
552
553 /*
554 * Helper function to display the submodule header line prior to the full
555 * summary output.
556 *
557 * If it can locate the submodule git directory it will create a repository
558 * handle for the submodule and lookup both the left and right commits and
559 * put them into the left and right pointers.
560 */
561 static void show_submodule_header(struct diff_options *o,
562 const char *path,
563 struct object_id *one, struct object_id *two,
564 unsigned dirty_submodule,
565 struct repository *sub,
566 struct commit **left, struct commit **right,
567 struct commit_list **merge_bases)
568 {
569 const char *message = NULL;
570 struct strbuf sb = STRBUF_INIT;
571 int fast_forward = 0, fast_backward = 0;
572
573 if (dirty_submodule & DIRTY_SUBMODULE_UNTRACKED)
574 diff_emit_submodule_untracked(o, path);
575
576 if (dirty_submodule & DIRTY_SUBMODULE_MODIFIED)
577 diff_emit_submodule_modified(o, path);
578
579 if (is_null_oid(one))
580 message = "(new submodule)";
581 else if (is_null_oid(two))
582 message = "(submodule deleted)";
583
584 if (!sub) {
585 if (!message)
586 message = "(commits not present)";
587 goto output_header;
588 }
589
590 /*
591 * Attempt to lookup the commit references, and determine if this is
592 * a fast forward or fast backwards update.
593 */
594 *left = lookup_commit_reference(sub, one);
595 *right = lookup_commit_reference(sub, two);
596
597 /*
598 * Warn about missing commits in the submodule project, but only if
599 * they aren't null.
600 */
601 if ((!is_null_oid(one) && !*left) ||
602 (!is_null_oid(two) && !*right))
603 message = "(commits not present)";
604
605 *merge_bases = NULL;
606 if (repo_get_merge_bases(sub, *left, *right, merge_bases) < 0) {
607 message = "(corrupt repository)";
608 goto output_header;
609 }
610
611 if (*merge_bases) {
612 if ((*merge_bases)->item == *left)
613 fast_forward = 1;
614 else if ((*merge_bases)->item == *right)
615 fast_backward = 1;
616 }
617
618 if (oideq(one, two)) {
619 strbuf_release(&sb);
620 return;
621 }
622
623 output_header:
624 strbuf_addf(&sb, "Submodule %s ", path);
625 strbuf_add_unique_abbrev(&sb, one, DEFAULT_ABBREV);
626 strbuf_addstr(&sb, (fast_backward || fast_forward) ? ".." : "...");
627 strbuf_add_unique_abbrev(&sb, two, DEFAULT_ABBREV);
628 if (message)
629 strbuf_addf(&sb, " %s\n", message);
630 else
631 strbuf_addf(&sb, "%s:\n", fast_backward ? " (rewind)" : "");
632 diff_emit_submodule_header(o, sb.buf);
633
634 strbuf_release(&sb);
635 }
636
637 void show_submodule_diff_summary(struct diff_options *o, const char *path,
638 struct object_id *one, struct object_id *two,
639 unsigned dirty_submodule)
640 {
641 struct rev_info rev = REV_INFO_INIT;
642 struct commit *left = NULL, *right = NULL;
643 struct commit_list *merge_bases = NULL;
644 struct repository *sub;
645
646 sub = open_submodule(path);
647 show_submodule_header(o, path, one, two, dirty_submodule,
648 sub, &left, &right, &merge_bases);
649
650 /*
651 * If we don't have both a left and a right pointer, there is no
652 * reason to try and display a summary. The header line should contain
653 * all the information the user needs.
654 */
655 if (!left || !right || !sub)
656 goto out;
657
658 /* Treat revision walker failure the same as missing commits */
659 if (prepare_submodule_diff_summary(sub, &rev, path, left, right, merge_bases)) {
660 diff_emit_submodule_error(o, "(revision walker failed)\n");
661 goto out;
662 }
663
664 print_submodule_diff_summary(sub, &rev, o);
665
666 out:
667 free_commit_list(merge_bases);
668 release_revisions(&rev);
669 clear_commit_marks(left, ~0);
670 clear_commit_marks(right, ~0);
671 if (sub) {
672 repo_clear(sub);
673 free(sub);
674 }
675 }
676
677 void show_submodule_inline_diff(struct diff_options *o, const char *path,
678 struct object_id *one, struct object_id *two,
679 unsigned dirty_submodule)
680 {
681 const struct object_id *old_oid = the_hash_algo->empty_tree, *new_oid = the_hash_algo->empty_tree;
682 struct commit *left = NULL, *right = NULL;
683 struct commit_list *merge_bases = NULL;
684 struct child_process cp = CHILD_PROCESS_INIT;
685 struct strbuf sb = STRBUF_INIT;
686 struct repository *sub;
687
688 sub = open_submodule(path);
689 show_submodule_header(o, path, one, two, dirty_submodule,
690 sub, &left, &right, &merge_bases);
691
692 /* We need a valid left and right commit to display a difference */
693 if (!(left || is_null_oid(one)) ||
694 !(right || is_null_oid(two)))
695 goto done;
696
697 if (left)
698 old_oid = one;
699 if (right)
700 new_oid = two;
701
702 cp.git_cmd = 1;
703 cp.dir = path;
704 cp.out = -1;
705 cp.no_stdin = 1;
706
707 /* TODO: other options may need to be passed here. */
708 strvec_pushl(&cp.args, "diff", "--submodule=diff", NULL);
709 strvec_pushf(&cp.args, "--color=%s", want_color(o->use_color) ?
710 "always" : "never");
711
712 if (o->flags.reverse_diff) {
713 strvec_pushf(&cp.args, "--src-prefix=%s%s/",
714 o->b_prefix, path);
715 strvec_pushf(&cp.args, "--dst-prefix=%s%s/",
716 o->a_prefix, path);
717 } else {
718 strvec_pushf(&cp.args, "--src-prefix=%s%s/",
719 o->a_prefix, path);
720 strvec_pushf(&cp.args, "--dst-prefix=%s%s/",
721 o->b_prefix, path);
722 }
723 strvec_push(&cp.args, oid_to_hex(old_oid));
724 /*
725 * If the submodule has modified content, we will diff against the
726 * work tree, under the assumption that the user has asked for the
727 * diff format and wishes to actually see all differences even if they
728 * haven't yet been committed to the submodule yet.
729 */
730 if (!(dirty_submodule & DIRTY_SUBMODULE_MODIFIED))
731 strvec_push(&cp.args, oid_to_hex(new_oid));
732
733 prepare_submodule_repo_env(&cp.env);
734
735 if (!is_directory(path)) {
736 /* fall back to absorbed git dir, if any */
737 if (!sub)
738 goto done;
739 cp.dir = sub->gitdir;
740 strvec_push(&cp.env, GIT_DIR_ENVIRONMENT "=.");
741 strvec_push(&cp.env, GIT_WORK_TREE_ENVIRONMENT "=.");
742 }
743
744 if (start_command(&cp)) {
745 diff_emit_submodule_error(o, "(diff failed)\n");
746 goto done;
747 }
748
749 while (strbuf_getwholeline_fd(&sb, cp.out, '\n') != EOF)
750 diff_emit_submodule_pipethrough(o, sb.buf, sb.len);
751
752 if (finish_command(&cp))
753 diff_emit_submodule_error(o, "(diff failed)\n");
754
755 done:
756 strbuf_release(&sb);
757 free_commit_list(merge_bases);
758 if (left)
759 clear_commit_marks(left, ~0);
760 if (right)
761 clear_commit_marks(right, ~0);
762 if (sub) {
763 repo_clear(sub);
764 free(sub);
765 }
766 }
767
/*
 * Returns non-zero iff the file-wide recurse setting is exactly
 * RECURSE_SUBMODULES_ON.
 */
int should_update_submodules(void)
{
	return config_update_recurse_submodules == RECURSE_SUBMODULES_ON;
}
772
773 const struct submodule *submodule_from_ce(const struct cache_entry *ce)
774 {
775 if (!S_ISGITLINK(ce->ce_mode))
776 return NULL;
777
778 if (!should_update_submodules())
779 return NULL;
780
781 return submodule_from_path(the_repository, null_oid(the_hash_algo), ce->name);
782 }
783
784
/*
 * Context handed to collect_changed_submodules_cb() through the diff
 * machinery's callback data pointer.
 */
struct collect_changed_submodules_cb_data {
	/* repository used for the submodule config lookups */
	struct repository *repo;
	/* list (keyed by submodule name) that receives the results */
	struct string_list *changed;
	/* superproject commit whose diff is currently being processed */
	const struct object_id *commit_oid;
};
790
/*
 * This would normally be two functions: default_name_from_path() and
 * path_from_default_name(). Since the default name is the same as the
 * submodule path, a single function is enough; all it does is check
 * whether a populated submodule exists in the working directory at that
 * location.
 *
 * Returns its argument if so, NULL otherwise.
 */
static const char *default_name_or_path(const char *path_or_name)
{
	int ignored_error;

	return is_submodule_populated_gently(path_or_name, &ignored_error) ?
		path_or_name : NULL;
}
807
808 /*
809 * Holds relevant information for a changed submodule. Used as the .util
810 * member of the changed submodule name string_list_item.
811 *
812 * (super_oid, path) allows the submodule config to be read from _some_
813 * .gitmodules file. We store this information the first time we find a
814 * superproject commit that points to the submodule, but this is
815 * arbitrary - we can choose any (super_oid, path) that matches the
816 * submodule's name.
817 *
818 * NEEDSWORK: Storing an arbitrary commit is undesirable because we can't
819 * guarantee that we're reading the commit that the user would expect. A better
820 * scheme would be to just fetch a submodule by its name. This requires two
821 * steps:
822 * - Create a function that behaves like repo_submodule_init(), but accepts a
823 * submodule name instead of treeish_name and path. This should be easy
824 * because repo_submodule_init() internally uses the submodule's name.
825 *
826 * - Replace most instances of 'struct submodule' (which is the .gitmodules
827 * config) with just the submodule name. This is OK because we expect
828 * submodule settings to be stored in .git/config (via "git submodule init"),
829 * not .gitmodules. This also lets us delete get_non_gitmodules_submodule(),
830 * which constructs a bogus 'struct submodule' for the sake of giving a
831 * placeholder name to a gitlink.
832 */
struct changed_submodule_data {
	/*
	 * The first superproject commit in the rev walk that points to
	 * the submodule. This is a borrowed pointer:
	 * changed_submodule_data_clear() does not free it.
	 */
	const struct object_id *super_oid;
	/*
	 * Path to the submodule in the superproject commit referenced
	 * by 'super_oid'. Owned by this struct (freed on clear).
	 */
	char *path;
	/* The submodule commits that have changed in the rev walk. */
	struct oid_array new_commits;
};
847
848 static void changed_submodule_data_clear(struct changed_submodule_data *cs_data)
849 {
850 oid_array_clear(&cs_data->new_commits);
851 free(cs_data->path);
852 }
853
854 static void collect_changed_submodules_cb(struct diff_queue_struct *q,
855 struct diff_options *options UNUSED,
856 void *data)
857 {
858 struct collect_changed_submodules_cb_data *me = data;
859 struct string_list *changed = me->changed;
860 const struct object_id *commit_oid = me->commit_oid;
861 int i;
862
863 for (i = 0; i < q->nr; i++) {
864 struct diff_filepair *p = q->queue[i];
865 const struct submodule *submodule;
866 const char *name;
867 struct string_list_item *item;
868 struct changed_submodule_data *cs_data;
869
870 if (!S_ISGITLINK(p->two->mode))
871 continue;
872
873 submodule = submodule_from_path(me->repo,
874 commit_oid, p->two->path);
875 if (submodule)
876 name = submodule->name;
877 else {
878 name = default_name_or_path(p->two->path);
879 /* make sure name does not collide with existing one */
880 if (name)
881 submodule = submodule_from_name(me->repo,
882 commit_oid, name);
883 if (submodule) {
884 warning(_("Submodule in commit %s at path: "
885 "'%s' collides with a submodule named "
886 "the same. Skipping it."),
887 oid_to_hex(commit_oid), p->two->path);
888 name = NULL;
889 }
890 }
891
892 if (!name)
893 continue;
894
895 item = string_list_insert(changed, name);
896 if (item->util)
897 cs_data = item->util;
898 else {
899 item->util = xcalloc(1, sizeof(struct changed_submodule_data));
900 cs_data = item->util;
901 cs_data->super_oid = commit_oid;
902 cs_data->path = xstrdup(p->two->path);
903 }
904 oid_array_append(&cs_data->new_commits, &p->two->oid);
905 }
906 }
907
908 /*
909 * Collect the paths of submodules in 'changed' which have changed based on
910 * the revisions as specified in 'argv'. Each entry in 'changed' will also
911 * have a corresponding 'struct oid_array' (in the 'util' field) which lists
912 * what the submodule pointers were updated to during the change.
913 */
914 static void collect_changed_submodules(struct repository *r,
915 struct string_list *changed,
916 struct strvec *argv)
917 {
918 struct rev_info rev;
919 const struct commit *commit;
920 int save_warning;
921 struct setup_revision_opt s_r_opt = {
922 .assume_dashdash = 1,
923 };
924
925 save_warning = warn_on_object_refname_ambiguity;
926 warn_on_object_refname_ambiguity = 0;
927 repo_init_revisions(r, &rev, NULL);
928 setup_revisions(argv->nr, argv->v, &rev, &s_r_opt);
929 warn_on_object_refname_ambiguity = save_warning;
930 if (prepare_revision_walk(&rev))
931 die(_("revision walk setup failed"));
932
933 while ((commit = get_revision(&rev))) {
934 struct rev_info diff_rev;
935 struct collect_changed_submodules_cb_data data;
936 data.repo = r;
937 data.changed = changed;
938 data.commit_oid = &commit->object.oid;
939
940 repo_init_revisions(r, &diff_rev, NULL);
941 diff_rev.diffopt.output_format |= DIFF_FORMAT_CALLBACK;
942 diff_rev.diffopt.format_callback = collect_changed_submodules_cb;
943 diff_rev.diffopt.format_callback_data = &data;
944 diff_rev.dense_combined_merges = 1;
945 diff_tree_combined_merge(commit, &diff_rev);
946 release_revisions(&diff_rev);
947 }
948
949 reset_revision_walk();
950 release_revisions(&rev);
951 }
952
953 static void free_submodules_data(struct string_list *submodules)
954 {
955 struct string_list_item *item;
956 for_each_string_list_item(item, submodules)
957 changed_submodule_data_clear(item->util);
958
959 string_list_clear(submodules, 1);
960 }
961
/*
 * Ref callback that ignores all of its arguments and always returns 1.
 * submodule_needs_pushing() uses it with for_each_remote_ref_submodule()
 * and tests for a positive result to detect that there is at least one
 * remote ref.
 */
static int has_remote(const char *refname UNUSED,
		      const char *referent UNUSED,
		      const struct object_id *oid UNUSED,
		      int flags UNUSED, void *cb_data UNUSED)
{
	return 1;
}
969
/*
 * oid_array iteration callback: push the hex form of 'oid' onto the
 * 'struct strvec' passed as 'data'. Always returns 0.
 */
static int append_oid_to_argv(const struct object_id *oid, void *data)
{
	strvec_push((struct strvec *)data, oid_to_hex(oid));
	return 0;
}
976
/* Context for check_has_commit(), set up by submodule_has_commits(). */
struct has_commit_data {
	/* superproject repository used to initialize the submodule repo */
	struct repository *repo;
	/* starts out as 1; cleared as soon as one commit is not usable */
	int result;
	/* path of the submodule */
	const char *path;
	/* superproject treeish passed on to repo_submodule_init() */
	const struct object_id *super_oid;
};
983
984 static int check_has_commit(const struct object_id *oid, void *data)
985 {
986 struct has_commit_data *cb = data;
987 struct repository subrepo;
988 enum object_type type;
989
990 if (repo_submodule_init(&subrepo, cb->repo, cb->path, cb->super_oid)) {
991 cb->result = 0;
992 /* subrepo failed to init, so don't clean it up. */
993 return 0;
994 }
995
996 type = oid_object_info(&subrepo, oid, NULL);
997
998 switch (type) {
999 case OBJ_COMMIT:
1000 goto cleanup;
1001 case OBJ_BAD:
1002 /*
1003 * Object is missing or invalid. If invalid, an error message
1004 * has already been printed.
1005 */
1006 cb->result = 0;
1007 goto cleanup;
1008 default:
1009 die(_("submodule entry '%s' (%s) is a %s, not a commit"),
1010 cb->path, oid_to_hex(oid), type_name(type));
1011 }
1012 cleanup:
1013 repo_clear(&subrepo);
1014 return 0;
1015 }
1016
1017 static int submodule_has_commits(struct repository *r,
1018 const char *path,
1019 const struct object_id *super_oid,
1020 struct oid_array *commits)
1021 {
1022 struct has_commit_data has_commit = {
1023 .repo = r,
1024 .result = 1,
1025 .path = path,
1026 .super_oid = super_oid
1027 };
1028
1029 if (validate_submodule_path(path) < 0)
1030 exit(128);
1031
1032 oid_array_for_each_unique(commits, check_has_commit, &has_commit);
1033
1034 if (has_commit.result) {
1035 /*
1036 * Even if the submodule is checked out and the commit is
1037 * present, make sure it exists in the submodule's object store
1038 * and that it is reachable from a ref.
1039 */
1040 struct child_process cp = CHILD_PROCESS_INIT;
1041 struct strbuf out = STRBUF_INIT;
1042
1043 strvec_pushl(&cp.args, "rev-list", "-n", "1", NULL);
1044 oid_array_for_each_unique(commits, append_oid_to_argv, &cp.args);
1045 strvec_pushl(&cp.args, "--not", "--all", NULL);
1046
1047 prepare_submodule_repo_env(&cp.env);
1048 cp.git_cmd = 1;
1049 cp.no_stdin = 1;
1050 cp.dir = path;
1051
1052 if (capture_command(&cp, &out, GIT_MAX_HEXSZ + 1) || out.len)
1053 has_commit.result = 0;
1054
1055 strbuf_release(&out);
1056 }
1057
1058 return has_commit.result;
1059 }
1060
1061 static int submodule_needs_pushing(struct repository *r,
1062 const char *path,
1063 struct oid_array *commits)
1064 {
1065 if (!submodule_has_commits(r, path, null_oid(the_hash_algo), commits))
1066 /*
1067 * NOTE: We do consider it safe to return "no" here. The
1068 * correct answer would be "We do not know" instead of
1069 * "No push needed", but it is quite hard to change
1070 * the submodule pointer without having the submodule
1071 * around. If a user did however change the submodules
1072 * without having the submodule around, this indicates
1073 * an expert who knows what they are doing or a
1074 * maintainer integrating work from other people. In
1075 * both cases it should be safe to skip this check.
1076 */
1077 return 0;
1078
1079 if (for_each_remote_ref_submodule(path, has_remote, NULL) > 0) {
1080 struct child_process cp = CHILD_PROCESS_INIT;
1081 struct strbuf buf = STRBUF_INIT;
1082 int needs_pushing = 0;
1083
1084 strvec_push(&cp.args, "rev-list");
1085 oid_array_for_each_unique(commits, append_oid_to_argv, &cp.args);
1086 strvec_pushl(&cp.args, "--not", "--remotes", "-n", "1" , NULL);
1087
1088 prepare_submodule_repo_env(&cp.env);
1089 cp.git_cmd = 1;
1090 cp.no_stdin = 1;
1091 cp.out = -1;
1092 cp.dir = path;
1093 if (start_command(&cp))
1094 die(_("Could not run 'git rev-list <commits> --not --remotes -n 1' command in submodule %s"),
1095 path);
1096 if (strbuf_read(&buf, cp.out, the_hash_algo->hexsz + 1))
1097 needs_pushing = 1;
1098 finish_command(&cp);
1099 close(cp.out);
1100 strbuf_release(&buf);
1101 return needs_pushing;
1102 }
1103
1104 return 0;
1105 }
1106
1107 int find_unpushed_submodules(struct repository *r,
1108 struct oid_array *commits,
1109 const char *remotes_name,
1110 struct string_list *needs_pushing)
1111 {
1112 struct string_list submodules = STRING_LIST_INIT_DUP;
1113 struct string_list_item *name;
1114 struct strvec argv = STRVEC_INIT;
1115
1116 /* argv.v[0] will be ignored by setup_revisions */
1117 strvec_push(&argv, "find_unpushed_submodules");
1118 oid_array_for_each_unique(commits, append_oid_to_argv, &argv);
1119 strvec_push(&argv, "--not");
1120 strvec_pushf(&argv, "--remotes=%s", remotes_name);
1121
1122 collect_changed_submodules(r, &submodules, &argv);
1123
1124 for_each_string_list_item(name, &submodules) {
1125 struct changed_submodule_data *cs_data = name->util;
1126 const struct submodule *submodule;
1127 const char *path = NULL;
1128
1129 submodule = submodule_from_name(r, null_oid(the_hash_algo), name->string);
1130 if (submodule)
1131 path = submodule->path;
1132 else
1133 path = default_name_or_path(name->string);
1134
1135 if (!path)
1136 continue;
1137
1138 if (submodule_needs_pushing(r, path, &cs_data->new_commits))
1139 string_list_insert(needs_pushing, path);
1140 }
1141
1142 free_submodules_data(&submodules);
1143 strvec_clear(&argv);
1144
1145 return needs_pushing->nr;
1146 }
1147
1148 static int push_submodule(const char *path,
1149 const struct remote *remote,
1150 const struct refspec *rs,
1151 const struct string_list *push_options,
1152 int dry_run)
1153 {
1154 if (validate_submodule_path(path) < 0)
1155 exit(128);
1156
1157 if (for_each_remote_ref_submodule(path, has_remote, NULL) > 0) {
1158 struct child_process cp = CHILD_PROCESS_INIT;
1159 strvec_push(&cp.args, "push");
1160 /*
1161 * When recursing into a submodule, treat any "only" configurations as "on-
1162 * demand", since "only" would not work (we need all submodules to be pushed
1163 * in order to be able to push the superproject).
1164 */
1165 strvec_push(&cp.args, "--recurse-submodules=only-is-on-demand");
1166 if (dry_run)
1167 strvec_push(&cp.args, "--dry-run");
1168
1169 if (push_options && push_options->nr) {
1170 const struct string_list_item *item;
1171 for_each_string_list_item(item, push_options)
1172 strvec_pushf(&cp.args, "--push-option=%s",
1173 item->string);
1174 }
1175
1176 if (remote->origin != REMOTE_UNCONFIGURED) {
1177 int i;
1178 strvec_push(&cp.args, remote->name);
1179 for (i = 0; i < rs->nr; i++)
1180 strvec_push(&cp.args, rs->items[i].raw);
1181 }
1182
1183 prepare_submodule_repo_env(&cp.env);
1184 cp.git_cmd = 1;
1185 cp.no_stdin = 1;
1186 cp.dir = path;
1187 if (run_command(&cp))
1188 return 0;
1189 close(cp.out);
1190 }
1191
1192 return 1;
1193 }
1194
1195 /*
1196 * Perform a check in the submodule to see if the remote and refspec work.
1197 * Die if the submodule can't be pushed.
1198 */
1199 static void submodule_push_check(const char *path, const char *head,
1200 const struct remote *remote,
1201 const struct refspec *rs)
1202 {
1203 struct child_process cp = CHILD_PROCESS_INIT;
1204 int i;
1205
1206 if (validate_submodule_path(path) < 0)
1207 exit(128);
1208
1209 strvec_push(&cp.args, "submodule--helper");
1210 strvec_push(&cp.args, "push-check");
1211 strvec_push(&cp.args, head);
1212 strvec_push(&cp.args, remote->name);
1213
1214 for (i = 0; i < rs->nr; i++)
1215 strvec_push(&cp.args, rs->items[i].raw);
1216
1217 prepare_submodule_repo_env(&cp.env);
1218 cp.git_cmd = 1;
1219 cp.no_stdin = 1;
1220 cp.no_stdout = 1;
1221 cp.dir = path;
1222
1223 /*
1224 * Simply indicate if 'submodule--helper push-check' failed.
1225 * More detailed error information will be provided by the
1226 * child process.
1227 */
1228 if (run_command(&cp))
1229 die(_("process for submodule '%s' failed"), path);
1230 }
1231
1232 int push_unpushed_submodules(struct repository *r,
1233 struct oid_array *commits,
1234 const struct remote *remote,
1235 const struct refspec *rs,
1236 const struct string_list *push_options,
1237 int dry_run)
1238 {
1239 int i, ret = 1;
1240 struct string_list needs_pushing = STRING_LIST_INIT_DUP;
1241
1242 if (!find_unpushed_submodules(r, commits,
1243 remote->name, &needs_pushing))
1244 return 1;
1245
1246 /*
1247 * Verify that the remote and refspec can be propagated to all
1248 * submodules. This check can be skipped if the remote and refspec
1249 * won't be propagated due to the remote being unconfigured (e.g. a URL
1250 * instead of a remote name).
1251 */
1252 if (remote->origin != REMOTE_UNCONFIGURED) {
1253 char *head;
1254 struct object_id head_oid;
1255
1256 head = refs_resolve_refdup(get_main_ref_store(the_repository),
1257 "HEAD", 0, &head_oid, NULL);
1258 if (!head)
1259 die(_("Failed to resolve HEAD as a valid ref."));
1260
1261 for (i = 0; i < needs_pushing.nr; i++)
1262 submodule_push_check(needs_pushing.items[i].string,
1263 head, remote, rs);
1264 free(head);
1265 }
1266
1267 /* Actually push the submodules */
1268 for (i = 0; i < needs_pushing.nr; i++) {
1269 const char *path = needs_pushing.items[i].string;
1270 fprintf(stderr, _("Pushing submodule '%s'\n"), path);
1271 if (!push_submodule(path, remote, rs,
1272 push_options, dry_run)) {
1273 fprintf(stderr, _("Unable to push submodule '%s'\n"), path);
1274 ret = 0;
1275 }
1276 }
1277
1278 string_list_clear(&needs_pushing, 0);
1279
1280 return ret;
1281 }
1282
1283 static int append_oid_to_array(const char *ref UNUSED,
1284 const char *referent UNUSED,
1285 const struct object_id *oid,
1286 int flags UNUSED, void *data)
1287 {
1288 struct oid_array *array = data;
1289 oid_array_append(array, oid);
1290 return 0;
1291 }
1292
1293 void check_for_new_submodule_commits(struct object_id *oid)
1294 {
1295 if (!initialized_fetch_ref_tips) {
1296 refs_for_each_ref(get_main_ref_store(the_repository),
1297 append_oid_to_array, &ref_tips_before_fetch);
1298 initialized_fetch_ref_tips = 1;
1299 }
1300
1301 oid_array_append(&ref_tips_after_fetch, oid);
1302 }
1303
1304 /*
1305 * Returns 1 if there is at least one submodule gitdir in
1306 * $GIT_DIR/modules and 0 otherwise. This follows
1307 * submodule_name_to_gitdir(), which looks for submodules in
1308 * $GIT_DIR/modules, not $GIT_COMMON_DIR.
1309 *
1310 * A submodule can be moved to $GIT_DIR/modules manually by running "git
1311 * submodule absorbgitdirs", or it may be initialized there by "git
1312 * submodule update".
1313 */
1314 static int repo_has_absorbed_submodules(struct repository *r)
1315 {
1316 int ret;
1317 struct strbuf buf = STRBUF_INIT;
1318
1319 repo_git_path_append(r, &buf, "modules/");
1320 ret = file_exists(buf.buf) && !is_empty_dir(buf.buf);
1321 strbuf_release(&buf);
1322 return ret;
1323 }
1324
1325 static void calculate_changed_submodule_paths(struct repository *r,
1326 struct string_list *changed_submodule_names)
1327 {
1328 struct strvec argv = STRVEC_INIT;
1329 struct string_list_item *name;
1330
1331 /* No need to check if no submodules would be fetched */
1332 if (!submodule_from_path(r, NULL, NULL) &&
1333 !repo_has_absorbed_submodules(r))
1334 return;
1335
1336 strvec_push(&argv, "--"); /* argv[0] program name */
1337 oid_array_for_each_unique(&ref_tips_after_fetch,
1338 append_oid_to_argv, &argv);
1339 strvec_push(&argv, "--not");
1340 oid_array_for_each_unique(&ref_tips_before_fetch,
1341 append_oid_to_argv, &argv);
1342
1343 /*
1344 * Collect all submodules (whether checked out or not) for which new
1345 * commits have been recorded upstream in "changed_submodule_names".
1346 */
1347 collect_changed_submodules(r, changed_submodule_names, &argv);
1348
1349 for_each_string_list_item(name, changed_submodule_names) {
1350 struct changed_submodule_data *cs_data = name->util;
1351 const struct submodule *submodule;
1352 const char *path = NULL;
1353
1354 submodule = submodule_from_name(r, null_oid(the_hash_algo), name->string);
1355 if (submodule)
1356 path = submodule->path;
1357 else
1358 path = default_name_or_path(name->string);
1359
1360 if (!path)
1361 continue;
1362
1363 if (submodule_has_commits(r, path, null_oid(the_hash_algo), &cs_data->new_commits)) {
1364 changed_submodule_data_clear(cs_data);
1365 *name->string = '\0';
1366 }
1367 }
1368
1369 string_list_remove_empty_items(changed_submodule_names, 1);
1370
1371 strvec_clear(&argv);
1372 oid_array_clear(&ref_tips_before_fetch);
1373 oid_array_clear(&ref_tips_after_fetch);
1374 initialized_fetch_ref_tips = 0;
1375 }
1376
1377 int submodule_touches_in_range(struct repository *r,
1378 struct object_id *excl_oid,
1379 struct object_id *incl_oid)
1380 {
1381 struct string_list subs = STRING_LIST_INIT_DUP;
1382 struct strvec args = STRVEC_INIT;
1383 int ret;
1384
1385 /* No need to check if there are no submodules configured */
1386 if (!submodule_from_path(r, NULL, NULL))
1387 return 0;
1388
1389 strvec_push(&args, "--"); /* args[0] program name */
1390 strvec_push(&args, oid_to_hex(incl_oid));
1391 if (!is_null_oid(excl_oid)) {
1392 strvec_push(&args, "--not");
1393 strvec_push(&args, oid_to_hex(excl_oid));
1394 }
1395
1396 collect_changed_submodules(r, &subs, &args);
1397 ret = subs.nr;
1398
1399 strvec_clear(&args);
1400
1401 free_submodules_data(&subs);
1402 return ret;
1403 }
1404
1405 struct submodule_parallel_fetch {
1406 /*
1407 * The index of the last index entry processed by
1408 * get_fetch_task_from_index().
1409 */
1410 int index_count;
1411 /*
1412 * The index of the last string_list entry processed by
1413 * get_fetch_task_from_changed().
1414 */
1415 int changed_count;
1416 struct strvec args;
1417 struct repository *r;
1418 const char *prefix;
1419 int command_line_option;
1420 int default_option;
1421 int quiet;
1422 int result;
1423
1424 /*
1425 * Names of submodules that have new commits. Generated by
1426 * walking the newly fetched superproject commits.
1427 */
1428 struct string_list changed_submodule_names;
1429 /*
1430 * Names of submodules that have already been processed. Lets us
1431 * avoid fetching the same submodule more than once.
1432 */
1433 struct string_list seen_submodule_names;
1434
1435 /* Pending fetches by OIDs */
1436 struct fetch_task **oid_fetch_tasks;
1437 int oid_fetch_tasks_nr, oid_fetch_tasks_alloc;
1438
1439 struct strbuf submodules_with_errors;
1440 };
1441 #define SPF_INIT { \
1442 .args = STRVEC_INIT, \
1443 .changed_submodule_names = STRING_LIST_INIT_DUP, \
1444 .seen_submodule_names = STRING_LIST_INIT_DUP, \
1445 .submodules_with_errors = STRBUF_INIT, \
1446 }
1447
1448 static int get_fetch_recurse_config(const struct submodule *submodule,
1449 struct submodule_parallel_fetch *spf)
1450 {
1451 if (spf->command_line_option != RECURSE_SUBMODULES_DEFAULT)
1452 return spf->command_line_option;
1453
1454 if (submodule) {
1455 char *key;
1456 const char *value;
1457
1458 int fetch_recurse = submodule->fetch_recurse;
1459 key = xstrfmt("submodule.%s.fetchRecurseSubmodules", submodule->name);
1460 if (!repo_config_get_string_tmp(spf->r, key, &value)) {
1461 fetch_recurse = parse_fetch_recurse_submodules_arg(key, value);
1462 }
1463 free(key);
1464
1465 if (fetch_recurse != RECURSE_SUBMODULES_NONE)
1466 /* local config overrules everything except commandline */
1467 return fetch_recurse;
1468 }
1469
1470 return spf->default_option;
1471 }
1472
1473 /*
1474 * Fetch in progress (if callback data) or
1475 * pending (if in oid_fetch_tasks in struct submodule_parallel_fetch)
1476 */
1477 struct fetch_task {
1478 struct repository *repo;
1479 const struct submodule *sub;
1480 unsigned free_sub : 1; /* Do we need to free the submodule? */
1481 const char *default_argv; /* The default fetch mode. */
1482 struct strvec git_args; /* Args for the child git process. */
1483
1484 struct oid_array *commits; /* Ensure these commits are fetched */
1485 };
1486
1487 /**
1488 * When a submodule is not defined in .gitmodules, we cannot access it
1489 * via the regular submodule-config. Create a fake submodule, which we can
1490 * work on.
1491 */
1492 static const struct submodule *get_non_gitmodules_submodule(const char *path)
1493 {
1494 struct submodule *ret;
1495 const char *name = default_name_or_path(path);
1496
1497 if (!name)
1498 return NULL;
1499
1500 CALLOC_ARRAY(ret, 1);
1501 ret->path = name;
1502 ret->name = name;
1503
1504 return (const struct submodule *) ret;
1505 }
1506
1507 static void fetch_task_free(struct fetch_task *p)
1508 {
1509 if (p->free_sub)
1510 free((void*)p->sub);
1511 p->free_sub = 0;
1512 p->sub = NULL;
1513
1514 if (p->repo)
1515 repo_clear(p->repo);
1516 FREE_AND_NULL(p->repo);
1517
1518 strvec_clear(&p->git_args);
1519 free(p);
1520 }
1521
1522 static struct repository *get_submodule_repo_for(struct repository *r,
1523 const char *path,
1524 const struct object_id *treeish_name)
1525 {
1526 struct repository *ret = xmalloc(sizeof(*ret));
1527
1528 if (repo_submodule_init(ret, r, path, treeish_name)) {
1529 free(ret);
1530 return NULL;
1531 }
1532
1533 return ret;
1534 }
1535
1536 static struct fetch_task *fetch_task_create(struct submodule_parallel_fetch *spf,
1537 const char *path,
1538 const struct object_id *treeish_name)
1539 {
1540 struct fetch_task *task;
1541
1542 CALLOC_ARRAY(task, 1);
1543
1544 if (validate_submodule_path(path) < 0)
1545 exit(128);
1546
1547 task->sub = submodule_from_path(spf->r, treeish_name, path);
1548
1549 if (!task->sub) {
1550 /*
1551 * No entry in .gitmodules? Technically not a submodule,
1552 * but historically we supported repositories that happen to be
1553 * in-place where a gitlink is. Keep supporting them.
1554 */
1555 task->sub = get_non_gitmodules_submodule(path);
1556 if (!task->sub)
1557 goto cleanup;
1558
1559 task->free_sub = 1;
1560 }
1561
1562 if (string_list_lookup(&spf->seen_submodule_names, task->sub->name))
1563 goto cleanup;
1564
1565 switch (get_fetch_recurse_config(task->sub, spf))
1566 {
1567 default:
1568 case RECURSE_SUBMODULES_DEFAULT:
1569 case RECURSE_SUBMODULES_ON_DEMAND:
1570 if (!task->sub ||
1571 !string_list_lookup(
1572 &spf->changed_submodule_names,
1573 task->sub->name))
1574 goto cleanup;
1575 task->default_argv = "on-demand";
1576 break;
1577 case RECURSE_SUBMODULES_ON:
1578 task->default_argv = "yes";
1579 break;
1580 case RECURSE_SUBMODULES_OFF:
1581 goto cleanup;
1582 }
1583
1584 task->repo = get_submodule_repo_for(spf->r, path, treeish_name);
1585
1586 return task;
1587
1588 cleanup:
1589 fetch_task_free(task);
1590 return NULL;
1591 }
1592
1593 static struct fetch_task *
1594 get_fetch_task_from_index(struct submodule_parallel_fetch *spf,
1595 struct strbuf *err)
1596 {
1597 for (; spf->index_count < spf->r->index->cache_nr; spf->index_count++) {
1598 const struct cache_entry *ce =
1599 spf->r->index->cache[spf->index_count];
1600 struct fetch_task *task;
1601
1602 if (!S_ISGITLINK(ce->ce_mode))
1603 continue;
1604
1605 task = fetch_task_create(spf, ce->name, null_oid(the_hash_algo));
1606 if (!task)
1607 continue;
1608
1609 if (task->repo) {
1610 if (!spf->quiet)
1611 strbuf_addf(err, _("Fetching submodule %s%s\n"),
1612 spf->prefix, ce->name);
1613
1614 spf->index_count++;
1615 return task;
1616 } else {
1617 struct strbuf empty_submodule_path = STRBUF_INIT;
1618
1619 fetch_task_free(task);
1620
1621 /*
1622 * An empty directory is normal,
1623 * the submodule is not initialized
1624 */
1625 strbuf_addf(&empty_submodule_path, "%s/%s/",
1626 spf->r->worktree,
1627 ce->name);
1628 if (S_ISGITLINK(ce->ce_mode) &&
1629 !is_empty_dir(empty_submodule_path.buf)) {
1630 spf->result = 1;
1631 strbuf_addf(err,
1632 _("Could not access submodule '%s'\n"),
1633 ce->name);
1634 }
1635 strbuf_release(&empty_submodule_path);
1636 }
1637 }
1638 return NULL;
1639 }
1640
1641 static struct fetch_task *
1642 get_fetch_task_from_changed(struct submodule_parallel_fetch *spf,
1643 struct strbuf *err)
1644 {
1645 for (; spf->changed_count < spf->changed_submodule_names.nr;
1646 spf->changed_count++) {
1647 struct string_list_item item =
1648 spf->changed_submodule_names.items[spf->changed_count];
1649 struct changed_submodule_data *cs_data = item.util;
1650 struct fetch_task *task;
1651
1652 if (!is_tree_submodule_active(spf->r, cs_data->super_oid,cs_data->path))
1653 continue;
1654
1655 task = fetch_task_create(spf, cs_data->path,
1656 cs_data->super_oid);
1657 if (!task)
1658 continue;
1659
1660 if (!task->repo) {
1661 strbuf_addf(err, _("Could not access submodule '%s' at commit %s\n"),
1662 cs_data->path,
1663 repo_find_unique_abbrev(the_repository, cs_data->super_oid, DEFAULT_ABBREV));
1664
1665 fetch_task_free(task);
1666 continue;
1667 }
1668
1669 if (!spf->quiet)
1670 strbuf_addf(err,
1671 _("Fetching submodule %s%s at commit %s\n"),
1672 spf->prefix, task->sub->path,
1673 repo_find_unique_abbrev(the_repository, cs_data->super_oid,
1674 DEFAULT_ABBREV));
1675
1676 spf->changed_count++;
1677 /*
1678 * NEEDSWORK: Submodules set/unset a value for
1679 * core.worktree when they are populated/unpopulated by
1680 * "git checkout" (and similar commands, see
1681 * submodule_move_head() and
1682 * connect_work_tree_and_git_dir()), but if the
1683 * submodule is unpopulated in another way (e.g. "git
1684 * rm", "rm -r"), core.worktree will still be set even
1685 * though the directory doesn't exist, and the child
1686 * process will crash while trying to chdir into the
1687 * nonexistent directory.
1688 *
1689 * In this case, we know that the submodule has no
1690 * working tree, so we can work around this by
1691 * setting "--work-tree=." (--bare does not work because
1692 * worktree settings take precedence over bare-ness).
1693 * However, this is not necessarily true in other cases,
1694 * so a generalized solution is still necessary.
1695 *
1696 * Possible solutions:
1697 * - teach "git [add|rm]" to unset core.worktree and
1698 * discourage users from removing submodules without
1699 * using a Git command.
1700 * - teach submodule child processes to ignore stale
1701 * core.worktree values.
1702 */
1703 strvec_push(&task->git_args, "--work-tree=.");
1704 return task;
1705 }
1706 return NULL;
1707 }
1708
1709 static int get_next_submodule(struct child_process *cp, struct strbuf *err,
1710 void *data, void **task_cb)
1711 {
1712 struct submodule_parallel_fetch *spf = data;
1713 struct fetch_task *task =
1714 get_fetch_task_from_index(spf, err);
1715 if (!task)
1716 task = get_fetch_task_from_changed(spf, err);
1717
1718 if (task) {
1719 child_process_init(cp);
1720 cp->dir = task->repo->gitdir;
1721 prepare_submodule_repo_env_in_gitdir(&cp->env);
1722 cp->git_cmd = 1;
1723 strvec_init(&cp->args);
1724 if (task->git_args.nr)
1725 strvec_pushv(&cp->args, task->git_args.v);
1726 strvec_pushv(&cp->args, spf->args.v);
1727 strvec_push(&cp->args, task->default_argv);
1728 strvec_pushf(&cp->args, "--submodule-prefix=%s%s/",
1729 spf->prefix, task->sub->path);
1730
1731 *task_cb = task;
1732
1733 string_list_insert(&spf->seen_submodule_names, task->sub->name);
1734 return 1;
1735 }
1736
1737 if (spf->oid_fetch_tasks_nr) {
1738 struct fetch_task *task =
1739 spf->oid_fetch_tasks[spf->oid_fetch_tasks_nr - 1];
1740 spf->oid_fetch_tasks_nr--;
1741
1742 child_process_init(cp);
1743 prepare_submodule_repo_env_in_gitdir(&cp->env);
1744 cp->git_cmd = 1;
1745 cp->dir = task->repo->gitdir;
1746
1747 strvec_init(&cp->args);
1748 strvec_pushv(&cp->args, spf->args.v);
1749 strvec_push(&cp->args, "on-demand");
1750 strvec_pushf(&cp->args, "--submodule-prefix=%s%s/",
1751 spf->prefix, task->sub->path);
1752
1753 /* NEEDSWORK: have get_default_remote from submodule--helper */
1754 strvec_push(&cp->args, "origin");
1755 oid_array_for_each_unique(task->commits,
1756 append_oid_to_argv, &cp->args);
1757
1758 *task_cb = task;
1759 return 1;
1760 }
1761
1762 return 0;
1763 }
1764
1765 static int fetch_start_failure(struct strbuf *err UNUSED,
1766 void *cb, void *task_cb)
1767 {
1768 struct submodule_parallel_fetch *spf = cb;
1769 struct fetch_task *task = task_cb;
1770
1771 spf->result = 1;
1772
1773 fetch_task_free(task);
1774 return 0;
1775 }
1776
1777 static int commit_missing_in_sub(const struct object_id *oid, void *data)
1778 {
1779 struct repository *subrepo = data;
1780
1781 enum object_type type = oid_object_info(subrepo, oid, NULL);
1782
1783 return type != OBJ_COMMIT;
1784 }
1785
1786 static int fetch_finish(int retvalue, struct strbuf *err UNUSED,
1787 void *cb, void *task_cb)
1788 {
1789 struct submodule_parallel_fetch *spf = cb;
1790 struct fetch_task *task = task_cb;
1791
1792 struct string_list_item *it;
1793 struct changed_submodule_data *cs_data;
1794
1795 if (!task || !task->sub)
1796 BUG("callback cookie bogus");
1797
1798 if (retvalue) {
1799 /*
1800 * NEEDSWORK: This indicates that the overall fetch
1801 * failed, even though there may be a subsequent fetch
1802 * by commit hash that might work. It may be a good
1803 * idea to not indicate failure in this case, and only
1804 * indicate failure if the subsequent fetch fails.
1805 */
1806 spf->result = 1;
1807
1808 strbuf_addf(&spf->submodules_with_errors, "\t%s\n",
1809 task->sub->name);
1810 }
1811
1812 /* Is this the second time we process this submodule? */
1813 if (task->commits)
1814 goto out;
1815
1816 it = string_list_lookup(&spf->changed_submodule_names, task->sub->name);
1817 if (!it)
1818 /* Could be an unchanged submodule, not contained in the list */
1819 goto out;
1820
1821 cs_data = it->util;
1822 oid_array_filter(&cs_data->new_commits,
1823 commit_missing_in_sub,
1824 task->repo);
1825
1826 /* Are there commits we want, but do not exist? */
1827 if (cs_data->new_commits.nr) {
1828 task->commits = &cs_data->new_commits;
1829 ALLOC_GROW(spf->oid_fetch_tasks,
1830 spf->oid_fetch_tasks_nr + 1,
1831 spf->oid_fetch_tasks_alloc);
1832 spf->oid_fetch_tasks[spf->oid_fetch_tasks_nr] = task;
1833 spf->oid_fetch_tasks_nr++;
1834 return 0;
1835 }
1836
1837 out:
1838 fetch_task_free(task);
1839 return 0;
1840 }
1841
1842 int fetch_submodules(struct repository *r,
1843 const struct strvec *options,
1844 const char *prefix, int command_line_option,
1845 int default_option,
1846 int quiet, int max_parallel_jobs)
1847 {
1848 int i;
1849 struct submodule_parallel_fetch spf = SPF_INIT;
1850 const struct run_process_parallel_opts opts = {
1851 .tr2_category = "submodule",
1852 .tr2_label = "parallel/fetch",
1853
1854 .processes = max_parallel_jobs,
1855
1856 .get_next_task = get_next_submodule,
1857 .start_failure = fetch_start_failure,
1858 .task_finished = fetch_finish,
1859 .data = &spf,
1860 };
1861
1862 spf.r = r;
1863 spf.command_line_option = command_line_option;
1864 spf.default_option = default_option;
1865 spf.quiet = quiet;
1866 spf.prefix = prefix;
1867
1868 if (!r->worktree)
1869 goto out;
1870
1871 if (repo_read_index(r) < 0)
1872 die(_("index file corrupt"));
1873
1874 strvec_push(&spf.args, "fetch");
1875 for (i = 0; i < options->nr; i++)
1876 strvec_push(&spf.args, options->v[i]);
1877 strvec_push(&spf.args, "--recurse-submodules-default");
1878 /* default value, "--submodule-prefix" and its value are added later */
1879
1880 calculate_changed_submodule_paths(r, &spf.changed_submodule_names);
1881 string_list_sort(&spf.changed_submodule_names);
1882 run_processes_parallel(&opts);
1883
1884 if (spf.submodules_with_errors.len > 0)
1885 fprintf(stderr, _("Errors during submodule fetch:\n%s"),
1886 spf.submodules_with_errors.buf);
1887
1888
1889 strvec_clear(&spf.args);
1890 out:
1891 free_submodules_data(&spf.changed_submodule_names);
1892 string_list_clear(&spf.seen_submodule_names, 0);
1893 strbuf_release(&spf.submodules_with_errors);
1894 free(spf.oid_fetch_tasks);
1895 return spf.result;
1896 }
1897
1898 unsigned is_submodule_modified(const char *path, int ignore_untracked)
1899 {
1900 struct child_process cp = CHILD_PROCESS_INIT;
1901 struct strbuf buf = STRBUF_INIT;
1902 FILE *fp;
1903 unsigned dirty_submodule = 0;
1904 const char *git_dir;
1905 int ignore_cp_exit_code = 0;
1906
1907 if (validate_submodule_path(path) < 0)
1908 exit(128);
1909
1910 strbuf_addf(&buf, "%s/.git", path);
1911 git_dir = read_gitfile(buf.buf);
1912 if (!git_dir)
1913 git_dir = buf.buf;
1914 if (!is_git_directory(git_dir)) {
1915 if (is_directory(git_dir))
1916 die(_("'%s' not recognized as a git repository"), git_dir);
1917 strbuf_release(&buf);
1918 /* The submodule is not checked out, so it is not modified */
1919 return 0;
1920 }
1921 strbuf_reset(&buf);
1922
1923 strvec_pushl(&cp.args, "status", "--porcelain=2", NULL);
1924 if (ignore_untracked)
1925 strvec_push(&cp.args, "-uno");
1926
1927 prepare_submodule_repo_env(&cp.env);
1928 cp.git_cmd = 1;
1929 cp.no_stdin = 1;
1930 cp.out = -1;
1931 cp.dir = path;
1932 if (start_command(&cp))
1933 die(_("Could not run 'git status --porcelain=2' in submodule %s"), path);
1934
1935 fp = xfdopen(cp.out, "r");
1936 while (strbuf_getwholeline(&buf, fp, '\n') != EOF) {
1937 /* regular untracked files */
1938 if (buf.buf[0] == '?')
1939 dirty_submodule |= DIRTY_SUBMODULE_UNTRACKED;
1940
1941 if (buf.buf[0] == 'u' ||
1942 buf.buf[0] == '1' ||
1943 buf.buf[0] == '2') {
1944 /* T = line type, XY = status, SSSS = submodule state */
1945 if (buf.len < strlen("T XY SSSS"))
1946 BUG("invalid status --porcelain=2 line %s",
1947 buf.buf);
1948
1949 if (buf.buf[5] == 'S' && buf.buf[8] == 'U')
1950 /* nested untracked file */
1951 dirty_submodule |= DIRTY_SUBMODULE_UNTRACKED;
1952
1953 if (buf.buf[0] == 'u' ||
1954 buf.buf[0] == '2' ||
1955 memcmp(buf.buf + 5, "S..U", 4))
1956 /* other change */
1957 dirty_submodule |= DIRTY_SUBMODULE_MODIFIED;
1958 }
1959
1960 if ((dirty_submodule & DIRTY_SUBMODULE_MODIFIED) &&
1961 ((dirty_submodule & DIRTY_SUBMODULE_UNTRACKED) ||
1962 ignore_untracked)) {
1963 /*
1964 * We're not interested in any further information from
1965 * the child any more, neither output nor its exit code.
1966 */
1967 ignore_cp_exit_code = 1;
1968 break;
1969 }
1970 }
1971 fclose(fp);
1972
1973 if (finish_command(&cp) && !ignore_cp_exit_code)
1974 die(_("'git status --porcelain=2' failed in submodule %s"), path);
1975
1976 strbuf_release(&buf);
1977 return dirty_submodule;
1978 }
1979
1980 int submodule_uses_gitfile(const char *path)
1981 {
1982 struct child_process cp = CHILD_PROCESS_INIT;
1983 struct strbuf buf = STRBUF_INIT;
1984 const char *git_dir;
1985
1986 if (validate_submodule_path(path) < 0)
1987 exit(128);
1988
1989 strbuf_addf(&buf, "%s/.git", path);
1990 git_dir = read_gitfile(buf.buf);
1991 if (!git_dir) {
1992 strbuf_release(&buf);
1993 return 0;
1994 }
1995 strbuf_release(&buf);
1996
1997 /* Now test that all nested submodules use a gitfile too */
1998 strvec_pushl(&cp.args,
1999 "submodule", "foreach", "--quiet", "--recursive",
2000 "test -f .git", NULL);
2001
2002 prepare_submodule_repo_env(&cp.env);
2003 cp.git_cmd = 1;
2004 cp.no_stdin = 1;
2005 cp.no_stderr = 1;
2006 cp.no_stdout = 1;
2007 cp.dir = path;
2008 if (run_command(&cp))
2009 return 0;
2010
2011 return 1;
2012 }
2013
2014 /*
2015 * Check if it is a bad idea to remove a submodule, i.e. if we'd lose data
2016 * when doing so.
2017 *
2018 * Return 1 if we'd lose data, return 0 if the removal is fine,
2019 * and negative values for errors.
2020 */
2021 int bad_to_remove_submodule(const char *path, unsigned flags)
2022 {
2023 ssize_t len;
2024 struct child_process cp = CHILD_PROCESS_INIT;
2025 struct strbuf buf = STRBUF_INIT;
2026 int ret = 0;
2027
2028 if (validate_submodule_path(path) < 0)
2029 exit(128);
2030
2031 if (!file_exists(path) || is_empty_dir(path))
2032 return 0;
2033
2034 if (!submodule_uses_gitfile(path))
2035 return 1;
2036
2037 strvec_pushl(&cp.args, "status", "--porcelain",
2038 "--ignore-submodules=none", NULL);
2039
2040 if (flags & SUBMODULE_REMOVAL_IGNORE_UNTRACKED)
2041 strvec_push(&cp.args, "-uno");
2042 else
2043 strvec_push(&cp.args, "-uall");
2044
2045 if (!(flags & SUBMODULE_REMOVAL_IGNORE_IGNORED_UNTRACKED))
2046 strvec_push(&cp.args, "--ignored");
2047
2048 prepare_submodule_repo_env(&cp.env);
2049 cp.git_cmd = 1;
2050 cp.no_stdin = 1;
2051 cp.out = -1;
2052 cp.dir = path;
2053 if (start_command(&cp)) {
2054 if (flags & SUBMODULE_REMOVAL_DIE_ON_ERROR)
2055 die(_("could not start 'git status' in submodule '%s'"),
2056 path);
2057 ret = -1;
2058 goto out;
2059 }
2060
2061 len = strbuf_read(&buf, cp.out, 1024);
2062 if (len > 2)
2063 ret = 1;
2064 close(cp.out);
2065
2066 if (finish_command(&cp)) {
2067 if (flags & SUBMODULE_REMOVAL_DIE_ON_ERROR)
2068 die(_("could not run 'git status' in submodule '%s'"),
2069 path);
2070 ret = -1;
2071 }
2072 out:
2073 strbuf_release(&buf);
2074 return ret;
2075 }
2076
2077 void submodule_unset_core_worktree(const struct submodule *sub)
2078 {
2079 struct strbuf config_path = STRBUF_INIT;
2080
2081 if (validate_submodule_path(sub->path) < 0)
2082 exit(128);
2083
2084 submodule_name_to_gitdir(&config_path, the_repository, sub->name);
2085 strbuf_addstr(&config_path, "/config");
2086
2087 if (git_config_set_in_file_gently(config_path.buf, "core.worktree", NULL, NULL))
2088 warning(_("Could not unset core.worktree setting in submodule '%s'"),
2089 sub->path);
2090
2091 strbuf_release(&config_path);
2092 }
2093
2094 static int submodule_has_dirty_index(const struct submodule *sub)
2095 {
2096 struct child_process cp = CHILD_PROCESS_INIT;
2097
2098 if (validate_submodule_path(sub->path) < 0)
2099 exit(128);
2100
2101 prepare_submodule_repo_env(&cp.env);
2102
2103 cp.git_cmd = 1;
2104 strvec_pushl(&cp.args, "diff-index", "--quiet",
2105 "--cached", "HEAD", NULL);
2106 cp.no_stdin = 1;
2107 cp.no_stdout = 1;
2108 cp.dir = sub->path;
2109 if (start_command(&cp))
2110 die(_("could not recurse into submodule '%s'"), sub->path);
2111
2112 return finish_command(&cp);
2113 }
2114
2115 static void submodule_reset_index(const char *path, const char *super_prefix)
2116 {
2117 struct child_process cp = CHILD_PROCESS_INIT;
2118
2119 if (validate_submodule_path(path) < 0)
2120 exit(128);
2121
2122 prepare_submodule_repo_env(&cp.env);
2123
2124 cp.git_cmd = 1;
2125 cp.no_stdin = 1;
2126 cp.dir = path;
2127
2128 /* TODO: determine if this might overwright untracked files */
2129 strvec_pushl(&cp.args, "read-tree", "-u", "--reset", NULL);
2130 strvec_pushf(&cp.args, "--super-prefix=%s%s/",
2131 (super_prefix ? super_prefix : ""), path);
2132
2133 strvec_push(&cp.args, empty_tree_oid_hex(the_repository->hash_algo));
2134
2135 if (run_command(&cp))
2136 die(_("could not reset submodule index"));
2137 }
2138
2139 /**
2140 * Moves a submodule at a given path from a given head to another new head.
2141 * For edge cases (a submodule coming into existence or removing a submodule)
2142 * pass NULL for old or new respectively.
2143 */
2144 int submodule_move_head(const char *path, const char *super_prefix,
2145 const char *old_head, const char *new_head,
2146 unsigned flags)
2147 {
2148 int ret = 0;
2149 struct child_process cp = CHILD_PROCESS_INIT;
2150 const struct submodule *sub;
2151 int *error_code_ptr, error_code;
2152
2153 if (!is_submodule_active(the_repository, path))
2154 return 0;
2155
2156 if (flags & SUBMODULE_MOVE_HEAD_FORCE)
2157 /*
2158 * Pass non NULL pointer to is_submodule_populated_gently
2159 * to prevent die()-ing. We'll use connect_work_tree_and_git_dir
2160 * to fixup the submodule in the force case later.
2161 */
2162 error_code_ptr = &error_code;
2163 else
2164 error_code_ptr = NULL;
2165
2166 if (old_head && !is_submodule_populated_gently(path, error_code_ptr))
2167 return 0;
2168
2169 sub = submodule_from_path(the_repository, null_oid(the_hash_algo), path);
2170
2171 if (!sub)
2172 BUG("could not get submodule information for '%s'", path);
2173
2174 if (old_head && !(flags & SUBMODULE_MOVE_HEAD_FORCE)) {
2175 /* Check if the submodule has a dirty index. */
2176 if (submodule_has_dirty_index(sub))
2177 return error(_("submodule '%s' has dirty index"), path);
2178 }
2179
2180 if (!(flags & SUBMODULE_MOVE_HEAD_DRY_RUN)) {
2181 if (old_head) {
2182 if (!submodule_uses_gitfile(path))
2183 absorb_git_dir_into_superproject(path,
2184 super_prefix);
2185 else {
2186 char *dotgit = xstrfmt("%s/.git", path);
2187 char *git_dir = xstrdup(read_gitfile(dotgit));
2188
2189 free(dotgit);
2190 if (validate_submodule_git_dir(git_dir,
2191 sub->name) < 0)
2192 die(_("refusing to create/use '%s' in "
2193 "another submodule's git dir"),
2194 git_dir);
2195 free(git_dir);
2196 }
2197 } else {
2198 struct strbuf gitdir = STRBUF_INIT;
2199 submodule_name_to_gitdir(&gitdir, the_repository,
2200 sub->name);
2201 if (validate_submodule_git_dir(gitdir.buf,
2202 sub->name) < 0)
2203 die(_("refusing to create/use '%s' in another "
2204 "submodule's git dir"),
2205 gitdir.buf);
2206 connect_work_tree_and_git_dir(path, gitdir.buf, 0);
2207 strbuf_release(&gitdir);
2208
2209 /* make sure the index is clean as well */
2210 submodule_reset_index(path, super_prefix);
2211 }
2212
2213 if (old_head && (flags & SUBMODULE_MOVE_HEAD_FORCE)) {
2214 struct strbuf gitdir = STRBUF_INIT;
2215 submodule_name_to_gitdir(&gitdir, the_repository,
2216 sub->name);
2217 connect_work_tree_and_git_dir(path, gitdir.buf, 1);
2218 strbuf_release(&gitdir);
2219 }
2220 }
2221
2222 prepare_submodule_repo_env(&cp.env);
2223
2224 cp.git_cmd = 1;
2225 cp.no_stdin = 1;
2226 cp.dir = path;
2227
2228 strvec_pushl(&cp.args, "read-tree", "--recurse-submodules", NULL);
2229 strvec_pushf(&cp.args, "--super-prefix=%s%s/",
2230 (super_prefix ? super_prefix : ""), path);
2231
2232 if (flags & SUBMODULE_MOVE_HEAD_DRY_RUN)
2233 strvec_push(&cp.args, "-n");
2234 else
2235 strvec_push(&cp.args, "-u");
2236
2237 if (flags & SUBMODULE_MOVE_HEAD_FORCE)
2238 strvec_push(&cp.args, "--reset");
2239 else
2240 strvec_push(&cp.args, "-m");
2241
2242 if (!(flags & SUBMODULE_MOVE_HEAD_FORCE))
2243 strvec_push(&cp.args, old_head ? old_head : empty_tree_oid_hex(the_repository->hash_algo));
2244
2245 strvec_push(&cp.args, new_head ? new_head : empty_tree_oid_hex(the_repository->hash_algo));
2246
2247 if (run_command(&cp)) {
2248 ret = error(_("Submodule '%s' could not be updated."), path);
2249 goto out;
2250 }
2251
2252 if (!(flags & SUBMODULE_MOVE_HEAD_DRY_RUN)) {
2253 if (new_head) {
2254 child_process_init(&cp);
2255 /* also set the HEAD accordingly */
2256 cp.git_cmd = 1;
2257 cp.no_stdin = 1;
2258 cp.dir = path;
2259
2260 prepare_submodule_repo_env(&cp.env);
2261 strvec_pushl(&cp.args, "update-ref", "HEAD",
2262 "--no-deref", new_head, NULL);
2263
2264 if (run_command(&cp)) {
2265 ret = -1;
2266 goto out;
2267 }
2268 } else {
2269 struct strbuf sb = STRBUF_INIT;
2270
2271 strbuf_addf(&sb, "%s/.git", path);
2272 unlink_or_warn(sb.buf);
2273 strbuf_release(&sb);
2274
2275 if (is_empty_dir(path))
2276 rmdir_or_warn(path);
2277
2278 submodule_unset_core_worktree(sub);
2279 }
2280 }
2281 out:
2282 return ret;
2283 }
2284
/*
 * Check that `git_dir`, which must end in "/<submodule_name>", is not
 * located inside the git directory of another submodule.
 *
 * `git_dir` is temporarily modified in place while checking, but is
 * restored before returning.  Returns 0 if the location is fine and a
 * negative value (after printing an error) otherwise.  It is a BUG() if
 * `submodule_name` is not a suffix of `git_dir` preceded by a '/'.
 */
int validate_submodule_git_dir(char *git_dir, const char *submodule_name)
{
	size_t dir_len = strlen(git_dir);
	size_t name_len = strlen(submodule_name);
	char *cursor = NULL;
	int is_suffix = 0;

	if (dir_len > name_len) {
		cursor = git_dir + dir_len - name_len;
		is_suffix = cursor[-1] == '/' &&
			    !strcmp(cursor, submodule_name);
	}
	if (!is_suffix)
		BUG("submodule name '%s' not a suffix of git dir '%s'",
		    submodule_name, git_dir);

	/*
	 * Sibling submodules must not have clashing git directories.
	 *
	 * Example: with one submodule named `hippo` and another named
	 * `hippo/hooks`, the git directories would be `.git/modules/hippo/`
	 * and `.git/modules/hippo/hooks/`, but the latter is already
	 * designated to hold the hooks of the former.
	 *
	 * So cut the path at every directory separator inside the name and
	 * make sure that none of those prefixes is a git directory itself.
	 */
	for (; *cursor; cursor++) {
		char saved;
		int inside_git_dir;

		if (!is_dir_sep(*cursor))
			continue;

		saved = *cursor;
		*cursor = '\0';
		inside_git_dir = is_git_directory(git_dir);
		*cursor = saved;

		if (inside_git_dir)
			return error(_("submodule git dir '%s' is "
				       "inside git dir '%.*s'"),
				     git_dir,
				     (int)(cursor - git_dir), git_dir);
	}

	return 0;
}
2325
/*
 * Verify that neither `path` itself nor any of its leading directory
 * components is a symbolic link.  Components that do not exist (or cannot
 * be lstat()ed) are accepted.
 *
 * Returns 0 if the path is acceptable, and a negative value after
 * reporting the offending component(s) via error() otherwise.
 */
int validate_submodule_path(const char *path)
{
	char *copy = xstrdup(path);
	struct stat st;
	int result = 0;
	int pos;

	for (pos = 0; copy[pos]; pos++) {
		char saved;
		int is_symlink;

		if (!is_dir_sep(copy[pos]))
			continue;

		/* Look at the prefix that ends just before this separator. */
		saved = copy[pos];
		copy[pos] = '\0';
		/* allow missing components, but no symlinks */
		is_symlink = !lstat(copy, &st) && S_ISLNK(st.st_mode);
		copy[pos] = saved;

		if (is_symlink) {
			error(_("expected '%.*s' in submodule path '%s' not to "
				"be a symbolic link"), pos, copy, copy);
			result = -1;
			break;
		}
	}

	/* The full path is checked as well, even after an earlier error. */
	if (!lstat(copy, &st) && S_ISLNK(st.st_mode))
		result = error(_("expected submodule path '%s' not to be a "
				 "symbolic link"), copy);

	free(copy);
	return result;
}
2352
2353
2354 /*
2355 * Embeds a single submodules git directory into the superprojects git dir,
2356 * non recursively.
2357 */
2358 static void relocate_single_git_dir_into_superproject(const char *path,
2359 const char *super_prefix)
2360 {
2361 char *old_git_dir = NULL, *real_old_git_dir = NULL, *real_new_git_dir = NULL;
2362 struct strbuf new_gitdir = STRBUF_INIT;
2363 const struct submodule *sub;
2364
2365 if (validate_submodule_path(path) < 0)
2366 exit(128);
2367
2368 if (submodule_uses_worktrees(path))
2369 die(_("relocate_gitdir for submodule '%s' with "
2370 "more than one worktree not supported"), path);
2371
2372 old_git_dir = xstrfmt("%s/.git", path);
2373 if (read_gitfile(old_git_dir))
2374 /* If it is an actual gitfile, it doesn't need migration. */
2375 return;
2376
2377 real_old_git_dir = real_pathdup(old_git_dir, 1);
2378
2379 sub = submodule_from_path(the_repository, null_oid(the_hash_algo), path);
2380 if (!sub)
2381 die(_("could not lookup name for submodule '%s'"), path);
2382
2383 submodule_name_to_gitdir(&new_gitdir, the_repository, sub->name);
2384 if (validate_submodule_git_dir(new_gitdir.buf, sub->name) < 0)
2385 die(_("refusing to move '%s' into an existing git dir"),
2386 real_old_git_dir);
2387 if (safe_create_leading_directories_const(the_repository, new_gitdir.buf) < 0)
2388 die(_("could not create directory '%s'"), new_gitdir.buf);
2389 real_new_git_dir = real_pathdup(new_gitdir.buf, 1);
2390
2391 fprintf(stderr, _("Migrating git directory of '%s%s' from\n'%s' to\n'%s'\n"),
2392 super_prefix ? super_prefix : "", path,
2393 real_old_git_dir, real_new_git_dir);
2394
2395 relocate_gitdir(path, real_old_git_dir, real_new_git_dir);
2396
2397 free(old_git_dir);
2398 free(real_old_git_dir);
2399 free(real_new_git_dir);
2400 strbuf_release(&new_gitdir);
2401 }
2402
2403 static void absorb_git_dir_into_superproject_recurse(const char *path,
2404 const char *super_prefix)
2405 {
2406
2407 struct child_process cp = CHILD_PROCESS_INIT;
2408
2409 if (validate_submodule_path(path) < 0)
2410 exit(128);
2411
2412 cp.dir = path;
2413 cp.git_cmd = 1;
2414 cp.no_stdin = 1;
2415 strvec_pushl(&cp.args, "submodule--helper",
2416 "absorbgitdirs", NULL);
2417 strvec_pushf(&cp.args, "--super-prefix=%s%s/", super_prefix ?
2418 super_prefix : "", path);
2419
2420 prepare_submodule_repo_env(&cp.env);
2421 if (run_command(&cp))
2422 die(_("could not recurse into submodule '%s'"), path);
2423 }
2424
2425 /*
2426 * Migrate the git directory of the submodule given by path from
2427 * having its git directory within the working tree to the git dir nested
2428 * in its superprojects git dir under modules/.
2429 */
2430 void absorb_git_dir_into_superproject(const char *path,
2431 const char *super_prefix)
2432 {
2433 int err_code;
2434 const char *sub_git_dir;
2435 struct strbuf gitdir = STRBUF_INIT;
2436
2437 if (validate_submodule_path(path) < 0)
2438 exit(128);
2439
2440 strbuf_addf(&gitdir, "%s/.git", path);
2441 sub_git_dir = resolve_gitdir_gently(gitdir.buf, &err_code);
2442
2443 /* Not populated? */
2444 if (!sub_git_dir) {
2445 const struct submodule *sub;
2446 struct strbuf sub_gitdir = STRBUF_INIT;
2447
2448 if (err_code == READ_GITFILE_ERR_STAT_FAILED) {
2449 /* unpopulated as expected */
2450 strbuf_release(&gitdir);
2451 return;
2452 }
2453
2454 if (err_code != READ_GITFILE_ERR_NOT_A_REPO)
2455 /* We don't know what broke here. */
2456 read_gitfile_error_die(err_code, path, NULL);
2457
2458 /*
2459 * Maybe populated, but no git directory was found?
2460 * This can happen if the superproject is a submodule
2461 * itself and was just absorbed. The absorption of the
2462 * superproject did not rewrite the git file links yet,
2463 * fix it now.
2464 */
2465 sub = submodule_from_path(the_repository, null_oid(the_hash_algo), path);
2466 if (!sub)
2467 die(_("could not lookup name for submodule '%s'"), path);
2468 submodule_name_to_gitdir(&sub_gitdir, the_repository, sub->name);
2469 connect_work_tree_and_git_dir(path, sub_gitdir.buf, 0);
2470 strbuf_release(&sub_gitdir);
2471 } else {
2472 /* Is it already absorbed into the superprojects git dir? */
2473 char *real_sub_git_dir = real_pathdup(sub_git_dir, 1);
2474 char *real_common_git_dir = real_pathdup(repo_get_common_dir(the_repository), 1);
2475
2476 if (!starts_with(real_sub_git_dir, real_common_git_dir))
2477 relocate_single_git_dir_into_superproject(path, super_prefix);
2478
2479 free(real_sub_git_dir);
2480 free(real_common_git_dir);
2481 }
2482 strbuf_release(&gitdir);
2483
2484 absorb_git_dir_into_superproject_recurse(path, super_prefix);
2485 }
2486
2487 int get_superproject_working_tree(struct strbuf *buf)
2488 {
2489 struct child_process cp = CHILD_PROCESS_INIT;
2490 struct strbuf sb = STRBUF_INIT;
2491 struct strbuf one_up = STRBUF_INIT;
2492 char *cwd = xgetcwd();
2493 int ret = 0;
2494 const char *subpath;
2495 int code;
2496 ssize_t len;
2497
2498 if (!is_inside_work_tree())
2499 /*
2500 * FIXME:
2501 * We might have a superproject, but it is harder
2502 * to determine.
2503 */
2504 return 0;
2505
2506 if (!strbuf_realpath(&one_up, "../", 0))
2507 return 0;
2508
2509 subpath = relative_path(cwd, one_up.buf, &sb);
2510 strbuf_release(&one_up);
2511
2512 prepare_submodule_repo_env(&cp.env);
2513 strvec_pop(&cp.env);
2514
2515 strvec_pushl(&cp.args, "--literal-pathspecs", "-C", "..",
2516 "ls-files", "-z", "--stage", "--full-name", "--",
2517 subpath, NULL);
2518 strbuf_reset(&sb);
2519
2520 cp.no_stdin = 1;
2521 cp.no_stderr = 1;
2522 cp.out = -1;
2523 cp.git_cmd = 1;
2524
2525 if (start_command(&cp))
2526 die(_("could not start ls-files in .."));
2527
2528 len = strbuf_read(&sb, cp.out, PATH_MAX);
2529 close(cp.out);
2530
2531 if (starts_with(sb.buf, "160000")) {
2532 int super_sub_len;
2533 int cwd_len = strlen(cwd);
2534 char *super_sub, *super_wt;
2535
2536 /*
2537 * There is a superproject having this repo as a submodule.
2538 * The format is <mode> SP <hash> SP <stage> TAB <full name> \0,
2539 * We're only interested in the name after the tab.
2540 */
2541 super_sub = strchr(sb.buf, '\t') + 1;
2542 super_sub_len = strlen(super_sub);
2543
2544 if (super_sub_len > cwd_len ||
2545 strcmp(&cwd[cwd_len - super_sub_len], super_sub))
2546 BUG("returned path string doesn't match cwd?");
2547
2548 super_wt = xstrdup(cwd);
2549 super_wt[cwd_len - super_sub_len] = '\0';
2550
2551 strbuf_realpath(buf, super_wt, 1);
2552 ret = 1;
2553 free(super_wt);
2554 }
2555 free(cwd);
2556 strbuf_release(&sb);
2557
2558 code = finish_command(&cp);
2559
2560 if (code == 128)
2561 /* '../' is not a git repository */
2562 return 0;
2563 if (code == 0 && len == 0)
2564 /* There is an unrelated git repository at '../' */
2565 return 0;
2566 if (code)
2567 die(_("ls-tree returned unexpected return code %d"), code);
2568
2569 return ret;
2570 }
2571
2572 /*
2573 * Put the gitdir for a submodule (given relative to the main
2574 * repository worktree) into `buf`, or return -1 on error.
2575 */
2576 int submodule_to_gitdir(struct repository *repo,
2577 struct strbuf *buf, const char *submodule)
2578 {
2579 const struct submodule *sub;
2580 const char *git_dir;
2581 int ret = 0;
2582
2583 if (validate_submodule_path(submodule) < 0)
2584 exit(128);
2585
2586 strbuf_reset(buf);
2587 strbuf_addstr(buf, submodule);
2588 strbuf_complete(buf, '/');
2589 strbuf_addstr(buf, ".git");
2590
2591 git_dir = read_gitfile(buf->buf);
2592 if (git_dir) {
2593 strbuf_reset(buf);
2594 strbuf_addstr(buf, git_dir);
2595 }
2596 if (!is_git_directory(buf->buf)) {
2597 sub = submodule_from_path(repo, null_oid(the_hash_algo), submodule);
2598 if (!sub) {
2599 ret = -1;
2600 goto cleanup;
2601 }
2602 strbuf_reset(buf);
2603 submodule_name_to_gitdir(buf, repo, sub->name);
2604 }
2605
2606 cleanup:
2607 return ret;
2608 }
2609
/*
 * Append the git directory used for the submodule named `submodule_name`
 * in repository `r` to `buf`: the repository's git path for "modules/",
 * followed by the name itself.
 */
void submodule_name_to_gitdir(struct strbuf *buf, struct repository *r,
			      const char *submodule_name)
{
	/*
	 * NEEDSWORK: Mapping a submodule's name straight to a location
	 * below .git/modules/ breaks down for some naming schemes:
	 *
	 *  - one submodule named "foo" and another named "foo/bar"; they
	 *    need not even be part of the same superproject commit, it is
	 *    enough that both commits have been checked out at some point
	 *    in time;
	 *
	 *  - two submodule names that differ only in case, on a
	 *    case-insensitive filesystem.
	 *
	 * Several solutions are possible:
	 *
	 *  - encode the path in some way;
	 *
	 *  - introduce a submodule.<name>.gitdir config in .git/config
	 *    (not .gitmodules) that overrides where the gitdir of a
	 *    submodule is, and teach Git to pick a non-clashing name
	 *    automatically and write such a config when it notices a
	 *    clash;
	 *
	 *  - introduce a submodule.<name>.gitdir config in .gitmodules
	 *    that repo administrators can set explicitly.
	 *
	 * Nothing has been decided, so for now the name is simply appended
	 * at the end of the path.
	 */
	repo_git_path_append(r, buf, "modules/");
	strbuf_addstr(buf, submodule_name);
}