submodule.c 52.1 KB
Newer Older
1
#include "cache.h"
2
#include "submodule-config.h"
3 4 5 6 7
#include "submodule.h"
#include "dir.h"
#include "diff.h"
#include "commit.h"
#include "revision.h"
8
#include "run-command.h"
9
#include "diffcore.h"
10
#include "refs.h"
11
#include "string-list.h"
12
#include "sha1-array.h"
13
#include "argv-array.h"
14
#include "blob.h"
15
#include "thread-utils.h"
16
#include "quote.h"
17
#include "remote.h"
18
#include "worktree.h"
19

20
static int config_fetch_recurse_submodules = RECURSE_SUBMODULES_ON_DEMAND;
21
static int config_update_recurse_submodules = RECURSE_SUBMODULES_OFF;
22
static int parallel_jobs = 1;
23
static struct string_list changed_submodule_paths = STRING_LIST_INIT_DUP;
24
static int initialized_fetch_ref_tips;
25 26
static struct oid_array ref_tips_before_fetch;
static struct oid_array ref_tips_after_fetch;
27

28 29 30 31 32 33 34 35 36
/*
 * The following flag is set if the .gitmodules file is unmerged. We then
 * disable recursion for all submodules where .git/config doesn't have a
 * matching config entry because we can't guess what might be configured in
 * .gitmodules unless the user resolves the conflict. When a command line
 * option is given (which always overrides configuration) this flag will be
 * ignored.
 */
static int gitmodules_is_unmerged;
37

38 39 40 41 42 43 44 45 46 47 48 49 50 51 52
/*
 * This flag is set if the .gitmodules file had unstaged modifications on
 * startup. This must be checked before allowing modifications to the
 * .gitmodules file with the intention to stage them later, because when
 * continuing we would stage the modifications the user didn't stage herself
 * too. That might change in a future version when we learn to stage the
 * changes we do ourselves without staging any previous modifications.
 */
static int gitmodules_is_modified;

/*
 * Return 1 when .gitmodules may be staged, i.e. when the
 * gitmodules_is_modified flag is not set, and 0 otherwise.
 */
int is_staging_gitmodules_ok(void)
{
	return gitmodules_is_modified ? 0 : 1;
}

53 54 55 56 57 58 59 60
/*
 * Try to update the "path" entry in the "submodule.<name>" section of the
 * .gitmodules file. Return 0 only if a .gitmodules file was found, a section
 * with the correct path=<oldpath> setting was found and we could update it.
 */
int update_path_in_gitmodules(const char *oldpath, const char *newpath)
{
	struct strbuf entry = STRBUF_INIT;
61
	const struct submodule *submodule;
62 63 64 65 66 67 68

	if (!file_exists(".gitmodules")) /* Do nothing without .gitmodules */
		return -1;

	if (gitmodules_is_unmerged)
		die(_("Cannot change unmerged .gitmodules, resolve merge conflicts first"));

69 70
	submodule = submodule_from_path(null_sha1, oldpath);
	if (!submodule || !submodule->name) {
71 72 73 74
		warning(_("Could not find section in .gitmodules where path=%s"), oldpath);
		return -1;
	}
	strbuf_addstr(&entry, "submodule.");
75
	strbuf_addstr(&entry, submodule->name);
76
	strbuf_addstr(&entry, ".path");
77
	if (git_config_set_in_file_gently(".gitmodules", entry.buf, newpath) < 0) {
78 79 80 81 82 83 84 85 86
		/* Maybe the user already did that, don't error out here */
		warning(_("Could not update .gitmodules entry %s"), entry.buf);
		strbuf_release(&entry);
		return -1;
	}
	strbuf_release(&entry);
	return 0;
}

87 88 89 90 91 92 93 94
/*
 * Try to remove the "submodule.<name>" section from .gitmodules where the given
 * path is configured. Return 0 only if a .gitmodules file was found, a section
 * with the correct path=<path> setting was found and we could remove it.
 */
int remove_path_from_gitmodules(const char *path)
{
	struct strbuf sect = STRBUF_INIT;
95
	const struct submodule *submodule;
96 97 98 99 100 101 102

	if (!file_exists(".gitmodules")) /* Do nothing without .gitmodules */
		return -1;

	if (gitmodules_is_unmerged)
		die(_("Cannot change unmerged .gitmodules, resolve merge conflicts first"));

103 104
	submodule = submodule_from_path(null_sha1, path);
	if (!submodule || !submodule->name) {
105 106 107 108
		warning(_("Could not find section in .gitmodules where path=%s"), path);
		return -1;
	}
	strbuf_addstr(&sect, "submodule.");
109
	strbuf_addstr(&sect, submodule->name);
110 111 112 113 114 115 116 117 118 119
	if (git_config_rename_section_in_file(".gitmodules", sect.buf, NULL) < 0) {
		/* Maybe the user already did that, don't error out here */
		warning(_("Could not remove .gitmodules entry for %s"), path);
		strbuf_release(&sect);
		return -1;
	}
	strbuf_release(&sect);
	return 0;
}

120 121
/*
 * Add the .gitmodules file to the index; die if that fails.
 */
void stage_updated_gitmodules(void)
{
	int failed = add_file_to_cache(".gitmodules", 0);

	if (failed)
		die(_("staging updated .gitmodules failed"));
}

126
static int add_submodule_odb(const char *path)
127 128
{
	struct strbuf objects_directory = STRBUF_INIT;
J
Jens Lehmann 已提交
129
	int ret = 0;
130

131 132 133
	ret = strbuf_git_path_submodule(&objects_directory, path, "objects/");
	if (ret)
		goto done;
J
Jens Lehmann 已提交
134 135 136 137
	if (!is_directory(objects_directory.buf)) {
		ret = -1;
		goto done;
	}
138
	add_to_alternates_memory(objects_directory.buf);
J
Jens Lehmann 已提交
139 140 141
done:
	strbuf_release(&objects_directory);
	return ret;
142 143
}

144 145 146
void set_diffopt_flags_from_submodule_config(struct diff_options *diffopt,
					     const char *path)
{
147 148 149 150
	const struct submodule *submodule = submodule_from_path(null_sha1, path);
	if (submodule) {
		if (submodule->ignore)
			handle_ignore_submodules_arg(diffopt, submodule->ignore);
151 152
		else if (gitmodules_is_unmerged)
			DIFF_OPT_SET(diffopt, IGNORE_SUBMODULES);
153 154 155
	}
}

156
int submodule_config(const char *var, const char *value, void *cb)
157
{
158 159 160 161 162 163
	if (!strcmp(var, "submodule.fetchjobs")) {
		parallel_jobs = git_config_int(var, value);
		if (parallel_jobs < 0)
			die(_("negative values not allowed for submodule.fetchJobs"));
		return 0;
	} else if (starts_with(var, "submodule."))
164
		return parse_submodule_config_option(var, value);
165
	else if (!strcmp(var, "fetch.recursesubmodules")) {
166
		config_fetch_recurse_submodules = parse_fetch_recurse_submodules_arg(var, value);
167 168
		return 0;
	}
169 170 171
	return 0;
}

172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197
/*
 * Option callback that records the recursion mode for worktree-updating
 * commands: OFF when the option is negated, the parsed value when an
 * argument is given, and ON when the option is used without an argument.
 * Always returns 0.
 */
int option_parse_recurse_submodules_worktree_updater(const struct option *opt,
						     const char *arg, int unset)
{
	int mode;

	if (unset)
		mode = RECURSE_SUBMODULES_OFF;
	else if (arg)
		mode = parse_update_recurse_submodules_arg(opt->long_name, arg);
	else
		mode = RECURSE_SUBMODULES_ON;

	config_update_recurse_submodules = mode;
	return 0;
}

/*
 * Read the submodule configuration from .gitmodules and from the regular
 * config, unless recursion for worktree updates is switched off.
 */
void load_submodule_cache(void)
{
	if (config_update_recurse_submodules != RECURSE_SUBMODULES_OFF) {
		gitmodules_config();
		git_config(submodule_config, NULL);
	}
}

198 199 200 201 202
/*
 * Inspect the index entry for .gitmodules to set gitmodules_is_unmerged
 * and gitmodules_is_modified, then read <work tree>/.gitmodules through
 * submodule_config() unless the file is unmerged.  Does nothing when
 * there is no work tree.
 */
void gitmodules_config(void)
{
	struct strbuf gitmodules_path = STRBUF_INIT;
	const char *work_tree = get_git_work_tree();
	int pos;

	if (!work_tree)
		return;

	strbuf_addf(&gitmodules_path, "%s/.gitmodules", work_tree);
	if (read_cache() < 0)
		die("index file corrupt");

	/* 11 is the length of ".gitmodules" */
	pos = cache_name_pos(".gitmodules", 11);
	if (pos >= 0) {
		/* A merged entry exists; compare it against the work tree file. */
		struct stat st;

		if (pos < active_nr &&
		    lstat(".gitmodules", &st) == 0 &&
		    (ce_match_stat(active_cache[pos], &st, 0) & DATA_CHANGED))
			gitmodules_is_modified = 1;
	} else {
		/* No merged entry: .gitmodules is either absent or unmerged. */
		int insert_at = -1 - pos;

		if (active_nr > insert_at) {
			const struct cache_entry *ce = active_cache[insert_at];

			/* An entry with that exact name here means it is unmerged. */
			if (ce_namelen(ce) == 11 &&
			    !memcmp(ce->name, ".gitmodules", 11))
				gitmodules_is_unmerged = 1;
		}
	}

	if (!gitmodules_is_unmerged)
		git_config_from_file(submodule_config, gitmodules_path.buf, NULL);

	strbuf_release(&gitmodules_path);
}

230 231 232 233 234 235 236 237 238 239 240 241
/*
 * Look up the .gitmodules object for the commit 'commit_sha1' and, if one
 * is found, feed its contents to submodule_config().
 */
void gitmodules_config_sha1(const unsigned char *commit_sha1)
{
	unsigned char blob_sha1[20];
	struct strbuf rev = STRBUF_INIT;
	int found = gitmodule_sha1_from_commit(commit_sha1, blob_sha1, &rev);

	if (found)
		git_config_from_blob_sha1(submodule_config, rev.buf,
					  blob_sha1, NULL);

	strbuf_release(&rev);
}

242
/*
243 244 245 246 247 248
 * NEEDSWORK: With the addition of different configuration options to determine
 * if a submodule is of interests, the validity of this function's name comes
 * into question.  Once the dust has settled and more concrete terminology is
 * decided upon, come up with a more proper name for this function.  One
 * potential candidate could be 'is_submodule_active()'.
 *
249 250 251 252 253
 * Determine if a submodule has been initialized at a given 'path'
 */
int is_submodule_initialized(const char *path)
{
	int ret = 0;
254 255 256 257
	char *key = NULL;
	char *value = NULL;
	const struct string_list *sl;
	const struct submodule *module = submodule_from_path(null_sha1, path);
258

259 260 261
	/* early return if there isn't a path->module mapping */
	if (!module)
		return 0;
262

263 264 265 266 267 268 269
	/* submodule.<name>.active is set */
	key = xstrfmt("submodule.%s.active", module->name);
	if (!git_config_get_bool(key, &ret)) {
		free(key);
		return ret;
	}
	free(key);
270

271 272 273 274 275 276
	/* submodule.active is set */
	sl = git_config_get_value_multi("submodule.active");
	if (sl) {
		struct pathspec ps;
		struct argv_array args = ARGV_ARRAY_INIT;
		const struct string_list_item *item;
277

278 279 280 281 282 283 284 285 286 287
		for_each_string_list_item(item, sl) {
			argv_array_push(&args, item->string);
		}

		parse_pathspec(&ps, 0, 0, NULL, args.argv);
		ret = match_pathspec(&ps, path, strlen(path), 0, NULL, 1);

		argv_array_clear(&args);
		clear_pathspec(&ps);
		return ret;
288 289
	}

290 291 292 293 294 295
	/* fallback to checking if the URL is set */
	key = xstrfmt("submodule.%s.url", module->name);
	ret = !git_config_get_string(key, &value);

	free(value);
	free(key);
296 297 298
	return ret;
}

299
/*
 * Return 1 if "<path>/.git" resolves to a git directory, 0 otherwise.
 * 'return_error_code' is passed through to resolve_gitdir_gently().
 */
int is_submodule_populated_gently(const char *path, int *return_error_code)
{
	char *gitdir = xstrfmt("%s/.git", path);
	int populated = resolve_gitdir_gently(gitdir, return_error_code) ? 1 : 0;

	free(gitdir);
	return populated;
}

311 312 313 314 315 316 317 318 319 320 321 322 323 324 325 326 327 328 329 330 331
/*
 * Parse an update strategy string into 'dst'.  Accepts "none", "checkout",
 * "rebase", "merge", or "!<command>".  Any command previously stored in
 * 'dst' is freed first.  Returns 0 on success and -1 for an unrecognized
 * value (in which case dst->type is left untouched).
 */
int parse_submodule_update_strategy(const char *value,
		struct submodule_update_strategy *dst)
{
	static const struct {
		const char *name;
		int type;
	} keywords[] = {
		{ "none", SM_UPDATE_NONE },
		{ "checkout", SM_UPDATE_CHECKOUT },
		{ "rebase", SM_UPDATE_REBASE },
		{ "merge", SM_UPDATE_MERGE },
	};
	const char *command;
	size_t i;

	free((void*)dst->command);
	dst->command = NULL;

	for (i = 0; i < sizeof(keywords) / sizeof(keywords[0]); i++) {
		if (!strcmp(value, keywords[i].name)) {
			dst->type = keywords[i].type;
			return 0;
		}
	}

	/* "!<command>": keep everything after the '!' as the command. */
	if (skip_prefix(value, "!", &command)) {
		dst->type = SM_UPDATE_COMMAND;
		dst->command = xstrdup(command);
		return 0;
	}

	return -1;
}

332 333 334 335 336 337 338 339 340 341 342 343 344 345 346 347 348 349 350 351 352
/*
 * Return the textual form of an update strategy, or NULL when it is
 * unspecified.  For SM_UPDATE_COMMAND the result ("!<command>") is a
 * freshly allocated string; the other results are string literals.
 * NOTE(review): the return type gives callers no way to tell the two
 * apart, so the allocated variant is presumably never freed -- confirm
 * against callers.
 */
const char *submodule_strategy_to_string(const struct submodule_update_strategy *s)
{
	const char *name = NULL;

	switch (s->type) {
	case SM_UPDATE_CHECKOUT:
		name = "checkout";
		break;
	case SM_UPDATE_MERGE:
		name = "merge";
		break;
	case SM_UPDATE_REBASE:
		name = "rebase";
		break;
	case SM_UPDATE_NONE:
		name = "none";
		break;
	case SM_UPDATE_UNSPECIFIED:
		name = NULL;
		break;
	case SM_UPDATE_COMMAND:
		name = xstrfmt("!%s", s->command);
		break;
	}

	return name;
}

353 354 355
void handle_ignore_submodules_arg(struct diff_options *diffopt,
				  const char *arg)
{
356 357 358 359
	DIFF_OPT_CLR(diffopt, IGNORE_SUBMODULES);
	DIFF_OPT_CLR(diffopt, IGNORE_UNTRACKED_IN_SUBMODULES);
	DIFF_OPT_CLR(diffopt, IGNORE_DIRTY_SUBMODULES);

360 361 362 363 364 365
	if (!strcmp(arg, "all"))
		DIFF_OPT_SET(diffopt, IGNORE_SUBMODULES);
	else if (!strcmp(arg, "untracked"))
		DIFF_OPT_SET(diffopt, IGNORE_UNTRACKED_IN_SUBMODULES);
	else if (!strcmp(arg, "dirty"))
		DIFF_OPT_SET(diffopt, IGNORE_DIRTY_SUBMODULES);
366
	else if (strcmp(arg, "none"))
367 368 369
		die("bad --ignore-submodules argument: %s", arg);
}

370 371
static int prepare_submodule_summary(struct rev_info *rev, const char *path,
		struct commit *left, struct commit *right,
372
		struct commit_list *merge_bases)
373
{
374
	struct commit_list *list;
375 376 377 378 379 380 381 382 383 384 385

	init_revisions(rev, NULL);
	setup_revisions(0, NULL, rev, NULL);
	rev->left_right = 1;
	rev->first_parent_only = 1;
	left->object.flags |= SYMMETRIC_LEFT;
	add_pending_object(rev, &left->object, path);
	add_pending_object(rev, &right->object, path);
	for (list = merge_bases; list; list = list->next) {
		list->item->object.flags |= UNINTERESTING;
		add_pending_object(rev, &list->item->object,
386
			oid_to_hex(&list->item->object.oid));
387 388 389 390 391
	}
	return prepare_revision_walk(rev);
}

static void print_submodule_summary(struct rev_info *rev, FILE *f,
392
		const char *line_prefix,
393 394 395 396 397 398 399 400 401
		const char *del, const char *add, const char *reset)
{
	static const char format[] = "  %m %s";
	struct strbuf sb = STRBUF_INIT;
	struct commit *commit;

	while ((commit = get_revision(rev))) {
		struct pretty_print_context ctx = {0};
		ctx.date_mode = rev->date_mode;
402
		ctx.output_encoding = get_log_output_encoding();
403
		strbuf_setlen(&sb, 0);
404
		strbuf_addstr(&sb, line_prefix);
405 406 407 408 409 410 411 412 413 414 415 416 417 418 419
		if (commit->object.flags & SYMMETRIC_LEFT) {
			if (del)
				strbuf_addstr(&sb, del);
		}
		else if (add)
			strbuf_addstr(&sb, add);
		format_commit_message(commit, format, &sb, &ctx);
		if (reset)
			strbuf_addstr(&sb, reset);
		strbuf_addch(&sb, '\n');
		fprintf(f, "%s", sb.buf);
	}
	strbuf_release(&sb);
}

420 421 422 423 424 425 426 427 428 429 430 431 432 433 434 435 436
/*
 * Append every name in local_repo_env to 'out', except
 * CONFIG_DATA_ENVIRONMENT.
 */
static void prepare_submodule_repo_env_no_git_dir(struct argv_array *out)
{
	size_t i;

	for (i = 0; local_repo_env[i]; i++) {
		const char *name = local_repo_env[i];

		if (!strcmp(name, CONFIG_DATA_ENVIRONMENT))
			continue;
		argv_array_push(out, name);
	}
}

/*
 * Fill 'out' with the environment entries for a command run inside a
 * submodule: the names added by prepare_submodule_repo_env_no_git_dir(),
 * followed by GIT_DIR_ENVIRONMENT set to DEFAULT_GIT_DIR_ENVIRONMENT.
 */
void prepare_submodule_repo_env(struct argv_array *out)
{
	prepare_submodule_repo_env_no_git_dir(out);
	argv_array_pushf(out, "%s=%s",
			 GIT_DIR_ENVIRONMENT, DEFAULT_GIT_DIR_ENVIRONMENT);
}

437 438 439 440 441 442
/* Helper function to display the submodule header line prior to the full
 * summary output. If it can locate the submodule objects directory it will
 * attempt to lookup both the left and right commits and put them into the
 * left and right pointers.
 */
static void show_submodule_header(FILE *f, const char *path,
443
		const char *line_prefix,
444
		struct object_id *one, struct object_id *two,
445
		unsigned dirty_submodule, const char *meta,
446 447 448
		const char *reset,
		struct commit **left, struct commit **right,
		struct commit_list **merge_bases)
449 450 451 452 453
{
	const char *message = NULL;
	struct strbuf sb = STRBUF_INIT;
	int fast_forward = 0, fast_backward = 0;

454
	if (dirty_submodule & DIRTY_SUBMODULE_UNTRACKED)
455 456
		fprintf(f, "%sSubmodule %s contains untracked content\n",
			line_prefix, path);
457
	if (dirty_submodule & DIRTY_SUBMODULE_MODIFIED)
458 459
		fprintf(f, "%sSubmodule %s contains modified content\n",
			line_prefix, path);
460

461 462 463 464 465 466 467 468 469 470 471 472 473 474 475 476 477 478 479 480 481 482 483 484 485 486 487 488 489 490 491 492 493 494
	if (is_null_oid(one))
		message = "(new submodule)";
	else if (is_null_oid(two))
		message = "(submodule deleted)";

	if (add_submodule_odb(path)) {
		if (!message)
			message = "(not initialized)";
		goto output_header;
	}

	/*
	 * Attempt to lookup the commit references, and determine if this is
	 * a fast forward or fast backwards update.
	 */
	*left = lookup_commit_reference(one->hash);
	*right = lookup_commit_reference(two->hash);

	/*
	 * Warn about missing commits in the submodule project, but only if
	 * they aren't null.
	 */
	if ((!is_null_oid(one) && !*left) ||
	     (!is_null_oid(two) && !*right))
		message = "(commits not present)";

	*merge_bases = get_merge_bases(*left, *right);
	if (*merge_bases) {
		if ((*merge_bases)->item == *left)
			fast_forward = 1;
		else if ((*merge_bases)->item == *right)
			fast_backward = 1;
	}

495
	if (!oidcmp(one, two)) {
496 497 498 499
		strbuf_release(&sb);
		return;
	}

500
output_header:
501
	strbuf_addf(&sb, "%s%sSubmodule %s ", line_prefix, meta, path);
J
Junio C Hamano 已提交
502
	strbuf_add_unique_abbrev(&sb, one->hash, DEFAULT_ABBREV);
503
	strbuf_addstr(&sb, (fast_backward || fast_forward) ? ".." : "...");
J
Junio C Hamano 已提交
504
	strbuf_add_unique_abbrev(&sb, two->hash, DEFAULT_ABBREV);
505
	if (message)
506
		strbuf_addf(&sb, " %s%s\n", message, reset);
507
	else
508
		strbuf_addf(&sb, "%s:%s\n", fast_backward ? " (rewind)" : "", reset);
509 510 511 512
	fwrite(sb.buf, sb.len, 1, f);

	strbuf_release(&sb);
}
513

514 515 516 517 518 519 520 521 522 523 524 525 526 527 528 529 530 531 532 533 534 535 536 537 538 539 540 541 542 543 544 545 546 547 548 549
/*
 * Print the header for a submodule change and, when both the old and the
 * new commit could be looked up, a one-line-per-commit summary of what
 * lies between them.
 *
 * 'one'/'two' are the old and new submodule commits, 'dirty_submodule'
 * carries the DIRTY_SUBMODULE_* bits, and 'meta', 'del', 'add' and 'reset'
 * are strings inserted around the respective parts of the output.
 */
void show_submodule_summary(FILE *f, const char *path,
		const char *line_prefix,
		struct object_id *one, struct object_id *two,
		unsigned dirty_submodule, const char *meta,
		const char *del, const char *add, const char *reset)
{
	struct rev_info rev;
	struct commit *left = NULL, *right = NULL;
	struct commit_list *merge_bases = NULL;

	show_submodule_header(f, path, line_prefix, one, two, dirty_submodule,
			      meta, reset, &left, &right, &merge_bases);

	/*
	 * If we don't have both a left and a right pointer, there is no
	 * reason to try and display a summary. The header line should contain
	 * all the information the user needs.
	 */
	if (!left || !right)
		goto out;

	/* Treat revision walker failure the same as missing commits */
	if (prepare_submodule_summary(&rev, path, left, right, merge_bases)) {
		fprintf(f, "%s(revision walker failed)\n", line_prefix);
		goto out;
	}

	print_submodule_summary(&rev, f, line_prefix, del, add, reset);

out:
	if (merge_bases)
		free_commit_list(merge_bases);
	/*
	 * Either commit may be NULL when we bailed out early, so guard the
	 * cleanup the same way show_submodule_inline_diff() does.
	 */
	if (left)
		clear_commit_marks(left, ~0);
	if (right)
		clear_commit_marks(right, ~0);
}

550 551 552 553 554 555 556 557 558 559 560 561 562 563 564 565 566 567 568 569 570 571 572 573 574 575 576 577 578 579 580 581 582 583 584 585 586 587 588 589 590 591 592 593 594 595 596 597 598 599 600 601 602 603 604 605
/*
 * Print the header for a submodule change and then run "git diff" inside
 * the submodule so that its output is written inline to 'f'.
 *
 * A side whose commit is missing because its object id is null is diffed
 * as the empty tree.  If the submodule has modified content, the new side
 * is omitted so the child diffs against the submodule's work tree.
 * "(diff failed)" is written to 'f' if the child cannot be run or fails.
 */
void show_submodule_inline_diff(FILE *f, const char *path,
		const char *line_prefix,
		struct object_id *one, struct object_id *two,
		unsigned dirty_submodule, const char *meta,
		const char *del, const char *add, const char *reset,
		const struct diff_options *o)
{
	const struct object_id *old = &empty_tree_oid, *new = &empty_tree_oid;
	struct commit *left = NULL, *right = NULL;
	struct commit_list *merge_bases = NULL;
	struct child_process cp = CHILD_PROCESS_INIT;
	int out_fd;

	show_submodule_header(f, path, line_prefix, one, two, dirty_submodule,
			      meta, reset, &left, &right, &merge_bases);

	/* We need a valid left and right commit to display a difference */
	if (!(left || is_null_oid(one)) ||
	    !(right || is_null_oid(two)))
		goto done;

	if (left)
		old = one;
	if (right)
		new = two;

	fflush(f);

	/*
	 * The child writes to a duplicate of f's descriptor.  A failed dup()
	 * must not reach cp.out: a negative value there asks the run-command
	 * machinery to create a pipe, which nobody here would read.
	 */
	out_fd = dup(fileno(f));
	if (out_fd < 0) {
		fprintf(f, "(diff failed)\n");
		goto done;
	}

	cp.git_cmd = 1;
	cp.dir = path;
	cp.out = out_fd;
	cp.no_stdin = 1;

	/* TODO: other options may need to be passed here. */
	argv_array_push(&cp.args, "diff");
	argv_array_pushf(&cp.args, "--line-prefix=%s", line_prefix);
	if (DIFF_OPT_TST(o, REVERSE_DIFF)) {
		/* Reversed diff: swap the a/ and b/ prefixes. */
		argv_array_pushf(&cp.args, "--src-prefix=%s%s/",
				 o->b_prefix, path);
		argv_array_pushf(&cp.args, "--dst-prefix=%s%s/",
				 o->a_prefix, path);
	} else {
		argv_array_pushf(&cp.args, "--src-prefix=%s%s/",
				 o->a_prefix, path);
		argv_array_pushf(&cp.args, "--dst-prefix=%s%s/",
				 o->b_prefix, path);
	}
	argv_array_push(&cp.args, oid_to_hex(old));
	/*
	 * If the submodule has modified content, we will diff against the
	 * work tree, under the assumption that the user has asked for the
	 * diff format and wishes to actually see all differences even if they
	 * haven't yet been committed to the submodule yet.
	 */
	if (!(dirty_submodule & DIRTY_SUBMODULE_MODIFIED))
		argv_array_push(&cp.args, oid_to_hex(new));

	prepare_submodule_repo_env(&cp.env_array);
	if (run_command(&cp))
		fprintf(f, "(diff failed)\n");

done:
	if (merge_bases)
		free_commit_list(merge_bases);
	if (left)
		clear_commit_marks(left, ~0);
	if (right)
		clear_commit_marks(right, ~0);
}

620 621 622 623 624
/*
 * Override the file-level fetch recursion setting with 'value'.
 */
void set_config_fetch_recurse_submodules(int value)
{
	config_fetch_recurse_submodules = value;
}

625 626 627 628 629 630 631 632 633 634 635 636 637 638 639 640
/*
 * Return 1 when recursion for worktree updates is set to
 * RECURSE_SUBMODULES_ON, 0 otherwise.
 */
int should_update_submodules(void)
{
	if (config_update_recurse_submodules == RECURSE_SUBMODULES_ON)
		return 1;
	return 0;
}

/*
 * Return the submodule configured for the path of index entry 'ce', or
 * NULL if the entry is not a gitlink or submodules should not be updated.
 */
const struct submodule *submodule_from_ce(const struct cache_entry *ce)
{
	if (S_ISGITLINK(ce->ce_mode) && should_update_submodules())
		return submodule_from_path(null_sha1, ce->name);

	return NULL;
}

641 642 643 644 645 646 647 648 649 650 651 652 653 654 655 656 657 658 659 660 661 662 663 664 665 666 667 668 669 670 671 672 673 674 675 676 677 678 679 680 681 682 683 684 685 686 687 688 689 690 691 692 693 694 695 696 697 698 699 700 701 702 703 704 705 706 707 708 709 710 711 712 713 714 715 716 717 718 719 720 721 722 723 724 725 726 727 728
/*
 * Return the oid_array stored in the 'util' field of the entry for 'path'
 * in 'submodules', inserting the entry and allocating a zeroed array on
 * first use.
 */
static struct oid_array *submodule_commits(struct string_list *submodules,
					   const char *path)
{
	struct string_list_item *entry = string_list_insert(submodules, path);

	/* NEEDSWORK: should we have oid_array_init()? */
	if (!entry->util)
		entry->util = xcalloc(1, sizeof(struct oid_array));

	return entry->util;
}

static void collect_changed_submodules_cb(struct diff_queue_struct *q,
					  struct diff_options *options,
					  void *data)
{
	int i;
	struct string_list *changed = data;

	for (i = 0; i < q->nr; i++) {
		struct diff_filepair *p = q->queue[i];
		struct oid_array *commits;
		if (!S_ISGITLINK(p->two->mode))
			continue;

		if (S_ISGITLINK(p->one->mode)) {
			/*
			 * NEEDSWORK: We should honor the name configured in
			 * the .gitmodules file of the commit we are examining
			 * here to be able to correctly follow submodules
			 * being moved around.
			 */
			commits = submodule_commits(changed, p->two->path);
			oid_array_append(commits, &p->two->oid);
		} else {
			/* Submodule is new or was moved here */
			/*
			 * NEEDSWORK: When the .git directories of submodules
			 * live inside the superprojects .git directory some
			 * day we should fetch new submodules directly into
			 * that location too when config or options request
			 * that so they can be checked out from there.
			 */
			continue;
		}
	}
}

/*
 * Collect the paths of submodules in 'changed' which have changed based on
 * the revisions as specified in 'argv'.  Each entry in 'changed' will also
 * have a corresponding 'struct oid_array' (in the 'util' field) which lists
 * what the submodule pointers were updated to during the change.
 */
static void collect_changed_submodules(struct string_list *changed,
				       struct argv_array *argv)
{
	struct rev_info rev;
	const struct commit *commit;

	init_revisions(&rev, NULL);
	setup_revisions(argv->argc, argv->argv, &rev, NULL);
	if (prepare_revision_walk(&rev))
		die("revision walk setup failed");

	while ((commit = get_revision(&rev))) {
		struct rev_info diff_rev;

		init_revisions(&diff_rev, NULL);
		diff_rev.diffopt.output_format |= DIFF_FORMAT_CALLBACK;
		diff_rev.diffopt.format_callback = collect_changed_submodules_cb;
		diff_rev.diffopt.format_callback_data = changed;
		diff_tree_combined_merge(commit, 1, &diff_rev);
	}

	reset_revision_walk();
}

static void free_submodules_oids(struct string_list *submodules)
{
	struct string_list_item *item;
	for_each_string_list_item(item, submodules)
		oid_array_clear((struct oid_array *) item->util);
	string_list_clear(submodules, 1);
}

729 730
/*
 * Ref callback that returns 1 unconditionally, ignoring its arguments.
 * It is passed to for_each_remote_ref_submodule() by the callers that
 * test that function's result with "> 0".
 */
static int has_remote(const char *refname, const struct object_id *oid,
		      int flags, void *cb_data)
{
	const int found = 1;

	return found;
}

735
/*
 * oid_array iteration callback: push the hex form of 'oid' onto the
 * argv_array passed as 'data'.  Always returns 0.
 */
static int append_oid_to_argv(const struct object_id *oid, void *data)
{
	struct argv_array *args = data;
	const char *hex = oid_to_hex(oid);

	argv_array_push(args, hex);
	return 0;
}

742
static int check_has_commit(const struct object_id *oid, void *data)
743
{
744 745
	int *has_commit = data;

746
	if (!lookup_commit_reference(oid->hash))
747 748 749 750 751
		*has_commit = 0;

	return 0;
}

752
static int submodule_has_commits(const char *path, struct oid_array *commits)
753 754 755
{
	int has_commit = 1;

756 757 758 759 760 761 762 763 764
	/*
	 * Perform a cheap, but incorrect check for the existance of 'commits'.
	 * This is done by adding the submodule's object store to the in-core
	 * object store, and then querying for each commit's existance.  If we
	 * do not have the commit object anywhere, there is no chance we have
	 * it in the object store of the correct submodule and have it
	 * reachable from a ref, so we can fail early without spawning rev-list
	 * which is expensive.
	 */
765 766 767
	if (add_submodule_odb(path))
		return 0;

768
	oid_array_for_each_unique(commits, check_has_commit, &has_commit);
769 770 771 772 773 774 775 776 777 778 779 780 781 782 783 784 785 786 787 788 789 790 791 792 793

	if (has_commit) {
		/*
		 * Even if the submodule is checked out and the commit is
		 * present, make sure it exists in the submodule's object store
		 * and that it is reachable from a ref.
		 */
		struct child_process cp = CHILD_PROCESS_INIT;
		struct strbuf out = STRBUF_INIT;

		argv_array_pushl(&cp.args, "rev-list", "-n", "1", NULL);
		oid_array_for_each_unique(commits, append_oid_to_argv, &cp.args);
		argv_array_pushl(&cp.args, "--not", "--all", NULL);

		prepare_submodule_repo_env(&cp.env_array);
		cp.git_cmd = 1;
		cp.no_stdin = 1;
		cp.dir = path;

		if (capture_command(&cp, &out, GIT_MAX_HEXSZ + 1) || out.len)
			has_commit = 0;

		strbuf_release(&out);
	}

794 795 796
	return has_commit;
}

797
static int submodule_needs_pushing(const char *path, struct oid_array *commits)
798 799
{
	if (!submodule_has_commits(path, commits))
800 801 802 803 804 805 806 807 808 809 810
		/*
		 * NOTE: We do consider it safe to return "no" here. The
		 * correct answer would be "We do not know" instead of
		 * "No push needed", but it is quite hard to change
		 * the submodule pointer without having the submodule
		 * around. If a user did however change the submodules
		 * without having the submodule around, this indicates
		 * an expert who knows what they are doing or a
		 * maintainer integrating work from other people. In
		 * both cases it should be safe to skip this check.
		 */
811 812 813
		return 0;

	if (for_each_remote_ref_submodule(path, has_remote, NULL) > 0) {
814
		struct child_process cp = CHILD_PROCESS_INIT;
815 816 817
		struct strbuf buf = STRBUF_INIT;
		int needs_pushing = 0;

818
		argv_array_push(&cp.args, "rev-list");
819
		oid_array_for_each_unique(commits, append_oid_to_argv, &cp.args);
820 821
		argv_array_pushl(&cp.args, "--not", "--remotes", "-n", "1" , NULL);

822
		prepare_submodule_repo_env(&cp.env_array);
823 824 825 826 827
		cp.git_cmd = 1;
		cp.no_stdin = 1;
		cp.out = -1;
		cp.dir = path;
		if (start_command(&cp))
828 829
			die("Could not run 'git rev-list <commits> --not --remotes -n 1' command in submodule %s",
					path);
830 831 832 833 834 835 836 837 838 839 840
		if (strbuf_read(&buf, cp.out, 41))
			needs_pushing = 1;
		finish_command(&cp);
		close(cp.out);
		strbuf_release(&buf);
		return needs_pushing;
	}

	return 0;
}

841
int find_unpushed_submodules(struct oid_array *commits,
842
		const char *remotes_name, struct string_list *needs_pushing)
843
{
844 845
	struct string_list submodules = STRING_LIST_INIT_DUP;
	struct string_list_item *submodule;
846
	struct argv_array argv = ARGV_ARRAY_INIT;
847

848 849
	/* argv.argv[0] will be ignored by setup_revisions */
	argv_array_push(&argv, "find_unpushed_submodules");
850
	oid_array_for_each_unique(commits, append_oid_to_argv, &argv);
851 852 853
	argv_array_push(&argv, "--not");
	argv_array_pushf(&argv, "--remotes=%s", remotes_name);

854
	collect_changed_submodules(&submodules, &argv);
855

856
	for_each_string_list_item(submodule, &submodules) {
857 858
		struct oid_array *commits = submodule->util;
		const char *path = submodule->string;
859

860 861
		if (submodule_needs_pushing(path, commits))
			string_list_insert(needs_pushing, path);
862
	}
863 864

	free_submodules_oids(&submodules);
865
	argv_array_clear(&argv);
866

867
	return needs_pushing->nr;
868 869
}

870
static int push_submodule(const char *path,
871 872
			  const struct remote *remote,
			  const char **refspec, int refspec_nr,
873 874
			  const struct string_list *push_options,
			  int dry_run)
875 876 877 878 879
{
	if (add_submodule_odb(path))
		return 1;

	if (for_each_remote_ref_submodule(path, has_remote, NULL) > 0) {
880
		struct child_process cp = CHILD_PROCESS_INIT;
881 882 883
		argv_array_push(&cp.args, "push");
		if (dry_run)
			argv_array_push(&cp.args, "--dry-run");
884

885 886 887 888 889 890
		if (push_options && push_options->nr) {
			const struct string_list_item *item;
			for_each_string_list_item(item, push_options)
				argv_array_pushf(&cp.args, "--push-option=%s",
						 item->string);
		}
891 892 893 894 895 896 897 898

		if (remote->origin != REMOTE_UNCONFIGURED) {
			int i;
			argv_array_push(&cp.args, remote->name);
			for (i = 0; i < refspec_nr; i++)
				argv_array_push(&cp.args, refspec[i]);
		}

899
		prepare_submodule_repo_env(&cp.env_array);
900 901 902 903 904 905 906 907 908 909 910
		cp.git_cmd = 1;
		cp.no_stdin = 1;
		cp.dir = path;
		if (run_command(&cp))
			return 0;
		close(cp.out);
	}

	return 1;
}

911 912 913 914 915 916 917 918 919 920 921 922 923 924 925 926 927 928 929 930 931 932 933 934 935 936 937 938 939 940 941 942
/*
 * Perform a check in the submodule to see if the remote and refspec work.
 * Die if the submodule can't be pushed.
 */
static void submodule_push_check(const char *path, const struct remote *remote,
				 const char **refspec, int refspec_nr)
{
	struct child_process cp = CHILD_PROCESS_INIT;
	int i;

	argv_array_push(&cp.args, "submodule--helper");
	argv_array_push(&cp.args, "push-check");
	argv_array_push(&cp.args, remote->name);

	for (i = 0; i < refspec_nr; i++)
		argv_array_push(&cp.args, refspec[i]);

	prepare_submodule_repo_env(&cp.env_array);
	cp.git_cmd = 1;
	cp.no_stdin = 1;
	cp.no_stdout = 1;
	cp.dir = path;

	/*
	 * Simply indicate if 'submodule--helper push-check' failed.
	 * More detailed error information will be provided by the
	 * child process.
	 */
	if (run_command(&cp))
		die("process for submodule '%s' failed", path);
}

943
int push_unpushed_submodules(struct oid_array *commits,
944 945
			     const struct remote *remote,
			     const char **refspec, int refspec_nr,
946
			     const struct string_list *push_options,
947
			     int dry_run)
948 949
{
	int i, ret = 1;
950
	struct string_list needs_pushing = STRING_LIST_INIT_DUP;
951

952
	if (!find_unpushed_submodules(commits, remote->name, &needs_pushing))
953 954
		return 1;

955 956 957 958 959 960 961 962 963 964 965 966
	/*
	 * Verify that the remote and refspec can be propagated to all
	 * submodules.  This check can be skipped if the remote and refspec
	 * won't be propagated due to the remote being unconfigured (e.g. a URL
	 * instead of a remote name).
	 */
	if (remote->origin != REMOTE_UNCONFIGURED)
		for (i = 0; i < needs_pushing.nr; i++)
			submodule_push_check(needs_pushing.items[i].string,
					     remote, refspec, refspec_nr);

	/* Actually push the submodules */
967 968 969
	for (i = 0; i < needs_pushing.nr; i++) {
		const char *path = needs_pushing.items[i].string;
		fprintf(stderr, "Pushing submodule '%s'\n", path);
970 971
		if (!push_submodule(path, remote, refspec, refspec_nr,
				    push_options, dry_run)) {
972 973 974 975 976 977 978 979 980 981
			fprintf(stderr, "Unable to push submodule '%s'\n", path);
			ret = 0;
		}
	}

	string_list_clear(&needs_pushing, 0);

	return ret;
}

982 983
/*
 * Ref iteration callback: append "oid" to the oid_array passed in as
 * "data".  The ref name and flags are ignored.  Always returns 0.
 */
static int append_oid_to_array(const char *ref, const struct object_id *oid,
			       int flags, void *data)
{
	struct oid_array *tips = data;

	oid_array_append(tips, oid);

	return 0;
}

990
void check_for_new_submodule_commits(struct object_id *oid)
991 992
{
	if (!initialized_fetch_ref_tips) {
993
		for_each_ref(append_oid_to_array, &ref_tips_before_fetch);
994 995 996
		initialized_fetch_ref_tips = 1;
	}

997
	oid_array_append(&ref_tips_after_fetch, oid);
998 999 1000
}

static void calculate_changed_submodule_paths(void)
1001
{
1002
	struct argv_array argv = ARGV_ARRAY_INIT;
1003 1004
	struct string_list changed_submodules = STRING_LIST_INIT_DUP;
	const struct string_list_item *item;
1005

1006
	/* No need to check if there are no submodules configured */
1007
	if (!submodule_from_path(NULL, NULL))
1008 1009
		return;

1010
	argv_array_push(&argv, "--"); /* argv[0] program name */
1011
	oid_array_for_each_unique(&ref_tips_after_fetch,
1012
				   append_oid_to_argv, &argv);
1013
	argv_array_push(&argv, "--not");
1014
	oid_array_for_each_unique(&ref_tips_before_fetch,
1015
				   append_oid_to_argv, &argv);
1016 1017 1018 1019 1020

	/*
	 * Collect all submodules (whether checked out or not) for which new
	 * commits have been recorded upstream in "changed_submodule_paths".
	 */
1021 1022 1023 1024 1025 1026 1027 1028
	collect_changed_submodules(&changed_submodules, &argv);

	for_each_string_list_item(item, &changed_submodules) {
		struct oid_array *commits = item->util;
		const char *path = item->string;

		if (!submodule_has_commits(path, commits))
			string_list_append(&changed_submodule_paths, path);
1029
	}
1030

1031
	free_submodules_oids(&changed_submodules);
1032
	argv_array_clear(&argv);
1033 1034
	oid_array_clear(&ref_tips_before_fetch);
	oid_array_clear(&ref_tips_after_fetch);
1035
	initialized_fetch_ref_tips = 0;
1036 1037
}

1038 1039 1040 1041 1042 1043 1044 1045 1046 1047 1048 1049 1050
/*
 * State shared by the callbacks that fetch_populated_submodules() hands
 * to run_processes_parallel().
 */
struct submodule_parallel_fetch {
	/* index of the next active_cache[] entry get_next_submodule() looks at */
	int count;
	/* arguments common to every child; copied into each child's args */
	struct argv_array args;
	/* result of get_git_work_tree(); submodule paths are built below it */
	const char *work_tree;
	/* prepended to the entry name in messages and in --submodule-prefix */
	const char *prefix;
	/* compared against the RECURSE_SUBMODULES_* values */
	int command_line_option;
	/* non-zero suppresses the "Fetching submodule" message */
	int quiet;
	/* set to 1 when a child fails to start or finishes with non-zero */
	int result;
};
/* Positional initializer: must list the fields in declaration order. */
#define SPF_INIT {0, ARGV_ARRAY_INIT, NULL, NULL, 0, 0, 0}

static int get_next_submodule(struct child_process *cp,
			      struct strbuf *err, void *data, void **task_cb)
1051
{
1052 1053
	int ret = 0;
	struct submodule_parallel_fetch *spf = data;
1054

1055
	for (; spf->count < active_nr; spf->count++) {
1056 1057 1058
		struct strbuf submodule_path = STRBUF_INIT;
		struct strbuf submodule_git_dir = STRBUF_INIT;
		struct strbuf submodule_prefix = STRBUF_INIT;
1059
		const struct cache_entry *ce = active_cache[spf->count];
1060 1061
		const char *git_dir, *default_argv;
		const struct submodule *submodule;
1062 1063 1064 1065

		if (!S_ISGITLINK(ce->ce_mode))
			continue;

1066 1067 1068
		submodule = submodule_from_path(null_sha1, ce->name);
		if (!submodule)
			submodule = submodule_from_name(null_sha1, ce->name);
1069

1070
		default_argv = "yes";
1071
		if (spf->command_line_option == RECURSE_SUBMODULES_DEFAULT) {
1072 1073 1074 1075 1076
			if (submodule &&
			    submodule->fetch_recurse !=
						RECURSE_SUBMODULES_NONE) {
				if (submodule->fetch_recurse ==
						RECURSE_SUBMODULES_OFF)
1077
					continue;
1078 1079
				if (submodule->fetch_recurse ==
						RECURSE_SUBMODULES_ON_DEMAND) {
1080 1081 1082 1083
					if (!unsorted_string_list_lookup(&changed_submodule_paths, ce->name))
						continue;
					default_argv = "on-demand";
				}
1084
			} else {
1085 1086
				if ((config_fetch_recurse_submodules == RECURSE_SUBMODULES_OFF) ||
				    gitmodules_is_unmerged)
1087
					continue;
1088 1089 1090 1091 1092
				if (config_fetch_recurse_submodules == RECURSE_SUBMODULES_ON_DEMAND) {
					if (!unsorted_string_list_lookup(&changed_submodule_paths, ce->name))
						continue;
					default_argv = "on-demand";
				}
1093
			}
1094
		} else if (spf->command_line_option == RECURSE_SUBMODULES_ON_DEMAND) {
1095 1096 1097
			if (!unsorted_string_list_lookup(&changed_submodule_paths, ce->name))
				continue;
			default_argv = "on-demand";
1098 1099
		}

1100
		strbuf_addf(&submodule_path, "%s/%s", spf->work_tree, ce->name);
1101
		strbuf_addf(&submodule_git_dir, "%s/.git", submodule_path.buf);
1102
		strbuf_addf(&submodule_prefix, "%s%s/", spf->prefix, ce->name);
1103
		git_dir = read_gitfile(submodule_git_dir.buf);
1104 1105 1106
		if (!git_dir)
			git_dir = submodule_git_dir.buf;
		if (is_directory(git_dir)) {
1107 1108
			child_process_init(cp);
			cp->dir = strbuf_detach(&submodule_path, NULL);
1109
			prepare_submodule_repo_env(&cp->env_array);
1110 1111 1112 1113 1114 1115 1116 1117 1118 1119
			cp->git_cmd = 1;
			if (!spf->quiet)
				strbuf_addf(err, "Fetching submodule %s%s\n",
					    spf->prefix, ce->name);
			argv_array_init(&cp->args);
			argv_array_pushv(&cp->args, spf->args.argv);
			argv_array_push(&cp->args, default_argv);
			argv_array_push(&cp->args, "--submodule-prefix");
			argv_array_push(&cp->args, submodule_prefix.buf);
			ret = 1;
1120 1121 1122 1123
		}
		strbuf_release(&submodule_path);
		strbuf_release(&submodule_git_dir);
		strbuf_release(&submodule_prefix);
1124 1125 1126 1127
		if (ret) {
			spf->count++;
			return 1;
		}
1128
	}
1129 1130 1131
	return 0;
}

1132
static int fetch_start_failure(struct strbuf *err,
1133 1134 1135 1136 1137 1138 1139 1140 1141
			       void *cb, void *task_cb)
{
	struct submodule_parallel_fetch *spf = cb;

	spf->result = 1;

	return 0;
}

1142 1143
static int fetch_finish(int retvalue, struct strbuf *err,
			void *cb, void *task_cb)
1144 1145 1146 1147 1148 1149 1150 1151 1152 1153 1154
{
	struct submodule_parallel_fetch *spf = cb;

	if (retvalue)
		spf->result = 1;

	return 0;
}

int fetch_populated_submodules(const struct argv_array *options,
			       const char *prefix, int command_line_option,
1155
			       int quiet, int max_parallel_jobs)
1156 1157 1158 1159 1160 1161 1162 1163 1164 1165 1166 1167 1168 1169 1170 1171 1172 1173 1174 1175 1176
{
	int i;
	struct submodule_parallel_fetch spf = SPF_INIT;

	spf.work_tree = get_git_work_tree();
	spf.command_line_option = command_line_option;
	spf.quiet = quiet;
	spf.prefix = prefix;

	if (!spf.work_tree)
		goto out;

	if (read_cache() < 0)
		die("index file corrupt");

	argv_array_push(&spf.args, "fetch");
	for (i = 0; i < options->argc; i++)
		argv_array_push(&spf.args, options->argv[i]);
	argv_array_push(&spf.args, "--recurse-submodules-default");
	/* default value, "--submodule-prefix" and its value are added later */

1177 1178 1179
	if (max_parallel_jobs < 0)
		max_parallel_jobs = parallel_jobs;

1180 1181 1182 1183 1184 1185 1186 1187
	calculate_changed_submodule_paths();
	run_processes_parallel(max_parallel_jobs,
			       get_next_submodule,
			       fetch_start_failure,
			       fetch_finish,
			       &spf);

	argv_array_clear(&spf.args);
1188 1189
out:
	string_list_clear(&changed_submodule_paths, 1);
1190
	return spf.result;
1191 1192
}

1193
unsigned is_submodule_modified(const char *path, int ignore_untracked)
1194
{
1195
	struct child_process cp = CHILD_PROCESS_INIT;
1196
	struct strbuf buf = STRBUF_INIT;
1197
	FILE *fp;
1198
	unsigned dirty_submodule = 0;
1199
	const char *git_dir;
1200
	int ignore_cp_exit_code = 0;
1201

1202
	strbuf_addf(&buf, "%s/.git", path);
1203
	git_dir = read_gitfile(buf.buf);
1204 1205
	if (!git_dir)
		git_dir = buf.buf;
1206 1207 1208
	if (!is_git_directory(git_dir)) {
		if (is_directory(git_dir))
			die(_("'%s' not recognized as a git repository"), git_dir);
1209 1210 1211 1212 1213 1214
		strbuf_release(&buf);
		/* The submodule is not checked out, so it is not modified */
		return 0;
	}
	strbuf_reset(&buf);

1215
	argv_array_pushl(&cp.args, "status", "--porcelain=2", NULL);
1216
	if (ignore_untracked)
1217
		argv_array_push(&cp.args, "-uno");
1218

1219
	prepare_submodule_repo_env(&cp.env_array);
1220 1221 1222
	cp.git_cmd = 1;
	cp.no_stdin = 1;
	cp.out = -1;
1223
	cp.dir = path;
1224
	if (start_command(&cp))
1225
		die("Could not run 'git status --porcelain=2' in submodule %s", path);
1226

1227 1228
	fp = xfdopen(cp.out, "r");
	while (strbuf_getwholeline(&buf, fp, '\n') != EOF) {
1229 1230
		/* regular untracked files */
		if (buf.buf[0] == '?')
1231
			dirty_submodule |= DIRTY_SUBMODULE_UNTRACKED;
1232 1233 1234 1235 1236 1237 1238 1239 1240 1241 1242 1243 1244 1245 1246 1247 1248 1249

		if (buf.buf[0] == 'u' ||
		    buf.buf[0] == '1' ||
		    buf.buf[0] == '2') {
			/* T = line type, XY = status, SSSS = submodule state */
			if (buf.len < strlen("T XY SSSS"))
				die("BUG: invalid status --porcelain=2 line %s",
				    buf.buf);

			if (buf.buf[5] == 'S' && buf.buf[8] == 'U')
				/* nested untracked file */
				dirty_submodule |= DIRTY_SUBMODULE_UNTRACKED;

			if (buf.buf[0] == 'u' ||
			    buf.buf[0] == '2' ||
			    memcmp(buf.buf + 5, "S..U", 4))
				/* other change */
				dirty_submodule |= DIRTY_SUBMODULE_MODIFIED;
1250
		}
1251 1252 1253

		if ((dirty_submodule & DIRTY_SUBMODULE_MODIFIED) &&
		    ((dirty_submodule & DIRTY_SUBMODULE_UNTRACKED) ||
1254 1255 1256 1257 1258 1259
		     ignore_untracked)) {
			/*
			 * We're not interested in any further information from
			 * the child any more, neither output nor its exit code.
			 */
			ignore_cp_exit_code = 1;
1260
			break;
1261
		}
1262
	}
1263
	fclose(fp);
1264

1265
	if (finish_command(&cp) && !ignore_cp_exit_code)
1266
		die("'git status --porcelain=2' failed in submodule %s", path);
1267 1268

	strbuf_release(&buf);
1269
	return dirty_submodule;
1270
}
1271

1272 1273
int submodule_uses_gitfile(const char *path)
{
1274
	struct child_process cp = CHILD_PROCESS_INIT;
1275 1276 1277 1278 1279 1280 1281 1282 1283 1284 1285 1286 1287 1288 1289 1290 1291 1292 1293 1294 1295
	const char *argv[] = {
		"submodule",
		"foreach",
		"--quiet",
		"--recursive",
		"test -f .git",
		NULL,
	};
	struct strbuf buf = STRBUF_INIT;
	const char *git_dir;

	strbuf_addf(&buf, "%s/.git", path);
	git_dir = read_gitfile(buf.buf);
	if (!git_dir) {
		strbuf_release(&buf);
		return 0;
	}
	strbuf_release(&buf);

	/* Now test that all nested submodules use a gitfile too */
	cp.argv = argv;
1296
	prepare_submodule_repo_env(&cp.env_array);
1297 1298 1299 1300 1301 1302 1303 1304 1305 1306 1307
	cp.git_cmd = 1;
	cp.no_stdin = 1;
	cp.no_stderr = 1;
	cp.no_stdout = 1;
	cp.dir = path;
	if (run_command(&cp))
		return 0;

	return 1;
}

1308 1309 1310 1311 1312 1313 1314 1315
/*
 * Check if it is a bad idea to remove a submodule, i.e. if we'd lose data
 * when doing so.
 *
 * Return 1 if we'd lose data, return 0 if the removal is fine,
 * and negative values for errors.
 */
int bad_to_remove_submodule(const char *path, unsigned flags)
1316 1317
{
	ssize_t len;
1318
	struct child_process cp = CHILD_PROCESS_INIT;
1319
	struct strbuf buf = STRBUF_INIT;
1320
	int ret = 0;
1321

1322
	if (!file_exists(path) || is_empty_dir(path))
1323
		return 0;
1324 1325

	if (!submodule_uses_gitfile(path))
1326
		return 1;
1327

1328
	argv_array_pushl(&cp.args, "status", "--porcelain",
1329
				   "--ignore-submodules=none", NULL);
1330 1331 1332 1333 1334 1335 1336 1337

	if (flags & SUBMODULE_REMOVAL_IGNORE_UNTRACKED)
		argv_array_push(&cp.args, "-uno");
	else
		argv_array_push(&cp.args, "-uall");

	if (!(flags & SUBMODULE_REMOVAL_IGNORE_IGNORED_UNTRACKED))
		argv_array_push(&cp.args, "--ignored");
1338

1339
	prepare_submodule_repo_env(&cp.env_array);
1340 1341 1342 1343
	cp.git_cmd = 1;
	cp.no_stdin = 1;
	cp.out = -1;
	cp.dir = path;
1344 1345
	if (start_command(&cp)) {
		if (flags & SUBMODULE_REMOVAL_DIE_ON_ERROR)
1346
			die(_("could not start 'git status' in submodule '%s'"),
1347 1348 1349 1350
				path);
		ret = -1;
		goto out;
	}
1351 1352 1353

	len = strbuf_read(&buf, cp.out, 1024);
	if (len > 2)
1354
		ret = 1;
1355 1356
	close(cp.out);

1357 1358
	if (finish_command(&cp)) {
		if (flags & SUBMODULE_REMOVAL_DIE_ON_ERROR)
1359
			die(_("could not run 'git status' in submodule '%s'"),
1360 1361 1362 1363
				path);
		ret = -1;
	}
out:
1364
	strbuf_release(&buf);
1365
	return ret;
1366 1367
}

1368 1369 1370 1371 1372 1373 1374 1375
/* Like get_super_prefix(), but yields "" instead of NULL. */
static const char *get_super_prefix_or_empty(void)
{
	const char *prefix = get_super_prefix();

	return prefix ? prefix : "";
}

1376 1377 1378 1379 1380 1381 1382 1383 1384 1385 1386 1387 1388 1389 1390 1391 1392 1393 1394 1395 1396 1397 1398 1399 1400 1401 1402 1403 1404 1405 1406 1407 1408 1409 1410 1411 1412 1413 1414 1415 1416 1417 1418 1419 1420 1421 1422 1423 1424 1425
/*
 * Run "git diff-index --quiet --cached HEAD" in the submodule and return
 * finish_command()'s result for it.  Dies if the command cannot be
 * started.
 */
static int submodule_has_dirty_index(const struct submodule *sub)
{
	struct child_process cp = CHILD_PROCESS_INIT;

	cp.dir = sub->path;
	cp.git_cmd = 1;
	cp.no_stdin = 1;
	cp.no_stdout = 1;
	prepare_submodule_repo_env_no_git_dir(&cp.env_array);
	argv_array_pushl(&cp.args, "diff-index", "--quiet",
				   "--cached", "HEAD", NULL);

	if (start_command(&cp))
		die("could not recurse into submodule '%s'", sub->path);

	return finish_command(&cp);
}

/*
 * Run "git read-tree -u --reset <empty tree>" in the submodule at
 * "path", with --super-prefix set to the current super prefix followed
 * by "path/".  Dies if the command fails.
 */
static void submodule_reset_index(const char *path)
{
	struct child_process cp = CHILD_PROCESS_INIT;

	cp.dir = path;
	cp.git_cmd = 1;
	cp.no_stdin = 1;
	prepare_submodule_repo_env_no_git_dir(&cp.env_array);

	argv_array_pushf(&cp.args, "--super-prefix=%s%s/",
				   get_super_prefix_or_empty(), path);
	argv_array_pushl(&cp.args, "read-tree", "-u", "--reset", NULL);
	argv_array_push(&cp.args, EMPTY_TREE_SHA1_HEX);

	if (run_command(&cp))
		die("could not reset submodule index");
}

/**
 * Moves a submodule at a given path from a given head to another new head.
 * For edge cases (a submodule coming into existence or removing a submodule)
 * pass NULL for old or new respectively.
 */
int submodule_move_head(const char *path,
			 const char *old,
			 const char *new,
			 unsigned flags)
{
	int ret = 0;
	struct child_process cp = CHILD_PROCESS_INIT;
	const struct submodule *sub;
1426
	int *error_code_ptr, error_code;
1427

1428 1429 1430
	if (!is_submodule_initialized(path))
		return 0;

1431 1432 1433 1434 1435 1436 1437 1438 1439 1440 1441 1442
	if (flags & SUBMODULE_MOVE_HEAD_FORCE)
		/*
		 * Pass non NULL pointer to is_submodule_populated_gently
		 * to prevent die()-ing. We'll use connect_work_tree_and_git_dir
		 * to fixup the submodule in the force case later.
		 */
		error_code_ptr = &error_code;
	else
		error_code_ptr = NULL;

	if (old && !is_submodule_populated_gently(path, error_code_ptr))
		return 0;
1443 1444 1445 1446 1447 1448 1449 1450 1451 1452 1453 1454 1455 1456 1457 1458 1459 1460

	sub = submodule_from_path(null_sha1, path);

	if (!sub)
		die("BUG: could not get submodule information for '%s'", path);

	if (old && !(flags & SUBMODULE_MOVE_HEAD_FORCE)) {
		/* Check if the submodule has a dirty index. */
		if (submodule_has_dirty_index(sub))
			return error(_("submodule '%s' has dirty index"), path);
	}

	if (!(flags & SUBMODULE_MOVE_HEAD_DRY_RUN)) {
		if (old) {
			if (!submodule_uses_gitfile(path))
				absorb_git_dir_into_superproject("", path,
					ABSORB_GITDIR_RECURSE_SUBMODULES);
		} else {
1461
			char *gitdir = xstrfmt("%s/modules/%s",
1462
				    get_git_common_dir(), sub->name);
1463 1464
			connect_work_tree_and_git_dir(path, gitdir);
			free(gitdir);
1465 1466 1467 1468

			/* make sure the index is clean as well */
			submodule_reset_index(path);
		}
1469 1470 1471 1472 1473 1474 1475

		if (old && (flags & SUBMODULE_MOVE_HEAD_FORCE)) {
			char *gitdir = xstrfmt("%s/modules/%s",
				    get_git_common_dir(), sub->name);
			connect_work_tree_and_git_dir(path, gitdir);
			free(gitdir);
		}
1476 1477 1478 1479 1480 1481 1482 1483 1484 1485 1486 1487 1488 1489 1490 1491 1492 1493 1494 1495 1496 1497 1498 1499 1500 1501 1502 1503 1504 1505 1506 1507 1508 1509 1510 1511 1512 1513
	}

	prepare_submodule_repo_env_no_git_dir(&cp.env_array);

	cp.git_cmd = 1;
	cp.no_stdin = 1;
	cp.dir = path;

	argv_array_pushf(&cp.args, "--super-prefix=%s%s/",
			get_super_prefix_or_empty(), path);
	argv_array_pushl(&cp.args, "read-tree", NULL);

	if (flags & SUBMODULE_MOVE_HEAD_DRY_RUN)
		argv_array_push(&cp.args, "-n");
	else
		argv_array_push(&cp.args, "-u");

	if (flags & SUBMODULE_MOVE_HEAD_FORCE)
		argv_array_push(&cp.args, "--reset");
	else
		argv_array_push(&cp.args, "-m");

	argv_array_push(&cp.args, old ? old : EMPTY_TREE_SHA1_HEX);
	argv_array_push(&cp.args, new ? new : EMPTY_TREE_SHA1_HEX);

	if (run_command(&cp)) {
		ret = -1;
		goto out;
	}

	if (!(flags & SUBMODULE_MOVE_HEAD_DRY_RUN)) {
		if (new) {
			struct child_process cp1 = CHILD_PROCESS_INIT;
			/* also set the HEAD accordingly */
			cp1.git_cmd = 1;
			cp1.no_stdin = 1;
			cp1.dir = path;

1514
			argv_array_pushl(&cp1.args, "update-ref", "HEAD", new, NULL);
1515 1516 1517 1518 1519 1520 1521 1522 1523 1524 1525 1526 1527 1528 1529 1530 1531 1532 1533 1534

			if (run_command(&cp1)) {
				ret = -1;
				goto out;
			}
		} else {
			struct strbuf sb = STRBUF_INIT;

			strbuf_addf(&sb, "%s/.git", path);
			unlink_or_warn(sb.buf);
			strbuf_release(&sb);

			if (is_empty_dir(path))
				rmdir_or_warn(path);
		}
	}
out:
	return ret;
}

1535 1536 1537 1538
static int find_first_merges(struct object_array *result, const char *path,
		struct commit *a, struct commit *b)
{
	int i, j;
1539
	struct object_array merges = OBJECT_ARRAY_INIT;
1540 1541 1542 1543 1544 1545 1546 1547 1548 1549 1550 1551 1552
	struct commit *commit;
	int contains_another;

	char merged_revision[42];
	const char *rev_args[] = { "rev-list", "--merges", "--ancestry-path",
				   "--all", merged_revision, NULL };
	struct rev_info revs;
	struct setup_revision_opt rev_opts;

	memset(result, 0, sizeof(struct object_array));
	memset(&rev_opts, 0, sizeof(rev_opts));

	/* get all revisions that merge commit a */
1553
	xsnprintf(merged_revision, sizeof(merged_revision), "^%s",
1554
			oid_to_hex(&a->object.oid));
1555 1556
	init_revisions(&revs, NULL);
	rev_opts.submodule = path;
1557
	setup_revisions(ARRAY_SIZE(rev_args)-1, rev_args, &revs, &rev_opts);
1558 1559 1560 1561 1562 1563

	/* save all revisions from the above list that contain b */
	if (prepare_revision_walk(&revs))
		die("revision walk setup failed");
	while ((commit = get_revision(&revs)) != NULL) {
		struct object *o = &(commit->object);
1564
		if (in_merge_bases(b, commit))
1565 1566
			add_object_array(o, NULL, &merges);
	}
1567
	reset_revision_walk();
1568 1569 1570 1571 1572 1573 1574 1575 1576 1577 1578

	/* Now we've got all merges that contain a and b. Prune all
	 * merges that contain another found merge and save them in
	 * result.
	 */
	for (i = 0; i < merges.nr; i++) {
		struct commit *m1 = (struct commit *) merges.objects[i].item;

		contains_another = 0;
		for (j = 0; j < merges.nr; j++) {
			struct commit *m2 = (struct commit *) merges.objects[j].item;
1579
			if (i != j && in_merge_bases(m2, m1)) {
1580 1581 1582 1583 1584 1585
				contains_another = 1;
				break;
			}
		}

		if (!contains_another)
1586
			add_object_array(merges.objects[i].item, NULL, result);
1587 1588 1589 1590 1591 1592 1593 1594 1595 1596
	}

	free(merges.objects);
	return result->nr;
}

static void print_commit(struct commit *commit)
{
	struct strbuf sb = STRBUF_INIT;
	struct pretty_print_context ctx = {0};
1597
	ctx.date_mode.type = DATE_NORMAL;
1598 1599 1600 1601 1602 1603 1604 1605 1606 1607
	format_commit_message(commit, " %h: %m %s", &sb, &ctx);
	fprintf(stderr, "%s\n", sb.buf);
	strbuf_release(&sb);
}

/*
 * Emit the standard warning for a submodule that could not be merged.
 *
 * The expansion has no trailing semicolon, so that a use site written as
 * "MERGE_WARNING(p, m);" is exactly one statement and stays valid as the
 * unbraced body of an if/else.
 */
#define MERGE_WARNING(path, msg) \
	warning("Failed to merge submodule %s (%s)", path, msg)

int merge_submodule(unsigned char result[20], const char *path,
		    const unsigned char base[20], const unsigned char a[20],
1608
		    const unsigned char b[20], int search)
1609 1610 1611 1612 1613 1614 1615 1616 1617 1618 1619 1620 1621 1622 1623 1624 1625 1626 1627 1628 1629 1630 1631 1632 1633 1634 1635 1636 1637 1638 1639
{
	struct commit *commit_base, *commit_a, *commit_b;
	int parent_count;
	struct object_array merges;

	int i;

	/* store a in result in case we fail */
	hashcpy(result, a);

	/* we can not handle deletion conflicts */
	if (is_null_sha1(base))
		return 0;
	if (is_null_sha1(a))
		return 0;
	if (is_null_sha1(b))
		return 0;

	if (add_submodule_odb(path)) {
		MERGE_WARNING(path, "not checked out");
		return 0;
	}

	if (!(commit_base = lookup_commit_reference(base)) ||
	    !(commit_a = lookup_commit_reference(a)) ||
	    !(commit_b = lookup_commit_reference(b))) {
		MERGE_WARNING(path, "commits not present");
		return 0;
	}

	/* check whether both changes are forward */
1640 1641
	if (!in_merge_bases(commit_base, commit_a) ||
	    !in_merge_bases(commit_base, commit_b)) {
1642 1643 1644 1645 1646
		MERGE_WARNING(path, "commits don't follow merge-base");
		return 0;
	}

	/* Case #1: a is contained in b or vice versa */
1647
	if (in_merge_bases(commit_a, commit_b)) {
1648 1649 1650
		hashcpy(result, b);
		return 1;
	}
1651
	if (in_merge_bases(commit_b, commit_a)) {
1652 1653 1654 1655 1656 1657 1658 1659 1660 1661 1662
		hashcpy(result, a);
		return 1;
	}

	/*
	 * Case #2: There are one or more merges that contain a and b in
	 * the submodule. If there is only one, then present it as a
	 * suggestion to the user, but leave it marked unmerged so the
	 * user needs to confirm the resolution.
	 */

1663 1664 1665 1666
	/* Skip the search if makes no sense to the calling context.  */
	if (!search)
		return 0;

1667 1668 1669 1670 1671 1672 1673 1674 1675 1676 1677 1678 1679 1680 1681 1682 1683 1684
	/* find commit which merges them */
	parent_count = find_first_merges(&merges, path, commit_a, commit_b);
	switch (parent_count) {
	case 0:
		MERGE_WARNING(path, "merge following commits not found");
		break;

	case 1:
		MERGE_WARNING(path, "not fast-forward");
		fprintf(stderr, "Found a possible merge resolution "
				"for the submodule:\n");
		print_commit((struct commit *) merges.objects[0].item);
		fprintf(stderr,
			"If this is correct simply add it to the index "
			"for example\n"
			"by using:\n\n"
			"  git update-index --cacheinfo 160000 %s \"%s\"\n\n"
			"which will accept this suggestion.\n",
1685
			oid_to_hex(&merges.objects[0].item->oid), path);
1686 1687 1688 1689 1690 1691 1692 1693 1694 1695 1696
		break;

	default:
		MERGE_WARNING(path, "multiple merges found");
		for (i = 0; i < merges.nr; i++)
			print_commit((struct commit *) merges.objects[i].item);
	}

	free(merges.objects);
	return 0;
}
1697

1698 1699 1700 1701
/* Accessor for the file-level "parallel_jobs" setting. */
int parallel_submodules(void)
{
	const int jobs = parallel_jobs;

	return jobs;
}
1702

1703 1704 1705 1706 1707 1708 1709 1710 1711 1712 1713 1714 1715 1716 1717 1718 1719 1720 1721 1722
/*
 * Embeds a single submodules git directory into the superprojects git dir,
 * non recursively.
 */
static void relocate_single_git_dir_into_superproject(const char *prefix,
						      const char *path)
{
	char *old_git_dir = NULL, *real_old_git_dir = NULL, *real_new_git_dir = NULL;
	const char *new_git_dir;
	const struct submodule *sub;

	if (submodule_uses_worktrees(path))
		die(_("relocate_gitdir for submodule '%s' with "
		      "more than one worktree not supported"), path);

	old_git_dir = xstrfmt("%s/.git", path);
	if (read_gitfile(old_git_dir))
		/* If it is an actual gitfile, it doesn't need migration. */
		return;

1723
	real_old_git_dir = real_pathdup(old_git_dir, 1);
1724 1725 1726 1727 1728 1729 1730 1731

	sub = submodule_from_path(null_sha1, path);
	if (!sub)
		die(_("could not lookup name for submodule '%s'"), path);

	new_git_dir = git_path("modules/%s", sub->name);
	if (safe_create_leading_directories_const(new_git_dir) < 0)
		die(_("could not create directory '%s'"), new_git_dir);
1732
	real_new_git_dir = real_pathdup(new_git_dir, 1);
1733 1734

	fprintf(stderr, _("Migrating git directory of '%s%s' from\n'%s' to\n'%s'\n"),
1735
		get_super_prefix_or_empty(), path,
1736 1737 1738 1739 1740 1741 1742 1743 1744 1745 1746 1747 1748 1749 1750 1751 1752 1753
		real_old_git_dir, real_new_git_dir);

	relocate_gitdir(path, real_old_git_dir, real_new_git_dir);

	free(old_git_dir);
	free(real_old_git_dir);
	free(real_new_git_dir);
}

/*
 * Migrate the git directory of the submodule given by path from
 * having its git directory within the working tree to the git dir nested
 * in its superprojects git dir under modules/.
 */
void absorb_git_dir_into_superproject(const char *prefix,
				      const char *path,
				      unsigned flags)
{
1754 1755
	int err_code;
	const char *sub_git_dir;
1756 1757
	struct strbuf gitdir = STRBUF_INIT;
	strbuf_addf(&gitdir, "%s/.git", path);
1758
	sub_git_dir = resolve_gitdir_gently(gitdir.buf, &err_code);
1759 1760

	/* Not populated? */
1761 1762 1763 1764 1765 1766 1767 1768 1769 1770 1771 1772 1773 1774 1775 1776 1777 1778 1779 1780 1781 1782 1783
	if (!sub_git_dir) {
		const struct submodule *sub;

		if (err_code == READ_GITFILE_ERR_STAT_FAILED) {
			/* unpopulated as expected */
			strbuf_release(&gitdir);
			return;
		}

		if (err_code != READ_GITFILE_ERR_NOT_A_REPO)
			/* We don't know what broke here. */
			read_gitfile_error_die(err_code, path, NULL);

		/*
		* Maybe populated, but no git directory was found?
		* This can happen if the superproject is a submodule
		* itself and was just absorbed. The absorption of the
		* superproject did not rewrite the git file links yet,
		* fix it now.
		*/
		sub = submodule_from_path(null_sha1, path);
		if (!sub)
			die(_("could not lookup name for submodule '%s'"), path);
1784 1785
		connect_work_tree_and_git_dir(path,
			git_path("modules/%s", sub->name));
1786 1787
	} else {
		/* Is it already absorbed into the superprojects git dir? */
1788 1789
		char *real_sub_git_dir = real_pathdup(sub_git_dir, 1);
		char *real_common_git_dir = real_pathdup(get_git_common_dir(), 1);
1790

1791 1792 1793 1794 1795 1796 1797
		if (!starts_with(real_sub_git_dir, real_common_git_dir))
			relocate_single_git_dir_into_superproject(prefix, path);

		free(real_sub_git_dir);
		free(real_common_git_dir);
	}
	strbuf_release(&gitdir);
1798 1799 1800 1801 1802 1803 1804 1805

	if (flags & ABSORB_GITDIR_RECURSE_SUBMODULES) {
		struct child_process cp = CHILD_PROCESS_INIT;
		struct strbuf sb = STRBUF_INIT;

		if (flags & ~ABSORB_GITDIR_RECURSE_SUBMODULES)
			die("BUG: we don't know how to pass the flags down?");

1806
		strbuf_addstr(&sb, get_super_prefix_or_empty());
1807 1808 1809 1810 1811 1812 1813 1814 1815 1816 1817 1818 1819 1820 1821 1822
		strbuf_addstr(&sb, path);
		strbuf_addch(&sb, '/');

		cp.dir = path;
		cp.git_cmd = 1;
		cp.no_stdin = 1;
		argv_array_pushl(&cp.args, "--super-prefix", sb.buf,
					   "submodule--helper",
					   "absorb-git-dirs", NULL);
		prepare_submodule_repo_env(&cp.env_array);
		if (run_command(&cp))
			die(_("could not recurse into submodule '%s'"), path);

		strbuf_release(&sb);
	}
}
1823 1824 1825 1826 1827 1828 1829 1830 1831 1832 1833 1834 1835 1836 1837 1838 1839 1840 1841 1842 1843 1844 1845 1846 1847 1848 1849 1850 1851 1852 1853 1854 1855 1856 1857 1858 1859 1860 1861 1862 1863 1864 1865 1866 1867 1868 1869 1870 1871 1872 1873 1874 1875 1876 1877 1878 1879 1880 1881 1882 1883 1884 1885 1886 1887 1888 1889 1890 1891 1892 1893 1894 1895 1896 1897 1898 1899 1900 1901 1902 1903 1904

/*
 * Determine the working tree of the superproject, if the current
 * repository is a submodule of one.
 *
 * Runs "git -C .. ls-files --stage" on the current directory's path
 * relative to "../" and checks for a gitlink (mode 160000) entry.
 *
 * Returns NULL when not inside a work tree, when "../" is not a valid
 * path, when ls-files exits with 128 ('../' is not a git repository), or
 * when it succeeds without output (unrelated repository at '../').
 * Dies on any other non-zero exit code.  Otherwise returns the result of
 * real_path() on the superproject's working tree.
 *
 * NOTE(review): the returned pointer comes straight from real_path();
 * its lifetime is whatever real_path() guarantees - confirm before
 * holding on to it across other path helper calls.
 */
const char *get_superproject_working_tree(void)
{
	struct child_process cp = CHILD_PROCESS_INIT;
	struct strbuf sb = STRBUF_INIT;
	const char *one_up = real_path_if_valid("../");
	char *cwd = xgetcwd();
	const char *ret = NULL;
	const char *subpath;
	int code;
	ssize_t len;

	if (!is_inside_work_tree())
		/*
		 * FIXME:
		 * We might have a superproject, but it is harder
		 * to determine.
		 */
		goto out;

	if (!one_up)
		goto out;

	subpath = relative_path(cwd, one_up, &sb);

	prepare_submodule_repo_env(&cp.env_array);
	argv_array_pop(&cp.env_array);

	argv_array_pushl(&cp.args, "--literal-pathspecs", "-C", "..",
			"ls-files", "-z", "--stage", "--full-name", "--",
			subpath, NULL);
	/* subpath has been copied into cp.args; reuse sb for the output */
	strbuf_reset(&sb);

	cp.no_stdin = 1;
	cp.no_stderr = 1;
	cp.out = -1;
	cp.git_cmd = 1;

	if (start_command(&cp))
		die(_("could not start ls-files in .."));

	len = strbuf_read(&sb, cp.out, PATH_MAX);
	close(cp.out);

	if (starts_with(sb.buf, "160000")) {
		int super_sub_len;
		int cwd_len = strlen(cwd);
		char *super_sub, *super_wt;

		/*
		 * There is a superproject having this repo as a submodule.
		 * The format is <mode> SP <hash> SP <stage> TAB <full name> \0,
		 * We're only interested in the name after the tab.
		 */
		super_sub = strchr(sb.buf, '\t') + 1;
		super_sub_len = sb.buf + sb.len - super_sub - 1;

		if (super_sub_len > cwd_len ||
		    strcmp(&cwd[cwd_len - super_sub_len], super_sub))
			die (_("BUG: returned path string doesn't match cwd?"));

		/* Strip the submodule's path off the end of cwd. */
		super_wt = xstrdup(cwd);
		super_wt[cwd_len - super_sub_len] = '\0';

		ret = real_path(super_wt);
		free(super_wt);
	}

	code = finish_command(&cp);

	if (code == 128)
		/* '../' is not a git repository */
		ret = NULL;
	else if (code == 0 && len == 0)
		/* There is an unrelated git repository at '../' */
		ret = NULL;
	else if (code)
		die(_("ls-files returned unexpected return code %d"), code);

out:
	/* Single exit so the cwd copy and the buffer are always released. */
	strbuf_release(&sb);
	free(cwd);
	return ret;
}
1905 1906 1907 1908 1909 1910 1911 1912 1913 1914 1915 1916 1917 1918 1919 1920 1921 1922 1923 1924 1925 1926 1927 1928 1929 1930 1931 1932 1933 1934 1935

/*
 * Store in "buf" the git directory for the submodule at path
 * "submodule".
 *
 * "<submodule>/.git" is tried first, following it if read_gitfile()
 * resolves it.  If the outcome is not a git directory, the path is built
 * from "modules/<name>" using the submodule's configured name instead.
 *
 * Returns 0 on success, or -1 if that fallback is needed but no
 * submodule is known for the path; "buf" then still holds the candidate
 * that was tried.
 */
int submodule_to_gitdir(struct strbuf *buf, const char *submodule)
{
	const struct submodule *sub;
	const char *via_gitfile;

	strbuf_reset(buf);
	strbuf_addstr(buf, submodule);
	strbuf_complete(buf, '/');
	strbuf_addstr(buf, ".git");

	via_gitfile = read_gitfile(buf->buf);
	if (via_gitfile) {
		strbuf_reset(buf);
		strbuf_addstr(buf, via_gitfile);
	}

	if (is_git_directory(buf->buf))
		return 0;

	/* Fall back to the location derived from the submodule's name. */
	gitmodules_config();
	sub = submodule_from_path(null_sha1, submodule);
	if (!sub)
		return -1;

	strbuf_reset(buf);
	strbuf_git_path(buf, "%s/%s", "modules", sub->name);
	return 0;
}