revision.c 85.3 KB
Newer Older
1 2 3 4 5
#include "cache.h"
#include "tag.h"
#include "blob.h"
#include "tree.h"
#include "commit.h"
6
#include "diff.h"
7 8
#include "refs.h"
#include "revision.h"
9
#include "graph.h"
10
#include "grep.h"
11
#include "reflog-walk.h"
J
Junio C Hamano 已提交
12
#include "patch-ids.h"
13
#include "decorate.h"
14
#include "log-tree.h"
15
#include "string-list.h"
16
#include "line-log.h"
17
#include "mailmap.h"
18
#include "commit-slab.h"
19

20 21
volatile show_early_output_fn_t show_early_output;

22
char *path_name(const struct name_path *path, const char *name)
23
{
24
	const struct name_path *p;
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45
	char *n, *m;
	int nlen = strlen(name);
	int len = nlen + 1;

	for (p = path; p; p = p->up) {
		if (p->elem_len)
			len += p->elem_len + 1;
	}
	n = xmalloc(len);
	m = n + len - (nlen + 1);
	strcpy(m, name);
	for (p = path; p; p = p->up) {
		if (p->elem_len) {
			m -= p->elem_len + 1;
			memcpy(m, p->elem, p->elem_len);
			m[p->elem_len] = '/';
		}
	}
	return n;
}

46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74
/*
 * Write up to "len" bytes of "name" to "out", stopping early at a NUL
 * or a newline.
 *
 * Returns "len" when every byte was written, or -1 when a NUL or
 * newline was hit (the bytes before it have already been written).
 */
static int show_path_component_truncated(FILE *out, const char *name, int len)
{
	int i = 0;

	while (i < len) {
		int ch = name[i];

		if (ch == '\0' || ch == '\n')
			return -1;
		fputc(ch, out);
		i++;
	}
	return len;
}

/*
 * Recursively print the components of "path", outermost ("up") first,
 * separated by '/'.
 *
 * Returns a negative value as soon as any component was cut short by
 * show_path_component_truncated(); otherwise returns non-zero if
 * anything was printed and 0 if nothing was.
 */
static int show_path_truncated(FILE *out, const struct name_path *path)
{
	int before, here;

	if (!path)
		return 0;

	/* Print everything above us first. */
	before = show_path_truncated(out, path->up);
	if (before < 0)
		return before;

	/* Only separate from the prefix if the prefix printed something. */
	if (before)
		fputc('/', out);

	here = show_path_component_truncated(out, path->elem, path->elem_len);
	if (here < 0)
		return here;
	return here || before;
}

75 76
void show_object_with_name(FILE *out, struct object *obj,
			   const struct name_path *path, const char *component)
77
{
78 79 80 81
	struct name_path leaf;
	leaf.up = (struct name_path *)path;
	leaf.elem = component;
	leaf.elem_len = strlen(component);
82

83 84 85
	fprintf(out, "%s ", sha1_to_hex(obj->sha1));
	show_path_truncated(out, &leaf);
	fputc('\n', out);
86 87
}

88 89 90 91
/*
 * Append "obj" to the object array "p", labelled with the full path
 * built from "path" and "name".
 *
 * The temporary path string is freed here after add_object_array()
 * returns.
 */
void add_object(struct object *obj,
		struct object_array *p,
		struct name_path *path,
		const char *name)
{
	char *full_path = path_name(path, name);

	add_object_array(obj, full_path, p);
	free(full_path);
}

/*
 * Set the UNINTERESTING flag on "blob". A NULL blob, or one that
 * already carries the flag, is left alone.
 */
static void mark_blob_uninteresting(struct blob *blob)
{
	if (blob && !(blob->object.flags & UNINTERESTING))
		blob->object.flags |= UNINTERESTING;
}

void mark_tree_uninteresting(struct tree *tree)
{
109
	struct tree_desc desc;
110
	struct name_entry entry;
111 112
	struct object *obj = &tree->object;

113 114
	if (!tree)
		return;
115 116 117 118 119 120 121
	if (obj->flags & UNINTERESTING)
		return;
	obj->flags |= UNINTERESTING;
	if (!has_sha1_file(obj->sha1))
		return;
	if (parse_tree(tree) < 0)
		die("bad tree %s", sha1_to_hex(obj->sha1));
122

123
	init_tree_desc(&desc, tree->buffer, tree->size);
124
	while (tree_entry(&desc, &entry)) {
125 126
		switch (object_type(entry.mode)) {
		case OBJ_TREE:
127
			mark_tree_uninteresting(lookup_tree(entry.sha1));
128 129
			break;
		case OBJ_BLOB:
130
			mark_blob_uninteresting(lookup_blob(entry.sha1));
131 132 133 134 135
			break;
		default:
			/* Subproject commit - not in this repository */
			break;
		}
136
	}
137 138 139 140 141

	/*
	 * We don't care about the tree any more
	 * after it has been marked uninteresting.
	 */
142
	free_tree_buffer(tree);
143 144 145 146
}

void mark_parents_uninteresting(struct commit *commit)
{
147 148 149 150
	struct commit_list *parents = NULL, *l;

	for (l = commit->parents; l; l = l->next)
		commit_list_insert(l->item, &parents);
151 152 153

	while (parents) {
		struct commit *commit = parents->item;
154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172
		l = parents;
		parents = parents->next;
		free(l);

		while (commit) {
			/*
			 * A missing commit is ok iff its parent is marked
			 * uninteresting.
			 *
			 * We just mark such a thing parsed, so that when
			 * it is popped next time around, we won't be trying
			 * to parse it and get an error.
			 */
			if (!has_sha1_file(commit->object.sha1))
				commit->object.parsed = 1;

			if (commit->object.flags & UNINTERESTING)
				break;

173
			commit->object.flags |= UNINTERESTING;
174

175 176 177 178 179 180 181 182
			/*
			 * Normally we haven't parsed the parent
			 * yet, so we won't have a parent of a parent
			 * here. However, it may turn out that we've
			 * reached this commit some other way (where it
			 * wasn't uninteresting), in which case we need
			 * to mark its parents recursively too..
			 */
183 184
			if (!commit->parents)
				break;
185

186 187 188 189
			for (l = commit->parents->next; l; l = l->next)
				commit_list_insert(l->item, &parents);
			commit = commit->parents->item;
		}
190 191 192
	}
}

193 194 195
static void add_pending_object_with_mode(struct rev_info *revs,
					 struct object *obj,
					 const char *name, unsigned mode)
196
{
J
Junio C Hamano 已提交
197 198
	if (!obj)
		return;
L
Linus Torvalds 已提交
199
	if (revs->no_walk && (obj->flags & UNINTERESTING))
L
Linus Torvalds 已提交
200
		revs->no_walk = 0;
J
Junio C Hamano 已提交
201 202
	if (revs->reflog_info && obj->type == OBJ_COMMIT) {
		struct strbuf buf = STRBUF_INIT;
203
		int len = interpret_branch_name(name, 0, &buf);
J
Junio C Hamano 已提交
204 205 206 207 208 209 210 211 212 213 214
		int st;

		if (0 < len && name[len] && buf.len)
			strbuf_addstr(&buf, name + len);
		st = add_reflog_for_walk(revs->reflog_info,
					 (struct commit *)obj,
					 buf.buf[0] ? buf.buf: name);
		strbuf_release(&buf);
		if (st)
			return;
	}
215
	add_object_array_with_mode(obj, name, &revs->pending, mode);
216 217
}

218 219
void add_pending_object(struct rev_info *revs,
			struct object *obj, const char *name)
J
Junio C Hamano 已提交
220 221 222 223
{
	add_pending_object_with_mode(revs, obj, name, S_IFINVALID);
}

224 225 226 227 228 229 230 231 232 233 234 235
/*
 * Resolve "HEAD" and queue the resulting object as pending.
 * Does nothing when HEAD cannot be resolved or its object cannot be
 * parsed.
 */
void add_head_to_pending(struct rev_info *revs)
{
	unsigned char head_sha1[20];
	struct object *head;

	if (get_sha1("HEAD", head_sha1) != 0)
		return;

	head = parse_object(head_sha1);
	if (head)
		add_pending_object(revs, head, "HEAD");
}

236 237 238
static struct object *get_reference(struct rev_info *revs, const char *name,
				    const unsigned char *sha1,
				    unsigned int flags)
239 240 241 242
{
	struct object *object;

	object = parse_object(sha1);
J
Junio C Hamano 已提交
243 244 245
	if (!object) {
		if (revs->ignore_missing)
			return object;
246
		die("bad object %s", name);
J
Junio C Hamano 已提交
247
	}
248 249 250 251
	object->flags |= flags;
	return object;
}

252 253 254 255 256 257 258
/*
 * Look up the object for "sha1", apply "flags" to it and queue it as
 * pending under "name". A missing object that get_reference()
 * tolerates comes back as NULL, which add_pending_object() ignores.
 */
void add_pending_sha1(struct rev_info *revs, const char *name,
		      const unsigned char *sha1, unsigned int flags)
{
	add_pending_object(revs, get_reference(revs, name, sha1, flags), name);
}

259 260
static struct commit *handle_commit(struct rev_info *revs,
				    struct object *object, const char *name)
261 262
{
	unsigned long flags = object->flags;
263 264 265 266

	/*
	 * Tag object? Look what it points to..
	 */
267
	while (object->type == OBJ_TAG) {
268
		struct tag *tag = (struct tag *) object;
269
		if (revs->tag_objects && !(flags & UNINTERESTING))
270
			add_pending_object(revs, object, tag->tag);
271 272
		if (!tag->tagged)
			die("bad tag");
273
		object = parse_object(tag->tagged->sha1);
274 275 276
		if (!object) {
			if (flags & UNINTERESTING)
				return NULL;
277
			die("bad object %s", sha1_to_hex(tag->tagged->sha1));
278
		}
279 280 281 282 283 284
	}

	/*
	 * Commit object? Just return it, we'll do all the complex
	 * reachability crud.
	 */
285
	if (object->type == OBJ_COMMIT) {
286 287 288
		struct commit *commit = (struct commit *)object;
		if (parse_commit(commit) < 0)
			die("unable to parse commit %s", name);
289
		if (flags & UNINTERESTING) {
290
			commit->object.flags |= UNINTERESTING;
291
			mark_parents_uninteresting(commit);
292 293
			revs->limited = 1;
		}
294 295
		if (revs->show_source && !commit->util)
			commit->util = (void *) name;
296 297 298 299
		return commit;
	}

	/*
M
Mike Ralphson 已提交
300
	 * Tree object? Either mark it uninteresting, or add it
301 302
	 * to the list of objects to look at later..
	 */
303
	if (object->type == OBJ_TREE) {
304 305 306 307 308 309 310 311 312 313 314 315 316 317
		struct tree *tree = (struct tree *)object;
		if (!revs->tree_objects)
			return NULL;
		if (flags & UNINTERESTING) {
			mark_tree_uninteresting(tree);
			return NULL;
		}
		add_pending_object(revs, object, "");
		return NULL;
	}

	/*
	 * Blob object? You know the drill by now..
	 */
318
	if (object->type == OBJ_BLOB) {
319 320 321 322 323 324 325 326 327 328 329 330 331
		struct blob *blob = (struct blob *)object;
		if (!revs->blob_objects)
			return NULL;
		if (flags & UNINTERESTING) {
			mark_blob_uninteresting(blob);
			return NULL;
		}
		add_pending_object(revs, object, "");
		return NULL;
	}
	die("%s is unknown object", name);
}

332 333 334 335 336 337 338 339 340 341 342 343 344
/*
 * Return 1 when every commit on the list carries UNINTERESTING
 * (an empty list counts as such), 0 as soon as one does not.
 */
static int everybody_uninteresting(struct commit_list *orig)
{
	struct commit_list *it;

	for (it = orig; it; it = it->next)
		if (!(it->item->object.flags & UNINTERESTING))
			return 0;
	return 1;
}

345 346 347 348 349 350 351 352 353 354 355 356 357 358 359 360 361 362 363 364 365 366 367 368 369 370 371 372 373 374 375 376 377 378 379 380 381 382 383 384 385 386 387 388 389 390 391 392 393 394 395 396 397 398 399 400 401 402 403 404 405 406 407 408 409 410 411 412 413 414 415 416 417 418
/*
 * A definition of "relevant" commit that we can use to simplify limited graphs
 * by eliminating side branches.
 *
 * A "relevant" commit is one that is !UNINTERESTING (i.e. we are including it
 * in our list), or that is a specified BOTTOM commit. Then after computing
 * a limited list, during processing we can generally ignore boundary merges
 * coming from outside the graph (i.e. from irrelevant parents), and treat
 * those merges as if they were single-parent. TREESAME is defined to consider
 * only relevant parents, if any. If we are TREESAME to our on-graph parents,
 * we don't care if we were !TREESAME to non-graph parents.
 *
 * Treating bottom commits as relevant ensures that a limited graph's
 * connection to the actual bottom commit is not viewed as a side branch, but
 * treated as part of the graph. For example:
 *
 *   ....Z...A---X---o---o---B
 *        .     /
 *         W---Y
 *
 * When computing "A..B", the A-X connection is at least as important as
 * Y-X, despite A being flagged UNINTERESTING.
 *
 * And when computing --ancestry-path "A..B", the A-X connection is more
 * important than Y-X, despite both A and Y being flagged UNINTERESTING.
 */
static inline int relevant_commit(struct commit *commit)
{
	/* Irrelevant only when UNINTERESTING is set and BOTTOM is not. */
	return !(commit->object.flags & UNINTERESTING) ||
	       (commit->object.flags & BOTTOM);
}

/*
 * Pick the single parent a TREESAME commit may be simplified to.
 *
 * - Empty parent list: NULL.
 * - Exactly one parent, or revs->first_parent_only: the first parent,
 *   whether or not it is "relevant" (TREESAME will have been set
 *   purely on that parent).
 * - Several parents: the sole relevant one if there is exactly one;
 *   NULL when there are none or more than one.
 */
static struct commit *one_relevant_parent(const struct rev_info *revs,
					  struct commit_list *orig)
{
	struct commit_list *it;
	struct commit *found = NULL;

	if (!orig)
		return NULL;

	if (revs->first_parent_only || !orig->next)
		return orig->item;

	for (it = orig; it; it = it->next) {
		if (!relevant_commit(it->item))
			continue;
		/* A second relevant parent means there is no unique choice. */
		if (found)
			return NULL;
		found = it->item;
	}
	return found;
}

419 420
/*
 * The goal is to get REV_TREE_NEW as the result only if the
 * diff consists of all '+' (and no other changes), REV_TREE_OLD
 * if the whole diff is removal of old data, and otherwise
 * REV_TREE_DIFFERENT (of course if the trees are the same we
 * want REV_TREE_SAME).
 * That means that once we get to REV_TREE_DIFFERENT, we do not
 * have to look any further.
 */
428
static int tree_difference = REV_TREE_SAME;
429 430 431 432

static void file_add_remove(struct diff_options *options,
		    int addremove, unsigned mode,
		    const unsigned char *sha1,
433
		    int sha1_valid,
434
		    const char *fullpath, unsigned dirty_submodule)
435
{
436
	int diff = addremove == '+' ? REV_TREE_NEW : REV_TREE_OLD;
437

438
	tree_difference |= diff;
439
	if (tree_difference == REV_TREE_DIFFERENT)
440
		DIFF_OPT_SET(options, HAS_CHANGES);
441 442 443 444 445 446
}

static void file_change(struct diff_options *options,
		 unsigned old_mode, unsigned new_mode,
		 const unsigned char *old_sha1,
		 const unsigned char *new_sha1,
447
		 int old_sha1_valid, int new_sha1_valid,
448 449
		 const char *fullpath,
		 unsigned old_dirty_submodule, unsigned new_dirty_submodule)
450
{
451
	tree_difference = REV_TREE_DIFFERENT;
452
	DIFF_OPT_SET(options, HAS_CHANGES);
453 454
}

455 456
static int rev_compare_tree(struct rev_info *revs,
			    struct commit *parent, struct commit *commit)
457
{
458 459 460
	struct tree *t1 = parent->tree;
	struct tree *t2 = commit->tree;

461
	if (!t1)
462
		return REV_TREE_NEW;
463 464
	if (!t2)
		return REV_TREE_OLD;
465 466 467 468 469 470 471 472 473 474 475 476 477 478 479

	if (revs->simplify_by_decoration) {
		/*
		 * If we are simplifying by decoration, then the commit
		 * is worth showing if it has a tag pointing at it.
		 */
		if (lookup_decoration(&name_decoration, &commit->object))
			return REV_TREE_DIFFERENT;
		/*
		 * A commit that is not pointed by a tag is uninteresting
		 * if we are not limited by path.  This means that you will
		 * see the usual "commits that touch the paths" plus any
		 * tagged commit by specifying both --simplify-by-decoration
		 * and pathspec.
		 */
480
		if (!revs->prune_data.nr)
481 482
			return REV_TREE_SAME;
	}
483

484
	tree_difference = REV_TREE_SAME;
485
	DIFF_OPT_CLR(&revs->pruning, HAS_CHANGES);
486
	if (diff_tree_sha1(t1->object.sha1, t2->object.sha1, "",
487
			   &revs->pruning) < 0)
488
		return REV_TREE_DIFFERENT;
489 490 491
	return tree_difference;
}

492
static int rev_same_tree_as_empty(struct rev_info *revs, struct commit *commit)
493 494 495
{
	int retval;
	void *tree;
496
	unsigned long size;
497
	struct tree_desc empty, real;
498
	struct tree *t1 = commit->tree;
499 500 501 502

	if (!t1)
		return 0;

503
	tree = read_object_with_reference(t1->object.sha1, tree_type, &size, NULL);
504 505
	if (!tree)
		return 0;
506 507
	init_tree_desc(&real, tree, size);
	init_tree_desc(&empty, "", 0);
508

509
	tree_difference = REV_TREE_SAME;
510
	DIFF_OPT_CLR(&revs->pruning, HAS_CHANGES);
511
	retval = diff_tree(&empty, &real, "", &revs->pruning);
512 513
	free(tree);

514
	return retval >= 0 && (tree_difference == REV_TREE_SAME);
515 516
}

517 518 519 520 521 522 523 524 525 526 527 528 529 530 531 532 533 534 535 536 537 538 539 540 541 542 543 544 545 546 547 548 549 550 551 552 553 554 555 556 557 558 559 560 561 562 563 564 565 566 567 568 569 570 571 572 573 574 575 576 577 578 579 580 581 582 583 584 585 586 587 588 589
/*
 * Per-commit record of which parents a merge is TREESAME to. It is
 * attached to a commit through the revs->treesame decoration.
 */
struct treesame_state {
	/* Number of entries in treesame[]; set from the parent count. */
	unsigned int nparents;
	/* One byte per parent: 1 if the commit is TREESAME to that parent. */
	unsigned char treesame[FLEX_ARRAY];
};

/*
 * Allocate a zeroed treesame_state with one slot per current parent of
 * "commit", attach it to the commit via the revs->treesame decoration
 * and return it.
 */
static struct treesame_state *initialise_treesame(struct rev_info *revs, struct commit *commit)
{
	unsigned count = commit_list_count(commit->parents);
	struct treesame_state *state;

	/* Header plus one byte per parent, all cleared by xcalloc(). */
	state = xcalloc(1, sizeof(*state) + count);
	state->nparents = count;

	add_decoration(&revs->treesame, &commit->object, state);
	return state;
}

/*
 * Must be called immediately after removing the nth_parent from a commit's
 * parent list, if we are maintaining the per-parent treesame[] decoration.
 * This does not recalculate the master TREESAME flag - update_treesame()
 * should be called to update it after a sequence of treesame[] modifications
 * that may have affected it.
 *
 * Returns the treesame value that was recorded for the removed parent.
 */
static int compact_treesame(struct rev_info *revs, struct commit *commit, unsigned nth_parent)
{
	struct treesame_state *state;
	int was_same;

	if (!commit->parents) {
		/*
		 * Have just removed the only parent from a non-merge.
		 * Different handling, as we lack decoration.
		 */
		if (nth_parent != 0)
			die("compact_treesame %u", nth_parent);

		was_same = !!(commit->object.flags & TREESAME);
		/* With no parents left, compare against the empty tree. */
		if (rev_same_tree_as_empty(revs, commit))
			commit->object.flags |= TREESAME;
		else
			commit->object.flags &= ~TREESAME;
		return was_same;
	}

	state = lookup_decoration(&revs->treesame, &commit->object);
	if (!state || nth_parent >= state->nparents)
		die("compact_treesame %u", nth_parent);

	was_same = state->treesame[nth_parent];

	/* Close the gap left by the removed parent's slot. */
	memmove(&state->treesame[nth_parent],
		&state->treesame[nth_parent + 1],
		state->nparents - nth_parent - 1);

	/*
	 * If we've just become a non-merge commit, update TREESAME
	 * immediately, and remove the no-longer-needed decoration.
	 * If still a merge, defer update until update_treesame().
	 */
	if (--state->nparents == 1) {
		if (commit->parents->next)
			die("compact_treesame parents mismatch");

		if (state->treesame[0] && revs->dense)
			commit->object.flags |= TREESAME;
		else
			commit->object.flags &= ~TREESAME;

		/* add_decoration() hands back the old entry, which we free. */
		free(add_decoration(&revs->treesame, &commit->object, NULL));
	}

	return was_same;
}

static unsigned update_treesame(struct rev_info *revs, struct commit *commit)
{
	if (commit->parents && commit->parents->next) {
		unsigned n;
		struct treesame_state *st;
590 591 592
		struct commit_list *p;
		unsigned relevant_parents;
		unsigned relevant_change, irrelevant_change;
593 594 595 596

		st = lookup_decoration(&revs->treesame, &commit->object);
		if (!st)
			die("update_treesame %s", sha1_to_hex(commit->object.sha1));
597 598 599 600 601 602 603 604
		relevant_parents = 0;
		relevant_change = irrelevant_change = 0;
		for (p = commit->parents, n = 0; p; n++, p = p->next) {
			if (relevant_commit(p->item)) {
				relevant_change |= !st->treesame[n];
				relevant_parents++;
			} else
				irrelevant_change |= !st->treesame[n];
605
		}
606 607 608 609
		if (relevant_parents ? relevant_change : irrelevant_change)
			commit->object.flags &= ~TREESAME;
		else
			commit->object.flags |= TREESAME;
610 611 612 613 614
	}

	return commit->object.flags & TREESAME;
}

615 616 617 618 619 620 621 622 623 624 625 626 627 628 629
/*
 * Return 1 when revs->prune and revs->dense are both set while
 * revs->simplify_history and revs->first_parent_only are both clear,
 * 0 otherwise.
 */
static inline int limiting_can_increase_treesame(const struct rev_info *revs)
{
	/* TREESAME is irrelevant unless prune && dense. */
	if (!revs->prune || !revs->dense)
		return 0;

	/*
	 * If simplify_history is set, we can't have a mixture of TREESAME
	 * and !TREESAME INTERESTING parents (and we don't have treesame[]
	 * decoration anyway).
	 */
	if (revs->simplify_history)
		return 0;

	/*
	 * If first_parent_only is set, then the TREESAME flag is locked
	 * against the first parent (and again we lack treesame[]
	 * decoration).
	 */
	return !revs->first_parent_only;
}

630 631 632
static void try_to_simplify_commit(struct rev_info *revs, struct commit *commit)
{
	struct commit_list **pp, *parent;
633
	struct treesame_state *ts = NULL;
634 635
	int relevant_change = 0, irrelevant_change = 0;
	int relevant_parents, nth_parent;
636

L
Linus Torvalds 已提交
637 638 639
	/*
	 * If we don't do pruning, everything is interesting
	 */
640
	if (!revs->prune)
L
Linus Torvalds 已提交
641 642
		return;

643 644 645 646
	if (!commit->tree)
		return;

	if (!commit->parents) {
647
		if (rev_same_tree_as_empty(revs, commit))
648
			commit->object.flags |= TREESAME;
649 650 651
		return;
	}

L
Linus Torvalds 已提交
652 653 654 655
	/*
	 * Normal non-merge commit? If we don't want to make the
	 * history dense, we consider it always to be a change..
	 */
656
	if (!revs->dense && !commit->parents->next)
L
Linus Torvalds 已提交
657 658
		return;

659
	for (pp = &commit->parents, nth_parent = 0, relevant_parents = 0;
660 661
	     (parent = *pp) != NULL;
	     pp = &parent->next, nth_parent++) {
662
		struct commit *p = parent->item;
663 664
		if (relevant_commit(p))
			relevant_parents++;
665

666 667 668 669 670 671 672 673 674 675 676 677 678 679 680 681 682 683 684 685 686 687
		if (nth_parent == 1) {
			/*
			 * This our second loop iteration - so we now know
			 * we're dealing with a merge.
			 *
			 * Do not compare with later parents when we care only about
			 * the first parent chain, in order to avoid derailing the
			 * traversal to follow a side branch that brought everything
			 * in the path we are limited to by the pathspec.
			 */
			if (revs->first_parent_only)
				break;
			/*
			 * If this will remain a potentially-simplifiable
			 * merge, remember per-parent treesame if needed.
			 * Initialise the array with the comparison from our
			 * first iteration.
			 */
			if (revs->treesame.name &&
			    !revs->simplify_history &&
			    !(commit->object.flags & UNINTERESTING)) {
				ts = initialise_treesame(revs, commit);
688
				if (!(irrelevant_change || relevant_change))
689 690 691
					ts->treesame[0] = 1;
			}
		}
692 693 694 695
		if (parse_commit(p) < 0)
			die("cannot simplify commit %s (because of %s)",
			    sha1_to_hex(commit->object.sha1),
			    sha1_to_hex(p->object.sha1));
696
		switch (rev_compare_tree(revs, p, commit)) {
697
		case REV_TREE_SAME:
698
			if (!revs->simplify_history || !relevant_commit(p)) {
699 700 701 702 703 704
				/* Even if a merge with an uninteresting
				 * side branch brought the entire change
				 * we are interested in, we do not want
				 * to lose the other branches of this
				 * merge, so we just keep going.
				 */
705 706
				if (ts)
					ts->treesame[nth_parent] = 1;
707 708
				continue;
			}
709 710
			parent->next = NULL;
			commit->parents = parent;
711
			commit->object.flags |= TREESAME;
712 713
			return;

714 715
		case REV_TREE_NEW:
			if (revs->remove_empty_trees &&
716
			    rev_same_tree_as_empty(revs, p)) {
717 718 719 720 721 722 723
				/* We are adding all the specified
				 * paths from this parent, so the
				 * history beyond this parent is not
				 * interesting.  Remove its parents
				 * (they are grandparents for us).
				 * IOW, we pretend this parent is a
				 * "root" commit.
724
				 */
725 726 727 728
				if (parse_commit(p) < 0)
					die("cannot simplify commit %s (invalid %s)",
					    sha1_to_hex(commit->object.sha1),
					    sha1_to_hex(p->object.sha1));
729
				p->parents = NULL;
730 731
			}
		/* fallthrough */
732
		case REV_TREE_OLD:
733
		case REV_TREE_DIFFERENT:
734 735 736 737
			if (relevant_commit(p))
				relevant_change = 1;
			else
				irrelevant_change = 1;
738 739 740 741
			continue;
		}
		die("bad tree compare for commit %s", sha1_to_hex(commit->object.sha1));
	}
742 743 744 745 746 747 748 749 750 751 752 753 754

	/*
	 * TREESAME is straightforward for single-parent commits. For merge
	 * commits, it is most useful to define it so that "irrelevant"
	 * parents cannot make us !TREESAME - if we have any relevant
	 * parents, then we only consider TREESAMEness with respect to them,
	 * allowing irrelevant merges from uninteresting branches to be
	 * simplified away. Only if we have only irrelevant parents do we
	 * base TREESAME on them. Note that this logic is replicated in
	 * update_treesame, which should be kept in sync.
	 */
	if (relevant_parents ? !relevant_change : !irrelevant_change)
		commit->object.flags |= TREESAME;
755 756
}

757
static void commit_list_insert_by_date_cached(struct commit *p, struct commit_list **head,
758 759 760 761 762
		    struct commit_list *cached_base, struct commit_list **cache)
{
	struct commit_list *new_entry;

	if (cached_base && p->date < cached_base->item->date)
763
		new_entry = commit_list_insert_by_date(p, &cached_base->next);
764
	else
765
		new_entry = commit_list_insert_by_date(p, head);
766 767 768 769 770 771 772

	if (cache && (!*cache || p->date < (*cache)->item->date))
		*cache = new_entry;
}

static int add_parents_to_list(struct rev_info *revs, struct commit *commit,
		    struct commit_list **list, struct commit_list **cache_ptr)
773 774
{
	struct commit_list *parent = commit->parents;
J
Junio C Hamano 已提交
775
	unsigned left_flag;
776
	struct commit_list *cached_base = cache_ptr ? *cache_ptr : NULL;
777

778
	if (commit->object.flags & ADDED)
779
		return 0;
780 781
	commit->object.flags |= ADDED;

782 783 784 785
	if (revs->include_check &&
	    !revs->include_check(commit, revs->include_check_data))
		return 0;

786 787 788 789 790 791 792 793 794 795 796 797 798 799 800 801
	/*
	 * If the commit is uninteresting, don't try to
	 * prune parents - we want the maximal uninteresting
	 * set.
	 *
	 * Normally we haven't parsed the parent
	 * yet, so we won't have a parent of a parent
	 * here. However, it may turn out that we've
	 * reached this commit some other way (where it
	 * wasn't uninteresting), in which case we need
	 * to mark its parents recursively too..
	 */
	if (commit->object.flags & UNINTERESTING) {
		while (parent) {
			struct commit *p = parent->item;
			parent = parent->next;
802 803
			if (p)
				p->object.flags |= UNINTERESTING;
804
			if (parse_commit(p) < 0)
805
				continue;
806 807 808 809 810
			if (p->parents)
				mark_parents_uninteresting(p);
			if (p->object.flags & SEEN)
				continue;
			p->object.flags |= SEEN;
811
			commit_list_insert_by_date_cached(p, list, cached_base, cache_ptr);
812
		}
813
		return 0;
814 815 816 817 818 819 820
	}

	/*
	 * Ok, the commit wasn't uninteresting. Try to
	 * simplify the commit history and find the parent
	 * that has no differences in the path set if one exists.
	 */
L
Linus Torvalds 已提交
821
	try_to_simplify_commit(revs, commit);
822

L
Linus Torvalds 已提交
823
	if (revs->no_walk)
824
		return 0;
L
Linus Torvalds 已提交
825

J
Junio C Hamano 已提交
826
	left_flag = (commit->object.flags & SYMMETRIC_LEFT);
827

828
	for (parent = commit->parents; parent; parent = parent->next) {
829 830
		struct commit *p = parent->item;

831 832
		if (parse_commit(p) < 0)
			return -1;
833 834
		if (revs->show_source && !p->util)
			p->util = commit->util;
J
Junio C Hamano 已提交
835
		p->object.flags |= left_flag;
836 837
		if (!(p->object.flags & SEEN)) {
			p->object.flags |= SEEN;
838
			commit_list_insert_by_date_cached(p, list, cached_base, cache_ptr);
839
		}
J
Junio C Hamano 已提交
840
		if (revs->first_parent_only)
841
			break;
842
	}
843
	return 0;
844 845
}

846
static void cherry_pick_list(struct commit_list *list, struct rev_info *revs)
J
Junio C Hamano 已提交
847 848 849 850 851
{
	struct commit_list *p;
	int left_count = 0, right_count = 0;
	int left_first;
	struct patch_ids ids;
852
	unsigned cherry_flag;
J
Junio C Hamano 已提交
853 854 855 856 857 858 859 860 861 862 863 864 865

	/* First count the commits on the left and on the right */
	for (p = list; p; p = p->next) {
		struct commit *commit = p->item;
		unsigned flags = commit->object.flags;
		if (flags & BOUNDARY)
			;
		else if (flags & SYMMETRIC_LEFT)
			left_count++;
		else
			right_count++;
	}

866 867 868
	if (!left_count || !right_count)
		return;

J
Junio C Hamano 已提交
869 870
	left_first = left_count < right_count;
	init_patch_ids(&ids);
871
	ids.diffopts.pathspec = revs->diffopt.pathspec;
J
Junio C Hamano 已提交
872 873 874 875 876 877 878 879 880 881 882 883 884 885 886 887 888 889

	/* Compute patch-ids for one side */
	for (p = list; p; p = p->next) {
		struct commit *commit = p->item;
		unsigned flags = commit->object.flags;

		if (flags & BOUNDARY)
			continue;
		/*
		 * If we have fewer left, left_first is set and we omit
		 * commits on the right branch in this loop.  If we have
		 * fewer right, we skip the left ones.
		 */
		if (left_first != !!(flags & SYMMETRIC_LEFT))
			continue;
		commit->util = add_commit_patch_id(commit, &ids);
	}

890 891 892
	/* either cherry_mark or cherry_pick are true */
	cherry_flag = revs->cherry_mark ? PATCHSAME : SHOWN;

J
Junio C Hamano 已提交
893 894 895 896 897 898 899 900 901 902 903 904 905 906 907 908 909 910 911 912 913 914
	/* Check the other side */
	for (p = list; p; p = p->next) {
		struct commit *commit = p->item;
		struct patch_id *id;
		unsigned flags = commit->object.flags;

		if (flags & BOUNDARY)
			continue;
		/*
		 * If we have fewer left, left_first is set and we omit
		 * commits on the left branch in this loop.
		 */
		if (left_first == !!(flags & SYMMETRIC_LEFT))
			continue;

		/*
		 * Have we seen the same patch id?
		 */
		id = has_commit_patch_id(commit, &ids);
		if (!id)
			continue;
		id->seen = 1;
915
		commit->object.flags |= cherry_flag;
J
Junio C Hamano 已提交
916 917 918 919 920 921 922 923 924 925 926
	}

	/* Now check the original side for seen ones */
	for (p = list; p; p = p->next) {
		struct commit *commit = p->item;
		struct patch_id *ent;

		ent = commit->util;
		if (!ent)
			continue;
		if (ent->seen)
927
			commit->object.flags |= cherry_flag;
J
Junio C Hamano 已提交
928 929 930 931 932 933
		commit->util = NULL;
	}

	free_patch_ids(&ids);
}

934 935 936 937
/* How many extra uninteresting commits we want to see.. */
#define SLOP 5

static int still_interesting(struct commit_list *src, unsigned long date, int slop)
938
{
939 940 941 942 943 944 945 946 947 948
	/*
	 * No source list at all? We're definitely done..
	 */
	if (!src)
		return 0;

	/*
	 * Does the destination list contain entries with a date
	 * before the source list? Definitely _not_ done.
	 */
949
	if (date <= src->item->date)
950 951 952 953 954 955 956 957 958 959 960
		return SLOP;

	/*
	 * Does the source list still have interesting commits in
	 * it? Definitely not done..
	 */
	if (!everybody_uninteresting(src))
		return SLOP;

	/* Ok, we're closing in.. */
	return slop-1;
961 962
}

J
Junio C Hamano 已提交
963 964 965 966 967 968 969 970 971 972 973 974 975 976 977 978 979 980 981 982 983 984 985 986 987 988 989 990 991 992 993 994 995 996 997 998 999 1000 1001 1002 1003 1004 1005 1006 1007 1008 1009 1010 1011 1012 1013 1014 1015 1016 1017 1018 1019 1020 1021 1022 1023 1024 1025 1026 1027 1028 1029 1030 1031 1032 1033 1034 1035 1036 1037 1038 1039 1040
/*
 * "rev-list --ancestry-path A..B" computes commits that are ancestors
 * of B but not ancestors of A but further limits the result to those
 * that are descendants of A.  This takes the list of bottom commits and
 * the result of "A..B" without --ancestry-path, and limits the latter
 * further to the ones that can reach one of the commits in "bottom".
 *
 * Commits in "list" that cannot reach a bottom commit are flagged
 * UNINTERESTING. TMP_MARK is used as scratch state and is cleared
 * again before returning.
 */
static void limit_to_ancestry(struct commit_list *bottom, struct commit_list *list)
{
	struct commit_list *it;
	struct commit_list *reversed = NULL;
	int made_progress;

	/*
	 * Reverse the list so that it will be likely that we would
	 * process parents before children.
	 */
	for (it = list; it; it = it->next)
		commit_list_insert(it->item, &reversed);

	/* Seed the marking with the bottom commits themselves. */
	for (it = bottom; it; it = it->next)
		it->item->object.flags |= TMP_MARK;

	/*
	 * Mark the ones that can reach bottom commits in "list",
	 * in a bottom-up fashion.  Repeat until a full pass marks
	 * nothing new.
	 */
	do {
		made_progress = 0;
		for (it = reversed; it; it = it->next) {
			struct commit *c = it->item;
			struct commit_list *par;

			if (c->object.flags & (TMP_MARK | UNINTERESTING))
				continue;

			/* One marked parent is enough to mark the child. */
			for (par = c->parents; par; par = par->next) {
				if (par->item->object.flags & TMP_MARK) {
					c->object.flags |= TMP_MARK;
					made_progress = 1;
					break;
				}
			}
		}
	} while (made_progress);

	/*
	 * NEEDSWORK: decide if we want to remove parents that are
	 * not marked with TMP_MARK from commit->parents for commits
	 * in the resulting list.  We may not want to do that, though.
	 */

	/*
	 * The ones that are not marked with TMP_MARK are uninteresting
	 */
	for (it = list; it; it = it->next) {
		struct commit *c = it->item;

		if (!(c->object.flags & TMP_MARK))
			c->object.flags |= UNINTERESTING;
	}

	/* We are done with the TMP_MARK */
	for (it = list; it; it = it->next)
		it->item->object.flags &= ~TMP_MARK;
	for (it = bottom; it; it = it->next)
		it->item->object.flags &= ~TMP_MARK;

	free_commit_list(reversed);
}

/*
 * Before walking the history, keep the set of "negative" refs the
 * caller has asked to exclude.
 *
 * This is used to compute "rev-list --ancestry-path A..B", as we need
 * to filter the result of "A..B" further to the ones that can actually
 * reach A.
 */
1041
static struct commit_list *collect_bottom_commits(struct commit_list *list)
J
Junio C Hamano 已提交
1042
{
1043 1044 1045 1046
	struct commit_list *elem, *bottom = NULL;
	for (elem = list; elem; elem = elem->next)
		if (elem->item->object.flags & BOTTOM)
			commit_list_insert(elem->item, &bottom);
J
Junio C Hamano 已提交
1047 1048 1049
	return bottom;
}

1050 1051 1052 1053 1054 1055 1056 1057 1058 1059 1060 1061 1062 1063 1064 1065 1066
/* Assumes either left_only or right_only is set */
static void limit_left_right(struct commit_list *list, struct rev_info *revs)
{
	struct commit_list *p;

	for (p = list; p; p = p->next) {
		struct commit *commit = p->item;

		if (revs->right_only) {
			if (commit->object.flags & SYMMETRIC_LEFT)
				commit->object.flags |= SHOWN;
		} else	/* revs->left_only is set */
			if (!(commit->object.flags & SYMMETRIC_LEFT))
				commit->object.flags |= SHOWN;
	}
}

1067
static int limit_list(struct rev_info *revs)
1068
{
1069 1070
	int slop = SLOP;
	unsigned long date = ~0ul;
1071 1072 1073
	struct commit_list *list = revs->commits;
	struct commit_list *newlist = NULL;
	struct commit_list **p = &newlist;
J
Junio C Hamano 已提交
1074 1075 1076
	struct commit_list *bottom = NULL;

	if (revs->ancestry_path) {
1077
		bottom = collect_bottom_commits(list);
J
Junio C Hamano 已提交
1078
		if (!bottom)
1079
			die("--ancestry-path given but there are no bottom commits");
J
Junio C Hamano 已提交
1080
	}
1081 1082 1083 1084 1085

	while (list) {
		struct commit_list *entry = list;
		struct commit *commit = list->item;
		struct object *obj = &commit->object;
1086
		show_early_output_fn_t show;
1087 1088 1089 1090 1091 1092

		list = list->next;
		free(entry);

		if (revs->max_age != -1 && (commit->date < revs->max_age))
			obj->flags |= UNINTERESTING;
1093
		if (add_parents_to_list(revs, commit, &list, NULL) < 0)
1094
			return -1;
1095 1096
		if (obj->flags & UNINTERESTING) {
			mark_parents_uninteresting(commit);
1097 1098 1099 1100
			if (revs->show_all)
				p = &commit_list_insert(commit, p)->next;
			slop = still_interesting(list, date, slop);
			if (slop)
1101
				continue;
1102 1103 1104 1105
			/* If showing all, add the whole pending list to the end */
			if (revs->show_all)
				*p = list;
			break;
1106 1107 1108
		}
		if (revs->min_age != -1 && (commit->date > revs->min_age))
			continue;
1109
		date = commit->date;
1110
		p = &commit_list_insert(commit, p)->next;
1111 1112 1113 1114 1115 1116 1117

		show = show_early_output;
		if (!show)
			continue;

		show(revs, newlist);
		show_early_output = NULL;
1118
	}
1119
	if (revs->cherry_pick || revs->cherry_mark)
1120
		cherry_pick_list(newlist, revs);
J
Junio C Hamano 已提交
1121

1122 1123 1124
	if (revs->left_only || revs->right_only)
		limit_left_right(newlist, revs);

J
Junio C Hamano 已提交
1125 1126 1127 1128 1129
	if (bottom) {
		limit_to_ancestry(bottom, newlist);
		free_commit_list(bottom);
	}

1130 1131 1132 1133 1134 1135 1136 1137 1138 1139 1140 1141
	/*
	 * Check if any commits have become TREESAME by some of their parents
	 * becoming UNINTERESTING.
	 */
	if (limiting_can_increase_treesame(revs))
		for (list = newlist; list; list = list->next) {
			struct commit *c = list->item;
			if (c->object.flags & (UNINTERESTING | TREESAME))
				continue;
			update_treesame(revs, c);
		}

1142
	revs->commits = newlist;
1143
	return 0;
1144 1145
}

1146 1147 1148 1149
/*
 * Add an entry to refs->cmdline with the specified information.
 * *name is copied.
 */
1150 1151 1152 1153 1154 1155 1156 1157 1158 1159 1160
static void add_rev_cmdline(struct rev_info *revs,
			    struct object *item,
			    const char *name,
			    int whence,
			    unsigned flags)
{
	struct rev_cmdline_info *info = &revs->cmdline;
	int nr = info->nr;

	ALLOC_GROW(info->rev, nr + 1, info->alloc);
	info->rev[nr].item = item;
1161
	info->rev[nr].name = xstrdup(name);
1162 1163 1164 1165 1166
	info->rev[nr].whence = whence;
	info->rev[nr].flags = flags;
	info->nr++;
}

1167 1168 1169 1170 1171 1172 1173 1174 1175 1176 1177 1178 1179
/*
 * Record every commit of "commit_list" in revs->cmdline, using the
 * hexadecimal object name as the entry's name and the same "whence"
 * and "flags" for all of them.
 */
static void add_rev_cmdline_list(struct rev_info *revs,
				 struct commit_list *commit_list,
				 int whence,
				 unsigned flags)
{
	struct commit_list *entry;

	for (entry = commit_list; entry; entry = entry->next) {
		struct object *obj = &entry->item->object;
		const char *hex = sha1_to_hex(obj->sha1);

		add_rev_cmdline(revs, obj, hex, whence, flags);
	}
}

1180 1181
/*
 * Callback data shared by the ref and reflog iteration helpers
 * in this file.
 */
struct all_refs_cb {
	/* flags applied to every object reached through the iteration */
	int all_flags;
	/* set once a warning was issued for the reflog being walked */
	int warned_bad_reflog;
	/* the revision walk the objects are added to */
	struct rev_info *all_revs;
	/* name of the reflog being walked, used in the warning */
	const char *name_for_errormsg;
};
1186

1187
static int handle_one_ref(const char *path, const unsigned char *sha1, int flag, void *cb_data)
1188
{
1189 1190 1191
	struct all_refs_cb *cb = cb_data;
	struct object *object = get_reference(cb->all_revs, path, sha1,
					      cb->all_flags);
1192
	add_rev_cmdline(cb->all_revs, object, path, REV_CMD_REF, cb->all_flags);
1193
	add_pending_sha1(cb->all_revs, path, sha1, cb->all_flags);
1194 1195 1196
	return 0;
}

I
Ilari Liusvaara 已提交
1197 1198 1199 1200 1201 1202 1203
/*
 * Fill in the flags and the rev_info of a ref callback structure.
 * The reflog-related members (warned_bad_reflog, name_for_errormsg)
 * are not touched here.
 */
static void init_all_refs_cb(struct all_refs_cb *cb, struct rev_info *revs,
	unsigned flags)
{
	cb->all_flags = flags;
	cb->all_revs = revs;
}

1204 1205
/*
 * Run the ref iterator "for_each" on "submodule", feeding each ref to
 * handle_one_ref() so that it is added to "revs" with "flags".
 * The iterator's return value is ignored.
 */
static void handle_refs(const char *submodule, struct rev_info *revs, unsigned flags,
		int (*for_each)(const char *, each_ref_fn, void *))
{
	struct all_refs_cb cb;
	init_all_refs_cb(&cb, revs, flags);
	for_each(submodule, handle_one_ref, &cb);
}

1212
static void handle_one_reflog_commit(unsigned char *sha1, void *cb_data)
1213 1214
{
	struct all_refs_cb *cb = cb_data;
1215 1216 1217 1218
	if (!is_null_sha1(sha1)) {
		struct object *o = parse_object(sha1);
		if (o) {
			o->flags |= cb->all_flags;
1219
			/* ??? CMDLINEFLAGS ??? */
1220 1221 1222
			add_pending_object(cb->all_revs, o, "");
		}
		else if (!cb->warned_bad_reflog) {
1223
			warning("reflog of '%s' references pruned commits",
1224 1225 1226
				cb->name_for_errormsg);
			cb->warned_bad_reflog = 1;
		}
1227
	}
1228 1229
}

1230 1231 1232
/*
 * Reflog entry callback: queue both the old and the new object of the
 * entry.  The email, timestamp, tz and message arguments are unused.
 * Always returns 0.
 */
static int handle_one_reflog_ent(unsigned char *osha1, unsigned char *nsha1,
		const char *email, unsigned long timestamp, int tz,
		const char *message, void *cb_data)
{
	handle_one_reflog_commit(osha1, cb_data);
	handle_one_reflog_commit(nsha1, cb_data);
	return 0;
}

static int handle_one_reflog(const char *path, const unsigned char *sha1, int flag, void *cb_data)
{
	struct all_refs_cb *cb = cb_data;
1242
	cb->warned_bad_reflog = 0;
1243 1244 1245 1246 1247 1248 1249 1250 1251 1252
	cb->name_for_errormsg = path;
	for_each_reflog_ent(path, handle_one_reflog_ent, cb_data);
	return 0;
}

static void handle_reflog(struct rev_info *revs, unsigned flags)
{
	struct all_refs_cb cb;
	cb.all_revs = revs;
	cb.all_flags = flags;
1253
	for_each_reflog(handle_one_reflog, &cb);
1254 1255
}

1256
static int add_parents_only(struct rev_info *revs, const char *arg_, int flags)
1257 1258 1259 1260 1261
{
	unsigned char sha1[20];
	struct object *it;
	struct commit *commit;
	struct commit_list *parents;
1262
	const char *arg = arg_;
1263 1264

	if (*arg == '^') {
1265
		flags ^= UNINTERESTING | BOTTOM;
1266 1267
		arg++;
	}
1268
	if (get_sha1_committish(arg, sha1))
1269 1270 1271
		return 0;
	while (1) {
		it = get_reference(revs, arg, sha1, 0);
J
Junio C Hamano 已提交
1272 1273
		if (!it && revs->ignore_missing)
			return 0;
1274
		if (it->type != OBJ_TAG)
1275
			break;
1276 1277
		if (!((struct tag*)it)->tagged)
			return 0;
1278
		hashcpy(sha1, ((struct tag*)it)->tagged->sha1);
1279
	}
1280
	if (it->type != OBJ_COMMIT)
1281 1282 1283 1284 1285
		return 0;
	commit = (struct commit *)it;
	for (parents = commit->parents; parents; parents = parents->next) {
		it = &parents->item->object;
		it->flags |= flags;
1286
		add_rev_cmdline(revs, it, arg_, REV_CMD_PARENTS_ONLY, flags);
1287 1288 1289 1290 1291
		add_pending_object(revs, it, arg);
	}
	return 1;
}

1292
void init_revisions(struct rev_info *revs, const char *prefix)
1293 1294
{
	memset(revs, 0, sizeof(*revs));
1295

1296
	revs->abbrev = DEFAULT_ABBREV;
1297
	revs->ignore_merges = 1;
L
Linus Torvalds 已提交
1298
	revs->simplify_history = 1;
1299
	DIFF_OPT_SET(&revs->pruning, RECURSIVE);
1300
	DIFF_OPT_SET(&revs->pruning, QUICK);
1301 1302
	revs->pruning.add_remove = file_add_remove;
	revs->pruning.change = file_change;
J
Junio C Hamano 已提交
1303
	revs->sort_order = REV_SORT_IN_GRAPH_ORDER;
1304
	revs->dense = 1;
1305
	revs->prefix = prefix;
1306 1307
	revs->max_age = -1;
	revs->min_age = -1;
J
Junio C Hamano 已提交
1308
	revs->skip_count = -1;
1309
	revs->max_count = -1;
1310
	revs->max_parents = -1;
1311

1312 1313
	revs->commit_format = CMIT_FMT_DEFAULT;

1314 1315
	init_grep_defaults();
	grep_init(&revs->grep_filter, prefix);
J
Jeff King 已提交
1316 1317 1318
	revs->grep_filter.status_only = 1;
	revs->grep_filter.regflags = REG_NEWLINE;

1319
	diff_setup(&revs->diffopt);
1320
	if (prefix && !revs->diffopt.prefix) {
1321 1322 1323
		revs->diffopt.prefix = prefix;
		revs->diffopt.prefix_length = strlen(prefix);
	}
1324 1325

	revs->notes_opt.use_default_notes = -1;
1326 1327
}

R
Rene Scharfe 已提交
1328 1329 1330 1331 1332 1333 1334 1335 1336 1337 1338 1339
/*
 * Set "flags" on every commit of "commit_list" and queue each of them
 * as a pending object named by its hexadecimal object name.
 */
static void add_pending_commit_list(struct rev_info *revs,
                                    struct commit_list *commit_list,
                                    unsigned int flags)
{
	struct commit_list *entry;

	for (entry = commit_list; entry; entry = entry->next) {
		struct object *obj = &entry->item->object;

		obj->flags |= flags;
		add_pending_object(revs, obj, sha1_to_hex(obj->sha1));
	}
}

1340 1341 1342 1343 1344 1345 1346 1347
static void prepare_show_merge(struct rev_info *revs)
{
	struct commit_list *bases;
	struct commit *head, *other;
	unsigned char sha1[20];
	const char **prune = NULL;
	int i, prune_num = 1; /* counting terminating NULL */

1348
	if (get_sha1("HEAD", sha1))
1349
		die("--merge without HEAD?");
1350 1351
	head = lookup_commit_or_die(sha1, "HEAD");
	if (get_sha1("MERGE_HEAD", sha1))
1352
		die("--merge without MERGE_HEAD?");
1353
	other = lookup_commit_or_die(sha1, "MERGE_HEAD");
1354 1355 1356
	add_pending_object(revs, &head->object, "HEAD");
	add_pending_object(revs, &other->object, "MERGE_HEAD");
	bases = get_merge_bases(head, other, 1);
1357 1358
	add_rev_cmdline_list(revs, bases, REV_CMD_MERGE_BASE, UNINTERESTING | BOTTOM);
	add_pending_commit_list(revs, bases, UNINTERESTING | BOTTOM);
1359 1360
	free_commit_list(bases);
	head->object.flags |= SYMMETRIC_LEFT;
1361 1362 1363 1364

	if (!active_nr)
		read_cache();
	for (i = 0; i < active_nr; i++) {
1365
		const struct cache_entry *ce = active_cache[i];
1366 1367
		if (!ce_stage(ce))
			continue;
1368
		if (ce_path_match(ce, &revs->prune_data)) {
1369 1370 1371 1372 1373 1374 1375 1376 1377
			prune_num++;
			prune = xrealloc(prune, sizeof(*prune) * prune_num);
			prune[prune_num-2] = ce->name;
			prune[prune_num-1] = NULL;
		}
		while ((i+1 < active_nr) &&
		       ce_same_name(ce, active_cache[i+1]))
			i++;
	}
1378
	free_pathspec(&revs->prune_data);
1379
	parse_pathspec(&revs->prune_data, PATHSPEC_ALL_MAGIC, 0, "", prune);
1380
	revs->limited = 1;
1381 1382
}

1383
int handle_revision_arg(const char *arg_, struct rev_info *revs, int flags, unsigned revarg_opt)
1384
{
1385
	struct object_context oc;
1386 1387 1388 1389
	char *dotdot;
	struct object *object;
	unsigned char sha1[20];
	int local_flags;
1390
	const char *arg = arg_;
1391
	int cant_be_filename = revarg_opt & REVARG_CANNOT_BE_FILENAME;
1392
	unsigned get_sha1_flags = 0;
1393

1394 1395
	flags = flags & UNINTERESTING ? flags | BOTTOM : flags & ~BOTTOM;

1396 1397 1398 1399 1400 1401
	dotdot = strstr(arg, "..");
	if (dotdot) {
		unsigned char from_sha1[20];
		const char *next = dotdot + 2;
		const char *this = arg;
		int symmetric = *next == '.';
1402
		unsigned int flags_exclude = flags ^ (UNINTERESTING | BOTTOM);
1403
		static const char head_by_default[] = "HEAD";
1404
		unsigned int a_flags;
1405 1406 1407 1408 1409

		*dotdot = 0;
		next += symmetric;

		if (!*next)
1410
			next = head_by_default;
1411
		if (dotdot == arg)
1412 1413 1414 1415 1416 1417 1418 1419 1420 1421 1422 1423
			this = head_by_default;
		if (this == head_by_default && next == head_by_default &&
		    !symmetric) {
			/*
			 * Just ".."?  That is not a range but the
			 * pathspec for the parent directory.
			 */
			if (!cant_be_filename) {
				*dotdot = '.';
				return -1;
			}
		}
1424 1425
		if (!get_sha1_committish(this, from_sha1) &&
		    !get_sha1_committish(next, sha1)) {
1426 1427 1428 1429 1430 1431
			struct commit *a, *b;
			struct commit_list *exclude;

			a = lookup_commit_reference(from_sha1);
			b = lookup_commit_reference(sha1);
			if (!a || !b) {
J
Junio C Hamano 已提交
1432 1433
				if (revs->ignore_missing)
					return 0;
1434 1435 1436 1437 1438 1439 1440 1441 1442 1443 1444 1445 1446
				die(symmetric ?
				    "Invalid symmetric difference expression %s...%s" :
				    "Invalid revision range %s..%s",
				    arg, next);
			}

			if (!cant_be_filename) {
				*dotdot = '.';
				verify_non_filename(revs->prefix, arg);
			}

			if (symmetric) {
				exclude = get_merge_bases(a, b, 1);
1447 1448 1449
				add_rev_cmdline_list(revs, exclude,
						     REV_CMD_MERGE_BASE,
						     flags_exclude);
1450 1451 1452
				add_pending_commit_list(revs, exclude,
							flags_exclude);
				free_commit_list(exclude);
1453
				a_flags = flags | SYMMETRIC_LEFT;
1454
			} else
1455 1456
				a_flags = flags_exclude;
			a->object.flags |= a_flags;
1457
			b->object.flags |= flags;
1458 1459 1460 1461
			add_rev_cmdline(revs, &a->object, this,
					REV_CMD_LEFT, a_flags);
			add_rev_cmdline(revs, &b->object, next,
					REV_CMD_RIGHT, flags);
1462 1463 1464 1465 1466 1467 1468 1469 1470 1471 1472 1473 1474
			add_pending_object(revs, &a->object, this);
			add_pending_object(revs, &b->object, next);
			return 0;
		}
		*dotdot = '.';
	}
	dotdot = strstr(arg, "^@");
	if (dotdot && !dotdot[2]) {
		*dotdot = 0;
		if (add_parents_only(revs, arg, flags))
			return 0;
		*dotdot = '^';
	}
1475 1476 1477
	dotdot = strstr(arg, "^!");
	if (dotdot && !dotdot[2]) {
		*dotdot = 0;
1478
		if (!add_parents_only(revs, arg, flags ^ (UNINTERESTING | BOTTOM)))
1479 1480 1481
			*dotdot = '^';
	}

1482 1483
	local_flags = 0;
	if (*arg == '^') {
1484
		local_flags = UNINTERESTING | BOTTOM;
1485 1486
		arg++;
	}
1487 1488 1489 1490 1491

	if (revarg_opt & REVARG_COMMITTISH)
		get_sha1_flags = GET_SHA1_COMMITTISH;

	if (get_sha1_with_context(arg, get_sha1_flags, sha1, &oc))
J
Junio C Hamano 已提交
1492
		return revs->ignore_missing ? 0 : -1;
1493 1494 1495
	if (!cant_be_filename)
		verify_non_filename(revs->prefix, arg);
	object = get_reference(revs, arg, sha1, flags ^ local_flags);
1496
	add_rev_cmdline(revs, object, arg_, REV_CMD_REV, flags ^ local_flags);
1497
	add_pending_object_with_mode(revs, object, arg, oc.mode);
1498 1499 1500
	return 0;
}

1501 1502 1503 1504 1505
/*
 * Growable array of pathspec strings; grown with ALLOC_GROW() by the
 * helpers below.
 */
struct cmdline_pathspec {
	int alloc;		/* allocation counter handed to ALLOC_GROW() */
	int nr;			/* number of entries stored in path[] */
	const char **path;	/* the collected pathspec strings */
};
1506

1507 1508 1509 1510 1511 1512 1513
/*
 * Append every string of the NULL-terminated array "av" to "prune".
 * Only the pointers are stored; the strings are not copied.
 */
static void append_prune_data(struct cmdline_pathspec *prune, const char **av)
{
	const char **cur;

	for (cur = av; *cur; cur++) {
		ALLOC_GROW(prune->path, prune->nr+1, prune->alloc);
		prune->path[prune->nr] = *cur;
		prune->nr++;
	}
}
1514

1515 1516 1517
static void read_pathspec_from_stdin(struct rev_info *revs, struct strbuf *sb,
				     struct cmdline_pathspec *prune)
{
1518 1519 1520 1521
	while (strbuf_getwholeline(sb, stdin, '\n') != EOF) {
		int len = sb->len;
		if (len && sb->buf[len - 1] == '\n')
			sb->buf[--len] = '\0';
1522 1523
		ALLOC_GROW(prune->path, prune->nr+1, prune->alloc);
		prune->path[prune->nr++] = xstrdup(sb->buf);
1524 1525 1526
	}
}

1527 1528
static void read_revisions_from_stdin(struct rev_info *revs,
				      struct cmdline_pathspec *prune)
1529
{
1530
	struct strbuf sb;
1531
	int seen_dashdash = 0;
1532

1533 1534 1535 1536 1537
	strbuf_init(&sb, 1000);
	while (strbuf_getwholeline(&sb, stdin, '\n') != EOF) {
		int len = sb.len;
		if (len && sb.buf[len - 1] == '\n')
			sb.buf[--len] = '\0';
1538 1539
		if (!len)
			break;
1540 1541 1542 1543 1544
		if (sb.buf[0] == '-') {
			if (len == 2 && sb.buf[1] == '-') {
				seen_dashdash = 1;
				break;
			}
1545
			die("options not supported in --stdin mode");
1546
		}
1547
		if (handle_revision_arg(sb.buf, revs, 0,
1548
					REVARG_CANNOT_BE_FILENAME))
1549
			die("bad revision '%s'", sb.buf);
1550
	}
1551 1552
	if (seen_dashdash)
		read_pathspec_from_stdin(revs, &sb, prune);
1553
	strbuf_release(&sb);
1554 1555
}

1556
static void add_grep(struct rev_info *revs, const char *ptn, enum grep_pat_token what)
1557
{
J
Jeff King 已提交
1558
	append_grep_pattern(&revs->grep_filter, ptn, "command line", 0, what);
1559 1560
}

1561
static void add_header_grep(struct rev_info *revs, enum grep_header_field field, const char *pattern)
1562
{
1563
	append_header_grep_pattern(&revs->grep_filter, field, pattern);
1564 1565 1566 1567
}

static void add_message_grep(struct rev_info *revs, const char *pattern)
{
1568
	add_grep(revs, pattern, GREP_PATTERN_BODY);
1569 1570
}

1571 1572
static int handle_revision_opt(struct rev_info *revs, int argc, const char **argv,
			       int *unkc, const char **unkv)
1573 1574
{
	const char *arg = argv[0];
1575 1576
	const char *optarg;
	int argcount;
1577 1578 1579 1580 1581

	/* pseudo revision arguments */
	if (!strcmp(arg, "--all") || !strcmp(arg, "--branches") ||
	    !strcmp(arg, "--tags") || !strcmp(arg, "--remotes") ||
	    !strcmp(arg, "--reflog") || !strcmp(arg, "--not") ||
1582
	    !strcmp(arg, "--no-walk") || !strcmp(arg, "--do-walk") ||
1583 1584
	    !strcmp(arg, "--bisect") || !prefixcmp(arg, "--glob=") ||
	    !prefixcmp(arg, "--branches=") || !prefixcmp(arg, "--tags=") ||
1585
	    !prefixcmp(arg, "--remotes=") || !prefixcmp(arg, "--no-walk="))
1586 1587
	{
		unkv[(*unkc)++] = arg;
1588
		return 1;
1589 1590
	}

1591 1592
	if ((argcount = parse_long_opt("max-count", argv, &optarg))) {
		revs->max_count = atoi(optarg);
1593
		revs->no_walk = 0;
1594 1595 1596 1597
		return argcount;
	} else if ((argcount = parse_long_opt("skip", argv, &optarg))) {
		revs->skip_count = atoi(optarg);
		return argcount;
1598 1599 1600
	} else if ((*arg == '-') && isdigit(arg[1])) {
	/* accept -<digit>, like traditional "head" */
		revs->max_count = atoi(arg + 1);
1601
		revs->no_walk = 0;
1602 1603 1604 1605
	} else if (!strcmp(arg, "-n")) {
		if (argc <= 1)
			return error("-n requires an argument");
		revs->max_count = atoi(argv[1]);
1606
		revs->no_walk = 0;
1607 1608 1609
		return 2;
	} else if (!prefixcmp(arg, "-n")) {
		revs->max_count = atoi(arg + 2);
1610
		revs->no_walk = 0;
1611 1612 1613 1614 1615 1616 1617 1618 1619 1620 1621 1622 1623 1624 1625 1626 1627 1628
	} else if ((argcount = parse_long_opt("max-age", argv, &optarg))) {
		revs->max_age = atoi(optarg);
		return argcount;
	} else if ((argcount = parse_long_opt("since", argv, &optarg))) {
		revs->max_age = approxidate(optarg);
		return argcount;
	} else if ((argcount = parse_long_opt("after", argv, &optarg))) {
		revs->max_age = approxidate(optarg);
		return argcount;
	} else if ((argcount = parse_long_opt("min-age", argv, &optarg))) {
		revs->min_age = atoi(optarg);
		return argcount;
	} else if ((argcount = parse_long_opt("before", argv, &optarg))) {
		revs->min_age = approxidate(optarg);
		return argcount;
	} else if ((argcount = parse_long_opt("until", argv, &optarg))) {
		revs->min_age = approxidate(optarg);
		return argcount;
1629 1630
	} else if (!strcmp(arg, "--first-parent")) {
		revs->first_parent_only = 1;
J
Junio C Hamano 已提交
1631 1632
	} else if (!strcmp(arg, "--ancestry-path")) {
		revs->ancestry_path = 1;
1633
		revs->simplify_history = 0;
J
Junio C Hamano 已提交
1634
		revs->limited = 1;
1635 1636 1637 1638 1639 1640 1641 1642 1643 1644
	} else if (!strcmp(arg, "-g") || !strcmp(arg, "--walk-reflogs")) {
		init_reflog_walk(&revs->reflog_info);
	} else if (!strcmp(arg, "--default")) {
		if (argc <= 1)
			return error("bad --default argument");
		revs->def = argv[1];
		return 2;
	} else if (!strcmp(arg, "--merge")) {
		revs->show_merge = 1;
	} else if (!strcmp(arg, "--topo-order")) {
J
Junio C Hamano 已提交
1645
		revs->sort_order = REV_SORT_IN_GRAPH_ORDER;
1646
		revs->topo_order = 1;
1647 1648
	} else if (!strcmp(arg, "--simplify-merges")) {
		revs->simplify_merges = 1;
1649
		revs->topo_order = 1;
1650 1651 1652
		revs->rewrite_parents = 1;
		revs->simplify_history = 0;
		revs->limited = 1;
1653 1654
	} else if (!strcmp(arg, "--simplify-by-decoration")) {
		revs->simplify_merges = 1;
1655
		revs->topo_order = 1;
1656 1657 1658 1659 1660
		revs->rewrite_parents = 1;
		revs->simplify_history = 0;
		revs->simplify_by_decoration = 1;
		revs->limited = 1;
		revs->prune = 1;
1661
		load_ref_decorations(DECORATE_SHORT_REFS);
1662
	} else if (!strcmp(arg, "--date-order")) {
J
Junio C Hamano 已提交
1663
		revs->sort_order = REV_SORT_BY_COMMIT_DATE;
1664
		revs->topo_order = 1;
J
Junio C Hamano 已提交
1665 1666
	} else if (!strcmp(arg, "--author-date-order")) {
		revs->sort_order = REV_SORT_BY_AUTHOR_DATE;
1667 1668 1669 1670 1671 1672 1673 1674 1675 1676 1677 1678 1679 1680 1681 1682 1683 1684 1685 1686 1687 1688
		revs->topo_order = 1;
	} else if (!prefixcmp(arg, "--early-output")) {
		int count = 100;
		switch (arg[14]) {
		case '=':
			count = atoi(arg+15);
			/* Fallthrough */
		case 0:
			revs->topo_order = 1;
		       revs->early_output = count;
		}
	} else if (!strcmp(arg, "--parents")) {
		revs->rewrite_parents = 1;
		revs->print_parents = 1;
	} else if (!strcmp(arg, "--dense")) {
		revs->dense = 1;
	} else if (!strcmp(arg, "--sparse")) {
		revs->dense = 0;
	} else if (!strcmp(arg, "--show-all")) {
		revs->show_all = 1;
	} else if (!strcmp(arg, "--remove-empty")) {
		revs->remove_empty_trees = 1;
1689
	} else if (!strcmp(arg, "--merges")) {
1690
		revs->min_parents = 2;
1691
	} else if (!strcmp(arg, "--no-merges")) {
1692 1693 1694 1695 1696 1697 1698 1699 1700
		revs->max_parents = 1;
	} else if (!prefixcmp(arg, "--min-parents=")) {
		revs->min_parents = atoi(arg+14);
	} else if (!prefixcmp(arg, "--no-min-parents")) {
		revs->min_parents = 0;
	} else if (!prefixcmp(arg, "--max-parents=")) {
		revs->max_parents = atoi(arg+14);
	} else if (!prefixcmp(arg, "--no-max-parents")) {
		revs->max_parents = -1;
1701 1702 1703 1704
	} else if (!strcmp(arg, "--boundary")) {
		revs->boundary = 1;
	} else if (!strcmp(arg, "--left-right")) {
		revs->left_right = 1;
1705
	} else if (!strcmp(arg, "--left-only")) {
1706
		if (revs->right_only)
M
Michael J Gruber 已提交
1707 1708
			die("--left-only is incompatible with --right-only"
			    " or --cherry");
1709 1710
		revs->left_only = 1;
	} else if (!strcmp(arg, "--right-only")) {
1711 1712
		if (revs->left_only)
			die("--right-only is incompatible with --left-only");
1713
		revs->right_only = 1;
M
Michael J Gruber 已提交
1714 1715 1716 1717 1718
	} else if (!strcmp(arg, "--cherry")) {
		if (revs->left_only)
			die("--cherry is incompatible with --left-only");
		revs->cherry_mark = 1;
		revs->right_only = 1;
1719
		revs->max_parents = 1;
M
Michael J Gruber 已提交
1720
		revs->limited = 1;
T
Thomas Rast 已提交
1721 1722
	} else if (!strcmp(arg, "--count")) {
		revs->count = 1;
1723 1724 1725 1726 1727
	} else if (!strcmp(arg, "--cherry-mark")) {
		if (revs->cherry_pick)
			die("--cherry-mark is incompatible with --cherry-pick");
		revs->cherry_mark = 1;
		revs->limited = 1; /* needs limit_list() */
1728
	} else if (!strcmp(arg, "--cherry-pick")) {
1729 1730
		if (revs->cherry_mark)
			die("--cherry-pick is incompatible with --cherry-mark");
1731 1732 1733 1734 1735 1736 1737 1738 1739 1740 1741
		revs->cherry_pick = 1;
		revs->limited = 1;
	} else if (!strcmp(arg, "--objects")) {
		revs->tag_objects = 1;
		revs->tree_objects = 1;
		revs->blob_objects = 1;
	} else if (!strcmp(arg, "--objects-edge")) {
		revs->tag_objects = 1;
		revs->tree_objects = 1;
		revs->blob_objects = 1;
		revs->edge_hint = 1;
J
Junio C Hamano 已提交
1742 1743 1744 1745 1746
	} else if (!strcmp(arg, "--verify-objects")) {
		revs->tag_objects = 1;
		revs->tree_objects = 1;
		revs->blob_objects = 1;
		revs->verify_objects = 1;
1747 1748
	} else if (!strcmp(arg, "--unpacked")) {
		revs->unpacked = 1;
J
Junio C Hamano 已提交
1749 1750
	} else if (!prefixcmp(arg, "--unpacked=")) {
		die("--unpacked=<packfile> no longer supported.");
1751 1752 1753 1754 1755 1756 1757 1758 1759 1760 1761 1762 1763 1764 1765 1766 1767 1768 1769 1770 1771
	} else if (!strcmp(arg, "-r")) {
		revs->diff = 1;
		DIFF_OPT_SET(&revs->diffopt, RECURSIVE);
	} else if (!strcmp(arg, "-t")) {
		revs->diff = 1;
		DIFF_OPT_SET(&revs->diffopt, RECURSIVE);
		DIFF_OPT_SET(&revs->diffopt, TREE_IN_RECURSIVE);
	} else if (!strcmp(arg, "-m")) {
		revs->ignore_merges = 0;
	} else if (!strcmp(arg, "-c")) {
		revs->diff = 1;
		revs->dense_combined_merges = 0;
		revs->combine_merges = 1;
	} else if (!strcmp(arg, "--cc")) {
		revs->diff = 1;
		revs->dense_combined_merges = 1;
		revs->combine_merges = 1;
	} else if (!strcmp(arg, "-v")) {
		revs->verbose_header = 1;
	} else if (!strcmp(arg, "--pretty")) {
		revs->verbose_header = 1;
1772
		revs->pretty_given = 1;
1773
		get_commit_format(arg+8, revs);
1774
	} else if (!prefixcmp(arg, "--pretty=") || !prefixcmp(arg, "--format=")) {
1775 1776 1777 1778
		/*
		 * Detached form ("--pretty X" as opposed to "--pretty=X")
		 * not allowed, since the argument is optional.
		 */
1779
		revs->verbose_header = 1;
1780
		revs->pretty_given = 1;
1781
		get_commit_format(arg+9, revs);
1782
	} else if (!strcmp(arg, "--show-notes") || !strcmp(arg, "--notes")) {
1783 1784
		revs->show_notes = 1;
		revs->show_notes_given = 1;
1785
		revs->notes_opt.use_default_notes = 1;
J
Junio C Hamano 已提交
1786 1787
	} else if (!strcmp(arg, "--show-signature")) {
		revs->show_signature = 1;
1788 1789
	} else if (!prefixcmp(arg, "--show-notes=") ||
		   !prefixcmp(arg, "--notes=")) {
1790 1791 1792
		struct strbuf buf = STRBUF_INIT;
		revs->show_notes = 1;
		revs->show_notes_given = 1;
1793 1794 1795 1796 1797 1798 1799
		if (!prefixcmp(arg, "--show-notes")) {
			if (revs->notes_opt.use_default_notes < 0)
				revs->notes_opt.use_default_notes = 1;
			strbuf_addstr(&buf, arg+13);
		}
		else
			strbuf_addstr(&buf, arg+8);
1800
		expand_notes_ref(&buf);
1801
		string_list_append(&revs->notes_opt.extra_notes_refs,
1802
				   strbuf_detach(&buf, NULL));
1803 1804 1805
	} else if (!strcmp(arg, "--no-notes")) {
		revs->show_notes = 0;
		revs->show_notes_given = 1;
1806 1807 1808 1809 1810 1811
		revs->notes_opt.use_default_notes = -1;
		/* we have been strdup'ing ourselves, so trick
		 * string_list into free()ing strings */
		revs->notes_opt.extra_notes_refs.strdup_strings = 1;
		string_list_clear(&revs->notes_opt.extra_notes_refs, 0);
		revs->notes_opt.extra_notes_refs.strdup_strings = 0;
1812 1813
	} else if (!strcmp(arg, "--standard-notes")) {
		revs->show_notes_given = 1;
1814
		revs->notes_opt.use_default_notes = 1;
1815
	} else if (!strcmp(arg, "--no-standard-notes")) {
1816
		revs->notes_opt.use_default_notes = 0;
1817 1818 1819
	} else if (!strcmp(arg, "--oneline")) {
		revs->verbose_header = 1;
		get_commit_format("oneline", revs);
1820
		revs->pretty_given = 1;
1821
		revs->abbrev_commit = 1;
1822 1823 1824 1825 1826 1827 1828 1829 1830 1831 1832 1833 1834 1835 1836 1837 1838 1839 1840 1841 1842 1843
	} else if (!strcmp(arg, "--graph")) {
		revs->topo_order = 1;
		revs->rewrite_parents = 1;
		revs->graph = graph_init(revs);
	} else if (!strcmp(arg, "--root")) {
		revs->show_root_diff = 1;
	} else if (!strcmp(arg, "--no-commit-id")) {
		revs->no_commit_id = 1;
	} else if (!strcmp(arg, "--always")) {
		revs->always_show_header = 1;
	} else if (!strcmp(arg, "--no-abbrev")) {
		revs->abbrev = 0;
	} else if (!strcmp(arg, "--abbrev")) {
		revs->abbrev = DEFAULT_ABBREV;
	} else if (!prefixcmp(arg, "--abbrev=")) {
		revs->abbrev = strtoul(arg + 9, NULL, 10);
		if (revs->abbrev < MINIMUM_ABBREV)
			revs->abbrev = MINIMUM_ABBREV;
		else if (revs->abbrev > 40)
			revs->abbrev = 40;
	} else if (!strcmp(arg, "--abbrev-commit")) {
		revs->abbrev_commit = 1;
1844 1845 1846
		revs->abbrev_commit_given = 1;
	} else if (!strcmp(arg, "--no-abbrev-commit")) {
		revs->abbrev_commit = 0;
1847 1848 1849 1850 1851 1852 1853
	} else if (!strcmp(arg, "--full-diff")) {
		revs->diff = 1;
		revs->full_diff = 1;
	} else if (!strcmp(arg, "--full-history")) {
		revs->simplify_history = 0;
	} else if (!strcmp(arg, "--relative-date")) {
		revs->date_mode = DATE_RELATIVE;
J
Jeff King 已提交
1854
		revs->date_mode_explicit = 1;
1855 1856
	} else if ((argcount = parse_long_opt("date", argv, &optarg))) {
		revs->date_mode = parse_date_format(optarg);
J
Jeff King 已提交
1857
		revs->date_mode_explicit = 1;
1858
		return argcount;
1859 1860 1861 1862 1863 1864
	} else if (!strcmp(arg, "--log-size")) {
		revs->show_log_size = 1;
	}
	/*
	 * Grepping the commit log
	 */
1865 1866 1867 1868 1869 1870
	else if ((argcount = parse_long_opt("author", argv, &optarg))) {
		add_header_grep(revs, GREP_HEADER_AUTHOR, optarg);
		return argcount;
	} else if ((argcount = parse_long_opt("committer", argv, &optarg))) {
		add_header_grep(revs, GREP_HEADER_COMMITTER, optarg);
		return argcount;
1871 1872 1873
	} else if ((argcount = parse_long_opt("grep-reflog", argv, &optarg))) {
		add_header_grep(revs, GREP_HEADER_REFLOG, optarg);
		return argcount;
1874 1875 1876
	} else if ((argcount = parse_long_opt("grep", argv, &optarg))) {
		add_message_grep(revs, optarg);
		return argcount;
1877 1878
	} else if (!strcmp(arg, "--grep-debug")) {
		revs->grep_filter.debug = 1;
1879 1880
	} else if (!strcmp(arg, "--basic-regexp")) {
		grep_set_pattern_type_option(GREP_PATTERN_TYPE_BRE, &revs->grep_filter);
1881
	} else if (!strcmp(arg, "--extended-regexp") || !strcmp(arg, "-E")) {
1882
		grep_set_pattern_type_option(GREP_PATTERN_TYPE_ERE, &revs->grep_filter);
1883
	} else if (!strcmp(arg, "--regexp-ignore-case") || !strcmp(arg, "-i")) {
J
Jeff King 已提交
1884
		revs->grep_filter.regflags |= REG_ICASE;
1885
		DIFF_OPT_SET(&revs->diffopt, PICKAXE_IGNORE_CASE);
1886
	} else if (!strcmp(arg, "--fixed-strings") || !strcmp(arg, "-F")) {
1887
		grep_set_pattern_type_option(GREP_PATTERN_TYPE_FIXED, &revs->grep_filter);
1888 1889
	} else if (!strcmp(arg, "--perl-regexp")) {
		grep_set_pattern_type_option(GREP_PATTERN_TYPE_PCRE, &revs->grep_filter);
1890
	} else if (!strcmp(arg, "--all-match")) {
J
Jeff King 已提交
1891
		revs->grep_filter.all_match = 1;
1892 1893 1894
	} else if ((argcount = parse_long_opt("encoding", argv, &optarg))) {
		if (strcmp(optarg, "none"))
			git_log_output_encoding = xstrdup(optarg);
1895 1896
		else
			git_log_output_encoding = "";
1897
		return argcount;
1898 1899 1900 1901 1902
	} else if (!strcmp(arg, "--reverse")) {
		revs->reverse ^= 1;
	} else if (!strcmp(arg, "--children")) {
		revs->children.name = "children";
		revs->limited = 1;
J
Junio C Hamano 已提交
1903 1904
	} else if (!strcmp(arg, "--ignore-missing")) {
		revs->ignore_missing = 1;
1905 1906 1907 1908 1909 1910 1911 1912 1913 1914
	} else {
		int opts = diff_opt_parse(&revs->diffopt, argv, argc);
		if (!opts)
			unkv[(*unkc)++] = arg;
		return opts;
	}

	return 1;
}

1915 1916 1917 1918 1919 1920 1921 1922 1923 1924 1925 1926 1927 1928
/*
 * Let handle_revision_opt() process the option at ctx->argv[0] and
 * step the parse context past the arguments it consumed.  If nothing
 * was consumed, an error is reported and the usage described by
 * "usagestr"/"options" is shown.
 */
void parse_revision_opt(struct rev_info *revs, struct parse_opt_ctx_t *ctx,
			const struct option *options,
			const char * const usagestr[])
{
	int consumed;

	consumed = handle_revision_opt(revs, ctx->argc, ctx->argv,
				       &ctx->cpidx, ctx->out);
	if (consumed <= 0) {
		error("unknown option `%s'", ctx->argv[0]);
		usage_with_options(usagestr, options);
	}
	ctx->argc -= consumed;
	ctx->argv += consumed;
}

1929
/*
 * Iterate over the refs under "refs/bisect/bad" of "submodule"; the
 * signature matches what handle_refs() expects for its iterator.
 */
static int for_each_bad_bisect_ref(const char *submodule, each_ref_fn fn, void *cb_data)
{
	return for_each_ref_in_submodule(submodule, "refs/bisect/bad", fn, cb_data);
}

1934
/*
 * Iterate over the refs under "refs/bisect/good" of "submodule"; the
 * signature matches what handle_refs() expects for its iterator.
 */
static int for_each_good_bisect_ref(const char *submodule, each_ref_fn fn, void *cb_data)
{
	return for_each_ref_in_submodule(submodule, "refs/bisect/good", fn, cb_data);
}

1939 1940 1941 1942 1943 1944 1945 1946
static int handle_revision_pseudo_opt(const char *submodule,
				struct rev_info *revs,
				int argc, const char **argv, int *flags)
{
	const char *arg = argv[0];
	const char *optarg;
	int argcount;

1947 1948 1949 1950 1951 1952 1953 1954 1955 1956
	/*
	 * NOTE!
	 *
	 * Commands like "git shortlog" will not accept the options below
	 * unless parse_revision_opt queues them (as opposed to erroring
	 * out).
	 *
	 * When implementing your new pseudo-option, remember to
	 * register it in the list at the top of handle_revision_opt.
	 */
1957 1958 1959 1960 1961 1962 1963
	if (!strcmp(arg, "--all")) {
		handle_refs(submodule, revs, *flags, for_each_ref_submodule);
		handle_refs(submodule, revs, *flags, head_ref_submodule);
	} else if (!strcmp(arg, "--branches")) {
		handle_refs(submodule, revs, *flags, for_each_branch_ref_submodule);
	} else if (!strcmp(arg, "--bisect")) {
		handle_refs(submodule, revs, *flags, for_each_bad_bisect_ref);
1964
		handle_refs(submodule, revs, *flags ^ (UNINTERESTING | BOTTOM), for_each_good_bisect_ref);
1965 1966 1967 1968 1969 1970 1971 1972 1973 1974 1975 1976 1977 1978 1979 1980 1981 1982 1983 1984 1985 1986 1987 1988 1989
		revs->bisect = 1;
	} else if (!strcmp(arg, "--tags")) {
		handle_refs(submodule, revs, *flags, for_each_tag_ref_submodule);
	} else if (!strcmp(arg, "--remotes")) {
		handle_refs(submodule, revs, *flags, for_each_remote_ref_submodule);
	} else if ((argcount = parse_long_opt("glob", argv, &optarg))) {
		struct all_refs_cb cb;
		init_all_refs_cb(&cb, revs, *flags);
		for_each_glob_ref(handle_one_ref, optarg, &cb);
		return argcount;
	} else if (!prefixcmp(arg, "--branches=")) {
		struct all_refs_cb cb;
		init_all_refs_cb(&cb, revs, *flags);
		for_each_glob_ref_in(handle_one_ref, arg + 11, "refs/heads/", &cb);
	} else if (!prefixcmp(arg, "--tags=")) {
		struct all_refs_cb cb;
		init_all_refs_cb(&cb, revs, *flags);
		for_each_glob_ref_in(handle_one_ref, arg + 7, "refs/tags/", &cb);
	} else if (!prefixcmp(arg, "--remotes=")) {
		struct all_refs_cb cb;
		init_all_refs_cb(&cb, revs, *flags);
		for_each_glob_ref_in(handle_one_ref, arg + 10, "refs/remotes/", &cb);
	} else if (!strcmp(arg, "--reflog")) {
		handle_reflog(revs, *flags);
	} else if (!strcmp(arg, "--not")) {
1990
		*flags ^= UNINTERESTING | BOTTOM;
1991
	} else if (!strcmp(arg, "--no-walk")) {
1992 1993 1994 1995 1996 1997 1998 1999 2000 2001 2002 2003
		revs->no_walk = REVISION_WALK_NO_WALK_SORTED;
	} else if (!prefixcmp(arg, "--no-walk=")) {
		/*
		 * Detached form ("--no-walk X" as opposed to "--no-walk=X")
		 * not allowed, since the argument is optional.
		 */
		if (!strcmp(arg + 10, "sorted"))
			revs->no_walk = REVISION_WALK_NO_WALK_SORTED;
		else if (!strcmp(arg + 10, "unsorted"))
			revs->no_walk = REVISION_WALK_NO_WALK_UNSORTED;
		else
			return error("invalid argument to --no-walk");
2004 2005 2006 2007 2008 2009 2010 2011 2012
	} else if (!strcmp(arg, "--do-walk")) {
		revs->no_walk = 0;
	} else {
		return 0;
	}

	return 1;
}

2013 2014 2015 2016
/*
 * Parse revision information, filling in the "rev_info" structure,
 * and removing the used arguments from the argument list.
 *
2017 2018
 * Returns the number of arguments left that weren't recognized
 * (which are also moved to the head of the argument list)
2019
 */
2020
int setup_revisions(int argc, const char **argv, struct rev_info *revs, struct setup_revision_opt *opt)
2021
{
2022
	int i, flags, left, seen_dashdash, read_from_stdin, got_rev_arg = 0, revarg_opt;
2023
	struct cmdline_pathspec prune_data;
2024 2025
	const char *submodule = NULL;

2026
	memset(&prune_data, 0, sizeof(prune_data));
2027 2028
	if (opt)
		submodule = opt->submodule;
2029 2030

	/* First, search for "--" */
2031
	if (opt && opt->assume_dashdash) {
2032
		seen_dashdash = 1;
2033 2034 2035 2036 2037 2038 2039 2040 2041 2042 2043 2044 2045
	} else {
		seen_dashdash = 0;
		for (i = 1; i < argc; i++) {
			const char *arg = argv[i];
			if (strcmp(arg, "--"))
				continue;
			argv[i] = NULL;
			argc = i;
			if (argv[i + 1])
				append_prune_data(&prune_data, argv + i + 1);
			seen_dashdash = 1;
			break;
		}
2046 2047
	}

2048 2049
	/* Second, deal with arguments and options */
	flags = 0;
2050 2051 2052
	revarg_opt = opt ? opt->revarg_opt : 0;
	if (seen_dashdash)
		revarg_opt |= REVARG_CANNOT_BE_FILENAME;
2053
	read_from_stdin = 0;
2054
	for (left = i = 1; i < argc; i++) {
2055 2056
		const char *arg = argv[i];
		if (*arg == '-') {
2057
			int opts;
2058

2059 2060 2061 2062 2063
			opts = handle_revision_pseudo_opt(submodule,
						revs, argc - i, argv + i,
						&flags);
			if (opts > 0) {
				i += opts - 1;
2064 2065
				continue;
			}
2066

2067 2068 2069 2070 2071 2072 2073
			if (!strcmp(arg, "--stdin")) {
				if (revs->disable_stdin) {
					argv[left++] = arg;
					continue;
				}
				if (read_from_stdin++)
					die("--stdin given twice?");
2074
				read_revisions_from_stdin(revs, &prune_data);
2075 2076
				continue;
			}
2077

2078
			opts = handle_revision_opt(revs, argc - i, argv + i, &left, argv);
2079 2080 2081 2082
			if (opts > 0) {
				i += opts - 1;
				continue;
			}
2083 2084
			if (opts < 0)
				exit(128);
2085 2086 2087
			continue;
		}

2088 2089

		if (handle_revision_arg(arg, revs, flags, revarg_opt)) {
2090 2091
			int j;
			if (seen_dashdash || *arg == '^')
2092 2093
				die("bad revision '%s'", arg);

2094 2095 2096 2097 2098 2099
			/* If we didn't have a "--":
			 * (1) all filenames must exist;
			 * (2) all rev-args must not be interpretable
			 *     as a valid filename.
			 * but the latter we have checked in the main loop.
			 */
2100
			for (j = i; j < argc; j++)
2101
				verify_filename(revs->prefix, argv[j], j == i);
2102

2103
			append_prune_data(&prune_data, argv + i);
2104 2105
			break;
		}
2106 2107
		else
			got_rev_arg = 1;
2108
	}
2109

2110
	if (prune_data.nr) {
2111 2112 2113 2114 2115 2116 2117 2118 2119 2120 2121 2122 2123 2124
		/*
		 * If we need to introduce the magic "a lone ':' means no
		 * pathspec whatsoever", here is the place to do so.
		 *
		 * if (prune_data.nr == 1 && !strcmp(prune_data[0], ":")) {
		 *	prune_data.nr = 0;
		 *	prune_data.alloc = 0;
		 *	free(prune_data.path);
		 *	prune_data.path = NULL;
		 * } else {
		 *	terminate prune_data.alloc with NULL and
		 *	call init_pathspec() to set revs->prune_data here.
		 * }
		 */
2125 2126
		ALLOC_GROW(prune_data.path, prune_data.nr+1, prune_data.alloc);
		prune_data.path[prune_data.nr++] = NULL;
2127 2128
		parse_pathspec(&revs->prune_data, 0, 0,
			       revs->prefix, prune_data.path);
2129
	}
2130

2131
	if (revs->def == NULL)
2132
		revs->def = opt ? opt->def : NULL;
J
Junio C Hamano 已提交
2133 2134
	if (opt && opt->tweak)
		opt->tweak(revs, opt);
2135
	if (revs->show_merge)
2136
		prepare_show_merge(revs);
2137
	if (revs->def && !revs->pending.nr && !got_rev_arg) {
2138
		unsigned char sha1[20];
2139
		struct object *object;
2140
		struct object_context oc;
2141
		if (get_sha1_with_context(revs->def, 0, sha1, &oc))
2142 2143
			die("bad default revision '%s'", revs->def);
		object = get_reference(revs, revs->def, sha1, 0);
2144
		add_pending_object_with_mode(revs, object, revs->def, oc.mode);
2145
	}
2146

2147 2148 2149 2150
	/* Did the user ask for any diff output? Run the diff! */
	if (revs->diffopt.output_format & ~DIFF_FORMAT_NO_OUTPUT)
		revs->diff = 1;

A
Arjen Laarhoven 已提交
2151 2152 2153 2154
	/* Pickaxe, diff-filter and rename following need diffs */
	if (revs->diffopt.pickaxe ||
	    revs->diffopt.filter ||
	    DIFF_OPT_TST(&revs->diffopt, FOLLOW_RENAMES))
2155 2156
		revs->diff = 1;

2157
	if (revs->topo_order)
2158 2159
		revs->limited = 1;

2160
	if (revs->prune_data.nr) {
2161
		copy_pathspec(&revs->pruning.pathspec, &revs->prune_data);
2162
		/* Can't prune commits with rename following: the paths change.. */
2163
		if (!DIFF_OPT_TST(&revs->diffopt, FOLLOW_RENAMES))
L
Linus Torvalds 已提交
2164
			revs->prune = 1;
2165
		if (!revs->full_diff)
2166 2167
			copy_pathspec(&revs->diffopt.pathspec,
				      &revs->prune_data);
2168
	}
J
Junio C Hamano 已提交
2169
	if (revs->combine_merges)
2170 2171
		revs->ignore_merges = 0;
	revs->diffopt.abbrev = revs->abbrev;
2172 2173 2174 2175 2176 2177

	if (revs->line_level_traverse) {
		revs->limited = 1;
		revs->topo_order = 1;
	}

T
Thomas Rast 已提交
2178
	diff_setup_done(&revs->diffopt);
2179

2180 2181
	grep_commit_pattern_type(GREP_PATTERN_TYPE_UNSPECIFIED,
				 &revs->grep_filter);
J
Jeff King 已提交
2182
	compile_grep_patterns(&revs->grep_filter);
2183

2184 2185
	if (revs->reverse && revs->reflog_info)
		die("cannot combine --reverse with --walk-reflogs");
2186
	if (revs->rewrite_parents && revs->children.name)
2187
		die("cannot combine --parents and --children");
2188

2189 2190 2191 2192 2193 2194 2195 2196
	/*
	 * Limitations on the graph functionality
	 */
	if (revs->reverse && revs->graph)
		die("cannot combine --reverse with --graph");

	if (revs->reflog_info && revs->graph)
		die("cannot combine --walk-reflogs with --graph");
2197 2198
	if (!revs->reflog_info && revs->grep_filter.use_reflog_filter)
		die("cannot use --grep-reflog without --walk-reflogs");
2199

2200 2201
	return left;
}
2202

2203 2204 2205 2206 2207 2208 2209 2210
/*
 * Record "child" in the children decoration of "parent".  The new list
 * node is chained in front of whatever add_decoration() hands back for
 * that parent.
 */
static void add_child(struct rev_info *revs, struct commit *parent, struct commit *child)
{
	struct commit_list *node;

	node = xcalloc(1, sizeof(*node));
	node->item = child;
	node->next = add_decoration(&revs->children, &parent->object, node);
}

2211
static int remove_duplicate_parents(struct rev_info *revs, struct commit *commit)
2212
{
2213
	struct treesame_state *ts = lookup_decoration(&revs->treesame, &commit->object);
2214 2215 2216 2217 2218
	struct commit_list **pp, *p;
	int surviving_parents;

	/* Examine existing parents while marking ones we have seen... */
	pp = &commit->parents;
2219
	surviving_parents = 0;
2220 2221 2222 2223
	while ((p = *pp) != NULL) {
		struct commit *parent = p->item;
		if (parent->object.flags & TMP_MARK) {
			*pp = p->next;
2224 2225
			if (ts)
				compact_treesame(revs, commit, surviving_parents);
2226 2227 2228
			continue;
		}
		parent->object.flags |= TMP_MARK;
2229
		surviving_parents++;
2230 2231
		pp = &p->next;
	}
2232
	/* clear the temporary mark */
2233 2234 2235
	for (p = commit->parents; p; p = p->next) {
		p->item->object.flags &= ~TMP_MARK;
	}
2236
	/* no update_treesame() - removing duplicates can't affect TREESAME */
2237 2238 2239
	return surviving_parents;
}

2240 2241 2242 2243 2244 2245 2246 2247 2248 2249 2250 2251 2252 2253 2254 2255
/*
 * Per-commit bookkeeping for merge simplification: the commit this one
 * has been simplified to, or NULL while that is not yet decided.
 */
struct merge_simplify_state {
	struct commit *simplified;
};

/*
 * Return the simplification state attached to "commit", creating a
 * zero-initialized one (and registering it in
 * revs->merge_simplification) on first use.
 */
static struct merge_simplify_state *locate_simplify_state(struct rev_info *revs, struct commit *commit)
{
	struct merge_simplify_state *state;

	state = lookup_decoration(&revs->merge_simplification, &commit->object);
	if (state)
		return state;

	state = xcalloc(1, sizeof(*state));
	add_decoration(&revs->merge_simplification, &commit->object, state);
	return state;
}

2256 2257 2258 2259 2260 2261 2262 2263 2264 2265 2266 2267 2268 2269 2270 2271 2272 2273 2274 2275 2276 2277 2278 2279 2280 2281 2282 2283 2284 2285 2286 2287 2288 2289 2290 2291
/*
 * Flag with TMP_MARK every parent of "commit" that reduce_heads() drops
 * from the parent list, and return how many were flagged.  Nothing is
 * removed here.
 */
static int mark_redundant_parents(struct rev_info *revs, struct commit *commit)
{
	struct commit_list *reduced = reduce_heads(commit->parents);
	struct commit_list *orig, *kept;
	int matched = 0, marked = 0;

	/* Want these for sanity-checking only */
	int orig_cnt = commit_list_count(commit->parents);
	int cnt = commit_list_count(reduced);

	/*
	 * Not ready to remove items yet, just mark them for now, based
	 * on the output of reduce_heads(). reduce_heads outputs the reduced
	 * set in its original order, so walking both lists in lockstep is
	 * enough to tell kept parents from dropped ones.
	 */
	kept = reduced;
	for (orig = commit->parents; orig; orig = orig->next) {
		if (kept && orig->item == kept->item) {
			kept = kept->next;
			matched++;
			continue;
		}
		orig->item->object.flags |= TMP_MARK;
		marked++;
	}

	if (matched != cnt || cnt + marked != orig_cnt)
		die("mark_redundant_parents %d %d %d %d", orig_cnt, cnt, matched, marked);

	free_commit_list(reduced);

	return marked;
}

2292 2293 2294 2295 2296 2297 2298 2299 2300 2301 2302 2303 2304 2305 2306 2307
/*
 * Flag with TMP_MARK every parent of "commit" that has no parents of its
 * own and carries the TREESAME flag.  Returns the number of parents
 * flagged by this call.
 */
static int mark_treesame_root_parents(struct rev_info *revs, struct commit *commit)
{
	struct commit_list *it;
	int marked = 0;

	for (it = commit->parents; it; it = it->next) {
		struct commit *parent = it->item;

		if (parent->parents)
			continue;
		if (!(parent->object.flags & TREESAME))
			continue;
		parent->object.flags |= TMP_MARK;
		marked++;
	}

	return marked;
}

2308 2309 2310 2311 2312 2313 2314 2315 2316 2317 2318 2319 2320 2321 2322 2323 2324 2325 2326 2327 2328 2329 2330 2331 2332 2333 2334 2335 2336 2337 2338 2339 2340 2341 2342 2343 2344 2345 2346 2347 2348 2349 2350 2351 2352 2353 2354 2355 2356 2357 2358 2359 2360 2361 2362 2363 2364 2365 2366 2367 2368 2369 2370 2371 2372 2373 2374
/*
 * Awkward naming - this means one parent we are TREESAME to.
 * cf mark_treesame_root_parents: root parents that are TREESAME (to an
 * empty tree). Better name suggestions?
 *
 * Returns 1 when a TMP_MARK was taken back off a parent, 0 otherwise.
 */
static int leave_one_treesame_to_parent(struct rev_info *revs, struct commit *commit)
{
	struct treesame_state *ts = lookup_decoration(&revs->treesame, &commit->object);
	struct commit *first_marked = NULL;
	struct commit_list *it;
	unsigned idx = 0;

	/*
	 * Scan the parents we are TREESAME to.  Remember the first one
	 * that is marked for deletion; an unmarked one means there is
	 * nothing to rescue.
	 */
	for (it = commit->parents; it; it = it->next, idx++) {
		if (!ts->treesame[idx])
			continue;
		if (!(it->item->object.flags & TMP_MARK))
			return 0;
		if (!first_marked)
			first_marked = it->item;
	}

	/*
	 * If we are TREESAME to a marked-for-deletion parent, but not to any
	 * unmarked parents, unmark the first TREESAME parent. This is the
	 * parent that the default simplify_history==1 scan would have followed,
	 * and it doesn't make sense to omit that path when asking for a
	 * simplified full history. Retaining it improves the chances of
	 * understanding odd missed merges that took an old version of a file.
	 *
	 * Example:
	 *
	 *   I--------*X       A modified the file, but mainline merge X used
	 *    \       /        "-s ours", so took the version from I. X is
	 *     `-*A--'         TREESAME to I and !TREESAME to A.
	 *
	 * Default log from X would produce "I". Without this check,
	 * --full-history --simplify-merges would produce "I-A-X", showing
	 * the merge commit X and that it changed A, but not making clear that
	 * it had just taken the I version. With this check, the topology above
	 * is retained.
	 *
	 * Note that it is possible that the simplification chooses a different
	 * TREESAME parent from the default, in which case this test doesn't
	 * activate, and we _do_ drop the default parent. Example:
	 *
	 *   I------X         A modified the file, but it was reverted in B,
	 *    \    /          meaning mainline merge X is TREESAME to both
	 *    *A-*B           parents.
	 *
	 * Default log would produce "I" by following the first parent;
	 * --full-history --simplify-merges will produce "I-A-B". But this is a
	 * reasonable result - it presents a logical full history leading from
	 * I to X, and X is not an important merge.
	 */
	if (!first_marked)
		return 0;

	first_marked->object.flags &= ~TMP_MARK;
	return 1;
}

2375 2376 2377 2378 2379 2380 2381 2382 2383 2384 2385 2386 2387 2388 2389 2390 2391 2392 2393 2394 2395 2396 2397 2398 2399 2400 2401 2402
/*
 * Unlink and free every parent of "commit" that carries TMP_MARK,
 * clearing the mark as it goes and compacting the treesame state for
 * each removal.  Returns the number of parents that remain.
 */
static int remove_marked_parents(struct rev_info *revs, struct commit *commit)
{
	struct commit_list **link = &commit->parents;
	struct commit_list *node;
	int kept = 0, removed = 0;

	while ((node = *link) != NULL) {
		struct commit *parent = node->item;

		if (!(parent->object.flags & TMP_MARK)) {
			link = &node->next;
			kept++;
			continue;
		}

		parent->object.flags &= ~TMP_MARK;
		*link = node->next;
		free(node);
		removed++;
		/* "kept" is the position the removed parent occupied */
		compact_treesame(revs, commit, kept);
	}

	/* Removing parents can only increase TREESAMEness */
	if (removed && !(commit->object.flags & TREESAME))
		update_treesame(revs, commit);

	return kept;
}

2403
static struct commit_list **simplify_one(struct rev_info *revs, struct commit *commit, struct commit_list **tail)
2404 2405
{
	struct commit_list *p;
2406
	struct commit *parent;
2407
	struct merge_simplify_state *st, *pst;
2408 2409
	int cnt;

2410 2411
	st = locate_simplify_state(revs, commit);

2412 2413 2414
	/*
	 * Have we handled this one?
	 */
2415
	if (st->simplified)
2416 2417 2418 2419 2420 2421 2422 2423
		return tail;

	/*
	 * An UNINTERESTING commit simplifies to itself, so does a
	 * root commit.  We do not rewrite parents of such commit
	 * anyway.
	 */
	if ((commit->object.flags & UNINTERESTING) || !commit->parents) {
2424
		st->simplified = commit;
2425 2426 2427 2428
		return tail;
	}

	/*
2429 2430 2431
	 * Do we know what commit all of our parents that matter
	 * should be rewritten to?  Otherwise we are not ready to
	 * rewrite this one yet.
2432 2433
	 */
	for (cnt = 0, p = commit->parents; p; p = p->next) {
2434 2435
		pst = locate_simplify_state(revs, p->item);
		if (!pst->simplified) {
2436 2437 2438
			tail = &commit_list_insert(p->item, tail)->next;
			cnt++;
		}
2439 2440
		if (revs->first_parent_only)
			break;
2441
	}
2442 2443
	if (cnt) {
		tail = &commit_list_insert(commit, tail)->next;
2444
		return tail;
2445
	}
2446 2447

	/*
2448 2449 2450
	 * Rewrite our list of parents. Note that this cannot
	 * affect our TREESAME flags in any way - a commit is
	 * always TREESAME to its simplification.
2451
	 */
2452 2453 2454
	for (p = commit->parents; p; p = p->next) {
		pst = locate_simplify_state(revs, p->item);
		p->item = pst->simplified;
2455 2456
		if (revs->first_parent_only)
			break;
2457
	}
2458

2459
	if (revs->first_parent_only)
2460
		cnt = 1;
2461
	else
2462
		cnt = remove_duplicate_parents(revs, commit);
2463 2464 2465 2466

	/*
	 * It is possible that we are a merge and one side branch
	 * does not have any commit that touches the given paths;
2467 2468
	 * in such a case, the immediate parent from that branch
	 * will be rewritten to be the merge base.
2469 2470 2471 2472 2473
	 *
	 *      o----X		X: the commit we are looking at;
	 *     /    /		o: a commit that touches the paths;
	 * ---o----'
	 *
2474 2475 2476 2477 2478 2479 2480 2481
	 * Further, a merge of an independent branch that doesn't
	 * touch the path will reduce to a treesame root parent:
	 *
	 *  ----o----X		X: the commit we are looking at;
	 *          /		o: a commit that touches the paths;
	 *         r		r: a root commit not touching the paths
	 *
	 * Detect and simplify both cases.
2482 2483
	 */
	if (1 < cnt) {
2484
		int marked = mark_redundant_parents(revs, commit);
2485
		marked += mark_treesame_root_parents(revs, commit);
2486 2487
		if (marked)
			marked -= leave_one_treesame_to_parent(revs, commit);
2488 2489
		if (marked)
			cnt = remove_marked_parents(revs, commit);
2490 2491 2492 2493 2494
	}

	/*
	 * A commit simplifies to itself if it is a root, if it is
	 * UNINTERESTING, if it touches the given paths, or if it is a
2495
	 * merge and its parents don't simplify to one relevant commit
2496 2497 2498
	 * (the first two cases are already handled at the beginning of
	 * this function).
	 *
2499 2500
	 * Otherwise, it simplifies to what its sole relevant parent
	 * simplifies to.
2501 2502 2503 2504
	 */
	if (!cnt ||
	    (commit->object.flags & UNINTERESTING) ||
	    !(commit->object.flags & TREESAME) ||
2505
	    (parent = one_relevant_parent(revs, commit->parents)) == NULL)
2506 2507
		st->simplified = commit;
	else {
2508
		pst = locate_simplify_state(revs, parent);
2509 2510
		st->simplified = pst->simplified;
	}
2511 2512 2513 2514 2515
	return tail;
}

static void simplify_merges(struct rev_info *revs)
{
2516
	struct commit_list *list, *next;
2517
	struct commit_list *yet_to_do, **tail;
2518
	struct commit *commit;
2519

2520 2521
	if (!revs->prune)
		return;
2522

2523 2524
	/* feed the list reversed */
	yet_to_do = NULL;
2525 2526 2527 2528 2529 2530 2531 2532 2533
	for (list = revs->commits; list; list = next) {
		commit = list->item;
		next = list->next;
		/*
		 * Do not free(list) here yet; the original list
		 * is used later in this function.
		 */
		commit_list_insert(commit, &yet_to_do);
	}
2534 2535 2536 2537 2538
	while (yet_to_do) {
		list = yet_to_do;
		yet_to_do = NULL;
		tail = &yet_to_do;
		while (list) {
2539 2540
			commit = list->item;
			next = list->next;
2541 2542
			free(list);
			list = next;
2543
			tail = simplify_one(revs, commit, tail);
2544 2545 2546 2547 2548 2549 2550 2551
		}
	}

	/* clean up the result, removing the simplified ones */
	list = revs->commits;
	revs->commits = NULL;
	tail = &revs->commits;
	while (list) {
2552
		struct merge_simplify_state *st;
2553 2554 2555

		commit = list->item;
		next = list->next;
2556 2557
		free(list);
		list = next;
2558 2559
		st = locate_simplify_state(revs, commit);
		if (st->simplified == commit)
2560 2561 2562 2563
			tail = &commit_list_insert(commit, tail)->next;
	}
}

2564 2565 2566 2567 2568 2569 2570 2571 2572 2573 2574 2575
/*
 * For every commit in revs->commits, register it as a child of each of
 * its parents via add_child().
 */
static void set_children(struct rev_info *revs)
{
	struct commit_list *entry, *parent;

	for (entry = revs->commits; entry; entry = entry->next) {
		struct commit *child = entry->item;

		for (parent = child->parents; parent; parent = parent->next)
			add_child(revs, parent->item, child);
	}
}

2576 2577 2578 2579 2580
/*
 * Clear the SEEN, ADDED and SHOWN object flags by way of
 * clear_object_flags().
 */
void reset_revision_walk(void)
{
	const unsigned walk_flags = SEEN | ADDED | SHOWN;

	clear_object_flags(walk_flags);
}

2581
int prepare_revision_walk(struct rev_info *revs)
2582
{
2583
	int nr = revs->pending.nr;
2584
	struct object_array_entry *e, *list;
2585
	struct commit_list **next = &revs->commits;
2586

2587
	e = list = revs->pending.objects;
2588 2589 2590 2591
	revs->pending.nr = 0;
	revs->pending.alloc = 0;
	revs->pending.objects = NULL;
	while (--nr >= 0) {
2592
		struct commit *commit = handle_commit(revs, e->item, e->name);
2593 2594 2595
		if (commit) {
			if (!(commit->object.flags & SEEN)) {
				commit->object.flags |= SEEN;
2596
				next = commit_list_append(commit, next);
2597 2598
			}
		}
2599
		e++;
2600
	}
R
René Scharfe 已提交
2601 2602
	if (!revs->leak_pending)
		free(list);
2603

2604
	/* Signal whether we need per-parent treesame decoration */
2605 2606
	if (revs->simplify_merges ||
	    (revs->limited && limiting_can_increase_treesame(revs)))
2607 2608
		revs->treesame.name = "treesame";

2609 2610
	if (revs->no_walk != REVISION_WALK_NO_WALK_UNSORTED)
		commit_list_sort_by_date(&revs->commits);
L
Linus Torvalds 已提交
2611
	if (revs->no_walk)
2612
		return 0;
2613
	if (revs->limited)
2614 2615
		if (limit_list(revs) < 0)
			return -1;
2616
	if (revs->topo_order)
J
Junio C Hamano 已提交
2617
		sort_in_topological_order(&revs->commits, revs->sort_order);
2618 2619
	if (revs->line_level_traverse)
		line_log_filter(revs);
2620 2621
	if (revs->simplify_merges)
		simplify_merges(revs);
2622 2623
	if (revs->children.name)
		set_children(revs);
2624
	return 0;
2625 2626
}

2627
static enum rewrite_result rewrite_one(struct rev_info *revs, struct commit **pp)
2628
{
2629 2630
	struct commit_list *cache = NULL;

2631 2632
	for (;;) {
		struct commit *p = *pp;
2633
		if (!revs->limited)
2634
			if (add_parents_to_list(revs, p, &revs->commits, &cache) < 0)
2635
				return rewrite_one_error;
2636 2637 2638
		if (p->object.flags & UNINTERESTING)
			return rewrite_one_ok;
		if (!(p->object.flags & TREESAME))
2639
			return rewrite_one_ok;
2640
		if (!p->parents)
2641
			return rewrite_one_noparents;
2642 2643 2644
		if ((p = one_relevant_parent(revs, p->parents)) == NULL)
			return rewrite_one_ok;
		*pp = p;
2645 2646 2647
	}
}

B
Bo Yang 已提交
2648 2649
/*
 * Rewrite each parent of "commit" through the "rewrite_parent" callback,
 * which may replace the parent in place.
 *
 * A parent for which the callback reports rewrite_one_noparents is
 * dropped from the list.  Duplicates left behind by the rewriting are
 * removed at the end.
 *
 * Returns 0 on success, or -1 as soon as the callback reports
 * rewrite_one_error (the parent list is then left partially rewritten).
 */
int rewrite_parents(struct rev_info *revs, struct commit *commit,
	rewrite_parent_fn_t rewrite_parent)
{
	struct commit_list **pp = &commit->parents;
	while (*pp) {
		struct commit_list *parent = *pp;
		switch (rewrite_parent(revs, &parent->item)) {
		case rewrite_one_ok:
			break;
		case rewrite_one_noparents:
			/*
			 * Unlink the node and release it so that the list
			 * entry is not leaked.
			 */
			*pp = parent->next;
			free(parent);
			continue;
		case rewrite_one_error:
			return -1;
		}
		pp = &parent->next;
	}
	remove_duplicate_parents(revs, commit);
	return 0;
}

2669 2670 2671 2672 2673 2674 2675 2676 2677 2678 2679 2680 2681 2682 2683 2684 2685 2686 2687 2688 2689 2690 2691 2692 2693 2694 2695 2696 2697 2698 2699 2700 2701 2702 2703 2704 2705 2706 2707 2708 2709 2710 2711 2712 2713
static int commit_rewrite_person(struct strbuf *buf, const char *what, struct string_list *mailmap)
{
	char *person, *endp;
	size_t len, namelen, maillen;
	const char *name;
	const char *mail;
	struct ident_split ident;

	person = strstr(buf->buf, what);
	if (!person)
		return 0;

	person += strlen(what);
	endp = strchr(person, '\n');
	if (!endp)
		return 0;

	len = endp - person;

	if (split_ident_line(&ident, person, len))
		return 0;

	mail = ident.mail_begin;
	maillen = ident.mail_end - ident.mail_begin;
	name = ident.name_begin;
	namelen = ident.name_end - ident.name_begin;

	if (map_user(mailmap, &mail, &maillen, &name, &namelen)) {
		struct strbuf namemail = STRBUF_INIT;

		strbuf_addf(&namemail, "%.*s <%.*s>",
			    (int)namelen, name, (int)maillen, mail);

		strbuf_splice(buf, ident.name_begin - buf->buf,
			      ident.mail_end - ident.name_begin + 1,
			      namemail.buf, namemail.len);

		strbuf_release(&namemail);

		return 1;
	}

	return 0;
}

2714 2715
static int commit_match(struct commit *commit, struct rev_info *opt)
{
2716
	int retval;
2717 2718
	const char *encoding;
	char *message;
2719
	struct strbuf buf = STRBUF_INIT;
2720

2721
	if (!opt->grep_filter.pattern_list && !opt->grep_filter.header_list)
2722
		return 1;
2723 2724 2725

	/* Prepend "fake" headers as needed */
	if (opt->grep_filter.use_reflog_filter) {
2726 2727 2728 2729
		strbuf_addstr(&buf, "reflog ");
		get_reflog_message(&buf, opt->reflog_info);
		strbuf_addch(&buf, '\n');
	}
2730

2731 2732 2733 2734 2735 2736 2737 2738
	/*
	 * We grep in the user's output encoding, under the assumption that it
	 * is the encoding they are most likely to write their grep pattern
	 * for. In addition, it means we will match the "notes" encoding below,
	 * so we will not end up with a buffer that has two different encodings
	 * in it.
	 */
	encoding = get_log_output_encoding();
2739
	message = logmsg_reencode(commit, NULL, encoding);
2740

2741 2742
	/* Copy the commit to temporary if we are using "fake" headers */
	if (buf.len)
2743
		strbuf_addstr(&buf, message);
2744

2745
	if (opt->grep_filter.header_list && opt->mailmap) {
2746
		if (!buf.len)
2747
			strbuf_addstr(&buf, message);
2748 2749 2750 2751 2752

		commit_rewrite_person(&buf, "\nauthor ", opt->mailmap);
		commit_rewrite_person(&buf, "\ncommitter ", opt->mailmap);
	}

2753 2754 2755
	/* Append "fake" message parts as needed */
	if (opt->show_notes) {
		if (!buf.len)
2756 2757
			strbuf_addstr(&buf, message);
		format_display_notes(commit->object.sha1, &buf, encoding, 1);
2758 2759
	}

2760
	/* Find either in the original commit message, or in the temporary */
2761 2762 2763 2764
	if (buf.len)
		retval = grep_buffer(&opt->grep_filter, buf.buf, buf.len);
	else
		retval = grep_buffer(&opt->grep_filter,
2765
				     message, strlen(message));
2766
	strbuf_release(&buf);
2767
	logmsg_free(message, commit);
2768
	return retval;
2769 2770
}

2771
static inline int want_ancestry(const struct rev_info *revs)
2772
{
2773
	return (revs->rewrite_parents || revs->children.name);
2774 2775
}

2776
enum commit_action get_commit_action(struct rev_info *revs, struct commit *commit)
L
Linus Torvalds 已提交
2777 2778 2779
{
	if (commit->object.flags & SHOWN)
		return commit_ignore;
2780
	if (revs->unpacked && has_sha1_pack(commit->object.sha1))
L
Linus Torvalds 已提交
2781
		return commit_ignore;
2782 2783
	if (revs->show_all)
		return commit_show;
L
Linus Torvalds 已提交
2784 2785 2786 2787
	if (commit->object.flags & UNINTERESTING)
		return commit_ignore;
	if (revs->min_age != -1 && (commit->date > revs->min_age))
		return commit_ignore;
2788
	if (revs->min_parents || (revs->max_parents >= 0)) {
2789
		int n = commit_list_count(commit->parents);
2790 2791 2792 2793
		if ((n < revs->min_parents) ||
		    ((revs->max_parents >= 0) && (n > revs->max_parents)))
			return commit_ignore;
	}
L
Linus Torvalds 已提交
2794 2795
	if (!commit_match(commit, revs))
		return commit_ignore;
L
Linus Torvalds 已提交
2796
	if (revs->prune && revs->dense) {
L
Linus Torvalds 已提交
2797
		/* Commit without changes? */
2798
		if (commit->object.flags & TREESAME) {
2799 2800
			int n;
			struct commit_list *p;
L
Linus Torvalds 已提交
2801
			/* drop merges unless we want parenthood */
2802
			if (!want_ancestry(revs))
L
Linus Torvalds 已提交
2803
				return commit_ignore;
2804 2805 2806 2807 2808 2809 2810 2811 2812 2813 2814 2815
			/*
			 * If we want ancestry, then need to keep any merges
			 * between relevant commits to tie together topology.
			 * For consistency with TREESAME and simplification
			 * use "relevant" here rather than just INTERESTING,
			 * to treat bottom commit(s) as part of the topology.
			 */
			for (n = 0, p = commit->parents; p; p = p->next)
				if (relevant_commit(p->item))
					if (++n >= 2)
						return commit_show;
			return commit_ignore;
L
Linus Torvalds 已提交
2816 2817 2818 2819 2820
		}
	}
	return commit_show;
}

2821 2822 2823 2824 2825 2826 2827
enum commit_action simplify_commit(struct rev_info *revs, struct commit *commit)
{
	enum commit_action action = get_commit_action(revs, commit);

	if (action == commit_show &&
	    !revs->show_all &&
	    revs->prune && revs->dense && want_ancestry(revs)) {
2828 2829 2830 2831 2832 2833 2834 2835
		/*
		 * --full-diff on simplified parents is no good: it
		 * will show spurious changes from the commits that
		 * were elided.  So we save the parents on the side
		 * when --full-diff is in effect.
		 */
		if (revs->full_diff)
			save_parents(revs, commit);
B
Bo Yang 已提交
2836
		if (rewrite_parents(revs, commit, rewrite_one) < 0)
2837 2838 2839 2840 2841
			return commit_error;
	}
	return action;
}

J
Junio C Hamano 已提交
2842
static struct commit *get_revision_1(struct rev_info *revs)
2843
{
J
Junio C Hamano 已提交
2844
	if (!revs->commits)
2845 2846
		return NULL;

2847
	do {
L
Linus Torvalds 已提交
2848 2849
		struct commit_list *entry = revs->commits;
		struct commit *commit = entry->item;
2850

L
Linus Torvalds 已提交
2851 2852
		revs->commits = entry->next;
		free(entry);
2853

2854
		if (revs->reflog_info) {
2855
			save_parents(revs, commit);
2856
			fake_reflog_parent(revs->reflog_info, commit);
2857 2858
			commit->object.flags &= ~(ADDED | SEEN | SHOWN);
		}
2859

2860 2861
		/*
		 * If we haven't done the list limiting, we need to look at
2862 2863
		 * the parents here. We also need to do the date-based limiting
		 * that we'd otherwise have done in limit_list().
2864
		 */
2865
		if (!revs->limited) {
2866
			if (revs->max_age != -1 &&
2867 2868
			    (commit->date < revs->max_age))
				continue;
2869 2870 2871 2872 2873
			if (add_parents_to_list(revs, commit, &revs->commits, NULL) < 0) {
				if (!revs->ignore_missing_links)
					die("Failed to traverse parents of commit %s",
						sha1_to_hex(commit->object.sha1));
			}
2874
		}
2875

L
Linus Torvalds 已提交
2876 2877
		switch (simplify_commit(revs, commit)) {
		case commit_ignore:
2878
			continue;
L
Linus Torvalds 已提交
2879
		case commit_error:
2880 2881
			die("Failed to simplify parents of commit %s",
			    sha1_to_hex(commit->object.sha1));
L
Linus Torvalds 已提交
2882 2883
		default:
			return commit;
J
Junio C Hamano 已提交
2884
		}
2885 2886 2887
	} while (revs->commits);
	return NULL;
}
J
Junio C Hamano 已提交
2888

2889 2890 2891 2892 2893
/*
 * Return true for entries that have not yet been shown.  (This is an
 * object_array_each_func_t.)
 */
static int entry_unshown(struct object_array_entry *entry, void *cb_data_unused)
2894
{
2895 2896
	return !(entry->item->flags & SHOWN);
}
2897

2898 2899 2900 2901 2902 2903 2904 2905
/*
 * When the array is completely full (nr == alloc), i.e. the next
 * addition would have to grow it, first discard the entries that have
 * already been shown to try to free up some space.
 */
static void gc_boundary(struct object_array *array)
{
	if (array->nr != array->alloc)
		return;
	object_array_filter(array, entry_unshown, NULL);
}

2908 2909 2910 2911 2912 2913 2914 2915 2916 2917 2918 2919 2920 2921 2922 2923 2924 2925 2926 2927 2928 2929 2930 2931 2932 2933 2934 2935 2936 2937 2938 2939 2940 2941 2942 2943 2944 2945
/*
 * Replace revs->commits with the list of boundary commits collected in
 * revs->boundary_commits, marking each selected commit BOUNDARY, and
 * sort the result with sort_in_topological_order().
 */
static void create_boundary_commit_list(struct rev_info *revs)
{
	struct object_array *pending = &revs->boundary_commits;
	struct object_array_entry *entries = pending->objects;
	unsigned idx;

	/*
	 * A non-empty revs->commits here means get_revision_1() stopped
	 * because of an error.  The leftover list is discarded and the
	 * boundary commits are printed regardless, which is how this code
	 * has always behaved.
	 */
	if (revs->commits) {
		free_commit_list(revs->commits);
		revs->commits = NULL;
	}

	/*
	 * Move the real boundary commits into revs->commits: a candidate
	 * qualifies only if one of its children was shown (CHILD_SHOWN)
	 * and it has neither been shown itself nor already been marked
	 * as a boundary.
	 */
	for (idx = 0; idx < pending->nr; idx++) {
		struct commit *candidate = (struct commit *)entries[idx].item;

		if (!candidate ||
		    !(candidate->object.flags & CHILD_SHOWN) ||
		    (candidate->object.flags & (SHOWN | BOUNDARY)))
			continue;
		candidate->object.flags |= BOUNDARY;
		commit_list_insert(candidate, &revs->commits);
	}

	/*
	 * The sort is applied unconditionally; revs->sort_order selects
	 * the ordering that is used.
	 */
	sort_in_topological_order(&revs->commits, revs->sort_order);
}

2949
static struct commit *get_revision_internal(struct rev_info *revs)
J
Junio C Hamano 已提交
2950 2951
{
	struct commit *c = NULL;
2952 2953 2954
	struct commit_list *l;

	if (revs->boundary == 2) {
2955 2956 2957 2958 2959 2960 2961 2962 2963
		/*
		 * All of the normal commits have already been returned,
		 * and we are now returning boundary commits.
		 * create_boundary_commit_list() has populated
		 * revs->commits with the remaining commits to return.
		 */
		c = pop_commit(&revs->commits);
		if (c)
			c->object.flags |= SHOWN;
2964 2965 2966
		return c;
	}

2967
	/*
2968 2969 2970 2971 2972 2973 2974 2975
	 * If our max_count counter has reached zero, then we are done. We
	 * don't simply return NULL because we still might need to show
	 * boundary commits. But we want to avoid calling get_revision_1, which
	 * might do a considerable amount of work finding the next commit only
	 * for us to throw it away.
	 *
	 * If it is non-zero, then either we don't have a max_count at all
	 * (-1), or it is still counting, in which case we decrement.
2976
	 */
2977 2978 2979 2980 2981 2982 2983 2984 2985
	if (revs->max_count) {
		c = get_revision_1(revs);
		if (c) {
			while (0 < revs->skip_count) {
				revs->skip_count--;
				c = get_revision_1(revs);
				if (!c)
					break;
			}
2986
		}
2987

2988 2989
		if (revs->max_count > 0)
			revs->max_count--;
J
Junio C Hamano 已提交
2990
	}
2991

2992 2993 2994 2995
	if (c)
		c->object.flags |= SHOWN;

	if (!revs->boundary) {
J
Junio C Hamano 已提交
2996
		return c;
2997
	}
2998 2999 3000 3001 3002 3003 3004 3005

	if (!c) {
		/*
		 * get_revision_1() runs out the commits, and
		 * we are done computing the boundaries.
		 * switch to boundary commits output mode.
		 */
		revs->boundary = 2;
3006 3007 3008 3009 3010 3011 3012

		/*
		 * Update revs->commits to contain the list of
		 * boundary commits.
		 */
		create_boundary_commit_list(revs);

3013
		return get_revision_internal(revs);
3014 3015 3016 3017 3018 3019 3020 3021 3022 3023 3024 3025
	}

	/*
	 * boundary commits are the commits that are parents of the
	 * ones we got from get_revision_1() but they themselves are
	 * not returned from get_revision_1().  Before returning
	 * 'c', we need to mark its parents that they could be boundaries.
	 */

	for (l = c->parents; l; l = l->next) {
		struct object *p;
		p = &(l->item->object);
3026
		if (p->flags & (CHILD_SHOWN | SHOWN))
3027 3028 3029 3030 3031 3032 3033
			continue;
		p->flags |= CHILD_SHOWN;
		gc_boundary(&revs->boundary_commits);
		add_object_array(p, NULL, &revs->boundary_commits);
	}

	return c;
J
Junio C Hamano 已提交
3034
}
3035 3036 3037

/*
 * Public entry point of the walk: return the next commit, or NULL when
 * the walk is finished.
 *
 * With revs->reverse set, the first call drains the whole walk into a
 * list built by prepending (so it ends up reversed), stores it in
 * revs->commits and switches to the reverse output stage; from then on
 * commits are simply popped off that list.
 *
 * Otherwise each commit is passed to graph_update() when revs->graph is
 * set, and free_saved_parents() is called once the walk is exhausted.
 */
struct commit *get_revision(struct rev_info *revs)
{
	struct commit *next;

	if (revs->reverse) {
		struct commit_list *collected = NULL;

		for (next = get_revision_internal(revs);
		     next;
		     next = get_revision_internal(revs))
			commit_list_insert(next, &collected);

		revs->commits = collected;
		revs->reverse = 0;
		revs->reverse_output_stage = 1;
	}

	if (revs->reverse_output_stage)
		return pop_commit(&revs->commits);

	next = get_revision_internal(revs);
	if (!next) {
		free_saved_parents(revs);
		return NULL;
	}
	if (revs->graph)
		graph_update(revs->graph, next);
	return next;
}
3061 3062 3063 3064 3065 3066 3067

char *get_revision_mark(const struct rev_info *revs, const struct commit *commit)
{
	if (commit->object.flags & BOUNDARY)
		return "-";
	else if (commit->object.flags & UNINTERESTING)
		return "^";
3068 3069
	else if (commit->object.flags & PATCHSAME)
		return "=";
3070 3071 3072 3073 3074 3075 3076
	else if (!revs || revs->left_right) {
		if (commit->object.flags & SYMMETRIC_LEFT)
			return "<";
		else
			return ">";
	} else if (revs->graph)
		return "*";
3077 3078
	else if (revs->cherry_mark)
		return "+";
3079 3080
	return "";
}
3081 3082 3083 3084 3085 3086 3087 3088 3089

/*
 * Write the commit's marker (as chosen by get_revision_mark()) to
 * stdout followed by a single space.  Writes nothing at all when the
 * marker is the empty string.
 */
void put_revision_mark(const struct rev_info *revs, const struct commit *commit)
{
	const char *mark = get_revision_mark(revs, commit);

	if (mark[0] == '\0')
		return;
	fputs(mark, stdout);
	putchar(' ');
}
3090 3091 3092

/*
 * Instantiate a commit slab named "saved_parents" that associates one
 * "struct commit_list *" with each commit.  The functions below rely on
 * struct saved_parents, init_saved_parents(), saved_parents_at() and
 * clear_saved_parents(); presumably all of these are generated by this
 * macro invocation (confirm against commit-slab.h).
 */
define_commit_slab(saved_parents, struct commit_list *);

3093 3094
/*
 * Sentinel stored in a saved_parents slot to record "parents were saved
 * and the list was empty", as opposed to a NULL slot, which means
 * "nothing saved yet".  get_saved_parents() translates it back to NULL;
 * it must never be dereferenced.
 */
#define EMPTY_PARENT_LIST ((struct commit_list *)-1)

3095 3096 3097 3098 3099 3100 3101 3102 3103 3104
/*
 * Record a copy of commit->parents in revs->saved_parents_slab,
 * creating and initializing the slab on first use.  Only the first call
 * for a given commit stores anything; later calls leave the saved copy
 * untouched.
 */
void save_parents(struct rev_info *revs, struct commit *commit)
{
	struct commit_list **slot;

	if (!revs->saved_parents_slab) {
		revs->saved_parents_slab = xmalloc(sizeof(struct saved_parents));
		init_saved_parents(revs->saved_parents_slab);
	}

	slot = saved_parents_at(revs->saved_parents_slab, commit);

	/*
	 * A reflog walk can reach the same commit more than once (once
	 * per reflog appearance), so this function may run repeatedly
	 * for one commit.  Only the first set of parents is kept.  An
	 * empty parent list is stored as EMPTY_PARENT_LIST rather than
	 * NULL so that it can be told apart from a slot that has not
	 * been filled in yet.
	 */
	if (!*slot)
		*slot = commit->parents ? copy_commit_list(commit->parents)
					: EMPTY_PARENT_LIST;
}

struct commit_list *get_saved_parents(struct rev_info *revs, const struct commit *commit)
{
3125 3126
	struct commit_list *parents;

3127 3128 3129
	if (!revs->saved_parents_slab)
		return commit->parents;

3130 3131 3132 3133
	parents = *saved_parents_at(revs->saved_parents_slab, commit);
	if (parents == EMPTY_PARENT_LIST)
		return NULL;
	return parents;
3134 3135 3136 3137 3138 3139 3140
}

/*
 * Clear the saved-parents slab, if one was ever created.
 *
 * Only clear_saved_parents() is invoked: the slab structure allocated
 * in save_parents() is not freed here and revs->saved_parents_slab is
 * left pointing at it.
 * NOTE(review): whether the copied parent lists stored in the slab are
 * released depends on clear_saved_parents(); verify in commit-slab.h.
 */
void free_saved_parents(struct rev_info *revs)
{
	if (!revs->saved_parents_slab)
		return;
	clear_saved_parents(revs->saved_parents_slab);
}