revision.c 82.8 KB
Newer Older
1 2 3 4 5
#include "cache.h"
#include "tag.h"
#include "blob.h"
#include "tree.h"
#include "commit.h"
6
#include "diff.h"
7 8
#include "refs.h"
#include "revision.h"
9
#include "graph.h"
10
#include "grep.h"
11
#include "reflog-walk.h"
J
Junio C Hamano 已提交
12
#include "patch-ids.h"
13
#include "decorate.h"
14
#include "log-tree.h"
15
#include "string-list.h"
16
#include "mailmap.h"
17

18 19
/*
 * Global hook of type show_early_output_fn_t.
 * NOTE(review): declared volatile, presumably because it can be changed
 * asynchronously while a walk is in progress -- confirm against callers.
 */
volatile show_early_output_fn_t show_early_output;

20
char *path_name(const struct name_path *path, const char *name)
21
{
22
	const struct name_path *p;
23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43
	char *n, *m;
	int nlen = strlen(name);
	int len = nlen + 1;

	for (p = path; p; p = p->up) {
		if (p->elem_len)
			len += p->elem_len + 1;
	}
	n = xmalloc(len);
	m = n + len - (nlen + 1);
	strcpy(m, name);
	for (p = path; p; p = p->up) {
		if (p->elem_len) {
			m -= p->elem_len + 1;
			memcpy(m, p->elem, p->elem_len);
			m[p->elem_len] = '/';
		}
	}
	return n;
}

44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
/*
 * Write up to "len" bytes of "name" to "out".
 *
 * Returns "len" when all bytes were written.  If a NUL or a newline is
 * met first, the bytes before it have already been written and -1 is
 * returned.
 */
static int show_path_component_truncated(FILE *out, const char *name, int len)
{
	int idx = 0;

	while (idx < len) {
		const char c = name[idx++];

		if (c == '\0' || c == '\n')
			return -1;
		fputc(c, out);
	}
	return len;
}

/*
 * Print the chain "path" root-first, separating components with '/'.
 *
 * Returns a negative value as soon as a component was cut short by
 * show_path_component_truncated(); otherwise 1 if anything was printed
 * for this chain and 0 if nothing was.
 */
static int show_path_truncated(FILE *out, const struct name_path *path)
{
	int above, here;

	if (path == NULL)
		return 0;

	/* Ancestors first, so the output reads root-to-leaf. */
	above = show_path_truncated(out, path->up);
	if (above < 0)
		return above;
	if (above != 0)
		fputc('/', out);

	here = show_path_component_truncated(out, path->elem, path->elem_len);
	if (here < 0)
		return here;
	return (here != 0 || above != 0) ? 1 : 0;
}

73 74
void show_object_with_name(FILE *out, struct object *obj, const struct name_path *path, const char *component)
{
75 76 77 78
	struct name_path leaf;
	leaf.up = (struct name_path *)path;
	leaf.elem = component;
	leaf.elem_len = strlen(component);
79

80 81 82
	fprintf(out, "%s ", sha1_to_hex(obj->sha1));
	show_path_truncated(out, &leaf);
	fputc('\n', out);
83 84
}

85 86 87 88
/*
 * Append obj to the object array p, labelled with the full path that
 * path_name(path, name) builds.  The freshly allocated path string is
 * handed to add_object_array().
 */
void add_object(struct object *obj,
		struct object_array *p,
		struct name_path *path,
		const char *name)
{
	add_object_array(obj, path_name(path, name), p);
}

/* Set the UNINTERESTING flag on blob; a NULL blob is ignored. */
static void mark_blob_uninteresting(struct blob *blob)
{
	if (!blob)
		return;
	if (blob->object.flags & UNINTERESTING)
		return;
	blob->object.flags |= UNINTERESTING;
}

void mark_tree_uninteresting(struct tree *tree)
{
104
	struct tree_desc desc;
105
	struct name_entry entry;
106 107
	struct object *obj = &tree->object;

108 109
	if (!tree)
		return;
110 111 112 113 114 115 116
	if (obj->flags & UNINTERESTING)
		return;
	obj->flags |= UNINTERESTING;
	if (!has_sha1_file(obj->sha1))
		return;
	if (parse_tree(tree) < 0)
		die("bad tree %s", sha1_to_hex(obj->sha1));
117

118
	init_tree_desc(&desc, tree->buffer, tree->size);
119
	while (tree_entry(&desc, &entry)) {
120 121
		switch (object_type(entry.mode)) {
		case OBJ_TREE:
122
			mark_tree_uninteresting(lookup_tree(entry.sha1));
123 124
			break;
		case OBJ_BLOB:
125
			mark_blob_uninteresting(lookup_blob(entry.sha1));
126 127 128 129 130
			break;
		default:
			/* Subproject commit - not in this repository */
			break;
		}
131
	}
132 133 134 135 136 137 138

	/*
	 * We don't care about the tree any more
	 * after it has been marked uninteresting.
	 */
	free(tree->buffer);
	tree->buffer = NULL;
139 140 141 142
}

void mark_parents_uninteresting(struct commit *commit)
{
143 144 145 146
	struct commit_list *parents = NULL, *l;

	for (l = commit->parents; l; l = l->next)
		commit_list_insert(l->item, &parents);
147 148 149

	while (parents) {
		struct commit *commit = parents->item;
150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168
		l = parents;
		parents = parents->next;
		free(l);

		while (commit) {
			/*
			 * A missing commit is ok iff its parent is marked
			 * uninteresting.
			 *
			 * We just mark such a thing parsed, so that when
			 * it is popped next time around, we won't be trying
			 * to parse it and get an error.
			 */
			if (!has_sha1_file(commit->object.sha1))
				commit->object.parsed = 1;

			if (commit->object.flags & UNINTERESTING)
				break;

169
			commit->object.flags |= UNINTERESTING;
170

171 172 173 174 175 176 177 178
			/*
			 * Normally we haven't parsed the parent
			 * yet, so we won't have a parent of a parent
			 * here. However, it may turn out that we've
			 * reached this commit some other way (where it
			 * wasn't uninteresting), in which case we need
			 * to mark its parents recursively too..
			 */
179 180
			if (!commit->parents)
				break;
181

182 183 184 185
			for (l = commit->parents->next; l; l = l->next)
				commit_list_insert(l->item, &parents);
			commit = commit->parents->item;
		}
186 187 188
	}
}

J
Junio C Hamano 已提交
189
static void add_pending_object_with_mode(struct rev_info *revs, struct object *obj, const char *name, unsigned mode)
190
{
J
Junio C Hamano 已提交
191 192
	if (!obj)
		return;
L
Linus Torvalds 已提交
193
	if (revs->no_walk && (obj->flags & UNINTERESTING))
L
Linus Torvalds 已提交
194
		revs->no_walk = 0;
J
Junio C Hamano 已提交
195 196 197 198 199 200 201 202 203 204 205 206 207 208
	if (revs->reflog_info && obj->type == OBJ_COMMIT) {
		struct strbuf buf = STRBUF_INIT;
		int len = interpret_branch_name(name, &buf);
		int st;

		if (0 < len && name[len] && buf.len)
			strbuf_addstr(&buf, name + len);
		st = add_reflog_for_walk(revs->reflog_info,
					 (struct commit *)obj,
					 buf.buf[0] ? buf.buf: name);
		strbuf_release(&buf);
		if (st)
			return;
	}
209
	add_object_array_with_mode(obj, name, &revs->pending, mode);
210 211
}

J
Junio C Hamano 已提交
212 213 214 215 216
/*
 * Queue obj on revs->pending under "name", using S_IFINVALID as the mode.
 * See add_pending_object_with_mode() for the handling of NULL objects,
 * no_walk and reflog walking.
 */
void add_pending_object(struct rev_info *revs, struct object *obj, const char *name)
{
	add_pending_object_with_mode(revs, obj, name, S_IFINVALID);
}

217 218 219 220 221 222 223 224 225 226 227 228
void add_head_to_pending(struct rev_info *revs)
{
	unsigned char sha1[20];
	struct object *obj;
	if (get_sha1("HEAD", sha1))
		return;
	obj = parse_object(sha1);
	if (!obj)
		return;
	add_pending_object(revs, obj, "HEAD");
}

229
static struct object *get_reference(struct rev_info *revs, const char *name, const unsigned char *sha1, unsigned int flags)
230 231 232 233
{
	struct object *object;

	object = parse_object(sha1);
J
Junio C Hamano 已提交
234 235 236
	if (!object) {
		if (revs->ignore_missing)
			return object;
237
		die("bad object %s", name);
J
Junio C Hamano 已提交
238
	}
239 240 241 242
	object->flags |= flags;
	return object;
}

243 244 245 246 247 248 249
/*
 * Look up the object for sha1 via get_reference() (which applies "flags")
 * and queue it as pending under "name".  A NULL result from
 * get_reference() is passed straight on to add_pending_object().
 */
void add_pending_sha1(struct rev_info *revs, const char *name,
		      const unsigned char *sha1, unsigned int flags)
{
	add_pending_object(revs, get_reference(revs, name, sha1, flags), name);
}

250 251 252
static struct commit *handle_commit(struct rev_info *revs, struct object *object, const char *name)
{
	unsigned long flags = object->flags;
253 254 255 256

	/*
	 * Tag object? Look what it points to..
	 */
257
	while (object->type == OBJ_TAG) {
258
		struct tag *tag = (struct tag *) object;
259
		if (revs->tag_objects && !(flags & UNINTERESTING))
260
			add_pending_object(revs, object, tag->tag);
261 262
		if (!tag->tagged)
			die("bad tag");
263
		object = parse_object(tag->tagged->sha1);
264 265 266
		if (!object) {
			if (flags & UNINTERESTING)
				return NULL;
267
			die("bad object %s", sha1_to_hex(tag->tagged->sha1));
268
		}
269 270 271 272 273 274
	}

	/*
	 * Commit object? Just return it, we'll do all the complex
	 * reachability crud.
	 */
275
	if (object->type == OBJ_COMMIT) {
276 277 278
		struct commit *commit = (struct commit *)object;
		if (parse_commit(commit) < 0)
			die("unable to parse commit %s", name);
279
		if (flags & UNINTERESTING) {
280
			commit->object.flags |= UNINTERESTING;
281
			mark_parents_uninteresting(commit);
282 283
			revs->limited = 1;
		}
284 285
		if (revs->show_source && !commit->util)
			commit->util = (void *) name;
286 287 288 289
		return commit;
	}

	/*
M
Mike Ralphson 已提交
290
	 * Tree object? Either mark it uninteresting, or add it
291 292
	 * to the list of objects to look at later..
	 */
293
	if (object->type == OBJ_TREE) {
294 295 296 297 298 299 300 301 302 303 304 305 306 307
		struct tree *tree = (struct tree *)object;
		if (!revs->tree_objects)
			return NULL;
		if (flags & UNINTERESTING) {
			mark_tree_uninteresting(tree);
			return NULL;
		}
		add_pending_object(revs, object, "");
		return NULL;
	}

	/*
	 * Blob object? You know the drill by now..
	 */
308
	if (object->type == OBJ_BLOB) {
309 310 311 312 313 314 315 316 317 318 319 320 321
		struct blob *blob = (struct blob *)object;
		if (!revs->blob_objects)
			return NULL;
		if (flags & UNINTERESTING) {
			mark_blob_uninteresting(blob);
			return NULL;
		}
		add_pending_object(revs, object, "");
		return NULL;
	}
	die("%s is unknown object", name);
}

322 323 324 325 326 327 328 329 330 331 332 333 334
/*
 * Return 1 if every commit on the list carries UNINTERESTING (an empty
 * list counts as "everybody"), 0 as soon as one does not.
 */
static int everybody_uninteresting(struct commit_list *orig)
{
	struct commit_list *node;

	for (node = orig; node; node = node->next) {
		if (!(node->item->object.flags & UNINTERESTING))
			return 0;
	}
	return 1;
}

335 336 337 338 339 340 341 342 343 344 345 346 347 348 349 350 351 352 353 354 355 356 357 358 359 360 361 362 363 364 365 366 367 368 369 370 371 372 373 374 375 376 377 378 379 380 381 382 383 384 385 386 387 388 389 390 391 392 393 394 395 396 397 398 399 400 401 402 403 404 405 406 407 408
/*
 * A definition of "relevant" commit that we can use to simplify limited graphs
 * by eliminating side branches.
 *
 * A "relevant" commit is one that is !UNINTERESTING (ie we are including it
 * in our list), or that is a specified BOTTOM commit. Then after computing
 * a limited list, during processing we can generally ignore boundary merges
 * coming from outside the graph, (ie from irrelevant parents), and treat
 * those merges as if they were single-parent. TREESAME is defined to consider
 * only relevant parents, if any. If we are TREESAME to our on-graph parents,
 * we don't care if we were !TREESAME to non-graph parents.
 *
 * Treating bottom commits as relevant ensures that a limited graph's
 * connection to the actual bottom commit is not viewed as a side branch, but
 * treated as part of the graph. For example:
 *
 *   ....Z...A---X---o---o---B
 *        .     /
 *         W---Y
 *
 * When computing "A..B", the A-X connection is at least as important as
 * Y-X, despite A being flagged UNINTERESTING.
 *
 * And when computing --ancestry-path "A..B", the A-X connection is more
 * important than Y-X, despite both A and Y being flagged UNINTERESTING.
 */
static inline int relevant_commit(struct commit *commit)
{
	/* Irrelevant only when UNINTERESTING is set and BOTTOM is not. */
	unsigned int masked = commit->object.flags & (UNINTERESTING | BOTTOM);

	return masked != UNINTERESTING;
}

/*
 * Return a single relevant commit from a parent list. If we are a TREESAME
 * commit, and this selects one of our parents, then we can safely simplify to
 * that parent.
 */
static struct commit *one_relevant_parent(const struct rev_info *revs,
					  struct commit_list *orig)
{
	struct commit_list *node;
	struct commit *found = NULL;

	if (!orig)
		return NULL;

	/*
	 * A lone parent, or first-parent-only mode: hand back the first
	 * parent whether or not it is "relevant"; TREESAME was computed
	 * against that parent alone.
	 */
	if (!orig->next || revs->first_parent_only)
		return orig->item;

	/*
	 * Merge: pick the parent only if exactly one is relevant.  Zero
	 * relevant parents leaves "found" NULL; a second relevant parent
	 * makes the choice ambiguous and yields NULL as well.
	 */
	for (node = orig; node; node = node->next) {
		if (!relevant_commit(node->item))
			continue;
		if (found)
			return NULL;
		found = node->item;
	}
	return found;
}

409 410
/*
 * The goal is to get REV_TREE_NEW as the result only if the
411 412 413 414 415 416
 * diff consists of all '+' (and no other changes), REV_TREE_OLD
 * if the whole diff is removal of old data, and otherwise
 * REV_TREE_DIFFERENT (of course if the trees are the same we
 * want REV_TREE_SAME).
 * That means that once we get to REV_TREE_DIFFERENT, we do not
 * have to look any further.
417
 */
418
static int tree_difference = REV_TREE_SAME;
419 420 421 422

static void file_add_remove(struct diff_options *options,
		    int addremove, unsigned mode,
		    const unsigned char *sha1,
423
		    int sha1_valid,
424
		    const char *fullpath, unsigned dirty_submodule)
425
{
426
	int diff = addremove == '+' ? REV_TREE_NEW : REV_TREE_OLD;
427

428
	tree_difference |= diff;
429
	if (tree_difference == REV_TREE_DIFFERENT)
430
		DIFF_OPT_SET(options, HAS_CHANGES);
431 432 433 434 435 436
}

static void file_change(struct diff_options *options,
		 unsigned old_mode, unsigned new_mode,
		 const unsigned char *old_sha1,
		 const unsigned char *new_sha1,
437
		 int old_sha1_valid, int new_sha1_valid,
438 439
		 const char *fullpath,
		 unsigned old_dirty_submodule, unsigned new_dirty_submodule)
440
{
441
	tree_difference = REV_TREE_DIFFERENT;
442
	DIFF_OPT_SET(options, HAS_CHANGES);
443 444
}

445
static int rev_compare_tree(struct rev_info *revs, struct commit *parent, struct commit *commit)
446
{
447 448 449
	struct tree *t1 = parent->tree;
	struct tree *t2 = commit->tree;

450
	if (!t1)
451
		return REV_TREE_NEW;
452 453
	if (!t2)
		return REV_TREE_OLD;
454 455 456 457 458 459 460 461 462 463 464 465 466 467 468

	if (revs->simplify_by_decoration) {
		/*
		 * If we are simplifying by decoration, then the commit
		 * is worth showing if it has a tag pointing at it.
		 */
		if (lookup_decoration(&name_decoration, &commit->object))
			return REV_TREE_DIFFERENT;
		/*
		 * A commit that is not pointed by a tag is uninteresting
		 * if we are not limited by path.  This means that you will
		 * see the usual "commits that touch the paths" plus any
		 * tagged commit by specifying both --simplify-by-decoration
		 * and pathspec.
		 */
469
		if (!revs->prune_data.nr)
470 471
			return REV_TREE_SAME;
	}
472

473
	tree_difference = REV_TREE_SAME;
474
	DIFF_OPT_CLR(&revs->pruning, HAS_CHANGES);
475
	if (diff_tree_sha1(t1->object.sha1, t2->object.sha1, "",
476
			   &revs->pruning) < 0)
477
		return REV_TREE_DIFFERENT;
478 479 480
	return tree_difference;
}

481
static int rev_same_tree_as_empty(struct rev_info *revs, struct commit *commit)
482 483 484
{
	int retval;
	void *tree;
485
	unsigned long size;
486
	struct tree_desc empty, real;
487
	struct tree *t1 = commit->tree;
488 489 490 491

	if (!t1)
		return 0;

492
	tree = read_object_with_reference(t1->object.sha1, tree_type, &size, NULL);
493 494
	if (!tree)
		return 0;
495 496
	init_tree_desc(&real, tree, size);
	init_tree_desc(&empty, "", 0);
497

498
	tree_difference = REV_TREE_SAME;
499
	DIFF_OPT_CLR(&revs->pruning, HAS_CHANGES);
500
	retval = diff_tree(&empty, &real, "", &revs->pruning);
501 502
	free(tree);

503
	return retval >= 0 && (tree_difference == REV_TREE_SAME);
504 505
}

506 507 508 509 510 511 512 513 514 515 516 517 518 519 520 521 522 523 524 525 526 527 528 529 530 531 532 533 534 535 536 537 538 539 540 541 542 543 544 545 546 547 548 549 550 551 552 553 554 555 556 557 558 559 560 561 562 563 564 565 566 567 568 569 570 571 572 573 574 575 576 577 578
/*
 * Per-commit record, stored as a decoration in revs->treesame, of which
 * parents the commit is TREESAME to.  Allocated with one treesame[] byte
 * per parent.
 */
struct treesame_state {
	unsigned int nparents;	/* number of entries in treesame[] */
	unsigned char treesame[FLEX_ARRAY];	/* non-zero: tree same as nth parent */
};

/*
 * Allocate a zeroed treesame_state sized for the current number of
 * parents of "commit", attach it to the commit as a decoration in
 * revs->treesame, and return it.
 */
static struct treesame_state *initialise_treesame(struct rev_info *revs, struct commit *commit)
{
	unsigned nparents = commit_list_count(commit->parents);
	struct treesame_state *state;

	state = xcalloc(1, sizeof(*state) + nparents);
	state->nparents = nparents;
	add_decoration(&revs->treesame, &commit->object, state);
	return state;
}

/*
 * Must be called immediately after removing the nth_parent from a commit's
 * parent list, if we are maintaining the per-parent treesame[] decoration.
 * This does not recalculate the master TREESAME flag - update_treesame()
 * should be called to update it after a sequence of treesame[] modifications
 * that may have affected it.
 *
 * Returns the treesame state that had been recorded for the removed
 * parent; for a commit left with no parents, whether TREESAME was set
 * before the call.  Dies if the decoration is missing or nth_parent is
 * out of range for it.
 */
static int compact_treesame(struct rev_info *revs, struct commit *commit, unsigned nth_parent)
{
	struct treesame_state *st;
	int old_same;

	if (!commit->parents) {
		/*
		 * Have just removed the only parent from a non-merge.
		 * Different handling, as we lack decoration.
		 */
		if (nth_parent != 0)
			die("compact_treesame %u", nth_parent);
		old_same = !!(commit->object.flags & TREESAME);
		/* Now parentless: TREESAME is judged against the empty tree. */
		if (rev_same_tree_as_empty(revs, commit))
			commit->object.flags |= TREESAME;
		else
			commit->object.flags &= ~TREESAME;
		return old_same;
	}

	st = lookup_decoration(&revs->treesame, &commit->object);
	if (!st || nth_parent >= st->nparents)
		die("compact_treesame %u", nth_parent);

	old_same = st->treesame[nth_parent];
	/* Close the gap left by the removed parent's entry. */
	memmove(st->treesame + nth_parent,
		st->treesame + nth_parent + 1,
		st->nparents - nth_parent - 1);

	/*
	 * If we've just become a non-merge commit, update TREESAME
	 * immediately, and remove the no-longer-needed decoration.
	 * If still a merge, defer update until update_treesame().
	 */
	if (--st->nparents == 1) {
		if (commit->parents->next)
			die("compact_treesame parents mismatch");
		if (st->treesame[0] && revs->dense)
			commit->object.flags |= TREESAME;
		else
			commit->object.flags &= ~TREESAME;
		/* add_decoration() hands back the old value, i.e. st. */
		free(add_decoration(&revs->treesame, &commit->object, NULL));
	}

	return old_same;
}

static unsigned update_treesame(struct rev_info *revs, struct commit *commit)
{
	if (commit->parents && commit->parents->next) {
		unsigned n;
		struct treesame_state *st;
579 580 581
		struct commit_list *p;
		unsigned relevant_parents;
		unsigned relevant_change, irrelevant_change;
582 583 584 585

		st = lookup_decoration(&revs->treesame, &commit->object);
		if (!st)
			die("update_treesame %s", sha1_to_hex(commit->object.sha1));
586 587 588 589 590 591 592 593
		relevant_parents = 0;
		relevant_change = irrelevant_change = 0;
		for (p = commit->parents, n = 0; p; n++, p = p->next) {
			if (relevant_commit(p->item)) {
				relevant_change |= !st->treesame[n];
				relevant_parents++;
			} else
				irrelevant_change |= !st->treesame[n];
594
		}
595 596 597 598
		if (relevant_parents ? relevant_change : irrelevant_change)
			commit->object.flags &= ~TREESAME;
		else
			commit->object.flags |= TREESAME;
599 600 601 602 603
	}

	return commit->object.flags & TREESAME;
}

604 605 606 607 608 609 610 611 612 613 614 615 616 617 618
static inline int limiting_can_increase_treesame(const struct rev_info *revs)
{
	/* TREESAME only matters when both pruning and dense are on. */
	if (!revs->prune || !revs->dense)
		return 0;

	/*
	 * With simplify_history there can be no mixture of TREESAME and
	 * !TREESAME INTERESTING parents (and no treesame[] decoration
	 * exists anyway).
	 */
	if (revs->simplify_history)
		return 0;

	/*
	 * With first_parent_only the TREESAME flag is locked against the
	 * first parent (again without treesame[] decoration).
	 */
	return !revs->first_parent_only;
}

619 620 621
static void try_to_simplify_commit(struct rev_info *revs, struct commit *commit)
{
	struct commit_list **pp, *parent;
622
	struct treesame_state *ts = NULL;
623 624
	int relevant_change = 0, irrelevant_change = 0;
	int relevant_parents, nth_parent;
625

L
Linus Torvalds 已提交
626 627 628
	/*
	 * If we don't do pruning, everything is interesting
	 */
629
	if (!revs->prune)
L
Linus Torvalds 已提交
630 631
		return;

632 633 634 635
	if (!commit->tree)
		return;

	if (!commit->parents) {
636
		if (rev_same_tree_as_empty(revs, commit))
637
			commit->object.flags |= TREESAME;
638 639 640
		return;
	}

L
Linus Torvalds 已提交
641 642 643 644
	/*
	 * Normal non-merge commit? If we don't want to make the
	 * history dense, we consider it always to be a change..
	 */
645
	if (!revs->dense && !commit->parents->next)
L
Linus Torvalds 已提交
646 647
		return;

648
	for (pp = &commit->parents, nth_parent = 0, relevant_parents = 0;
649 650
	     (parent = *pp) != NULL;
	     pp = &parent->next, nth_parent++) {
651
		struct commit *p = parent->item;
652 653
		if (relevant_commit(p))
			relevant_parents++;
654

655 656 657 658 659 660 661 662 663 664 665 666 667 668 669 670 671 672 673 674 675 676
		if (nth_parent == 1) {
			/*
			 * This our second loop iteration - so we now know
			 * we're dealing with a merge.
			 *
			 * Do not compare with later parents when we care only about
			 * the first parent chain, in order to avoid derailing the
			 * traversal to follow a side branch that brought everything
			 * in the path we are limited to by the pathspec.
			 */
			if (revs->first_parent_only)
				break;
			/*
			 * If this will remain a potentially-simplifiable
			 * merge, remember per-parent treesame if needed.
			 * Initialise the array with the comparison from our
			 * first iteration.
			 */
			if (revs->treesame.name &&
			    !revs->simplify_history &&
			    !(commit->object.flags & UNINTERESTING)) {
				ts = initialise_treesame(revs, commit);
677
				if (!(irrelevant_change || relevant_change))
678 679 680
					ts->treesame[0] = 1;
			}
		}
681 682 683 684
		if (parse_commit(p) < 0)
			die("cannot simplify commit %s (because of %s)",
			    sha1_to_hex(commit->object.sha1),
			    sha1_to_hex(p->object.sha1));
685
		switch (rev_compare_tree(revs, p, commit)) {
686
		case REV_TREE_SAME:
687
			if (!revs->simplify_history || !relevant_commit(p)) {
688 689 690 691 692 693
				/* Even if a merge with an uninteresting
				 * side branch brought the entire change
				 * we are interested in, we do not want
				 * to lose the other branches of this
				 * merge, so we just keep going.
				 */
694 695
				if (ts)
					ts->treesame[nth_parent] = 1;
696 697
				continue;
			}
698 699
			parent->next = NULL;
			commit->parents = parent;
700
			commit->object.flags |= TREESAME;
701 702
			return;

703 704
		case REV_TREE_NEW:
			if (revs->remove_empty_trees &&
705
			    rev_same_tree_as_empty(revs, p)) {
706 707 708 709 710 711 712
				/* We are adding all the specified
				 * paths from this parent, so the
				 * history beyond this parent is not
				 * interesting.  Remove its parents
				 * (they are grandparents for us).
				 * IOW, we pretend this parent is a
				 * "root" commit.
713
				 */
714 715 716 717
				if (parse_commit(p) < 0)
					die("cannot simplify commit %s (invalid %s)",
					    sha1_to_hex(commit->object.sha1),
					    sha1_to_hex(p->object.sha1));
718
				p->parents = NULL;
719 720
			}
		/* fallthrough */
721
		case REV_TREE_OLD:
722
		case REV_TREE_DIFFERENT:
723 724 725 726
			if (relevant_commit(p))
				relevant_change = 1;
			else
				irrelevant_change = 1;
727 728 729 730
			continue;
		}
		die("bad tree compare for commit %s", sha1_to_hex(commit->object.sha1));
	}
731 732 733 734 735 736 737 738 739 740 741 742 743

	/*
	 * TREESAME is straightforward for single-parent commits. For merge
	 * commits, it is most useful to define it so that "irrelevant"
	 * parents cannot make us !TREESAME - if we have any relevant
	 * parents, then we only consider TREESAMEness with respect to them,
	 * allowing irrelevant merges from uninteresting branches to be
	 * simplified away. Only if we have only irrelevant parents do we
	 * base TREESAME on them. Note that this logic is replicated in
	 * update_treesame, which should be kept in sync.
	 */
	if (relevant_parents ? !relevant_change : !irrelevant_change)
		commit->object.flags |= TREESAME;
744 745
}

746
static void commit_list_insert_by_date_cached(struct commit *p, struct commit_list **head,
747 748 749 750 751
		    struct commit_list *cached_base, struct commit_list **cache)
{
	struct commit_list *new_entry;

	if (cached_base && p->date < cached_base->item->date)
752
		new_entry = commit_list_insert_by_date(p, &cached_base->next);
753
	else
754
		new_entry = commit_list_insert_by_date(p, head);
755 756 757 758 759 760 761

	if (cache && (!*cache || p->date < (*cache)->item->date))
		*cache = new_entry;
}

static int add_parents_to_list(struct rev_info *revs, struct commit *commit,
		    struct commit_list **list, struct commit_list **cache_ptr)
762 763
{
	struct commit_list *parent = commit->parents;
J
Junio C Hamano 已提交
764
	unsigned left_flag;
765
	struct commit_list *cached_base = cache_ptr ? *cache_ptr : NULL;
766

767
	if (commit->object.flags & ADDED)
768
		return 0;
769 770
	commit->object.flags |= ADDED;

771 772 773 774 775 776 777 778 779 780 781 782 783 784 785 786
	/*
	 * If the commit is uninteresting, don't try to
	 * prune parents - we want the maximal uninteresting
	 * set.
	 *
	 * Normally we haven't parsed the parent
	 * yet, so we won't have a parent of a parent
	 * here. However, it may turn out that we've
	 * reached this commit some other way (where it
	 * wasn't uninteresting), in which case we need
	 * to mark its parents recursively too..
	 */
	if (commit->object.flags & UNINTERESTING) {
		while (parent) {
			struct commit *p = parent->item;
			parent = parent->next;
787 788
			if (p)
				p->object.flags |= UNINTERESTING;
789
			if (parse_commit(p) < 0)
790
				continue;
791 792 793 794 795
			if (p->parents)
				mark_parents_uninteresting(p);
			if (p->object.flags & SEEN)
				continue;
			p->object.flags |= SEEN;
796
			commit_list_insert_by_date_cached(p, list, cached_base, cache_ptr);
797
		}
798
		return 0;
799 800 801 802 803 804 805
	}

	/*
	 * Ok, the commit wasn't uninteresting. Try to
	 * simplify the commit history and find the parent
	 * that has no differences in the path set if one exists.
	 */
L
Linus Torvalds 已提交
806
	try_to_simplify_commit(revs, commit);
807

L
Linus Torvalds 已提交
808
	if (revs->no_walk)
809
		return 0;
L
Linus Torvalds 已提交
810

J
Junio C Hamano 已提交
811
	left_flag = (commit->object.flags & SYMMETRIC_LEFT);
812

813
	for (parent = commit->parents; parent; parent = parent->next) {
814 815
		struct commit *p = parent->item;

816 817
		if (parse_commit(p) < 0)
			return -1;
818 819
		if (revs->show_source && !p->util)
			p->util = commit->util;
J
Junio C Hamano 已提交
820
		p->object.flags |= left_flag;
821 822
		if (!(p->object.flags & SEEN)) {
			p->object.flags |= SEEN;
823
			commit_list_insert_by_date_cached(p, list, cached_base, cache_ptr);
824
		}
J
Junio C Hamano 已提交
825
		if (revs->first_parent_only)
826
			break;
827
	}
828
	return 0;
829 830
}

831
static void cherry_pick_list(struct commit_list *list, struct rev_info *revs)
J
Junio C Hamano 已提交
832 833 834 835 836
{
	struct commit_list *p;
	int left_count = 0, right_count = 0;
	int left_first;
	struct patch_ids ids;
837
	unsigned cherry_flag;
J
Junio C Hamano 已提交
838 839 840 841 842 843 844 845 846 847 848 849 850

	/* First count the commits on the left and on the right */
	for (p = list; p; p = p->next) {
		struct commit *commit = p->item;
		unsigned flags = commit->object.flags;
		if (flags & BOUNDARY)
			;
		else if (flags & SYMMETRIC_LEFT)
			left_count++;
		else
			right_count++;
	}

851 852 853
	if (!left_count || !right_count)
		return;

J
Junio C Hamano 已提交
854 855
	left_first = left_count < right_count;
	init_patch_ids(&ids);
856
	ids.diffopts.pathspec = revs->diffopt.pathspec;
J
Junio C Hamano 已提交
857 858 859 860 861 862 863 864 865 866 867 868 869 870 871 872 873 874

	/* Compute patch-ids for one side */
	for (p = list; p; p = p->next) {
		struct commit *commit = p->item;
		unsigned flags = commit->object.flags;

		if (flags & BOUNDARY)
			continue;
		/*
		 * If we have fewer left, left_first is set and we omit
		 * commits on the right branch in this loop.  If we have
		 * fewer right, we skip the left ones.
		 */
		if (left_first != !!(flags & SYMMETRIC_LEFT))
			continue;
		commit->util = add_commit_patch_id(commit, &ids);
	}

875 876 877
	/* either cherry_mark or cherry_pick are true */
	cherry_flag = revs->cherry_mark ? PATCHSAME : SHOWN;

J
Junio C Hamano 已提交
878 879 880 881 882 883 884 885 886 887 888 889 890 891 892 893 894 895 896 897 898 899
	/* Check the other side */
	for (p = list; p; p = p->next) {
		struct commit *commit = p->item;
		struct patch_id *id;
		unsigned flags = commit->object.flags;

		if (flags & BOUNDARY)
			continue;
		/*
		 * If we have fewer left, left_first is set and we omit
		 * commits on the left branch in this loop.
		 */
		if (left_first == !!(flags & SYMMETRIC_LEFT))
			continue;

		/*
		 * Have we seen the same patch id?
		 */
		id = has_commit_patch_id(commit, &ids);
		if (!id)
			continue;
		id->seen = 1;
900
		commit->object.flags |= cherry_flag;
J
Junio C Hamano 已提交
901 902 903 904 905 906 907 908 909 910 911
	}

	/* Now check the original side for seen ones */
	for (p = list; p; p = p->next) {
		struct commit *commit = p->item;
		struct patch_id *ent;

		ent = commit->util;
		if (!ent)
			continue;
		if (ent->seen)
912
			commit->object.flags |= cherry_flag;
J
Junio C Hamano 已提交
913 914 915 916 917 918
		commit->util = NULL;
	}

	free_patch_ids(&ids);
}

919 920 921 922
/* How many extra uninteresting commits we want to see.. */
#define SLOP 5

static int still_interesting(struct commit_list *src, unsigned long date, int slop)
923
{
924 925 926 927 928 929 930 931 932 933
	/*
	 * No source list at all? We're definitely done..
	 */
	if (!src)
		return 0;

	/*
	 * Does the destination list contain entries with a date
	 * before the source list? Definitely _not_ done.
	 */
934
	if (date <= src->item->date)
935 936 937 938 939 940 941 942 943 944 945
		return SLOP;

	/*
	 * Does the source list still have interesting commits in
	 * it? Definitely not done..
	 */
	if (!everybody_uninteresting(src))
		return SLOP;

	/* Ok, we're closing in.. */
	return slop-1;
946 947
}

J
Junio C Hamano 已提交
948 949 950 951 952 953 954 955 956 957 958 959 960 961 962 963 964 965 966 967 968 969 970 971 972 973 974 975 976 977 978 979 980 981 982 983 984 985 986 987 988 989 990 991 992 993 994 995 996 997 998 999 1000 1001 1002 1003 1004 1005 1006 1007 1008 1009 1010 1011 1012 1013 1014 1015 1016 1017 1018 1019 1020 1021 1022 1023 1024 1025
/*
 * "rev-list --ancestry-path A..B" computes commits that are ancestors
 * of B but not ancestors of A but further limits the result to those
 * that are descendants of A.  This takes the list of bottom commits and
 * the result of "A..B" without --ancestry-path, and limits the latter
 * further to the ones that can reach one of the commits in "bottom".
 */
static void limit_to_ancestry(struct commit_list *bottom, struct commit_list *list)
{
	struct commit_list *it;
	struct commit_list *reversed = NULL;
	int changed;

	/*
	 * Work on a reversed copy of the list, so that parents are
	 * likely to be visited before their children.
	 */
	for (it = list; it; it = it->next)
		commit_list_insert(it->item, &reversed);

	/* Seed: the bottom commits trivially reach themselves. */
	for (it = bottom; it; it = it->next)
		it->item->object.flags |= TMP_MARK;

	/*
	 * Propagate TMP_MARK from parents to children until a full pass
	 * over the list marks nothing new.
	 */
	do {
		changed = 0;
		for (it = reversed; it; it = it->next) {
			struct commit *c = it->item;
			struct commit_list *par;

			if (c->object.flags & (TMP_MARK | UNINTERESTING))
				continue;
			for (par = c->parents; par; par = par->next) {
				if (par->item->object.flags & TMP_MARK) {
					c->object.flags |= TMP_MARK;
					changed = 1;
					break;
				}
			}
		}
	} while (changed);

	/*
	 * NEEDSWORK: decide if we want to remove parents that are
	 * not marked with TMP_MARK from commit->parents for commits
	 * in the resulting list.  We may not want to do that, though.
	 */

	/* Whatever could not reach a bottom commit becomes uninteresting. */
	for (it = list; it; it = it->next) {
		if (!(it->item->object.flags & TMP_MARK))
			it->item->object.flags |= UNINTERESTING;
	}

	/* Drop the temporary marks again and release the scratch list. */
	for (it = list; it; it = it->next)
		it->item->object.flags &= ~TMP_MARK;
	for (it = bottom; it; it = it->next)
		it->item->object.flags &= ~TMP_MARK;
	free_commit_list(reversed);
}

/*
 * Before walking the history, keep the set of "negative" refs the
 * caller has asked to exclude.
 *
 * This is used to compute "rev-list --ancestry-path A..B", as we need
 * to filter the result of "A..B" further to the ones that can actually
 * reach A.
 */
1026
static struct commit_list *collect_bottom_commits(struct commit_list *list)
J
Junio C Hamano 已提交
1027
{
1028 1029 1030 1031
	struct commit_list *elem, *bottom = NULL;
	for (elem = list; elem; elem = elem->next)
		if (elem->item->object.flags & BOTTOM)
			commit_list_insert(elem->item, &bottom);
J
Junio C Hamano 已提交
1032 1033 1034
	return bottom;
}

1035 1036 1037 1038 1039 1040 1041 1042 1043 1044 1045 1046 1047 1048 1049 1050 1051
/* Assumes either left_only or right_only is set */
static void limit_left_right(struct commit_list *list, struct rev_info *revs)
{
	struct commit_list *p;

	for (p = list; p; p = p->next) {
		struct commit *commit = p->item;

		if (revs->right_only) {
			if (commit->object.flags & SYMMETRIC_LEFT)
				commit->object.flags |= SHOWN;
		} else	/* revs->left_only is set */
			if (!(commit->object.flags & SYMMETRIC_LEFT))
				commit->object.flags |= SHOWN;
	}
}

1052
static int limit_list(struct rev_info *revs)
1053
{
1054 1055
	int slop = SLOP;
	unsigned long date = ~0ul;
1056 1057 1058
	struct commit_list *list = revs->commits;
	struct commit_list *newlist = NULL;
	struct commit_list **p = &newlist;
J
Junio C Hamano 已提交
1059 1060 1061
	struct commit_list *bottom = NULL;

	if (revs->ancestry_path) {
1062
		bottom = collect_bottom_commits(list);
J
Junio C Hamano 已提交
1063
		if (!bottom)
1064
			die("--ancestry-path given but there are no bottom commits");
J
Junio C Hamano 已提交
1065
	}
1066 1067 1068 1069 1070

	while (list) {
		struct commit_list *entry = list;
		struct commit *commit = list->item;
		struct object *obj = &commit->object;
1071
		show_early_output_fn_t show;
1072 1073 1074 1075 1076 1077

		list = list->next;
		free(entry);

		if (revs->max_age != -1 && (commit->date < revs->max_age))
			obj->flags |= UNINTERESTING;
1078
		if (add_parents_to_list(revs, commit, &list, NULL) < 0)
1079
			return -1;
1080 1081
		if (obj->flags & UNINTERESTING) {
			mark_parents_uninteresting(commit);
1082 1083 1084 1085
			if (revs->show_all)
				p = &commit_list_insert(commit, p)->next;
			slop = still_interesting(list, date, slop);
			if (slop)
1086
				continue;
1087 1088 1089 1090
			/* If showing all, add the whole pending list to the end */
			if (revs->show_all)
				*p = list;
			break;
1091 1092 1093
		}
		if (revs->min_age != -1 && (commit->date > revs->min_age))
			continue;
1094
		date = commit->date;
1095
		p = &commit_list_insert(commit, p)->next;
1096 1097 1098 1099 1100 1101 1102

		show = show_early_output;
		if (!show)
			continue;

		show(revs, newlist);
		show_early_output = NULL;
1103
	}
1104
	if (revs->cherry_pick || revs->cherry_mark)
1105
		cherry_pick_list(newlist, revs);
J
Junio C Hamano 已提交
1106

1107 1108 1109
	if (revs->left_only || revs->right_only)
		limit_left_right(newlist, revs);

J
Junio C Hamano 已提交
1110 1111 1112 1113 1114
	if (bottom) {
		limit_to_ancestry(bottom, newlist);
		free_commit_list(bottom);
	}

1115 1116 1117 1118 1119 1120 1121 1122 1123 1124 1125 1126
	/*
	 * Check if any commits have become TREESAME by some of their parents
	 * becoming UNINTERESTING.
	 */
	if (limiting_can_increase_treesame(revs))
		for (list = newlist; list; list = list->next) {
			struct commit *c = list->item;
			if (c->object.flags & (UNINTERESTING | TREESAME))
				continue;
			update_treesame(revs, c);
		}

1127
	revs->commits = newlist;
1128
	return 0;
1129 1130
}

1131 1132 1133 1134 1135 1136 1137 1138 1139 1140 1141 1142 1143 1144 1145 1146 1147
/*
 * Append one entry to revs->cmdline, growing the array as needed.
 * "name" is stored as given (the pointer is not copied), so it has to
 * stay valid for as long as the entry is used.
 */
static void add_rev_cmdline(struct rev_info *revs,
			    struct object *item,
			    const char *name,
			    int whence,
			    unsigned flags)
{
	struct rev_cmdline_info *cmdline = &revs->cmdline;
	int slot = cmdline->nr;

	ALLOC_GROW(cmdline->rev, slot + 1, cmdline->alloc);
	cmdline->nr = slot + 1;

	cmdline->rev[slot].flags = flags;
	cmdline->rev[slot].whence = whence;
	cmdline->rev[slot].name = name;
	cmdline->rev[slot].item = item;
}

1148 1149 1150 1151 1152 1153 1154 1155 1156 1157 1158 1159 1160
/*
 * Record every commit of "commit_list" in revs->cmdline, named by its
 * hexadecimal object name, with the given origin ("whence") and flags.
 */
static void add_rev_cmdline_list(struct rev_info *revs,
				 struct commit_list *commit_list,
				 int whence,
				 unsigned flags)
{
	for (; commit_list; commit_list = commit_list->next) {
		struct object *object = &commit_list->item->object;

		/*
		 * add_rev_cmdline() keeps the name pointer as-is, while
		 * sha1_to_hex() hands out a static buffer that later calls
		 * reuse.  Store a private copy so the recorded name stays
		 * intact; it lives as long as the cmdline entry and is
		 * deliberately never freed here.
		 */
		add_rev_cmdline(revs, object,
				xstrdup(sha1_to_hex(object->sha1)),
				whence, flags);
	}
}

1161 1162
/* Callback state shared by the ref and reflog iteration helpers below. */
struct all_refs_cb {
	int all_flags;			/* object flags applied to each ref found */
	int warned_bad_reflog;		/* set once the "pruned commits" warning was shown */
	struct rev_info *all_revs;	/* traversal the refs are added to */
	const char *name_for_errormsg;	/* reflog currently being walked */
};
1167

1168
static int handle_one_ref(const char *path, const unsigned char *sha1, int flag, void *cb_data)
1169
{
1170 1171 1172
	struct all_refs_cb *cb = cb_data;
	struct object *object = get_reference(cb->all_revs, path, sha1,
					      cb->all_flags);
1173
	add_rev_cmdline(cb->all_revs, object, path, REV_CMD_REF, cb->all_flags);
1174
	add_pending_sha1(cb->all_revs, path, sha1, cb->all_flags);
1175 1176 1177
	return 0;
}

I
Ilari Liusvaara 已提交
1178 1179 1180 1181 1182 1183 1184
/*
 * Prepare a struct all_refs_cb for a ref iteration over "revs" with
 * the given object flags.  The reflog-only bookkeeping fields are
 * reset as well so that no member is left indeterminate.
 */
static void init_all_refs_cb(struct all_refs_cb *cb, struct rev_info *revs,
	unsigned flags)
{
	cb->all_revs = revs;
	cb->all_flags = flags;
	cb->warned_bad_reflog = 0;
	cb->name_for_errormsg = NULL;
}

1185 1186
/*
 * Run the ref iterator "for_each" (for the given submodule) and add
 * every ref it reports to "revs" with "flags", via handle_one_ref().
 */
static void handle_refs(const char *submodule, struct rev_info *revs, unsigned flags,
		int (*for_each)(const char *, each_ref_fn, void *))
{
	struct all_refs_cb cb;
	init_all_refs_cb(&cb, revs, flags);
	for_each(submodule, handle_one_ref, &cb);
}

1193
static void handle_one_reflog_commit(unsigned char *sha1, void *cb_data)
1194 1195
{
	struct all_refs_cb *cb = cb_data;
1196 1197 1198 1199
	if (!is_null_sha1(sha1)) {
		struct object *o = parse_object(sha1);
		if (o) {
			o->flags |= cb->all_flags;
1200
			/* ??? CMDLINEFLAGS ??? */
1201 1202 1203
			add_pending_object(cb->all_revs, o, "");
		}
		else if (!cb->warned_bad_reflog) {
1204
			warning("reflog of '%s' references pruned commits",
1205 1206 1207
				cb->name_for_errormsg);
			cb->warned_bad_reflog = 1;
		}
1208
	}
1209 1210
}

1211 1212 1213
/*
 * Reflog entry callback: queue both the old and the new object of the
 * entry.  The remaining entry fields are not used.  Always returns 0.
 */
static int handle_one_reflog_ent(unsigned char *osha1, unsigned char *nsha1,
		const char *email, unsigned long timestamp, int tz,
		const char *message, void *cb_data)
{
	handle_one_reflog_commit(osha1, cb_data);
	handle_one_reflog_commit(nsha1, cb_data);
	return 0;
}

static int handle_one_reflog(const char *path, const unsigned char *sha1, int flag, void *cb_data)
{
	struct all_refs_cb *cb = cb_data;
1223
	cb->warned_bad_reflog = 0;
1224 1225 1226 1227 1228 1229 1230 1231 1232 1233
	cb->name_for_errormsg = path;
	for_each_reflog_ent(path, handle_one_reflog_ent, cb_data);
	return 0;
}

static void handle_reflog(struct rev_info *revs, unsigned flags)
{
	struct all_refs_cb cb;
	cb.all_revs = revs;
	cb.all_flags = flags;
1234
	for_each_reflog(handle_one_reflog, &cb);
1235 1236
}

1237
static int add_parents_only(struct rev_info *revs, const char *arg_, int flags)
1238 1239 1240 1241 1242
{
	unsigned char sha1[20];
	struct object *it;
	struct commit *commit;
	struct commit_list *parents;
1243
	const char *arg = arg_;
1244 1245

	if (*arg == '^') {
1246
		flags ^= UNINTERESTING | BOTTOM;
1247 1248
		arg++;
	}
1249
	if (get_sha1_committish(arg, sha1))
1250 1251 1252
		return 0;
	while (1) {
		it = get_reference(revs, arg, sha1, 0);
J
Junio C Hamano 已提交
1253 1254
		if (!it && revs->ignore_missing)
			return 0;
1255
		if (it->type != OBJ_TAG)
1256
			break;
1257 1258
		if (!((struct tag*)it)->tagged)
			return 0;
1259
		hashcpy(sha1, ((struct tag*)it)->tagged->sha1);
1260
	}
1261
	if (it->type != OBJ_COMMIT)
1262 1263 1264 1265 1266
		return 0;
	commit = (struct commit *)it;
	for (parents = commit->parents; parents; parents = parents->next) {
		it = &parents->item->object;
		it->flags |= flags;
1267
		add_rev_cmdline(revs, it, arg_, REV_CMD_PARENTS_ONLY, flags);
1268 1269 1270 1271 1272
		add_pending_object(revs, it, arg);
	}
	return 1;
}

1273
void init_revisions(struct rev_info *revs, const char *prefix)
1274 1275
{
	memset(revs, 0, sizeof(*revs));
1276

1277
	revs->abbrev = DEFAULT_ABBREV;
1278
	revs->ignore_merges = 1;
L
Linus Torvalds 已提交
1279
	revs->simplify_history = 1;
1280
	DIFF_OPT_SET(&revs->pruning, RECURSIVE);
1281
	DIFF_OPT_SET(&revs->pruning, QUICK);
1282 1283
	revs->pruning.add_remove = file_add_remove;
	revs->pruning.change = file_change;
1284 1285
	revs->lifo = 1;
	revs->dense = 1;
1286
	revs->prefix = prefix;
1287 1288
	revs->max_age = -1;
	revs->min_age = -1;
J
Junio C Hamano 已提交
1289
	revs->skip_count = -1;
1290
	revs->max_count = -1;
1291
	revs->max_parents = -1;
1292

1293 1294
	revs->commit_format = CMIT_FMT_DEFAULT;

1295 1296
	init_grep_defaults();
	grep_init(&revs->grep_filter, prefix);
J
Jeff King 已提交
1297 1298 1299
	revs->grep_filter.status_only = 1;
	revs->grep_filter.regflags = REG_NEWLINE;

1300
	diff_setup(&revs->diffopt);
1301
	if (prefix && !revs->diffopt.prefix) {
1302 1303 1304
		revs->diffopt.prefix = prefix;
		revs->diffopt.prefix_length = strlen(prefix);
	}
1305 1306

	revs->notes_opt.use_default_notes = -1;
1307 1308
}

R
Rene Scharfe 已提交
1309 1310 1311 1312 1313 1314 1315 1316 1317 1318 1319 1320
/*
 * OR "flags" into every commit of "commit_list" and queue each one as
 * a pending object of "revs", named by its hexadecimal object name.
 */
static void add_pending_commit_list(struct rev_info *revs,
                                    struct commit_list *commit_list,
                                    unsigned int flags)
{
	struct commit_list *cur;

	for (cur = commit_list; cur; cur = cur->next) {
		struct object *obj = &cur->item->object;

		obj->flags |= flags;
		add_pending_object(revs, obj, sha1_to_hex(obj->sha1));
	}
}

1321 1322 1323 1324 1325 1326 1327 1328
static void prepare_show_merge(struct rev_info *revs)
{
	struct commit_list *bases;
	struct commit *head, *other;
	unsigned char sha1[20];
	const char **prune = NULL;
	int i, prune_num = 1; /* counting terminating NULL */

1329
	if (get_sha1("HEAD", sha1))
1330
		die("--merge without HEAD?");
1331 1332
	head = lookup_commit_or_die(sha1, "HEAD");
	if (get_sha1("MERGE_HEAD", sha1))
1333
		die("--merge without MERGE_HEAD?");
1334
	other = lookup_commit_or_die(sha1, "MERGE_HEAD");
1335 1336 1337
	add_pending_object(revs, &head->object, "HEAD");
	add_pending_object(revs, &other->object, "MERGE_HEAD");
	bases = get_merge_bases(head, other, 1);
1338 1339
	add_rev_cmdline_list(revs, bases, REV_CMD_MERGE_BASE, UNINTERESTING | BOTTOM);
	add_pending_commit_list(revs, bases, UNINTERESTING | BOTTOM);
1340 1341
	free_commit_list(bases);
	head->object.flags |= SYMMETRIC_LEFT;
1342 1343 1344 1345 1346 1347 1348

	if (!active_nr)
		read_cache();
	for (i = 0; i < active_nr; i++) {
		struct cache_entry *ce = active_cache[i];
		if (!ce_stage(ce))
			continue;
1349
		if (ce_path_match(ce, &revs->prune_data)) {
1350 1351 1352 1353 1354 1355 1356 1357 1358
			prune_num++;
			prune = xrealloc(prune, sizeof(*prune) * prune_num);
			prune[prune_num-2] = ce->name;
			prune[prune_num-1] = NULL;
		}
		while ((i+1 < active_nr) &&
		       ce_same_name(ce, active_cache[i+1]))
			i++;
	}
1359 1360
	free_pathspec(&revs->prune_data);
	init_pathspec(&revs->prune_data, prune);
1361
	revs->limited = 1;
1362 1363
}

1364
int handle_revision_arg(const char *arg_, struct rev_info *revs, int flags, unsigned revarg_opt)
1365
{
1366
	struct object_context oc;
1367 1368 1369 1370
	char *dotdot;
	struct object *object;
	unsigned char sha1[20];
	int local_flags;
1371
	const char *arg = arg_;
1372
	int cant_be_filename = revarg_opt & REVARG_CANNOT_BE_FILENAME;
1373
	unsigned get_sha1_flags = 0;
1374

1375 1376
	flags = flags & UNINTERESTING ? flags | BOTTOM : flags & ~BOTTOM;

1377 1378 1379 1380 1381 1382
	dotdot = strstr(arg, "..");
	if (dotdot) {
		unsigned char from_sha1[20];
		const char *next = dotdot + 2;
		const char *this = arg;
		int symmetric = *next == '.';
1383
		unsigned int flags_exclude = flags ^ (UNINTERESTING | BOTTOM);
1384
		static const char head_by_default[] = "HEAD";
1385
		unsigned int a_flags;
1386 1387 1388 1389 1390

		*dotdot = 0;
		next += symmetric;

		if (!*next)
1391
			next = head_by_default;
1392
		if (dotdot == arg)
1393 1394 1395 1396 1397 1398 1399 1400 1401 1402 1403 1404
			this = head_by_default;
		if (this == head_by_default && next == head_by_default &&
		    !symmetric) {
			/*
			 * Just ".."?  That is not a range but the
			 * pathspec for the parent directory.
			 */
			if (!cant_be_filename) {
				*dotdot = '.';
				return -1;
			}
		}
1405 1406
		if (!get_sha1_committish(this, from_sha1) &&
		    !get_sha1_committish(next, sha1)) {
1407 1408 1409 1410 1411 1412
			struct commit *a, *b;
			struct commit_list *exclude;

			a = lookup_commit_reference(from_sha1);
			b = lookup_commit_reference(sha1);
			if (!a || !b) {
J
Junio C Hamano 已提交
1413 1414
				if (revs->ignore_missing)
					return 0;
1415 1416 1417 1418 1419 1420 1421 1422 1423 1424 1425 1426 1427
				die(symmetric ?
				    "Invalid symmetric difference expression %s...%s" :
				    "Invalid revision range %s..%s",
				    arg, next);
			}

			if (!cant_be_filename) {
				*dotdot = '.';
				verify_non_filename(revs->prefix, arg);
			}

			if (symmetric) {
				exclude = get_merge_bases(a, b, 1);
1428 1429 1430
				add_rev_cmdline_list(revs, exclude,
						     REV_CMD_MERGE_BASE,
						     flags_exclude);
1431 1432 1433
				add_pending_commit_list(revs, exclude,
							flags_exclude);
				free_commit_list(exclude);
1434
				a_flags = flags | SYMMETRIC_LEFT;
1435
			} else
1436 1437
				a_flags = flags_exclude;
			a->object.flags |= a_flags;
1438
			b->object.flags |= flags;
1439 1440 1441 1442
			add_rev_cmdline(revs, &a->object, this,
					REV_CMD_LEFT, a_flags);
			add_rev_cmdline(revs, &b->object, next,
					REV_CMD_RIGHT, flags);
1443 1444 1445 1446 1447 1448 1449 1450 1451 1452 1453 1454 1455
			add_pending_object(revs, &a->object, this);
			add_pending_object(revs, &b->object, next);
			return 0;
		}
		*dotdot = '.';
	}
	dotdot = strstr(arg, "^@");
	if (dotdot && !dotdot[2]) {
		*dotdot = 0;
		if (add_parents_only(revs, arg, flags))
			return 0;
		*dotdot = '^';
	}
1456 1457 1458
	dotdot = strstr(arg, "^!");
	if (dotdot && !dotdot[2]) {
		*dotdot = 0;
1459
		if (!add_parents_only(revs, arg, flags ^ (UNINTERESTING | BOTTOM)))
1460 1461 1462
			*dotdot = '^';
	}

1463 1464
	local_flags = 0;
	if (*arg == '^') {
1465
		local_flags = UNINTERESTING | BOTTOM;
1466 1467
		arg++;
	}
1468 1469 1470 1471 1472

	if (revarg_opt & REVARG_COMMITTISH)
		get_sha1_flags = GET_SHA1_COMMITTISH;

	if (get_sha1_with_context(arg, get_sha1_flags, sha1, &oc))
J
Junio C Hamano 已提交
1473
		return revs->ignore_missing ? 0 : -1;
1474 1475 1476
	if (!cant_be_filename)
		verify_non_filename(revs->prefix, arg);
	object = get_reference(revs, arg, sha1, flags ^ local_flags);
1477
	add_rev_cmdline(revs, object, arg_, REV_CMD_REV, flags ^ local_flags);
1478
	add_pending_object_with_mode(revs, object, arg, oc.mode);
1479 1480 1481
	return 0;
}

1482 1483 1484 1485 1486
/* Growable array of pathspec strings gathered from the command line and stdin. */
struct cmdline_pathspec {
	int alloc;		/* allocated capacity of path[], as managed by ALLOC_GROW */
	int nr;			/* number of entries in use */
	const char **path;	/* the collected pathspec strings */
};
1487

1488 1489 1490 1491 1492 1493 1494
/*
 * Append every string of the NULL-terminated vector "av" to "prune".
 * The strings themselves are not copied, only the pointers.
 */
static void append_prune_data(struct cmdline_pathspec *prune, const char **av)
{
	for (; *av; av++) {
		ALLOC_GROW(prune->path, prune->nr + 1, prune->alloc);
		prune->path[prune->nr] = *av;
		prune->nr++;
	}
}
1495

1496 1497 1498
static void read_pathspec_from_stdin(struct rev_info *revs, struct strbuf *sb,
				     struct cmdline_pathspec *prune)
{
1499 1500 1501 1502
	while (strbuf_getwholeline(sb, stdin, '\n') != EOF) {
		int len = sb->len;
		if (len && sb->buf[len - 1] == '\n')
			sb->buf[--len] = '\0';
1503 1504
		ALLOC_GROW(prune->path, prune->nr+1, prune->alloc);
		prune->path[prune->nr++] = xstrdup(sb->buf);
1505 1506 1507
	}
}

1508 1509
static void read_revisions_from_stdin(struct rev_info *revs,
				      struct cmdline_pathspec *prune)
1510
{
1511
	struct strbuf sb;
1512
	int seen_dashdash = 0;
1513

1514 1515 1516 1517 1518
	strbuf_init(&sb, 1000);
	while (strbuf_getwholeline(&sb, stdin, '\n') != EOF) {
		int len = sb.len;
		if (len && sb.buf[len - 1] == '\n')
			sb.buf[--len] = '\0';
1519 1520
		if (!len)
			break;
1521 1522 1523 1524 1525
		if (sb.buf[0] == '-') {
			if (len == 2 && sb.buf[1] == '-') {
				seen_dashdash = 1;
				break;
			}
1526
			die("options not supported in --stdin mode");
1527
		}
1528 1529
		if (handle_revision_arg(xstrdup(sb.buf), revs, 0,
					REVARG_CANNOT_BE_FILENAME))
1530
			die("bad revision '%s'", sb.buf);
1531
	}
1532 1533
	if (seen_dashdash)
		read_pathspec_from_stdin(revs, &sb, prune);
1534
	strbuf_release(&sb);
1535 1536
}

1537
static void add_grep(struct rev_info *revs, const char *ptn, enum grep_pat_token what)
1538
{
J
Jeff King 已提交
1539
	append_grep_pattern(&revs->grep_filter, ptn, "command line", 0, what);
1540 1541
}

1542
static void add_header_grep(struct rev_info *revs, enum grep_header_field field, const char *pattern)
1543
{
1544
	append_header_grep_pattern(&revs->grep_filter, field, pattern);
1545 1546 1547 1548
}

static void add_message_grep(struct rev_info *revs, const char *pattern)
{
1549
	add_grep(revs, pattern, GREP_PATTERN_BODY);
1550 1551
}

1552 1553
static int handle_revision_opt(struct rev_info *revs, int argc, const char **argv,
			       int *unkc, const char **unkv)
1554 1555
{
	const char *arg = argv[0];
1556 1557
	const char *optarg;
	int argcount;
1558 1559 1560 1561 1562

	/* pseudo revision arguments */
	if (!strcmp(arg, "--all") || !strcmp(arg, "--branches") ||
	    !strcmp(arg, "--tags") || !strcmp(arg, "--remotes") ||
	    !strcmp(arg, "--reflog") || !strcmp(arg, "--not") ||
1563
	    !strcmp(arg, "--no-walk") || !strcmp(arg, "--do-walk") ||
1564 1565
	    !strcmp(arg, "--bisect") || !prefixcmp(arg, "--glob=") ||
	    !prefixcmp(arg, "--branches=") || !prefixcmp(arg, "--tags=") ||
1566
	    !prefixcmp(arg, "--remotes=") || !prefixcmp(arg, "--no-walk="))
1567 1568
	{
		unkv[(*unkc)++] = arg;
1569
		return 1;
1570 1571
	}

1572 1573
	if ((argcount = parse_long_opt("max-count", argv, &optarg))) {
		revs->max_count = atoi(optarg);
1574
		revs->no_walk = 0;
1575 1576 1577 1578
		return argcount;
	} else if ((argcount = parse_long_opt("skip", argv, &optarg))) {
		revs->skip_count = atoi(optarg);
		return argcount;
1579 1580 1581
	} else if ((*arg == '-') && isdigit(arg[1])) {
	/* accept -<digit>, like traditional "head" */
		revs->max_count = atoi(arg + 1);
1582
		revs->no_walk = 0;
1583 1584 1585 1586
	} else if (!strcmp(arg, "-n")) {
		if (argc <= 1)
			return error("-n requires an argument");
		revs->max_count = atoi(argv[1]);
1587
		revs->no_walk = 0;
1588 1589 1590
		return 2;
	} else if (!prefixcmp(arg, "-n")) {
		revs->max_count = atoi(arg + 2);
1591
		revs->no_walk = 0;
1592 1593 1594 1595 1596 1597 1598 1599 1600 1601 1602 1603 1604 1605 1606 1607 1608 1609
	} else if ((argcount = parse_long_opt("max-age", argv, &optarg))) {
		revs->max_age = atoi(optarg);
		return argcount;
	} else if ((argcount = parse_long_opt("since", argv, &optarg))) {
		revs->max_age = approxidate(optarg);
		return argcount;
	} else if ((argcount = parse_long_opt("after", argv, &optarg))) {
		revs->max_age = approxidate(optarg);
		return argcount;
	} else if ((argcount = parse_long_opt("min-age", argv, &optarg))) {
		revs->min_age = atoi(optarg);
		return argcount;
	} else if ((argcount = parse_long_opt("before", argv, &optarg))) {
		revs->min_age = approxidate(optarg);
		return argcount;
	} else if ((argcount = parse_long_opt("until", argv, &optarg))) {
		revs->min_age = approxidate(optarg);
		return argcount;
1610 1611
	} else if (!strcmp(arg, "--first-parent")) {
		revs->first_parent_only = 1;
J
Junio C Hamano 已提交
1612 1613
	} else if (!strcmp(arg, "--ancestry-path")) {
		revs->ancestry_path = 1;
1614
		revs->simplify_history = 0;
J
Junio C Hamano 已提交
1615
		revs->limited = 1;
1616 1617 1618 1619 1620 1621 1622 1623 1624 1625 1626 1627
	} else if (!strcmp(arg, "-g") || !strcmp(arg, "--walk-reflogs")) {
		init_reflog_walk(&revs->reflog_info);
	} else if (!strcmp(arg, "--default")) {
		if (argc <= 1)
			return error("bad --default argument");
		revs->def = argv[1];
		return 2;
	} else if (!strcmp(arg, "--merge")) {
		revs->show_merge = 1;
	} else if (!strcmp(arg, "--topo-order")) {
		revs->lifo = 1;
		revs->topo_order = 1;
1628 1629
	} else if (!strcmp(arg, "--simplify-merges")) {
		revs->simplify_merges = 1;
1630
		revs->topo_order = 1;
1631 1632 1633
		revs->rewrite_parents = 1;
		revs->simplify_history = 0;
		revs->limited = 1;
1634 1635
	} else if (!strcmp(arg, "--simplify-by-decoration")) {
		revs->simplify_merges = 1;
1636
		revs->topo_order = 1;
1637 1638 1639 1640 1641
		revs->rewrite_parents = 1;
		revs->simplify_history = 0;
		revs->simplify_by_decoration = 1;
		revs->limited = 1;
		revs->prune = 1;
1642
		load_ref_decorations(DECORATE_SHORT_REFS);
1643 1644 1645 1646 1647 1648 1649 1650 1651 1652 1653 1654 1655 1656 1657 1658 1659 1660 1661 1662 1663 1664 1665 1666
	} else if (!strcmp(arg, "--date-order")) {
		revs->lifo = 0;
		revs->topo_order = 1;
	} else if (!prefixcmp(arg, "--early-output")) {
		int count = 100;
		switch (arg[14]) {
		case '=':
			count = atoi(arg+15);
			/* Fallthrough */
		case 0:
			revs->topo_order = 1;
		       revs->early_output = count;
		}
	} else if (!strcmp(arg, "--parents")) {
		revs->rewrite_parents = 1;
		revs->print_parents = 1;
	} else if (!strcmp(arg, "--dense")) {
		revs->dense = 1;
	} else if (!strcmp(arg, "--sparse")) {
		revs->dense = 0;
	} else if (!strcmp(arg, "--show-all")) {
		revs->show_all = 1;
	} else if (!strcmp(arg, "--remove-empty")) {
		revs->remove_empty_trees = 1;
1667
	} else if (!strcmp(arg, "--merges")) {
1668
		revs->min_parents = 2;
1669
	} else if (!strcmp(arg, "--no-merges")) {
1670 1671 1672 1673 1674 1675 1676 1677 1678
		revs->max_parents = 1;
	} else if (!prefixcmp(arg, "--min-parents=")) {
		revs->min_parents = atoi(arg+14);
	} else if (!prefixcmp(arg, "--no-min-parents")) {
		revs->min_parents = 0;
	} else if (!prefixcmp(arg, "--max-parents=")) {
		revs->max_parents = atoi(arg+14);
	} else if (!prefixcmp(arg, "--no-max-parents")) {
		revs->max_parents = -1;
1679 1680 1681 1682
	} else if (!strcmp(arg, "--boundary")) {
		revs->boundary = 1;
	} else if (!strcmp(arg, "--left-right")) {
		revs->left_right = 1;
1683
	} else if (!strcmp(arg, "--left-only")) {
1684
		if (revs->right_only)
M
Michael J Gruber 已提交
1685 1686
			die("--left-only is incompatible with --right-only"
			    " or --cherry");
1687 1688
		revs->left_only = 1;
	} else if (!strcmp(arg, "--right-only")) {
1689 1690
		if (revs->left_only)
			die("--right-only is incompatible with --left-only");
1691
		revs->right_only = 1;
M
Michael J Gruber 已提交
1692 1693 1694 1695 1696
	} else if (!strcmp(arg, "--cherry")) {
		if (revs->left_only)
			die("--cherry is incompatible with --left-only");
		revs->cherry_mark = 1;
		revs->right_only = 1;
1697
		revs->max_parents = 1;
M
Michael J Gruber 已提交
1698
		revs->limited = 1;
T
Thomas Rast 已提交
1699 1700
	} else if (!strcmp(arg, "--count")) {
		revs->count = 1;
1701 1702 1703 1704 1705
	} else if (!strcmp(arg, "--cherry-mark")) {
		if (revs->cherry_pick)
			die("--cherry-mark is incompatible with --cherry-pick");
		revs->cherry_mark = 1;
		revs->limited = 1; /* needs limit_list() */
1706
	} else if (!strcmp(arg, "--cherry-pick")) {
1707 1708
		if (revs->cherry_mark)
			die("--cherry-pick is incompatible with --cherry-mark");
1709 1710 1711 1712 1713 1714 1715 1716 1717 1718 1719
		revs->cherry_pick = 1;
		revs->limited = 1;
	} else if (!strcmp(arg, "--objects")) {
		revs->tag_objects = 1;
		revs->tree_objects = 1;
		revs->blob_objects = 1;
	} else if (!strcmp(arg, "--objects-edge")) {
		revs->tag_objects = 1;
		revs->tree_objects = 1;
		revs->blob_objects = 1;
		revs->edge_hint = 1;
J
Junio C Hamano 已提交
1720 1721 1722 1723 1724
	} else if (!strcmp(arg, "--verify-objects")) {
		revs->tag_objects = 1;
		revs->tree_objects = 1;
		revs->blob_objects = 1;
		revs->verify_objects = 1;
1725 1726
	} else if (!strcmp(arg, "--unpacked")) {
		revs->unpacked = 1;
J
Junio C Hamano 已提交
1727 1728
	} else if (!prefixcmp(arg, "--unpacked=")) {
		die("--unpacked=<packfile> no longer supported.");
1729 1730 1731 1732 1733 1734 1735 1736 1737 1738 1739 1740 1741 1742 1743 1744 1745 1746 1747 1748 1749
	} else if (!strcmp(arg, "-r")) {
		revs->diff = 1;
		DIFF_OPT_SET(&revs->diffopt, RECURSIVE);
	} else if (!strcmp(arg, "-t")) {
		revs->diff = 1;
		DIFF_OPT_SET(&revs->diffopt, RECURSIVE);
		DIFF_OPT_SET(&revs->diffopt, TREE_IN_RECURSIVE);
	} else if (!strcmp(arg, "-m")) {
		revs->ignore_merges = 0;
	} else if (!strcmp(arg, "-c")) {
		revs->diff = 1;
		revs->dense_combined_merges = 0;
		revs->combine_merges = 1;
	} else if (!strcmp(arg, "--cc")) {
		revs->diff = 1;
		revs->dense_combined_merges = 1;
		revs->combine_merges = 1;
	} else if (!strcmp(arg, "-v")) {
		revs->verbose_header = 1;
	} else if (!strcmp(arg, "--pretty")) {
		revs->verbose_header = 1;
1750
		revs->pretty_given = 1;
1751
		get_commit_format(arg+8, revs);
1752
	} else if (!prefixcmp(arg, "--pretty=") || !prefixcmp(arg, "--format=")) {
1753 1754 1755 1756
		/*
		 * Detached form ("--pretty X" as opposed to "--pretty=X")
		 * not allowed, since the argument is optional.
		 */
1757
		revs->verbose_header = 1;
1758
		revs->pretty_given = 1;
1759
		get_commit_format(arg+9, revs);
1760
	} else if (!strcmp(arg, "--show-notes") || !strcmp(arg, "--notes")) {
1761 1762
		revs->show_notes = 1;
		revs->show_notes_given = 1;
1763
		revs->notes_opt.use_default_notes = 1;
J
Junio C Hamano 已提交
1764 1765
	} else if (!strcmp(arg, "--show-signature")) {
		revs->show_signature = 1;
1766 1767
	} else if (!prefixcmp(arg, "--show-notes=") ||
		   !prefixcmp(arg, "--notes=")) {
1768 1769 1770
		struct strbuf buf = STRBUF_INIT;
		revs->show_notes = 1;
		revs->show_notes_given = 1;
1771 1772 1773 1774 1775 1776 1777
		if (!prefixcmp(arg, "--show-notes")) {
			if (revs->notes_opt.use_default_notes < 0)
				revs->notes_opt.use_default_notes = 1;
			strbuf_addstr(&buf, arg+13);
		}
		else
			strbuf_addstr(&buf, arg+8);
1778
		expand_notes_ref(&buf);
1779
		string_list_append(&revs->notes_opt.extra_notes_refs,
1780
				   strbuf_detach(&buf, NULL));
1781 1782 1783
	} else if (!strcmp(arg, "--no-notes")) {
		revs->show_notes = 0;
		revs->show_notes_given = 1;
1784 1785 1786 1787 1788 1789
		revs->notes_opt.use_default_notes = -1;
		/* we have been strdup'ing ourselves, so trick
		 * string_list into free()ing strings */
		revs->notes_opt.extra_notes_refs.strdup_strings = 1;
		string_list_clear(&revs->notes_opt.extra_notes_refs, 0);
		revs->notes_opt.extra_notes_refs.strdup_strings = 0;
1790 1791
	} else if (!strcmp(arg, "--standard-notes")) {
		revs->show_notes_given = 1;
1792
		revs->notes_opt.use_default_notes = 1;
1793
	} else if (!strcmp(arg, "--no-standard-notes")) {
1794
		revs->notes_opt.use_default_notes = 0;
1795 1796 1797
	} else if (!strcmp(arg, "--oneline")) {
		revs->verbose_header = 1;
		get_commit_format("oneline", revs);
1798
		revs->pretty_given = 1;
1799
		revs->abbrev_commit = 1;
1800 1801 1802 1803 1804 1805 1806 1807 1808 1809 1810 1811 1812 1813 1814 1815 1816 1817 1818 1819 1820 1821
	} else if (!strcmp(arg, "--graph")) {
		revs->topo_order = 1;
		revs->rewrite_parents = 1;
		revs->graph = graph_init(revs);
	} else if (!strcmp(arg, "--root")) {
		revs->show_root_diff = 1;
	} else if (!strcmp(arg, "--no-commit-id")) {
		revs->no_commit_id = 1;
	} else if (!strcmp(arg, "--always")) {
		revs->always_show_header = 1;
	} else if (!strcmp(arg, "--no-abbrev")) {
		revs->abbrev = 0;
	} else if (!strcmp(arg, "--abbrev")) {
		revs->abbrev = DEFAULT_ABBREV;
	} else if (!prefixcmp(arg, "--abbrev=")) {
		revs->abbrev = strtoul(arg + 9, NULL, 10);
		if (revs->abbrev < MINIMUM_ABBREV)
			revs->abbrev = MINIMUM_ABBREV;
		else if (revs->abbrev > 40)
			revs->abbrev = 40;
	} else if (!strcmp(arg, "--abbrev-commit")) {
		revs->abbrev_commit = 1;
1822 1823 1824
		revs->abbrev_commit_given = 1;
	} else if (!strcmp(arg, "--no-abbrev-commit")) {
		revs->abbrev_commit = 0;
1825 1826 1827 1828 1829 1830 1831
	} else if (!strcmp(arg, "--full-diff")) {
		revs->diff = 1;
		revs->full_diff = 1;
	} else if (!strcmp(arg, "--full-history")) {
		revs->simplify_history = 0;
	} else if (!strcmp(arg, "--relative-date")) {
		revs->date_mode = DATE_RELATIVE;
J
Jeff King 已提交
1832
		revs->date_mode_explicit = 1;
1833 1834
	} else if ((argcount = parse_long_opt("date", argv, &optarg))) {
		revs->date_mode = parse_date_format(optarg);
J
Jeff King 已提交
1835
		revs->date_mode_explicit = 1;
1836
		return argcount;
1837 1838 1839 1840 1841 1842
	} else if (!strcmp(arg, "--log-size")) {
		revs->show_log_size = 1;
	}
	/*
	 * Grepping the commit log
	 */
1843 1844 1845 1846 1847 1848
	else if ((argcount = parse_long_opt("author", argv, &optarg))) {
		add_header_grep(revs, GREP_HEADER_AUTHOR, optarg);
		return argcount;
	} else if ((argcount = parse_long_opt("committer", argv, &optarg))) {
		add_header_grep(revs, GREP_HEADER_COMMITTER, optarg);
		return argcount;
1849 1850 1851
	} else if ((argcount = parse_long_opt("grep-reflog", argv, &optarg))) {
		add_header_grep(revs, GREP_HEADER_REFLOG, optarg);
		return argcount;
1852 1853 1854
	} else if ((argcount = parse_long_opt("grep", argv, &optarg))) {
		add_message_grep(revs, optarg);
		return argcount;
1855 1856
	} else if (!strcmp(arg, "--grep-debug")) {
		revs->grep_filter.debug = 1;
1857 1858
	} else if (!strcmp(arg, "--basic-regexp")) {
		grep_set_pattern_type_option(GREP_PATTERN_TYPE_BRE, &revs->grep_filter);
1859
	} else if (!strcmp(arg, "--extended-regexp") || !strcmp(arg, "-E")) {
1860
		grep_set_pattern_type_option(GREP_PATTERN_TYPE_ERE, &revs->grep_filter);
1861
	} else if (!strcmp(arg, "--regexp-ignore-case") || !strcmp(arg, "-i")) {
J
Jeff King 已提交
1862
		revs->grep_filter.regflags |= REG_ICASE;
1863
		DIFF_OPT_SET(&revs->diffopt, PICKAXE_IGNORE_CASE);
1864
	} else if (!strcmp(arg, "--fixed-strings") || !strcmp(arg, "-F")) {
1865
		grep_set_pattern_type_option(GREP_PATTERN_TYPE_FIXED, &revs->grep_filter);
1866 1867
	} else if (!strcmp(arg, "--perl-regexp")) {
		grep_set_pattern_type_option(GREP_PATTERN_TYPE_PCRE, &revs->grep_filter);
1868
	} else if (!strcmp(arg, "--all-match")) {
J
Jeff King 已提交
1869
		revs->grep_filter.all_match = 1;
1870 1871 1872
	} else if ((argcount = parse_long_opt("encoding", argv, &optarg))) {
		if (strcmp(optarg, "none"))
			git_log_output_encoding = xstrdup(optarg);
1873 1874
		else
			git_log_output_encoding = "";
1875
		return argcount;
1876 1877 1878 1879 1880
	} else if (!strcmp(arg, "--reverse")) {
		revs->reverse ^= 1;
	} else if (!strcmp(arg, "--children")) {
		revs->children.name = "children";
		revs->limited = 1;
J
Junio C Hamano 已提交
1881 1882
	} else if (!strcmp(arg, "--ignore-missing")) {
		revs->ignore_missing = 1;
1883 1884 1885 1886 1887 1888 1889 1890 1891 1892
	} else {
		int opts = diff_opt_parse(&revs->diffopt, argv, argc);
		if (!opts)
			unkv[(*unkc)++] = arg;
		return opts;
	}

	return 1;
}

1893 1894 1895 1896 1897 1898 1899 1900 1901 1902 1903 1904 1905 1906
/*
 * parse-options glue: let handle_revision_opt() look at the current
 * argument of "ctx" and advance the context past whatever it consumed.
 * An argument that is not consumed is reported as an unknown option
 * and the usage text is shown (usage_with_options() is presumably not
 * expected to return -- confirm against its definition).
 */
void parse_revision_opt(struct rev_info *revs, struct parse_opt_ctx_t *ctx,
			const struct option *options,
			const char * const usagestr[])
{
	int consumed;

	consumed = handle_revision_opt(revs, ctx->argc, ctx->argv,
				       &ctx->cpidx, ctx->out);
	if (consumed < 1) {
		error("unknown option `%s'", ctx->argv[0]);
		usage_with_options(usagestr, options);
	}
	ctx->argc -= consumed;
	ctx->argv += consumed;
}

1907
/* Iterate over the refs under "refs/bisect/bad" of the given submodule. */
static int for_each_bad_bisect_ref(const char *submodule, each_ref_fn fn, void *cb_data)
{
	return for_each_ref_in_submodule(submodule, "refs/bisect/bad", fn, cb_data);
}

1912
/* Iterate over the refs under "refs/bisect/good" of the given submodule. */
static int for_each_good_bisect_ref(const char *submodule, each_ref_fn fn, void *cb_data)
{
	return for_each_ref_in_submodule(submodule, "refs/bisect/good", fn, cb_data);
}

1917 1918 1919 1920 1921 1922 1923 1924
static int handle_revision_pseudo_opt(const char *submodule,
				struct rev_info *revs,
				int argc, const char **argv, int *flags)
{
	const char *arg = argv[0];
	const char *optarg;
	int argcount;

1925 1926 1927 1928 1929 1930 1931 1932 1933 1934
	/*
	 * NOTE!
	 *
	 * Commands like "git shortlog" will not accept the options below
	 * unless parse_revision_opt queues them (as opposed to erroring
	 * out).
	 *
	 * When implementing your new pseudo-option, remember to
	 * register it in the list at the top of handle_revision_opt.
	 */
1935 1936 1937 1938 1939 1940 1941
	if (!strcmp(arg, "--all")) {
		handle_refs(submodule, revs, *flags, for_each_ref_submodule);
		handle_refs(submodule, revs, *flags, head_ref_submodule);
	} else if (!strcmp(arg, "--branches")) {
		handle_refs(submodule, revs, *flags, for_each_branch_ref_submodule);
	} else if (!strcmp(arg, "--bisect")) {
		handle_refs(submodule, revs, *flags, for_each_bad_bisect_ref);
1942
		handle_refs(submodule, revs, *flags ^ (UNINTERESTING | BOTTOM), for_each_good_bisect_ref);
1943 1944 1945 1946 1947 1948 1949 1950 1951 1952 1953 1954 1955 1956 1957 1958 1959 1960 1961 1962 1963 1964 1965 1966 1967
		revs->bisect = 1;
	} else if (!strcmp(arg, "--tags")) {
		handle_refs(submodule, revs, *flags, for_each_tag_ref_submodule);
	} else if (!strcmp(arg, "--remotes")) {
		handle_refs(submodule, revs, *flags, for_each_remote_ref_submodule);
	} else if ((argcount = parse_long_opt("glob", argv, &optarg))) {
		struct all_refs_cb cb;
		init_all_refs_cb(&cb, revs, *flags);
		for_each_glob_ref(handle_one_ref, optarg, &cb);
		return argcount;
	} else if (!prefixcmp(arg, "--branches=")) {
		struct all_refs_cb cb;
		init_all_refs_cb(&cb, revs, *flags);
		for_each_glob_ref_in(handle_one_ref, arg + 11, "refs/heads/", &cb);
	} else if (!prefixcmp(arg, "--tags=")) {
		struct all_refs_cb cb;
		init_all_refs_cb(&cb, revs, *flags);
		for_each_glob_ref_in(handle_one_ref, arg + 7, "refs/tags/", &cb);
	} else if (!prefixcmp(arg, "--remotes=")) {
		struct all_refs_cb cb;
		init_all_refs_cb(&cb, revs, *flags);
		for_each_glob_ref_in(handle_one_ref, arg + 10, "refs/remotes/", &cb);
	} else if (!strcmp(arg, "--reflog")) {
		handle_reflog(revs, *flags);
	} else if (!strcmp(arg, "--not")) {
1968
		*flags ^= UNINTERESTING | BOTTOM;
1969
	} else if (!strcmp(arg, "--no-walk")) {
1970 1971 1972 1973 1974 1975 1976 1977 1978 1979 1980 1981
		revs->no_walk = REVISION_WALK_NO_WALK_SORTED;
	} else if (!prefixcmp(arg, "--no-walk=")) {
		/*
		 * Detached form ("--no-walk X" as opposed to "--no-walk=X")
		 * not allowed, since the argument is optional.
		 */
		if (!strcmp(arg + 10, "sorted"))
			revs->no_walk = REVISION_WALK_NO_WALK_SORTED;
		else if (!strcmp(arg + 10, "unsorted"))
			revs->no_walk = REVISION_WALK_NO_WALK_UNSORTED;
		else
			return error("invalid argument to --no-walk");
1982 1983 1984 1985 1986 1987 1988 1989 1990
	} else if (!strcmp(arg, "--do-walk")) {
		revs->no_walk = 0;
	} else {
		return 0;
	}

	return 1;
}

1991 1992 1993 1994
/*
 * Parse revision information, filling in the "rev_info" structure,
 * and removing the used arguments from the argument list.
 *
1995 1996
 * Returns the number of arguments left that weren't recognized
 * (which are also moved to the head of the argument list)
1997
 */
1998
int setup_revisions(int argc, const char **argv, struct rev_info *revs, struct setup_revision_opt *opt)
1999
{
2000
	int i, flags, left, seen_dashdash, read_from_stdin, got_rev_arg = 0, revarg_opt;
2001
	struct cmdline_pathspec prune_data;
2002 2003
	const char *submodule = NULL;

2004
	memset(&prune_data, 0, sizeof(prune_data));
2005 2006
	if (opt)
		submodule = opt->submodule;
2007 2008

	/* First, search for "--" */
2009
	if (opt && opt->assume_dashdash) {
2010
		seen_dashdash = 1;
2011 2012 2013 2014 2015 2016 2017 2018 2019 2020 2021 2022 2023
	} else {
		seen_dashdash = 0;
		for (i = 1; i < argc; i++) {
			const char *arg = argv[i];
			if (strcmp(arg, "--"))
				continue;
			argv[i] = NULL;
			argc = i;
			if (argv[i + 1])
				append_prune_data(&prune_data, argv + i + 1);
			seen_dashdash = 1;
			break;
		}
2024 2025
	}

2026 2027
	/* Second, deal with arguments and options */
	flags = 0;
2028 2029 2030
	revarg_opt = opt ? opt->revarg_opt : 0;
	if (seen_dashdash)
		revarg_opt |= REVARG_CANNOT_BE_FILENAME;
2031
	read_from_stdin = 0;
2032
	for (left = i = 1; i < argc; i++) {
2033 2034
		const char *arg = argv[i];
		if (*arg == '-') {
2035
			int opts;
2036

2037 2038 2039 2040 2041
			opts = handle_revision_pseudo_opt(submodule,
						revs, argc - i, argv + i,
						&flags);
			if (opts > 0) {
				i += opts - 1;
2042 2043
				continue;
			}
2044

2045 2046 2047 2048 2049 2050 2051
			if (!strcmp(arg, "--stdin")) {
				if (revs->disable_stdin) {
					argv[left++] = arg;
					continue;
				}
				if (read_from_stdin++)
					die("--stdin given twice?");
2052
				read_revisions_from_stdin(revs, &prune_data);
2053 2054
				continue;
			}
2055

2056
			opts = handle_revision_opt(revs, argc - i, argv + i, &left, argv);
2057 2058 2059 2060
			if (opts > 0) {
				i += opts - 1;
				continue;
			}
2061 2062
			if (opts < 0)
				exit(128);
2063 2064 2065
			continue;
		}

2066 2067

		if (handle_revision_arg(arg, revs, flags, revarg_opt)) {
2068 2069
			int j;
			if (seen_dashdash || *arg == '^')
2070 2071
				die("bad revision '%s'", arg);

2072 2073 2074 2075 2076 2077
			/* If we didn't have a "--":
			 * (1) all filenames must exist;
			 * (2) all rev-args must not be interpretable
			 *     as a valid filename.
			 * but the latter we have checked in the main loop.
			 */
2078
			for (j = i; j < argc; j++)
2079
				verify_filename(revs->prefix, argv[j], j == i);
2080

2081
			append_prune_data(&prune_data, argv + i);
2082 2083
			break;
		}
2084 2085
		else
			got_rev_arg = 1;
2086
	}
2087

2088
	if (prune_data.nr) {
2089 2090 2091 2092 2093 2094 2095 2096 2097 2098 2099 2100 2101 2102
		/*
		 * If we need to introduce the magic "a lone ':' means no
		 * pathspec whatsoever", here is the place to do so.
		 *
		 * if (prune_data.nr == 1 && !strcmp(prune_data[0], ":")) {
		 *	prune_data.nr = 0;
		 *	prune_data.alloc = 0;
		 *	free(prune_data.path);
		 *	prune_data.path = NULL;
		 * } else {
		 *	terminate prune_data.alloc with NULL and
		 *	call init_pathspec() to set revs->prune_data here.
		 * }
		 */
2103 2104
		ALLOC_GROW(prune_data.path, prune_data.nr+1, prune_data.alloc);
		prune_data.path[prune_data.nr++] = NULL;
2105 2106
		init_pathspec(&revs->prune_data,
			      get_pathspec(revs->prefix, prune_data.path));
2107
	}
2108

2109
	if (revs->def == NULL)
2110
		revs->def = opt ? opt->def : NULL;
J
Junio C Hamano 已提交
2111 2112
	if (opt && opt->tweak)
		opt->tweak(revs, opt);
2113
	if (revs->show_merge)
2114
		prepare_show_merge(revs);
2115
	if (revs->def && !revs->pending.nr && !got_rev_arg) {
2116
		unsigned char sha1[20];
2117
		struct object *object;
2118
		struct object_context oc;
2119
		if (get_sha1_with_context(revs->def, 0, sha1, &oc))
2120 2121
			die("bad default revision '%s'", revs->def);
		object = get_reference(revs, revs->def, sha1, 0);
2122
		add_pending_object_with_mode(revs, object, revs->def, oc.mode);
2123
	}
2124

2125 2126 2127 2128
	/* Did the user ask for any diff output? Run the diff! */
	if (revs->diffopt.output_format & ~DIFF_FORMAT_NO_OUTPUT)
		revs->diff = 1;

A
Arjen Laarhoven 已提交
2129 2130 2131 2132
	/* Pickaxe, diff-filter and rename following need diffs */
	if (revs->diffopt.pickaxe ||
	    revs->diffopt.filter ||
	    DIFF_OPT_TST(&revs->diffopt, FOLLOW_RENAMES))
2133 2134
		revs->diff = 1;

2135
	if (revs->topo_order)
2136 2137
		revs->limited = 1;

2138 2139
	if (revs->prune_data.nr) {
		diff_tree_setup_paths(revs->prune_data.raw, &revs->pruning);
2140
		/* Can't prune commits with rename following: the paths change.. */
2141
		if (!DIFF_OPT_TST(&revs->diffopt, FOLLOW_RENAMES))
L
Linus Torvalds 已提交
2142
			revs->prune = 1;
2143
		if (!revs->full_diff)
2144
			diff_tree_setup_paths(revs->prune_data.raw, &revs->diffopt);
2145
	}
J
Junio C Hamano 已提交
2146
	if (revs->combine_merges)
2147 2148
		revs->ignore_merges = 0;
	revs->diffopt.abbrev = revs->abbrev;
T
Thomas Rast 已提交
2149
	diff_setup_done(&revs->diffopt);
2150

2151 2152
	grep_commit_pattern_type(GREP_PATTERN_TYPE_UNSPECIFIED,
				 &revs->grep_filter);
J
Jeff King 已提交
2153
	compile_grep_patterns(&revs->grep_filter);
2154

2155 2156
	if (revs->reverse && revs->reflog_info)
		die("cannot combine --reverse with --walk-reflogs");
2157
	if (revs->rewrite_parents && revs->children.name)
2158
		die("cannot combine --parents and --children");
2159

2160 2161 2162 2163 2164 2165 2166 2167
	/*
	 * Limitations on the graph functionality
	 */
	if (revs->reverse && revs->graph)
		die("cannot combine --reverse with --graph");

	if (revs->reflog_info && revs->graph)
		die("cannot combine --walk-reflogs with --graph");
2168 2169
	if (!revs->reflog_info && revs->grep_filter.use_reflog_filter)
		die("cannot use --grep-reflog without --walk-reflogs");
2170

2171 2172
	return left;
}
2173

2174 2175 2176 2177 2178 2179 2180 2181
/*
 * Record child as a child of parent: a new list node holding child is
 * installed as parent's decoration in revs->children, and whatever
 * add_decoration() hands back becomes the rest of the list.
 */
static void add_child(struct rev_info *revs, struct commit *parent, struct commit *child)
{
	struct commit_list *node = xcalloc(1, sizeof(*node));
	struct commit_list *rest;

	node->item = child;
	rest = add_decoration(&revs->children, &parent->object, node);
	node->next = rest;
}

2182
static int remove_duplicate_parents(struct rev_info *revs, struct commit *commit)
2183
{
2184
	struct treesame_state *ts = lookup_decoration(&revs->treesame, &commit->object);
2185 2186 2187 2188 2189
	struct commit_list **pp, *p;
	int surviving_parents;

	/* Examine existing parents while marking ones we have seen... */
	pp = &commit->parents;
2190
	surviving_parents = 0;
2191 2192 2193 2194
	while ((p = *pp) != NULL) {
		struct commit *parent = p->item;
		if (parent->object.flags & TMP_MARK) {
			*pp = p->next;
2195 2196
			if (ts)
				compact_treesame(revs, commit, surviving_parents);
2197 2198 2199
			continue;
		}
		parent->object.flags |= TMP_MARK;
2200
		surviving_parents++;
2201 2202
		pp = &p->next;
	}
2203
	/* clear the temporary mark */
2204 2205 2206
	for (p = commit->parents; p; p = p->next) {
		p->item->object.flags &= ~TMP_MARK;
	}
2207
	/* no update_treesame() - removing duplicates can't affect TREESAME */
2208 2209 2210
	return surviving_parents;
}

2211 2212 2213 2214 2215 2216 2217 2218 2219 2220 2221 2222 2223 2224 2225 2226
/*
 * Per-commit record stored as a decoration in revs->merge_simplification.
 * "simplified" is the commit this one has been simplified to; it is NULL
 * in a freshly created record (locate_simplify_state() zero-allocates it).
 */
struct merge_simplify_state {
	struct commit *simplified;
};

/*
 * Return the merge_simplify_state attached to commit in
 * revs->merge_simplification, attaching a zero-filled one first if the
 * commit has none yet.
 */
static struct merge_simplify_state *locate_simplify_state(struct rev_info *revs, struct commit *commit)
{
	struct merge_simplify_state *state;

	state = lookup_decoration(&revs->merge_simplification, &commit->object);
	if (state)
		return state;

	state = xcalloc(1, sizeof(*state));
	add_decoration(&revs->merge_simplification, &commit->object, state);
	return state;
}

2227 2228 2229 2230 2231 2232 2233 2234 2235 2236 2237 2238 2239 2240 2241 2242 2243 2244 2245 2246 2247 2248 2249 2250 2251 2252 2253 2254 2255 2256 2257 2258 2259 2260 2261 2262
/*
 * Flag with TMP_MARK every parent of commit that reduce_heads() left
 * out of its result.  Nothing is unlinked here; the marks are acted on
 * later.  Dies if the bookkeeping does not add up.
 *
 * Returns the number of parents marked.
 */
static int mark_redundant_parents(struct rev_info *revs, struct commit *commit)
{
	struct commit_list *reduced = reduce_heads(commit->parents);
	struct commit_list *orig, *kept = reduced;
	int matched = 0, marked = 0;

	/* Want these for sanity-checking only */
	int orig_cnt = commit_list_count(commit->parents);
	int cnt = commit_list_count(reduced);

	/*
	 * Walk both lists in step.  This relies on reduce_heads() keeping
	 * the survivors in their original order: a parent that is not the
	 * next survivor must have been dropped.
	 */
	for (orig = commit->parents; orig; orig = orig->next) {
		if (!kept || orig->item != kept->item) {
			orig->item->object.flags |= TMP_MARK;
			marked++;
			continue;
		}
		kept = kept->next;
		matched++;
	}

	if (matched != cnt || cnt + marked != orig_cnt)
		die("mark_redundant_parents %d %d %d %d", orig_cnt, cnt, matched, marked);

	free_commit_list(reduced);

	return marked;
}

2263 2264 2265 2266 2267 2268 2269 2270 2271 2272 2273 2274 2275 2276 2277 2278
/*
 * Flag with TMP_MARK every parent of commit that has no parents of its
 * own and carries the TREESAME flag.
 *
 * Returns the number of parents for which this was done.
 */
static int mark_treesame_root_parents(struct rev_info *revs, struct commit *commit)
{
	struct commit_list *entry;
	int marked = 0;

	for (entry = commit->parents; entry; entry = entry->next) {
		struct commit *parent = entry->item;

		if (parent->parents)
			continue;
		if (!(parent->object.flags & TREESAME))
			continue;
		parent->object.flags |= TMP_MARK;
		marked++;
	}

	return marked;
}

2279 2280 2281 2282 2283 2284 2285 2286 2287 2288 2289 2290 2291 2292 2293 2294 2295 2296 2297 2298 2299 2300 2301 2302 2303 2304 2305 2306 2307 2308 2309 2310 2311 2312 2313 2314 2315 2316 2317 2318 2319 2320 2321 2322 2323 2324 2325 2326 2327 2328 2329 2330 2331 2332 2333 2334 2335 2336 2337 2338 2339 2340 2341 2342 2343 2344 2345
/*
 * Awkward naming - this means one parent we are TREESAME to.
 * cf mark_treesame_root_parents: root parents that are TREESAME (to an
 * empty tree). Better name suggestions?
 *
 * Returns 1 if a TMP_MARK was taken back off a parent, 0 otherwise.
 */
static int leave_one_treesame_to_parent(struct rev_info *revs, struct commit *commit)
{
	struct treesame_state *ts = lookup_decoration(&revs->treesame, &commit->object);
	struct commit *unmarked = NULL, *marked = NULL;
	struct commit_list *p;
	unsigned n;

	/*
	 * Among the parents we are TREESAME to, remember the first one
	 * carrying TMP_MARK, and stop as soon as one without it shows up.
	 */
	for (p = commit->parents, n = 0; p; p = p->next, n++) {
		if (!ts->treesame[n])
			continue;
		if (!(p->item->object.flags & TMP_MARK)) {
			unmarked = p->item;
			break;
		}
		if (!marked)
			marked = p->item;
	}

	/*
	 * If we are TREESAME to a marked-for-deletion parent, but not to any
	 * unmarked parents, unmark the first TREESAME parent. This is the
	 * parent that the default simplify_history==1 scan would have followed,
	 * and it doesn't make sense to omit that path when asking for a
	 * simplified full history. Retaining it improves the chances of
	 * understanding odd missed merges that took an old version of a file.
	 *
	 * Example:
	 *
	 *   I--------*X       A modified the file, but mainline merge X used
	 *    \       /        "-s ours", so took the version from I. X is
	 *     `-*A--'         TREESAME to I and !TREESAME to A.
	 *
	 * Default log from X would produce "I". Without this check,
	 * --full-history --simplify-merges would produce "I-A-X", showing
	 * the merge commit X and that it changed A, but not making clear that
	 * it had just taken the I version. With this check, the topology above
	 * is retained.
	 *
	 * Note that it is possible that the simplification chooses a different
	 * TREESAME parent from the default, in which case this test doesn't
	 * activate, and we _do_ drop the default parent. Example:
	 *
	 *   I------X         A modified the file, but it was reverted in B,
	 *    \    /          meaning mainline merge X is TREESAME to both
	 *    *A-*B           parents.
	 *
	 * Default log would produce "I" by following the first parent;
	 * --full-history --simplify-merges will produce "I-A-B". But this is a
	 * reasonable result - it presents a logical full history leading from
	 * I to X, and X is not an important merge.
	 */
	if (unmarked || !marked)
		return 0;

	marked->object.flags &= ~TMP_MARK;
	return 1;
}

2346 2347 2348 2349 2350 2351 2352 2353 2354 2355 2356 2357 2358 2359 2360 2361 2362 2363 2364 2365 2366 2367 2368 2369 2370 2371 2372 2373
/*
 * Unlink and free every parent entry of commit whose commit carries
 * TMP_MARK, clearing the mark on the way and calling compact_treesame()
 * for each removed slot.  If anything was removed and the commit is not
 * already TREESAME, update_treesame() is called.
 *
 * Returns the number of parents left.
 */
static int remove_marked_parents(struct rev_info *revs, struct commit *commit)
{
	struct commit_list **link = &commit->parents;
	struct commit_list *node;
	int kept = 0, dropped = 0;

	while ((node = *link) != NULL) {
		struct commit *parent = node->item;

		if (!(parent->object.flags & TMP_MARK)) {
			link = &node->next;
			kept++;
			continue;
		}

		parent->object.flags &= ~TMP_MARK;
		*link = node->next;
		free(node);
		dropped++;
		/* "kept" is the index of the slot that just went away */
		compact_treesame(revs, commit, kept);
	}

	/* Removing parents can only increase TREESAMEness */
	if (dropped && !(commit->object.flags & TREESAME))
		update_treesame(revs, commit);

	return kept;
}

2374
static struct commit_list **simplify_one(struct rev_info *revs, struct commit *commit, struct commit_list **tail)
2375 2376
{
	struct commit_list *p;
2377
	struct commit *parent;
2378
	struct merge_simplify_state *st, *pst;
2379 2380
	int cnt;

2381 2382
	st = locate_simplify_state(revs, commit);

2383 2384 2385
	/*
	 * Have we handled this one?
	 */
2386
	if (st->simplified)
2387 2388 2389 2390 2391 2392 2393 2394
		return tail;

	/*
	 * An UNINTERESTING commit simplifies to itself, so does a
	 * root commit.  We do not rewrite parents of such commit
	 * anyway.
	 */
	if ((commit->object.flags & UNINTERESTING) || !commit->parents) {
2395
		st->simplified = commit;
2396 2397 2398 2399
		return tail;
	}

	/*
2400 2401 2402
	 * Do we know what commit all of our parents that matter
	 * should be rewritten to?  Otherwise we are not ready to
	 * rewrite this one yet.
2403 2404
	 */
	for (cnt = 0, p = commit->parents; p; p = p->next) {
2405 2406
		pst = locate_simplify_state(revs, p->item);
		if (!pst->simplified) {
2407 2408 2409
			tail = &commit_list_insert(p->item, tail)->next;
			cnt++;
		}
2410 2411
		if (revs->first_parent_only)
			break;
2412
	}
2413 2414
	if (cnt) {
		tail = &commit_list_insert(commit, tail)->next;
2415
		return tail;
2416
	}
2417 2418

	/*
2419 2420 2421
	 * Rewrite our list of parents. Note that this cannot
	 * affect our TREESAME flags in any way - a commit is
	 * always TREESAME to its simplification.
2422
	 */
2423 2424 2425
	for (p = commit->parents; p; p = p->next) {
		pst = locate_simplify_state(revs, p->item);
		p->item = pst->simplified;
2426 2427
		if (revs->first_parent_only)
			break;
2428
	}
2429

2430
	if (revs->first_parent_only)
2431
		cnt = 1;
2432
	else
2433
		cnt = remove_duplicate_parents(revs, commit);
2434 2435 2436 2437

	/*
	 * It is possible that we are a merge and one side branch
	 * does not have any commit that touches the given paths;
2438 2439
	 * in such a case, the immediate parent from that branch
	 * will be rewritten to be the merge base.
2440 2441 2442 2443 2444
	 *
	 *      o----X		X: the commit we are looking at;
	 *     /    /		o: a commit that touches the paths;
	 * ---o----'
	 *
2445 2446 2447 2448 2449 2450 2451 2452
	 * Further, a merge of an independent branch that doesn't
	 * touch the path will reduce to a treesame root parent:
	 *
	 *  ----o----X		X: the commit we are looking at;
	 *          /		o: a commit that touches the paths;
	 *         r		r: a root commit not touching the paths
	 *
	 * Detect and simplify both cases.
2453 2454
	 */
	if (1 < cnt) {
2455
		int marked = mark_redundant_parents(revs, commit);
2456
		marked += mark_treesame_root_parents(revs, commit);
2457 2458
		if (marked)
			marked -= leave_one_treesame_to_parent(revs, commit);
2459 2460
		if (marked)
			cnt = remove_marked_parents(revs, commit);
2461 2462 2463 2464 2465
	}

	/*
	 * A commit simplifies to itself if it is a root, if it is
	 * UNINTERESTING, if it touches the given paths, or if it is a
2466
	 * merge and its parents don't simplify to one relevant commit
2467 2468 2469
	 * (the first two cases are already handled at the beginning of
	 * this function).
	 *
2470 2471
	 * Otherwise, it simplifies to what its sole relevant parent
	 * simplifies to.
2472 2473 2474 2475
	 */
	if (!cnt ||
	    (commit->object.flags & UNINTERESTING) ||
	    !(commit->object.flags & TREESAME) ||
2476
	    (parent = one_relevant_parent(revs, commit->parents)) == NULL)
2477 2478
		st->simplified = commit;
	else {
2479
		pst = locate_simplify_state(revs, parent);
2480 2481
		st->simplified = pst->simplified;
	}
2482 2483 2484 2485 2486
	return tail;
}

static void simplify_merges(struct rev_info *revs)
{
2487
	struct commit_list *list, *next;
2488
	struct commit_list *yet_to_do, **tail;
2489
	struct commit *commit;
2490

2491 2492
	if (!revs->prune)
		return;
2493

2494 2495
	/* feed the list reversed */
	yet_to_do = NULL;
2496 2497 2498 2499 2500 2501 2502 2503 2504
	for (list = revs->commits; list; list = next) {
		commit = list->item;
		next = list->next;
		/*
		 * Do not free(list) here yet; the original list
		 * is used later in this function.
		 */
		commit_list_insert(commit, &yet_to_do);
	}
2505 2506 2507 2508 2509
	while (yet_to_do) {
		list = yet_to_do;
		yet_to_do = NULL;
		tail = &yet_to_do;
		while (list) {
2510 2511
			commit = list->item;
			next = list->next;
2512 2513
			free(list);
			list = next;
2514
			tail = simplify_one(revs, commit, tail);
2515 2516 2517 2518 2519 2520 2521 2522
		}
	}

	/* clean up the result, removing the simplified ones */
	list = revs->commits;
	revs->commits = NULL;
	tail = &revs->commits;
	while (list) {
2523
		struct merge_simplify_state *st;
2524 2525 2526

		commit = list->item;
		next = list->next;
2527 2528
		free(list);
		list = next;
2529 2530
		st = locate_simplify_state(revs, commit);
		if (st->simplified == commit)
2531 2532 2533 2534
			tail = &commit_list_insert(commit, tail)->next;
	}
}

2535 2536 2537 2538 2539 2540 2541 2542 2543 2544 2545 2546
/*
 * For every commit on revs->commits, register it through add_child()
 * as a child of each of its parents.
 */
static void set_children(struct rev_info *revs)
{
	struct commit_list *entry, *parent;

	for (entry = revs->commits; entry; entry = entry->next)
		for (parent = entry->item->parents; parent; parent = parent->next)
			add_child(revs, parent->item, entry->item);
}

2547 2548 2549 2550 2551
/*
 * Clear the SEEN, ADDED and SHOWN flags by way of clear_object_flags().
 * NOTE(review): presumably this affects every object known to the
 * process, not just those of one rev_info - confirm against
 * clear_object_flags().
 */
void reset_revision_walk(void)
{
	clear_object_flags(SEEN | ADDED | SHOWN);
}

2552
int prepare_revision_walk(struct rev_info *revs)
2553
{
2554
	int nr = revs->pending.nr;
2555
	struct object_array_entry *e, *list;
2556
	struct commit_list **next = &revs->commits;
2557

2558
	e = list = revs->pending.objects;
2559 2560 2561 2562
	revs->pending.nr = 0;
	revs->pending.alloc = 0;
	revs->pending.objects = NULL;
	while (--nr >= 0) {
2563
		struct commit *commit = handle_commit(revs, e->item, e->name);
2564 2565 2566
		if (commit) {
			if (!(commit->object.flags & SEEN)) {
				commit->object.flags |= SEEN;
2567
				next = commit_list_append(commit, next);
2568 2569
			}
		}
2570
		e++;
2571
	}
R
René Scharfe 已提交
2572 2573
	if (!revs->leak_pending)
		free(list);
2574

2575
	/* Signal whether we need per-parent treesame decoration */
2576 2577
	if (revs->simplify_merges ||
	    (revs->limited && limiting_can_increase_treesame(revs)))
2578 2579
		revs->treesame.name = "treesame";

2580 2581
	if (revs->no_walk != REVISION_WALK_NO_WALK_UNSORTED)
		commit_list_sort_by_date(&revs->commits);
L
Linus Torvalds 已提交
2582
	if (revs->no_walk)
2583
		return 0;
2584
	if (revs->limited)
2585 2586
		if (limit_list(revs) < 0)
			return -1;
2587
	if (revs->topo_order)
L
Linus Torvalds 已提交
2588
		sort_in_topological_order(&revs->commits, revs->lifo);
2589 2590
	if (revs->simplify_merges)
		simplify_merges(revs);
2591 2592
	if (revs->children.name)
		set_children(revs);
2593
	return 0;
2594 2595
}

2596 2597 2598
/* Outcome of rewrite_one(), acted on by rewrite_parents(). */
enum rewrite_result {
	rewrite_one_ok,		/* keep the parent entry */
	rewrite_one_noparents,	/* drop the parent entry */
	rewrite_one_error	/* give up */
};

static enum rewrite_result rewrite_one(struct rev_info *revs, struct commit **pp)
2603
{
2604 2605
	struct commit_list *cache = NULL;

2606 2607
	for (;;) {
		struct commit *p = *pp;
2608
		if (!revs->limited)
2609
			if (add_parents_to_list(revs, p, &revs->commits, &cache) < 0)
2610
				return rewrite_one_error;
2611 2612 2613
		if (p->object.flags & UNINTERESTING)
			return rewrite_one_ok;
		if (!(p->object.flags & TREESAME))
2614
			return rewrite_one_ok;
2615
		if (!p->parents)
2616
			return rewrite_one_noparents;
2617 2618 2619
		if ((p = one_relevant_parent(revs, p->parents)) == NULL)
			return rewrite_one_ok;
		*pp = p;
2620 2621 2622
	}
}

2623
static int rewrite_parents(struct rev_info *revs, struct commit *commit)
2624 2625 2626 2627
{
	struct commit_list **pp = &commit->parents;
	while (*pp) {
		struct commit_list *parent = *pp;
2628 2629 2630 2631
		switch (rewrite_one(revs, &parent->item)) {
		case rewrite_one_ok:
			break;
		case rewrite_one_noparents:
2632 2633
			*pp = parent->next;
			continue;
2634 2635
		case rewrite_one_error:
			return -1;
2636 2637 2638
		}
		pp = &parent->next;
	}
2639
	remove_duplicate_parents(revs, commit);
2640
	return 0;
2641 2642
}

2643 2644 2645 2646 2647 2648 2649 2650 2651 2652 2653 2654 2655 2656 2657 2658 2659 2660 2661 2662 2663 2664 2665 2666 2667 2668 2669 2670 2671 2672 2673 2674 2675 2676 2677 2678 2679 2680 2681 2682 2683 2684 2685 2686 2687
/*
 * Find the first occurrence of "what" in buf, parse the rest of that
 * line as an ident, and if map_user() reports a mapping, splice
 * "Name <mail>" built from the mapped values over the original name and
 * mail in buf.
 *
 * Returns 1 if buf was rewritten, 0 otherwise ("what" not found, no
 * end of line, ident not parseable, or no mapping).
 */
static int commit_rewrite_person(struct strbuf *buf, const char *what, struct string_list *mailmap)
{
	struct ident_split ident;
	const char *name, *mail;
	size_t len, namelen, maillen;
	char *line, *eol;

	line = strstr(buf->buf, what);
	if (!line)
		return 0;
	line += strlen(what);

	eol = strchr(line, '\n');
	if (!eol)
		return 0;
	len = eol - line;

	if (split_ident_line(&ident, line, len))
		return 0;

	name = ident.name_begin;
	namelen = ident.name_end - ident.name_begin;
	mail = ident.mail_begin;
	maillen = ident.mail_end - ident.mail_begin;

	if (map_user(mailmap, &mail, &maillen, &name, &namelen)) {
		struct strbuf namemail = STRBUF_INIT;

		strbuf_addf(&namemail, "%.*s <%.*s>",
			    (int)namelen, name, (int)maillen, mail);

		/* the "+ 1" extends the replaced span one byte past mail_end */
		strbuf_splice(buf, ident.name_begin - buf->buf,
			      ident.mail_end - ident.name_begin + 1,
			      namemail.buf, namemail.len);

		strbuf_release(&namemail);
		return 1;
	}

	return 0;
}

2688 2689
static int commit_match(struct commit *commit, struct rev_info *opt)
{
2690
	int retval;
2691 2692
	const char *encoding;
	char *message;
2693
	struct strbuf buf = STRBUF_INIT;
2694

2695
	if (!opt->grep_filter.pattern_list && !opt->grep_filter.header_list)
2696
		return 1;
2697 2698 2699

	/* Prepend "fake" headers as needed */
	if (opt->grep_filter.use_reflog_filter) {
2700 2701 2702 2703
		strbuf_addstr(&buf, "reflog ");
		get_reflog_message(&buf, opt->reflog_info);
		strbuf_addch(&buf, '\n');
	}
2704

2705 2706 2707 2708 2709 2710 2711 2712
	/*
	 * We grep in the user's output encoding, under the assumption that it
	 * is the encoding they are most likely to write their grep pattern
	 * for. In addition, it means we will match the "notes" encoding below,
	 * so we will not end up with a buffer that has two different encodings
	 * in it.
	 */
	encoding = get_log_output_encoding();
2713
	message = logmsg_reencode(commit, NULL, encoding);
2714

2715 2716
	/* Copy the commit to temporary if we are using "fake" headers */
	if (buf.len)
2717
		strbuf_addstr(&buf, message);
2718

2719
	if (opt->grep_filter.header_list && opt->mailmap) {
2720
		if (!buf.len)
2721
			strbuf_addstr(&buf, message);
2722 2723 2724 2725 2726

		commit_rewrite_person(&buf, "\nauthor ", opt->mailmap);
		commit_rewrite_person(&buf, "\ncommitter ", opt->mailmap);
	}

2727 2728 2729
	/* Append "fake" message parts as needed */
	if (opt->show_notes) {
		if (!buf.len)
2730 2731
			strbuf_addstr(&buf, message);
		format_display_notes(commit->object.sha1, &buf, encoding, 1);
2732 2733
	}

2734
	/* Find either in the original commit message, or in the temporary */
2735 2736 2737 2738
	if (buf.len)
		retval = grep_buffer(&opt->grep_filter, buf.buf, buf.len);
	else
		retval = grep_buffer(&opt->grep_filter,
2739
				     message, strlen(message));
2740
	strbuf_release(&buf);
2741
	logmsg_free(message, commit);
2742
	return retval;
2743 2744
}

2745 2746
static inline int want_ancestry(struct rev_info *revs)
{
2747
	return (revs->rewrite_parents || revs->children.name);
2748 2749
}

2750
enum commit_action get_commit_action(struct rev_info *revs, struct commit *commit)
L
Linus Torvalds 已提交
2751 2752 2753
{
	if (commit->object.flags & SHOWN)
		return commit_ignore;
2754
	if (revs->unpacked && has_sha1_pack(commit->object.sha1))
L
Linus Torvalds 已提交
2755
		return commit_ignore;
2756 2757
	if (revs->show_all)
		return commit_show;
L
Linus Torvalds 已提交
2758 2759 2760 2761
	if (commit->object.flags & UNINTERESTING)
		return commit_ignore;
	if (revs->min_age != -1 && (commit->date > revs->min_age))
		return commit_ignore;
2762
	if (revs->min_parents || (revs->max_parents >= 0)) {
2763
		int n = commit_list_count(commit->parents);
2764 2765 2766 2767
		if ((n < revs->min_parents) ||
		    ((revs->max_parents >= 0) && (n > revs->max_parents)))
			return commit_ignore;
	}
L
Linus Torvalds 已提交
2768 2769
	if (!commit_match(commit, revs))
		return commit_ignore;
L
Linus Torvalds 已提交
2770
	if (revs->prune && revs->dense) {
L
Linus Torvalds 已提交
2771
		/* Commit without changes? */
2772
		if (commit->object.flags & TREESAME) {
2773 2774
			int n;
			struct commit_list *p;
L
Linus Torvalds 已提交
2775
			/* drop merges unless we want parenthood */
2776
			if (!want_ancestry(revs))
L
Linus Torvalds 已提交
2777
				return commit_ignore;
2778 2779 2780 2781 2782 2783 2784 2785 2786 2787 2788 2789
			/*
			 * If we want ancestry, then need to keep any merges
			 * between relevant commits to tie together topology.
			 * For consistency with TREESAME and simplification
			 * use "relevant" here rather than just INTERESTING,
			 * to treat bottom commit(s) as part of the topology.
			 */
			for (n = 0, p = commit->parents; p; p = p->next)
				if (relevant_commit(p->item))
					if (++n >= 2)
						return commit_show;
			return commit_ignore;
L
Linus Torvalds 已提交
2790 2791 2792 2793 2794
		}
	}
	return commit_show;
}

2795 2796 2797 2798 2799 2800 2801 2802 2803 2804 2805 2806 2807
/*
 * Classify commit with get_commit_action() and, for a commit that is
 * going to be shown while pruning densely with ancestry wanted (and
 * show_all off), rewrite its parents.
 *
 * Returns the action, or commit_error if the parent rewrite fails.
 */
enum commit_action simplify_commit(struct rev_info *revs, struct commit *commit)
{
	enum commit_action action = get_commit_action(revs, commit);

	if (action != commit_show)
		return action;
	if (revs->show_all)
		return action;
	if (!revs->prune || !revs->dense || !want_ancestry(revs))
		return action;

	if (rewrite_parents(revs, commit) < 0)
		return commit_error;
	return action;
}

J
Junio C Hamano 已提交
2808
static struct commit *get_revision_1(struct rev_info *revs)
2809
{
J
Junio C Hamano 已提交
2810
	if (!revs->commits)
2811 2812
		return NULL;

2813
	do {
L
Linus Torvalds 已提交
2814 2815
		struct commit_list *entry = revs->commits;
		struct commit *commit = entry->item;
2816

L
Linus Torvalds 已提交
2817 2818
		revs->commits = entry->next;
		free(entry);
2819

2820
		if (revs->reflog_info) {
2821
			fake_reflog_parent(revs->reflog_info, commit);
2822 2823
			commit->object.flags &= ~(ADDED | SEEN | SHOWN);
		}
2824

2825 2826
		/*
		 * If we haven't done the list limiting, we need to look at
2827 2828
		 * the parents here. We also need to do the date-based limiting
		 * that we'd otherwise have done in limit_list().
2829
		 */
2830
		if (!revs->limited) {
2831
			if (revs->max_age != -1 &&
2832 2833
			    (commit->date < revs->max_age))
				continue;
2834
			if (add_parents_to_list(revs, commit, &revs->commits, NULL) < 0)
2835 2836
				die("Failed to traverse parents of commit %s",
				    sha1_to_hex(commit->object.sha1));
2837
		}
2838

L
Linus Torvalds 已提交
2839 2840
		switch (simplify_commit(revs, commit)) {
		case commit_ignore:
2841
			continue;
L
Linus Torvalds 已提交
2842
		case commit_error:
2843 2844
			die("Failed to simplify parents of commit %s",
			    sha1_to_hex(commit->object.sha1));
L
Linus Torvalds 已提交
2845 2846
		default:
			return commit;
J
Junio C Hamano 已提交
2847
		}
2848 2849 2850
	} while (revs->commits);
	return NULL;
}
J
Junio C Hamano 已提交
2851

2852 2853 2854 2855 2856 2857 2858 2859 2860 2861 2862 2863 2864 2865 2866
static void gc_boundary(struct object_array *array)
{
	unsigned nr = array->nr;
	unsigned alloc = array->alloc;
	struct object_array_entry *objects = array->objects;

	if (alloc <= nr) {
		unsigned i, j;
		for (i = j = 0; i < nr; i++) {
			if (objects[i].item->flags & SHOWN)
				continue;
			if (i != j)
				objects[j] = objects[i];
			j++;
		}
2867
		for (i = j; i < nr; i++)
2868 2869 2870 2871 2872
			objects[i].item = NULL;
		array->nr = j;
	}
}

2873 2874 2875 2876 2877 2878 2879 2880 2881 2882 2883 2884 2885 2886 2887 2888 2889 2890 2891 2892 2893 2894 2895 2896 2897 2898 2899 2900 2901 2902 2903 2904 2905 2906 2907 2908 2909 2910 2911 2912 2913
/*
 * Replace revs->commits with the list of boundary commits collected
 * in revs->boundary_commits.
 *
 * A candidate is turned into a boundary commit when it has the
 * CHILD_SHOWN flag and has neither SHOWN nor BOUNDARY set; each
 * commit that is picked gets the BOUNDARY flag before it is inserted
 * into the list.
 */
static void create_boundary_commit_list(struct rev_info *revs)
{
	struct object_array *candidates = &revs->boundary_commits;
	struct object_array_entry *entries = candidates->objects;
	unsigned idx;

	/*
	 * A non-NULL revs->commits here means get_revision_1() stopped
	 * on an error.  The leftover list is discarded and the boundary
	 * commits are produced regardless, which is the long-standing
	 * behaviour of this code.
	 */
	if (revs->commits) {
		free_commit_list(revs->commits);
		revs->commits = NULL;
	}

	/* Move the genuine boundary commits over to revs->commits. */
	for (idx = 0; idx < candidates->nr; idx++) {
		struct commit *candidate = (struct commit *)(entries[idx].item);

		if (!candidate)
			continue;	/* slot without an object */
		if (!(candidate->object.flags & CHILD_SHOWN))
			continue;	/* not marked as parent of a shown commit */
		if (candidate->object.flags & (SHOWN | BOUNDARY))
			continue;	/* already output, or already queued */

		candidate->object.flags |= BOUNDARY;
		commit_list_insert(candidate, &revs->commits);
	}

	/*
	 * Sort the boundary commits topologically.  The sort is done
	 * unconditionally (it does not depend on revs->topo_order), with
	 * revs->lifo passed as the second argument.
	 */
	sort_in_topological_order(&revs->commits, revs->lifo);
}

2914
static struct commit *get_revision_internal(struct rev_info *revs)
J
Junio C Hamano 已提交
2915 2916
{
	struct commit *c = NULL;
2917 2918 2919
	struct commit_list *l;

	if (revs->boundary == 2) {
2920 2921 2922 2923 2924 2925 2926 2927 2928
		/*
		 * All of the normal commits have already been returned,
		 * and we are now returning boundary commits.
		 * create_boundary_commit_list() has populated
		 * revs->commits with the remaining commits to return.
		 */
		c = pop_commit(&revs->commits);
		if (c)
			c->object.flags |= SHOWN;
2929 2930 2931
		return c;
	}

2932
	/*
2933 2934 2935 2936 2937 2938 2939 2940
	 * If our max_count counter has reached zero, then we are done. We
	 * don't simply return NULL because we still might need to show
	 * boundary commits. But we want to avoid calling get_revision_1, which
	 * might do a considerable amount of work finding the next commit only
	 * for us to throw it away.
	 *
	 * If it is non-zero, then either we don't have a max_count at all
	 * (-1), or it is still counting, in which case we decrement.
2941
	 */
2942 2943 2944 2945 2946 2947 2948 2949 2950
	if (revs->max_count) {
		c = get_revision_1(revs);
		if (c) {
			while (0 < revs->skip_count) {
				revs->skip_count--;
				c = get_revision_1(revs);
				if (!c)
					break;
			}
2951
		}
2952

2953 2954
		if (revs->max_count > 0)
			revs->max_count--;
J
Junio C Hamano 已提交
2955
	}
2956

2957 2958 2959 2960
	if (c)
		c->object.flags |= SHOWN;

	if (!revs->boundary) {
J
Junio C Hamano 已提交
2961
		return c;
2962
	}
2963 2964 2965 2966 2967 2968 2969 2970

	if (!c) {
		/*
		 * get_revision_1() runs out the commits, and
		 * we are done computing the boundaries.
		 * switch to boundary commits output mode.
		 */
		revs->boundary = 2;
2971 2972 2973 2974 2975 2976 2977

		/*
		 * Update revs->commits to contain the list of
		 * boundary commits.
		 */
		create_boundary_commit_list(revs);

2978
		return get_revision_internal(revs);
2979 2980 2981 2982 2983 2984 2985 2986 2987 2988 2989 2990
	}

	/*
	 * boundary commits are the commits that are parents of the
	 * ones we got from get_revision_1() but they themselves are
	 * not returned from get_revision_1().  Before returning
	 * 'c', we need to mark its parents that they could be boundaries.
	 */

	for (l = c->parents; l; l = l->next) {
		struct object *p;
		p = &(l->item->object);
2991
		if (p->flags & (CHILD_SHOWN | SHOWN))
2992 2993 2994 2995 2996 2997 2998
			continue;
		p->flags |= CHILD_SHOWN;
		gc_boundary(&revs->boundary_commits);
		add_object_array(p, NULL, &revs->boundary_commits);
	}

	return c;
J
Junio C Hamano 已提交
2999
}
3000 3001 3002

/*
 * Return the next commit of the walk described by "revs", or NULL
 * once the walk is finished.
 *
 * When revs->reverse is set, the first call drains the whole walk
 * into a list, stores that list in revs->commits, clears
 * revs->reverse and sets revs->reverse_output_stage; from then on
 * commits are simply popped off revs->commits.
 *
 * Outside of the reverse output stage, a non-NULL result is also
 * passed to graph_update() when revs->graph is set.
 */
struct commit *get_revision(struct rev_info *revs)
{
	struct commit *next;

	if (revs->reverse) {
		struct commit_list *collected = NULL;

		/*
		 * NOTE(review): presumably commit_list_insert() adds at
		 * the head, which is what reverses the order -- confirm.
		 */
		for (next = get_revision_internal(revs);
		     next;
		     next = get_revision_internal(revs))
			commit_list_insert(next, &collected);

		revs->commits = collected;
		revs->reverse = 0;
		revs->reverse_output_stage = 1;
	}

	if (revs->reverse_output_stage)
		return pop_commit(&revs->commits);

	next = get_revision_internal(revs);
	if (!next || !revs->graph)
		return next;

	graph_update(revs->graph, next);
	return next;
}
3024 3025 3026 3027 3028 3029 3030

char *get_revision_mark(const struct rev_info *revs, const struct commit *commit)
{
	if (commit->object.flags & BOUNDARY)
		return "-";
	else if (commit->object.flags & UNINTERESTING)
		return "^";
3031 3032
	else if (commit->object.flags & PATCHSAME)
		return "=";
3033 3034 3035 3036 3037 3038 3039
	else if (!revs || revs->left_right) {
		if (commit->object.flags & SYMMETRIC_LEFT)
			return "<";
		else
			return ">";
	} else if (revs->graph)
		return "*";
3040 3041
	else if (revs->cherry_mark)
		return "+";
3042 3043
	return "";
}
3044 3045 3046 3047 3048 3049 3050 3051 3052

/*
 * Write the marker that get_revision_mark() yields for "commit" to
 * stdout, followed by a single space.  Nothing at all is written when
 * the marker is the empty string.
 */
void put_revision_mark(const struct rev_info *revs, const struct commit *commit)
{
	const char *mark = get_revision_mark(revs, commit);

	if (mark[0] != '\0') {
		fputs(mark, stdout);
		putchar(' ');
	}
}