diff.c 26.2 KB
Newer Older
1 2 3 4 5
/*
 * Copyright (C) 2005 Junio C Hamano
 */
#include <sys/types.h>
#include <sys/wait.h>
6
#include <signal.h>
7 8
#include "cache.h"
#include "diff.h"
9
#include "diffcore.h"
10

J
Junio C Hamano 已提交
11
static const char *diff_opts = "-pu";
12
static unsigned char null_sha1[20] = { 0, };
13 14

static int reverse_diff;
15
static int use_size_cache;
16

17
static const char *external_diff(void)
18
{
J
Junio C Hamano 已提交
19
	static const char *external_diff_cmd = NULL;
20 21 22 23 24
	static int done_preparing = 0;

	if (done_preparing)
		return external_diff_cmd;

25 26 27 28 29 30 31 32
	/*
	 * Default values above are meant to match the
	 * Linux kernel development style.  Examples of
	 * alternative styles you can specify via environment
	 * variables are:
	 *
	 * GIT_DIFF_OPTS="-c";
	 */
J
Junio C Hamano 已提交
33 34
	if (gitenv("GIT_EXTERNAL_DIFF"))
		external_diff_cmd = gitenv("GIT_EXTERNAL_DIFF");
35 36

	/* In case external diff fails... */
J
Junio C Hamano 已提交
37
	diff_opts = gitenv("GIT_DIFF_OPTS") ? : diff_opts;
38 39 40

	done_preparing = 1;
	return external_diff_cmd;
41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59
}

/* Help to copy the thing properly quoted for the shell safety.
 * any single quote is replaced with '\'', and the caller is
 * expected to enclose the result within a single quote pair.
 *
 * E.g.
 *  original     sq_expand     result
 *  name     ==> name      ==> 'name'
 *  a b      ==> a b       ==> 'a b'
 *  a'b      ==> a'\''b    ==> 'a'\''b'
 */
static char *sq_expand(const char *src)
{
	static char *buf = NULL;
	int cnt, c;
	const char *cp;
	char *bp;

J
Junio C Hamano 已提交
60
	/* count bytes needed to store the quoted string. */
61 62 63 64
	for (cnt = 1, cp = src; *cp; cnt++, cp++)
		if (*cp == '\'')
			cnt += 3;

65
	buf = xmalloc(cnt);
66 67 68 69 70 71 72 73 74 75 76 77 78
	bp = buf;
	while ((c = *src++)) {
		if (c != '\'')
			*bp++ = c;
		else {
			bp = strcpy(bp, "'\\''");
			bp += 4;
		}
	}
	*bp = 0;
	return buf;
}

79
static struct diff_tempfile {
80
	const char *name; /* filename external diff should read from */
81 82 83 84 85
	char hex[41];
	char mode[10];
	char tmp_path[50];
} diff_temp[2];

J
Junio C Hamano 已提交
86 87
static void builtin_diff(const char *name_a,
			 const char *name_b,
J
Junio C Hamano 已提交
88
			 struct diff_tempfile *temp,
89
			 const char *xfrm_msg)
90
{
91
	int i, next_at, cmd_size;
92
	const char *diff_cmd = "diff -L'%s%s' -L'%s%s'";
93
	const char *diff_arg  = "'%s' '%s'||:"; /* "||:" is to return 0 */
94 95 96
	const char *input_name_sq[2];
	const char *path0[2];
	const char *path1[2];
J
Junio C Hamano 已提交
97
	const char *name_sq[2];
98
	char *cmd;
J
Junio C Hamano 已提交
99 100 101 102

	name_sq[0] = sq_expand(name_a);
	name_sq[1] = sq_expand(name_b);

103 104
	/* diff_cmd and diff_arg have 6 %s in total which makes
	 * the sum of these strings 12 bytes larger than required.
105
	 * we use 2 spaces around diff-opts, and we need to count
106
	 * terminating NUL, so we subtract 9 here.
107
	 */
108
	cmd_size = (strlen(diff_cmd) + strlen(diff_opts) +
109
			strlen(diff_arg) - 9);
110 111 112 113 114 115
	for (i = 0; i < 2; i++) {
		input_name_sq[i] = sq_expand(temp[i].name);
		if (!strcmp(temp[i].name, "/dev/null")) {
			path0[i] = "/dev/null";
			path1[i] = "";
		} else {
116
			path0[i] = i ? "b/" : "a/";
J
Junio C Hamano 已提交
117
			path1[i] = name_sq[i];
118 119
		}
		cmd_size += (strlen(path0[i]) + strlen(path1[i]) +
120
			     strlen(input_name_sq[i]));
121
	}
122

123 124 125
	cmd = xmalloc(cmd_size);

	next_at = 0;
126
	next_at += snprintf(cmd+next_at, cmd_size-next_at,
127
			    diff_cmd,
128
			    path0[0], path1[0], path0[1], path1[1]);
129 130 131
	next_at += snprintf(cmd+next_at, cmd_size-next_at,
			    " %s ", diff_opts);
	next_at += snprintf(cmd+next_at, cmd_size-next_at,
132 133
			    diff_arg, input_name_sq[0], input_name_sq[1]);

J
Junio C Hamano 已提交
134
	printf("diff --git a/%s b/%s\n", name_a, name_b);
135
	if (!path1[0][0]) {
136
		printf("new file mode %s\n", temp[1].mode);
137 138 139 140
		if (xfrm_msg && xfrm_msg[0])
			puts(xfrm_msg);
	}
	else if (!path1[1][0]) {
141
		printf("deleted file mode %s\n", temp[0].mode);
142 143 144
		if (xfrm_msg && xfrm_msg[0])
			puts(xfrm_msg);
	}
145
	else {
146 147 148 149
		if (strcmp(temp[0].mode, temp[1].mode)) {
			printf("old mode %s\n", temp[0].mode);
			printf("new mode %s\n", temp[1].mode);
		}
150
		if (xfrm_msg && xfrm_msg[0])
151
			puts(xfrm_msg);
152

153 154 155 156
		if (strncmp(temp[0].mode, temp[1].mode, 3))
			/* we do not run diff between different kind
			 * of objects.
			 */
157 158
			exit(0);
	}
159
	fflush(NULL);
160
	execlp("/bin/sh","sh", "-c", cmd, NULL);
161 162
}

163 164 165 166 167 168
struct diff_filespec *alloc_filespec(const char *path)
{
	int namelen = strlen(path);
	struct diff_filespec *spec = xmalloc(sizeof(*spec) + namelen + 1);
	spec->path = (char *)(spec + 1);
	strcpy(spec->path, path);
169
	spec->should_free = spec->should_munmap = 0;
170 171
	spec->xfrm_flags = 0;
	spec->size = 0;
L
Linus Torvalds 已提交
172
	spec->data = NULL;
173 174
	spec->mode = 0;
	memset(spec->sha1, 0, 20);
175 176 177 178 179 180
	return spec;
}

void fill_filespec(struct diff_filespec *spec, const unsigned char *sha1,
		   unsigned short mode)
{
181 182
	if (mode) {
		spec->mode = DIFF_FILE_CANON_MODE(mode);
183 184 185
		memcpy(spec->sha1, sha1, 20);
		spec->sha1_valid = !!memcmp(sha1, null_sha1, 20);
	}
186 187
}

J
Junio C Hamano 已提交
188 189 190 191 192 193 194 195 196 197
/*
 * Given a name and sha1 pair, if the dircache tells us the file in
 * the work tree has that object contents, return true, so that
 * prepare_temp_file() does not have to inflate and extract.
 */
static int work_tree_matches(const char *name, const unsigned char *sha1)
{
	struct cache_entry *ce;
	struct stat st;
	int pos, len;
198

J
Junio C Hamano 已提交
199 200 201 202
	/* We do not read the cache ourselves here, because the
	 * benchmark with my previous version that always reads cache
	 * shows that it makes things worse for diff-tree comparing
	 * two linux-2.6 kernel trees in an already checked out work
J
Junio C Hamano 已提交
203
	 * tree.  This is because most diff-tree comparisons deal with
J
Junio C Hamano 已提交
204 205 206 207 208 209
	 * only a small number of files, while reading the cache is
	 * expensive for a large project, and its cost outweighs the
	 * savings we get by not inflating the object to a temporary
	 * file.  Practically, this code only helps when we are used
	 * by diff-cache --cached, which does read the cache before
	 * calling us.
J
Junio C Hamano 已提交
210
	 */
J
Junio C Hamano 已提交
211 212 213 214 215 216 217 218
	if (!active_cache)
		return 0;

	len = strlen(name);
	pos = cache_name_pos(name, len);
	if (pos < 0)
		return 0;
	ce = active_cache[pos];
219
	if ((lstat(name, &st) < 0) ||
220
	    !S_ISREG(st.st_mode) || /* careful! */
221
	    ce_match_stat(ce, &st) ||
J
Junio C Hamano 已提交
222 223
	    memcmp(sha1, ce->sha1, 20))
		return 0;
224 225 226 227 228
	/* we return 1 only when we can stat, it is a regular file,
	 * stat information matches, and sha1 recorded in the cache
	 * matches.  I.e. we know the file in the work tree really is
	 * the same as the <name, sha1> pair.
	 */
J
Junio C Hamano 已提交
229 230 231
	return 1;
}

232 233 234 235 236 237 238
static struct sha1_size_cache {
	unsigned char sha1[20];
	unsigned long size;
} **sha1_size_cache;
static int sha1_size_cache_nr, sha1_size_cache_alloc;

static struct sha1_size_cache *locate_size_cache(unsigned char *sha1,
239
						 int find_only,
240 241 242 243 244 245 246 247
						 unsigned long size)
{
	int first, last;
	struct sha1_size_cache *e;

	first = 0;
	last = sha1_size_cache_nr;
	while (last > first) {
248
		int cmp, next = (last + first) >> 1;
249
		e = sha1_size_cache[next];
250
		cmp = memcmp(e->sha1, sha1, 20);
251 252 253 254 255 256 257 258 259
		if (!cmp)
			return e;
		if (cmp < 0) {
			last = next;
			continue;
		}
		first = next+1;
	}
	/* not found */
260
	if (find_only)
261 262 263 264 265 266 267 268 269 270 271 272 273 274 275 276 277 278 279 280
		return NULL;
	/* insert to make it at "first" */
	if (sha1_size_cache_alloc <= sha1_size_cache_nr) {
		sha1_size_cache_alloc = alloc_nr(sha1_size_cache_alloc);
		sha1_size_cache = xrealloc(sha1_size_cache,
					   sha1_size_cache_alloc *
					   sizeof(*sha1_size_cache));
	}
	sha1_size_cache_nr++;
	if (first < sha1_size_cache_nr)
		memmove(sha1_size_cache + first + 1, sha1_size_cache + first,
			(sha1_size_cache_nr - first - 1) *
			sizeof(*sha1_size_cache));
	e = xmalloc(sizeof(struct sha1_size_cache));
	sha1_size_cache[first] = e;
	memcpy(e->sha1, sha1, 20);
	e->size = size;
	return e;
}

281 282 283 284 285
/*
 * While doing rename detection and pickaxe operation, we may need to
 * grab the data for the blob (or file) for our own in-core comparison.
 * diff_filespec has data and size fields for this purpose.
 */
286
int diff_populate_filespec(struct diff_filespec *s, int size_only)
287 288
{
	int err = 0;
289
	if (!DIFF_FILE_VALID(s))
290 291 292 293
		die("internal error: asking to populate invalid file.");
	if (S_ISDIR(s->mode))
		return -1;

294 295 296
	if (!use_size_cache)
		size_only = 0;

297 298 299 300 301 302 303 304 305 306 307 308 309 310 311 312 313 314 315
	if (s->data)
		return err;
	if (!s->sha1_valid ||
	    work_tree_matches(s->path, s->sha1)) {
		struct stat st;
		int fd;
		if (lstat(s->path, &st) < 0) {
			if (errno == ENOENT) {
			err_empty:
				err = -1;
			empty:
				s->data = "";
				s->size = 0;
				return err;
			}
		}
		s->size = st.st_size;
		if (!s->size)
			goto empty;
316 317
		if (size_only)
			return 0;
318 319 320 321 322 323 324 325 326 327 328 329 330 331 332 333 334 335 336 337
		if (S_ISLNK(st.st_mode)) {
			int ret;
			s->data = xmalloc(s->size);
			s->should_free = 1;
			ret = readlink(s->path, s->data, s->size);
			if (ret < 0) {
				free(s->data);
				goto err_empty;
			}
			return 0;
		}
		fd = open(s->path, O_RDONLY);
		if (fd < 0)
			goto err_empty;
		s->data = mmap(NULL, s->size, PROT_READ, MAP_PRIVATE, fd, 0);
		s->should_munmap = 1;
		close(fd);
	}
	else {
		char type[20];
338 339 340
		struct sha1_size_cache *e;

		if (size_only) {
341
			e = locate_size_cache(s->sha1, 1, 0);
342 343 344 345
			if (e) {
				s->size = e->size;
				return 0;
			}
346
			if (!sha1_file_size(s->sha1, &s->size))
347
				locate_size_cache(s->sha1, 0, s->size);
348 349 350 351
		}
		else {
			s->data = read_sha1_file(s->sha1, type, &s->size);
			s->should_free = 1;
352
		}
353 354 355 356 357 358 359 360 361 362 363
	}
	return 0;
}

void diff_free_filespec_data(struct diff_filespec *s)
{
	if (s->should_free)
		free(s->data);
	else if (s->should_munmap)
		munmap(s->data, s->size);
	s->should_free = s->should_munmap = 0;
L
Linus Torvalds 已提交
364
	s->data = NULL;
365 366
}

367 368 369 370 371 372 373 374 375 376 377 378 379 380 381 382 383 384 385 386 387
static void prep_temp_blob(struct diff_tempfile *temp,
			   void *blob,
			   unsigned long size,
			   unsigned char *sha1,
			   int mode)
{
	int fd;

	strcpy(temp->tmp_path, ".diff_XXXXXX");
	fd = mkstemp(temp->tmp_path);
	if (fd < 0)
		die("unable to create temp-file");
	if (write(fd, blob, size) != size)
		die("unable to write temp-file");
	close(fd);
	temp->name = temp->tmp_path;
	strcpy(temp->hex, sha1_to_hex(sha1));
	temp->hex[40] = 0;
	sprintf(temp->mode, "%06o", mode);
}

388 389
static void prepare_temp_file(const char *name,
			      struct diff_tempfile *temp,
390
			      struct diff_filespec *one)
391
{
392
	if (!DIFF_FILE_VALID(one)) {
393
	not_a_valid_file:
394 395 396
		/* A '-' entry produces this for file-2, and
		 * a '+' entry produces this for file-1.
		 */
397 398 399
		temp->name = "/dev/null";
		strcpy(temp->hex, ".");
		strcpy(temp->mode, ".");
400 401
		return;
	}
402

403
	if (!one->sha1_valid ||
404
	    work_tree_matches(name, one->sha1)) {
405
		struct stat st;
406
		if (lstat(name, &st) < 0) {
407 408
			if (errno == ENOENT)
				goto not_a_valid_file;
409
			die("stat(%s): %s", name, strerror(errno));
410
		}
411 412 413 414 415 416 417 418 419 420
		if (S_ISLNK(st.st_mode)) {
			int ret;
			char *buf, buf_[1024];
			buf = ((sizeof(buf_) < st.st_size) ?
			       xmalloc(st.st_size) : buf_);
			ret = readlink(name, buf, st.st_size);
			if (ret < 0)
				die("readlink(%s)", name);
			prep_temp_blob(temp, buf, st.st_size,
				       (one->sha1_valid ?
421
					one->sha1 : null_sha1),
422 423 424 425
				       (one->sha1_valid ?
					one->mode : S_IFLNK));
		}
		else {
426 427
			/* we can borrow from the file in the work tree */
			temp->name = name;
428 429 430
			if (!one->sha1_valid)
				strcpy(temp->hex, sha1_to_hex(null_sha1));
			else
431
				strcpy(temp->hex, sha1_to_hex(one->sha1));
J
Junio C Hamano 已提交
432 433 434 435 436 437 438
			/* Even though we may sometimes borrow the
			 * contents from the work tree, we always want
			 * one->mode.  mode is trustworthy even when
			 * !(one->sha1_valid), as long as
			 * DIFF_FILE_VALID(one).
			 */
			sprintf(temp->mode, "%06o", one->mode);
439 440
		}
		return;
441 442
	}
	else {
443
		if (diff_populate_filespec(one, 0))
444 445 446
			die("cannot read data blob for %s", one->path);
		prep_temp_blob(temp, one->data, one->size,
			       one->sha1, one->mode);
447 448 449 450 451 452 453 454 455 456 457 458 459 460
	}
}

static void remove_tempfile(void)
{
	int i;

	for (i = 0; i < 2; i++)
		if (diff_temp[i].name == diff_temp[i].tmp_path) {
			unlink(diff_temp[i].name);
			diff_temp[i].name = NULL;
		}
}

461 462 463 464 465
static void remove_tempfile_on_signal(int signo)
{
	remove_tempfile();
}

466 467 468
/* An external diff command takes:
 *
 * diff-cmd name infile1 infile1-sha1 infile1-mode \
469
 *               infile2 infile2-sha1 infile2-mode [ rename-to ]
470 471
 *
 */
472 473
static void run_external_diff(const char *pgm,
			      const char *name,
474
			      const char *other,
475 476 477
			      struct diff_filespec *one,
			      struct diff_filespec *two,
			      const char *xfrm_msg)
478 479
{
	struct diff_tempfile *temp = diff_temp;
480 481
	pid_t pid;
	int status;
482 483
	static int atexit_asked = 0;

484 485
	if (one && two) {
		prepare_temp_file(name, &temp[0], one);
J
Junio C Hamano 已提交
486
		prepare_temp_file(other ? : name, &temp[1], two);
487 488 489 490 491 492
		if (! atexit_asked &&
		    (temp[0].name == temp[0].tmp_path ||
		     temp[1].name == temp[1].tmp_path)) {
			atexit_asked = 1;
			atexit(remove_tempfile);
		}
493
		signal(SIGINT, remove_tempfile_on_signal);
494 495 496 497 498 499 500
	}

	fflush(NULL);
	pid = fork();
	if (pid < 0)
		die("unable to fork");
	if (!pid) {
501 502
		if (pgm) {
			if (one && two) {
503
				const char *exec_arg[10];
504 505 506 507 508 509 510 511 512
				const char **arg = &exec_arg[0];
				*arg++ = pgm;
				*arg++ = name;
				*arg++ = temp[0].name;
				*arg++ = temp[0].hex;
				*arg++ = temp[0].mode;
				*arg++ = temp[1].name;
				*arg++ = temp[1].hex;
				*arg++ = temp[1].mode;
513
				if (other) {
514
					*arg++ = other;
515 516
					*arg++ = xfrm_msg;
				}
L
Linus Torvalds 已提交
517
				*arg = NULL;
518 519
				execvp(pgm, (char *const*) exec_arg);
			}
520 521 522
			else
				execlp(pgm, pgm, name, NULL);
		}
523 524 525
		/*
		 * otherwise we use the built-in one.
		 */
526
		if (one && two)
527
			builtin_diff(name, other ? : name, temp, xfrm_msg);
528 529
		else
			printf("* Unmerged path %s\n", name);
530 531
		exit(0);
	}
532 533 534
	if (waitpid(pid, &status, 0) < 0 ||
	    !WIFEXITED(status) || WEXITSTATUS(status)) {
		/* Earlier we did not check the exit status because
535
		 * diff exits non-zero if files are different, and
536 537 538 539 540 541
		 * we are not interested in knowing that.  It was a
		 * mistake which made it harder to quit a diff-*
		 * session that uses the git-apply-patch-script as
		 * the GIT_EXTERNAL_DIFF.  A custom GIT_EXTERNAL_DIFF
		 * should also exit non-zero only when it wants to
		 * abort the entire diff-* session.
542 543
		 */
		remove_tempfile();
544 545
		fprintf(stderr, "external diff died, stopping at %s.\n", name);
		exit(1);
546
	}
547 548 549
	remove_tempfile();
}

550 551 552 553 554 555 556 557
static void run_diff(const char *name,
		     const char *other,
		     struct diff_filespec *one,
		     struct diff_filespec *two,
		     const char *xfrm_msg)
{
	const char *pgm = external_diff();
	if (!pgm &&
558
	    one && two &&
559 560 561 562 563 564 565 566 567 568 569 570 571 572 573 574
	    DIFF_FILE_VALID(one) && DIFF_FILE_VALID(two) &&
	    (S_IFMT & one->mode) != (S_IFMT & two->mode)) {
		/* a filepair that changes between file and symlink
		 * needs to be split into deletion and creation.
		 */
		struct diff_filespec *null = alloc_filespec(two->path);
		run_external_diff(NULL, name, other, one, null, xfrm_msg);
		free(null);
		null = alloc_filespec(one->path);
		run_external_diff(NULL, name, other, null, two, xfrm_msg);
		free(null);
	}
	else
		run_external_diff(pgm, name, other, one, two, xfrm_msg);
}

575
void diff_setup(int flags)
576
{
577 578
	if (flags & DIFF_SETUP_REVERSE)
		reverse_diff = 1;
579 580 581 582 583 584 585 586 587 588 589 590 591
	if (flags & DIFF_SETUP_USE_CACHE) {
		if (!active_cache)
			/* read-cache does not die even when it fails
			 * so it is safe for us to do this here.  Also
			 * it does not smudge active_cache or active_nr
			 * when it fails, so we do not have to worry about
			 * cleaning it up oufselves either.
			 */
			read_cache();
	}
	if (flags & DIFF_SETUP_USE_SIZE_CACHE)
		use_size_cache = 1;
	
592 593
}

594 595 596 597 598 599 600 601 602 603 604 605 606 607 608 609 610 611 612 613 614 615 616 617 618
static int parse_num(const char **cp_p)
{
	int num, scale, ch, cnt;
	const char *cp = *cp_p;

	cnt = num = 0;
	scale = 1;
	while ('0' <= (ch = *cp) && ch <= '9') {
		if (cnt++ < 5) {
			/* We simply ignore more than 5 digits precision. */
			scale *= 10;
			num = num * 10 + ch - '0';
		}
		*cp++;
	}
	*cp_p = cp;

	/* user says num divided by scale and we say internally that
	 * is MAX_SCORE * num / scale.
	 */
	return (MAX_SCORE * num / scale);
}

int diff_scoreopt_parse(const char *opt)
{
619
	int opt1, opt2, cmd;
620 621 622 623 624 625 626 627

	if (*opt++ != '-')
		return -1;
	cmd = *opt++;
	if (cmd != 'M' && cmd != 'C' && cmd != 'B')
		return -1; /* that is not a -M, -C nor -B option */

	opt1 = parse_num(&opt);
628 629 630 631 632 633 634 635 636 637 638 639
	if (cmd != 'B')
		opt2 = 0;
	else {
		if (*opt == 0)
			opt2 = 0;
		else if (*opt != '/')
			return -1; /* we expect -B80/99 or -B80 */
		else {
			opt++;
			opt2 = parse_num(&opt);
		}
	}
640 641
	if (*opt != 0)
		return -1;
642
	return opt1 | (opt2 << 16);
643 644
}

J
Junio C Hamano 已提交
645 646 647
struct diff_queue_struct diff_queued_diff;

void diff_q(struct diff_queue_struct *queue, struct diff_filepair *dp)
648
{
J
Junio C Hamano 已提交
649 650 651 652
	if (queue->alloc <= queue->nr) {
		queue->alloc = alloc_nr(queue->alloc);
		queue->queue = xrealloc(queue->queue,
					sizeof(dp) * queue->alloc);
653
	}
J
Junio C Hamano 已提交
654
	queue->queue[queue->nr++] = dp;
655 656
}

657
struct diff_filepair *diff_queue(struct diff_queue_struct *queue,
J
Junio C Hamano 已提交
658 659
				 struct diff_filespec *one,
				 struct diff_filespec *two)
660
{
661
	struct diff_filepair *dp = xmalloc(sizeof(*dp));
662 663
	dp->one = one;
	dp->two = two;
664
	dp->score = 0;
665
	dp->source_stays = 0;
666
	dp->broken_pair = 0;
J
Junio C Hamano 已提交
667
	diff_q(queue, dp);
668
	return dp;
669 670
}

671 672 673 674 675 676 677
void diff_free_filepair(struct diff_filepair *p)
{
	diff_free_filespec_data(p->one);
	diff_free_filespec_data(p->two);
	free(p);
}

678 679 680
static void diff_flush_raw(struct diff_filepair *p,
			   int line_termination,
			   int inter_name_termination)
681
{
682 683
	int two_paths;
	char status[10];
684 685 686 687 688 689 690 691 692 693 694

	if (line_termination) {
		const char *err = "path %s cannot be expressed without -z";
		if (strchr(p->one->path, line_termination) ||
		    strchr(p->one->path, inter_name_termination))
			die(err, p->one->path);
		if (strchr(p->two->path, line_termination) ||
		    strchr(p->two->path, inter_name_termination))
			die(err, p->two->path);
	}

695 696 697
	switch (p->status) {
	case 'C': case 'R':
		two_paths = 1;
698 699
		sprintf(status, "%c%03d", p->status,
			(int)(0.5 + p->score * 100.0/MAX_SCORE));
700
		break;
701 702 703 704 705 706 707 708 709 710
	case 'N': case 'D':
		two_paths = 0;
		if (p->score)
			sprintf(status, "%c%03d", p->status,
				(int)(0.5 + p->score * 100.0/MAX_SCORE));
		else {
			status[0] = p->status;
			status[1] = 0;
		}
		break;
711 712 713 714 715
	default:
		two_paths = 0;
		status[0] = p->status;
		status[1] = 0;
		break;
J
Junio C Hamano 已提交
716
	}
717 718
	printf(":%06o %06o %s ",
	       p->one->mode, p->two->mode, sha1_to_hex(p->one->sha1));
719 720 721 722 723 724 725 726
	printf("%s %s%c%s",
	       sha1_to_hex(p->two->sha1),
	       status,
	       inter_name_termination,
	       p->one->path);
	if (two_paths)
		printf("%c%s", inter_name_termination, p->two->path);
	putchar(line_termination);
727 728
}

729
int diff_unmodified_pair(struct diff_filepair *p)
730
{
731 732
	/* This function is written stricter than necessary to support
	 * the currently implemented transformers, but the idea is to
733
	 * let transformers to produce diff_filepairs any way they want,
734
	 * and filter and clean them up here before producing the output.
735
	 */
J
Junio C Hamano 已提交
736 737 738 739
	struct diff_filespec *one, *two;

	if (DIFF_PAIR_UNMERGED(p))
		return 0; /* unmerged is interesting */
740

J
Junio C Hamano 已提交
741 742
	one = p->one;
	two = p->two;
743

744 745 746
	/* deletion, addition, mode or type change
	 * and rename are all interesting.
	 */
747
	if (DIFF_FILE_VALID(one) != DIFF_FILE_VALID(two) ||
748
	    DIFF_PAIR_MODE_CHANGED(p) ||
749 750
	    strcmp(one->path, two->path))
		return 0;
J
Junio C Hamano 已提交
751

752 753
	/* both are valid and point at the same path.  that is, we are
	 * dealing with a change.
J
Junio C Hamano 已提交
754
	 */
755 756 757 758 759 760
	if (one->sha1_valid && two->sha1_valid &&
	    !memcmp(one->sha1, two->sha1, sizeof(one->sha1)))
		return 1; /* no change */
	if (!one->sha1_valid && !two->sha1_valid)
		return 1; /* both look at the same file on the filesystem. */
	return 0;
J
Junio C Hamano 已提交
761 762
}

763
static void diff_flush_patch(struct diff_filepair *p)
764 765
{
	const char *name, *other;
766
	char msg_[PATH_MAX*2+200], *msg;
767 768 769 770 771 772 773 774 775 776

	if (diff_unmodified_pair(p))
		return;

	name = p->one->path;
	other = (strcmp(name, p->two->path) ? p->two->path : NULL);
	if ((DIFF_FILE_VALID(p->one) && S_ISDIR(p->one->mode)) ||
	    (DIFF_FILE_VALID(p->two) && S_ISDIR(p->two->mode)))
		return; /* no tree diffs in patch format */ 

777 778 779 780 781
	switch (p->status) {
	case 'C':
		sprintf(msg_,
			"similarity index %d%%\n"
			"copy from %s\n"
782
			"copy to %s",
783
			(int)(0.5 + p->score * 100.0/MAX_SCORE),
784 785 786 787 788 789
			p->one->path, p->two->path);
		msg = msg_;
		break;
	case 'R':
		sprintf(msg_,
			"similarity index %d%%\n"
L
Linus Torvalds 已提交
790 791
			"rename from %s\n"
			"rename to %s",
792
			(int)(0.5 + p->score * 100.0/MAX_SCORE),
793 794 795
			p->one->path, p->two->path);
		msg = msg_;
		break;
796 797 798 799 800 801 802 803 804 805
	case 'D': case 'N':
		if (DIFF_PAIR_BROKEN(p)) {
			sprintf(msg_,
				"dissimilarity index %d%%",
				(int)(0.5 + p->score * 100.0/MAX_SCORE));
			msg = msg_;
		}
		else
			msg = NULL;
		break;
806 807 808 809
	default:
		msg = NULL;
	}

810
	if (DIFF_PAIR_UNMERGED(p))
811
		run_diff(name, NULL, NULL, NULL, NULL);
812
	else
813
		run_diff(name, other, p->one, p->two, msg);
814 815
}

816
int diff_queue_is_empty(void)
817
{
818
	struct diff_queue_struct *q = &diff_queued_diff;
819 820 821 822 823
	int i;
	for (i = 0; i < q->nr; i++)
		if (!diff_unmodified_pair(q->queue[i]))
			return 0;
	return 1;
824 825
}

826 827 828 829 830 831 832 833 834 835 836 837 838 839 840 841 842 843
#if DIFF_DEBUG
void diff_debug_filespec(struct diff_filespec *s, int x, const char *one)
{
	fprintf(stderr, "queue[%d] %s (%s) %s %06o %s\n",
		x, one ? : "",
		s->path,
		DIFF_FILE_VALID(s) ? "valid" : "invalid",
		s->mode,
		s->sha1_valid ? sha1_to_hex(s->sha1) : "");
	fprintf(stderr, "queue[%d] %s size %lu flags %d\n",
		x, one ? : "",
		s->size, s->xfrm_flags);
}

void diff_debug_filepair(const struct diff_filepair *p, int i)
{
	diff_debug_filespec(p->one, i, "one");
	diff_debug_filespec(p->two, i, "two");
844 845 846
	fprintf(stderr, "score %d, status %c stays %d broken %d\n",
		p->score, p->status ? : '?',
		p->source_stays, p->broken_pair);
847 848 849
}

void diff_debug_queue(const char *msg, struct diff_queue_struct *q)
J
Junio C Hamano 已提交
850 851
{
	int i;
852 853 854
	if (msg)
		fprintf(stderr, "%s\n", msg);
	fprintf(stderr, "q->nr = %d\n", q->nr);
J
Junio C Hamano 已提交
855 856
	for (i = 0; i < q->nr; i++) {
		struct diff_filepair *p = q->queue[i];
857 858 859 860 861 862 863 864 865 866 867 868 869 870 871
		diff_debug_filepair(p, i);
	}
}
#endif

static void diff_resolve_rename_copy(void)
{
	int i, j;
	struct diff_filepair *p, *pp;
	struct diff_queue_struct *q = &diff_queued_diff;

	diff_debug_queue("resolve-rename-copy", q);

	for (i = 0; i < q->nr; i++) {
		p = q->queue[i];
872
		p->status = 0; /* undecided */
873 874
		if (DIFF_PAIR_UNMERGED(p))
			p->status = 'U';
875
		else if (!DIFF_FILE_VALID(p->one))
876
			p->status = 'N';
877 878
		else if (!DIFF_FILE_VALID(p->two))
			p->status = 'D';
879 880 881 882 883 884 885
		else if (DIFF_PAIR_TYPE_CHANGED(p))
			p->status = 'T';

		/* from this point on, we are dealing with a pair
		 * whose both sides are valid and of the same type, i.e.
		 * either in-place edit or rename/copy edit.
		 */
886
		else if (DIFF_PAIR_RENAME(p)) {
887 888 889 890 891 892 893
			if (p->source_stays) {
				p->status = 'C';
				continue;
			}
			/* See if there is some other filepair that
			 * copies from the same source as us.  If so
			 * we are a copy.  Otherwise we are a rename.
894
			 */
895
			for (j = i + 1; j < q->nr; j++) {
896 897
				pp = q->queue[j];
				if (strcmp(pp->one->path, p->one->path))
898
					continue; /* not us */
899
				if (!DIFF_PAIR_RENAME(pp))
900 901 902 903
					continue; /* not a rename/copy */
				/* pp is a rename/copy from the same source */
				p->status = 'C';
				break;
904 905
			}
			if (!p->status)
906 907
				p->status = 'R';
		}
908 909
		else if (memcmp(p->one->sha1, p->two->sha1, 20) ||
			 p->one->mode != p->two->mode)
910
			p->status = 'M';
J
Junio C Hamano 已提交
911 912 913
		else {
			/* This is a "no-change" entry and should not
			 * happen anymore, but prepare for broken callers.
914
			 */
J
Junio C Hamano 已提交
915 916 917 918
			error("feeding unmodified %s to diffcore",
			      p->one->path);
			p->status = 'X';
		}
J
Junio C Hamano 已提交
919
	}
920
	diff_debug_queue("resolve-rename-copy done", q);
921 922
}

923
void diff_flush(int diff_output_style, int resolve_rename_copy)
924 925 926
{
	struct diff_queue_struct *q = &diff_queued_diff;
	int i;
927 928
	int line_termination = '\n';
	int inter_name_termination = '\t';
929

930
	if (diff_output_style == DIFF_FORMAT_MACHINE)
J
Junio C Hamano 已提交
931
		line_termination = inter_name_termination = 0;
932 933 934
	if (resolve_rename_copy)
		diff_resolve_rename_copy();

935 936
	for (i = 0; i < q->nr; i++) {
		struct diff_filepair *p = q->queue[i];
937 938
		if ((diff_output_style == DIFF_FORMAT_NO_OUTPUT) ||
		    (p->status == 'X'))
939
			continue;
940
		if (p->status == 0)
941
			die("internal error in diff-resolve-rename-copy");
942 943
		switch (diff_output_style) {
		case DIFF_FORMAT_PATCH:
944
			diff_flush_patch(p);
945 946 947 948 949 950 951
			break;
		case DIFF_FORMAT_HUMAN:
		case DIFF_FORMAT_MACHINE:
			diff_flush_raw(p, line_termination,
				       inter_name_termination);
			break;
		}
952
	}
953 954
	for (i = 0; i < q->nr; i++)
		diff_free_filepair(q->queue[i]);
955 956 957
	free(q->queue);
	q->queue = NULL;
	q->nr = q->alloc = 0;
958 959
}

960 961
void diffcore_std(const char **paths,
		  int detect_rename, int rename_score,
962
		  const char *pickaxe, int pickaxe_opts,
963 964
		  int break_opt,
		  const char *orderfile)
965 966 967
{
	if (paths && paths[0])
		diffcore_pathspec(paths);
968
	if (break_opt != -1)
969
		diffcore_break(break_opt);
970 971
	if (detect_rename)
		diffcore_rename(detect_rename, rename_score);
972
	if (break_opt != -1)
973
		diffcore_merge_broken();
974 975
	if (pickaxe)
		diffcore_pickaxe(pickaxe, pickaxe_opts);
976 977
	if (orderfile)
		diffcore_order(orderfile);
978 979
}

980 981 982
void diff_addremove(int addremove, unsigned mode,
		    const unsigned char *sha1,
		    const char *base, const char *path)
983
{
984
	char concatpath[PATH_MAX];
985 986 987 988 989 990 991 992 993
	struct diff_filespec *one, *two;

	/* This may look odd, but it is a preparation for
	 * feeding "there are unchanged files which should
	 * not produce diffs, but when you are doing copy
	 * detection you would need them, so here they are"
	 * entries to the diff-core.  They will be prefixed
	 * with something like '=' or '*' (I haven't decided
	 * which but should not make any difference).
994
	 * Feeding the same new and old to diff_change() 
995 996 997
	 * also has the same effect.
	 * Before the final output happens, they are pruned after
	 * merged into rename/copy pairs as appropriate.
998
	 */
999
	if (reverse_diff)
1000 1001
		addremove = (addremove == '+' ? '-' :
			     addremove == '-' ? '+' : addremove);
1002

1003 1004 1005 1006
	if (!path) path = "";
	sprintf(concatpath, "%s%s", base, path);
	one = alloc_filespec(concatpath);
	two = alloc_filespec(concatpath);
1007

1008 1009 1010 1011
	if (addremove != '+')
		fill_filespec(one, sha1, mode);
	if (addremove != '-')
		fill_filespec(two, sha1, mode);
1012

1013
	diff_queue(&diff_queued_diff, one, two);
1014 1015
}

1016 1017 1018 1019 1020 1021 1022 1023
void diff_helper_input(unsigned old_mode,
		       unsigned new_mode,
		       const unsigned char *old_sha1,
		       const unsigned char *new_sha1,
		       const char *old_path,
		       int status,
		       int score,
		       const char *new_path)
1024 1025
{
	struct diff_filespec *one, *two;
1026
	struct diff_filepair *dp;
1027 1028 1029 1030 1031 1032 1033

	one = alloc_filespec(old_path);
	two = alloc_filespec(new_path);
	if (old_mode)
		fill_filespec(one, old_sha1, old_mode);
	if (new_mode)
		fill_filespec(two, new_sha1, new_mode);
1034
	dp = diff_queue(&diff_queued_diff, one, two);
1035
	dp->score = score * MAX_SCORE / 100;
1036
	dp->status = status;
1037 1038
}

1039 1040 1041
void diff_change(unsigned old_mode, unsigned new_mode,
		 const unsigned char *old_sha1,
		 const unsigned char *new_sha1,
1042 1043
		 const char *base, const char *path) 
{
1044
	char concatpath[PATH_MAX];
1045
	struct diff_filespec *one, *two;
1046

1047 1048 1049 1050 1051 1052
	if (reverse_diff) {
		unsigned tmp;
		const unsigned char *tmp_c;
		tmp = old_mode; old_mode = new_mode; new_mode = tmp;
		tmp_c = old_sha1; old_sha1 = new_sha1; new_sha1 = tmp_c;
	}
1053 1054 1055 1056 1057 1058 1059
	if (!path) path = "";
	sprintf(concatpath, "%s%s", base, path);
	one = alloc_filespec(concatpath);
	two = alloc_filespec(concatpath);
	fill_filespec(one, old_sha1, old_mode);
	fill_filespec(two, new_sha1, new_mode);

1060
	diff_queue(&diff_queued_diff, one, two);
1061
}
1062

1063 1064
void diff_unmerge(const char *path)
{
J
Junio C Hamano 已提交
1065 1066 1067 1068
	struct diff_filespec *one, *two;
	one = alloc_filespec(path);
	two = alloc_filespec(path);
	diff_queue(&diff_queued_diff, one, two);
1069
}