sha1_file.c 30.8 KB
Newer Older
1 2 3 4 5 6 7 8
/*
 * GIT - The information manager from hell
 *
 * Copyright (C) Linus Torvalds, 2005
 *
 * This handles basic git sha1 object files - packing, unpacking,
 * creation etc.
 */
9 10
#include <sys/types.h>
#include <dirent.h>
11
#include "cache.h"
12
#include "delta.h"
13
#include "pack.h"
14

15 16 17 18 19 20 21 22 23 24
/*
 * Provide O_NOATIME when the system headers do not: the raw flag value
 * on Linux i386/PPC, and 0 (i.e. no extra flag) everywhere else.
 */
#ifndef O_NOATIME
#if defined(__linux__) && (defined(__i386__) || defined(__PPC__))
#define O_NOATIME 01000000
#else
#define O_NOATIME 0
#endif
#endif

/*
 * Extra flag OR-ed into open() when reading object files.  It is reset
 * to 0 by map_sha1_file_internal() once an open with the flag failed
 * but a plain open succeeded.
 */
static unsigned int sha1_file_open_flag = O_NOATIME;

25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
/*
 * Map one hexadecimal digit (either case) to its value 0..15.
 * Any other character yields ~0 (all bits set), which callers detect
 * by looking at the bits above the low nibble.
 */
static unsigned hexval(char c)
{
	unsigned value = ~0;

	if ('0' <= c && c <= '9')
		value = c - '0';
	else if ('a' <= c && c <= 'f')
		value = 10 + (c - 'a');
	else if ('A' <= c && c <= 'F')
		value = 10 + (c - 'A');
	return value;
}

/*
 * Decode exactly 40 hex digits at "hex" into the 20-byte binary "sha1".
 * Returns 0 on success and -1 as soon as a non-hex character is seen;
 * bytes decoded before the failure have already been stored in "sha1".
 */
int get_sha1_hex(const char *hex, unsigned char *sha1)
{
	int i;
	for (i = 0; i < 20; i++) {
		unsigned int val;
		/*
		 * A NUL in hex[1] is rejected by the range check below,
		 * but a NUL in hex[0] has to be caught first: otherwise
		 * hex[1] would be read from beyond the end of the string.
		 */
		if (!hex[0])
			return -1;
		val = (hexval(hex[0]) << 4) | hexval(hex[1]);
		if (val & ~0xff)
			return -1;
		*sha1++ = val;
		hex += 2;
	}
	return 0;
}

L
Linus Torvalds 已提交
49
/*
 * Read the start of the file at "path" and decode its first 40 bytes as
 * a hex SHA1 into "result".
 * Returns 0 on success, -1 if the file cannot be opened, yields fewer
 * than 40 bytes, or does not begin with 40 hex digits.
 */
static int get_sha1_file(const char *path, unsigned char *result)
{
	char buffer[60];
	int fd = open(path, O_RDONLY);
	int len;

	if (fd < 0)
		return -1;
	len = read(fd, buffer, sizeof(buffer));
	close(fd);
	/* this also covers a failed read(), which returns -1 */
	if (len < 40)
		return -1;
	return get_sha1_hex(buffer, result);
}

64 65
static char *git_dir, *git_object_dir, *git_index_file, *git_refs_dir,
	*git_graft_file;
66 67 68 69 70 71 72 73 74 75
static void setup_git_env(void)
{
	git_dir = gitenv(GIT_DIR_ENVIRONMENT);
	if (!git_dir)
		git_dir = DEFAULT_GIT_DIR_ENVIRONMENT;
	git_object_dir = gitenv(DB_ENVIRONMENT);
	if (!git_object_dir) {
		git_object_dir = xmalloc(strlen(git_dir) + 9);
		sprintf(git_object_dir, "%s/objects", git_dir);
	}
D
Daniel Barkalow 已提交
76 77
	git_refs_dir = xmalloc(strlen(git_dir) + 6);
	sprintf(git_refs_dir, "%s/refs", git_dir);
78 79 80 81 82
	git_index_file = gitenv(INDEX_ENVIRONMENT);
	if (!git_index_file) {
		git_index_file = xmalloc(strlen(git_dir) + 7);
		sprintf(git_index_file, "%s/index", git_dir);
	}
83 84 85
	git_graft_file = gitenv(GRAFT_ENVIRONMENT);
	if (!git_graft_file)
		git_graft_file = strdup(git_path("info/grafts"));
86 87 88 89 90 91 92 93 94
}

/*
 * Return the object database directory, running setup_git_env() first
 * if it has not been computed yet.
 */
char *get_object_directory(void)
{
	if (git_object_dir == NULL)
		setup_git_env();

	return git_object_dir;
}

D
Daniel Barkalow 已提交
95 96 97 98 99 100 101
/*
 * Return the refs directory, running setup_git_env() first if it has
 * not been computed yet.
 */
char *get_refs_directory(void)
{
	if (git_refs_dir == NULL)
		setup_git_env();

	return git_refs_dir;
}

102 103 104 105 106 107 108
/*
 * Return the index file path, running setup_git_env() first if it has
 * not been computed yet.
 */
char *get_index_file(void)
{
	if (git_index_file == NULL)
		setup_git_env();

	return git_index_file;
}

109 110 111 112 113 114 115
/*
 * Return the graft file path, running setup_git_env() first if it has
 * not been computed yet.
 */
char *get_graft_file(void)
{
	if (git_graft_file == NULL)
		setup_git_env();

	return git_graft_file;
}

116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133
/*
 * Create every missing directory leading up to the final component of
 * "path"; the part after the last '/' is not created.  "path" is
 * modified in place while working but is restored before returning.
 * Returns 0 on success, or -1 when a mkdir() fails for any reason other
 * than the directory already existing.
 */
int safe_create_leading_directories(char *path)
{
	char *pos = path;

	/*
	 * Skip the leading '/' of an absolute path: cutting the string
	 * there would ask mkdir() to create "" and fail every time.
	 */
	if (*pos == '/')
		pos++;

	while (pos) {
		pos = strchr(pos, '/');
		if (!pos)
			break;
		/* temporarily terminate the string at this separator */
		*pos = 0;
		if (mkdir(path, 0777) < 0)
			if (errno != EEXIST) {
				*pos = '/';
				return -1;
			}
		*pos++ = '/';
	}
	return 0;
}
134 135 136

/*
 * Resolve "str" to a 20-byte SHA1.  "str" is first tried as 40 hex
 * digits; failing that, it is looked up as a file name under each of
 * the prefixes below, in order, via git_path() and get_sha1_file().
 * Returns 0 on success and -1 when nothing matched.
 */
int get_sha1(const char *str, unsigned char *sha1)
{
	static const char *prefix[] = {
		"",
		"refs",
		"refs/tags",
		"refs/heads",
		"refs/snap",
		NULL
	};
	const char **p;

	if (!get_sha1_hex(str, sha1))
		return 0;

	for (p = prefix; *p; p++) {
		char * pathname = git_path("%s/%s", *p, str);
		if (!get_sha1_file(pathname, sha1))
			return 0;
	}

	return -1;
}

159 160 161 162 163 164 165 166 167 168 169 170 171 172 173
/*
 * Format a 20-byte SHA1 as 40 lowercase hex digits.
 * The result lives in a single static buffer that is overwritten by the
 * next call; the bytes after the 40 digits are never written and so
 * keep their initial zero value, which terminates the string.
 */
char * sha1_to_hex(const unsigned char *sha1)
{
	static const char digits[] = "0123456789abcdef";
	static char buffer[50];
	int i;

	for (i = 0; i < 20; i++) {
		unsigned int byte = sha1[i];

		buffer[2 * i] = digits[byte >> 4];
		buffer[2 * i + 1] = digits[byte & 0xf];
	}
	return buffer;
}

174 175 176 177 178 179 180 181 182 183 184 185
/*
 * Write the 40 hex digits of "sha1" into "pathbuf" in the "xx/yyyy..."
 * layout: the first byte's two digits go to offsets 0-1, offset 2 is
 * skipped (left untouched for the caller's '/'), and the remaining 38
 * digits follow from offset 3.  No terminator is written.
 */
static void fill_sha1_path(char *pathbuf, const unsigned char *sha1)
{
	static char hex[] = "0123456789abcdef";
	char *out = pathbuf;
	int i;

	for (i = 0; i < 20; i++) {
		unsigned int val = sha1[i];

		if (i == 1)
			out++;	/* step over the directory separator slot */
		*out++ = hex[val >> 4];
		*out++ = hex[val & 0xf];
	}
}

186 187 188 189
/*
 * NOTE! This returns a statically allocated buffer, so you have to be
 * careful about using it. Do a "strdup()" if you need to save the
 * filename.
 *
 * Also note that this returns the location for creating.  Reading
 * SHA1 file can happen from any alternate directory listed in the
 * ALTERNATE_DB_ENVIRONMENT environment variable if it is not found in
 * the primary object database.
 */
char *sha1_file_name(const unsigned char *sha1)
{
	static char *name, *base;

	if (!base) {
		/*
		 * First call: lay out "<objdir>/xx/<38 hex digits>" once.
		 * The 60 zeroed spare bytes hold both slashes, the 40
		 * hex digits and the terminating NUL.
		 */
		const char *sha1_file_directory = get_object_directory();
		int len = strlen(sha1_file_directory);
		base = xmalloc(len + 60);
		memcpy(base, sha1_file_directory, len);
		memset(base+len, 0, 60);
		base[len] = '/';
		base[len+3] = '/';
		name = base + len + 1;
	}
	/* only the hex digits change from one call to the next */
	fill_sha1_path(name, sha1);
	return base;
}

214
struct alternate_object_database *alt_odb;
215

J
Junio C Hamano 已提交
216 217 218 219 220
/*
 * Prepare alternate object database registry.
 * alt_odb points at an array of struct alternate_object_database.
 * This array is terminated with an element that has both its base
 * and name set to NULL.  alt_odb[n] comes from n'th non-empty
J
Junio C Hamano 已提交
221
 * element from colon separated ALTERNATE_DB_ENVIRONMENT environment
J
Junio C Hamano 已提交
222 223 224 225 226 227 228 229 230 231
 * variable, and its base points at a statically allocated buffer
 * that contains "/the/directory/corresponding/to/.git/objects/...",
 * while its name points just after the slash at the end of
 * ".git/objects/" in the example above, and has enough space to hold
 * 40-byte hex SHA1, an extra slash for the first level indirection,
 * and the terminating NUL.
 * This function allocates the alt_odb array and all the strings
 * pointed by base fields of the array elements with one xmalloc();
 * the string pool immediately follows the array.
 */
232
void prepare_alt_odb(void)
233 234 235
{
	int pass, totlen, i;
	const char *cp, *last;
L
Linus Torvalds 已提交
236
	char *op = NULL;
J
Junio C Hamano 已提交
237
	const char *alt = gitenv(ALTERNATE_DB_ENVIRONMENT) ? : "";
238

239 240
	if (alt_odb)
		return;
J
Junio C Hamano 已提交
241 242 243 244 245 246
	/* The first pass counts how large an area to allocate to
	 * hold the entire alt_odb structure, including array of
	 * structs and path buffers for them.  The second pass fills
	 * the structure and prepares the path buffers for use by
	 * fill_sha1_path().
	 */
247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269 270 271 272 273
	for (totlen = pass = 0; pass < 2; pass++) {
		last = alt;
		i = 0;
		do {
			cp = strchr(last, ':') ? : last + strlen(last);
			if (last != cp) {
				/* 43 = 40-byte + 2 '/' + terminating NUL */
				int pfxlen = cp - last;
				int entlen = pfxlen + 43;
				if (pass == 0)
					totlen += entlen;
				else {
					alt_odb[i].base = op;
					alt_odb[i].name = op + pfxlen + 1;
					memcpy(op, last, pfxlen);
					op[pfxlen] = op[pfxlen + 3] = '/';
					op[entlen-1] = 0;
					op += entlen;
				}
				i++;
			}
			while (*cp && *cp == ':')
				cp++;
			last = cp;
		} while (*cp);
		if (pass)
			break;
J
Junio C Hamano 已提交
274
		alt_odb = xmalloc(sizeof(*alt_odb) * (i + 1) + totlen);
L
Linus Torvalds 已提交
275
		alt_odb[i].base = alt_odb[i].name = NULL;
276 277 278 279 280 281 282 283 284 285 286
		op = (char*)(&alt_odb[i+1]);
	}
}

static char *find_sha1_file(const unsigned char *sha1, struct stat *st)
{
	int i;
	char *name = sha1_file_name(sha1);

	if (!stat(name, st))
		return name;
287
	prepare_alt_odb();
288 289 290 291 292 293 294 295
	for (i = 0; (name = alt_odb[i].name) != NULL; i++) {
		fill_sha1_path(name, sha1);
		if (!stat(alt_odb[i].base, st))
			return alt_odb[i].base;
	}
	return NULL;
}

296 297 298
/* Once pack_mapped exceeds this, use_packed_git() tries to unmap idle packs. */
#define PACK_MAX_SZ (1<<26)
/* Counter stamped into pack_last_used on each use_packed_git() call. */
static int pack_used_ctr;
/* Running total of pack sizes accounted for by use_packed_git(). */
static unsigned long pack_mapped;
/* Head of the linked list of known packs (see prepare_packed_git()). */
struct packed_git *packed_git;
300 301 302 303 304 305 306 307 308 309 310 311 312 313 314 315 316 317 318 319 320 321 322

/*
 * Map the pack index file at "path" read-only and sanity-check it.
 * On success returns 0 and stores the mapping and its size in
 * *idx_map_ and *idx_size_; the caller then owns the mapping.
 * On failure returns non-zero, leaves both outputs untouched and
 * releases the mapping, so nothing is leaked.
 */
static int check_packed_git_idx(const char *path, unsigned long *idx_size_,
				void **idx_map_)
{
	void *idx_map;
	unsigned int *index;
	unsigned long idx_size;
	int nr, i;
	int fd = open(path, O_RDONLY);
	struct stat st;
	if (fd < 0)
		return -1;
	if (fstat(fd, &st)) {
		close(fd);
		return -1;
	}
	idx_size = st.st_size;
	idx_map = mmap(NULL, idx_size, PROT_READ, MAP_PRIVATE, fd, 0);
	close(fd);
	if (idx_map == MAP_FAILED)
		return -1;

	index = idx_map;

	/* check index map */
	if (idx_size < 4*256 + 20 + 20) {
		munmap(idx_map, idx_size);
		return error("index file too small");
	}
	/* the 256 fan-out counts are cumulative, so they may never decrease */
	nr = 0;
	for (i = 0; i < 256; i++) {
		unsigned int n = ntohl(index[i]);
		if (n < nr) {
			munmap(idx_map, idx_size);
			return error("non-monotonic index");
		}
		nr = n;
	}

	/*
	 * Total size:
	 *  - 256 index entries 4 bytes each
	 *  - 24-byte entries * nr (20-byte sha1 + 4-byte offset)
	 *  - 20-byte SHA1 of the packfile
	 *  - 20-byte SHA1 file checksum
	 */
	if (idx_size != 4*256 + nr * 24 + 20 + 20) {
		munmap(idx_map, idx_size);
		return error("wrong index file size");
	}

	/* publish the mapping only once it has passed every check */
	*idx_map_ = idx_map;
	*idx_size_ = idx_size;
	return 0;
}

350
static int unuse_one_packed_git(void)
351
{
352 353 354 355 356 357 358 359 360 361 362 363 364 365 366 367 368 369
	struct packed_git *p, *lru = NULL;

	for (p = packed_git; p; p = p->next) {
		if (p->pack_use_cnt || !p->pack_base)
			continue;
		if (!lru || p->pack_last_used < lru->pack_last_used)
			lru = p;
	}
	if (!lru)
		return 0;
	munmap(lru->pack_base, lru->pack_size);
	lru->pack_base = NULL;
	return 1;
}

/*
 * Drop one use of pack "p" taken by use_packed_git().  The mapping
 * itself is kept; it only becomes a candidate for
 * unuse_one_packed_git() once the count is back to zero.
 */
void unuse_packed_git(struct packed_git *p)
{
	p->pack_use_cnt--;
}

372
int use_packed_git(struct packed_git *p)
373 374 375 376 377 378 379
{
	if (!p->pack_base) {
		int fd;
		struct stat st;
		void *map;

		pack_mapped += p->pack_size;
380 381
		while (PACK_MAX_SZ < pack_mapped && unuse_one_packed_git())
			; /* nothing */
382 383
		fd = open(p->pack_name, O_RDONLY);
		if (fd < 0)
384
			die("packfile %s cannot be opened", p->pack_name);
385 386
		if (fstat(fd, &st)) {
			close(fd);
387
			die("packfile %s cannot be opened", p->pack_name);
388 389
		}
		if (st.st_size != p->pack_size)
390
			die("packfile %s size mismatch.", p->pack_name);
391 392 393
		map = mmap(NULL, p->pack_size, PROT_READ, MAP_PRIVATE, fd, 0);
		close(fd);
		if (map == MAP_FAILED)
394
			die("packfile %s cannot be mapped.", p->pack_name);
395
		p->pack_base = map;
396 397 398 399 400 401 402

		/* Check if the pack file matches with the index file.
		 * this is cheap.
		 */
		if (memcmp((char*)(p->index_base) + p->index_size - 40,
			   p->pack_base + p->pack_size - 20, 20))
			die("packfile %s does not match index.", p->pack_name);
403 404
	}
	p->pack_last_used = pack_used_ctr++;
405
	p->pack_use_cnt++;
406 407 408
	return 0;
}

409
struct packed_git *add_packed_git(char *path, int path_len)
410 411 412 413 414 415 416 417 418 419 420 421 422 423 424 425 426 427 428 429 430 431 432 433
{
	struct stat st;
	struct packed_git *p;
	unsigned long idx_size;
	void *idx_map;

	if (check_packed_git_idx(path, &idx_size, &idx_map))
		return NULL;

	/* do we have a corresponding .pack file? */
	strcpy(path + path_len - 4, ".pack");
	if (stat(path, &st) || !S_ISREG(st.st_mode)) {
		munmap(idx_map, idx_size);
		return NULL;
	}
	/* ok, it looks sane as far as we can check without
	 * actually mapping the pack file.
	 */
	p = xmalloc(sizeof(*p) + path_len + 2);
	strcpy(p->pack_name, path);
	p->index_size = idx_size;
	p->pack_size = st.st_size;
	p->index_base = idx_map;
	p->next = NULL;
434
	p->pack_base = NULL;
435
	p->pack_last_used = 0;
436
	p->pack_use_cnt = 0;
437 438 439 440 441 442 443 444 445 446 447 448 449 450 451 452 453 454 455 456 457 458 459 460 461 462 463 464 465 466 467
	return p;
}

/*
 * Scan "<objdir>/pack" for "*.idx" files and push every pack that
 * add_packed_git() accepts onto the front of the packed_git list.
 * A missing or unreadable directory is silently ignored, as are
 * entries whose full path would not fit in PATH_MAX.
 */
static void prepare_packed_git_one(char *objdir)
{
	char path[PATH_MAX];
	int len;
	DIR *dir;
	struct dirent *de;

	len = snprintf(path, sizeof(path), "%s/pack", objdir);
	/* need room for at least the '/' appended below */
	if (len < 0 || len >= (int)sizeof(path) - 1)
		return;
	dir = opendir(path);
	if (!dir)
		return;
	path[len++] = '/';
	while ((de = readdir(dir)) != NULL) {
		int namelen = strlen(de->d_name);
		struct packed_git *p;

		/*
		 * Names shorter than the suffix ("." and ".." among
		 * them) cannot match, and must not be indexed at a
		 * negative offset.
		 */
		if (namelen < 4 ||
		    strcmp(de->d_name + namelen - 4, ".idx"))
			continue;

		/*
		 * add_packed_git() turns ".idx" into ".pack" in place,
		 * so the buffer must hold one byte more than the name
		 * plus its NUL.
		 */
		if (len + namelen + 2 > (int)sizeof(path))
			continue;

		/* we have .idx.  Is it a file we can map? */
		strcpy(path + len, de->d_name);
		p = add_packed_git(path, len + namelen);
		if (!p)
			continue;
		p->next = packed_git;
		packed_git = p;
	}
	closedir(dir);
}

471
void prepare_packed_git(void)
472 473 474 475 476 477 478 479
{
	int i;
	static int run_once = 0;

	if (run_once++)
		return;

	prepare_packed_git_one(get_object_directory());
480
	prepare_alt_odb();
481 482 483 484 485 486
	for (i = 0; alt_odb[i].base != NULL; i++) {
		alt_odb[i].name[0] = 0;
		prepare_packed_git_one(alt_odb[i].base);
	}
}

487
int check_sha1_signature(const unsigned char *sha1, void *map, unsigned long size, const char *type)
488
{
489
	char header[100];
490 491 492 493
	unsigned char real_sha1[20];
	SHA_CTX c;

	SHA1_Init(&c);
494
	SHA1_Update(&c, header, 1+sprintf(header, "%s %lu", type, size));
495 496 497 498 499
	SHA1_Update(&c, map, size);
	SHA1_Final(real_sha1, &c);
	return memcmp(sha1, real_sha1, 20) ? -1 : 0;
}

500
static void *map_sha1_file_internal(const unsigned char *sha1,
D
Daniel Barkalow 已提交
501
				    unsigned long *size)
502 503 504
{
	struct stat st;
	void *map;
505
	int fd;
506 507 508 509 510
	char *filename = find_sha1_file(sha1, &st);

	if (!filename) {
		return NULL;
	}
511

512
	fd = open(filename, O_RDONLY | sha1_file_open_flag);
513
	if (fd < 0) {
514 515 516 517 518 519 520 521 522 523 524
		/* See if it works without O_NOATIME */
		switch (sha1_file_open_flag) {
		default:
			fd = open(filename, O_RDONLY);
			if (fd >= 0)
				break;
		/* Fallthrough */
		case 0:
			return NULL;
		}

525 526 527
		/* If it failed once, it will probably fail again.
		 * Stop using O_NOATIME
		 */
528
		sha1_file_open_flag = 0;
529 530 531
	}
	map = mmap(NULL, st.st_size, PROT_READ, MAP_PRIVATE, fd, 0);
	close(fd);
P
Pavel Roskin 已提交
532
	if (map == MAP_FAILED)
533 534 535 536 537
		return NULL;
	*size = st.st_size;
	return map;
}

538 539 540 541 542 543 544 545 546 547 548 549 550
/*
 * Start inflating the "mapsize" bytes at "map" into "buffer" (at most
 * "size" bytes), leaving "stream" ready for further inflate() calls.
 * Returns the zlib status: the result of inflate(), or the (negative)
 * error from inflateInit() if the stream could not be set up.
 */
int unpack_sha1_header(z_stream *stream, void *map, unsigned long mapsize, void *buffer, unsigned long size)
{
	int status;

	/* Get the data stream */
	memset(stream, 0, sizeof(*stream));
	stream->next_in = map;
	stream->avail_in = mapsize;
	stream->next_out = buffer;
	stream->avail_out = size;

	/* do not run inflate() on a stream that failed to initialize */
	status = inflateInit(stream);
	if (status != Z_OK)
		return status;
	return inflate(stream, 0);
}

L
Linus Torvalds 已提交
551
/*
 * Finish inflating an object whose header has already been inflated
 * into "buffer" by unpack_sha1_header().  "size" is the object size
 * announced by that header.  Returns a newly allocated buffer of
 * size+1 bytes holding the object data followed by a NUL, and ends the
 * zlib stream.
 */
static void *unpack_sha1_rest(z_stream *stream, void *buffer, unsigned long size)
{
	/* the object data starts right after the header's NUL */
	unsigned long hdrlen = strlen(buffer) + 1;
	unsigned char *buf = xmalloc(1+size);
	unsigned long n = stream->total_out - hdrlen;

	/*
	 * The first inflate() may already have produced more data than
	 * the header claims (corrupt object); never copy beyond the
	 * size+1 bytes that were allocated.
	 */
	if (n > size)
		n = size;
	memcpy(buf, (char *)buffer + hdrlen, n);
	if (n < size) {
		stream->next_out = buf + n;
		stream->avail_out = size - n;
		while (inflate(stream, Z_FINISH) == Z_OK)
			/* nothing */;
	}
	buf[size] = 0;
	inflateEnd(stream);
	return buf;
}

/*
 * We used to just use "sscanf()", but that's actually way
 * too permissive for what we want to check. So do a strict
 * object header parse by hand.
 *
 * "hdr" is a NUL-terminated "<type> <size>" string.  On success the
 * type is copied to "type" (the caller provides at least 10 bytes),
 * the size is stored in *sizep and 0 is returned; -1 is returned for
 * any malformed header.
 */
int parse_sha1_header(char *hdr, char *type, unsigned long *sizep)
{
	int i;
	unsigned long size;

	/*
	 * The type can be at most ten bytes (including the
	 * terminating '\0' that we add), and is followed by
	 * a space.
	 */
	i = 10;
	for (;;) {
		char c = *hdr++;
		if (c == ' ')
			break;
		/* hitting the end of the header first means there is
		 * no space at all; do not keep reading past the NUL
		 */
		if (!c || !--i)
			return -1;
		*type++ = c;
	}
	*type = 0;

	/*
	 * The length must follow immediately, and be in canonical
	 * decimal format (ie "010" is not valid).
	 */
	size = *hdr++ - '0';
	if (size > 9)
		return -1;
	if (size) {
		for (;;) {
			unsigned long c = *hdr - '0';
			if (c > 9)
				break;
			hdr++;
			size = size * 10 + c;
		}
	}
	*sizep = size;

	/*
	 * The length must be followed by a zero byte
	 */
	return *hdr ? -1 : 0;
}

619 620
void * unpack_sha1_file(void *map, unsigned long mapsize, char *type, unsigned long *size)
{
621
	int ret;
622
	z_stream stream;
623
	char hdr[8192];
624

625 626
	ret = unpack_sha1_header(&stream, map, mapsize, hdr, sizeof(hdr));
	if (ret < Z_OK || parse_sha1_header(hdr, type, size) < 0)
627 628
		return NULL;

629
	return unpack_sha1_rest(&stream, hdr, *size);
630 631
}

J
Junio C Hamano 已提交
632 633 634 635
/* forward declaration for a mutually recursive function */
static int packed_object_info(struct pack_entry *entry,
			      char *type, unsigned long *sizep);

636 637 638 639
static int packed_delta_info(unsigned char *base_sha1,
			     unsigned long delta_size,
			     unsigned long left,
			     char *type,
J
Junio C Hamano 已提交
640 641
			     unsigned long *sizep,
			     struct packed_git *p)
642
{
J
Junio C Hamano 已提交
643 644
	struct pack_entry base_ent;

645 646 647
	if (left < 20)
		die("truncated pack file");

J
Junio C Hamano 已提交
648 649 650 651 652
	/* The base entry _must_ be in the same pack */
	if (!find_pack_entry_one(base_sha1, &base_ent, p))
		die("failed to find delta-pack base object %s",
		    sha1_to_hex(base_sha1));

653 654 655 656 657
	/* We choose to only get the type of the base object and
	 * ignore potentially corrupt pack file that expects the delta
	 * based on a base with a wrong size.  This saves tons of
	 * inflate() calls.
	 */
658

J
Junio C Hamano 已提交
659
	if (packed_object_info(&base_ent, type, NULL))
660
		die("cannot get info for delta-pack base");
661

662 663 664 665 666 667 668 669 670 671 672 673 674 675 676 677 678 679 680 681 682 683 684 685 686 687
	if (sizep) {
		const unsigned char *data;
		unsigned char delta_head[64];
		unsigned long result_size;
		z_stream stream;
		int st;

		memset(&stream, 0, sizeof(stream));

		data = stream.next_in = base_sha1 + 20;
		stream.avail_in = left - 20;
		stream.next_out = delta_head;
		stream.avail_out = sizeof(delta_head);

		inflateInit(&stream);
		st = inflate(&stream, Z_FINISH);
		inflateEnd(&stream);
		if ((st != Z_STREAM_END) &&
		    stream.total_out != sizeof(delta_head))
			die("delta data unpack-initial failed");

		/* Examine the initial part of the delta to figure out
		 * the result size.
		 */
		data = delta_head;
		get_delta_hdr_size(&data); /* ignore base size */
688

689 690 691 692
		/* Read the result size */
		result_size = get_delta_hdr_size(&data);
		*sizep = result_size;
	}
693 694 695
	return 0;
}

696 697 698
/*
 * Decode the variable-length object header found at "offset" in the
 * mapped pack "p".  The first byte carries the type in bits 4-6 and the
 * low 4 bits of the size; while bit 7 is set, each following byte adds
 * 7 more size bits.  Stores the type and size and returns the offset of
 * the first byte after the header.  Dies if the header runs off the end
 * of the pack or the size does not fit in an unsigned long.
 */
static unsigned long unpack_object_header(struct packed_git *p, unsigned long offset,
	enum object_type *type, unsigned long *sizep)
{
	unsigned shift;
	unsigned char *pack, c;
	unsigned long size;

	if (offset >= p->pack_size)
		die("object offset outside of pack file");

	pack =  p->pack_base + offset;
	c = *pack++;
	offset++;
	*type = (c >> 4) & 7;
	size = c & 15;
	shift = 4;
	while (c & 0x80) {
		if (offset >= p->pack_size)
			die("object offset outside of pack file");
		/* shifting by the full width or more is undefined */
		if (shift >= sizeof(size) * 8)
			die("object size too large in pack file");
		c = *pack++;
		offset++;
		/* widen before shifting so the high bits are kept */
		size += (unsigned long)(c & 0x7f) << shift;
		shift += 7;
	}
	*sizep = size;
	return offset;
}

724 725 726 727 728 729 730 731 732 733 734 735 736 737 738 739 740 741 742 743 744 745 746 747 748 749 750 751 752 753 754 755 756 757 758 759 760 761 762 763 764 765 766 767 768 769 770 771 772 773 774
/*
 * Describe the pack entry "e": its type name, the size from its object
 * header and, for a delta, the immediate base's SHA1 plus the number of
 * delta links down to a non-delta object (0 for a non-delta, in which
 * case base_sha1 is not written).  *store_size is always set to 0 for
 * now.  Dies on a missing base or an unknown object type.
 * NOTE(review): this reads p->pack_base without calling
 * use_packed_git(); presumably the caller has the pack mapped --
 * confirm against callers.
 */
void packed_object_info_detail(struct pack_entry *e,
			       char *type,
			       unsigned long *size,
			       unsigned long *store_size,
			       int *delta_chain_length,
			       unsigned char *base_sha1)
{
	struct packed_git *p = e->p;
	unsigned long offset;
	unsigned char *pack;
	enum object_type kind;

	offset = unpack_object_header(p, e->offset, &kind, size);
	pack = p->pack_base + offset;
	if (kind != OBJ_DELTA)
		*delta_chain_length = 0;
	else {
		int chain_length = 0;
		memcpy(base_sha1, pack, 20);
		/* walk base to base until a non-delta object is reached */
		do {
			struct pack_entry base_ent;
			unsigned long junk;

			/* a base missing from this pack would leave
			 * base_ent uninitialized
			 */
			if (!find_pack_entry_one(pack, &base_ent, p))
				die("failed to find delta-pack base object %s",
				    sha1_to_hex(pack));
			offset = unpack_object_header(p, base_ent.offset,
						      &kind, &junk);
			pack = p->pack_base + offset;
			chain_length++;
		} while (kind == OBJ_DELTA);
		*delta_chain_length = chain_length;
	}
	switch (kind) {
	case OBJ_COMMIT:
		strcpy(type, "commit");
		break;
	case OBJ_TREE:
		strcpy(type, "tree");
		break;
	case OBJ_BLOB:
		strcpy(type, "blob");
		break;
	case OBJ_TAG:
		strcpy(type, "tag");
		break;
	default:
		die("corrupted pack file");
	}
	*store_size = 0; /* notyet */
}

775 776 777 778 779 780
static int packed_object_info(struct pack_entry *entry,
			      char *type, unsigned long *sizep)
{
	struct packed_git *p = entry->p;
	unsigned long offset, size, left;
	unsigned char *pack;
781
	enum object_type kind;
782
	int retval;
783 784 785 786

	if (use_packed_git(p))
		die("cannot map packed file");

787
	offset = unpack_object_header(p, entry->offset, &kind, &size);
788
	pack = p->pack_base + offset;
789 790 791 792
	left = p->pack_size - offset;

	switch (kind) {
	case OBJ_DELTA:
J
Junio C Hamano 已提交
793
		retval = packed_delta_info(pack, size, left, type, sizep, p);
794 795
		unuse_packed_git(p);
		return retval;
796
	case OBJ_COMMIT:
797 798
		strcpy(type, "commit");
		break;
799
	case OBJ_TREE:
800 801
		strcpy(type, "tree");
		break;
802
	case OBJ_BLOB:
803 804
		strcpy(type, "blob");
		break;
805
	case OBJ_TAG:
806 807
		strcpy(type, "tag");
		break;
808 809 810
	default:
		die("corrupted pack file");
	}
811 812
	if (sizep)
		*sizep = size;
813
	unuse_packed_git(p);
814 815 816 817 818 819 820 821 822 823
	return 0;
}

/* forward declaration for a mutually recursive function */
static void *unpack_entry(struct pack_entry *, char *, unsigned long *);

static void *unpack_delta_entry(unsigned char *base_sha1,
				unsigned long delta_size,
				unsigned long left,
				char *type,
J
Junio C Hamano 已提交
824 825
				unsigned long *sizep,
				struct packed_git *p)
826
{
J
Junio C Hamano 已提交
827
	struct pack_entry base_ent;
828 829 830 831 832 833 834 835 836 837 838 839 840 841 842 843 844 845 846 847 848 849 850 851
	void *data, *delta_data, *result, *base;
	unsigned long data_size, result_size, base_size;
	z_stream stream;
	int st;

	if (left < 20)
		die("truncated pack file");
	data = base_sha1 + 20;
	data_size = left - 20;
	delta_data = xmalloc(delta_size);

	memset(&stream, 0, sizeof(stream));

	stream.next_in = data;
	stream.avail_in = data_size;
	stream.next_out = delta_data;
	stream.avail_out = delta_size;

	inflateInit(&stream);
	st = inflate(&stream, Z_FINISH);
	inflateEnd(&stream);
	if ((st != Z_STREAM_END) || stream.total_out != delta_size)
		die("delta data unpack failed");

J
Junio C Hamano 已提交
852 853 854 855 856
	/* The base entry _must_ be in the same pack */
	if (!find_pack_entry_one(base_sha1, &base_ent, p))
		die("failed to find delta-pack base object %s",
		    sha1_to_hex(base_sha1));
	base = unpack_entry_gently(&base_ent, type, &base_size);
857 858 859 860 861 862 863 864 865 866 867 868 869 870 871 872 873 874 875 876
	if (!base)
		die("failed to read delta-pack base object %s",
		    sha1_to_hex(base_sha1));
	result = patch_delta(base, base_size,
			     delta_data, delta_size,
			     &result_size);
	if (!result)
		die("failed to apply delta");
	free(delta_data);
	free(base);
	*sizep = result_size;
	return result;
}

/*
 * Inflate a non-delta pack entry whose deflated data starts at "data"
 * ("left" bytes remain in the pack from there) into a newly allocated
 * buffer of size+1 bytes, NUL-terminated.  Returns NULL if the data
 * does not inflate to exactly "size" bytes.
 */
static void *unpack_non_delta_entry(unsigned char *data,
				    unsigned long size,
				    unsigned long left)
{
	int st;
	z_stream stream;
	unsigned char *buffer;

	buffer = xmalloc(size + 1);
	buffer[size] = 0;
	memset(&stream, 0, sizeof(stream));
	stream.next_in = data;
	stream.avail_in = left;
	stream.next_out = buffer;
	stream.avail_out = size;

	inflateInit(&stream);
	st = inflate(&stream, Z_FINISH);
	inflateEnd(&stream);
	if ((st != Z_STREAM_END) || stream.total_out != size) {
		free(buffer);
		return NULL;
	}

	return buffer;
}

/*
 * Unpack the packed object "entry", mapping its pack for the duration
 * of the call.  Fills in "type" and *sizep and returns a newly
 * allocated buffer; dies if the pack cannot be mapped or the entry
 * cannot be unpacked.
 */
static void *unpack_entry(struct pack_entry *entry,
			  char *type, unsigned long *sizep)
{
	struct packed_git *p = entry->p;
	void *retval;

	if (use_packed_git(p))
		die("cannot map packed file");
	retval = unpack_entry_gently(entry, type, sizep);
	unuse_packed_git(p);
	if (!retval)
		die("corrupted pack file");
	return retval;
}

/* The caller is responsible for use_packed_git()/unuse_packed_git() pair */
void *unpack_entry_gently(struct pack_entry *entry,
			  char *type, unsigned long *sizep)
{
	struct packed_git *p = entry->p;
	unsigned long offset, size, left;
	unsigned char *pack;
	enum object_type kind;
	void *retval;
922

923
	offset = unpack_object_header(p, entry->offset, &kind, &size);
924
	pack = p->pack_base + offset;
925 926 927
	left = p->pack_size - offset;
	switch (kind) {
	case OBJ_DELTA:
J
Junio C Hamano 已提交
928
		retval = unpack_delta_entry(pack, size, left, type, sizep, p);
929
		return retval;
930
	case OBJ_COMMIT:
931 932
		strcpy(type, "commit");
		break;
933
	case OBJ_TREE:
934 935
		strcpy(type, "tree");
		break;
936
	case OBJ_BLOB:
937 938
		strcpy(type, "blob");
		break;
939
	case OBJ_TAG:
940 941
		strcpy(type, "tag");
		break;
942
	default:
J
Junio C Hamano 已提交
943
		return NULL;
944 945
	}
	*sizep = size;
946 947
	retval = unpack_non_delta_entry(pack, size, left);
	return retval;
948 949
}

950 951
int num_packed_objects(const struct packed_git *p)
{
952
	/* See check_packed_git_idx() */
953 954 955 956 957 958 959 960 961 962 963 964 965
	return (p->index_size - 20 - 20 - 4*256) / 24;
}

/*
 * Copy the SHA1 of the n'th entry in the index of pack "p" into
 * "sha1".  Returns 0 on success, -1 when "n" is out of range.
 */
int nth_packed_object_sha1(const struct packed_git *p, int n,
			   unsigned char* sha1)
{
	/* start of the 24-byte entries (offset + sha1 each) */
	void *index = p->index_base + 256;
	const unsigned char *entry;

	if (n < 0)
		return -1;
	if (num_packed_objects(p) <= n)
		return -1;

	/* skip the 4-byte offset that leads each entry */
	entry = (const unsigned char *)index + 24 * n;
	memcpy(sha1, entry + 4, 20);
	return 0;
}

J
Junio C Hamano 已提交
966 967
int find_pack_entry_one(const unsigned char *sha1,
			struct pack_entry *e, struct packed_git *p)
968
{
969
	unsigned int *level1_ofs = p->index_base;
970 971 972 973 974 975 976 977 978 979 980 981 982 983 984 985 986 987 988 989 990 991 992 993 994 995 996
	int hi = ntohl(level1_ofs[*sha1]);
	int lo = ((*sha1 == 0x0) ? 0 : ntohl(level1_ofs[*sha1 - 1]));
	void *index = p->index_base + 256;

	do {
		int mi = (lo + hi) / 2;
		int cmp = memcmp(index + 24 * mi + 4, sha1, 20);
		if (!cmp) {
			e->offset = ntohl(*((int*)(index + 24 * mi)));
			memcpy(e->sha1, sha1, 20);
			e->p = p;
			return 1;
		}
		if (cmp > 0)
			hi = mi;
		else
			lo = mi+1;
	} while (lo < hi);
	return 0;
}

/*
 * Search every known pack, in list order, for "sha1".  Returns 1 with
 * "e" filled in by the first pack that has it, 0 if none does.
 */
static int find_pack_entry(const unsigned char *sha1, struct pack_entry *e)
{
	struct packed_git *p;
	prepare_packed_git();

	for (p = packed_git; p; p = p->next) {
		if (find_pack_entry_one(sha1, e, p))
			return 1;
	}
	return 0;
}

1003
int sha1_object_info(const unsigned char *sha1, char *type, unsigned long *sizep)
1004
{
1005
	int status;
1006 1007 1008
	unsigned long mapsize, size;
	void *map;
	z_stream stream;
1009
	char hdr[128];
1010

D
Daniel Barkalow 已提交
1011
	map = map_sha1_file_internal(sha1, &mapsize);
1012 1013 1014 1015 1016
	if (!map) {
		struct pack_entry e;

		if (!find_pack_entry(sha1, &e))
			return error("unable to find %s", sha1_to_hex(sha1));
1017
		return packed_object_info(&e, type, sizep);
1018
	}
1019 1020 1021 1022 1023
	if (unpack_sha1_header(&stream, map, mapsize, hdr, sizeof(hdr)) < 0)
		status = error("unable to unpack %s header",
			       sha1_to_hex(sha1));
	if (parse_sha1_header(hdr, type, &size) < 0)
		status = error("unable to parse %s header", sha1_to_hex(sha1));
1024
	else {
1025
		status = 0;
1026 1027
		if (sizep)
			*sizep = size;
1028 1029 1030 1031 1032 1033
	}
	inflateEnd(&stream);
	munmap(map, mapsize);
	return status;
}

1034 1035 1036 1037 1038 1039 1040 1041 1042 1043 1044
/*
 * Read object "sha1" from the packs.  Reports an error and returns
 * NULL when no pack contains it; otherwise returns what unpack_entry()
 * produces, with "type" and *size filled in.
 */
static void *read_packed_sha1(const unsigned char *sha1, char *type, unsigned long *size)
{
	struct pack_entry e;

	if (find_pack_entry(sha1, &e))
		return unpack_entry(&e, type, size);

	error("cannot read sha1_file for %s", sha1_to_hex(sha1));
	return NULL;
}

1045 1046 1047 1048
void * read_sha1_file(const unsigned char *sha1, char *type, unsigned long *size)
{
	unsigned long mapsize;
	void *map, *buf;
1049
	struct pack_entry e;
1050

1051 1052
	if (find_pack_entry(sha1, &e))
		return read_packed_sha1(sha1, type, size);
D
Daniel Barkalow 已提交
1053
	map = map_sha1_file_internal(sha1, &mapsize);
1054 1055 1056 1057 1058
	if (map) {
		buf = unpack_sha1_file(map, mapsize, type, size);
		munmap(map, mapsize);
		return buf;
	}
1059
	return NULL;
1060 1061
}

1062
/*
 * Read object "sha1", following references until an object of type
 * "required_type" is reached: a commit is followed through its
 * "tree " line and a tag through its "object " line.
 * On success returns the newly allocated object data, stores its size
 * in *size and, if "actual_sha1_return" is non-NULL, the SHA1 of the
 * object actually returned.  Returns NULL if an object cannot be read,
 * is of a type that cannot be followed, or does not start with the
 * expected reference line.
 */
void *read_object_with_reference(const unsigned char *sha1,
				 const char *required_type,
				 unsigned long *size,
				 unsigned char *actual_sha1_return)
{
	char type[20];
	void *buffer;
	unsigned long isize;
	unsigned char actual_sha1[20];

	memcpy(actual_sha1, sha1, 20);
	while (1) {
		int ref_length = -1;
		const char *ref_type = NULL;

		buffer = read_sha1_file(actual_sha1, type, &isize);
		if (!buffer)
			return NULL;
		if (!strcmp(type, required_type)) {
			*size = isize;
			if (actual_sha1_return)
				memcpy(actual_sha1_return, actual_sha1, 20);
			return buffer;
		}
		/* Handle references */
		else if (!strcmp(type, "commit"))
			ref_type = "tree ";
		else if (!strcmp(type, "tag"))
			ref_type = "object ";
		else {
			free(buffer);
			return NULL;
		}
		ref_length = strlen(ref_type);

		/* the object must be long enough to hold the reference
		 * keyword and the 40 hex digits that follow it
		 */
		if (isize < ref_length + 40 ||
		    memcmp(buffer, ref_type, ref_length) ||
		    get_sha1_hex((char *)buffer + ref_length, actual_sha1)) {
			free(buffer);
			return NULL;
		}
		/* done with the referring object; the next iteration
		 * reads a fresh buffer
		 */
		free(buffer);
		/* Now we have the ID of the referred-to object in
		 * actual_sha1.  Check again. */
	}
}

1107 1108 1109 1110 1111 1112
char *write_sha1_file_prepare(void *buf,
			      unsigned long len,
			      const char *type,
			      unsigned char *sha1,
			      unsigned char *hdr,
			      int *hdrlen)
1113 1114 1115 1116 1117 1118 1119 1120 1121 1122 1123 1124 1125 1126 1127
{
	SHA_CTX c;

	/* Generate the header */
	*hdrlen = sprintf((char *)hdr, "%s %lu", type, len)+1;

	/* Sha1.. */
	SHA1_Init(&c);
	SHA1_Update(&c, hdr, *hdrlen);
	SHA1_Update(&c, buf, len);
	SHA1_Final(sha1, &c);

	return sha1_file_name(sha1);
}

1128
int write_sha1_file(void *buf, unsigned long len, const char *type, unsigned char *returnsha1)
1129 1130
{
	int size;
1131
	unsigned char *compressed;
1132 1133
	z_stream stream;
	unsigned char sha1[20];
1134
	char *filename;
1135
	static char tmpfile[PATH_MAX];
1136
	unsigned char hdr[50];
1137
	int fd, hdrlen, ret;
1138

1139 1140 1141 1142
	/* Normally if we have it in the pack then we do not bother writing
	 * it out into .git/objects/??/?{38} file.
	 */
	filename = write_sha1_file_prepare(buf, len, type, sha1, hdr, &hdrlen);
1143 1144
	if (returnsha1)
		memcpy(returnsha1, sha1, 20);
1145 1146
	if (has_sha1_file(sha1))
		return 0;
1147 1148
	fd = open(filename, O_RDONLY);
	if (fd >= 0) {
1149
		/*
1150 1151
		 * FIXME!!! We might do collision checking here, but we'd
		 * need to uncompress the old file and check it. Later.
1152
		 */
1153
		close(fd);
1154 1155 1156
		return 0;
	}

1157 1158 1159 1160 1161 1162
	if (errno != ENOENT) {
		fprintf(stderr, "sha1 file %s: %s", filename, strerror(errno));
		return -1;
	}

	snprintf(tmpfile, sizeof(tmpfile), "%s/obj_XXXXXX", get_object_directory());
1163

1164 1165 1166 1167 1168 1169
	fd = mkstemp(tmpfile);
	if (fd < 0) {
		fprintf(stderr, "unable to create temporary sha1 filename %s: %s", tmpfile, strerror(errno));
		return -1;
	}

1170 1171 1172
	/* Set it up */
	memset(&stream, 0, sizeof(stream));
	deflateInit(&stream, Z_BEST_COMPRESSION);
1173
	size = deflateBound(&stream, len+hdrlen);
1174
	compressed = xmalloc(size);
1175 1176 1177 1178

	/* Compress it */
	stream.next_out = compressed;
	stream.avail_out = size;
1179 1180 1181 1182 1183

	/* First header.. */
	stream.next_in = hdr;
	stream.avail_in = hdrlen;
	while (deflate(&stream, 0) == Z_OK)
1184
		/* nothing */;
1185 1186 1187 1188

	/* Then the data itself.. */
	stream.next_in = buf;
	stream.avail_in = len;
1189 1190 1191 1192 1193
	while (deflate(&stream, Z_FINISH) == Z_OK)
		/* nothing */;
	deflateEnd(&stream);
	size = stream.total_out;

1194 1195
	if (write(fd, compressed, size) != size)
		die("unable to write file");
1196
	fchmod(fd, 0444);
1197
	close(fd);
1198
	free(compressed);
1199

1200
	ret = link(tmpfile, filename);
1201
	if (ret < 0) {
1202
		ret = errno;
1203 1204 1205 1206 1207 1208 1209 1210 1211 1212 1213 1214 1215

		/*
		 * Coda hack - coda doesn't like cross-directory links,
		 * so we fall back to a rename, which will mean that it
		 * won't be able to check collisions, but that's not a
		 * big deal.
		 *
		 * When this succeeds, we just return 0. We have nothing
		 * left to unlink.
		 */
		if (ret == EXDEV && !rename(tmpfile, filename))
			return 0;
	}
1216 1217 1218 1219
	unlink(tmpfile);
	if (ret) {
		if (ret != EEXIST) {
			fprintf(stderr, "unable to write sha1 filename %s: %s", filename, strerror(ret));
1220
			return -1;
1221 1222
		}
		/* FIXME!!! Collision check here ? */
1223
	}
1224

1225 1226
	return 0;
}
1227

D
Daniel Barkalow 已提交
1228 1229 1230 1231 1232
int write_sha1_to_fd(int fd, const unsigned char *sha1)
{
	ssize_t size;
	unsigned long objsize;
	int posn = 0;
1233
	void *buf = map_sha1_file_internal(sha1, &objsize);
D
Daniel Barkalow 已提交
1234 1235 1236 1237 1238 1239 1240 1241 1242 1243 1244 1245 1246 1247 1248 1249 1250 1251 1252 1253 1254 1255 1256
	z_stream stream;
	if (!buf) {
		unsigned char *unpacked;
		unsigned long len;
		char type[20];
		char hdr[50];
		int hdrlen;
		// need to unpack and recompress it by itself
		unpacked = read_packed_sha1(sha1, type, &len);

		hdrlen = sprintf(hdr, "%s %lu", type, len) + 1;

		/* Set it up */
		memset(&stream, 0, sizeof(stream));
		deflateInit(&stream, Z_BEST_COMPRESSION);
		size = deflateBound(&stream, len + hdrlen);
		buf = xmalloc(size);

		/* Compress it */
		stream.next_out = buf;
		stream.avail_out = size;
		
		/* First header.. */
1257
		stream.next_in = (void *)hdr;
D
Daniel Barkalow 已提交
1258 1259 1260 1261 1262 1263 1264 1265 1266 1267 1268 1269 1270 1271 1272 1273 1274 1275 1276 1277 1278 1279 1280 1281 1282 1283 1284 1285 1286
		stream.avail_in = hdrlen;
		while (deflate(&stream, 0) == Z_OK)
			/* nothing */;

		/* Then the data itself.. */
		stream.next_in = unpacked;
		stream.avail_in = len;
		while (deflate(&stream, Z_FINISH) == Z_OK)
			/* nothing */;
		deflateEnd(&stream);
		
		objsize = stream.total_out;
	}

	do {
		size = write(fd, buf + posn, objsize - posn);
		if (size <= 0) {
			if (!size) {
				fprintf(stderr, "write closed");
			} else {
				perror("write ");
			}
			return -1;
		}
		posn += size;
	} while (posn < objsize);
	return 0;
}

1287 1288 1289 1290 1291 1292 1293
/*
 * Receive a compressed object from fd and store it as the object file
 * for sha1.
 *
 * The incoming bytes are written verbatim to a newly created file
 * (the call fails if that file already exists) while also being
 * inflated so that the SHA1 of the uncompressed contents can be
 * checked against sha1.  The file is removed again if reading or
 * writing fails, the stream does not end cleanly, or the hash does
 * not match.
 *
 * Returns 0 on success and a negative value on any failure.
 */
int write_sha1_from_fd(const unsigned char *sha1, int fd)
{
	char *filename = sha1_file_name(sha1);

	int local;
	z_stream stream;
	unsigned char real_sha1[20];
	unsigned char buf[4096];
	unsigned char discard[4096];
	int ret;
	SHA_CTX c;

	local = open(filename, O_WRONLY | O_CREAT | O_EXCL, 0666);

	if (local < 0)
		return error("Couldn't open %s\n", filename);

	memset(&stream, 0, sizeof(stream));

	inflateInit(&stream);

	SHA1_Init(&c);

	do {
		ssize_t size;
		ssize_t written = 0;

		size = read(fd, buf, 4096);
		if (size <= 0) {
			/* cleanup below may clobber errno; keep it for perror */
			int saved_errno = errno;

			inflateEnd(&stream);
			close(local);
			unlink(filename);
			if (!size)
				return error("Connection closed?");
			errno = saved_errno;
			perror("Reading from connection");
			return -1;
		}

		/* Store everything we read; write() may be partial. */
		while (written < size) {
			ssize_t n = write(local, buf + written, size - written);
			if (n < 0 && errno == EINTR)
				continue;
			if (n <= 0) {
				inflateEnd(&stream);
				close(local);
				unlink(filename);
				return error("Couldn't write %s", filename);
			}
			written += n;
		}

		stream.avail_in = size;
		stream.next_in = buf;
		do {
			/* The inflated data is only needed for hashing. */
			stream.next_out = discard;
			stream.avail_out = sizeof(discard);
			ret = inflate(&stream, Z_SYNC_FLUSH);
			SHA1_Update(&c, discard, sizeof(discard) -
				    stream.avail_out);
		} while (stream.avail_in && ret == Z_OK);

	} while (ret == Z_OK);
	inflateEnd(&stream);

	close(local);
	SHA1_Final(real_sha1, &c);
	if (ret != Z_STREAM_END) {
		unlink(filename);
		return error("File %s corrupted", sha1_to_hex(sha1));
	}
	if (memcmp(sha1, real_sha1, 20)) {
		unlink(filename);
		return error("File %s has bad hash\n", sha1_to_hex(sha1));
	}

	return 0;
}

1349 1350 1351 1352 1353 1354
int has_sha1_pack(const unsigned char *sha1)
{
	struct pack_entry e;
	return find_pack_entry(sha1, &e);
}

1355 1356 1357
int has_sha1_file(const unsigned char *sha1)
{
	struct stat st;
1358 1359
	struct pack_entry e;

1360
	if (find_pack_entry(sha1, &e))
1361
		return 1;
1362
	return find_sha1_file(sha1, &st) ? 1 : 0;
1363
}
J
Junio C Hamano 已提交
1364

1365
/*
 * Compute the object name for the contents of fd and place it in sha1.
 *
 * st supplies the file size; fd is always closed here.  A NULL type
 * means "blob".  With write_object set the object is stored through
 * write_sha1_file() and its result is returned; otherwise only the
 * name is computed and 0 is returned.  Returns -1 if the file cannot
 * be mapped.
 */
int index_fd(unsigned char *sha1, int fd, struct stat *st, int write_object, const char *type)
{
	unsigned long size = st->st_size;
	unsigned char hdr[50];
	int hdrlen;
	int ret = 0;
	/* An empty file is never mapped; an empty string stands in for it. */
	void *buf = "";

	if (size)
		buf = mmap(NULL, size, PROT_READ, MAP_PRIVATE, fd, 0);
	close(fd);
	if (buf == MAP_FAILED)
		return -1;

	if (!type)
		type = "blob";

	if (write_object)
		ret = write_sha1_file(buf, size, type, sha1);
	else
		write_sha1_file_prepare(buf, size, type, sha1, hdr, &hdrlen);

	if (size)
		munmap(buf, size);
	return ret;
}