http.c 46.1 KB
Newer Older
1
#include "git-compat-util.h"
2
#include "http.h"
3
#include "pack.h"
4
#include "sideband.h"
5
#include "run-command.h"
6
#include "url.h"
7
#include "urlmatch.h"
8
#include "credential.h"
9
#include "version.h"
10
#include "pkt-line.h"
11
#include "gettext.h"
12
#include "transport.h"
13

J
Junio C Hamano 已提交
14
int active_requests;
15
int http_is_verbose;
16
size_t http_post_buffer = 16 * LARGE_PACKET_MAX;
17

18 19 20 21
#if LIBCURL_VERSION_NUM >= 0x070a06
#define LIBCURL_CAN_HANDLE_AUTH_ANY
#endif

T
Tay Ray Chuan 已提交
22 23
static int min_curl_sessions = 1;
static int curl_session_count;
24
#ifdef USE_CURL_MULTI
M
Mike Hommey 已提交
25 26
static int max_requests = -1;
static CURLM *curlm;
27 28
#endif
#ifndef NO_CURL_EASY_DUPHANDLE
M
Mike Hommey 已提交
29
static CURL *curl_default;
30
#endif
31 32 33

#define PREV_BUF_SIZE 4096

34 35
char curl_errorstr[CURL_ERROR_SIZE];

M
Mike Hommey 已提交
36
static int curl_ssl_verify = -1;
37
static int curl_ssl_try;
J
Junio C Hamano 已提交
38
static const char *ssl_cert;
39
static const char *ssl_cipherlist;
40 41 42 43 44 45 46 47 48 49 50 51 52 53
static const char *ssl_version;
/*
 * Table mapping the textual SSL/TLS version names that may be stored in
 * ssl_version to the value handed to libcurl's CURLOPT_SSLVERSION.
 * get_curl_handle() scans it linearly with strcmp(), so names are
 * matched case-sensitively. The "tlsv1.x" entries are only compiled in
 * when LIBCURL_VERSION_NUM is at least 0x072200.
 */
static struct {
	const char *name;	/* spelling compared against ssl_version */
	long ssl_version;	/* matching CURL_SSLVERSION_* constant */
} sslversions[] = {
	{ "sslv2", CURL_SSLVERSION_SSLv2 },
	{ "sslv3", CURL_SSLVERSION_SSLv3 },
	{ "tlsv1", CURL_SSLVERSION_TLSv1 },
#if LIBCURL_VERSION_NUM >= 0x072200
	{ "tlsv1.0", CURL_SSLVERSION_TLSv1_0 },
	{ "tlsv1.1", CURL_SSLVERSION_TLSv1_1 },
	{ "tlsv1.2", CURL_SSLVERSION_TLSv1_2 },
#endif
};
54
#if LIBCURL_VERSION_NUM >= 0x070903
J
Junio C Hamano 已提交
55
static const char *ssl_key;
56 57
#endif
#if LIBCURL_VERSION_NUM >= 0x070908
J
Junio C Hamano 已提交
58
static const char *ssl_capath;
59
#endif
J
Junio C Hamano 已提交
60
static const char *ssl_cainfo;
M
Mike Hommey 已提交
61 62
static long curl_low_speed_limit = -1;
static long curl_low_speed_time = -1;
J
Junio C Hamano 已提交
63 64
static int curl_ftp_no_epsv;
static const char *curl_http_proxy;
65
static const char *curl_cookie_file;
66
static int curl_save_cookies;
67
struct credential http_auth = CREDENTIAL_INIT;
J
Jeff King 已提交
68
static int http_proactive_auth;
69
static const char *user_agent;
70

71 72 73 74 75 76 77 78
#if LIBCURL_VERSION_NUM >= 0x071700
/* Use CURLOPT_KEYPASSWD as is */
#elif LIBCURL_VERSION_NUM >= 0x070903
#define CURLOPT_KEYPASSWD CURLOPT_SSLKEYPASSWD
#else
#define CURLOPT_KEYPASSWD CURLOPT_SSLCERTPASSWD
#endif

79
static struct credential cert_auth = CREDENTIAL_INIT;
80
static int ssl_cert_password_required;
81 82 83
#ifdef LIBCURL_CAN_HANDLE_AUTH_ANY
static unsigned long http_auth_methods = CURLAUTH_ANY;
#endif
84

M
Mike Hommey 已提交
85
static struct curl_slist *pragma_header;
86
static struct curl_slist *no_pragma_header;
87

J
Junio C Hamano 已提交
88
static struct active_request_slot *active_queue_head;
89

90 91
static char *cached_accept_language;

92
size_t fread_buffer(char *ptr, size_t eltsize, size_t nmemb, void *buffer_)
93 94
{
	size_t size = eltsize * nmemb;
95 96
	struct buffer *buffer = buffer_;

M
Mike Hommey 已提交
97 98 99
	if (size > buffer->buf.len - buffer->posn)
		size = buffer->buf.len - buffer->posn;
	memcpy(ptr, buffer->buf.buf + buffer->posn, size);
100
	buffer->posn += size;
M
Mike Hommey 已提交
101

102 103 104
	return size;
}

105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123
#ifndef NO_CURL_IOCTL
/*
 * ioctl-style companion to fread_buffer(): clientp is the same
 * "struct buffer". A CURLIOCMD_RESTARTREAD request rewinds the read
 * position to the start of the buffer, CURLIOCMD_NOP does nothing, and
 * every other command is reported as unknown.
 */
curlioerr ioctl_buffer(CURL *handle, int cmd, void *clientp)
{
	struct buffer *rewindable = clientp;

	if (cmd == CURLIOCMD_NOP)
		return CURLIOE_OK;

	if (cmd == CURLIOCMD_RESTARTREAD) {
		rewindable->posn = 0;
		return CURLIOE_OK;
	}

	return CURLIOE_UNKNOWNCMD;
}
#endif

124
/*
 * Append the eltsize * nmemb bytes at ptr to the strbuf passed as
 * buffer_ and report all of them as consumed. The signature has the
 * shape of a libcurl write callback.
 */
size_t fwrite_buffer(char *ptr, size_t eltsize, size_t nmemb, void *buffer_)
{
	size_t size = eltsize * nmemb;
	struct strbuf *buffer = buffer_;

	strbuf_add(buffer, ptr, size);
	return size;
}

133
/*
 * Write callback that discards its input: nothing is read from ptr or
 * stored anywhere, but the full byte count (eltsize * nmemb) is
 * reported back as consumed.
 */
size_t fwrite_null(char *ptr, size_t eltsize, size_t nmemb, void *strbuf)
{
	return eltsize * nmemb;
}

138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168
/*
 * Mark a slot as idle again and drop it from the count of requests
 * currently in flight. The curl handle itself is left untouched.
 */
static void closedown_active_slot(struct active_request_slot *slot)
{
	slot->in_use = 0;
	active_requests--;
}

static void finish_active_slot(struct active_request_slot *slot)
{
	closedown_active_slot(slot);
	curl_easy_getinfo(slot->curl, CURLINFO_HTTP_CODE, &slot->http_code);

	if (slot->finished != NULL)
		(*slot->finished) = 1;

	/* Store slot results so they can be read after the slot is reused */
	if (slot->results != NULL) {
		slot->results->curl_result = slot->curl_result;
		slot->results->http_code = slot->http_code;
#if LIBCURL_VERSION_NUM >= 0x070a08
		curl_easy_getinfo(slot->curl, CURLINFO_HTTPAUTH_AVAIL,
				  &slot->results->auth_avail);
#else
		slot->results->auth_avail = 0;
#endif
	}

	/* Run callback if appropriate */
	if (slot->callback_func != NULL)
		slot->callback_func(slot->callback_data);
}

169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198
#ifdef USE_CURL_MULTI
/*
 * Drain the multi handle's message queue. For every CURLMSG_DONE
 * message, find the slot that owns the finished easy handle, detach the
 * handle from the multi handle, store the transfer result in the slot
 * and finish the slot. Anything unexpected is reported on stderr.
 */
static void process_curl_messages(void)
{
	int remaining;
	CURLMsg *msg;

	while ((msg = curl_multi_info_read(curlm, &remaining)) != NULL) {
		struct active_request_slot *owner;
		int transfer_result;

		if (msg->msg != CURLMSG_DONE) {
			fprintf(stderr, "Unknown CURL message received: %d\n",
				(int)msg->msg);
			continue;
		}

		/* Read the result before the handle is removed below. */
		transfer_result = msg->data.result;

		for (owner = active_queue_head; owner; owner = owner->next)
			if (owner->curl == msg->easy_handle)
				break;

		if (!owner) {
			fprintf(stderr, "Received DONE message for unknown request!\n");
			continue;
		}

		curl_multi_remove_handle(curlm, owner->curl);
		owner->curl_result = transfer_result;
		finish_active_slot(owner);
	}
}
#endif

199
static int http_options(const char *var, const char *value, void *cb)
200 201
{
	if (!strcmp("http.sslverify", var)) {
202
		curl_ssl_verify = git_config_bool(var, value);
203 204
		return 0;
	}
205 206
	if (!strcmp("http.sslcipherlist", var))
		return git_config_string(&ssl_cipherlist, var, value);
207 208
	if (!strcmp("http.sslversion", var))
		return git_config_string(&ssl_version, var, value);
209 210
	if (!strcmp("http.sslcert", var))
		return git_config_string(&ssl_cert, var, value);
211
#if LIBCURL_VERSION_NUM >= 0x070903
212 213
	if (!strcmp("http.sslkey", var))
		return git_config_string(&ssl_key, var, value);
214 215
#endif
#if LIBCURL_VERSION_NUM >= 0x070908
216
	if (!strcmp("http.sslcapath", var))
217
		return git_config_pathname(&ssl_capath, var, value);
218
#endif
219
	if (!strcmp("http.sslcainfo", var))
220
		return git_config_pathname(&ssl_cainfo, var, value);
221
	if (!strcmp("http.sslcertpasswordprotected", var)) {
222
		ssl_cert_password_required = git_config_bool(var, value);
223 224
		return 0;
	}
225 226 227 228
	if (!strcmp("http.ssltry", var)) {
		curl_ssl_try = git_config_bool(var, value);
		return 0;
	}
T
Tay Ray Chuan 已提交
229 230 231 232 233 234 235 236
	if (!strcmp("http.minsessions", var)) {
		min_curl_sessions = git_config_int(var, value);
#ifndef USE_CURL_MULTI
		if (min_curl_sessions > 1)
			min_curl_sessions = 1;
#endif
		return 0;
	}
J
Junio C Hamano 已提交
237
#ifdef USE_CURL_MULTI
238
	if (!strcmp("http.maxrequests", var)) {
239
		max_requests = git_config_int(var, value);
240 241 242 243
		return 0;
	}
#endif
	if (!strcmp("http.lowspeedlimit", var)) {
244
		curl_low_speed_limit = (long)git_config_int(var, value);
245 246 247
		return 0;
	}
	if (!strcmp("http.lowspeedtime", var)) {
248
		curl_low_speed_time = (long)git_config_int(var, value);
249 250 251
		return 0;
	}

252 253 254 255
	if (!strcmp("http.noepsv", var)) {
		curl_ftp_no_epsv = git_config_bool(var, value);
		return 0;
	}
256 257
	if (!strcmp("http.proxy", var))
		return git_config_string(&curl_http_proxy, var, value);
258

259 260
	if (!strcmp("http.cookiefile", var))
		return git_config_string(&curl_cookie_file, var, value);
261 262 263 264
	if (!strcmp("http.savecookies", var)) {
		curl_save_cookies = git_config_bool(var, value);
		return 0;
	}
265

266 267 268 269 270 271 272
	if (!strcmp("http.postbuffer", var)) {
		http_post_buffer = git_config_int(var, value);
		if (http_post_buffer < LARGE_PACKET_MAX)
			http_post_buffer = LARGE_PACKET_MAX;
		return 0;
	}

273 274 275
	if (!strcmp("http.useragent", var))
		return git_config_string(&user_agent, var, value);

276
	/* Fall back on the default ones */
277
	return git_default_config(var, value, cb);
278 279
}

J
Junio C Hamano 已提交
280 281
/*
 * Install the credentials held in http_auth on the given curl handle.
 * Does nothing when no username is known; otherwise credential_fill()
 * is called first and the username/password are then handed to curl.
 */
static void init_curl_http_auth(CURL *result)
{
	if (!http_auth.username)
		return;

	credential_fill(&http_auth);

#if LIBCURL_VERSION_NUM >= 0x071301
	curl_easy_setopt(result, CURLOPT_USERNAME, http_auth.username);
	curl_easy_setopt(result, CURLOPT_PASSWORD, http_auth.password);
#else
	{
		static struct strbuf up = STRBUF_INIT;
		/*
		 * Note that we assume we only ever have a single set of
		 * credentials in a given program run, so we do not have
		 * to worry about updating this buffer, only setting its
		 * initial value.
		 */
		if (!up.len)
			strbuf_addf(&up, "%s:%s",
				http_auth.username, http_auth.password);
		curl_easy_setopt(result, CURLOPT_USERPWD, up.buf);
	}
#endif
}

307 308 309 310
static int has_cert_password(void)
{
	if (ssl_cert == NULL || ssl_cert_password_required != 1)
		return 0;
311 312
	if (!cert_auth.password) {
		cert_auth.protocol = xstrdup("cert");
313
		cert_auth.username = xstrdup("");
314 315 316 317
		cert_auth.path = xstrdup(ssl_cert);
		credential_fill(&cert_auth);
	}
	return 1;
318 319
}

320 321 322 323 324 325 326
/*
 * set_curl_keepalive() asks for TCP keepalive on connections made by
 * the given handle, using whichever mechanism the libcurl we were built
 * against offers:
 *
 *  - 0x071900 and later: the CURLOPT_TCP_KEEPALIVE option;
 *  - 0x071000 and later: a socket-option callback that sets
 *    SO_KEEPALIVE itself;
 *  - anything older: nothing.
 */
#if LIBCURL_VERSION_NUM >= 0x071900
static void set_curl_keepalive(CURL *c)
{
	/* curl_easy_setopt() is variadic; this option takes a long. */
	curl_easy_setopt(c, CURLOPT_TCP_KEEPALIVE, 1L);
}

#elif LIBCURL_VERSION_NUM >= 0x071000
/*
 * Socket-option callback: turn on SO_KEEPALIVE for sockets of type
 * CURLSOCKTYPE_IPCXN. A setsockopt() failure only produces a warning;
 * the callback always returns 0.
 */
static int sockopt_callback(void *client, curl_socket_t fd, curlsocktype type)
{
	int ka = 1;
	int rc;
	socklen_t len = (socklen_t)sizeof(ka);

	if (type != CURLSOCKTYPE_IPCXN)
		return 0;

	rc = setsockopt(fd, SOL_SOCKET, SO_KEEPALIVE, (void *)&ka, len);
	if (rc < 0)
		warning("unable to set SO_KEEPALIVE on socket %s",
			strerror(errno));

	return 0; /* CURL_SOCKOPT_OK only exists since curl 7.21.5 */
}

static void set_curl_keepalive(CURL *c)
{
	curl_easy_setopt(c, CURLOPT_SOCKOPTFUNCTION, sockopt_callback);
}

#else
static void set_curl_keepalive(CURL *c)
{
	/* not supported on older curl versions */
}
#endif

J
Junio C Hamano 已提交
356
static CURL *get_curl_handle(void)
357
{
J
Junio C Hamano 已提交
358
	CURL *result = curl_easy_init();
359
	long allowed_protocols = 0;
360

361 362 363
	if (!result)
		die("curl_easy_init failed");

364 365 366 367 368 369 370 371 372 373
	if (!curl_ssl_verify) {
		curl_easy_setopt(result, CURLOPT_SSL_VERIFYPEER, 0);
		curl_easy_setopt(result, CURLOPT_SSL_VERIFYHOST, 0);
	} else {
		/* Verify authenticity of the peer's certificate */
		curl_easy_setopt(result, CURLOPT_SSL_VERIFYPEER, 1);
		/* The name in the cert must match whom we tried to connect */
		curl_easy_setopt(result, CURLOPT_SSL_VERIFYHOST, 2);
	}

374 375 376
#if LIBCURL_VERSION_NUM >= 0x070907
	curl_easy_setopt(result, CURLOPT_NETRC, CURL_NETRC_OPTIONAL);
#endif
377
#ifdef LIBCURL_CAN_HANDLE_AUTH_ANY
J
Junio C Hamano 已提交
378
	curl_easy_setopt(result, CURLOPT_HTTPAUTH, CURLAUTH_ANY);
379
#endif
380

J
Jeff King 已提交
381 382 383
	if (http_proactive_auth)
		init_curl_http_auth(result);

384 385 386 387 388 389 390 391 392 393 394 395 396 397 398 399
	if (getenv("GIT_SSL_VERSION"))
		ssl_version = getenv("GIT_SSL_VERSION");
	if (ssl_version && *ssl_version) {
		int i;
		for (i = 0; i < ARRAY_SIZE(sslversions); i++) {
			if (!strcmp(ssl_version, sslversions[i].name)) {
				curl_easy_setopt(result, CURLOPT_SSLVERSION,
						 sslversions[i].ssl_version);
				break;
			}
		}
		if (i == ARRAY_SIZE(sslversions))
			warning("unsupported ssl version %s: using default",
				ssl_version);
	}

400 401 402 403 404 405
	if (getenv("GIT_SSL_CIPHER_LIST"))
		ssl_cipherlist = getenv("GIT_SSL_CIPHER_LIST");
	if (ssl_cipherlist != NULL && *ssl_cipherlist)
		curl_easy_setopt(result, CURLOPT_SSL_CIPHER_LIST,
				ssl_cipherlist);

406 407
	if (ssl_cert != NULL)
		curl_easy_setopt(result, CURLOPT_SSLCERT, ssl_cert);
408
	if (has_cert_password())
409
		curl_easy_setopt(result, CURLOPT_KEYPASSWD, cert_auth.password);
410
#if LIBCURL_VERSION_NUM >= 0x070903
411 412 413 414 415 416 417 418 419 420 421 422 423 424 425 426 427 428
	if (ssl_key != NULL)
		curl_easy_setopt(result, CURLOPT_SSLKEY, ssl_key);
#endif
#if LIBCURL_VERSION_NUM >= 0x070908
	if (ssl_capath != NULL)
		curl_easy_setopt(result, CURLOPT_CAPATH, ssl_capath);
#endif
	if (ssl_cainfo != NULL)
		curl_easy_setopt(result, CURLOPT_CAINFO, ssl_cainfo);

	if (curl_low_speed_limit > 0 && curl_low_speed_time > 0) {
		curl_easy_setopt(result, CURLOPT_LOW_SPEED_LIMIT,
				 curl_low_speed_limit);
		curl_easy_setopt(result, CURLOPT_LOW_SPEED_TIME,
				 curl_low_speed_time);
	}

	curl_easy_setopt(result, CURLOPT_FOLLOWLOCATION, 1);
B
Blake Burkhart 已提交
429
	curl_easy_setopt(result, CURLOPT_MAXREDIRS, 20);
430 431 432 433 434
#if LIBCURL_VERSION_NUM >= 0x071301
	curl_easy_setopt(result, CURLOPT_POSTREDIR, CURL_REDIR_POST_ALL);
#elif LIBCURL_VERSION_NUM >= 0x071101
	curl_easy_setopt(result, CURLOPT_POST301, 1);
#endif
435 436 437 438 439 440 441 442 443 444 445 446 447 448 449
#if LIBCURL_VERSION_NUM >= 0x071304
	if (is_transport_allowed("http"))
		allowed_protocols |= CURLPROTO_HTTP;
	if (is_transport_allowed("https"))
		allowed_protocols |= CURLPROTO_HTTPS;
	if (is_transport_allowed("ftp"))
		allowed_protocols |= CURLPROTO_FTP;
	if (is_transport_allowed("ftps"))
		allowed_protocols |= CURLPROTO_FTPS;
	curl_easy_setopt(result, CURLOPT_REDIR_PROTOCOLS, allowed_protocols);
#else
	if (transport_restrict_protocols())
		warning("protocol restrictions not applied to curl redirects because\n"
			"your curl version is too old (>= 7.19.4)");
#endif
450

451 452 453
	if (getenv("GIT_CURL_VERBOSE"))
		curl_easy_setopt(result, CURLOPT_VERBOSE, 1);

454
	curl_easy_setopt(result, CURLOPT_USERAGENT,
455
		user_agent ? user_agent : git_user_agent());
456

457 458 459
	if (curl_ftp_no_epsv)
		curl_easy_setopt(result, CURLOPT_FTP_USE_EPSV, 0);

460 461 462 463 464
#ifdef CURLOPT_USE_SSL
	if (curl_ssl_try)
		curl_easy_setopt(result, CURLOPT_USE_SSL, CURLUSESSL_TRY);
#endif

465
	if (curl_http_proxy) {
466
		curl_easy_setopt(result, CURLOPT_PROXY, curl_http_proxy);
P
Pat Thoyts 已提交
467 468 469 470 471 472 473 474 475 476 477
#if LIBCURL_VERSION_NUM >= 0x071800
		if (starts_with(curl_http_proxy, "socks5"))
			curl_easy_setopt(result,
				CURLOPT_PROXYTYPE, CURLPROXY_SOCKS5);
		else if (starts_with(curl_http_proxy, "socks4a"))
			curl_easy_setopt(result,
				CURLOPT_PROXYTYPE, CURLPROXY_SOCKS4A);
		else if (starts_with(curl_http_proxy, "socks"))
			curl_easy_setopt(result,
				CURLOPT_PROXYTYPE, CURLPROXY_SOCKS4);
#endif
478
	}
T
Tom G. Christensen 已提交
479
#if LIBCURL_VERSION_NUM >= 0x070a07
480
	curl_easy_setopt(result, CURLOPT_PROXYAUTH, CURLAUTH_ANY);
T
Tom G. Christensen 已提交
481
#endif
482

483
	set_curl_keepalive(result);
E
Eric Wong 已提交
484

485 486 487
	return result;
}

488 489 490 491 492 493 494
/*
 * Overwrite *var with the value of the environment variable envname,
 * but only when that variable is set; otherwise *var is left alone.
 * The stored pointer is the one returned by getenv().
 */
static void set_from_env(const char **var, const char *envname)
{
	const char *override = getenv(envname);

	if (!override)
		return;
	*var = override;
}

J
Jeff King 已提交
495
void http_init(struct remote *remote, const char *url, int proactive_auth)
496 497 498
{
	char *low_speed_limit;
	char *low_speed_time;
499 500 501 502 503 504 505 506
	char *normalized_url;
	struct urlmatch_config config = { STRING_LIST_INIT_DUP };

	config.section = "http";
	config.key = NULL;
	config.collect_fn = http_options;
	config.cascade_fn = git_default_config;
	config.cb = NULL;
507

508
	http_is_verbose = 0;
509
	normalized_url = url_normalize(url, &config.url);
510

511 512
	git_config(urlmatch_config_entry, &config);
	free(normalized_url);
513

514 515
	if (curl_global_init(CURL_GLOBAL_ALL) != CURLE_OK)
		die("curl_global_init failed");
516

J
Jeff King 已提交
517 518
	http_proactive_auth = proactive_auth;

519 520 521
	if (remote && remote->http_proxy)
		curl_http_proxy = xstrdup(remote->http_proxy);

522
	pragma_header = curl_slist_append(pragma_header, "Pragma: no-cache");
523
	no_pragma_header = curl_slist_append(no_pragma_header, "Pragma:");
524 525 526 527 528 529 530 531 532

#ifdef USE_CURL_MULTI
	{
		char *http_max_requests = getenv("GIT_HTTP_MAX_REQUESTS");
		if (http_max_requests != NULL)
			max_requests = atoi(http_max_requests);
	}

	curlm = curl_multi_init();
533 534
	if (!curlm)
		die("curl_multi_init failed");
535 536 537 538 539
#endif

	if (getenv("GIT_SSL_NO_VERIFY"))
		curl_ssl_verify = 0;

540
	set_from_env(&ssl_cert, "GIT_SSL_CERT");
541
#if LIBCURL_VERSION_NUM >= 0x070903
542
	set_from_env(&ssl_key, "GIT_SSL_KEY");
543 544
#endif
#if LIBCURL_VERSION_NUM >= 0x070908
545
	set_from_env(&ssl_capath, "GIT_SSL_CAPATH");
546
#endif
547
	set_from_env(&ssl_cainfo, "GIT_SSL_CAINFO");
548

549 550
	set_from_env(&user_agent, "GIT_HTTP_USER_AGENT");

551 552 553 554 555 556 557 558 559 560
	low_speed_limit = getenv("GIT_HTTP_LOW_SPEED_LIMIT");
	if (low_speed_limit != NULL)
		curl_low_speed_limit = strtol(low_speed_limit, NULL, 10);
	low_speed_time = getenv("GIT_HTTP_LOW_SPEED_TIME");
	if (low_speed_time != NULL)
		curl_low_speed_time = strtol(low_speed_time, NULL, 10);

	if (curl_ssl_verify == -1)
		curl_ssl_verify = 1;

T
Tay Ray Chuan 已提交
561
	curl_session_count = 0;
562 563 564 565 566
#ifdef USE_CURL_MULTI
	if (max_requests < 1)
		max_requests = DEFAULT_MAX_REQUESTS;
#endif

567 568 569
	if (getenv("GIT_CURL_FTP_NO_EPSV"))
		curl_ftp_no_epsv = 1;

570
	if (url) {
571
		credential_from_url(&http_auth, url);
572 573
		if (!ssl_cert_password_required &&
		    getenv("GIT_SSL_CERT_PASSWORD_PROTECTED") &&
574
		    starts_with(url, "https://"))
575 576
			ssl_cert_password_required = 1;
	}
J
Junio C Hamano 已提交
577

578 579 580 581 582 583 584 585 586 587
#ifndef NO_CURL_EASY_DUPHANDLE
	curl_default = get_curl_handle();
#endif
}

void http_cleanup(void)
{
	struct active_request_slot *slot = active_queue_head;

	while (slot != NULL) {
588
		struct active_request_slot *next = slot->next;
589
		if (slot->curl != NULL) {
590
#ifdef USE_CURL_MULTI
591
			curl_multi_remove_handle(curlm, slot->curl);
592 593
#endif
			curl_easy_cleanup(slot->curl);
594
		}
595 596
		free(slot);
		slot = next;
597
	}
598
	active_queue_head = NULL;
599 600 601 602 603 604 605 606 607

#ifndef NO_CURL_EASY_DUPHANDLE
	curl_easy_cleanup(curl_default);
#endif

#ifdef USE_CURL_MULTI
	curl_multi_cleanup(curlm);
#endif
	curl_global_cleanup();
N
Nick Hengeveld 已提交
608 609

	curl_slist_free_all(pragma_header);
610
	pragma_header = NULL;
611

612 613 614
	curl_slist_free_all(no_pragma_header);
	no_pragma_header = NULL;

615
	if (curl_http_proxy) {
616
		free((void *)curl_http_proxy);
617 618
		curl_http_proxy = NULL;
	}
619

620 621 622 623
	if (cert_auth.password != NULL) {
		memset(cert_auth.password, 0, strlen(cert_auth.password));
		free(cert_auth.password);
		cert_auth.password = NULL;
624 625
	}
	ssl_cert_password_required = 0;
626 627 628

	free(cached_accept_language);
	cached_accept_language = NULL;
629 630 631 632 633 634 635 636 637 638 639 640 641
}

struct active_request_slot *get_active_slot(void)
{
	struct active_request_slot *slot = active_queue_head;
	struct active_request_slot *newslot;

#ifdef USE_CURL_MULTI
	int num_transfers;

	/* Wait for a slot to open up if the queue is full */
	while (active_requests >= max_requests) {
		curl_multi_perform(curlm, &num_transfers);
J
Junio C Hamano 已提交
642
		if (num_transfers < active_requests)
643 644 645 646
			process_curl_messages();
	}
#endif

J
Junio C Hamano 已提交
647
	while (slot != NULL && slot->in_use)
648
		slot = slot->next;
J
Junio C Hamano 已提交
649

650 651 652 653 654 655 656 657 658 659
	if (slot == NULL) {
		newslot = xmalloc(sizeof(*newslot));
		newslot->curl = NULL;
		newslot->in_use = 0;
		newslot->next = NULL;

		slot = active_queue_head;
		if (slot == NULL) {
			active_queue_head = newslot;
		} else {
J
Junio C Hamano 已提交
660
			while (slot->next != NULL)
661 662 663 664 665 666 667 668 669 670 671 672
				slot = slot->next;
			slot->next = newslot;
		}
		slot = newslot;
	}

	if (slot->curl == NULL) {
#ifdef NO_CURL_EASY_DUPHANDLE
		slot->curl = get_curl_handle();
#else
		slot->curl = curl_easy_duphandle(curl_default);
#endif
T
Tay Ray Chuan 已提交
673
		curl_session_count++;
674 675 676 677
	}

	active_requests++;
	slot->in_use = 1;
678
	slot->results = NULL;
N
Nick Hengeveld 已提交
679
	slot->finished = NULL;
680 681
	slot->callback_data = NULL;
	slot->callback_func = NULL;
682
	curl_easy_setopt(slot->curl, CURLOPT_COOKIEFILE, curl_cookie_file);
683 684
	if (curl_save_cookies)
		curl_easy_setopt(slot->curl, CURLOPT_COOKIEJAR, curl_cookie_file);
685 686
	curl_easy_setopt(slot->curl, CURLOPT_HTTPHEADER, pragma_header);
	curl_easy_setopt(slot->curl, CURLOPT_ERRORBUFFER, curl_errorstr);
687 688 689
	curl_easy_setopt(slot->curl, CURLOPT_CUSTOMREQUEST, NULL);
	curl_easy_setopt(slot->curl, CURLOPT_READFUNCTION, NULL);
	curl_easy_setopt(slot->curl, CURLOPT_WRITEFUNCTION, NULL);
690
	curl_easy_setopt(slot->curl, CURLOPT_POSTFIELDS, NULL);
691 692
	curl_easy_setopt(slot->curl, CURLOPT_UPLOAD, 0);
	curl_easy_setopt(slot->curl, CURLOPT_HTTPGET, 1);
693
	curl_easy_setopt(slot->curl, CURLOPT_FAILONERROR, 1);
694
	curl_easy_setopt(slot->curl, CURLOPT_RANGE, NULL);
695 696 697
#ifdef LIBCURL_CAN_HANDLE_AUTH_ANY
	curl_easy_setopt(slot->curl, CURLOPT_HTTPAUTH, http_auth_methods);
#endif
698 699
	if (http_auth.password)
		init_curl_http_auth(slot->curl);
700 701 702 703 704 705 706 707

	return slot;
}

/*
 * Kick off the request configured on "slot".
 *
 * With the multi interface the slot's handle is added to the multi
 * handle and one round of curl_multi_perform() is run. If adding the
 * handle fails, the slot is released again and 0 is returned.
 * Without the multi interface nothing happens here.
 *
 * Returns 1 on success, 0 on failure.
 */
int start_active_slot(struct active_request_slot *slot)
{
#ifdef USE_CURL_MULTI
	CURLMcode curlm_result = curl_multi_add_handle(curlm, slot->curl);
	int num_transfers;

	if (curlm_result != CURLM_OK &&
	    curlm_result != CURLM_CALL_MULTI_PERFORM) {
		closedown_active_slot(slot);
		return 0;
	}

	/*
	 * We know there must be something to do, since we just added
	 * something.
	 */
	curl_multi_perform(curlm, &num_transfers);
#endif
	return 1;
}

#ifdef USE_CURL_MULTI
727 728 729 730 731 732
/*
 * One entry in the singly linked list of "fill" callbacks registered
 * through add_fill_function() and walked by fill_active_slots().
 */
struct fill_chain {
	void *data;			/* opaque argument handed to fill() */
	int (*fill)(void *);		/* callback; a nonzero return ends the current pass over the list */
	struct fill_chain *next;	/* next registered entry, or NULL */
};

J
Junio C Hamano 已提交
733
static struct fill_chain *fill_cfg;
734 735 736

void add_fill_function(void *data, int (*fill)(void *))
{
737
	struct fill_chain *new = xmalloc(sizeof(*new));
738 739 740 741 742 743 744 745 746
	struct fill_chain **linkp = &fill_cfg;
	new->data = data;
	new->fill = fill;
	new->next = NULL;
	while (*linkp)
		linkp = &(*linkp)->next;
	*linkp = new;
}

747 748 749 750
void fill_active_slots(void)
{
	struct active_request_slot *slot = active_queue_head;

751 752 753 754 755 756 757
	while (active_requests < max_requests) {
		struct fill_chain *fill;
		for (fill = fill_cfg; fill; fill = fill->next)
			if (fill->fill(fill->data))
				break;

		if (!fill)
758
			break;
759
	}
760 761

	while (slot != NULL) {
T
Tay Ray Chuan 已提交
762 763
		if (!slot->in_use && slot->curl != NULL
			&& curl_session_count > min_curl_sessions) {
764 765
			curl_easy_cleanup(slot->curl);
			slot->curl = NULL;
T
Tay Ray Chuan 已提交
766
			curl_session_count--;
767 768 769 770 771
		}
		slot = slot->next;
	}
}

772 773 774 775 776 777 778 779 780 781 782 783 784 785 786 787 788 789 790 791 792 793 794
/*
 * Drive the multi handle: call curl_multi_perform() until it stops
 * asking to be called again. If fewer transfers are still running than
 * we count as active, collect the completion messages and try to
 * start new requests.
 */
void step_active_slots(void)
{
	int still_running;
	CURLMcode rc;

	rc = curl_multi_perform(curlm, &still_running);
	while (rc == CURLM_CALL_MULTI_PERFORM)
		rc = curl_multi_perform(curlm, &still_running);

	if (still_running >= active_requests)
		return;

	process_curl_messages();
	fill_active_slots();
}
#endif

/*
 * Run the request on "slot" to completion.
 *
 * With the multi interface this repeatedly steps all active slots and,
 * while this slot is still in use, waits in select() on curl's file
 * descriptors until the slot's "finished" flag has been raised by
 * finish_active_slot(). Without the multi interface the transfer is
 * performed synchronously and the slot is finished directly.
 */
void run_active_slot(struct active_request_slot *slot)
{
#ifdef USE_CURL_MULTI
	fd_set readfds;
	fd_set writefds;
	fd_set excfds;
	int max_fd;
	struct timeval select_timeout;
	int finished = 0;

	slot->finished = &finished;
	while (!finished) {
		step_active_slots();

		if (slot->in_use) {
#if LIBCURL_VERSION_NUM >= 0x070f04
			long curl_timeout;
			curl_multi_timeout(curlm, &curl_timeout);
			if (curl_timeout == 0) {
				continue;
			} else if (curl_timeout == -1) {
				select_timeout.tv_sec  = 0;
				select_timeout.tv_usec = 50000;
			} else {
				select_timeout.tv_sec  =  curl_timeout / 1000;
				select_timeout.tv_usec = (curl_timeout % 1000) * 1000;
			}
#else
			select_timeout.tv_sec  = 0;
			select_timeout.tv_usec = 50000;
#endif

			max_fd = -1;
			FD_ZERO(&readfds);
			FD_ZERO(&writefds);
			FD_ZERO(&excfds);
			curl_multi_fdset(curlm, &readfds, &writefds, &excfds, &max_fd);

			/*
			 * It can happen that curl_multi_timeout returns a pathologically
			 * long timeout when curl_multi_fdset returns no file descriptors
			 * to read.  See commit message for more details.
			 */
			if (max_fd < 0 &&
			    (select_timeout.tv_sec > 0 ||
			     select_timeout.tv_usec > 50000)) {
				select_timeout.tv_sec  = 0;
				select_timeout.tv_usec = 50000;
			}

			select(max_fd+1, &readfds, &writefds, &excfds, &select_timeout);
		}
	}

	/*
	 * "finished" lives on our stack. If the slot still refers to it
	 * (i.e. the slot has not been handed out again, which resets the
	 * pointer), clear the reference so no dangling pointer to this
	 * frame survives the return.
	 */
	if (slot->finished == &finished)
		slot->finished = NULL;
#else
	while (slot->in_use) {
		slot->curl_result = curl_easy_perform(slot->curl);
		finish_active_slot(slot);
	}
#endif
}

848
static void release_active_slot(struct active_request_slot *slot)
849 850
{
	closedown_active_slot(slot);
T
Tay Ray Chuan 已提交
851
	if (slot->curl && curl_session_count > min_curl_sessions) {
N
Nick Hengeveld 已提交
852
#ifdef USE_CURL_MULTI
853
		curl_multi_remove_handle(curlm, slot->curl);
N
Nick Hengeveld 已提交
854
#endif
855 856
		curl_easy_cleanup(slot->curl);
		slot->curl = NULL;
T
Tay Ray Chuan 已提交
857
		curl_session_count--;
858
	}
N
Nick Hengeveld 已提交
859
#ifdef USE_CURL_MULTI
860
	fill_active_slots();
N
Nick Hengeveld 已提交
861
#endif
862 863
}

864 865 866 867 868 869 870 871 872 873 874 875
/*
 * Run every slot that is still in use to completion. After each
 * completed run the scan restarts from the head of the queue; the
 * function returns once a full pass finds no slot in use.
 */
void finish_all_active_slots(void)
{
	struct active_request_slot *cur = active_queue_head;

	while (cur) {
		if (!cur->in_use) {
			cur = cur->next;
			continue;
		}
		run_active_slot(cur);
		cur = active_queue_head;
	}
}
876

877
/* Helpers for modifying and creating URLs */
878 879 880 881 882 883 884 885 886 887 888 889 890 891
/*
 * Decide whether a character must be percent-encoded when placed in a
 * URL: returns 0 for ASCII letters, ASCII digits, '/', '-' and '.',
 * and 1 for everything else.
 */
static inline int needs_quote(int ch)
{
	if (ch >= 'A' && ch <= 'Z')
		return 0;
	if (ch >= 'a' && ch <= 'z')
		return 0;
	if (ch >= '0' && ch <= '9')
		return 0;

	switch (ch) {
	case '/':
	case '-':
	case '.':
		return 0;
	default:
		return 1;
	}
}

static char *quote_ref_url(const char *base, const char *ref)
{
892
	struct strbuf buf = STRBUF_INIT;
893
	const char *cp;
894
	int ch;
895

896
	end_url_with_slash(&buf, base);
897 898

	for (cp = ref; (ch = *cp) != 0; cp++)
899
		if (needs_quote(ch))
900
			strbuf_addf(&buf, "%%%02x", ch);
901
		else
902
			strbuf_addch(&buf, *cp);
903

904
	return strbuf_detach(&buf, NULL);
905 906
}

907 908 909 910
/*
 * Append the URL of a loose object to "buf": "url" (passed through
 * end_url_with_slash()), then "objects/", the first two characters of
 * "hex" and a slash. Unless only_two_digit_prefix is set, the rest of
 * "hex" follows.
 *
 * "hex" must be at least two characters long, since hex + 2 is read
 * when the full name is requested.
 */
void append_remote_object_url(struct strbuf *buf, const char *url,
			      const char *hex,
			      int only_two_digit_prefix)
{
	end_url_with_slash(buf, url);

	strbuf_addf(buf, "objects/%.*s/", 2, hex);
	if (!only_two_digit_prefix)
		strbuf_addf(buf, "%s", hex+2);
}

char *get_remote_object_url(const char *url, const char *hex,
			    int only_two_digit_prefix)
{
	struct strbuf buf = STRBUF_INIT;
	append_remote_object_url(&buf, url, hex, only_two_digit_prefix);
	return strbuf_detach(&buf, NULL);
}

926
static int handle_curl_result(struct slot_results *results)
927
{
J
Jeff King 已提交
928 929 930 931 932 933 934 935 936 937 938 939 940 941 942 943 944 945 946
	/*
	 * If we see a failing http code with CURLE_OK, we have turned off
	 * FAILONERROR (to keep the server's custom error response), and should
	 * translate the code into failure here.
	 */
	if (results->curl_result == CURLE_OK &&
	    results->http_code >= 400) {
		results->curl_result = CURLE_HTTP_RETURNED_ERROR;
		/*
		 * Normally curl will already have put the "reason phrase"
		 * from the server into curl_errorstr; unfortunately without
		 * FAILONERROR it is lost, so we can give only the numeric
		 * status code.
		 */
		snprintf(curl_errorstr, sizeof(curl_errorstr),
			 "The requested URL returned error: %ld",
			 results->http_code);
	}

947 948 949 950 951 952 953 954 955 956
	if (results->curl_result == CURLE_OK) {
		credential_approve(&http_auth);
		return HTTP_OK;
	} else if (missing_target(results))
		return HTTP_MISSING_TARGET;
	else if (results->http_code == 401) {
		if (http_auth.username && http_auth.password) {
			credential_reject(&http_auth);
			return HTTP_NOAUTH;
		} else {
957 958 959
#ifdef LIBCURL_CAN_HANDLE_AUTH_ANY
			http_auth_methods &= ~CURLAUTH_GSSNEGOTIATE;
#endif
960 961 962
			return HTTP_REAUTH;
		}
	} else {
963
#if LIBCURL_VERSION_NUM >= 0x070c00
964 965 966 967
		if (!curl_errorstr[0])
			strlcpy(curl_errorstr,
				curl_easy_strerror(results->curl_result),
				sizeof(curl_errorstr));
968
#endif
969 970 971 972
		return HTTP_ERROR;
	}
}

J
Jeff King 已提交
973 974 975 976 977 978 979 980 981 982 983 984 985 986
/*
 * Start the request on "slot", run it to completion and return the
 * HTTP_* status computed from "results". If the request cannot be
 * started, curl_errorstr is set and HTTP_START_FAILED is returned.
 */
int run_one_slot(struct active_request_slot *slot,
		 struct slot_results *results)
{
	slot->results = results;

	if (start_active_slot(slot)) {
		run_active_slot(slot);
		return handle_curl_result(results);
	}

	snprintf(curl_errorstr, sizeof(curl_errorstr),
		 "failed to start HTTP request");
	return HTTP_START_FAILED;
}

987 988 989 990 991 992 993 994 995 996 997 998
/*
 * Fetch a string-valued piece of information from a curl handle into
 * "buf". The buffer is always emptied first; it is filled only when
 * curl_easy_getinfo() succeeds and yields a non-NULL string.
 *
 * Returns the curl_easy_getinfo() result code.
 */
static CURLcode curlinfo_strbuf(CURL *curl, CURLINFO info, struct strbuf *buf)
{
	char *value;
	CURLcode rc;

	strbuf_reset(buf);

	rc = curl_easy_getinfo(curl, info, &value);
	if (rc || !value)
		return rc;

	strbuf_addstr(buf, value);
	return rc;
}

999 1000 1001 1002 1003 1004 1005 1006 1007 1008 1009 1010 1011 1012 1013 1014 1015 1016 1017 1018 1019
/*
 * Check for and extract a content-type parameter. "raw"
 * should be positioned at the start of the potential
 * parameter, with any whitespace already removed.
 *
 * "name" is the name of the parameter (matched case-insensitively and
 * required to be followed directly by '='). The value, which runs up
 * to the next whitespace, ';' or end of string, is appended to "out".
 *
 * Returns 0 if the parameter was found, -1 otherwise (in which case
 * "out" is left untouched).
 */
static int extract_param(const char *raw, const char *name,
			 struct strbuf *out)
{
	size_t len = strlen(name);

	if (strncasecmp(raw, name, len))
		return -1;
	raw += len;

	if (*raw != '=')
		return -1;
	raw++;

	while (*raw && !isspace(*raw) && *raw != ';')
		strbuf_addch(out, *raw++);
	return 0;
}

1025 1026 1027 1028 1029 1030 1031 1032 1033 1034
/*
 * Extract a normalized version of the content type, with any
 * spaces suppressed, all letters lowercased, and no trailing ";"
 * or parameters.
 *
 * Note that we will silently remove even invalid whitespace. For
 * example, "text / plain" is specifically forbidden by RFC 2616,
 * but "text/plain" is the only reasonable output, and this keeps
 * our code simple.
 *
1035 1036 1037
 * If the "charset" argument is not NULL, store the value of any
 * charset parameter there.
 *
1038
 * Example:
1039
 *   "TEXT/PLAIN; charset=utf-8" -> "text/plain", "utf-8"
1040 1041
 *   "text / plain" -> "text/plain"
 */
1042 1043
static void extract_content_type(struct strbuf *raw, struct strbuf *type,
				 struct strbuf *charset)
1044 1045 1046 1047 1048 1049 1050 1051
{
	const char *p;

	strbuf_reset(type);
	strbuf_grow(type, raw->len);
	for (p = raw->buf; *p; p++) {
		if (isspace(*p))
			continue;
1052 1053
		if (*p == ';') {
			p++;
1054
			break;
1055
		}
1056 1057
		strbuf_addch(type, tolower(*p));
	}
1058 1059 1060 1061 1062 1063

	if (!charset)
		return;

	strbuf_reset(charset);
	while (*p) {
1064
		while (isspace(*p) || *p == ';')
1065 1066 1067 1068 1069 1070
			p++;
		if (!extract_param(p, "charset", charset))
			return;
		while (*p && !isspace(*p))
			p++;
	}
1071 1072 1073

	if (!charset->len && starts_with(type->buf, "text/"))
		strbuf_addstr(charset, "ISO-8859-1");
1074 1075
}

1076 1077 1078 1079 1080 1081 1082 1083 1084 1085 1086 1087 1088 1089 1090 1091 1092 1093 1094 1095 1096 1097 1098 1099 1100 1101 1102 1103 1104 1105 1106 1107 1108 1109 1110 1111 1112 1113 1114 1115 1116 1117 1118 1119 1120 1121 1122 1123 1124 1125 1126 1127 1128 1129 1130 1131 1132 1133 1134 1135
/*
 * Build an "Accept-Language: ..." header line in "buf" from the
 * colon-separated list returned by get_preferred_languages(). Nothing
 * is written when that list is NULL or yields no usable language tag.
 *
 * From each list entry only the leading run of alphanumerics and '_' is
 * kept (with '_' rewritten as '-'); the rest of the entry is dropped.
 * A final "*" entry is always added. Every entry except the first gets
 * a descending ";q=0.N" weight, and entries that would push the header
 * past MAX_ACCEPT_LANGUAGE_HEADER_SIZE bytes are left out.
 */
static void write_accept_language(struct strbuf *buf)
{
	/*
	 * MAX_DECIMAL_PLACES must not be larger than 3. If it is larger than
	 * that, q-value will be smaller than 0.001, the minimum q-value the
	 * HTTP specification allows. See
	 * http://tools.ietf.org/html/rfc7231#section-5.3.1 for q-value.
	 */
	const int MAX_DECIMAL_PLACES = 3;
	const int MAX_LANGUAGE_TAGS = 1000;
	const int MAX_ACCEPT_LANGUAGE_HEADER_SIZE = 4000;
	const char *s = get_preferred_languages();
	struct strbuf tag = STRBUF_INIT;
	char **language_tags = NULL;
	int num_langs = 0;
	int i;

	/* No preferred language means no Accept-Language header at all. */
	if (!s)
		return;

	/* Break the colon-separated list up into language_tags[]. */
	do {
		/* the tag proper: alphanumerics, with '_' turned into '-' */
		while (*s && (isalnum(*s) || *s == '_')) {
			strbuf_addch(&tag, *s == '_' ? '-' : *s);
			s++;
		}

		/* drop .codeset, @modifier and anything else up to ':' */
		while (*s && *s != ':')
			s++;

		if (!tag.len)
			continue;

		REALLOC_ARRAY(language_tags, num_langs + 1);
		language_tags[num_langs++] = strbuf_detach(&tag, NULL);
		if (num_langs >= MAX_LANGUAGE_TAGS - 1) /* -1 for '*' */
			break;
	} while (*s++);

	/* Emit the header itself. */
	if (num_langs) {
		int last_buf_len = 0;
		int max_q = 1;
		int decimal_places = 0;
		char q_format[32];

		/* the catch-all entry; a string literal, so never freed */
		REALLOC_ARRAY(language_tags, num_langs + 1);
		language_tags[num_langs++] = "*";

		/* how many digits are needed to give each entry its own q */
		while (max_q < num_langs &&
		       decimal_places <= MAX_DECIMAL_PLACES) {
			decimal_places++;
			max_q *= 10;
		}

		xsnprintf(q_format, sizeof(q_format), ";q=0.%%0%dd", decimal_places);

		strbuf_addstr(buf, "Accept-Language: ");

		for (i = 0; i < num_langs; i++) {
			if (i == 0) {
				strbuf_addstr(buf, language_tags[i]);
			} else {
				strbuf_addstr(buf, ", ");
				strbuf_addstr(buf, language_tags[i]);
				strbuf_addf(buf, q_format, max_q - i);
			}

			/* too long: roll back to the last entry that fit */
			if (buf->len > MAX_ACCEPT_LANGUAGE_HEADER_SIZE) {
				strbuf_remove(buf, last_buf_len, buf->len - last_buf_len);
				break;
			}

			last_buf_len = buf->len;
		}
	}

	/* Release the tags; the trailing '*' is static and is skipped. */
	for (i = 0; i < num_langs - 1; i++)
		free(language_tags[i]);
	free(language_tags);
}

/*
 * Get an Accept-Language header which indicates user's preferred languages.
 *
 * The header is built by write_accept_language() and cached in
 * cached_accept_language once it is non-empty. Returns NULL when no
 * header should be sent.
 *
 * Examples, in terms of the list returned by get_preferred_languages():
 *   (none)               -> NULL
 *   "ko:en"              -> "Accept-Language: ko, en;q=0.9, *;q=0.8"
 *   "ko_KR.UTF-8:sr@latin" -> "Accept-Language: ko-KR, sr;q=0.9, *;q=0.8"
 *   "ko"                 -> "Accept-Language: ko, *;q=0.9"
 */
static const char *get_accept_language(void)
{
	if (!cached_accept_language) {
		struct strbuf buf = STRBUF_INIT;
		write_accept_language(&buf);
		if (buf.len > 0)
			cached_accept_language = strbuf_detach(&buf, NULL);
		else
			/*
			 * The buffer may have been allocated and then
			 * emptied again (e.g. the first entry was too
			 * long); do not leak it.
			 */
			strbuf_release(&buf);
	}

	return cached_accept_language;
}

1187 1188 1189 1190 1191 1192 1193
/*
 * Restrict the transfer on "curl" to the part of the resource starting
 * at byte offset "pos", by setting an open-ended range ("<pos>-").
 */
static void http_opt_request_remainder(CURL *curl, off_t pos)
{
	char range[128];

	xsnprintf(range, sizeof(range), "%"PRIuMAX"-", (uintmax_t)pos);
	curl_easy_setopt(curl, CURLOPT_RANGE, range);
}

1194 1195 1196 1197
/*
 * http_request() targets: the "target" argument tells http_request() how
 * to treat its "result" pointer.
 */
/* body is delivered through fwrite_buffer(); http_get_strbuf() passes a strbuf */
#define HTTP_REQUEST_STRBUF	0
/* body is delivered through fwrite(); http_get_file() passes a FILE pointer */
#define HTTP_REQUEST_FILE	1

J
Jeff King 已提交
1198 1199 1200
static int http_request(const char *url,
			void *result, int target,
			const struct http_get_options *options)
1201 1202 1203 1204 1205
{
	struct active_request_slot *slot;
	struct slot_results results;
	struct curl_slist *headers = NULL;
	struct strbuf buf = STRBUF_INIT;
1206
	const char *accept_language;
1207 1208 1209 1210 1211 1212 1213 1214 1215 1216 1217 1218
	int ret;

	slot = get_active_slot();
	curl_easy_setopt(slot->curl, CURLOPT_HTTPGET, 1);

	if (result == NULL) {
		curl_easy_setopt(slot->curl, CURLOPT_NOBODY, 1);
	} else {
		curl_easy_setopt(slot->curl, CURLOPT_NOBODY, 0);
		curl_easy_setopt(slot->curl, CURLOPT_FILE, result);

		if (target == HTTP_REQUEST_FILE) {
1219
			off_t posn = ftello(result);
1220 1221
			curl_easy_setopt(slot->curl, CURLOPT_WRITEFUNCTION,
					 fwrite);
1222 1223
			if (posn > 0)
				http_opt_request_remainder(slot->curl, posn);
1224 1225 1226 1227 1228
		} else
			curl_easy_setopt(slot->curl, CURLOPT_WRITEFUNCTION,
					 fwrite_buffer);
	}

1229 1230 1231 1232 1233
	accept_language = get_accept_language();

	if (accept_language)
		headers = curl_slist_append(headers, accept_language);

1234
	strbuf_addstr(&buf, "Pragma:");
J
Jeff King 已提交
1235
	if (options && options->no_cache)
1236
		strbuf_addstr(&buf, " no-cache");
J
Jeff King 已提交
1237
	if (options && options->keep_error)
J
Jeff King 已提交
1238
		curl_easy_setopt(slot->curl, CURLOPT_FAILONERROR, 0);
1239 1240 1241 1242 1243

	headers = curl_slist_append(headers, buf.buf);

	curl_easy_setopt(slot->curl, CURLOPT_URL, url);
	curl_easy_setopt(slot->curl, CURLOPT_HTTPHEADER, headers);
1244
	curl_easy_setopt(slot->curl, CURLOPT_ENCODING, "gzip");
1245

J
Jeff King 已提交
1246
	ret = run_one_slot(slot, &results);
1247

1248 1249 1250
	if (options && options->content_type) {
		struct strbuf raw = STRBUF_INIT;
		curlinfo_strbuf(slot->curl, CURLINFO_CONTENT_TYPE, &raw);
1251 1252
		extract_content_type(&raw, options->content_type,
				     options->charset);
1253 1254
		strbuf_release(&raw);
	}
1255

J
Jeff King 已提交
1256 1257 1258
	if (options && options->effective_url)
		curlinfo_strbuf(slot->curl, CURLINFO_EFFECTIVE_URL,
				options->effective_url);
1259

1260 1261 1262 1263 1264 1265
	curl_slist_free_all(headers);
	strbuf_release(&buf);

	return ret;
}

1266 1267 1268 1269 1270 1271 1272 1273 1274 1275 1276 1277 1278 1279 1280 1281 1282 1283 1284 1285 1286 1287 1288 1289 1290 1291 1292 1293 1294 1295 1296 1297 1298 1299 1300
/*
 * Update the "base" url to a more appropriate value, as deduced by
 * redirects seen when requesting a URL starting with "url".
 *
 * The "asked" parameter is a URL that we asked curl to access, and must begin
 * with "base".
 *
 * The "got" parameter is the URL that curl reported to us as where we ended
 * up.
 *
 * Returns 1 if we updated the base url, 0 otherwise.
 *
 * Our basic strategy is to compare "base" and "asked" to find the bits
 * specific to our request. We then strip those bits off of "got" to yield the
 * new base. So for example, if our base is "http://example.com/foo.git",
 * and we ask for "http://example.com/foo.git/info/refs", we might end up
 * with "https://other.example.com/foo.git/info/refs". We would want the
 * new URL to become "https://other.example.com/foo.git".
 *
 * Note that this assumes a sane redirect scheme. It's entirely possible
 * in the example above to end up at a URL that does not even end in
 * "info/refs".  In such a case we simply punt, as there is not much we can
 * do (and such a scheme is unlikely to represent a real git repository,
 * which means we are likely about to abort anyway).
 */
static int update_url_from_redirect(struct strbuf *base,
				    const char *asked,
				    const struct strbuf *got)
{
	const char *tail;
	size_t tail_len;

	if (!strcmp(asked, got->buf))
		return 0;

1301
	if (!skip_prefix(asked, base->buf, &tail))
1302 1303 1304 1305 1306 1307 1308 1309 1310 1311 1312 1313 1314 1315
		die("BUG: update_url_from_redirect: %s is not a superset of %s",
		    asked, base->buf);

	tail_len = strlen(tail);

	if (got->len < tail_len ||
	    strcmp(tail, got->buf + got->len - tail_len))
		return 0; /* insane redirect scheme */

	strbuf_reset(base);
	strbuf_add(base, got->buf, got->len - tail_len);
	return 1;
}

1316 1317
static int http_request_reauth(const char *url,
			       void *result, int target,
J
Jeff King 已提交
1318
			       struct http_get_options *options)
1319
{
J
Jeff King 已提交
1320
	int ret = http_request(url, result, target, options);
1321 1322 1323 1324 1325 1326 1327 1328 1329

	if (options && options->effective_url && options->base_url) {
		if (update_url_from_redirect(options->base_url,
					     url, options->effective_url)) {
			credential_from_url(&http_auth, options->base_url->buf);
			url = options->effective_url->buf;
		}
	}

1330 1331
	if (ret != HTTP_REAUTH)
		return ret;
J
Jeff King 已提交
1332 1333 1334 1335 1336 1337 1338

	/*
	 * If we are using KEEP_ERROR, the previous request may have
	 * put cruft into our output stream; we should clear it out before
	 * making our next request. We only know how to do this for
	 * the strbuf case, but that is enough to satisfy current callers.
	 */
J
Jeff King 已提交
1339
	if (options && options->keep_error) {
J
Jeff King 已提交
1340 1341 1342 1343 1344 1345 1346 1347
		switch (target) {
		case HTTP_REQUEST_STRBUF:
			strbuf_reset(result);
			break;
		default:
			die("BUG: HTTP_KEEP_ERROR is only supported with strbufs");
		}
	}
1348 1349 1350

	credential_fill(&http_auth);

J
Jeff King 已提交
1351
	return http_request(url, result, target, options);
1352 1353
}

1354
int http_get_strbuf(const char *url,
J
Jeff King 已提交
1355 1356
		    struct strbuf *result,
		    struct http_get_options *options)
1357
{
J
Jeff King 已提交
1358
	return http_request_reauth(url, result, HTTP_REQUEST_STRBUF, options);
1359 1360
}

1361
/*
J
Jim Meyering 已提交
1362
 * Downloads a URL and stores the result in the given file.
1363 1364 1365 1366
 *
 * If a previous interrupted download is detected (i.e. a previous temporary
 * file is still around) the download is resumed.
 */
J
Jeff King 已提交
1367 1368
static int http_get_file(const char *url, const char *filename,
			 struct http_get_options *options)
1369 1370 1371 1372 1373 1374 1375
{
	int ret;
	struct strbuf tmpfile = STRBUF_INIT;
	FILE *result;

	strbuf_addf(&tmpfile, "%s.temp", filename);
	result = fopen(tmpfile.buf, "a");
J
Jeff King 已提交
1376
	if (!result) {
1377 1378 1379 1380 1381
		error("Unable to open local file %s", tmpfile.buf);
		ret = HTTP_ERROR;
		goto cleanup;
	}

J
Jeff King 已提交
1382
	ret = http_request_reauth(url, result, HTTP_REQUEST_FILE, options);
1383 1384
	fclose(result);

1385
	if (ret == HTTP_OK && finalize_object_file(tmpfile.buf, filename))
1386 1387 1388 1389 1390 1391
		ret = HTTP_ERROR;
cleanup:
	strbuf_release(&tmpfile);
	return ret;
}

1392
int http_fetch_ref(const char *base, struct ref *ref)
1393
{
J
Jeff King 已提交
1394
	struct http_get_options options = {0};
1395 1396
	char *url;
	struct strbuf buffer = STRBUF_INIT;
1397
	int ret = -1;
1398

J
Jeff King 已提交
1399 1400
	options.no_cache = 1;

1401
	url = quote_ref_url(base, ref->name);
J
Jeff King 已提交
1402
	if (http_get_strbuf(url, &buffer, &options) == HTTP_OK) {
1403 1404
		strbuf_rtrim(&buffer);
		if (buffer.len == 40)
1405
			ret = get_oid_hex(buffer.buf, &ref->old_oid);
1406
		else if (starts_with(buffer.buf, "ref: ")) {
1407 1408
			ref->symref = xstrdup(buffer.buf + 5);
			ret = 0;
1409 1410 1411 1412 1413 1414 1415
		}
	}

	strbuf_release(&buffer);
	free(url);
	return ret;
}
T
Tay Ray Chuan 已提交
1416 1417

/* Helpers for fetching packs */
1418
static char *fetch_pack_index(unsigned char *sha1, const char *base_url)
T
Tay Ray Chuan 已提交
1419
{
1420
	char *url, *tmp;
T
Tay Ray Chuan 已提交
1421 1422 1423
	struct strbuf buf = STRBUF_INIT;

	if (http_is_verbose)
1424
		fprintf(stderr, "Getting index for pack %s\n", sha1_to_hex(sha1));
T
Tay Ray Chuan 已提交
1425 1426

	end_url_with_slash(&buf, base_url);
1427
	strbuf_addf(&buf, "objects/pack/pack-%s.idx", sha1_to_hex(sha1));
T
Tay Ray Chuan 已提交
1428 1429
	url = strbuf_detach(&buf, NULL);

1430 1431 1432
	strbuf_addf(&buf, "%s.temp", sha1_pack_index_name(sha1));
	tmp = strbuf_detach(&buf, NULL);

1433
	if (http_get_file(url, tmp, NULL) != HTTP_OK) {
1434
		error("Unable to get pack index %s", url);
1435 1436 1437
		free(tmp);
		tmp = NULL;
	}
T
Tay Ray Chuan 已提交
1438 1439

	free(url);
1440
	return tmp;
T
Tay Ray Chuan 已提交
1441 1442 1443 1444 1445 1446
}

static int fetch_and_setup_pack_index(struct packed_git **packs_head,
	unsigned char *sha1, const char *base_url)
{
	struct packed_git *new_pack;
1447 1448
	char *tmp_idx = NULL;
	int ret;
T
Tay Ray Chuan 已提交
1449

1450
	if (has_pack_index(sha1)) {
1451
		new_pack = parse_pack_index(sha1, sha1_pack_index_name(sha1));
1452 1453 1454 1455 1456 1457 1458
		if (!new_pack)
			return -1; /* parse_pack_index() already issued error message */
		goto add_pack;
	}

	tmp_idx = fetch_pack_index(sha1, base_url);
	if (!tmp_idx)
T
Tay Ray Chuan 已提交
1459 1460
		return -1;

1461 1462 1463 1464 1465
	new_pack = parse_pack_index(sha1, tmp_idx);
	if (!new_pack) {
		unlink(tmp_idx);
		free(tmp_idx);

T
Tay Ray Chuan 已提交
1466
		return -1; /* parse_pack_index() already issued error message */
1467 1468 1469 1470 1471
	}

	ret = verify_pack_index(new_pack);
	if (!ret) {
		close_pack_index(new_pack);
1472
		ret = finalize_object_file(tmp_idx, sha1_pack_index_name(sha1));
1473 1474 1475 1476 1477 1478
	}
	free(tmp_idx);
	if (ret)
		return -1;

add_pack:
T
Tay Ray Chuan 已提交
1479 1480 1481 1482 1483 1484 1485
	new_pack->next = *packs_head;
	*packs_head = new_pack;
	return 0;
}

int http_get_info_packs(const char *base_url, struct packed_git **packs_head)
{
J
Jeff King 已提交
1486
	struct http_get_options options = {0};
T
Tay Ray Chuan 已提交
1487 1488 1489 1490 1491 1492 1493 1494 1495
	int ret = 0, i = 0;
	char *url, *data;
	struct strbuf buf = STRBUF_INIT;
	unsigned char sha1[20];

	end_url_with_slash(&buf, base_url);
	strbuf_addstr(&buf, "objects/info/packs");
	url = strbuf_detach(&buf, NULL);

J
Jeff King 已提交
1496 1497
	options.no_cache = 1;
	ret = http_get_strbuf(url, &buf, &options);
T
Tay Ray Chuan 已提交
1498 1499 1500 1501 1502 1503 1504 1505 1506
	if (ret != HTTP_OK)
		goto cleanup;

	data = buf.buf;
	while (i < buf.len) {
		switch (data[i]) {
		case 'P':
			i++;
			if (i + 52 <= buf.len &&
1507 1508
			    starts_with(data + i, " pack-") &&
			    starts_with(data + i + 46, ".pack\n")) {
T
Tay Ray Chuan 已提交
1509 1510 1511 1512 1513 1514 1515 1516 1517 1518 1519 1520 1521 1522 1523 1524 1525
				get_sha1_hex(data + i + 6, sha1);
				fetch_and_setup_pack_index(packs_head, sha1,
						      base_url);
				i += 51;
				break;
			}
		default:
			while (i < buf.len && data[i] != '\n')
				i++;
		}
		i++;
	}

cleanup:
	free(url);
	return ret;
}
1526 1527 1528 1529 1530 1531 1532 1533 1534

/*
 * Dispose of a pack request: close its pack file if still open, then
 * free its URL and the request structure itself. "preq" must not be
 * used afterwards.
 */
void release_http_pack_request(struct http_pack_request *preq)
{
	if (preq->packfile)
		fclose(preq->packfile);
	preq->packfile = NULL;
	preq->slot = NULL;

	free(preq->url);
	free(preq);
}

int finish_http_pack_request(struct http_pack_request *preq)
{
	struct packed_git **lst;
1541
	struct packed_git *p = preq->target;
1542
	char *tmp_idx;
1543
	size_t len;
1544
	struct child_process ip = CHILD_PROCESS_INIT;
1545
	const char *ip_argv[8];
1546

1547
	close_pack_index(p);
1548

1549 1550
	fclose(preq->packfile);
	preq->packfile = NULL;
1551 1552

	lst = preq->lst;
1553
	while (*lst != p)
1554 1555 1556
		lst = &((*lst)->next);
	*lst = (*lst)->next;

1557 1558 1559
	if (!strip_suffix(preq->tmpfile, ".pack.temp", &len))
		die("BUG: pack tmpfile does not end in .pack.temp?");
	tmp_idx = xstrfmt("%.*s.idx.temp", (int)len, preq->tmpfile);
1560 1561 1562 1563 1564 1565 1566 1567 1568 1569 1570 1571 1572 1573 1574 1575

	ip_argv[0] = "index-pack";
	ip_argv[1] = "-o";
	ip_argv[2] = tmp_idx;
	ip_argv[3] = preq->tmpfile;
	ip_argv[4] = NULL;

	ip.argv = ip_argv;
	ip.git_cmd = 1;
	ip.no_stdin = 1;
	ip.no_stdout = 1;

	if (run_command(&ip)) {
		unlink(preq->tmpfile);
		unlink(tmp_idx);
		free(tmp_idx);
1576
		return -1;
1577 1578 1579
	}

	unlink(sha1_pack_index_name(p->sha1));
1580

1581 1582
	if (finalize_object_file(preq->tmpfile, sha1_pack_name(p->sha1))
	 || finalize_object_file(tmp_idx, sha1_pack_index_name(p->sha1))) {
1583
		free(tmp_idx);
1584
		return -1;
1585
	}
1586

1587 1588
	install_packed_git(p);
	free(tmp_idx);
1589 1590 1591 1592 1593 1594
	return 0;
}

struct http_pack_request *new_http_pack_request(
	struct packed_git *target, const char *base_url)
{
1595
	off_t prev_posn = 0;
1596 1597 1598
	struct strbuf buf = STRBUF_INIT;
	struct http_pack_request *preq;

T
Tay Ray Chuan 已提交
1599
	preq = xcalloc(1, sizeof(*preq));
1600 1601 1602 1603 1604
	preq->target = target;

	end_url_with_slash(&buf, base_url);
	strbuf_addf(&buf, "objects/pack/pack-%s.pack",
		sha1_to_hex(target->sha1));
1605
	preq->url = strbuf_detach(&buf, NULL);
1606

1607 1608
	snprintf(preq->tmpfile, sizeof(preq->tmpfile), "%s.temp",
		sha1_pack_name(target->sha1));
1609 1610 1611 1612 1613 1614 1615 1616 1617 1618
	preq->packfile = fopen(preq->tmpfile, "a");
	if (!preq->packfile) {
		error("Unable to open local file %s for pack",
		      preq->tmpfile);
		goto abort;
	}

	preq->slot = get_active_slot();
	curl_easy_setopt(preq->slot->curl, CURLOPT_FILE, preq->packfile);
	curl_easy_setopt(preq->slot->curl, CURLOPT_WRITEFUNCTION, fwrite);
1619
	curl_easy_setopt(preq->slot->curl, CURLOPT_URL, preq->url);
1620 1621 1622 1623 1624 1625 1626
	curl_easy_setopt(preq->slot->curl, CURLOPT_HTTPHEADER,
		no_pragma_header);

	/*
	 * If there is data present from a previous transfer attempt,
	 * resume where it left off
	 */
1627
	prev_posn = ftello(preq->packfile);
1628 1629 1630
	if (prev_posn>0) {
		if (http_is_verbose)
			fprintf(stderr,
1631 1632
				"Resuming fetch of pack %s at byte %"PRIuMAX"\n",
				sha1_to_hex(target->sha1), (uintmax_t)prev_posn);
1633
		http_opt_request_remainder(preq->slot->curl, prev_posn);
1634 1635 1636 1637 1638
	}

	return preq;

abort:
1639
	free(preq->url);
T
Tay Ray Chuan 已提交
1640
	free(preq);
1641 1642
	return NULL;
}
1643 1644

/* Helpers for fetching objects (loose) */
1645
static size_t fwrite_sha1_file(char *ptr, size_t eltsize, size_t nmemb,
1646 1647 1648 1649 1650 1651 1652 1653 1654 1655 1656 1657 1658 1659 1660 1661
			       void *data)
{
	unsigned char expn[4096];
	size_t size = eltsize * nmemb;
	int posn = 0;
	struct http_object_request *freq =
		(struct http_object_request *)data;
	do {
		ssize_t retval = xwrite(freq->localfile,
					(char *) ptr + posn, size - posn);
		if (retval < 0)
			return posn;
		posn += retval;
	} while (posn < size);

	freq->stream.avail_in = size;
1662
	freq->stream.next_in = (void *)ptr;
1663 1664 1665 1666 1667 1668 1669 1670 1671 1672 1673 1674 1675 1676
	do {
		freq->stream.next_out = expn;
		freq->stream.avail_out = sizeof(expn);
		freq->zret = git_inflate(&freq->stream, Z_SYNC_FLUSH);
		git_SHA1_Update(&freq->c, expn,
				sizeof(expn) - freq->stream.avail_out);
	} while (freq->stream.avail_in && freq->zret == Z_OK);
	return size;
}

struct http_object_request *new_http_object_request(const char *base_url,
	unsigned char *sha1)
{
	char *hex = sha1_to_hex(sha1);
1677
	const char *filename;
1678 1679
	char prevfile[PATH_MAX];
	int prevlocal;
1680
	char prev_buf[PREV_BUF_SIZE];
1681
	ssize_t prev_read = 0;
1682
	off_t prev_posn = 0;
1683 1684
	struct http_object_request *freq;

T
Tay Ray Chuan 已提交
1685
	freq = xcalloc(1, sizeof(*freq));
1686 1687 1688 1689 1690 1691 1692 1693 1694 1695 1696 1697 1698 1699 1700 1701 1702 1703 1704 1705 1706 1707 1708 1709 1710 1711 1712 1713 1714 1715 1716 1717
	hashcpy(freq->sha1, sha1);
	freq->localfile = -1;

	filename = sha1_file_name(sha1);
	snprintf(freq->tmpfile, sizeof(freq->tmpfile),
		 "%s.temp", filename);

	snprintf(prevfile, sizeof(prevfile), "%s.prev", filename);
	unlink_or_warn(prevfile);
	rename(freq->tmpfile, prevfile);
	unlink_or_warn(freq->tmpfile);

	if (freq->localfile != -1)
		error("fd leakage in start: %d", freq->localfile);
	freq->localfile = open(freq->tmpfile,
			       O_WRONLY | O_CREAT | O_EXCL, 0666);
	/*
	 * This could have failed due to the "lazy directory creation";
	 * try to mkdir the last path component.
	 */
	if (freq->localfile < 0 && errno == ENOENT) {
		char *dir = strrchr(freq->tmpfile, '/');
		if (dir) {
			*dir = 0;
			mkdir(freq->tmpfile, 0777);
			*dir = '/';
		}
		freq->localfile = open(freq->tmpfile,
				       O_WRONLY | O_CREAT | O_EXCL, 0666);
	}

	if (freq->localfile < 0) {
1718 1719
		error("Couldn't create temporary file %s: %s",
		      freq->tmpfile, strerror(errno));
1720 1721 1722 1723 1724 1725 1726
		goto abort;
	}

	git_inflate_init(&freq->stream);

	git_SHA1_Init(&freq->c);

1727
	freq->url = get_remote_object_url(base_url, hex, 0);
1728 1729 1730 1731 1732 1733 1734 1735 1736 1737 1738 1739 1740 1741 1742 1743 1744 1745 1746 1747 1748 1749 1750 1751 1752 1753 1754 1755 1756 1757 1758 1759 1760 1761 1762

	/*
	 * If a previous temp file is present, process what was already
	 * fetched.
	 */
	prevlocal = open(prevfile, O_RDONLY);
	if (prevlocal != -1) {
		do {
			prev_read = xread(prevlocal, prev_buf, PREV_BUF_SIZE);
			if (prev_read>0) {
				if (fwrite_sha1_file(prev_buf,
						     1,
						     prev_read,
						     freq) == prev_read) {
					prev_posn += prev_read;
				} else {
					prev_read = -1;
				}
			}
		} while (prev_read > 0);
		close(prevlocal);
	}
	unlink_or_warn(prevfile);

	/*
	 * Reset inflate/SHA1 if there was an error reading the previous temp
	 * file; also rewind to the beginning of the local file.
	 */
	if (prev_read == -1) {
		memset(&freq->stream, 0, sizeof(freq->stream));
		git_inflate_init(&freq->stream);
		git_SHA1_Init(&freq->c);
		if (prev_posn>0) {
			prev_posn = 0;
			lseek(freq->localfile, 0, SEEK_SET);
1763
			if (ftruncate(freq->localfile, 0) < 0) {
1764 1765
				error("Couldn't truncate temporary file %s: %s",
					  freq->tmpfile, strerror(errno));
1766 1767
				goto abort;
			}
1768 1769 1770 1771 1772 1773 1774 1775
		}
	}

	freq->slot = get_active_slot();

	curl_easy_setopt(freq->slot->curl, CURLOPT_FILE, freq);
	curl_easy_setopt(freq->slot->curl, CURLOPT_WRITEFUNCTION, fwrite_sha1_file);
	curl_easy_setopt(freq->slot->curl, CURLOPT_ERRORBUFFER, freq->errorstr);
1776
	curl_easy_setopt(freq->slot->curl, CURLOPT_URL, freq->url);
1777 1778 1779 1780 1781 1782 1783 1784 1785
	curl_easy_setopt(freq->slot->curl, CURLOPT_HTTPHEADER, no_pragma_header);

	/*
	 * If we have successfully processed data from a previous fetch
	 * attempt, only fetch the data we don't already have.
	 */
	if (prev_posn>0) {
		if (http_is_verbose)
			fprintf(stderr,
1786 1787
				"Resuming fetch of object %s at byte %"PRIuMAX"\n",
				hex, (uintmax_t)prev_posn);
1788
		http_opt_request_remainder(freq->slot->curl, prev_posn);
1789 1790 1791 1792 1793
	}

	return freq;

abort:
1794
	free(freq->url);
1795 1796 1797 1798 1799 1800 1801 1802 1803 1804 1805 1806 1807 1808 1809 1810 1811 1812 1813 1814 1815 1816 1817
	free(freq);
	return NULL;
}

void process_http_object_request(struct http_object_request *freq)
{
	if (freq->slot == NULL)
		return;
	freq->curl_result = freq->slot->curl_result;
	freq->http_code = freq->slot->http_code;
	freq->slot = NULL;
}

/*
 * Wrap up an object download: close the temporary file, collect the
 * transfer result, check that the data inflated completely and hashes
 * to the expected SHA-1, and move the file into place.
 *
 * Returns -1 if the transfer failed (an empty temporary file is then
 * removed) or if the data is incomplete or does not match (the
 * temporary file is then removed). Otherwise returns the result of
 * finalize_object_file(), which is also stored in freq->rename.
 */
int finish_http_object_request(struct http_object_request *freq)
{
	struct stat st;

	close(freq->localfile);
	freq->localfile = -1;

	process_http_object_request(freq);

	if (freq->http_code == 416) {
		warning("requested range invalid; we may already have all the data.");
	} else if (freq->curl_result != CURLE_OK) {
		/* keep partial data for a later resume, but not empty files */
		if (stat(freq->tmpfile, &st) == 0 && st.st_size == 0)
			unlink_or_warn(freq->tmpfile);
		return -1;
	}

	git_inflate_end(&freq->stream);
	git_SHA1_Final(freq->real_sha1, &freq->c);

	if (freq->zret != Z_STREAM_END ||
	    hashcmp(freq->sha1, freq->real_sha1)) {
		unlink_or_warn(freq->tmpfile);
		return -1;
	}

	freq->rename = finalize_object_file(freq->tmpfile,
					    sha1_file_name(freq->sha1));
	return freq->rename;
}

/*
 * Give up on an object request: remove its temporary file and release
 * the resources held by the request.
 */
void abort_http_object_request(struct http_object_request *freq)
{
	const char *partial = freq->tmpfile;

	unlink_or_warn(partial);
	release_http_object_request(freq);
}

void release_http_object_request(struct http_object_request *freq)
{
	if (freq->localfile != -1) {
		close(freq->localfile);
		freq->localfile = -1;
	}
	if (freq->url != NULL) {
		free(freq->url);
		freq->url = NULL;
	}
1859 1860 1861 1862 1863 1864
	if (freq->slot != NULL) {
		freq->slot->callback_func = NULL;
		freq->slot->callback_data = NULL;
		release_active_slot(freq->slot);
		freq->slot = NULL;
	}
1865
}