index-pack: use streaming interface on large blobs (most of the time)
[git/debian.git] / http.c
blob5cb87f16f25fe3d32e2594c8c6325d562eddc9ca
1 #include "http.h"
2 #include "pack.h"
3 #include "sideband.h"
4 #include "run-command.h"
5 #include "url.h"
6 #include "credential.h"
8 int active_requests;
9 int http_is_verbose;
10 size_t http_post_buffer = 16 * LARGE_PACKET_MAX;
12 #if LIBCURL_VERSION_NUM >= 0x070a06
13 #define LIBCURL_CAN_HANDLE_AUTH_ANY
14 #endif
16 static int min_curl_sessions = 1;
17 static int curl_session_count;
18 #ifdef USE_CURL_MULTI
19 static int max_requests = -1;
20 static CURLM *curlm;
21 #endif
22 #ifndef NO_CURL_EASY_DUPHANDLE
23 static CURL *curl_default;
24 #endif
26 #define PREV_BUF_SIZE 4096
27 #define RANGE_HEADER_SIZE 30
29 char curl_errorstr[CURL_ERROR_SIZE];
31 static int curl_ssl_verify = -1;
32 static const char *ssl_cert;
33 #if LIBCURL_VERSION_NUM >= 0x070903
34 static const char *ssl_key;
35 #endif
36 #if LIBCURL_VERSION_NUM >= 0x070908
37 static const char *ssl_capath;
38 #endif
39 static const char *ssl_cainfo;
40 static long curl_low_speed_limit = -1;
41 static long curl_low_speed_time = -1;
42 static int curl_ftp_no_epsv;
43 static const char *curl_http_proxy;
44 static const char *curl_cookie_file;
45 static struct credential http_auth = CREDENTIAL_INIT;
46 static int http_proactive_auth;
47 static const char *user_agent;
49 #if LIBCURL_VERSION_NUM >= 0x071700
50 /* Use CURLOPT_KEYPASSWD as is */
51 #elif LIBCURL_VERSION_NUM >= 0x070903
52 #define CURLOPT_KEYPASSWD CURLOPT_SSLKEYPASSWD
53 #else
54 #define CURLOPT_KEYPASSWD CURLOPT_SSLCERTPASSWD
55 #endif
57 static struct credential cert_auth = CREDENTIAL_INIT;
58 static int ssl_cert_password_required;
60 static struct curl_slist *pragma_header;
61 static struct curl_slist *no_pragma_header;
63 static struct active_request_slot *active_queue_head;
65 size_t fread_buffer(char *ptr, size_t eltsize, size_t nmemb, void *buffer_)
67 size_t size = eltsize * nmemb;
68 struct buffer *buffer = buffer_;
70 if (size > buffer->buf.len - buffer->posn)
71 size = buffer->buf.len - buffer->posn;
72 memcpy(ptr, buffer->buf.buf + buffer->posn, size);
73 buffer->posn += size;
75 return size;
78 #ifndef NO_CURL_IOCTL
79 curlioerr ioctl_buffer(CURL *handle, int cmd, void *clientp)
81 struct buffer *buffer = clientp;
83 switch (cmd) {
84 case CURLIOCMD_NOP:
85 return CURLIOE_OK;
87 case CURLIOCMD_RESTARTREAD:
88 buffer->posn = 0;
89 return CURLIOE_OK;
91 default:
92 return CURLIOE_UNKNOWNCMD;
95 #endif
/*
 * Write callback: append eltsize * nmemb bytes from ptr to the strbuf
 * passed as buffer_ and report all of them as consumed.
 */
size_t fwrite_buffer(char *ptr, size_t eltsize, size_t nmemb, void *buffer_)
{
	struct strbuf *out = buffer_;
	size_t nbytes = eltsize * nmemb;

	strbuf_add(out, ptr, nbytes);
	return nbytes;
}

/*
 * Write callback that discards its input: nothing is stored, and the
 * full eltsize * nmemb byte count is reported as written.
 */
size_t fwrite_null(char *ptr, size_t eltsize, size_t nmemb, void *strbuf)
{
	size_t discarded = eltsize * nmemb;

	return discarded;
}

111 #ifdef USE_CURL_MULTI
112 static void process_curl_messages(void)
114 int num_messages;
115 struct active_request_slot *slot;
116 CURLMsg *curl_message = curl_multi_info_read(curlm, &num_messages);
118 while (curl_message != NULL) {
119 if (curl_message->msg == CURLMSG_DONE) {
120 int curl_result = curl_message->data.result;
121 slot = active_queue_head;
122 while (slot != NULL &&
123 slot->curl != curl_message->easy_handle)
124 slot = slot->next;
125 if (slot != NULL) {
126 curl_multi_remove_handle(curlm, slot->curl);
127 slot->curl_result = curl_result;
128 finish_active_slot(slot);
129 } else {
130 fprintf(stderr, "Received DONE message for unknown request!\n");
132 } else {
133 fprintf(stderr, "Unknown CURL message received: %d\n",
134 (int)curl_message->msg);
136 curl_message = curl_multi_info_read(curlm, &num_messages);
139 #endif
141 static int http_options(const char *var, const char *value, void *cb)
143 if (!strcmp("http.sslverify", var)) {
144 curl_ssl_verify = git_config_bool(var, value);
145 return 0;
147 if (!strcmp("http.sslcert", var))
148 return git_config_string(&ssl_cert, var, value);
149 #if LIBCURL_VERSION_NUM >= 0x070903
150 if (!strcmp("http.sslkey", var))
151 return git_config_string(&ssl_key, var, value);
152 #endif
153 #if LIBCURL_VERSION_NUM >= 0x070908
154 if (!strcmp("http.sslcapath", var))
155 return git_config_string(&ssl_capath, var, value);
156 #endif
157 if (!strcmp("http.sslcainfo", var))
158 return git_config_string(&ssl_cainfo, var, value);
159 if (!strcmp("http.sslcertpasswordprotected", var)) {
160 if (git_config_bool(var, value))
161 ssl_cert_password_required = 1;
162 return 0;
164 if (!strcmp("http.minsessions", var)) {
165 min_curl_sessions = git_config_int(var, value);
166 #ifndef USE_CURL_MULTI
167 if (min_curl_sessions > 1)
168 min_curl_sessions = 1;
169 #endif
170 return 0;
172 #ifdef USE_CURL_MULTI
173 if (!strcmp("http.maxrequests", var)) {
174 max_requests = git_config_int(var, value);
175 return 0;
177 #endif
178 if (!strcmp("http.lowspeedlimit", var)) {
179 curl_low_speed_limit = (long)git_config_int(var, value);
180 return 0;
182 if (!strcmp("http.lowspeedtime", var)) {
183 curl_low_speed_time = (long)git_config_int(var, value);
184 return 0;
187 if (!strcmp("http.noepsv", var)) {
188 curl_ftp_no_epsv = git_config_bool(var, value);
189 return 0;
191 if (!strcmp("http.proxy", var))
192 return git_config_string(&curl_http_proxy, var, value);
194 if (!strcmp("http.cookiefile", var))
195 return git_config_string(&curl_cookie_file, var, value);
197 if (!strcmp("http.postbuffer", var)) {
198 http_post_buffer = git_config_int(var, value);
199 if (http_post_buffer < LARGE_PACKET_MAX)
200 http_post_buffer = LARGE_PACKET_MAX;
201 return 0;
204 if (!strcmp("http.useragent", var))
205 return git_config_string(&user_agent, var, value);
207 /* Fall back on the default ones */
208 return git_default_config(var, value, cb);
211 static void init_curl_http_auth(CURL *result)
213 if (!http_auth.username)
214 return;
216 credential_fill(&http_auth);
218 #if LIBCURL_VERSION_NUM >= 0x071301
219 curl_easy_setopt(result, CURLOPT_USERNAME, http_auth.username);
220 curl_easy_setopt(result, CURLOPT_PASSWORD, http_auth.password);
221 #else
223 static struct strbuf up = STRBUF_INIT;
224 strbuf_reset(&up);
225 strbuf_addf(&up, "%s:%s",
226 http_auth.username, http_auth.password);
227 curl_easy_setopt(result, CURLOPT_USERPWD, up.buf);
229 #endif
232 static int has_cert_password(void)
234 if (ssl_cert == NULL || ssl_cert_password_required != 1)
235 return 0;
236 if (!cert_auth.password) {
237 cert_auth.protocol = xstrdup("cert");
238 cert_auth.path = xstrdup(ssl_cert);
239 credential_fill(&cert_auth);
241 return 1;
244 static CURL *get_curl_handle(void)
246 CURL *result = curl_easy_init();
248 if (!curl_ssl_verify) {
249 curl_easy_setopt(result, CURLOPT_SSL_VERIFYPEER, 0);
250 curl_easy_setopt(result, CURLOPT_SSL_VERIFYHOST, 0);
251 } else {
252 /* Verify authenticity of the peer's certificate */
253 curl_easy_setopt(result, CURLOPT_SSL_VERIFYPEER, 1);
254 /* The name in the cert must match whom we tried to connect */
255 curl_easy_setopt(result, CURLOPT_SSL_VERIFYHOST, 2);
258 #if LIBCURL_VERSION_NUM >= 0x070907
259 curl_easy_setopt(result, CURLOPT_NETRC, CURL_NETRC_OPTIONAL);
260 #endif
261 #ifdef LIBCURL_CAN_HANDLE_AUTH_ANY
262 curl_easy_setopt(result, CURLOPT_HTTPAUTH, CURLAUTH_ANY);
263 #endif
265 if (http_proactive_auth)
266 init_curl_http_auth(result);
268 if (ssl_cert != NULL)
269 curl_easy_setopt(result, CURLOPT_SSLCERT, ssl_cert);
270 if (has_cert_password())
271 curl_easy_setopt(result, CURLOPT_KEYPASSWD, cert_auth.password);
272 #if LIBCURL_VERSION_NUM >= 0x070903
273 if (ssl_key != NULL)
274 curl_easy_setopt(result, CURLOPT_SSLKEY, ssl_key);
275 #endif
276 #if LIBCURL_VERSION_NUM >= 0x070908
277 if (ssl_capath != NULL)
278 curl_easy_setopt(result, CURLOPT_CAPATH, ssl_capath);
279 #endif
280 if (ssl_cainfo != NULL)
281 curl_easy_setopt(result, CURLOPT_CAINFO, ssl_cainfo);
282 curl_easy_setopt(result, CURLOPT_FAILONERROR, 1);
284 if (curl_low_speed_limit > 0 && curl_low_speed_time > 0) {
285 curl_easy_setopt(result, CURLOPT_LOW_SPEED_LIMIT,
286 curl_low_speed_limit);
287 curl_easy_setopt(result, CURLOPT_LOW_SPEED_TIME,
288 curl_low_speed_time);
291 curl_easy_setopt(result, CURLOPT_FOLLOWLOCATION, 1);
292 #if LIBCURL_VERSION_NUM >= 0x071301
293 curl_easy_setopt(result, CURLOPT_POSTREDIR, CURL_REDIR_POST_ALL);
294 #elif LIBCURL_VERSION_NUM >= 0x071101
295 curl_easy_setopt(result, CURLOPT_POST301, 1);
296 #endif
298 if (getenv("GIT_CURL_VERBOSE"))
299 curl_easy_setopt(result, CURLOPT_VERBOSE, 1);
301 curl_easy_setopt(result, CURLOPT_USERAGENT,
302 user_agent ? user_agent : GIT_HTTP_USER_AGENT);
304 if (curl_ftp_no_epsv)
305 curl_easy_setopt(result, CURLOPT_FTP_USE_EPSV, 0);
307 if (curl_http_proxy) {
308 curl_easy_setopt(result, CURLOPT_PROXY, curl_http_proxy);
309 curl_easy_setopt(result, CURLOPT_PROXYAUTH, CURLAUTH_ANY);
312 return result;
/*
 * Overwrite *var with the value of the environment variable envname.
 * *var is left untouched when that variable is not set.
 */
static void set_from_env(const char **var, const char *envname)
{
	const char *from_env = getenv(envname);

	if (from_env == NULL)
		return;
	*var = from_env;
}

322 void http_init(struct remote *remote, const char *url, int proactive_auth)
324 char *low_speed_limit;
325 char *low_speed_time;
327 http_is_verbose = 0;
329 git_config(http_options, NULL);
331 curl_global_init(CURL_GLOBAL_ALL);
333 http_proactive_auth = proactive_auth;
335 if (remote && remote->http_proxy)
336 curl_http_proxy = xstrdup(remote->http_proxy);
338 pragma_header = curl_slist_append(pragma_header, "Pragma: no-cache");
339 no_pragma_header = curl_slist_append(no_pragma_header, "Pragma:");
341 #ifdef USE_CURL_MULTI
343 char *http_max_requests = getenv("GIT_HTTP_MAX_REQUESTS");
344 if (http_max_requests != NULL)
345 max_requests = atoi(http_max_requests);
348 curlm = curl_multi_init();
349 if (curlm == NULL) {
350 fprintf(stderr, "Error creating curl multi handle.\n");
351 exit(1);
353 #endif
355 if (getenv("GIT_SSL_NO_VERIFY"))
356 curl_ssl_verify = 0;
358 set_from_env(&ssl_cert, "GIT_SSL_CERT");
359 #if LIBCURL_VERSION_NUM >= 0x070903
360 set_from_env(&ssl_key, "GIT_SSL_KEY");
361 #endif
362 #if LIBCURL_VERSION_NUM >= 0x070908
363 set_from_env(&ssl_capath, "GIT_SSL_CAPATH");
364 #endif
365 set_from_env(&ssl_cainfo, "GIT_SSL_CAINFO");
367 set_from_env(&user_agent, "GIT_HTTP_USER_AGENT");
369 low_speed_limit = getenv("GIT_HTTP_LOW_SPEED_LIMIT");
370 if (low_speed_limit != NULL)
371 curl_low_speed_limit = strtol(low_speed_limit, NULL, 10);
372 low_speed_time = getenv("GIT_HTTP_LOW_SPEED_TIME");
373 if (low_speed_time != NULL)
374 curl_low_speed_time = strtol(low_speed_time, NULL, 10);
376 if (curl_ssl_verify == -1)
377 curl_ssl_verify = 1;
379 curl_session_count = 0;
380 #ifdef USE_CURL_MULTI
381 if (max_requests < 1)
382 max_requests = DEFAULT_MAX_REQUESTS;
383 #endif
385 if (getenv("GIT_CURL_FTP_NO_EPSV"))
386 curl_ftp_no_epsv = 1;
388 if (url) {
389 credential_from_url(&http_auth, url);
390 if (!ssl_cert_password_required &&
391 getenv("GIT_SSL_CERT_PASSWORD_PROTECTED") &&
392 !prefixcmp(url, "https://"))
393 ssl_cert_password_required = 1;
396 #ifndef NO_CURL_EASY_DUPHANDLE
397 curl_default = get_curl_handle();
398 #endif
401 void http_cleanup(void)
403 struct active_request_slot *slot = active_queue_head;
405 while (slot != NULL) {
406 struct active_request_slot *next = slot->next;
407 if (slot->curl != NULL) {
408 #ifdef USE_CURL_MULTI
409 curl_multi_remove_handle(curlm, slot->curl);
410 #endif
411 curl_easy_cleanup(slot->curl);
413 free(slot);
414 slot = next;
416 active_queue_head = NULL;
418 #ifndef NO_CURL_EASY_DUPHANDLE
419 curl_easy_cleanup(curl_default);
420 #endif
422 #ifdef USE_CURL_MULTI
423 curl_multi_cleanup(curlm);
424 #endif
425 curl_global_cleanup();
427 curl_slist_free_all(pragma_header);
428 pragma_header = NULL;
430 curl_slist_free_all(no_pragma_header);
431 no_pragma_header = NULL;
433 if (curl_http_proxy) {
434 free((void *)curl_http_proxy);
435 curl_http_proxy = NULL;
438 if (cert_auth.password != NULL) {
439 memset(cert_auth.password, 0, strlen(cert_auth.password));
440 free(cert_auth.password);
441 cert_auth.password = NULL;
443 ssl_cert_password_required = 0;
446 struct active_request_slot *get_active_slot(void)
448 struct active_request_slot *slot = active_queue_head;
449 struct active_request_slot *newslot;
451 #ifdef USE_CURL_MULTI
452 int num_transfers;
454 /* Wait for a slot to open up if the queue is full */
455 while (active_requests >= max_requests) {
456 curl_multi_perform(curlm, &num_transfers);
457 if (num_transfers < active_requests)
458 process_curl_messages();
460 #endif
462 while (slot != NULL && slot->in_use)
463 slot = slot->next;
465 if (slot == NULL) {
466 newslot = xmalloc(sizeof(*newslot));
467 newslot->curl = NULL;
468 newslot->in_use = 0;
469 newslot->next = NULL;
471 slot = active_queue_head;
472 if (slot == NULL) {
473 active_queue_head = newslot;
474 } else {
475 while (slot->next != NULL)
476 slot = slot->next;
477 slot->next = newslot;
479 slot = newslot;
482 if (slot->curl == NULL) {
483 #ifdef NO_CURL_EASY_DUPHANDLE
484 slot->curl = get_curl_handle();
485 #else
486 slot->curl = curl_easy_duphandle(curl_default);
487 #endif
488 curl_session_count++;
491 active_requests++;
492 slot->in_use = 1;
493 slot->results = NULL;
494 slot->finished = NULL;
495 slot->callback_data = NULL;
496 slot->callback_func = NULL;
497 curl_easy_setopt(slot->curl, CURLOPT_COOKIEFILE, curl_cookie_file);
498 curl_easy_setopt(slot->curl, CURLOPT_HTTPHEADER, pragma_header);
499 curl_easy_setopt(slot->curl, CURLOPT_ERRORBUFFER, curl_errorstr);
500 curl_easy_setopt(slot->curl, CURLOPT_CUSTOMREQUEST, NULL);
501 curl_easy_setopt(slot->curl, CURLOPT_READFUNCTION, NULL);
502 curl_easy_setopt(slot->curl, CURLOPT_WRITEFUNCTION, NULL);
503 curl_easy_setopt(slot->curl, CURLOPT_POSTFIELDS, NULL);
504 curl_easy_setopt(slot->curl, CURLOPT_UPLOAD, 0);
505 curl_easy_setopt(slot->curl, CURLOPT_HTTPGET, 1);
506 if (http_auth.password)
507 init_curl_http_auth(slot->curl);
509 return slot;
/*
 * Start the transfer prepared in slot.  With USE_CURL_MULTI the handle
 * is added to the multi handle and a first perform step is run; if the
 * handle cannot be added the slot is released again.
 *
 * Returns 1 on success, 0 if the request could not be started.
 */
int start_active_slot(struct active_request_slot *slot)
{
#ifdef USE_CURL_MULTI
	CURLMcode add_result = curl_multi_add_handle(curlm, slot->curl);
	int num_transfers;
	int added = (add_result == CURLM_OK ||
		     add_result == CURLM_CALL_MULTI_PERFORM);

	if (!added) {
		active_requests--;
		slot->in_use = 0;
		return 0;
	}

	/*
	 * We know there must be something to do, since we just added
	 * something.
	 */
	curl_multi_perform(curlm, &num_transfers);
#endif
	return 1;
}

534 #ifdef USE_CURL_MULTI
/*
 * One registered "fill" function together with the argument it is
 * called with.  Entries form a singly linked list.
 */
struct fill_chain {
	void *data;		/* passed to fill() on every call */
	int (*fill)(void *);	/* non-zero result stops the current scan */
	struct fill_chain *next;
};

/* Head of the list of registered fill functions. */
static struct fill_chain *fill_cfg;

543 void add_fill_function(void *data, int (*fill)(void *))
545 struct fill_chain *new = xmalloc(sizeof(*new));
546 struct fill_chain **linkp = &fill_cfg;
547 new->data = data;
548 new->fill = fill;
549 new->next = NULL;
550 while (*linkp)
551 linkp = &(*linkp)->next;
552 *linkp = new;
555 void fill_active_slots(void)
557 struct active_request_slot *slot = active_queue_head;
559 while (active_requests < max_requests) {
560 struct fill_chain *fill;
561 for (fill = fill_cfg; fill; fill = fill->next)
562 if (fill->fill(fill->data))
563 break;
565 if (!fill)
566 break;
569 while (slot != NULL) {
570 if (!slot->in_use && slot->curl != NULL
571 && curl_session_count > min_curl_sessions) {
572 curl_easy_cleanup(slot->curl);
573 slot->curl = NULL;
574 curl_session_count--;
576 slot = slot->next;
580 void step_active_slots(void)
582 int num_transfers;
583 CURLMcode curlm_result;
585 do {
586 curlm_result = curl_multi_perform(curlm, &num_transfers);
587 } while (curlm_result == CURLM_CALL_MULTI_PERFORM);
588 if (num_transfers < active_requests) {
589 process_curl_messages();
590 fill_active_slots();
593 #endif
595 void run_active_slot(struct active_request_slot *slot)
597 #ifdef USE_CURL_MULTI
598 fd_set readfds;
599 fd_set writefds;
600 fd_set excfds;
601 int max_fd;
602 struct timeval select_timeout;
603 int finished = 0;
605 slot->finished = &finished;
606 while (!finished) {
607 step_active_slots();
609 if (slot->in_use) {
610 #if LIBCURL_VERSION_NUM >= 0x070f04
611 long curl_timeout;
612 curl_multi_timeout(curlm, &curl_timeout);
613 if (curl_timeout == 0) {
614 continue;
615 } else if (curl_timeout == -1) {
616 select_timeout.tv_sec = 0;
617 select_timeout.tv_usec = 50000;
618 } else {
619 select_timeout.tv_sec = curl_timeout / 1000;
620 select_timeout.tv_usec = (curl_timeout % 1000) * 1000;
622 #else
623 select_timeout.tv_sec = 0;
624 select_timeout.tv_usec = 50000;
625 #endif
627 max_fd = -1;
628 FD_ZERO(&readfds);
629 FD_ZERO(&writefds);
630 FD_ZERO(&excfds);
631 curl_multi_fdset(curlm, &readfds, &writefds, &excfds, &max_fd);
633 select(max_fd+1, &readfds, &writefds, &excfds, &select_timeout);
636 #else
637 while (slot->in_use) {
638 slot->curl_result = curl_easy_perform(slot->curl);
639 finish_active_slot(slot);
641 #endif
644 static void closedown_active_slot(struct active_request_slot *slot)
646 active_requests--;
647 slot->in_use = 0;
650 static void release_active_slot(struct active_request_slot *slot)
652 closedown_active_slot(slot);
653 if (slot->curl && curl_session_count > min_curl_sessions) {
654 #ifdef USE_CURL_MULTI
655 curl_multi_remove_handle(curlm, slot->curl);
656 #endif
657 curl_easy_cleanup(slot->curl);
658 slot->curl = NULL;
659 curl_session_count--;
661 #ifdef USE_CURL_MULTI
662 fill_active_slots();
663 #endif
666 void finish_active_slot(struct active_request_slot *slot)
668 closedown_active_slot(slot);
669 curl_easy_getinfo(slot->curl, CURLINFO_HTTP_CODE, &slot->http_code);
671 if (slot->finished != NULL)
672 (*slot->finished) = 1;
674 /* Store slot results so they can be read after the slot is reused */
675 if (slot->results != NULL) {
676 slot->results->curl_result = slot->curl_result;
677 slot->results->http_code = slot->http_code;
680 /* Run callback if appropriate */
681 if (slot->callback_func != NULL)
682 slot->callback_func(slot->callback_data);
685 void finish_all_active_slots(void)
687 struct active_request_slot *slot = active_queue_head;
689 while (slot != NULL)
690 if (slot->in_use) {
691 run_active_slot(slot);
692 slot = active_queue_head;
693 } else {
694 slot = slot->next;
/* Helpers for modifying and creating URLs */

/*
 * Return 0 for characters that may appear in a URL unquoted (ASCII
 * letters, digits, '/', '-' and '.') and 1 for everything else.
 */
static inline int needs_quote(int ch)
{
	if (ch >= 'A' && ch <= 'Z')
		return 0;
	if (ch >= 'a' && ch <= 'z')
		return 0;
	if (ch >= '0' && ch <= '9')
		return 0;

	switch (ch) {
	case '/':
	case '-':
	case '.':
		return 0;
	default:
		return 1;
	}
}

711 static char *quote_ref_url(const char *base, const char *ref)
713 struct strbuf buf = STRBUF_INIT;
714 const char *cp;
715 int ch;
717 end_url_with_slash(&buf, base);
719 for (cp = ref; (ch = *cp) != 0; cp++)
720 if (needs_quote(ch))
721 strbuf_addf(&buf, "%%%02x", ch);
722 else
723 strbuf_addch(&buf, *cp);
725 return strbuf_detach(&buf, NULL);
/*
 * Append the URL of the object named by hex below url to buf:
 * "<url>/objects/<first two hex digits>/", followed by the remaining
 * digits unless only_two_digit_prefix is set.
 */
void append_remote_object_url(struct strbuf *buf, const char *url,
			      const char *hex,
			      int only_two_digit_prefix)
{
	end_url_with_slash(buf, url);

	strbuf_addf(buf, "objects/%.*s/", 2, hex);
	if (only_two_digit_prefix)
		return;
	strbuf_addf(buf, "%s", hex+2);
}

739 char *get_remote_object_url(const char *url, const char *hex,
740 int only_two_digit_prefix)
742 struct strbuf buf = STRBUF_INIT;
743 append_remote_object_url(&buf, url, hex, only_two_digit_prefix);
744 return strbuf_detach(&buf, NULL);
747 /* http_request() targets */
748 #define HTTP_REQUEST_STRBUF 0
749 #define HTTP_REQUEST_FILE 1
751 static int http_request(const char *url, void *result, int target, int options)
753 struct active_request_slot *slot;
754 struct slot_results results;
755 struct curl_slist *headers = NULL;
756 struct strbuf buf = STRBUF_INIT;
757 int ret;
759 slot = get_active_slot();
760 slot->results = &results;
761 curl_easy_setopt(slot->curl, CURLOPT_HTTPGET, 1);
763 if (result == NULL) {
764 curl_easy_setopt(slot->curl, CURLOPT_NOBODY, 1);
765 } else {
766 curl_easy_setopt(slot->curl, CURLOPT_NOBODY, 0);
767 curl_easy_setopt(slot->curl, CURLOPT_FILE, result);
769 if (target == HTTP_REQUEST_FILE) {
770 long posn = ftell(result);
771 curl_easy_setopt(slot->curl, CURLOPT_WRITEFUNCTION,
772 fwrite);
773 if (posn > 0) {
774 strbuf_addf(&buf, "Range: bytes=%ld-", posn);
775 headers = curl_slist_append(headers, buf.buf);
776 strbuf_reset(&buf);
778 } else
779 curl_easy_setopt(slot->curl, CURLOPT_WRITEFUNCTION,
780 fwrite_buffer);
783 strbuf_addstr(&buf, "Pragma:");
784 if (options & HTTP_NO_CACHE)
785 strbuf_addstr(&buf, " no-cache");
787 headers = curl_slist_append(headers, buf.buf);
789 curl_easy_setopt(slot->curl, CURLOPT_URL, url);
790 curl_easy_setopt(slot->curl, CURLOPT_HTTPHEADER, headers);
792 if (start_active_slot(slot)) {
793 run_active_slot(slot);
794 if (results.curl_result == CURLE_OK)
795 ret = HTTP_OK;
796 else if (missing_target(&results))
797 ret = HTTP_MISSING_TARGET;
798 else if (results.http_code == 401) {
799 if (http_auth.username && http_auth.password) {
800 credential_reject(&http_auth);
801 ret = HTTP_NOAUTH;
802 } else {
803 credential_fill(&http_auth);
804 init_curl_http_auth(slot->curl);
805 ret = HTTP_REAUTH;
807 } else {
808 if (!curl_errorstr[0])
809 strlcpy(curl_errorstr,
810 curl_easy_strerror(results.curl_result),
811 sizeof(curl_errorstr));
812 ret = HTTP_ERROR;
814 } else {
815 error("Unable to start HTTP request for %s", url);
816 ret = HTTP_START_FAILED;
819 curl_slist_free_all(headers);
820 strbuf_release(&buf);
822 if (ret == HTTP_OK)
823 credential_approve(&http_auth);
825 return ret;
828 static int http_request_reauth(const char *url, void *result, int target,
829 int options)
831 int ret = http_request(url, result, target, options);
832 if (ret != HTTP_REAUTH)
833 return ret;
834 return http_request(url, result, target, options);
837 int http_get_strbuf(const char *url, struct strbuf *result, int options)
839 return http_request_reauth(url, result, HTTP_REQUEST_STRBUF, options);
843 * Downloads a URL and stores the result in the given file.
845 * If a previous interrupted download is detected (i.e. a previous temporary
846 * file is still around) the download is resumed.
848 static int http_get_file(const char *url, const char *filename, int options)
850 int ret;
851 struct strbuf tmpfile = STRBUF_INIT;
852 FILE *result;
854 strbuf_addf(&tmpfile, "%s.temp", filename);
855 result = fopen(tmpfile.buf, "a");
856 if (! result) {
857 error("Unable to open local file %s", tmpfile.buf);
858 ret = HTTP_ERROR;
859 goto cleanup;
862 ret = http_request_reauth(url, result, HTTP_REQUEST_FILE, options);
863 fclose(result);
865 if ((ret == HTTP_OK) && move_temp_to_file(tmpfile.buf, filename))
866 ret = HTTP_ERROR;
867 cleanup:
868 strbuf_release(&tmpfile);
869 return ret;
872 int http_error(const char *url, int ret)
874 /* http_request has already handled HTTP_START_FAILED. */
875 if (ret != HTTP_START_FAILED)
876 error("%s while accessing %s", curl_errorstr, url);
878 return ret;
881 int http_fetch_ref(const char *base, struct ref *ref)
883 char *url;
884 struct strbuf buffer = STRBUF_INIT;
885 int ret = -1;
887 url = quote_ref_url(base, ref->name);
888 if (http_get_strbuf(url, &buffer, HTTP_NO_CACHE) == HTTP_OK) {
889 strbuf_rtrim(&buffer);
890 if (buffer.len == 40)
891 ret = get_sha1_hex(buffer.buf, ref->old_sha1);
892 else if (!prefixcmp(buffer.buf, "ref: ")) {
893 ref->symref = xstrdup(buffer.buf + 5);
894 ret = 0;
898 strbuf_release(&buffer);
899 free(url);
900 return ret;
903 /* Helpers for fetching packs */
904 static char *fetch_pack_index(unsigned char *sha1, const char *base_url)
906 char *url, *tmp;
907 struct strbuf buf = STRBUF_INIT;
909 if (http_is_verbose)
910 fprintf(stderr, "Getting index for pack %s\n", sha1_to_hex(sha1));
912 end_url_with_slash(&buf, base_url);
913 strbuf_addf(&buf, "objects/pack/pack-%s.idx", sha1_to_hex(sha1));
914 url = strbuf_detach(&buf, NULL);
916 strbuf_addf(&buf, "%s.temp", sha1_pack_index_name(sha1));
917 tmp = strbuf_detach(&buf, NULL);
919 if (http_get_file(url, tmp, 0) != HTTP_OK) {
920 error("Unable to get pack index %s", url);
921 free(tmp);
922 tmp = NULL;
925 free(url);
926 return tmp;
929 static int fetch_and_setup_pack_index(struct packed_git **packs_head,
930 unsigned char *sha1, const char *base_url)
932 struct packed_git *new_pack;
933 char *tmp_idx = NULL;
934 int ret;
936 if (has_pack_index(sha1)) {
937 new_pack = parse_pack_index(sha1, NULL);
938 if (!new_pack)
939 return -1; /* parse_pack_index() already issued error message */
940 goto add_pack;
943 tmp_idx = fetch_pack_index(sha1, base_url);
944 if (!tmp_idx)
945 return -1;
947 new_pack = parse_pack_index(sha1, tmp_idx);
948 if (!new_pack) {
949 unlink(tmp_idx);
950 free(tmp_idx);
952 return -1; /* parse_pack_index() already issued error message */
955 ret = verify_pack_index(new_pack);
956 if (!ret) {
957 close_pack_index(new_pack);
958 ret = move_temp_to_file(tmp_idx, sha1_pack_index_name(sha1));
960 free(tmp_idx);
961 if (ret)
962 return -1;
964 add_pack:
965 new_pack->next = *packs_head;
966 *packs_head = new_pack;
967 return 0;
970 int http_get_info_packs(const char *base_url, struct packed_git **packs_head)
972 int ret = 0, i = 0;
973 char *url, *data;
974 struct strbuf buf = STRBUF_INIT;
975 unsigned char sha1[20];
977 end_url_with_slash(&buf, base_url);
978 strbuf_addstr(&buf, "objects/info/packs");
979 url = strbuf_detach(&buf, NULL);
981 ret = http_get_strbuf(url, &buf, HTTP_NO_CACHE);
982 if (ret != HTTP_OK)
983 goto cleanup;
985 data = buf.buf;
986 while (i < buf.len) {
987 switch (data[i]) {
988 case 'P':
989 i++;
990 if (i + 52 <= buf.len &&
991 !prefixcmp(data + i, " pack-") &&
992 !prefixcmp(data + i + 46, ".pack\n")) {
993 get_sha1_hex(data + i + 6, sha1);
994 fetch_and_setup_pack_index(packs_head, sha1,
995 base_url);
996 i += 51;
997 break;
999 default:
1000 while (i < buf.len && data[i] != '\n')
1001 i++;
1003 i++;
1006 cleanup:
1007 free(url);
1008 return ret;
1011 void release_http_pack_request(struct http_pack_request *preq)
1013 if (preq->packfile != NULL) {
1014 fclose(preq->packfile);
1015 preq->packfile = NULL;
1017 if (preq->range_header != NULL) {
1018 curl_slist_free_all(preq->range_header);
1019 preq->range_header = NULL;
1021 preq->slot = NULL;
1022 free(preq->url);
1025 int finish_http_pack_request(struct http_pack_request *preq)
1027 struct packed_git **lst;
1028 struct packed_git *p = preq->target;
1029 char *tmp_idx;
1030 struct child_process ip;
1031 const char *ip_argv[8];
1033 close_pack_index(p);
1035 fclose(preq->packfile);
1036 preq->packfile = NULL;
1038 lst = preq->lst;
1039 while (*lst != p)
1040 lst = &((*lst)->next);
1041 *lst = (*lst)->next;
1043 tmp_idx = xstrdup(preq->tmpfile);
1044 strcpy(tmp_idx + strlen(tmp_idx) - strlen(".pack.temp"),
1045 ".idx.temp");
1047 ip_argv[0] = "index-pack";
1048 ip_argv[1] = "-o";
1049 ip_argv[2] = tmp_idx;
1050 ip_argv[3] = preq->tmpfile;
1051 ip_argv[4] = NULL;
1053 memset(&ip, 0, sizeof(ip));
1054 ip.argv = ip_argv;
1055 ip.git_cmd = 1;
1056 ip.no_stdin = 1;
1057 ip.no_stdout = 1;
1059 if (run_command(&ip)) {
1060 unlink(preq->tmpfile);
1061 unlink(tmp_idx);
1062 free(tmp_idx);
1063 return -1;
1066 unlink(sha1_pack_index_name(p->sha1));
1068 if (move_temp_to_file(preq->tmpfile, sha1_pack_name(p->sha1))
1069 || move_temp_to_file(tmp_idx, sha1_pack_index_name(p->sha1))) {
1070 free(tmp_idx);
1071 return -1;
1074 install_packed_git(p);
1075 free(tmp_idx);
1076 return 0;
1079 struct http_pack_request *new_http_pack_request(
1080 struct packed_git *target, const char *base_url)
1082 long prev_posn = 0;
1083 char range[RANGE_HEADER_SIZE];
1084 struct strbuf buf = STRBUF_INIT;
1085 struct http_pack_request *preq;
1087 preq = xcalloc(1, sizeof(*preq));
1088 preq->target = target;
1090 end_url_with_slash(&buf, base_url);
1091 strbuf_addf(&buf, "objects/pack/pack-%s.pack",
1092 sha1_to_hex(target->sha1));
1093 preq->url = strbuf_detach(&buf, NULL);
1095 snprintf(preq->tmpfile, sizeof(preq->tmpfile), "%s.temp",
1096 sha1_pack_name(target->sha1));
1097 preq->packfile = fopen(preq->tmpfile, "a");
1098 if (!preq->packfile) {
1099 error("Unable to open local file %s for pack",
1100 preq->tmpfile);
1101 goto abort;
1104 preq->slot = get_active_slot();
1105 curl_easy_setopt(preq->slot->curl, CURLOPT_FILE, preq->packfile);
1106 curl_easy_setopt(preq->slot->curl, CURLOPT_WRITEFUNCTION, fwrite);
1107 curl_easy_setopt(preq->slot->curl, CURLOPT_URL, preq->url);
1108 curl_easy_setopt(preq->slot->curl, CURLOPT_HTTPHEADER,
1109 no_pragma_header);
1112 * If there is data present from a previous transfer attempt,
1113 * resume where it left off
1115 prev_posn = ftell(preq->packfile);
1116 if (prev_posn>0) {
1117 if (http_is_verbose)
1118 fprintf(stderr,
1119 "Resuming fetch of pack %s at byte %ld\n",
1120 sha1_to_hex(target->sha1), prev_posn);
1121 sprintf(range, "Range: bytes=%ld-", prev_posn);
1122 preq->range_header = curl_slist_append(NULL, range);
1123 curl_easy_setopt(preq->slot->curl, CURLOPT_HTTPHEADER,
1124 preq->range_header);
1127 return preq;
1129 abort:
1130 free(preq->url);
1131 free(preq);
1132 return NULL;
1135 /* Helpers for fetching objects (loose) */
1136 static size_t fwrite_sha1_file(char *ptr, size_t eltsize, size_t nmemb,
1137 void *data)
1139 unsigned char expn[4096];
1140 size_t size = eltsize * nmemb;
1141 int posn = 0;
1142 struct http_object_request *freq =
1143 (struct http_object_request *)data;
1144 do {
1145 ssize_t retval = xwrite(freq->localfile,
1146 (char *) ptr + posn, size - posn);
1147 if (retval < 0)
1148 return posn;
1149 posn += retval;
1150 } while (posn < size);
1152 freq->stream.avail_in = size;
1153 freq->stream.next_in = (void *)ptr;
1154 do {
1155 freq->stream.next_out = expn;
1156 freq->stream.avail_out = sizeof(expn);
1157 freq->zret = git_inflate(&freq->stream, Z_SYNC_FLUSH);
1158 git_SHA1_Update(&freq->c, expn,
1159 sizeof(expn) - freq->stream.avail_out);
1160 } while (freq->stream.avail_in && freq->zret == Z_OK);
1161 return size;
1164 struct http_object_request *new_http_object_request(const char *base_url,
1165 unsigned char *sha1)
1167 char *hex = sha1_to_hex(sha1);
1168 char *filename;
1169 char prevfile[PATH_MAX];
1170 int prevlocal;
1171 char prev_buf[PREV_BUF_SIZE];
1172 ssize_t prev_read = 0;
1173 long prev_posn = 0;
1174 char range[RANGE_HEADER_SIZE];
1175 struct curl_slist *range_header = NULL;
1176 struct http_object_request *freq;
1178 freq = xcalloc(1, sizeof(*freq));
1179 hashcpy(freq->sha1, sha1);
1180 freq->localfile = -1;
1182 filename = sha1_file_name(sha1);
1183 snprintf(freq->tmpfile, sizeof(freq->tmpfile),
1184 "%s.temp", filename);
1186 snprintf(prevfile, sizeof(prevfile), "%s.prev", filename);
1187 unlink_or_warn(prevfile);
1188 rename(freq->tmpfile, prevfile);
1189 unlink_or_warn(freq->tmpfile);
1191 if (freq->localfile != -1)
1192 error("fd leakage in start: %d", freq->localfile);
1193 freq->localfile = open(freq->tmpfile,
1194 O_WRONLY | O_CREAT | O_EXCL, 0666);
1196 * This could have failed due to the "lazy directory creation";
1197 * try to mkdir the last path component.
1199 if (freq->localfile < 0 && errno == ENOENT) {
1200 char *dir = strrchr(freq->tmpfile, '/');
1201 if (dir) {
1202 *dir = 0;
1203 mkdir(freq->tmpfile, 0777);
1204 *dir = '/';
1206 freq->localfile = open(freq->tmpfile,
1207 O_WRONLY | O_CREAT | O_EXCL, 0666);
1210 if (freq->localfile < 0) {
1211 error("Couldn't create temporary file %s: %s",
1212 freq->tmpfile, strerror(errno));
1213 goto abort;
1216 git_inflate_init(&freq->stream);
1218 git_SHA1_Init(&freq->c);
1220 freq->url = get_remote_object_url(base_url, hex, 0);
1223 * If a previous temp file is present, process what was already
1224 * fetched.
1226 prevlocal = open(prevfile, O_RDONLY);
1227 if (prevlocal != -1) {
1228 do {
1229 prev_read = xread(prevlocal, prev_buf, PREV_BUF_SIZE);
1230 if (prev_read>0) {
1231 if (fwrite_sha1_file(prev_buf,
1233 prev_read,
1234 freq) == prev_read) {
1235 prev_posn += prev_read;
1236 } else {
1237 prev_read = -1;
1240 } while (prev_read > 0);
1241 close(prevlocal);
1243 unlink_or_warn(prevfile);
1246 * Reset inflate/SHA1 if there was an error reading the previous temp
1247 * file; also rewind to the beginning of the local file.
1249 if (prev_read == -1) {
1250 memset(&freq->stream, 0, sizeof(freq->stream));
1251 git_inflate_init(&freq->stream);
1252 git_SHA1_Init(&freq->c);
1253 if (prev_posn>0) {
1254 prev_posn = 0;
1255 lseek(freq->localfile, 0, SEEK_SET);
1256 if (ftruncate(freq->localfile, 0) < 0) {
1257 error("Couldn't truncate temporary file %s: %s",
1258 freq->tmpfile, strerror(errno));
1259 goto abort;
1264 freq->slot = get_active_slot();
1266 curl_easy_setopt(freq->slot->curl, CURLOPT_FILE, freq);
1267 curl_easy_setopt(freq->slot->curl, CURLOPT_WRITEFUNCTION, fwrite_sha1_file);
1268 curl_easy_setopt(freq->slot->curl, CURLOPT_ERRORBUFFER, freq->errorstr);
1269 curl_easy_setopt(freq->slot->curl, CURLOPT_URL, freq->url);
1270 curl_easy_setopt(freq->slot->curl, CURLOPT_HTTPHEADER, no_pragma_header);
1273 * If we have successfully processed data from a previous fetch
1274 * attempt, only fetch the data we don't already have.
1276 if (prev_posn>0) {
1277 if (http_is_verbose)
1278 fprintf(stderr,
1279 "Resuming fetch of object %s at byte %ld\n",
1280 hex, prev_posn);
1281 sprintf(range, "Range: bytes=%ld-", prev_posn);
1282 range_header = curl_slist_append(range_header, range);
1283 curl_easy_setopt(freq->slot->curl,
1284 CURLOPT_HTTPHEADER, range_header);
1287 return freq;
1289 abort:
1290 free(freq->url);
1291 free(freq);
1292 return NULL;
1295 void process_http_object_request(struct http_object_request *freq)
1297 if (freq->slot == NULL)
1298 return;
1299 freq->curl_result = freq->slot->curl_result;
1300 freq->http_code = freq->slot->http_code;
1301 freq->slot = NULL;
1304 int finish_http_object_request(struct http_object_request *freq)
1306 struct stat st;
1308 close(freq->localfile);
1309 freq->localfile = -1;
1311 process_http_object_request(freq);
1313 if (freq->http_code == 416) {
1314 warning("requested range invalid; we may already have all the data.");
1315 } else if (freq->curl_result != CURLE_OK) {
1316 if (stat(freq->tmpfile, &st) == 0)
1317 if (st.st_size == 0)
1318 unlink_or_warn(freq->tmpfile);
1319 return -1;
1322 git_inflate_end(&freq->stream);
1323 git_SHA1_Final(freq->real_sha1, &freq->c);
1324 if (freq->zret != Z_STREAM_END) {
1325 unlink_or_warn(freq->tmpfile);
1326 return -1;
1328 if (hashcmp(freq->sha1, freq->real_sha1)) {
1329 unlink_or_warn(freq->tmpfile);
1330 return -1;
1332 freq->rename =
1333 move_temp_to_file(freq->tmpfile, sha1_file_name(freq->sha1));
1335 return freq->rename;
1338 void abort_http_object_request(struct http_object_request *freq)
1340 unlink_or_warn(freq->tmpfile);
1342 release_http_object_request(freq);
1345 void release_http_object_request(struct http_object_request *freq)
1347 if (freq->localfile != -1) {
1348 close(freq->localfile);
1349 freq->localfile = -1;
1351 if (freq->url != NULL) {
1352 free(freq->url);
1353 freq->url = NULL;
1355 if (freq->slot != NULL) {
1356 freq->slot->callback_func = NULL;
1357 freq->slot->callback_data = NULL;
1358 release_active_slot(freq->slot);
1359 freq->slot = NULL;