diffcore-delta: make the hash a bit denser.
[git/jnareb-git.git] / http-fetch.c
blob 8fd9de081fc636dc2d5010caea9686caa901c91f
1 #include "cache.h"
2 #include "commit.h"
3 #include "pack.h"
4 #include "fetch.h"
5 #include "http.h"
/* Size of the scratch buffer used when replaying a leftover temp file. */
#define PREV_BUF_SIZE 4096
/* Size of the stack buffer that receives a formatted "Range:" header. */
#define RANGE_HEADER_SIZE 30

/*
 * State of the alternates lookup:
 *   -1  not fetched yet, or the fetch failed
 *    0  a fetch is in progress
 *    1  the alternates list has been processed
 */
static int got_alternates = -1;

/* Header list carrying an empty "Pragma:" header; filled in by main(). */
static struct curl_slist *no_pragma_header;
/* One repository base URL to fetch from; alternates are chained via next. */
struct alt_base
{
	char *base;			/* base URL of the repository */
	int got_indices;		/* non-zero once fetch_indices() is done with it */
	struct packed_git *packs;	/* pack indices registered for this repository */
	struct alt_base *next;		/* next alternate, or NULL at the end */
};

/* Head of the repository list; main() points it at the command-line URL. */
static struct alt_base *alt = NULL;
/* Life cycle of a queued loose-object request. */
enum object_request_state {
	WAITING,	/* queued by prefetch(), transfer not started */
	ABORTED,	/* the transfer could not be set up or started */
	ACTIVE,		/* handed to an active request slot */
	COMPLETE,	/* response processed, or the object was already present */
};
31 struct object_request
33 unsigned char sha1[20];
34 struct alt_base *repo;
35 char *url;
36 char filename[PATH_MAX];
37 char tmpfile[PATH_MAX];
38 int local;
39 enum object_request_state state;
40 CURLcode curl_result;
41 char errorstr[CURL_ERROR_SIZE];
42 long http_code;
43 unsigned char real_sha1[20];
44 SHA_CTX c;
45 z_stream stream;
46 int zret;
47 int rename;
48 struct active_request_slot *slot;
49 struct object_request *next;
/* Context handed to process_alternates_response() through the slot callback. */
struct alternates_request {
	char *base;			/* base URL whose alternates are wanted */
	char *url;			/* request URL; rewritten for the fallback file */
	struct buffer *buffer;		/* receives the response body */
	struct active_request_slot *slot;	/* slot carrying the request */
	int http_specific;		/* 1 for "http-alternates", 0 for "alternates" */
};
/* Singly linked queue of pending object requests; prefetch() appends to it. */
static struct object_request *object_queue_head = NULL;
62 static size_t fwrite_sha1_file(void *ptr, size_t eltsize, size_t nmemb,
63 void *data)
65 unsigned char expn[4096];
66 size_t size = eltsize * nmemb;
67 int posn = 0;
68 struct object_request *obj_req = (struct object_request *)data;
69 do {
70 ssize_t retval = write(obj_req->local,
71 ptr + posn, size - posn);
72 if (retval < 0)
73 return posn;
74 posn += retval;
75 } while (posn < size);
77 obj_req->stream.avail_in = size;
78 obj_req->stream.next_in = ptr;
79 do {
80 obj_req->stream.next_out = expn;
81 obj_req->stream.avail_out = sizeof(expn);
82 obj_req->zret = inflate(&obj_req->stream, Z_SYNC_FLUSH);
83 SHA1_Update(&obj_req->c, expn,
84 sizeof(expn) - obj_req->stream.avail_out);
85 } while (obj_req->stream.avail_in && obj_req->zret == Z_OK);
86 data_received++;
87 return size;
/* Defined further down; needed by process_object_response(). */
static void fetch_alternates(char *base);

/* Slot completion callback installed by start_object_request(). */
static void process_object_response(void *callback_data);
94 static void start_object_request(struct object_request *obj_req)
96 char *hex = sha1_to_hex(obj_req->sha1);
97 char prevfile[PATH_MAX];
98 char *url;
99 char *posn;
100 int prevlocal;
101 unsigned char prev_buf[PREV_BUF_SIZE];
102 ssize_t prev_read = 0;
103 long prev_posn = 0;
104 char range[RANGE_HEADER_SIZE];
105 struct curl_slist *range_header = NULL;
106 struct active_request_slot *slot;
108 snprintf(prevfile, sizeof(prevfile), "%s.prev", obj_req->filename);
109 unlink(prevfile);
110 rename(obj_req->tmpfile, prevfile);
111 unlink(obj_req->tmpfile);
113 if (obj_req->local != -1)
114 error("fd leakage in start: %d", obj_req->local);
115 obj_req->local = open(obj_req->tmpfile,
116 O_WRONLY | O_CREAT | O_EXCL, 0666);
117 /* This could have failed due to the "lazy directory creation";
118 * try to mkdir the last path component.
120 if (obj_req->local < 0 && errno == ENOENT) {
121 char *dir = strrchr(obj_req->tmpfile, '/');
122 if (dir) {
123 *dir = 0;
124 mkdir(obj_req->tmpfile, 0777);
125 *dir = '/';
127 obj_req->local = open(obj_req->tmpfile,
128 O_WRONLY | O_CREAT | O_EXCL, 0666);
131 if (obj_req->local < 0) {
132 obj_req->state = ABORTED;
133 error("Couldn't create temporary file %s for %s: %s",
134 obj_req->tmpfile, obj_req->filename, strerror(errno));
135 return;
138 memset(&obj_req->stream, 0, sizeof(obj_req->stream));
140 inflateInit(&obj_req->stream);
142 SHA1_Init(&obj_req->c);
144 url = xmalloc(strlen(obj_req->repo->base) + 50);
145 obj_req->url = xmalloc(strlen(obj_req->repo->base) + 50);
146 strcpy(url, obj_req->repo->base);
147 posn = url + strlen(obj_req->repo->base);
148 strcpy(posn, "objects/");
149 posn += 8;
150 memcpy(posn, hex, 2);
151 posn += 2;
152 *(posn++) = '/';
153 strcpy(posn, hex + 2);
154 strcpy(obj_req->url, url);
156 /* If a previous temp file is present, process what was already
157 fetched. */
158 prevlocal = open(prevfile, O_RDONLY);
159 if (prevlocal != -1) {
160 do {
161 prev_read = read(prevlocal, prev_buf, PREV_BUF_SIZE);
162 if (prev_read>0) {
163 if (fwrite_sha1_file(prev_buf,
165 prev_read,
166 obj_req) == prev_read) {
167 prev_posn += prev_read;
168 } else {
169 prev_read = -1;
172 } while (prev_read > 0);
173 close(prevlocal);
175 unlink(prevfile);
177 /* Reset inflate/SHA1 if there was an error reading the previous temp
178 file; also rewind to the beginning of the local file. */
179 if (prev_read == -1) {
180 memset(&obj_req->stream, 0, sizeof(obj_req->stream));
181 inflateInit(&obj_req->stream);
182 SHA1_Init(&obj_req->c);
183 if (prev_posn>0) {
184 prev_posn = 0;
185 lseek(obj_req->local, SEEK_SET, 0);
186 ftruncate(obj_req->local, 0);
190 slot = get_active_slot();
191 slot->callback_func = process_object_response;
192 slot->callback_data = obj_req;
193 obj_req->slot = slot;
195 curl_easy_setopt(slot->curl, CURLOPT_FILE, obj_req);
196 curl_easy_setopt(slot->curl, CURLOPT_WRITEFUNCTION, fwrite_sha1_file);
197 curl_easy_setopt(slot->curl, CURLOPT_ERRORBUFFER, obj_req->errorstr);
198 curl_easy_setopt(slot->curl, CURLOPT_URL, url);
199 curl_easy_setopt(slot->curl, CURLOPT_HTTPHEADER, no_pragma_header);
201 /* If we have successfully processed data from a previous fetch
202 attempt, only fetch the data we don't already have. */
203 if (prev_posn>0) {
204 if (get_verbosely)
205 fprintf(stderr,
206 "Resuming fetch of object %s at byte %ld\n",
207 hex, prev_posn);
208 sprintf(range, "Range: bytes=%ld-", prev_posn);
209 range_header = curl_slist_append(range_header, range);
210 curl_easy_setopt(slot->curl,
211 CURLOPT_HTTPHEADER, range_header);
214 /* Try to get the request started, abort the request on error */
215 obj_req->state = ACTIVE;
216 if (!start_active_slot(slot)) {
217 obj_req->state = ABORTED;
218 obj_req->slot = NULL;
219 close(obj_req->local); obj_req->local = -1;
220 free(obj_req->url);
221 return;
225 static void finish_object_request(struct object_request *obj_req)
227 struct stat st;
229 fchmod(obj_req->local, 0444);
230 close(obj_req->local); obj_req->local = -1;
232 if (obj_req->http_code == 416) {
233 fprintf(stderr, "Warning: requested range invalid; we may already have all the data.\n");
234 } else if (obj_req->curl_result != CURLE_OK) {
235 if (stat(obj_req->tmpfile, &st) == 0)
236 if (st.st_size == 0)
237 unlink(obj_req->tmpfile);
238 return;
241 inflateEnd(&obj_req->stream);
242 SHA1_Final(obj_req->real_sha1, &obj_req->c);
243 if (obj_req->zret != Z_STREAM_END) {
244 unlink(obj_req->tmpfile);
245 return;
247 if (memcmp(obj_req->sha1, obj_req->real_sha1, 20)) {
248 unlink(obj_req->tmpfile);
249 return;
251 obj_req->rename =
252 move_temp_to_file(obj_req->tmpfile, obj_req->filename);
254 if (obj_req->rename == 0)
255 pull_say("got %s\n", sha1_to_hex(obj_req->sha1));
258 static void process_object_response(void *callback_data)
260 struct object_request *obj_req =
261 (struct object_request *)callback_data;
263 obj_req->curl_result = obj_req->slot->curl_result;
264 obj_req->http_code = obj_req->slot->http_code;
265 obj_req->slot = NULL;
266 obj_req->state = COMPLETE;
268 /* Use alternates if necessary */
269 if (obj_req->http_code == 404 ||
270 obj_req->curl_result == CURLE_FILE_COULDNT_READ_FILE) {
271 fetch_alternates(alt->base);
272 if (obj_req->repo->next != NULL) {
273 obj_req->repo =
274 obj_req->repo->next;
275 close(obj_req->local);
276 obj_req->local = -1;
277 start_object_request(obj_req);
278 return;
282 finish_object_request(obj_req);
285 static void release_object_request(struct object_request *obj_req)
287 struct object_request *entry = object_queue_head;
289 if (obj_req->local != -1)
290 error("fd leakage in release: %d", obj_req->local);
291 if (obj_req == object_queue_head) {
292 object_queue_head = obj_req->next;
293 } else {
294 while (entry->next != NULL && entry->next != obj_req)
295 entry = entry->next;
296 if (entry->next == obj_req)
297 entry->next = entry->next->next;
300 free(obj_req->url);
301 free(obj_req);
#ifdef USE_CURL_MULTI
/*
 * Start waiting object requests while request capacity remains, then
 * dispose of the curl handles of slots that are not in use.
 */
void fill_active_slots(void)
{
	struct object_request *req = object_queue_head;
	struct active_request_slot *slot = active_queue_head;
	int num_transfers;

	for (; active_requests < max_requests && req != NULL;
	     req = req->next) {
		if (req->state != WAITING)
			continue;
		/* Nothing to download when the object is already here. */
		if (has_sha1_file(req->sha1))
			req->state = COMPLETE;
		else
			start_object_request(req);
		curl_multi_perform(curlm, &num_transfers);
	}

	for (; slot != NULL; slot = slot->next) {
		if (slot->in_use || slot->curl == NULL)
			continue;
		curl_easy_cleanup(slot->curl);
		slot->curl = NULL;
	}
}
#endif
332 void prefetch(unsigned char *sha1)
334 struct object_request *newreq;
335 struct object_request *tail;
336 char *filename = sha1_file_name(sha1);
338 newreq = xmalloc(sizeof(*newreq));
339 memcpy(newreq->sha1, sha1, 20);
340 newreq->repo = alt;
341 newreq->url = NULL;
342 newreq->local = -1;
343 newreq->state = WAITING;
344 snprintf(newreq->filename, sizeof(newreq->filename), "%s", filename);
345 snprintf(newreq->tmpfile, sizeof(newreq->tmpfile),
346 "%s.temp", filename);
347 newreq->next = NULL;
349 if (object_queue_head == NULL) {
350 object_queue_head = newreq;
351 } else {
352 tail = object_queue_head;
353 while (tail->next != NULL) {
354 tail = tail->next;
356 tail->next = newreq;
359 #ifdef USE_CURL_MULTI
360 fill_active_slots();
361 step_active_slots();
362 #endif
365 static int fetch_index(struct alt_base *repo, unsigned char *sha1)
367 char *hex = sha1_to_hex(sha1);
368 char *filename;
369 char *url;
370 char tmpfile[PATH_MAX];
371 long prev_posn = 0;
372 char range[RANGE_HEADER_SIZE];
373 struct curl_slist *range_header = NULL;
375 FILE *indexfile;
376 struct active_request_slot *slot;
377 struct slot_results results;
379 if (has_pack_index(sha1))
380 return 0;
382 if (get_verbosely)
383 fprintf(stderr, "Getting index for pack %s\n", hex);
385 url = xmalloc(strlen(repo->base) + 64);
386 sprintf(url, "%s/objects/pack/pack-%s.idx", repo->base, hex);
388 filename = sha1_pack_index_name(sha1);
389 snprintf(tmpfile, sizeof(tmpfile), "%s.temp", filename);
390 indexfile = fopen(tmpfile, "a");
391 if (!indexfile)
392 return error("Unable to open local file %s for pack index",
393 filename);
395 slot = get_active_slot();
396 slot->results = &results;
397 curl_easy_setopt(slot->curl, CURLOPT_FILE, indexfile);
398 curl_easy_setopt(slot->curl, CURLOPT_WRITEFUNCTION, fwrite);
399 curl_easy_setopt(slot->curl, CURLOPT_URL, url);
400 curl_easy_setopt(slot->curl, CURLOPT_HTTPHEADER, no_pragma_header);
401 slot->local = indexfile;
403 /* If there is data present from a previous transfer attempt,
404 resume where it left off */
405 prev_posn = ftell(indexfile);
406 if (prev_posn>0) {
407 if (get_verbosely)
408 fprintf(stderr,
409 "Resuming fetch of index for pack %s at byte %ld\n",
410 hex, prev_posn);
411 sprintf(range, "Range: bytes=%ld-", prev_posn);
412 range_header = curl_slist_append(range_header, range);
413 curl_easy_setopt(slot->curl, CURLOPT_HTTPHEADER, range_header);
416 if (start_active_slot(slot)) {
417 run_active_slot(slot);
418 if (results.curl_result != CURLE_OK) {
419 fclose(indexfile);
420 return error("Unable to get pack index %s\n%s", url,
421 curl_errorstr);
423 } else {
424 fclose(indexfile);
425 return error("Unable to start request");
428 fclose(indexfile);
430 return move_temp_to_file(tmpfile, filename);
433 static int setup_index(struct alt_base *repo, unsigned char *sha1)
435 struct packed_git *new_pack;
436 if (has_pack_file(sha1))
437 return 0; // don't list this as something we can get
439 if (fetch_index(repo, sha1))
440 return -1;
442 new_pack = parse_pack_index(sha1);
443 new_pack->next = repo->packs;
444 repo->packs = new_pack;
445 return 0;
448 static void process_alternates_response(void *callback_data)
450 struct alternates_request *alt_req =
451 (struct alternates_request *)callback_data;
452 struct active_request_slot *slot = alt_req->slot;
453 struct alt_base *tail = alt;
454 char *base = alt_req->base;
455 static const char null_byte = '\0';
456 char *data;
457 int i = 0;
459 if (alt_req->http_specific) {
460 if (slot->curl_result != CURLE_OK ||
461 !alt_req->buffer->posn) {
463 /* Try reusing the slot to get non-http alternates */
464 alt_req->http_specific = 0;
465 sprintf(alt_req->url, "%s/objects/info/alternates",
466 base);
467 curl_easy_setopt(slot->curl, CURLOPT_URL,
468 alt_req->url);
469 active_requests++;
470 slot->in_use = 1;
471 if (!start_active_slot(slot)) {
472 got_alternates = -1;
473 slot->in_use = 0;
475 return;
477 } else if (slot->curl_result != CURLE_OK) {
478 if (slot->http_code != 404 &&
479 slot->curl_result != CURLE_FILE_COULDNT_READ_FILE) {
480 got_alternates = -1;
481 return;
485 fwrite_buffer(&null_byte, 1, 1, alt_req->buffer);
486 alt_req->buffer->posn--;
487 data = alt_req->buffer->buffer;
489 while (i < alt_req->buffer->posn) {
490 int posn = i;
491 while (posn < alt_req->buffer->posn && data[posn] != '\n')
492 posn++;
493 if (data[posn] == '\n') {
494 int okay = 0;
495 int serverlen = 0;
496 struct alt_base *newalt;
497 char *target = NULL;
498 if (data[i] == '/') {
499 serverlen = strchr(base + 8, '/') - base;
500 okay = 1;
501 } else if (!memcmp(data + i, "../", 3)) {
502 i += 3;
503 serverlen = strlen(base);
504 while (i + 2 < posn &&
505 !memcmp(data + i, "../", 3)) {
506 do {
507 serverlen--;
508 } while (serverlen &&
509 base[serverlen - 1] != '/');
510 i += 3;
512 // If the server got removed, give up.
513 okay = strchr(base, ':') - base + 3 <
514 serverlen;
515 } else if (alt_req->http_specific) {
516 char *colon = strchr(data + i, ':');
517 char *slash = strchr(data + i, '/');
518 if (colon && slash && colon < data + posn &&
519 slash < data + posn && colon < slash) {
520 okay = 1;
523 // skip 'objects' at end
524 if (okay) {
525 target = xmalloc(serverlen + posn - i - 6);
526 strncpy(target, base, serverlen);
527 strncpy(target + serverlen, data + i,
528 posn - i - 7);
529 target[serverlen + posn - i - 7] = '\0';
530 if (get_verbosely)
531 fprintf(stderr,
532 "Also look at %s\n", target);
533 newalt = xmalloc(sizeof(*newalt));
534 newalt->next = NULL;
535 newalt->base = target;
536 newalt->got_indices = 0;
537 newalt->packs = NULL;
538 while (tail->next != NULL)
539 tail = tail->next;
540 tail->next = newalt;
543 i = posn + 1;
546 got_alternates = 1;
549 static void fetch_alternates(char *base)
551 struct buffer buffer;
552 char *url;
553 char *data;
554 struct active_request_slot *slot;
555 struct alternates_request alt_req;
557 /* If another request has already started fetching alternates,
558 wait for them to arrive and return to processing this request's
559 curl message */
560 #ifdef USE_CURL_MULTI
561 while (got_alternates == 0) {
562 step_active_slots();
564 #endif
566 /* Nothing to do if they've already been fetched */
567 if (got_alternates == 1)
568 return;
570 /* Start the fetch */
571 got_alternates = 0;
573 data = xmalloc(4096);
574 buffer.size = 4096;
575 buffer.posn = 0;
576 buffer.buffer = data;
578 if (get_verbosely)
579 fprintf(stderr, "Getting alternates list for %s\n", base);
581 url = xmalloc(strlen(base) + 31);
582 sprintf(url, "%s/objects/info/http-alternates", base);
584 /* Use a callback to process the result, since another request
585 may fail and need to have alternates loaded before continuing */
586 slot = get_active_slot();
587 slot->callback_func = process_alternates_response;
588 slot->callback_data = &alt_req;
590 curl_easy_setopt(slot->curl, CURLOPT_FILE, &buffer);
591 curl_easy_setopt(slot->curl, CURLOPT_WRITEFUNCTION, fwrite_buffer);
592 curl_easy_setopt(slot->curl, CURLOPT_URL, url);
594 alt_req.base = base;
595 alt_req.url = url;
596 alt_req.buffer = &buffer;
597 alt_req.http_specific = 1;
598 alt_req.slot = slot;
600 if (start_active_slot(slot))
601 run_active_slot(slot);
602 else
603 got_alternates = -1;
605 free(data);
606 free(url);
609 static int fetch_indices(struct alt_base *repo)
611 unsigned char sha1[20];
612 char *url;
613 struct buffer buffer;
614 char *data;
615 int i = 0;
617 struct active_request_slot *slot;
618 struct slot_results results;
620 if (repo->got_indices)
621 return 0;
623 data = xmalloc(4096);
624 buffer.size = 4096;
625 buffer.posn = 0;
626 buffer.buffer = data;
628 if (get_verbosely)
629 fprintf(stderr, "Getting pack list for %s\n", repo->base);
631 url = xmalloc(strlen(repo->base) + 21);
632 sprintf(url, "%s/objects/info/packs", repo->base);
634 slot = get_active_slot();
635 slot->results = &results;
636 curl_easy_setopt(slot->curl, CURLOPT_FILE, &buffer);
637 curl_easy_setopt(slot->curl, CURLOPT_WRITEFUNCTION, fwrite_buffer);
638 curl_easy_setopt(slot->curl, CURLOPT_URL, url);
639 curl_easy_setopt(slot->curl, CURLOPT_HTTPHEADER, NULL);
640 if (start_active_slot(slot)) {
641 run_active_slot(slot);
642 if (results.curl_result != CURLE_OK) {
643 if (results.http_code == 404 ||
644 results.curl_result == CURLE_FILE_COULDNT_READ_FILE) {
645 repo->got_indices = 1;
646 free(buffer.buffer);
647 return 0;
648 } else {
649 repo->got_indices = 0;
650 free(buffer.buffer);
651 return error("%s", curl_errorstr);
654 } else {
655 repo->got_indices = 0;
656 free(buffer.buffer);
657 return error("Unable to start request");
660 data = buffer.buffer;
661 while (i < buffer.posn) {
662 switch (data[i]) {
663 case 'P':
664 i++;
665 if (i + 52 <= buffer.posn &&
666 !strncmp(data + i, " pack-", 6) &&
667 !strncmp(data + i + 46, ".pack\n", 6)) {
668 get_sha1_hex(data + i + 6, sha1);
669 setup_index(repo, sha1);
670 i += 51;
671 break;
673 default:
674 while (i < buffer.posn && data[i] != '\n')
675 i++;
677 i++;
680 free(buffer.buffer);
681 repo->got_indices = 1;
682 return 0;
685 static int fetch_pack(struct alt_base *repo, unsigned char *sha1)
687 char *url;
688 struct packed_git *target;
689 struct packed_git **lst;
690 FILE *packfile;
691 char *filename;
692 char tmpfile[PATH_MAX];
693 int ret;
694 long prev_posn = 0;
695 char range[RANGE_HEADER_SIZE];
696 struct curl_slist *range_header = NULL;
698 struct active_request_slot *slot;
699 struct slot_results results;
701 if (fetch_indices(repo))
702 return -1;
703 target = find_sha1_pack(sha1, repo->packs);
704 if (!target)
705 return -1;
707 if (get_verbosely) {
708 fprintf(stderr, "Getting pack %s\n",
709 sha1_to_hex(target->sha1));
710 fprintf(stderr, " which contains %s\n",
711 sha1_to_hex(sha1));
714 url = xmalloc(strlen(repo->base) + 65);
715 sprintf(url, "%s/objects/pack/pack-%s.pack",
716 repo->base, sha1_to_hex(target->sha1));
718 filename = sha1_pack_name(target->sha1);
719 snprintf(tmpfile, sizeof(tmpfile), "%s.temp", filename);
720 packfile = fopen(tmpfile, "a");
721 if (!packfile)
722 return error("Unable to open local file %s for pack",
723 filename);
725 slot = get_active_slot();
726 slot->results = &results;
727 curl_easy_setopt(slot->curl, CURLOPT_FILE, packfile);
728 curl_easy_setopt(slot->curl, CURLOPT_WRITEFUNCTION, fwrite);
729 curl_easy_setopt(slot->curl, CURLOPT_URL, url);
730 curl_easy_setopt(slot->curl, CURLOPT_HTTPHEADER, no_pragma_header);
731 slot->local = packfile;
733 /* If there is data present from a previous transfer attempt,
734 resume where it left off */
735 prev_posn = ftell(packfile);
736 if (prev_posn>0) {
737 if (get_verbosely)
738 fprintf(stderr,
739 "Resuming fetch of pack %s at byte %ld\n",
740 sha1_to_hex(target->sha1), prev_posn);
741 sprintf(range, "Range: bytes=%ld-", prev_posn);
742 range_header = curl_slist_append(range_header, range);
743 curl_easy_setopt(slot->curl, CURLOPT_HTTPHEADER, range_header);
746 if (start_active_slot(slot)) {
747 run_active_slot(slot);
748 if (results.curl_result != CURLE_OK) {
749 fclose(packfile);
750 return error("Unable to get pack file %s\n%s", url,
751 curl_errorstr);
753 } else {
754 fclose(packfile);
755 return error("Unable to start request");
758 fclose(packfile);
760 ret = move_temp_to_file(tmpfile, filename);
761 if (ret)
762 return ret;
764 lst = &repo->packs;
765 while (*lst != target)
766 lst = &((*lst)->next);
767 *lst = (*lst)->next;
769 if (verify_pack(target, 0))
770 return -1;
771 install_packed_git(target);
773 return 0;
776 static void abort_object_request(struct object_request *obj_req)
778 if (obj_req->local >= 0) {
779 close(obj_req->local);
780 obj_req->local = -1;
782 unlink(obj_req->tmpfile);
783 if (obj_req->slot) {
784 release_active_slot(obj_req->slot);
785 obj_req->slot = NULL;
787 release_object_request(obj_req);
790 static int fetch_object(struct alt_base *repo, unsigned char *sha1)
792 char *hex = sha1_to_hex(sha1);
793 int ret = 0;
794 struct object_request *obj_req = object_queue_head;
796 while (obj_req != NULL && memcmp(obj_req->sha1, sha1, 20))
797 obj_req = obj_req->next;
798 if (obj_req == NULL)
799 return error("Couldn't find request for %s in the queue", hex);
801 if (has_sha1_file(obj_req->sha1)) {
802 abort_object_request(obj_req);
803 return 0;
806 #ifdef USE_CURL_MULTI
807 while (obj_req->state == WAITING) {
808 step_active_slots();
810 #else
811 start_object_request(obj_req);
812 #endif
814 while (obj_req->state == ACTIVE) {
815 run_active_slot(obj_req->slot);
817 if (obj_req->local != -1) {
818 close(obj_req->local); obj_req->local = -1;
821 if (obj_req->state == ABORTED) {
822 ret = error("Request for %s aborted", hex);
823 } else if (obj_req->curl_result != CURLE_OK &&
824 obj_req->http_code != 416) {
825 if (obj_req->http_code == 404 ||
826 obj_req->curl_result == CURLE_FILE_COULDNT_READ_FILE)
827 ret = -1; /* Be silent, it is probably in a pack. */
828 else
829 ret = error("%s (curl_result = %d, http_code = %ld, sha1 = %s)",
830 obj_req->errorstr, obj_req->curl_result,
831 obj_req->http_code, hex);
832 } else if (obj_req->zret != Z_STREAM_END) {
833 ret = error("File %s (%s) corrupt", hex, obj_req->url);
834 } else if (memcmp(obj_req->sha1, obj_req->real_sha1, 20)) {
835 ret = error("File %s has bad hash", hex);
836 } else if (obj_req->rename < 0) {
837 ret = error("unable to write sha1 filename %s",
838 obj_req->filename);
841 release_object_request(obj_req);
842 return ret;
845 int fetch(unsigned char *sha1)
847 struct alt_base *altbase = alt;
849 if (!fetch_object(altbase, sha1))
850 return 0;
851 while (altbase) {
852 if (!fetch_pack(altbase, sha1))
853 return 0;
854 fetch_alternates(alt->base);
855 altbase = altbase->next;
857 return error("Unable to find %s under %s", sha1_to_hex(sha1),
858 alt->base);
/*
 * Tell whether ch must be %-escaped when placed in a ref URL.
 *
 * ASCII letters, digits, '/', '-' and '.' are passed through unchanged
 * (returns 0); everything else has to be quoted (returns 1).
 *
 * Written with plain comparisons instead of the GNU "case 'A'...'Z'"
 * range extension so that it builds with any C compiler.
 */
static inline int needs_quote(int ch)
{
	if ((ch >= 'A' && ch <= 'Z') ||
	    (ch >= 'a' && ch <= 'z') ||
	    (ch >= '0' && ch <= '9'))
		return 0;

	switch (ch) {
	case '/': case '-': case '.':
		return 0;
	default:
		return 1;
	}
}
/* Map a nibble value (0..15) to its upper-case hexadecimal digit. */
static inline int hex(int v)
{
	return (v < 10) ? '0' + v : 'A' + v - 10;
}
/*
 * Build "<base>refs/<ref>" with every character of ref that needs_quote()
 * flags replaced by a %XX escape.  The result is freshly allocated and
 * owned by the caller.
 */
static char *quote_ref_url(const char *base, const char *ref)
{
	const char *src;
	char *dst, *qref;
	int len, baselen, ch;

	baselen = strlen(base);

	/* First pass: size the result ("refs/" + NUL account for the 6). */
	len = baselen + 6;
	for (src = ref; (ch = *src) != 0; src++)
		len += needs_quote(ch) ? 3 : 1;

	qref = xmalloc(len);
	memcpy(qref, base, baselen);
	memcpy(qref + baselen, "refs/", 5);

	/* Second pass: copy, escaping as we go. */
	dst = qref + baselen + 5;
	for (src = ref; (ch = *src) != 0; src++) {
		if (!needs_quote(ch)) {
			*dst++ = ch;
			continue;
		}
		*dst++ = '%';
		*dst++ = hex((ch >> 4) & 0xF);
		*dst++ = hex(ch & 0xF);
	}
	*dst = 0;

	return qref;
}
906 int fetch_ref(char *ref, unsigned char *sha1)
908 char *url;
909 char hex[42];
910 struct buffer buffer;
911 char *base = alt->base;
912 struct active_request_slot *slot;
913 struct slot_results results;
914 buffer.size = 41;
915 buffer.posn = 0;
916 buffer.buffer = hex;
917 hex[41] = '\0';
919 url = quote_ref_url(base, ref);
920 slot = get_active_slot();
921 slot->results = &results;
922 curl_easy_setopt(slot->curl, CURLOPT_FILE, &buffer);
923 curl_easy_setopt(slot->curl, CURLOPT_WRITEFUNCTION, fwrite_buffer);
924 curl_easy_setopt(slot->curl, CURLOPT_HTTPHEADER, NULL);
925 curl_easy_setopt(slot->curl, CURLOPT_URL, url);
926 if (start_active_slot(slot)) {
927 run_active_slot(slot);
928 if (results.curl_result != CURLE_OK)
929 return error("Couldn't get %s for %s\n%s",
930 url, ref, curl_errorstr);
931 } else {
932 return error("Unable to start request");
935 hex[40] = '\0';
936 get_sha1_hex(hex, sha1);
937 return 0;
940 int main(int argc, char **argv)
942 char *commit_id;
943 char *url;
944 int arg = 1;
945 int rc = 0;
947 setup_git_directory();
949 while (arg < argc && argv[arg][0] == '-') {
950 if (argv[arg][1] == 't') {
951 get_tree = 1;
952 } else if (argv[arg][1] == 'c') {
953 get_history = 1;
954 } else if (argv[arg][1] == 'a') {
955 get_all = 1;
956 get_tree = 1;
957 get_history = 1;
958 } else if (argv[arg][1] == 'v') {
959 get_verbosely = 1;
960 } else if (argv[arg][1] == 'w') {
961 write_ref = argv[arg + 1];
962 arg++;
963 } else if (!strcmp(argv[arg], "--recover")) {
964 get_recover = 1;
966 arg++;
968 if (argc < arg + 2) {
969 usage("git-http-fetch [-c] [-t] [-a] [-d] [-v] [--recover] [-w ref] commit-id url");
970 return 1;
972 commit_id = argv[arg];
973 url = argv[arg + 1];
975 http_init();
977 no_pragma_header = curl_slist_append(no_pragma_header, "Pragma:");
979 alt = xmalloc(sizeof(*alt));
980 alt->base = url;
981 alt->got_indices = 0;
982 alt->packs = NULL;
983 alt->next = NULL;
985 if (pull(commit_id))
986 rc = 1;
988 curl_slist_free_all(no_pragma_header);
990 http_cleanup();
992 return rc;