/*
 * File-scope constants, state and record layouts used by the HTTP object
 * fetcher below.
 * NOTE(review): every line of this listing carries its original line number
 * as a prefix and the numbering has gaps, so some declarations (for example
 * the opening line of the struct that owns `packs` and `next`, and the
 * enumerators of object_request_state) are not visible here.
 */
/* Size of the buffer used when re-reading a previous temp file in chunks. */
7 #define PREV_BUF_SIZE 4096
/* Capacity of the char arrays that receive a formatted "Range: bytes=N-" header. */
8 #define RANGE_HEADER_SIZE 30
/*
 * Alternates fetch status: compared against 0 (a fetch is in flight) and
 * 1 (already fetched) in fetch_alternates; -1 is the initial value.
 */
10 static int got_alternates = -1;
/* curl header list; main appends "Pragma:" to it and frees it before exit. */
12 static struct curl_slist *no_pragma_header;
/* Members of a struct whose opening line is not shown (presumably struct alt_base -- confirm). */
18 struct packed_git *packs;
19 struct alt_base *next;
/* Head of the alt_base list; main allocates the first element. */
22 static struct alt_base *alt = NULL;
/* Request life-cycle; the code below uses WAITING, ACTIVE, ABORTED and COMPLETE. */
24 enum object_request_state {
/*
 * The following members are accessed through `struct object_request *`
 * in the functions below; the struct's opening line is not shown.
 */
33 unsigned char sha1[20];
34 struct alt_base *repo;
36 char filename[PATH_MAX];
37 char tmpfile[PATH_MAX];
39 enum object_request_state state;
41 char errorstr[CURL_ERROR_SIZE];
43 unsigned char real_sha1[20];
48 struct active_request_slot *slot;
49 struct object_request *next;
/*
 * State handed to process_alternates_response.  That function also reads
 * base, url and http_specific members which are not visible in this listing.
 */
52 struct alternates_request {
55 struct buffer *buffer;
56 struct active_request_slot *slot;
/* Head of the singly linked queue of object requests (linked through `next`). */
60 static struct object_request *object_queue_head = NULL;
/*
 * Write callback installed with CURLOPT_WRITEFUNCTION for object downloads;
 * start_object_request also calls it directly to replay a previous temp file.
 * The incoming chunk of eltsize * nmemb bytes is written to obj_req->local,
 * then the same bytes are run through inflate() and the inflated output is
 * folded into the request's SHA-1 context.
 * NOTE(review): the last parameter (`data`), the declaration of `posn`, the
 * handling of write()'s return value and the return statement fall on lines
 * missing from this listing.
 */
62 static size_t fwrite_sha1_file(void *ptr, size_t eltsize, size_t nmemb,
65 unsigned char expn[4096];
66 size_t size = eltsize * nmemb;
68 struct object_request *obj_req = (struct object_request *)data;
/*
 * Keep writing until `posn` reaches `size`.
 * NOTE(review): `ptr + posn` is arithmetic on a void pointer, which is a
 * compiler extension rather than standard C.
 */
70 ssize_t retval = write(obj_req->local,
71 ptr + posn, size - posn);
75 } while (posn < size);
/* Hand the whole chunk to zlib as input. */
77 obj_req->stream.avail_in = size;
78 obj_req->stream.next_in = ptr;
/*
 * Inflate into the scratch buffer and hash whatever was produced; repeat
 * while input remains and inflate() keeps returning Z_OK.
 */
80 obj_req->stream.next_out = expn;
81 obj_req->stream.avail_out = sizeof(expn);
82 obj_req->zret = inflate(&obj_req->stream, Z_SYNC_FLUSH);
83 SHA1_Update(&obj_req->c, expn,
84 sizeof(expn) - obj_req->stream.avail_out);
85 } while (obj_req->stream.avail_in && obj_req->zret == Z_OK);
/*
 * Forward declarations: both functions are referenced (as a call and as a
 * slot callback) before their definitions further down.
 */
90 static void fetch_alternates(char *base);
92 static void process_object_response(void *callback_data);
/*
 * Begin (or resume) the HTTP download of one loose object.
 *
 * Visible steps: move any existing temp file aside to "<filename>.prev",
 * create the temp file exclusively, reset the zlib and SHA-1 state, build
 * the object URL under "<base>objects/", replay the bytes of the .prev file
 * through fwrite_sha1_file(), then configure a curl slot (with a Range
 * header when resuming) and start it.  When the temp file cannot be created
 * or the slot cannot be started the request state becomes ABORTED.
 *
 * NOTE(review): this listing omits a number of original lines (the
 * declarations of url/posn/prevlocal/prev_posn, several conditions and
 * closing braces), so the comments describe only what the visible lines show.
 */
94 static void start_object_request(struct object_request *obj_req)
96 char *hex = sha1_to_hex(obj_req->sha1);
97 char prevfile[PATH_MAX];
101 unsigned char prev_buf[PREV_BUF_SIZE];
102 ssize_t prev_read = 0;
104 char range[RANGE_HEADER_SIZE];
105 struct curl_slist *range_header = NULL;
106 struct active_request_slot *slot;
/*
 * Keep whatever an earlier attempt left in the temp file as
 * "<filename>.prev", then remove the temp name so the O_EXCL open below can
 * succeed.  The results of rename() and unlink() are not checked.
 */
108 snprintf(prevfile, sizeof(prevfile), "%s.prev", obj_req->filename);
110 rename(obj_req->tmpfile, prevfile);
111 unlink(obj_req->tmpfile);
/* A descriptor that is still set here is reported, then overwritten by the open() below. */
113 if (obj_req->local != -1)
114 error("fd leakage in start: %d", obj_req->local);
115 obj_req->local = open(obj_req->tmpfile,
116 O_WRONLY | O_CREAT | O_EXCL, 0666);
117 /* This could have failed due to the "lazy directory creation";
118 * try to mkdir the last path component.
// mkdir() is passed obj_req->tmpfile itself; presumably the lines not shown
// cut the string at `dir` first and restore it afterwards -- confirm.
120 if (obj_req->local < 0 && errno == ENOENT) {
121 char *dir = strrchr(obj_req->tmpfile, '/');
124 mkdir(obj_req->tmpfile, 0777);
127 obj_req->local = open(obj_req->tmpfile,
128 O_WRONLY | O_CREAT | O_EXCL, 0666);
// Still no descriptor: give up on this request.
131 if (obj_req->local < 0) {
132 obj_req->state = ABORTED;
133 error("Couldn't create temporary file %s for %s: %s\n",
134 obj_req->tmpfile, obj_req->filename, strerror(errno));
// Fresh inflate stream and SHA-1 context for this attempt.
138 memset(&obj_req->stream, 0, sizeof(obj_req->stream));
140 inflateInit(&obj_req->stream);
142 SHA1_Init(&obj_req->c);
// Both `url` and obj_req->url get strlen(base) + 50 bytes; the URL is the
// base followed by "objects/" and the hex object name split after its first
// two characters (the separator is written on a line not shown).
144 url = xmalloc(strlen(obj_req->repo->base) + 50);
145 obj_req->url = xmalloc(strlen(obj_req->repo->base) + 50);
146 strcpy(url, obj_req->repo->base);
147 posn = url + strlen(obj_req->repo->base);
148 strcpy(posn, "objects/");
150 memcpy(posn, hex, 2);
153 strcpy(posn, hex + 2);
154 strcpy(obj_req->url, url);
156 /* If a previous temp file is present, process what was already
// The .prev file is read PREV_BUF_SIZE bytes at a time and pushed through
// fwrite_sha1_file(); prev_posn accumulates the bytes that were accepted.
158 prevlocal = open(prevfile, O_RDONLY);
159 if (prevlocal != -1) {
161 prev_read = read(prevlocal, prev_buf, PREV_BUF_SIZE);
163 if (fwrite_sha1_file(prev_buf,
166 obj_req) == prev_read) {
167 prev_posn += prev_read;
172 } while (prev_read > 0);
177 /* Reset inflate/SHA1 if there was an error reading the previous temp
178 file; also rewind to the beginning of the local file. */
179 if (prev_read == -1) {
180 memset(&obj_req->stream, 0, sizeof(obj_req->stream));
181 inflateInit(&obj_req->stream);
182 SHA1_Init(&obj_req->c);
/*
 * NOTE(review): lseek() takes (fd, offset, whence); the offset and whence
 * arguments look swapped here.  The call only has the intended effect where
 * SEEK_SET happens to be 0.
 */
185 lseek(obj_req->local, SEEK_SET, 0);
186 ftruncate(obj_req->local, 0);
/* Claim a transfer slot and route its completion to process_object_response(). */
190 slot = get_active_slot();
191 slot->callback_func = process_object_response;
192 slot->callback_data = obj_req;
193 obj_req->slot = slot;
/* Body bytes go to fwrite_sha1_file() with obj_req as its data argument. */
195 curl_easy_setopt(slot->curl, CURLOPT_FILE, obj_req);
196 curl_easy_setopt(slot->curl, CURLOPT_WRITEFUNCTION, fwrite_sha1_file);
197 curl_easy_setopt(slot->curl, CURLOPT_ERRORBUFFER, obj_req->errorstr);
198 curl_easy_setopt(slot->curl, CURLOPT_URL, url);
199 curl_easy_setopt(slot->curl, CURLOPT_HTTPHEADER, no_pragma_header);
201 /* If we have successfully processed data from a previous fetch
202 attempt, only fetch the data we don't already have. */
206 "Resuming fetch of object %s at byte %ld\n",
/*
 * The Range header list replaces no_pragma_header as CURLOPT_HTTPHEADER.
 * NOTE(review): range[] holds RANGE_HEADER_SIZE (30) bytes; "Range: bytes="
 * plus a %ld value, "-" and the terminator needs up to 35 bytes for a 64-bit
 * long, so sprintf() is not bounded for very large offsets.  range_header is
 * not freed in the visible lines.
 */
208 sprintf(range, "Range: bytes=%ld-", prev_posn);
209 range_header = curl_slist_append(range_header, range);
210 curl_easy_setopt(slot->curl,
211 CURLOPT_HTTPHEADER, range_header);
214 /* Try to get the request started, abort the request on error */
215 obj_req->state = ACTIVE;
216 if (!start_active_slot(slot)) {
217 obj_req->state = ABORTED;
218 obj_req->slot = NULL;
219 close(obj_req->local); obj_req->local = -1;
/*
 * Finalise a completed download: make the temp file read-only and close it,
 * then decide whether it may be moved into place.  The temp file is unlinked
 * when the inflate stream did not reach Z_STREAM_END or when the computed
 * SHA-1 differs from the requested one; otherwise move_temp_to_file() is
 * called for it.
 * NOTE(review): the `st` declaration, the test that follows stat(), the
 * early returns and the place where obj_req->rename is assigned are on
 * lines not visible in this listing.
 */
225 static void finish_object_request(struct object_request *obj_req)
229 fchmod(obj_req->local, 0444);
230 close(obj_req->local); obj_req->local = -1;
/*
 * HTTP 416 only produces a warning.  On any other curl failure the temp
 * file is stat()ed and may be unlinked (the intervening condition is not
 * shown).
 */
232 if (obj_req->http_code == 416) {
233 fprintf(stderr, "Warning: requested range invalid; we may already have all the data.\n");
234 } else if (obj_req->curl_result != CURLE_OK) {
235 if (stat(obj_req->tmpfile, &st) == 0)
237 unlink(obj_req->tmpfile);
/* Close the zlib stream and obtain the digest of the inflated data. */
241 inflateEnd(&obj_req->stream);
242 SHA1_Final(obj_req->real_sha1, &obj_req->c);
243 if (obj_req->zret != Z_STREAM_END) {
244 unlink(obj_req->tmpfile);
247 if (memcmp(obj_req->sha1, obj_req->real_sha1, 20)) {
248 unlink(obj_req->tmpfile);
252 move_temp_to_file(obj_req->tmpfile, obj_req->filename);
/* Announce the object only when obj_req->rename is 0. */
254 if (obj_req->rename == 0)
255 pull_say("got %s\n", sha1_to_hex(obj_req->sha1));
/*
 * Slot completion callback for object requests (installed by
 * start_object_request).  Copies the curl result and HTTP status from the
 * slot into the request, detaches the slot and marks the request COMPLETE.
 * On a 404 or CURLE_FILE_COULDNT_READ_FILE result it loads the alternates
 * list for the primary repo and, if the request's repo has a successor,
 * closes the local file and starts the request again.
 * finish_object_request() is called at the end.
 * NOTE(review): the line that advances obj_req->repo and any early return
 * on the retry path are not visible in this listing.
 */
258 static void process_object_response(void *callback_data)
260 struct object_request *obj_req =
261 (struct object_request *)callback_data;
263 obj_req->curl_result = obj_req->slot->curl_result;
264 obj_req->http_code = obj_req->slot->http_code;
265 obj_req->slot = NULL;
266 obj_req->state = COMPLETE;
268 /* Use alternates if necessary */
269 if (obj_req->http_code == 404 ||
270 obj_req->curl_result == CURLE_FILE_COULDNT_READ_FILE) {
271 fetch_alternates(alt->base);
272 if (obj_req->repo->next != NULL) {
275 close(obj_req->local);
277 start_object_request(obj_req);
282 finish_object_request(obj_req);
/*
 * Unlink obj_req from the singly linked object queue.  A local descriptor
 * that is still set is reported as a leak first.
 * NOTE(review): what happens to obj_req after it is unlinked (for example
 * whether it is freed) is on lines not visible in this listing.
 */
285 static void release_object_request(struct object_request *obj_req)
287 struct object_request *entry = object_queue_head;
289 if (obj_req->local != -1)
290 error("fd leakage in release: %d", obj_req->local);
/* Head removal is a pointer swap; otherwise find the predecessor and bypass the node. */
291 if (obj_req == object_queue_head) {
292 object_queue_head = obj_req->next;
294 while (entry->next != NULL && entry->next != obj_req)
296 if (entry->next == obj_req)
297 entry->next = entry->next->next;
/*
 * Only compiled when USE_CURL_MULTI is defined.  Walks the object queue
 * while active_requests < max_requests: a WAITING request is released when
 * its object already exists locally, otherwise it is started and
 * curl_multi_perform() is run.  Afterwards the slot list is walked and the
 * curl handle of every slot that is not in use is cleaned up.
 */
304 #ifdef USE_CURL_MULTI
305 void fill_active_slots(void)
307 struct object_request *obj_req = object_queue_head;
308 struct active_request_slot *slot = active_queue_head;
/*
 * NOTE(review): obj_req->next is read after release_object_request(obj_req)
 * may have run; if release frees the node (not visible here) that read is a
 * use-after-free -- confirm.
 */
311 while (active_requests < max_requests && obj_req != NULL) {
312 if (obj_req->state == WAITING) {
313 if (has_sha1_file(obj_req->sha1))
314 release_object_request(obj_req);
316 start_object_request(obj_req);
317 curl_multi_perform(curlm, &num_transfers);
319 obj_req = obj_req->next;
322 while (slot != NULL) {
323 if (!slot->in_use && slot->curl != NULL) {
324 curl_easy_cleanup(slot->curl);
/*
 * Queue a new object request for `sha1`: allocate it, record the hash, the
 * final path and the temporary path ("<filename>.temp"), mark it WAITING and
 * append it to the object queue (it becomes the head when the queue is
 * empty, otherwise the queue is walked to its tail).
 * NOTE(review): initialisation of the remaining fields, the tail link
 * assignment and the body of the USE_CURL_MULTI section are on lines not
 * visible in this listing.
 */
332 void prefetch(unsigned char *sha1)
334 struct object_request *newreq;
335 struct object_request *tail;
336 char *filename = sha1_file_name(sha1);
338 newreq = xmalloc(sizeof(*newreq));
339 memcpy(newreq->sha1, sha1, 20);
343 newreq->state = WAITING;
344 snprintf(newreq->filename, sizeof(newreq->filename), "%s", filename);
345 snprintf(newreq->tmpfile, sizeof(newreq->tmpfile),
346 "%s.temp", filename);
349 if (object_queue_head == NULL) {
350 object_queue_head = newreq;
352 tail = object_queue_head;
353 while (tail->next != NULL) {
359 #ifdef USE_CURL_MULTI
/*
 * Download the index of pack `sha1` from `repo` into "<index name>.temp"
 * and move it into place with move_temp_to_file(), whose result is returned.
 * Nothing is downloaded when has_pack_index() reports the index as present
 * (the value returned on that path is not visible).  Failures to open the
 * temp file, to start the request or to complete the transfer are reported
 * through error().
 */
365 static int fetch_index(struct alt_base *repo, unsigned char *sha1)
367 char *hex = sha1_to_hex(sha1);
370 char tmpfile[PATH_MAX];
372 char range[RANGE_HEADER_SIZE];
373 struct curl_slist *range_header = NULL;
376 struct active_request_slot *slot;
377 struct slot_results results;
379 if (has_pack_index(sha1))
383 fprintf(stderr, "Getting index for pack %s\n", hex);
/* 64 extra bytes cover "/objects/pack/pack-", the 40 hex digits, ".idx" and the terminator. */
385 url = xmalloc(strlen(repo->base) + 64);
386 sprintf(url, "%s/objects/pack/pack-%s.idx", repo->base, hex);
/* Append mode keeps the bytes of an earlier, interrupted download. */
388 filename = sha1_pack_index_name(sha1);
389 snprintf(tmpfile, sizeof(tmpfile), "%s.temp", filename);
390 indexfile = fopen(tmpfile, "a");
392 return error("Unable to open local file %s for pack index",
/* Results are collected in the local `results`; the body is written with plain fwrite(). */
395 slot = get_active_slot();
396 slot->results = &results;
397 curl_easy_setopt(slot->curl, CURLOPT_FILE, indexfile);
398 curl_easy_setopt(slot->curl, CURLOPT_WRITEFUNCTION, fwrite);
399 curl_easy_setopt(slot->curl, CURLOPT_URL, url);
400 curl_easy_setopt(slot->curl, CURLOPT_HTTPHEADER, no_pragma_header);
401 slot->local = indexfile;
403 /* If there is data present from a previous transfer attempt,
404 resume where it left off */
405 prev_posn = ftell(indexfile);
409 "Resuming fetch of index for pack %s at byte %ld\n",
/*
 * NOTE(review): range[] is RANGE_HEADER_SIZE (30) bytes and sprintf() is
 * unbounded; range_header is not freed in the visible lines.
 */
411 sprintf(range, "Range: bytes=%ld-", prev_posn);
412 range_header = curl_slist_append(range_header, range);
413 curl_easy_setopt(slot->curl, CURLOPT_HTTPHEADER, range_header);
416 if (start_active_slot(slot)) {
417 run_active_slot(slot);
418 if (results.curl_result != CURLE_OK) {
420 return error("Unable to get pack index %s\n%s", url,
425 return error("Unable to start request");
430 return move_temp_to_file(tmpfile, filename);
/*
 * Make the pack identified by `sha1` known for `repo`.  Returns 0 without
 * doing anything when the pack file already exists locally; otherwise the
 * index is fetched, parsed, and the resulting packed_git is pushed onto the
 * front of repo->packs.
 * NOTE(review): the result of parse_pack_index() is dereferenced on the very
 * next line; if that function can return NULL this needs a check.
 */
433 static int setup_index(struct alt_base *repo, unsigned char *sha1)
435 struct packed_git *new_pack;
436 if (has_pack_file(sha1))
437 return 0; // don't list this as something we can get
439 if (fetch_index(repo, sha1))
442 new_pack = parse_pack_index(sha1);
443 new_pack->next = repo->packs;
444 repo->packs = new_pack;
/*
 * Slot completion callback for the alternates fetch.
 *
 * If the http-specific list could not be fetched (curl error or an empty
 * buffer) the same slot is pointed at "<base>/objects/info/alternates" and
 * restarted.  Otherwise the buffered response is NUL-terminated and scanned
 * line by line; each usable entry is combined with (part of) `base` into a
 * new base URL and appended to the alt list as an alt_base with
 * got_indices = 0 and no packs.
 *
 * Entry forms handled in the visible code: a path starting with '/', which
 * is joined to the server part of `base`; a path starting with "../", which
 * strips trailing components from `base`; and, for the http-specific list
 * only, an entry that has a ':' before its first '/'.
 *
 * NOTE(review): declarations of i, posn, data, okay, serverlen and target,
 * plus several branches, are on lines not visible in this listing.
 */
448 static void process_alternates_response(void *callback_data)
450 struct alternates_request *alt_req =
451 (struct alternates_request *)callback_data;
452 struct active_request_slot *slot = alt_req->slot;
453 struct alt_base *tail = alt;
454 char *base = alt_req->base;
455 static const char null_byte = '\0';
459 if (alt_req->http_specific) {
460 if (slot->curl_result != CURLE_OK ||
461 !alt_req->buffer->posn) {
463 /* Try reusing the slot to get non-http alternates */
464 alt_req->http_specific = 0;
465 sprintf(alt_req->url, "%s/objects/info/alternates",
467 curl_easy_setopt(slot->curl, CURLOPT_URL,
471 if (start_active_slot(slot)) {
479 } else if (slot->curl_result != CURLE_OK) {
480 if (slot->http_code != 404 &&
481 slot->curl_result != CURLE_FILE_COULDNT_READ_FILE) {
/* Terminate the buffer for the str* calls below without counting the NUL in posn. */
487 fwrite_buffer(&null_byte, 1, 1, alt_req->buffer);
488 alt_req->buffer->posn--;
489 data = alt_req->buffer->buffer;
491 while (i < alt_req->buffer->posn) {
493 while (posn < alt_req->buffer->posn && data[posn] != '\n')
495 if (data[posn] == '\n') {
498 struct alt_base *newalt;
/*
 * NOTE(review): strchr(base + 8, '/') assumes `base` is longer than 8
 * characters and has a '/' after that point; a NULL result would make the
 * pointer subtraction invalid.
 */
500 if (data[i] == '/') {
501 serverlen = strchr(base + 8, '/') - base;
503 } else if (!memcmp(data + i, "../", 3)) {
505 serverlen = strlen(base);
506 while (i + 2 < posn &&
507 !memcmp(data + i, "../", 3)) {
510 } while (serverlen &&
511 base[serverlen - 1] != '/');
514 // If the server got removed, give up.
/* NOTE(review): strchr(base, ':') is likewise used without a NULL check. */
515 okay = strchr(base, ':') - base + 3 <
517 } else if (alt_req->http_specific) {
518 char *colon = strchr(data + i, ':');
519 char *slash = strchr(data + i, '/');
520 if (colon && slash && colon < data + posn &&
521 slash < data + posn && colon < slash) {
525 // skip 'objects' at end
/*
 * target = first `serverlen` bytes of base followed by the entry text; the
 * terminator is placed at offset serverlen + posn - i - 7.
 */
527 target = xmalloc(serverlen + posn - i - 6);
528 strncpy(target, base, serverlen);
529 strncpy(target + serverlen, data + i,
531 target[serverlen + posn - i - 7] = '\0';
534 "Also look at %s\n", target);
535 newalt = xmalloc(sizeof(*newalt));
537 newalt->base = target;
538 newalt->got_indices = 0;
539 newalt->packs = NULL;
540 while (tail->next != NULL)
/*
 * Fetch the list of alternate object stores advertised by `base`.
 * Does nothing when got_alternates is already 1; under USE_CURL_MULTI there
 * is first a wait loop that runs while got_alternates == 0.  The request
 * targets "<base>/objects/info/http-alternates" and its completion is
 * handled by process_alternates_response().
 * NOTE(review): `buffer` and `alt_req` are locals whose addresses are handed
 * to the slot; this relies on run_active_slot() finishing the transfer
 * before the function returns -- confirm.  Setup of the remaining buffer
 * and alt_req fields is on lines not visible in this listing.
 */
551 static void fetch_alternates(char *base)
553 struct buffer buffer;
556 struct active_request_slot *slot;
557 struct alternates_request alt_req;
559 /* If another request has already started fetching alternates,
560 wait for them to arrive and return to processing this request's
562 #ifdef USE_CURL_MULTI
563 while (got_alternates == 0) {
568 /* Nothing to do if they've already been fetched */
569 if (got_alternates == 1)
572 /* Start the fetch */
575 data = xmalloc(4096);
578 buffer.buffer = data;
581 fprintf(stderr, "Getting alternates list for %s\n", base);
/* 31 extra bytes hold "/objects/info/http-alternates" and the terminator. */
583 url = xmalloc(strlen(base) + 31);
584 sprintf(url, "%s/objects/info/http-alternates", base);
586 /* Use a callback to process the result, since another request
587 may fail and need to have alternates loaded before continuing */
588 slot = get_active_slot();
589 slot->callback_func = process_alternates_response;
590 slot->callback_data = &alt_req;
592 curl_easy_setopt(slot->curl, CURLOPT_FILE, &buffer);
593 curl_easy_setopt(slot->curl, CURLOPT_WRITEFUNCTION, fwrite_buffer);
594 curl_easy_setopt(slot->curl, CURLOPT_URL, url);
/* Start with the http-specific list; the callback handles the other list. */
598 alt_req.buffer = &buffer;
599 alt_req.http_specific = 1;
602 if (start_active_slot(slot))
603 run_active_slot(slot);
/*
 * Download "<base>/objects/info/packs" for `repo` and call setup_index() for
 * every entry found in it.  repo->got_indices is checked first and set to 1
 * at the end, so the list is fetched once per repo.  A 404 or
 * CURLE_FILE_COULDNT_READ_FILE result also sets got_indices to 1; any other
 * transfer failure, or a failure to start the request, clears it and
 * returns through error().
 */
611 static int fetch_indices(struct alt_base *repo)
613 unsigned char sha1[20];
615 struct buffer buffer;
619 struct active_request_slot *slot;
620 struct slot_results results;
622 if (repo->got_indices)
625 data = xmalloc(4096);
628 buffer.buffer = data;
631 fprintf(stderr, "Getting pack list for %s\n", repo->base);
/* 21 extra bytes hold "/objects/info/packs" and the terminator. */
633 url = xmalloc(strlen(repo->base) + 21);
634 sprintf(url, "%s/objects/info/packs", repo->base);
636 slot = get_active_slot();
637 slot->results = &results;
638 curl_easy_setopt(slot->curl, CURLOPT_FILE, &buffer);
639 curl_easy_setopt(slot->curl, CURLOPT_WRITEFUNCTION, fwrite_buffer);
640 curl_easy_setopt(slot->curl, CURLOPT_URL, url);
641 curl_easy_setopt(slot->curl, CURLOPT_HTTPHEADER, NULL);
642 if (start_active_slot(slot)) {
643 run_active_slot(slot);
644 if (results.curl_result != CURLE_OK) {
645 if (results.http_code == 404 ||
646 results.curl_result == CURLE_FILE_COULDNT_READ_FILE) {
647 repo->got_indices = 1;
651 repo->got_indices = 0;
653 return error("%s", curl_errorstr);
657 repo->got_indices = 0;
659 return error("Unable to start request");
/*
 * Scan the response.  An entry is accepted when 52 bytes are available at
 * `i`: " pack-", 40 characters of hex name, then ".pack" and a newline.
 * NOTE(review): the return value of setup_index() is ignored.
 */
662 data = buffer.buffer;
663 while (i < buffer.posn) {
667 if (i + 52 <= buffer.posn &&
668 !strncmp(data + i, " pack-", 6) &&
669 !strncmp(data + i + 46, ".pack\n", 6)) {
670 get_sha1_hex(data + i + 6, sha1);
671 setup_index(repo, sha1);
676 while (i < buffer.posn && data[i] != '\n')
683 repo->got_indices = 1;
/*
 * Fetch the pack from `repo` that contains object `sha1`.  After
 * fetch_indices() has loaded the pack list, the pack is looked up with
 * find_sha1_pack(), downloaded to "<pack name>.temp" (with a Range header
 * built from the temp file's current position), moved into place, located
 * in the repo's pack list, verified and installed.
 * NOTE(review): the NULL test on `target`, the condition guarding the Range
 * header, the initialisation of `lst`, the list-unlink statement and the
 * return values are on lines not visible in this listing.
 */
687 static int fetch_pack(struct alt_base *repo, unsigned char *sha1)
690 struct packed_git *target;
691 struct packed_git **lst;
694 char tmpfile[PATH_MAX];
697 char range[RANGE_HEADER_SIZE];
698 struct curl_slist *range_header = NULL;
700 struct active_request_slot *slot;
701 struct slot_results results;
703 if (fetch_indices(repo))
705 target = find_sha1_pack(sha1, repo->packs);
710 fprintf(stderr, "Getting pack %s\n",
711 sha1_to_hex(target->sha1));
712 fprintf(stderr, " which contains %s\n",
/* 65 extra bytes cover "/objects/pack/pack-", the 40 hex digits, ".pack" and the terminator. */
716 url = xmalloc(strlen(repo->base) + 65);
717 sprintf(url, "%s/objects/pack/pack-%s.pack",
718 repo->base, sha1_to_hex(target->sha1));
/* Append mode keeps the bytes of an earlier, interrupted download. */
720 filename = sha1_pack_name(target->sha1);
721 snprintf(tmpfile, sizeof(tmpfile), "%s.temp", filename);
722 packfile = fopen(tmpfile, "a");
724 return error("Unable to open local file %s for pack",
727 slot = get_active_slot();
728 slot->results = &results;
729 curl_easy_setopt(slot->curl, CURLOPT_FILE, packfile);
730 curl_easy_setopt(slot->curl, CURLOPT_WRITEFUNCTION, fwrite);
731 curl_easy_setopt(slot->curl, CURLOPT_URL, url);
732 curl_easy_setopt(slot->curl, CURLOPT_HTTPHEADER, no_pragma_header);
733 slot->local = packfile;
735 /* If there is data present from a previous transfer attempt,
736 resume where it left off */
737 prev_posn = ftell(packfile);
741 "Resuming fetch of pack %s at byte %ld\n",
742 sha1_to_hex(target->sha1), prev_posn);
/*
 * NOTE(review): range[] is RANGE_HEADER_SIZE (30) bytes and sprintf() is
 * unbounded; pack files can be large, so the offset can have many digits.
 * range_header is not freed in the visible lines.
 */
743 sprintf(range, "Range: bytes=%ld-", prev_posn);
744 range_header = curl_slist_append(range_header, range);
745 curl_easy_setopt(slot->curl, CURLOPT_HTTPHEADER, range_header);
748 if (start_active_slot(slot)) {
749 run_active_slot(slot);
750 if (results.curl_result != CURLE_OK) {
752 return error("Unable to get pack file %s\n%s", url,
757 return error("Unable to start request");
762 ret = move_temp_to_file(tmpfile, filename);
/* Walk the link pointers until `lst` addresses the link that points at `target`. */
767 while (*lst != target)
768 lst = &((*lst)->next);
771 if (verify_pack(target, 0))
773 install_packed_git(target);
/*
 * Drive the queued request for `sha1` to completion and translate its
 * outcome into a return code.  The request is looked up in the object queue
 * by hash; if the object already exists locally the request is released.
 * Otherwise the request is started if still WAITING, the slot is run while
 * the request is ACTIVE, a still-open local descriptor is closed, and the
 * final state is mapped to `ret`:
 *   - ABORTED, corrupt stream, hash mismatch, rename failure -> error()
 *   - 404 / CURLE_FILE_COULDNT_READ_FILE -> -1 without a message
 *   - other curl failures (except HTTP 416) -> error() with details
 * The request is released before returning.
 * NOTE(review): the declaration of `ret`, the NULL test after the lookup
 * and the return statements are on lines not visible in this listing.
 */
778 static int fetch_object(struct alt_base *repo, unsigned char *sha1)
780 char *hex = sha1_to_hex(sha1);
782 struct object_request *obj_req = object_queue_head;
784 while (obj_req != NULL && memcmp(obj_req->sha1, sha1, 20))
785 obj_req = obj_req->next;
787 return error("Couldn't find request for %s in the queue", hex);
789 if (has_sha1_file(obj_req->sha1)) {
790 release_object_request(obj_req);
794 #ifdef USE_CURL_MULTI
795 while (obj_req->state == WAITING) {
799 start_object_request(obj_req);
802 while (obj_req->state == ACTIVE) {
803 run_active_slot(obj_req->slot);
805 if (obj_req->local != -1) {
806 close(obj_req->local); obj_req->local = -1;
809 if (obj_req->state == ABORTED) {
810 ret = error("Request for %s aborted", hex);
811 } else if (obj_req->curl_result != CURLE_OK &&
812 obj_req->http_code != 416) {
813 if (obj_req->http_code == 404 ||
814 obj_req->curl_result == CURLE_FILE_COULDNT_READ_FILE)
815 ret = -1; /* Be silent, it is probably in a pack. */
817 ret = error("%s (curl_result = %d, http_code = %ld, sha1 = %s)",
818 obj_req->errorstr, obj_req->curl_result,
819 obj_req->http_code, hex);
820 } else if (obj_req->zret != Z_STREAM_END) {
821 ret = error("File %s (%s) corrupt\n", hex, obj_req->url);
822 } else if (memcmp(obj_req->sha1, obj_req->real_sha1, 20)) {
823 ret = error("File %s has bad hash\n", hex);
/*
 * NOTE(review): this branch is taken when obj_req->rename is negative, and
 * that same value is passed to strerror(), which expects a positive errno
 * value -- confirm whether it should be negated.
 */
824 } else if (obj_req->rename < 0) {
825 ret = error("unable to write sha1 filename %s: %s",
827 strerror(obj_req->rename));
830 release_object_request(obj_req);
/*
 * Obtain object `sha1`, starting with the primary repo (`alt`): first as a
 * loose object via fetch_object(), then from a pack via fetch_pack().  After
 * a miss the alternates list is (re)loaded and the next alt_base is tried.
 * When nothing succeeds an error naming the object is returned.
 * NOTE(review): the loop header and the success returns are on lines not
 * visible in this listing.
 */
834 int fetch(unsigned char *sha1)
836 struct alt_base *altbase = alt;
838 if (!fetch_object(altbase, sha1))
841 if (!fetch_pack(altbase, sha1))
843 fetch_alternates(alt->base);
844 altbase = altbase->next;
846 return error("Unable to find %s under %s\n", sha1_to_hex(sha1),
/*
 * Classify a character for URL quoting.  '/', '-', '.', ASCII letters and
 * digits share one group of case labels; the values returned are on lines
 * not visible in this listing (presumably "no quoting" for this group).
 * The 'A'...'Z' form is the GNU case-range extension, not standard C.
 */
850 static inline int needs_quote(int ch)
853 case '/': case '-': case '.':
854 case 'A'...'Z': case 'a'...'z': case '0'...'9':
/*
 * Map a value to its upper-case hexadecimal digit character: '0'..'9' for
 * values below 10, 'A' onwards otherwise.  The caller below passes values
 * masked with 0xF.
 */
861 static inline int hex(int v)
863 if (v < 10) return '0' + v;
864 else return 'A' + v - 10;
/*
 * Build "<base>refs/<ref>" with quoting applied to `ref`: a character for
 * which needs_quote() is true is written as an escape ending in two
 * upper-case hex digits (high nibble first).  A first pass computes the
 * length (one byte per character plus two for each quoted one, plus
 * "refs/" and the terminator); a second pass fills the buffer.
 * NOTE(review): the allocation of `qref`, the write of the escape's leading
 * character, the copy of unquoted characters and the return statement are
 * on lines not visible in this listing.
 */
867 static char *quote_ref_url(const char *base, const char *ref)
871 int len, baselen, ch;
873 baselen = strlen(base);
874 len = baselen + 6; /* "refs/" + NUL */
875 for (cp = ref; (ch = *cp) != 0; cp++, len++)
877 len += 2; /* extra two hex plus replacement % */
879 memcpy(qref, base, baselen);
880 memcpy(qref + baselen, "refs/", 5);
881 for (cp = ref, dp = qref + baselen + 5; (ch = *cp) != 0; cp++) {
882 if (needs_quote(ch)) {
884 *dp++ = hex((ch >> 4) & 0xF);
885 *dp++ = hex(ch & 0xF);
/*
 * Read ref `ref` from the primary repo (alt->base) over HTTP and convert
 * the hex text in `hex` into `sha1` with get_sha1_hex().  Transfer failures
 * and a failure to start the request are returned through error().
 * NOTE(review): the declaration and filling of `hex`, the buffer setup and
 * the final return are on lines not visible in this listing; `url` from
 * quote_ref_url() is not freed in the visible lines.
 */
895 int fetch_ref(char *ref, unsigned char *sha1)
899 struct buffer buffer;
900 char *base = alt->base;
901 struct active_request_slot *slot;
902 struct slot_results results;
908 url = quote_ref_url(base, ref);
909 slot = get_active_slot();
910 slot->results = &results;
911 curl_easy_setopt(slot->curl, CURLOPT_FILE, &buffer);
912 curl_easy_setopt(slot->curl, CURLOPT_WRITEFUNCTION, fwrite_buffer);
913 curl_easy_setopt(slot->curl, CURLOPT_HTTPHEADER, NULL);
914 curl_easy_setopt(slot->curl, CURLOPT_URL, url);
915 if (start_active_slot(slot)) {
916 run_active_slot(slot);
917 if (results.curl_result != CURLE_OK)
918 return error("Couldn't get %s for %s\n%s",
919 url, ref, curl_errorstr);
921 return error("Unable to start request");
925 get_sha1_hex(hex, sha1);
/*
 * Entry point of git-http-fetch.  Parses leading '-' options, requires a
 * commit id and a URL after them (printing the usage string otherwise),
 * builds the "Pragma:" header list, allocates the primary alt_base and
 * frees the header list before finishing.
 * NOTE(review): single-letter options are matched on the second character
 * only, so any argument that begins with "-t", "-c", "-a", "-v" or "-w"
 * selects that option.  For -w the value is argv[arg + 1], which is NULL
 * when -w is the last argument.  The effect of each option, the fetch
 * itself and the return value are on lines not visible in this listing.
 */
929 int main(int argc, char **argv)
936 setup_git_directory();
938 while (arg < argc && argv[arg][0] == '-') {
939 if (argv[arg][1] == 't') {
941 } else if (argv[arg][1] == 'c') {
943 } else if (argv[arg][1] == 'a') {
947 } else if (argv[arg][1] == 'v') {
949 } else if (argv[arg][1] == 'w') {
950 write_ref = argv[arg + 1];
952 } else if (!strcmp(argv[arg], "--recover")) {
957 if (argc < arg + 2) {
958 usage("git-http-fetch [-c] [-t] [-a] [-d] [-v] [--recover] [-w ref] commit-id url");
961 commit_id = argv[arg];
966 no_pragma_header = curl_slist_append(no_pragma_header, "Pragma:");
968 alt = xmalloc(sizeof(*alt));
970 alt->got_indices = 0;
977 curl_slist_free_all(no_pragma_header);