Document the underlying protocol used by shallow repositories and --depth commands.
[git] / http.c
1 #include "http.h"
2 #include "pack.h"
3 #include "sideband.h"
4 #include "run-command.h"
5 #include "url.h"
6
7 int data_received;
8 int active_requests;
9 int http_is_verbose;
10 size_t http_post_buffer = 16 * LARGE_PACKET_MAX;
11
12 #if LIBCURL_VERSION_NUM >= 0x070a06
13 #define LIBCURL_CAN_HANDLE_AUTH_ANY
14 #endif
15
16 static int min_curl_sessions = 1;
17 static int curl_session_count;
18 #ifdef USE_CURL_MULTI
19 static int max_requests = -1;
20 static CURLM *curlm;
21 #endif
22 #ifndef NO_CURL_EASY_DUPHANDLE
23 static CURL *curl_default;
24 #endif
25
26 #define PREV_BUF_SIZE 4096
27 #define RANGE_HEADER_SIZE 30
28
29 char curl_errorstr[CURL_ERROR_SIZE];
30
31 static int curl_ssl_verify = -1;
32 static const char *ssl_cert;
33 #if LIBCURL_VERSION_NUM >= 0x070903
34 static const char *ssl_key;
35 #endif
36 #if LIBCURL_VERSION_NUM >= 0x070908
37 static const char *ssl_capath;
38 #endif
39 static const char *ssl_cainfo;
40 static long curl_low_speed_limit = -1;
41 static long curl_low_speed_time = -1;
42 static int curl_ftp_no_epsv;
43 static const char *curl_http_proxy;
44 static char *user_name, *user_pass;
45 static const char *user_agent;
46
47 #if LIBCURL_VERSION_NUM >= 0x071700
48 /* Use CURLOPT_KEYPASSWD as is */
49 #elif LIBCURL_VERSION_NUM >= 0x070903
50 #define CURLOPT_KEYPASSWD CURLOPT_SSLKEYPASSWD
51 #else
52 #define CURLOPT_KEYPASSWD CURLOPT_SSLCERTPASSWD
53 #endif
54
55 static char *ssl_cert_password;
56 static int ssl_cert_password_required;
57
58 static struct curl_slist *pragma_header;
59 static struct curl_slist *no_pragma_header;
60
61 static struct active_request_slot *active_queue_head;
62
63 size_t fread_buffer(void *ptr, size_t eltsize, size_t nmemb, void *buffer_)
64 {
65         size_t size = eltsize * nmemb;
66         struct buffer *buffer = buffer_;
67
68         if (size > buffer->buf.len - buffer->posn)
69                 size = buffer->buf.len - buffer->posn;
70         memcpy(ptr, buffer->buf.buf + buffer->posn, size);
71         buffer->posn += size;
72
73         return size;
74 }
75
76 #ifndef NO_CURL_IOCTL
77 curlioerr ioctl_buffer(CURL *handle, int cmd, void *clientp)
78 {
79         struct buffer *buffer = clientp;
80
81         switch (cmd) {
82         case CURLIOCMD_NOP:
83                 return CURLIOE_OK;
84
85         case CURLIOCMD_RESTARTREAD:
86                 buffer->posn = 0;
87                 return CURLIOE_OK;
88
89         default:
90                 return CURLIOE_UNKNOWNCMD;
91         }
92 }
93 #endif
94
95 size_t fwrite_buffer(const void *ptr, size_t eltsize, size_t nmemb, void *buffer_)
96 {
97         size_t size = eltsize * nmemb;
98         struct strbuf *buffer = buffer_;
99
100         strbuf_add(buffer, ptr, size);
101         data_received++;
102         return size;
103 }
104
105 size_t fwrite_null(const void *ptr, size_t eltsize, size_t nmemb, void *strbuf)
106 {
107         data_received++;
108         return eltsize * nmemb;
109 }
110
111 #ifdef USE_CURL_MULTI
112 static void process_curl_messages(void)
113 {
114         int num_messages;
115         struct active_request_slot *slot;
116         CURLMsg *curl_message = curl_multi_info_read(curlm, &num_messages);
117
118         while (curl_message != NULL) {
119                 if (curl_message->msg == CURLMSG_DONE) {
120                         int curl_result = curl_message->data.result;
121                         slot = active_queue_head;
122                         while (slot != NULL &&
123                                slot->curl != curl_message->easy_handle)
124                                 slot = slot->next;
125                         if (slot != NULL) {
126                                 curl_multi_remove_handle(curlm, slot->curl);
127                                 slot->curl_result = curl_result;
128                                 finish_active_slot(slot);
129                         } else {
130                                 fprintf(stderr, "Received DONE message for unknown request!\n");
131                         }
132                 } else {
133                         fprintf(stderr, "Unknown CURL message received: %d\n",
134                                 (int)curl_message->msg);
135                 }
136                 curl_message = curl_multi_info_read(curlm, &num_messages);
137         }
138 }
139 #endif
140
141 static int http_options(const char *var, const char *value, void *cb)
142 {
143         if (!strcmp("http.sslverify", var)) {
144                 curl_ssl_verify = git_config_bool(var, value);
145                 return 0;
146         }
147         if (!strcmp("http.sslcert", var))
148                 return git_config_string(&ssl_cert, var, value);
149 #if LIBCURL_VERSION_NUM >= 0x070903
150         if (!strcmp("http.sslkey", var))
151                 return git_config_string(&ssl_key, var, value);
152 #endif
153 #if LIBCURL_VERSION_NUM >= 0x070908
154         if (!strcmp("http.sslcapath", var))
155                 return git_config_string(&ssl_capath, var, value);
156 #endif
157         if (!strcmp("http.sslcainfo", var))
158                 return git_config_string(&ssl_cainfo, var, value);
159         if (!strcmp("http.sslcertpasswordprotected", var)) {
160                 if (git_config_bool(var, value))
161                         ssl_cert_password_required = 1;
162                 return 0;
163         }
164         if (!strcmp("http.minsessions", var)) {
165                 min_curl_sessions = git_config_int(var, value);
166 #ifndef USE_CURL_MULTI
167                 if (min_curl_sessions > 1)
168                         min_curl_sessions = 1;
169 #endif
170                 return 0;
171         }
172 #ifdef USE_CURL_MULTI
173         if (!strcmp("http.maxrequests", var)) {
174                 max_requests = git_config_int(var, value);
175                 return 0;
176         }
177 #endif
178         if (!strcmp("http.lowspeedlimit", var)) {
179                 curl_low_speed_limit = (long)git_config_int(var, value);
180                 return 0;
181         }
182         if (!strcmp("http.lowspeedtime", var)) {
183                 curl_low_speed_time = (long)git_config_int(var, value);
184                 return 0;
185         }
186
187         if (!strcmp("http.noepsv", var)) {
188                 curl_ftp_no_epsv = git_config_bool(var, value);
189                 return 0;
190         }
191         if (!strcmp("http.proxy", var))
192                 return git_config_string(&curl_http_proxy, var, value);
193
194         if (!strcmp("http.postbuffer", var)) {
195                 http_post_buffer = git_config_int(var, value);
196                 if (http_post_buffer < LARGE_PACKET_MAX)
197                         http_post_buffer = LARGE_PACKET_MAX;
198                 return 0;
199         }
200
201         if (!strcmp("http.useragent", var))
202                 return git_config_string(&user_agent, var, value);
203
204         /* Fall back on the default ones */
205         return git_default_config(var, value, cb);
206 }
207
208 static void init_curl_http_auth(CURL *result)
209 {
210         if (user_name) {
211                 struct strbuf up = STRBUF_INIT;
212                 if (!user_pass)
213                         user_pass = xstrdup(git_getpass("Password: "));
214                 strbuf_addf(&up, "%s:%s", user_name, user_pass);
215                 curl_easy_setopt(result, CURLOPT_USERPWD,
216                                  strbuf_detach(&up, NULL));
217         }
218 }
219
220 static int has_cert_password(void)
221 {
222         if (ssl_cert_password != NULL)
223                 return 1;
224         if (ssl_cert == NULL || ssl_cert_password_required != 1)
225                 return 0;
226         /* Only prompt the user once. */
227         ssl_cert_password_required = -1;
228         ssl_cert_password = git_getpass("Certificate Password: ");
229         if (ssl_cert_password != NULL) {
230                 ssl_cert_password = xstrdup(ssl_cert_password);
231                 return 1;
232         } else
233                 return 0;
234 }
235
236 static CURL *get_curl_handle(void)
237 {
238         CURL *result = curl_easy_init();
239
240         if (!curl_ssl_verify) {
241                 curl_easy_setopt(result, CURLOPT_SSL_VERIFYPEER, 0);
242                 curl_easy_setopt(result, CURLOPT_SSL_VERIFYHOST, 0);
243         } else {
244                 /* Verify authenticity of the peer's certificate */
245                 curl_easy_setopt(result, CURLOPT_SSL_VERIFYPEER, 1);
246                 /* The name in the cert must match whom we tried to connect */
247                 curl_easy_setopt(result, CURLOPT_SSL_VERIFYHOST, 2);
248         }
249
250 #if LIBCURL_VERSION_NUM >= 0x070907
251         curl_easy_setopt(result, CURLOPT_NETRC, CURL_NETRC_OPTIONAL);
252 #endif
253 #ifdef LIBCURL_CAN_HANDLE_AUTH_ANY
254         curl_easy_setopt(result, CURLOPT_HTTPAUTH, CURLAUTH_ANY);
255 #endif
256
257         init_curl_http_auth(result);
258
259         if (ssl_cert != NULL)
260                 curl_easy_setopt(result, CURLOPT_SSLCERT, ssl_cert);
261         if (has_cert_password())
262                 curl_easy_setopt(result, CURLOPT_KEYPASSWD, ssl_cert_password);
263 #if LIBCURL_VERSION_NUM >= 0x070903
264         if (ssl_key != NULL)
265                 curl_easy_setopt(result, CURLOPT_SSLKEY, ssl_key);
266 #endif
267 #if LIBCURL_VERSION_NUM >= 0x070908
268         if (ssl_capath != NULL)
269                 curl_easy_setopt(result, CURLOPT_CAPATH, ssl_capath);
270 #endif
271         if (ssl_cainfo != NULL)
272                 curl_easy_setopt(result, CURLOPT_CAINFO, ssl_cainfo);
273         curl_easy_setopt(result, CURLOPT_FAILONERROR, 1);
274
275         if (curl_low_speed_limit > 0 && curl_low_speed_time > 0) {
276                 curl_easy_setopt(result, CURLOPT_LOW_SPEED_LIMIT,
277                                  curl_low_speed_limit);
278                 curl_easy_setopt(result, CURLOPT_LOW_SPEED_TIME,
279                                  curl_low_speed_time);
280         }
281
282         curl_easy_setopt(result, CURLOPT_FOLLOWLOCATION, 1);
283 #if LIBCURL_VERSION_NUM >= 0x071301
284         curl_easy_setopt(result, CURLOPT_POSTREDIR, CURL_REDIR_POST_ALL);
285 #elif LIBCURL_VERSION_NUM >= 0x071101
286         curl_easy_setopt(result, CURLOPT_POST301, 1);
287 #endif
288
289         if (getenv("GIT_CURL_VERBOSE"))
290                 curl_easy_setopt(result, CURLOPT_VERBOSE, 1);
291
292         curl_easy_setopt(result, CURLOPT_USERAGENT,
293                 user_agent ? user_agent : GIT_HTTP_USER_AGENT);
294
295         if (curl_ftp_no_epsv)
296                 curl_easy_setopt(result, CURLOPT_FTP_USE_EPSV, 0);
297
298         if (curl_http_proxy)
299                 curl_easy_setopt(result, CURLOPT_PROXY, curl_http_proxy);
300
301         return result;
302 }
303
304 static void http_auth_init(const char *url)
305 {
306         char *at, *colon, *cp, *slash, *decoded;
307         int len;
308
309         cp = strstr(url, "://");
310         if (!cp)
311                 return;
312
313         /*
314          * Ok, the URL looks like "proto://something".  Which one?
315          * "proto://<user>:<pass>@<host>/...",
316          * "proto://<user>@<host>/...", or just
317          * "proto://<host>/..."?
318          */
319         cp += 3;
320         at = strchr(cp, '@');
321         colon = strchr(cp, ':');
322         slash = strchrnul(cp, '/');
323         if (!at || slash <= at)
324                 return; /* No credentials */
325         if (!colon || at <= colon) {
326                 /* Only username */
327                 len = at - cp;
328                 user_name = xmalloc(len + 1);
329                 memcpy(user_name, cp, len);
330                 user_name[len] = '\0';
331                 decoded = url_decode(user_name);
332                 free(user_name);
333                 user_name = decoded;
334                 user_pass = NULL;
335         } else {
336                 len = colon - cp;
337                 user_name = xmalloc(len + 1);
338                 memcpy(user_name, cp, len);
339                 user_name[len] = '\0';
340                 decoded = url_decode(user_name);
341                 free(user_name);
342                 user_name = decoded;
343                 len = at - (colon + 1);
344                 user_pass = xmalloc(len + 1);
345                 memcpy(user_pass, colon + 1, len);
346                 user_pass[len] = '\0';
347                 decoded = url_decode(user_pass);
348                 free(user_pass);
349                 user_pass = decoded;
350         }
351 }
352
/*
 * Point *var at the value of the environment variable envname when it
 * is set; leave *var untouched otherwise.
 */
static void set_from_env(const char **var, const char *envname)
{
        const char *from_env = getenv(envname);

        if (!from_env)
                return;
        *var = from_env;
}
359
360 void http_init(struct remote *remote)
361 {
362         char *low_speed_limit;
363         char *low_speed_time;
364
365         http_is_verbose = 0;
366
367         git_config(http_options, NULL);
368
369         curl_global_init(CURL_GLOBAL_ALL);
370
371         if (remote && remote->http_proxy)
372                 curl_http_proxy = xstrdup(remote->http_proxy);
373
374         pragma_header = curl_slist_append(pragma_header, "Pragma: no-cache");
375         no_pragma_header = curl_slist_append(no_pragma_header, "Pragma:");
376
377 #ifdef USE_CURL_MULTI
378         {
379                 char *http_max_requests = getenv("GIT_HTTP_MAX_REQUESTS");
380                 if (http_max_requests != NULL)
381                         max_requests = atoi(http_max_requests);
382         }
383
384         curlm = curl_multi_init();
385         if (curlm == NULL) {
386                 fprintf(stderr, "Error creating curl multi handle.\n");
387                 exit(1);
388         }
389 #endif
390
391         if (getenv("GIT_SSL_NO_VERIFY"))
392                 curl_ssl_verify = 0;
393
394         set_from_env(&ssl_cert, "GIT_SSL_CERT");
395 #if LIBCURL_VERSION_NUM >= 0x070903
396         set_from_env(&ssl_key, "GIT_SSL_KEY");
397 #endif
398 #if LIBCURL_VERSION_NUM >= 0x070908
399         set_from_env(&ssl_capath, "GIT_SSL_CAPATH");
400 #endif
401         set_from_env(&ssl_cainfo, "GIT_SSL_CAINFO");
402
403         set_from_env(&user_agent, "GIT_HTTP_USER_AGENT");
404
405         low_speed_limit = getenv("GIT_HTTP_LOW_SPEED_LIMIT");
406         if (low_speed_limit != NULL)
407                 curl_low_speed_limit = strtol(low_speed_limit, NULL, 10);
408         low_speed_time = getenv("GIT_HTTP_LOW_SPEED_TIME");
409         if (low_speed_time != NULL)
410                 curl_low_speed_time = strtol(low_speed_time, NULL, 10);
411
412         if (curl_ssl_verify == -1)
413                 curl_ssl_verify = 1;
414
415         curl_session_count = 0;
416 #ifdef USE_CURL_MULTI
417         if (max_requests < 1)
418                 max_requests = DEFAULT_MAX_REQUESTS;
419 #endif
420
421         if (getenv("GIT_CURL_FTP_NO_EPSV"))
422                 curl_ftp_no_epsv = 1;
423
424         if (remote && remote->url && remote->url[0]) {
425                 http_auth_init(remote->url[0]);
426                 if (!ssl_cert_password_required &&
427                     getenv("GIT_SSL_CERT_PASSWORD_PROTECTED") &&
428                     !prefixcmp(remote->url[0], "https://"))
429                         ssl_cert_password_required = 1;
430         }
431
432 #ifndef NO_CURL_EASY_DUPHANDLE
433         curl_default = get_curl_handle();
434 #endif
435 }
436
437 void http_cleanup(void)
438 {
439         struct active_request_slot *slot = active_queue_head;
440
441         while (slot != NULL) {
442                 struct active_request_slot *next = slot->next;
443                 if (slot->curl != NULL) {
444 #ifdef USE_CURL_MULTI
445                         curl_multi_remove_handle(curlm, slot->curl);
446 #endif
447                         curl_easy_cleanup(slot->curl);
448                 }
449                 free(slot);
450                 slot = next;
451         }
452         active_queue_head = NULL;
453
454 #ifndef NO_CURL_EASY_DUPHANDLE
455         curl_easy_cleanup(curl_default);
456 #endif
457
458 #ifdef USE_CURL_MULTI
459         curl_multi_cleanup(curlm);
460 #endif
461         curl_global_cleanup();
462
463         curl_slist_free_all(pragma_header);
464         pragma_header = NULL;
465
466         curl_slist_free_all(no_pragma_header);
467         no_pragma_header = NULL;
468
469         if (curl_http_proxy) {
470                 free((void *)curl_http_proxy);
471                 curl_http_proxy = NULL;
472         }
473
474         if (ssl_cert_password != NULL) {
475                 memset(ssl_cert_password, 0, strlen(ssl_cert_password));
476                 free(ssl_cert_password);
477                 ssl_cert_password = NULL;
478         }
479         ssl_cert_password_required = 0;
480 }
481
482 struct active_request_slot *get_active_slot(void)
483 {
484         struct active_request_slot *slot = active_queue_head;
485         struct active_request_slot *newslot;
486
487 #ifdef USE_CURL_MULTI
488         int num_transfers;
489
490         /* Wait for a slot to open up if the queue is full */
491         while (active_requests >= max_requests) {
492                 curl_multi_perform(curlm, &num_transfers);
493                 if (num_transfers < active_requests)
494                         process_curl_messages();
495         }
496 #endif
497
498         while (slot != NULL && slot->in_use)
499                 slot = slot->next;
500
501         if (slot == NULL) {
502                 newslot = xmalloc(sizeof(*newslot));
503                 newslot->curl = NULL;
504                 newslot->in_use = 0;
505                 newslot->next = NULL;
506
507                 slot = active_queue_head;
508                 if (slot == NULL) {
509                         active_queue_head = newslot;
510                 } else {
511                         while (slot->next != NULL)
512                                 slot = slot->next;
513                         slot->next = newslot;
514                 }
515                 slot = newslot;
516         }
517
518         if (slot->curl == NULL) {
519 #ifdef NO_CURL_EASY_DUPHANDLE
520                 slot->curl = get_curl_handle();
521 #else
522                 slot->curl = curl_easy_duphandle(curl_default);
523 #endif
524                 curl_session_count++;
525         }
526
527         active_requests++;
528         slot->in_use = 1;
529         slot->local = NULL;
530         slot->results = NULL;
531         slot->finished = NULL;
532         slot->callback_data = NULL;
533         slot->callback_func = NULL;
534         curl_easy_setopt(slot->curl, CURLOPT_HTTPHEADER, pragma_header);
535         curl_easy_setopt(slot->curl, CURLOPT_ERRORBUFFER, curl_errorstr);
536         curl_easy_setopt(slot->curl, CURLOPT_CUSTOMREQUEST, NULL);
537         curl_easy_setopt(slot->curl, CURLOPT_READFUNCTION, NULL);
538         curl_easy_setopt(slot->curl, CURLOPT_WRITEFUNCTION, NULL);
539         curl_easy_setopt(slot->curl, CURLOPT_POSTFIELDS, NULL);
540         curl_easy_setopt(slot->curl, CURLOPT_UPLOAD, 0);
541         curl_easy_setopt(slot->curl, CURLOPT_HTTPGET, 1);
542
543         return slot;
544 }
545
/*
 * Start the transfer configured on the slot.  Returns 1 on success.
 * With USE_CURL_MULTI, a failure to add the handle to the multi handle
 * releases the slot (no longer in use, no longer counted as active) and
 * returns 0.  Without it the function only reports success.
 */
int start_active_slot(struct active_request_slot *slot)
{
#ifdef USE_CURL_MULTI
        int num_transfers;
        CURLMcode rc = curl_multi_add_handle(curlm, slot->curl);

        if (rc == CURLM_OK || rc == CURLM_CALL_MULTI_PERFORM) {
                /* Something was just added, so there is work to do. */
                curl_multi_perform(curlm, &num_transfers);
                return 1;
        }

        active_requests--;
        slot->in_use = 0;
        return 0;
#else
        return 1;
#endif
}
567
568 #ifdef USE_CURL_MULTI
/* One registered "fill" callback together with its argument. */
struct fill_chain {
        void *data;
        int (*fill)(void *);
        struct fill_chain *next;
};

/* Registered callbacks, kept in registration order. */
static struct fill_chain *fill_cfg;

/*
 * Register fill(data) at the end of the callback chain that
 * fill_active_slots() walks.
 */
void add_fill_function(void *data, int (*fill)(void *))
{
        struct fill_chain *entry = xmalloc(sizeof(*entry));
        struct fill_chain *last;

        entry->data = data;
        entry->fill = fill;
        entry->next = NULL;

        if (!fill_cfg) {
                fill_cfg = entry;
                return;
        }

        for (last = fill_cfg; last->next; last = last->next)
                ; /* walk to the current tail */
        last->next = entry;
}
588
589 void fill_active_slots(void)
590 {
591         struct active_request_slot *slot = active_queue_head;
592
593         while (active_requests < max_requests) {
594                 struct fill_chain *fill;
595                 for (fill = fill_cfg; fill; fill = fill->next)
596                         if (fill->fill(fill->data))
597                                 break;
598
599                 if (!fill)
600                         break;
601         }
602
603         while (slot != NULL) {
604                 if (!slot->in_use && slot->curl != NULL
605                         && curl_session_count > min_curl_sessions) {
606                         curl_easy_cleanup(slot->curl);
607                         slot->curl = NULL;
608                         curl_session_count--;
609                 }
610                 slot = slot->next;
611         }
612 }
613
614 void step_active_slots(void)
615 {
616         int num_transfers;
617         CURLMcode curlm_result;
618
619         do {
620                 curlm_result = curl_multi_perform(curlm, &num_transfers);
621         } while (curlm_result == CURLM_CALL_MULTI_PERFORM);
622         if (num_transfers < active_requests) {
623                 process_curl_messages();
624                 fill_active_slots();
625         }
626 }
627 #endif
628
629 void run_active_slot(struct active_request_slot *slot)
630 {
631 #ifdef USE_CURL_MULTI
632         long last_pos = 0;
633         long current_pos;
634         fd_set readfds;
635         fd_set writefds;
636         fd_set excfds;
637         int max_fd;
638         struct timeval select_timeout;
639         int finished = 0;
640
641         slot->finished = &finished;
642         while (!finished) {
643                 data_received = 0;
644                 step_active_slots();
645
646                 if (!data_received && slot->local != NULL) {
647                         current_pos = ftell(slot->local);
648                         if (current_pos > last_pos)
649                                 data_received++;
650                         last_pos = current_pos;
651                 }
652
653                 if (slot->in_use && !data_received) {
654                         max_fd = 0;
655                         FD_ZERO(&readfds);
656                         FD_ZERO(&writefds);
657                         FD_ZERO(&excfds);
658                         select_timeout.tv_sec = 0;
659                         select_timeout.tv_usec = 50000;
660                         select(max_fd, &readfds, &writefds,
661                                &excfds, &select_timeout);
662                 }
663         }
664 #else
665         while (slot->in_use) {
666                 slot->curl_result = curl_easy_perform(slot->curl);
667                 finish_active_slot(slot);
668         }
669 #endif
670 }
671
672 static void closedown_active_slot(struct active_request_slot *slot)
673 {
674         active_requests--;
675         slot->in_use = 0;
676 }
677
678 static void release_active_slot(struct active_request_slot *slot)
679 {
680         closedown_active_slot(slot);
681         if (slot->curl && curl_session_count > min_curl_sessions) {
682 #ifdef USE_CURL_MULTI
683                 curl_multi_remove_handle(curlm, slot->curl);
684 #endif
685                 curl_easy_cleanup(slot->curl);
686                 slot->curl = NULL;
687                 curl_session_count--;
688         }
689 #ifdef USE_CURL_MULTI
690         fill_active_slots();
691 #endif
692 }
693
694 void finish_active_slot(struct active_request_slot *slot)
695 {
696         closedown_active_slot(slot);
697         curl_easy_getinfo(slot->curl, CURLINFO_HTTP_CODE, &slot->http_code);
698
699         if (slot->finished != NULL)
700                 (*slot->finished) = 1;
701
702         /* Store slot results so they can be read after the slot is reused */
703         if (slot->results != NULL) {
704                 slot->results->curl_result = slot->curl_result;
705                 slot->results->http_code = slot->http_code;
706         }
707
708         /* Run callback if appropriate */
709         if (slot->callback_func != NULL)
710                 slot->callback_func(slot->callback_data);
711 }
712
713 void finish_all_active_slots(void)
714 {
715         struct active_request_slot *slot = active_queue_head;
716
717         while (slot != NULL)
718                 if (slot->in_use) {
719                         run_active_slot(slot);
720                         slot = active_queue_head;
721                 } else {
722                         slot = slot->next;
723                 }
724 }
725
726 /* Helpers for modifying and creating URLs */
/*
 * Return 0 for characters that may appear in a URL unescaped (ASCII
 * letters, digits, '/', '-' and '.') and 1 for everything else.
 */
static inline int needs_quote(int ch)
{
        if (ch >= 'A' && ch <= 'Z')
                return 0;
        if (ch >= 'a' && ch <= 'z')
                return 0;
        if (ch >= '0' && ch <= '9')
                return 0;

        switch (ch) {
        case '/':
        case '-':
        case '.':
                return 0;
        default:
                return 1;
        }
}
738
/*
 * Map a value to a hexadecimal digit character: values below 10 are
 * offset from '0', all others from 'A' (so 10 yields 'A').
 */
static inline int hex(int v)
{
        return v < 10 ? '0' + v : 'A' + v - 10;
}
746
747 static char *quote_ref_url(const char *base, const char *ref)
748 {
749         struct strbuf buf = STRBUF_INIT;
750         const char *cp;
751         int ch;
752
753         end_url_with_slash(&buf, base);
754
755         for (cp = ref; (ch = *cp) != 0; cp++)
756                 if (needs_quote(ch))
757                         strbuf_addf(&buf, "%%%02x", ch);
758                 else
759                         strbuf_addch(&buf, *cp);
760
761         return strbuf_detach(&buf, NULL);
762 }
763
/*
 * Append the location of a loose object to buf: the base url (ended
 * with a slash), "objects/", the first two characters of hex and a
 * slash, followed by the rest of hex unless only_two_digit_prefix is
 * set.
 */
void append_remote_object_url(struct strbuf *buf, const char *url,
                              const char *hex,
                              int only_two_digit_prefix)
{
        end_url_with_slash(buf, url);

        strbuf_addf(buf, "objects/%.*s/", 2, hex);
        if (only_two_digit_prefix)
                return;

        strbuf_addf(buf, "%s", hex + 2);
}
774
775 char *get_remote_object_url(const char *url, const char *hex,
776                             int only_two_digit_prefix)
777 {
778         struct strbuf buf = STRBUF_INIT;
779         append_remote_object_url(&buf, url, hex, only_two_digit_prefix);
780         return strbuf_detach(&buf, NULL);
781 }
782
783 /* http_request() targets */
784 #define HTTP_REQUEST_STRBUF     0
785 #define HTTP_REQUEST_FILE       1
786
787 static int http_request(const char *url, void *result, int target, int options)
788 {
789         struct active_request_slot *slot;
790         struct slot_results results;
791         struct curl_slist *headers = NULL;
792         struct strbuf buf = STRBUF_INIT;
793         int ret;
794
795         slot = get_active_slot();
796         slot->results = &results;
797         curl_easy_setopt(slot->curl, CURLOPT_HTTPGET, 1);
798
799         if (result == NULL) {
800                 curl_easy_setopt(slot->curl, CURLOPT_NOBODY, 1);
801         } else {
802                 curl_easy_setopt(slot->curl, CURLOPT_NOBODY, 0);
803                 curl_easy_setopt(slot->curl, CURLOPT_FILE, result);
804
805                 if (target == HTTP_REQUEST_FILE) {
806                         long posn = ftell(result);
807                         curl_easy_setopt(slot->curl, CURLOPT_WRITEFUNCTION,
808                                          fwrite);
809                         if (posn > 0) {
810                                 strbuf_addf(&buf, "Range: bytes=%ld-", posn);
811                                 headers = curl_slist_append(headers, buf.buf);
812                                 strbuf_reset(&buf);
813                         }
814                         slot->local = result;
815                 } else
816                         curl_easy_setopt(slot->curl, CURLOPT_WRITEFUNCTION,
817                                          fwrite_buffer);
818         }
819
820         strbuf_addstr(&buf, "Pragma:");
821         if (options & HTTP_NO_CACHE)
822                 strbuf_addstr(&buf, " no-cache");
823
824         headers = curl_slist_append(headers, buf.buf);
825
826         curl_easy_setopt(slot->curl, CURLOPT_URL, url);
827         curl_easy_setopt(slot->curl, CURLOPT_HTTPHEADER, headers);
828
829         if (start_active_slot(slot)) {
830                 run_active_slot(slot);
831                 if (results.curl_result == CURLE_OK)
832                         ret = HTTP_OK;
833                 else if (missing_target(&results))
834                         ret = HTTP_MISSING_TARGET;
835                 else if (results.http_code == 401) {
836                         if (user_name) {
837                                 ret = HTTP_NOAUTH;
838                         } else {
839                                 /*
840                                  * git_getpass is needed here because its very likely stdin/stdout are
841                                  * pipes to our parent process.  So we instead need to use /dev/tty,
842                                  * but that is non-portable.  Using git_getpass() can at least be stubbed
843                                  * on other platforms with a different implementation if/when necessary.
844                                  */
845                                 user_name = xstrdup(git_getpass("Username: "));
846                                 init_curl_http_auth(slot->curl);
847                                 ret = HTTP_REAUTH;
848                         }
849                 } else
850                         ret = HTTP_ERROR;
851         } else {
852                 error("Unable to start HTTP request for %s", url);
853                 ret = HTTP_START_FAILED;
854         }
855
856         slot->local = NULL;
857         curl_slist_free_all(headers);
858         strbuf_release(&buf);
859
860         return ret;
861 }
862
863 int http_get_strbuf(const char *url, struct strbuf *result, int options)
864 {
865         int http_ret = http_request(url, result, HTTP_REQUEST_STRBUF, options);
866         if (http_ret == HTTP_REAUTH) {
867                 http_ret = http_request(url, result, HTTP_REQUEST_STRBUF, options);
868         }
869         return http_ret;
870 }
871
872 /*
873  * Downloads an url and stores the result in the given file.
874  *
875  * If a previous interrupted download is detected (i.e. a previous temporary
876  * file is still around) the download is resumed.
877  */
878 static int http_get_file(const char *url, const char *filename, int options)
879 {
880         int ret;
881         struct strbuf tmpfile = STRBUF_INIT;
882         FILE *result;
883
884         strbuf_addf(&tmpfile, "%s.temp", filename);
885         result = fopen(tmpfile.buf, "a");
886         if (! result) {
887                 error("Unable to open local file %s", tmpfile.buf);
888                 ret = HTTP_ERROR;
889                 goto cleanup;
890         }
891
892         ret = http_request(url, result, HTTP_REQUEST_FILE, options);
893         fclose(result);
894
895         if ((ret == HTTP_OK) && move_temp_to_file(tmpfile.buf, filename))
896                 ret = HTTP_ERROR;
897 cleanup:
898         strbuf_release(&tmpfile);
899         return ret;
900 }
901
902 int http_error(const char *url, int ret)
903 {
904         /* http_request has already handled HTTP_START_FAILED. */
905         if (ret != HTTP_START_FAILED)
906                 error("%s while accessing %s\n", curl_errorstr, url);
907
908         return ret;
909 }
910
911 int http_fetch_ref(const char *base, struct ref *ref)
912 {
913         char *url;
914         struct strbuf buffer = STRBUF_INIT;
915         int ret = -1;
916
917         url = quote_ref_url(base, ref->name);
918         if (http_get_strbuf(url, &buffer, HTTP_NO_CACHE) == HTTP_OK) {
919                 strbuf_rtrim(&buffer);
920                 if (buffer.len == 40)
921                         ret = get_sha1_hex(buffer.buf, ref->old_sha1);
922                 else if (!prefixcmp(buffer.buf, "ref: ")) {
923                         ref->symref = xstrdup(buffer.buf + 5);
924                         ret = 0;
925                 }
926         }
927
928         strbuf_release(&buffer);
929         free(url);
930         return ret;
931 }
932
933 /* Helpers for fetching packs */
934 static char *fetch_pack_index(unsigned char *sha1, const char *base_url)
935 {
936         char *url, *tmp;
937         struct strbuf buf = STRBUF_INIT;
938
939         if (http_is_verbose)
940                 fprintf(stderr, "Getting index for pack %s\n", sha1_to_hex(sha1));
941
942         end_url_with_slash(&buf, base_url);
943         strbuf_addf(&buf, "objects/pack/pack-%s.idx", sha1_to_hex(sha1));
944         url = strbuf_detach(&buf, NULL);
945
946         strbuf_addf(&buf, "%s.temp", sha1_pack_index_name(sha1));
947         tmp = strbuf_detach(&buf, NULL);
948
949         if (http_get_file(url, tmp, 0) != HTTP_OK) {
950                 error("Unable to get pack index %s\n", url);
951                 free(tmp);
952                 tmp = NULL;
953         }
954
955         free(url);
956         return tmp;
957 }
958
959 static int fetch_and_setup_pack_index(struct packed_git **packs_head,
960         unsigned char *sha1, const char *base_url)
961 {
962         struct packed_git *new_pack;
963         char *tmp_idx = NULL;
964         int ret;
965
966         if (has_pack_index(sha1)) {
967                 new_pack = parse_pack_index(sha1, NULL);
968                 if (!new_pack)
969                         return -1; /* parse_pack_index() already issued error message */
970                 goto add_pack;
971         }
972
973         tmp_idx = fetch_pack_index(sha1, base_url);
974         if (!tmp_idx)
975                 return -1;
976
977         new_pack = parse_pack_index(sha1, tmp_idx);
978         if (!new_pack) {
979                 unlink(tmp_idx);
980                 free(tmp_idx);
981
982                 return -1; /* parse_pack_index() already issued error message */
983         }
984
985         ret = verify_pack_index(new_pack);
986         if (!ret) {
987                 close_pack_index(new_pack);
988                 ret = move_temp_to_file(tmp_idx, sha1_pack_index_name(sha1));
989         }
990         free(tmp_idx);
991         if (ret)
992                 return -1;
993
994 add_pack:
995         new_pack->next = *packs_head;
996         *packs_head = new_pack;
997         return 0;
998 }
999
1000 int http_get_info_packs(const char *base_url, struct packed_git **packs_head)
1001 {
1002         int ret = 0, i = 0;
1003         char *url, *data;
1004         struct strbuf buf = STRBUF_INIT;
1005         unsigned char sha1[20];
1006
1007         end_url_with_slash(&buf, base_url);
1008         strbuf_addstr(&buf, "objects/info/packs");
1009         url = strbuf_detach(&buf, NULL);
1010
1011         ret = http_get_strbuf(url, &buf, HTTP_NO_CACHE);
1012         if (ret != HTTP_OK)
1013                 goto cleanup;
1014
1015         data = buf.buf;
1016         while (i < buf.len) {
1017                 switch (data[i]) {
1018                 case 'P':
1019                         i++;
1020                         if (i + 52 <= buf.len &&
1021                             !prefixcmp(data + i, " pack-") &&
1022                             !prefixcmp(data + i + 46, ".pack\n")) {
1023                                 get_sha1_hex(data + i + 6, sha1);
1024                                 fetch_and_setup_pack_index(packs_head, sha1,
1025                                                       base_url);
1026                                 i += 51;
1027                                 break;
1028                         }
1029                 default:
1030                         while (i < buf.len && data[i] != '\n')
1031                                 i++;
1032                 }
1033                 i++;
1034         }
1035
1036 cleanup:
1037         free(url);
1038         return ret;
1039 }
1040
1041 void release_http_pack_request(struct http_pack_request *preq)
1042 {
1043         if (preq->packfile != NULL) {
1044                 fclose(preq->packfile);
1045                 preq->packfile = NULL;
1046                 preq->slot->local = NULL;
1047         }
1048         if (preq->range_header != NULL) {
1049                 curl_slist_free_all(preq->range_header);
1050                 preq->range_header = NULL;
1051         }
1052         preq->slot = NULL;
1053         free(preq->url);
1054 }
1055
1056 int finish_http_pack_request(struct http_pack_request *preq)
1057 {
1058         struct packed_git **lst;
1059         struct packed_git *p = preq->target;
1060         char *tmp_idx;
1061         struct child_process ip;
1062         const char *ip_argv[8];
1063
1064         close_pack_index(p);
1065
1066         fclose(preq->packfile);
1067         preq->packfile = NULL;
1068         preq->slot->local = NULL;
1069
1070         lst = preq->lst;
1071         while (*lst != p)
1072                 lst = &((*lst)->next);
1073         *lst = (*lst)->next;
1074
1075         tmp_idx = xstrdup(preq->tmpfile);
1076         strcpy(tmp_idx + strlen(tmp_idx) - strlen(".pack.temp"),
1077                ".idx.temp");
1078
1079         ip_argv[0] = "index-pack";
1080         ip_argv[1] = "-o";
1081         ip_argv[2] = tmp_idx;
1082         ip_argv[3] = preq->tmpfile;
1083         ip_argv[4] = NULL;
1084
1085         memset(&ip, 0, sizeof(ip));
1086         ip.argv = ip_argv;
1087         ip.git_cmd = 1;
1088         ip.no_stdin = 1;
1089         ip.no_stdout = 1;
1090
1091         if (run_command(&ip)) {
1092                 unlink(preq->tmpfile);
1093                 unlink(tmp_idx);
1094                 free(tmp_idx);
1095                 return -1;
1096         }
1097
1098         unlink(sha1_pack_index_name(p->sha1));
1099
1100         if (move_temp_to_file(preq->tmpfile, sha1_pack_name(p->sha1))
1101          || move_temp_to_file(tmp_idx, sha1_pack_index_name(p->sha1))) {
1102                 free(tmp_idx);
1103                 return -1;
1104         }
1105
1106         install_packed_git(p);
1107         free(tmp_idx);
1108         return 0;
1109 }
1110
1111 struct http_pack_request *new_http_pack_request(
1112         struct packed_git *target, const char *base_url)
1113 {
1114         long prev_posn = 0;
1115         char range[RANGE_HEADER_SIZE];
1116         struct strbuf buf = STRBUF_INIT;
1117         struct http_pack_request *preq;
1118
1119         preq = xmalloc(sizeof(*preq));
1120         preq->target = target;
1121         preq->range_header = NULL;
1122
1123         end_url_with_slash(&buf, base_url);
1124         strbuf_addf(&buf, "objects/pack/pack-%s.pack",
1125                 sha1_to_hex(target->sha1));
1126         preq->url = strbuf_detach(&buf, NULL);
1127
1128         snprintf(preq->tmpfile, sizeof(preq->tmpfile), "%s.temp",
1129                 sha1_pack_name(target->sha1));
1130         preq->packfile = fopen(preq->tmpfile, "a");
1131         if (!preq->packfile) {
1132                 error("Unable to open local file %s for pack",
1133                       preq->tmpfile);
1134                 goto abort;
1135         }
1136
1137         preq->slot = get_active_slot();
1138         preq->slot->local = preq->packfile;
1139         curl_easy_setopt(preq->slot->curl, CURLOPT_FILE, preq->packfile);
1140         curl_easy_setopt(preq->slot->curl, CURLOPT_WRITEFUNCTION, fwrite);
1141         curl_easy_setopt(preq->slot->curl, CURLOPT_URL, preq->url);
1142         curl_easy_setopt(preq->slot->curl, CURLOPT_HTTPHEADER,
1143                 no_pragma_header);
1144
1145         /*
1146          * If there is data present from a previous transfer attempt,
1147          * resume where it left off
1148          */
1149         prev_posn = ftell(preq->packfile);
1150         if (prev_posn>0) {
1151                 if (http_is_verbose)
1152                         fprintf(stderr,
1153                                 "Resuming fetch of pack %s at byte %ld\n",
1154                                 sha1_to_hex(target->sha1), prev_posn);
1155                 sprintf(range, "Range: bytes=%ld-", prev_posn);
1156                 preq->range_header = curl_slist_append(NULL, range);
1157                 curl_easy_setopt(preq->slot->curl, CURLOPT_HTTPHEADER,
1158                         preq->range_header);
1159         }
1160
1161         return preq;
1162
1163 abort:
1164         free(preq->url);
1165         free(preq);
1166         return NULL;
1167 }
1168
1169 /* Helpers for fetching objects (loose) */
1170 static size_t fwrite_sha1_file(void *ptr, size_t eltsize, size_t nmemb,
1171                                void *data)
1172 {
1173         unsigned char expn[4096];
1174         size_t size = eltsize * nmemb;
1175         int posn = 0;
1176         struct http_object_request *freq =
1177                 (struct http_object_request *)data;
1178         do {
1179                 ssize_t retval = xwrite(freq->localfile,
1180                                         (char *) ptr + posn, size - posn);
1181                 if (retval < 0)
1182                         return posn;
1183                 posn += retval;
1184         } while (posn < size);
1185
1186         freq->stream.avail_in = size;
1187         freq->stream.next_in = ptr;
1188         do {
1189                 freq->stream.next_out = expn;
1190                 freq->stream.avail_out = sizeof(expn);
1191                 freq->zret = git_inflate(&freq->stream, Z_SYNC_FLUSH);
1192                 git_SHA1_Update(&freq->c, expn,
1193                                 sizeof(expn) - freq->stream.avail_out);
1194         } while (freq->stream.avail_in && freq->zret == Z_OK);
1195         data_received++;
1196         return size;
1197 }
1198
1199 struct http_object_request *new_http_object_request(const char *base_url,
1200         unsigned char *sha1)
1201 {
1202         char *hex = sha1_to_hex(sha1);
1203         char *filename;
1204         char prevfile[PATH_MAX];
1205         int prevlocal;
1206         unsigned char prev_buf[PREV_BUF_SIZE];
1207         ssize_t prev_read = 0;
1208         long prev_posn = 0;
1209         char range[RANGE_HEADER_SIZE];
1210         struct curl_slist *range_header = NULL;
1211         struct http_object_request *freq;
1212
1213         freq = xmalloc(sizeof(*freq));
1214         hashcpy(freq->sha1, sha1);
1215         freq->localfile = -1;
1216
1217         filename = sha1_file_name(sha1);
1218         snprintf(freq->tmpfile, sizeof(freq->tmpfile),
1219                  "%s.temp", filename);
1220
1221         snprintf(prevfile, sizeof(prevfile), "%s.prev", filename);
1222         unlink_or_warn(prevfile);
1223         rename(freq->tmpfile, prevfile);
1224         unlink_or_warn(freq->tmpfile);
1225
1226         if (freq->localfile != -1)
1227                 error("fd leakage in start: %d", freq->localfile);
1228         freq->localfile = open(freq->tmpfile,
1229                                O_WRONLY | O_CREAT | O_EXCL, 0666);
1230         /*
1231          * This could have failed due to the "lazy directory creation";
1232          * try to mkdir the last path component.
1233          */
1234         if (freq->localfile < 0 && errno == ENOENT) {
1235                 char *dir = strrchr(freq->tmpfile, '/');
1236                 if (dir) {
1237                         *dir = 0;
1238                         mkdir(freq->tmpfile, 0777);
1239                         *dir = '/';
1240                 }
1241                 freq->localfile = open(freq->tmpfile,
1242                                        O_WRONLY | O_CREAT | O_EXCL, 0666);
1243         }
1244
1245         if (freq->localfile < 0) {
1246                 error("Couldn't create temporary file %s: %s",
1247                       freq->tmpfile, strerror(errno));
1248                 goto abort;
1249         }
1250
1251         memset(&freq->stream, 0, sizeof(freq->stream));
1252
1253         git_inflate_init(&freq->stream);
1254
1255         git_SHA1_Init(&freq->c);
1256
1257         freq->url = get_remote_object_url(base_url, hex, 0);
1258
1259         /*
1260          * If a previous temp file is present, process what was already
1261          * fetched.
1262          */
1263         prevlocal = open(prevfile, O_RDONLY);
1264         if (prevlocal != -1) {
1265                 do {
1266                         prev_read = xread(prevlocal, prev_buf, PREV_BUF_SIZE);
1267                         if (prev_read>0) {
1268                                 if (fwrite_sha1_file(prev_buf,
1269                                                      1,
1270                                                      prev_read,
1271                                                      freq) == prev_read) {
1272                                         prev_posn += prev_read;
1273                                 } else {
1274                                         prev_read = -1;
1275                                 }
1276                         }
1277                 } while (prev_read > 0);
1278                 close(prevlocal);
1279         }
1280         unlink_or_warn(prevfile);
1281
1282         /*
1283          * Reset inflate/SHA1 if there was an error reading the previous temp
1284          * file; also rewind to the beginning of the local file.
1285          */
1286         if (prev_read == -1) {
1287                 memset(&freq->stream, 0, sizeof(freq->stream));
1288                 git_inflate_init(&freq->stream);
1289                 git_SHA1_Init(&freq->c);
1290                 if (prev_posn>0) {
1291                         prev_posn = 0;
1292                         lseek(freq->localfile, 0, SEEK_SET);
1293                         if (ftruncate(freq->localfile, 0) < 0) {
1294                                 error("Couldn't truncate temporary file %s: %s",
1295                                           freq->tmpfile, strerror(errno));
1296                                 goto abort;
1297                         }
1298                 }
1299         }
1300
1301         freq->slot = get_active_slot();
1302
1303         curl_easy_setopt(freq->slot->curl, CURLOPT_FILE, freq);
1304         curl_easy_setopt(freq->slot->curl, CURLOPT_WRITEFUNCTION, fwrite_sha1_file);
1305         curl_easy_setopt(freq->slot->curl, CURLOPT_ERRORBUFFER, freq->errorstr);
1306         curl_easy_setopt(freq->slot->curl, CURLOPT_URL, freq->url);
1307         curl_easy_setopt(freq->slot->curl, CURLOPT_HTTPHEADER, no_pragma_header);
1308
1309         /*
1310          * If we have successfully processed data from a previous fetch
1311          * attempt, only fetch the data we don't already have.
1312          */
1313         if (prev_posn>0) {
1314                 if (http_is_verbose)
1315                         fprintf(stderr,
1316                                 "Resuming fetch of object %s at byte %ld\n",
1317                                 hex, prev_posn);
1318                 sprintf(range, "Range: bytes=%ld-", prev_posn);
1319                 range_header = curl_slist_append(range_header, range);
1320                 curl_easy_setopt(freq->slot->curl,
1321                                  CURLOPT_HTTPHEADER, range_header);
1322         }
1323
1324         return freq;
1325
1326 abort:
1327         free(filename);
1328         free(freq->url);
1329         free(freq);
1330         return NULL;
1331 }
1332
1333 void process_http_object_request(struct http_object_request *freq)
1334 {
1335         if (freq->slot == NULL)
1336                 return;
1337         freq->curl_result = freq->slot->curl_result;
1338         freq->http_code = freq->slot->http_code;
1339         freq->slot = NULL;
1340 }
1341
1342 int finish_http_object_request(struct http_object_request *freq)
1343 {
1344         struct stat st;
1345
1346         close(freq->localfile);
1347         freq->localfile = -1;
1348
1349         process_http_object_request(freq);
1350
1351         if (freq->http_code == 416) {
1352                 warning("requested range invalid; we may already have all the data.");
1353         } else if (freq->curl_result != CURLE_OK) {
1354                 if (stat(freq->tmpfile, &st) == 0)
1355                         if (st.st_size == 0)
1356                                 unlink_or_warn(freq->tmpfile);
1357                 return -1;
1358         }
1359
1360         git_inflate_end(&freq->stream);
1361         git_SHA1_Final(freq->real_sha1, &freq->c);
1362         if (freq->zret != Z_STREAM_END) {
1363                 unlink_or_warn(freq->tmpfile);
1364                 return -1;
1365         }
1366         if (hashcmp(freq->sha1, freq->real_sha1)) {
1367                 unlink_or_warn(freq->tmpfile);
1368                 return -1;
1369         }
1370         freq->rename =
1371                 move_temp_to_file(freq->tmpfile, sha1_file_name(freq->sha1));
1372
1373         return freq->rename;
1374 }
1375
1376 void abort_http_object_request(struct http_object_request *freq)
1377 {
1378         unlink_or_warn(freq->tmpfile);
1379
1380         release_http_object_request(freq);
1381 }
1382
1383 void release_http_object_request(struct http_object_request *freq)
1384 {
1385         if (freq->localfile != -1) {
1386                 close(freq->localfile);
1387                 freq->localfile = -1;
1388         }
1389         if (freq->url != NULL) {
1390                 free(freq->url);
1391                 freq->url = NULL;
1392         }
1393         if (freq->slot != NULL) {
1394                 freq->slot->callback_func = NULL;
1395                 freq->slot->callback_data = NULL;
1396                 release_active_slot(freq->slot);
1397                 freq->slot = NULL;
1398         }
1399 }