Merge branch 'jc/doc-git-updates' (early part)
[git] / http.c
1 #include "http.h"
2 #include "pack.h"
3 #include "sideband.h"
4 #include "run-command.h"
5 #include "url.h"
6 #include "credential.h"
7 #include "version.h"
8
/* Number of slots currently marked in use; bumped by get_active_slot(). */
9 int active_requests;
/* Gates progress messages on stderr; reset to 0 by http_init(). */
10 int http_is_verbose;
/* POST buffer size; "http.postbuffer" can override this default. */
11 size_t http_post_buffer = 16 * LARGE_PACKET_MAX;
12
13 #if LIBCURL_VERSION_NUM >= 0x070a06
14 #define LIBCURL_CAN_HANDLE_AUTH_ANY
15 #endif
16
/* Idle curl handles are only destroyed while curl_session_count exceeds this. */
17 static int min_curl_sessions = 1;
/* Counts curl handles created for slots and not yet cleaned up. */
18 static int curl_session_count;
19 #ifdef USE_CURL_MULTI
/* -1 means "not configured"; http_init() replaces values < 1 with the default. */
20 static int max_requests = -1;
/* Multi handle shared by all slots; created in http_init(). */
21 static CURLM *curlm;
22 #endif
23 #ifndef NO_CURL_EASY_DUPHANDLE
/* Template handle built once by http_init() and duplicated for each slot. */
24 static CURL *curl_default;
25 #endif
26
/* NOTE(review): neither size is referenced in the visible part of the file. */
27 #define PREV_BUF_SIZE 4096
28 #define RANGE_HEADER_SIZE 30
29
/* Installed as CURLOPT_ERRORBUFFER on every slot; reported by http_error(). */
30 char curl_errorstr[CURL_ERROR_SIZE];
31
/* -1 means "not configured"; http_init() turns that into 1 (verify). */
32 static int curl_ssl_verify = -1;
/* TLS settings, taken from http.ssl* config or the GIT_SSL_* environment. */
33 static const char *ssl_cert;
34 #if LIBCURL_VERSION_NUM >= 0x070903
35 static const char *ssl_key;
36 #endif
37 #if LIBCURL_VERSION_NUM >= 0x070908
38 static const char *ssl_capath;
39 #endif
40 static const char *ssl_cainfo;
/* Low-speed abort thresholds; only applied when both are > 0. */
41 static long curl_low_speed_limit = -1;
42 static long curl_low_speed_time = -1;
/* Non-zero disables EPSV (http.noepsv or GIT_CURL_FTP_NO_EPSV). */
43 static int curl_ftp_no_epsv;
/* Heap-allocated proxy URL; freed by http_cleanup(). */
44 static const char *curl_http_proxy;
45 static const char *curl_cookie_file;
/* Credential for the remote, seeded from the URL given to http_init(). */
46 static struct credential http_auth = CREDENTIAL_INIT;
/* When set, get_curl_handle() installs credentials before any request. */
47 static int http_proactive_auth;
/* Overrides git_user_agent() when non-NULL. */
48 static const char *user_agent;
49
50 #if LIBCURL_VERSION_NUM >= 0x071700
51 /* Use CURLOPT_KEYPASSWD as is */
52 #elif LIBCURL_VERSION_NUM >= 0x070903
53 #define CURLOPT_KEYPASSWD CURLOPT_SSLKEYPASSWD
54 #else
55 #define CURLOPT_KEYPASSWD CURLOPT_SSLCERTPASSWD
56 #endif
57
/* Credential holding the client certificate password, if one is required. */
58 static struct credential cert_auth = CREDENTIAL_INIT;
59 static int ssl_cert_password_required;
60
/* Header lists built in http_init() and released in http_cleanup(). */
61 static struct curl_slist *pragma_header;
62 static struct curl_slist *no_pragma_header;
63
/* Head of the singly linked list of request slots. */
64 static struct active_request_slot *active_queue_head;
65
66 size_t fread_buffer(char *ptr, size_t eltsize, size_t nmemb, void *buffer_)
67 {
68         size_t size = eltsize * nmemb;
69         struct buffer *buffer = buffer_;
70
71         if (size > buffer->buf.len - buffer->posn)
72                 size = buffer->buf.len - buffer->posn;
73         memcpy(ptr, buffer->buf.buf + buffer->posn, size);
74         buffer->posn += size;
75
76         return size;
77 }
78
79 #ifndef NO_CURL_IOCTL
80 curlioerr ioctl_buffer(CURL *handle, int cmd, void *clientp)
81 {
82         struct buffer *buffer = clientp;
83
84         switch (cmd) {
85         case CURLIOCMD_NOP:
86                 return CURLIOE_OK;
87
88         case CURLIOCMD_RESTARTREAD:
89                 buffer->posn = 0;
90                 return CURLIOE_OK;
91
92         default:
93                 return CURLIOE_UNKNOWNCMD;
94         }
95 }
96 #endif
97
/*
 * fwrite()-shaped callback: append eltsize * nmemb bytes from ptr to
 * the strbuf passed as buffer_ and report all of them as consumed.
 */
size_t fwrite_buffer(char *ptr, size_t eltsize, size_t nmemb, void *buffer_)
{
	struct strbuf *out = buffer_;
	size_t nbytes = eltsize * nmemb;

	strbuf_add(out, ptr, nbytes);

	return nbytes;
}
106
/*
 * fwrite()-shaped callback that discards its input: nothing is stored,
 * but the full eltsize * nmemb byte count is reported as written.
 */
size_t fwrite_null(char *ptr, size_t eltsize, size_t nmemb, void *strbuf)
{
	size_t consumed = eltsize * nmemb;

	return consumed;
}
111
112 #ifdef USE_CURL_MULTI
113 static void process_curl_messages(void)
114 {
115         int num_messages;
116         struct active_request_slot *slot;
117         CURLMsg *curl_message = curl_multi_info_read(curlm, &num_messages);
118
119         while (curl_message != NULL) {
120                 if (curl_message->msg == CURLMSG_DONE) {
121                         int curl_result = curl_message->data.result;
122                         slot = active_queue_head;
123                         while (slot != NULL &&
124                                slot->curl != curl_message->easy_handle)
125                                 slot = slot->next;
126                         if (slot != NULL) {
127                                 curl_multi_remove_handle(curlm, slot->curl);
128                                 slot->curl_result = curl_result;
129                                 finish_active_slot(slot);
130                         } else {
131                                 fprintf(stderr, "Received DONE message for unknown request!\n");
132                         }
133                 } else {
134                         fprintf(stderr, "Unknown CURL message received: %d\n",
135                                 (int)curl_message->msg);
136                 }
137                 curl_message = curl_multi_info_read(curlm, &num_messages);
138         }
139 }
140 #endif
141
142 static int http_options(const char *var, const char *value, void *cb)
143 {
144         if (!strcmp("http.sslverify", var)) {
145                 curl_ssl_verify = git_config_bool(var, value);
146                 return 0;
147         }
148         if (!strcmp("http.sslcert", var))
149                 return git_config_string(&ssl_cert, var, value);
150 #if LIBCURL_VERSION_NUM >= 0x070903
151         if (!strcmp("http.sslkey", var))
152                 return git_config_string(&ssl_key, var, value);
153 #endif
154 #if LIBCURL_VERSION_NUM >= 0x070908
155         if (!strcmp("http.sslcapath", var))
156                 return git_config_string(&ssl_capath, var, value);
157 #endif
158         if (!strcmp("http.sslcainfo", var))
159                 return git_config_string(&ssl_cainfo, var, value);
160         if (!strcmp("http.sslcertpasswordprotected", var)) {
161                 if (git_config_bool(var, value))
162                         ssl_cert_password_required = 1;
163                 return 0;
164         }
165         if (!strcmp("http.minsessions", var)) {
166                 min_curl_sessions = git_config_int(var, value);
167 #ifndef USE_CURL_MULTI
168                 if (min_curl_sessions > 1)
169                         min_curl_sessions = 1;
170 #endif
171                 return 0;
172         }
173 #ifdef USE_CURL_MULTI
174         if (!strcmp("http.maxrequests", var)) {
175                 max_requests = git_config_int(var, value);
176                 return 0;
177         }
178 #endif
179         if (!strcmp("http.lowspeedlimit", var)) {
180                 curl_low_speed_limit = (long)git_config_int(var, value);
181                 return 0;
182         }
183         if (!strcmp("http.lowspeedtime", var)) {
184                 curl_low_speed_time = (long)git_config_int(var, value);
185                 return 0;
186         }
187
188         if (!strcmp("http.noepsv", var)) {
189                 curl_ftp_no_epsv = git_config_bool(var, value);
190                 return 0;
191         }
192         if (!strcmp("http.proxy", var))
193                 return git_config_string(&curl_http_proxy, var, value);
194
195         if (!strcmp("http.cookiefile", var))
196                 return git_config_string(&curl_cookie_file, var, value);
197
198         if (!strcmp("http.postbuffer", var)) {
199                 http_post_buffer = git_config_int(var, value);
200                 if (http_post_buffer < LARGE_PACKET_MAX)
201                         http_post_buffer = LARGE_PACKET_MAX;
202                 return 0;
203         }
204
205         if (!strcmp("http.useragent", var))
206                 return git_config_string(&user_agent, var, value);
207
208         /* Fall back on the default ones */
209         return git_default_config(var, value, cb);
210 }
211
212 static void init_curl_http_auth(CURL *result)
213 {
214         if (!http_auth.username)
215                 return;
216
217         credential_fill(&http_auth);
218
219 #if LIBCURL_VERSION_NUM >= 0x071301
220         curl_easy_setopt(result, CURLOPT_USERNAME, http_auth.username);
221         curl_easy_setopt(result, CURLOPT_PASSWORD, http_auth.password);
222 #else
223         {
224                 static struct strbuf up = STRBUF_INIT;
225                 strbuf_reset(&up);
226                 strbuf_addf(&up, "%s:%s",
227                             http_auth.username, http_auth.password);
228                 curl_easy_setopt(result, CURLOPT_USERPWD, up.buf);
229         }
230 #endif
231 }
232
233 static int has_cert_password(void)
234 {
235         if (ssl_cert == NULL || ssl_cert_password_required != 1)
236                 return 0;
237         if (!cert_auth.password) {
238                 cert_auth.protocol = xstrdup("cert");
239                 cert_auth.path = xstrdup(ssl_cert);
240                 credential_fill(&cert_auth);
241         }
242         return 1;
243 }
244
245 static CURL *get_curl_handle(void)
246 {
247         CURL *result = curl_easy_init();
248
249         if (!curl_ssl_verify) {
250                 curl_easy_setopt(result, CURLOPT_SSL_VERIFYPEER, 0);
251                 curl_easy_setopt(result, CURLOPT_SSL_VERIFYHOST, 0);
252         } else {
253                 /* Verify authenticity of the peer's certificate */
254                 curl_easy_setopt(result, CURLOPT_SSL_VERIFYPEER, 1);
255                 /* The name in the cert must match whom we tried to connect */
256                 curl_easy_setopt(result, CURLOPT_SSL_VERIFYHOST, 2);
257         }
258
259 #if LIBCURL_VERSION_NUM >= 0x070907
260         curl_easy_setopt(result, CURLOPT_NETRC, CURL_NETRC_OPTIONAL);
261 #endif
262 #ifdef LIBCURL_CAN_HANDLE_AUTH_ANY
263         curl_easy_setopt(result, CURLOPT_HTTPAUTH, CURLAUTH_ANY);
264 #endif
265
266         if (http_proactive_auth)
267                 init_curl_http_auth(result);
268
269         if (ssl_cert != NULL)
270                 curl_easy_setopt(result, CURLOPT_SSLCERT, ssl_cert);
271         if (has_cert_password())
272                 curl_easy_setopt(result, CURLOPT_KEYPASSWD, cert_auth.password);
273 #if LIBCURL_VERSION_NUM >= 0x070903
274         if (ssl_key != NULL)
275                 curl_easy_setopt(result, CURLOPT_SSLKEY, ssl_key);
276 #endif
277 #if LIBCURL_VERSION_NUM >= 0x070908
278         if (ssl_capath != NULL)
279                 curl_easy_setopt(result, CURLOPT_CAPATH, ssl_capath);
280 #endif
281         if (ssl_cainfo != NULL)
282                 curl_easy_setopt(result, CURLOPT_CAINFO, ssl_cainfo);
283         curl_easy_setopt(result, CURLOPT_FAILONERROR, 1);
284
285         if (curl_low_speed_limit > 0 && curl_low_speed_time > 0) {
286                 curl_easy_setopt(result, CURLOPT_LOW_SPEED_LIMIT,
287                                  curl_low_speed_limit);
288                 curl_easy_setopt(result, CURLOPT_LOW_SPEED_TIME,
289                                  curl_low_speed_time);
290         }
291
292         curl_easy_setopt(result, CURLOPT_FOLLOWLOCATION, 1);
293 #if LIBCURL_VERSION_NUM >= 0x071301
294         curl_easy_setopt(result, CURLOPT_POSTREDIR, CURL_REDIR_POST_ALL);
295 #elif LIBCURL_VERSION_NUM >= 0x071101
296         curl_easy_setopt(result, CURLOPT_POST301, 1);
297 #endif
298
299         if (getenv("GIT_CURL_VERBOSE"))
300                 curl_easy_setopt(result, CURLOPT_VERBOSE, 1);
301
302         curl_easy_setopt(result, CURLOPT_USERAGENT,
303                 user_agent ? user_agent : git_user_agent());
304
305         if (curl_ftp_no_epsv)
306                 curl_easy_setopt(result, CURLOPT_FTP_USE_EPSV, 0);
307
308         if (curl_http_proxy) {
309                 curl_easy_setopt(result, CURLOPT_PROXY, curl_http_proxy);
310                 curl_easy_setopt(result, CURLOPT_PROXYAUTH, CURLAUTH_ANY);
311         }
312
313         return result;
314 }
315
/*
 * Point *var at the value of environment variable envname, if it is
 * set.  *var is left alone when the variable is absent.
 */
static void set_from_env(const char **var, const char *envname)
{
	const char *env_value = getenv(envname);

	if (env_value == NULL)
		return;
	*var = env_value;
}
322
323 void http_init(struct remote *remote, const char *url, int proactive_auth)
324 {
325         char *low_speed_limit;
326         char *low_speed_time;
327
328         http_is_verbose = 0;
329
330         git_config(http_options, NULL);
331
332         curl_global_init(CURL_GLOBAL_ALL);
333
334         http_proactive_auth = proactive_auth;
335
336         if (remote && remote->http_proxy)
337                 curl_http_proxy = xstrdup(remote->http_proxy);
338
339         pragma_header = curl_slist_append(pragma_header, "Pragma: no-cache");
340         no_pragma_header = curl_slist_append(no_pragma_header, "Pragma:");
341
342 #ifdef USE_CURL_MULTI
343         {
344                 char *http_max_requests = getenv("GIT_HTTP_MAX_REQUESTS");
345                 if (http_max_requests != NULL)
346                         max_requests = atoi(http_max_requests);
347         }
348
349         curlm = curl_multi_init();
350         if (curlm == NULL) {
351                 fprintf(stderr, "Error creating curl multi handle.\n");
352                 exit(1);
353         }
354 #endif
355
356         if (getenv("GIT_SSL_NO_VERIFY"))
357                 curl_ssl_verify = 0;
358
359         set_from_env(&ssl_cert, "GIT_SSL_CERT");
360 #if LIBCURL_VERSION_NUM >= 0x070903
361         set_from_env(&ssl_key, "GIT_SSL_KEY");
362 #endif
363 #if LIBCURL_VERSION_NUM >= 0x070908
364         set_from_env(&ssl_capath, "GIT_SSL_CAPATH");
365 #endif
366         set_from_env(&ssl_cainfo, "GIT_SSL_CAINFO");
367
368         set_from_env(&user_agent, "GIT_HTTP_USER_AGENT");
369
370         low_speed_limit = getenv("GIT_HTTP_LOW_SPEED_LIMIT");
371         if (low_speed_limit != NULL)
372                 curl_low_speed_limit = strtol(low_speed_limit, NULL, 10);
373         low_speed_time = getenv("GIT_HTTP_LOW_SPEED_TIME");
374         if (low_speed_time != NULL)
375                 curl_low_speed_time = strtol(low_speed_time, NULL, 10);
376
377         if (curl_ssl_verify == -1)
378                 curl_ssl_verify = 1;
379
380         curl_session_count = 0;
381 #ifdef USE_CURL_MULTI
382         if (max_requests < 1)
383                 max_requests = DEFAULT_MAX_REQUESTS;
384 #endif
385
386         if (getenv("GIT_CURL_FTP_NO_EPSV"))
387                 curl_ftp_no_epsv = 1;
388
389         if (url) {
390                 credential_from_url(&http_auth, url);
391                 if (!ssl_cert_password_required &&
392                     getenv("GIT_SSL_CERT_PASSWORD_PROTECTED") &&
393                     !prefixcmp(url, "https://"))
394                         ssl_cert_password_required = 1;
395         }
396
397 #ifndef NO_CURL_EASY_DUPHANDLE
398         curl_default = get_curl_handle();
399 #endif
400 }
401
402 void http_cleanup(void)
403 {
404         struct active_request_slot *slot = active_queue_head;
405
406         while (slot != NULL) {
407                 struct active_request_slot *next = slot->next;
408                 if (slot->curl != NULL) {
409 #ifdef USE_CURL_MULTI
410                         curl_multi_remove_handle(curlm, slot->curl);
411 #endif
412                         curl_easy_cleanup(slot->curl);
413                 }
414                 free(slot);
415                 slot = next;
416         }
417         active_queue_head = NULL;
418
419 #ifndef NO_CURL_EASY_DUPHANDLE
420         curl_easy_cleanup(curl_default);
421 #endif
422
423 #ifdef USE_CURL_MULTI
424         curl_multi_cleanup(curlm);
425 #endif
426         curl_global_cleanup();
427
428         curl_slist_free_all(pragma_header);
429         pragma_header = NULL;
430
431         curl_slist_free_all(no_pragma_header);
432         no_pragma_header = NULL;
433
434         if (curl_http_proxy) {
435                 free((void *)curl_http_proxy);
436                 curl_http_proxy = NULL;
437         }
438
439         if (cert_auth.password != NULL) {
440                 memset(cert_auth.password, 0, strlen(cert_auth.password));
441                 free(cert_auth.password);
442                 cert_auth.password = NULL;
443         }
444         ssl_cert_password_required = 0;
445 }
446
447 struct active_request_slot *get_active_slot(void)
448 {
449         struct active_request_slot *slot = active_queue_head;
450         struct active_request_slot *newslot;
451
452 #ifdef USE_CURL_MULTI
453         int num_transfers;
454
455         /* Wait for a slot to open up if the queue is full */
456         while (active_requests >= max_requests) {
457                 curl_multi_perform(curlm, &num_transfers);
458                 if (num_transfers < active_requests)
459                         process_curl_messages();
460         }
461 #endif
462
463         while (slot != NULL && slot->in_use)
464                 slot = slot->next;
465
466         if (slot == NULL) {
467                 newslot = xmalloc(sizeof(*newslot));
468                 newslot->curl = NULL;
469                 newslot->in_use = 0;
470                 newslot->next = NULL;
471
472                 slot = active_queue_head;
473                 if (slot == NULL) {
474                         active_queue_head = newslot;
475                 } else {
476                         while (slot->next != NULL)
477                                 slot = slot->next;
478                         slot->next = newslot;
479                 }
480                 slot = newslot;
481         }
482
483         if (slot->curl == NULL) {
484 #ifdef NO_CURL_EASY_DUPHANDLE
485                 slot->curl = get_curl_handle();
486 #else
487                 slot->curl = curl_easy_duphandle(curl_default);
488 #endif
489                 curl_session_count++;
490         }
491
492         active_requests++;
493         slot->in_use = 1;
494         slot->results = NULL;
495         slot->finished = NULL;
496         slot->callback_data = NULL;
497         slot->callback_func = NULL;
498         curl_easy_setopt(slot->curl, CURLOPT_COOKIEFILE, curl_cookie_file);
499         curl_easy_setopt(slot->curl, CURLOPT_HTTPHEADER, pragma_header);
500         curl_easy_setopt(slot->curl, CURLOPT_ERRORBUFFER, curl_errorstr);
501         curl_easy_setopt(slot->curl, CURLOPT_CUSTOMREQUEST, NULL);
502         curl_easy_setopt(slot->curl, CURLOPT_READFUNCTION, NULL);
503         curl_easy_setopt(slot->curl, CURLOPT_WRITEFUNCTION, NULL);
504         curl_easy_setopt(slot->curl, CURLOPT_POSTFIELDS, NULL);
505         curl_easy_setopt(slot->curl, CURLOPT_UPLOAD, 0);
506         curl_easy_setopt(slot->curl, CURLOPT_HTTPGET, 1);
507         if (http_auth.password)
508                 init_curl_http_auth(slot->curl);
509
510         return slot;
511 }
512
/*
 * Start the transfer prepared on slot.  With the multi interface the
 * handle is added to the multi handle and given a first push; if it
 * cannot be added the slot is released again and 0 is returned.
 * Returns 1 on success (always, without the multi interface).
 */
int start_active_slot(struct active_request_slot *slot)
{
#ifdef USE_CURL_MULTI
	int num_transfers;
	CURLMcode rc = curl_multi_add_handle(curlm, slot->curl);

	if (rc == CURLM_OK || rc == CURLM_CALL_MULTI_PERFORM) {
		/*
		 * We know there must be something to do, since we just
		 * added something.
		 */
		curl_multi_perform(curlm, &num_transfers);
		return 1;
	}

	active_requests--;
	slot->in_use = 0;
	return 0;
#else
	return 1;
#endif
}
534
535 #ifdef USE_CURL_MULTI
/* One registered "fill" callback; entries are called in list order. */
struct fill_chain {
	void *data;
	int (*fill)(void *);
	struct fill_chain *next;
};

static struct fill_chain *fill_cfg;

/*
 * Register fill, to be called with data, at the end of the chain that
 * fill_active_slots() walks.
 */
void add_fill_function(void *data, int (*fill)(void *))
{
	struct fill_chain *entry = xmalloc(sizeof(*entry));
	struct fill_chain *tail;

	entry->data = data;
	entry->fill = fill;
	entry->next = NULL;

	if (!fill_cfg) {
		fill_cfg = entry;
		return;
	}

	for (tail = fill_cfg; tail->next; tail = tail->next)
		; /* find the last entry */
	tail->next = entry;
}
555
556 void fill_active_slots(void)
557 {
558         struct active_request_slot *slot = active_queue_head;
559
560         while (active_requests < max_requests) {
561                 struct fill_chain *fill;
562                 for (fill = fill_cfg; fill; fill = fill->next)
563                         if (fill->fill(fill->data))
564                                 break;
565
566                 if (!fill)
567                         break;
568         }
569
570         while (slot != NULL) {
571                 if (!slot->in_use && slot->curl != NULL
572                         && curl_session_count > min_curl_sessions) {
573                         curl_easy_cleanup(slot->curl);
574                         slot->curl = NULL;
575                         curl_session_count--;
576                 }
577                 slot = slot->next;
578         }
579 }
580
581 void step_active_slots(void)
582 {
583         int num_transfers;
584         CURLMcode curlm_result;
585
586         do {
587                 curlm_result = curl_multi_perform(curlm, &num_transfers);
588         } while (curlm_result == CURLM_CALL_MULTI_PERFORM);
589         if (num_transfers < active_requests) {
590                 process_curl_messages();
591                 fill_active_slots();
592         }
593 }
594 #endif
595
596 void run_active_slot(struct active_request_slot *slot)
597 {
598 #ifdef USE_CURL_MULTI
599         fd_set readfds;
600         fd_set writefds;
601         fd_set excfds;
602         int max_fd;
603         struct timeval select_timeout;
604         int finished = 0;
605
606         slot->finished = &finished;
607         while (!finished) {
608                 step_active_slots();
609
610                 if (slot->in_use) {
611 #if LIBCURL_VERSION_NUM >= 0x070f04
612                         long curl_timeout;
613                         curl_multi_timeout(curlm, &curl_timeout);
614                         if (curl_timeout == 0) {
615                                 continue;
616                         } else if (curl_timeout == -1) {
617                                 select_timeout.tv_sec  = 0;
618                                 select_timeout.tv_usec = 50000;
619                         } else {
620                                 select_timeout.tv_sec  =  curl_timeout / 1000;
621                                 select_timeout.tv_usec = (curl_timeout % 1000) * 1000;
622                         }
623 #else
624                         select_timeout.tv_sec  = 0;
625                         select_timeout.tv_usec = 50000;
626 #endif
627
628                         max_fd = -1;
629                         FD_ZERO(&readfds);
630                         FD_ZERO(&writefds);
631                         FD_ZERO(&excfds);
632                         curl_multi_fdset(curlm, &readfds, &writefds, &excfds, &max_fd);
633
634                         select(max_fd+1, &readfds, &writefds, &excfds, &select_timeout);
635                 }
636         }
637 #else
638         while (slot->in_use) {
639                 slot->curl_result = curl_easy_perform(slot->curl);
640                 finish_active_slot(slot);
641         }
642 #endif
643 }
644
645 static void closedown_active_slot(struct active_request_slot *slot)
646 {
647         active_requests--;
648         slot->in_use = 0;
649 }
650
651 static void release_active_slot(struct active_request_slot *slot)
652 {
653         closedown_active_slot(slot);
654         if (slot->curl && curl_session_count > min_curl_sessions) {
655 #ifdef USE_CURL_MULTI
656                 curl_multi_remove_handle(curlm, slot->curl);
657 #endif
658                 curl_easy_cleanup(slot->curl);
659                 slot->curl = NULL;
660                 curl_session_count--;
661         }
662 #ifdef USE_CURL_MULTI
663         fill_active_slots();
664 #endif
665 }
666
667 void finish_active_slot(struct active_request_slot *slot)
668 {
669         closedown_active_slot(slot);
670         curl_easy_getinfo(slot->curl, CURLINFO_HTTP_CODE, &slot->http_code);
671
672         if (slot->finished != NULL)
673                 (*slot->finished) = 1;
674
675         /* Store slot results so they can be read after the slot is reused */
676         if (slot->results != NULL) {
677                 slot->results->curl_result = slot->curl_result;
678                 slot->results->http_code = slot->http_code;
679         }
680
681         /* Run callback if appropriate */
682         if (slot->callback_func != NULL)
683                 slot->callback_func(slot->callback_data);
684 }
685
686 void finish_all_active_slots(void)
687 {
688         struct active_request_slot *slot = active_queue_head;
689
690         while (slot != NULL)
691                 if (slot->in_use) {
692                         run_active_slot(slot);
693                         slot = active_queue_head;
694                 } else {
695                         slot = slot->next;
696                 }
697 }
698
699 /* Helpers for modifying and creating URLs */
/*
 * Returns 0 for characters that go into a URL unescaped (ASCII
 * letters, digits, '/', '-' and '.') and 1 for everything else.
 */
static inline int needs_quote(int ch)
{
	int is_upper = ch >= 'A' && ch <= 'Z';
	int is_lower = ch >= 'a' && ch <= 'z';
	int is_digit = ch >= '0' && ch <= '9';

	switch (ch) {
	case '/':
	case '-':
	case '.':
		return 0;
	default:
		break;
	}

	return !(is_upper || is_lower || is_digit);
}
711
712 static char *quote_ref_url(const char *base, const char *ref)
713 {
714         struct strbuf buf = STRBUF_INIT;
715         const char *cp;
716         int ch;
717
718         end_url_with_slash(&buf, base);
719
720         for (cp = ref; (ch = *cp) != 0; cp++)
721                 if (needs_quote(ch))
722                         strbuf_addf(&buf, "%%%02x", ch);
723                 else
724                         strbuf_addch(&buf, *cp);
725
726         return strbuf_detach(&buf, NULL);
727 }
728
/*
 * Append the URL of a loose object to buf: url with a trailing slash,
 * "objects/", the first two characters of hex and a slash.  Unless
 * only_two_digit_prefix is set, the rest of hex follows.
 */
void append_remote_object_url(struct strbuf *buf, const char *url,
			      const char *hex,
			      int only_two_digit_prefix)
{
	end_url_with_slash(buf, url);

	strbuf_addf(buf, "objects/%.*s/", 2, hex);
	if (only_two_digit_prefix)
		return;
	strbuf_addstr(buf, hex + 2);
}
739
740 char *get_remote_object_url(const char *url, const char *hex,
741                             int only_two_digit_prefix)
742 {
743         struct strbuf buf = STRBUF_INIT;
744         append_remote_object_url(&buf, url, hex, only_two_digit_prefix);
745         return strbuf_detach(&buf, NULL);
746 }
747
748 /* http_request() targets */
749 #define HTTP_REQUEST_STRBUF     0
750 #define HTTP_REQUEST_FILE       1
751
752 static int http_request(const char *url, void *result, int target, int options)
753 {
754         struct active_request_slot *slot;
755         struct slot_results results;
756         struct curl_slist *headers = NULL;
757         struct strbuf buf = STRBUF_INIT;
758         int ret;
759
760         slot = get_active_slot();
761         slot->results = &results;
762         curl_easy_setopt(slot->curl, CURLOPT_HTTPGET, 1);
763
764         if (result == NULL) {
765                 curl_easy_setopt(slot->curl, CURLOPT_NOBODY, 1);
766         } else {
767                 curl_easy_setopt(slot->curl, CURLOPT_NOBODY, 0);
768                 curl_easy_setopt(slot->curl, CURLOPT_FILE, result);
769
770                 if (target == HTTP_REQUEST_FILE) {
771                         long posn = ftell(result);
772                         curl_easy_setopt(slot->curl, CURLOPT_WRITEFUNCTION,
773                                          fwrite);
774                         if (posn > 0) {
775                                 strbuf_addf(&buf, "Range: bytes=%ld-", posn);
776                                 headers = curl_slist_append(headers, buf.buf);
777                                 strbuf_reset(&buf);
778                         }
779                 } else
780                         curl_easy_setopt(slot->curl, CURLOPT_WRITEFUNCTION,
781                                          fwrite_buffer);
782         }
783
784         strbuf_addstr(&buf, "Pragma:");
785         if (options & HTTP_NO_CACHE)
786                 strbuf_addstr(&buf, " no-cache");
787
788         headers = curl_slist_append(headers, buf.buf);
789
790         curl_easy_setopt(slot->curl, CURLOPT_URL, url);
791         curl_easy_setopt(slot->curl, CURLOPT_HTTPHEADER, headers);
792
793         if (start_active_slot(slot)) {
794                 run_active_slot(slot);
795                 if (results.curl_result == CURLE_OK)
796                         ret = HTTP_OK;
797                 else if (missing_target(&results))
798                         ret = HTTP_MISSING_TARGET;
799                 else if (results.http_code == 401) {
800                         if (http_auth.username && http_auth.password) {
801                                 credential_reject(&http_auth);
802                                 ret = HTTP_NOAUTH;
803                         } else {
804                                 credential_fill(&http_auth);
805                                 init_curl_http_auth(slot->curl);
806                                 ret = HTTP_REAUTH;
807                         }
808                 } else {
809                         if (!curl_errorstr[0])
810                                 strlcpy(curl_errorstr,
811                                         curl_easy_strerror(results.curl_result),
812                                         sizeof(curl_errorstr));
813                         ret = HTTP_ERROR;
814                 }
815         } else {
816                 error("Unable to start HTTP request for %s", url);
817                 ret = HTTP_START_FAILED;
818         }
819
820         curl_slist_free_all(headers);
821         strbuf_release(&buf);
822
823         if (ret == HTTP_OK)
824                 credential_approve(&http_auth);
825
826         return ret;
827 }
828
829 static int http_request_reauth(const char *url, void *result, int target,
830                                int options)
831 {
832         int ret = http_request(url, result, target, options);
833         if (ret != HTTP_REAUTH)
834                 return ret;
835         return http_request(url, result, target, options);
836 }
837
838 int http_get_strbuf(const char *url, struct strbuf *result, int options)
839 {
840         return http_request_reauth(url, result, HTTP_REQUEST_STRBUF, options);
841 }
842
843 /*
844  * Downloads a URL and stores the result in the given file.
845  *
846  * If a previous interrupted download is detected (i.e. a previous temporary
847  * file is still around) the download is resumed.
848  */
849 static int http_get_file(const char *url, const char *filename, int options)
850 {
851         int ret;
852         struct strbuf tmpfile = STRBUF_INIT;
853         FILE *result;
854
855         strbuf_addf(&tmpfile, "%s.temp", filename);
856         result = fopen(tmpfile.buf, "a");
857         if (! result) {
858                 error("Unable to open local file %s", tmpfile.buf);
859                 ret = HTTP_ERROR;
860                 goto cleanup;
861         }
862
863         ret = http_request_reauth(url, result, HTTP_REQUEST_FILE, options);
864         fclose(result);
865
866         if ((ret == HTTP_OK) && move_temp_to_file(tmpfile.buf, filename))
867                 ret = HTTP_ERROR;
868 cleanup:
869         strbuf_release(&tmpfile);
870         return ret;
871 }
872
873 int http_error(const char *url, int ret)
874 {
875         /* http_request has already handled HTTP_START_FAILED. */
876         if (ret != HTTP_START_FAILED)
877                 error("%s while accessing %s", curl_errorstr, url);
878
879         return ret;
880 }
881
882 int http_fetch_ref(const char *base, struct ref *ref)
883 {
884         char *url;
885         struct strbuf buffer = STRBUF_INIT;
886         int ret = -1;
887
888         url = quote_ref_url(base, ref->name);
889         if (http_get_strbuf(url, &buffer, HTTP_NO_CACHE) == HTTP_OK) {
890                 strbuf_rtrim(&buffer);
891                 if (buffer.len == 40)
892                         ret = get_sha1_hex(buffer.buf, ref->old_sha1);
893                 else if (!prefixcmp(buffer.buf, "ref: ")) {
894                         ref->symref = xstrdup(buffer.buf + 5);
895                         ret = 0;
896                 }
897         }
898
899         strbuf_release(&buffer);
900         free(url);
901         return ret;
902 }
903
904 /* Helpers for fetching packs */
905 static char *fetch_pack_index(unsigned char *sha1, const char *base_url)
906 {
907         char *url, *tmp;
908         struct strbuf buf = STRBUF_INIT;
909
910         if (http_is_verbose)
911                 fprintf(stderr, "Getting index for pack %s\n", sha1_to_hex(sha1));
912
913         end_url_with_slash(&buf, base_url);
914         strbuf_addf(&buf, "objects/pack/pack-%s.idx", sha1_to_hex(sha1));
915         url = strbuf_detach(&buf, NULL);
916
917         strbuf_addf(&buf, "%s.temp", sha1_pack_index_name(sha1));
918         tmp = strbuf_detach(&buf, NULL);
919
920         if (http_get_file(url, tmp, 0) != HTTP_OK) {
921                 error("Unable to get pack index %s", url);
922                 free(tmp);
923                 tmp = NULL;
924         }
925
926         free(url);
927         return tmp;
928 }
929
930 static int fetch_and_setup_pack_index(struct packed_git **packs_head,
931         unsigned char *sha1, const char *base_url)
932 {
933         struct packed_git *new_pack;
934         char *tmp_idx = NULL;
935         int ret;
936
937         if (has_pack_index(sha1)) {
938                 new_pack = parse_pack_index(sha1, NULL);
939                 if (!new_pack)
940                         return -1; /* parse_pack_index() already issued error message */
941                 goto add_pack;
942         }
943
944         tmp_idx = fetch_pack_index(sha1, base_url);
945         if (!tmp_idx)
946                 return -1;
947
948         new_pack = parse_pack_index(sha1, tmp_idx);
949         if (!new_pack) {
950                 unlink(tmp_idx);
951                 free(tmp_idx);
952
953                 return -1; /* parse_pack_index() already issued error message */
954         }
955
956         ret = verify_pack_index(new_pack);
957         if (!ret) {
958                 close_pack_index(new_pack);
959                 ret = move_temp_to_file(tmp_idx, sha1_pack_index_name(sha1));
960         }
961         free(tmp_idx);
962         if (ret)
963                 return -1;
964
965 add_pack:
966         new_pack->next = *packs_head;
967         *packs_head = new_pack;
968         return 0;
969 }
970
971 int http_get_info_packs(const char *base_url, struct packed_git **packs_head)
972 {
973         int ret = 0, i = 0;
974         char *url, *data;
975         struct strbuf buf = STRBUF_INIT;
976         unsigned char sha1[20];
977
978         end_url_with_slash(&buf, base_url);
979         strbuf_addstr(&buf, "objects/info/packs");
980         url = strbuf_detach(&buf, NULL);
981
982         ret = http_get_strbuf(url, &buf, HTTP_NO_CACHE);
983         if (ret != HTTP_OK)
984                 goto cleanup;
985
986         data = buf.buf;
987         while (i < buf.len) {
988                 switch (data[i]) {
989                 case 'P':
990                         i++;
991                         if (i + 52 <= buf.len &&
992                             !prefixcmp(data + i, " pack-") &&
993                             !prefixcmp(data + i + 46, ".pack\n")) {
994                                 get_sha1_hex(data + i + 6, sha1);
995                                 fetch_and_setup_pack_index(packs_head, sha1,
996                                                       base_url);
997                                 i += 51;
998                                 break;
999                         }
1000                 default:
1001                         while (i < buf.len && data[i] != '\n')
1002                                 i++;
1003                 }
1004                 i++;
1005         }
1006
1007 cleanup:
1008         free(url);
1009         return ret;
1010 }
1011
1012 void release_http_pack_request(struct http_pack_request *preq)
1013 {
1014         if (preq->packfile != NULL) {
1015                 fclose(preq->packfile);
1016                 preq->packfile = NULL;
1017         }
1018         if (preq->range_header != NULL) {
1019                 curl_slist_free_all(preq->range_header);
1020                 preq->range_header = NULL;
1021         }
1022         preq->slot = NULL;
1023         free(preq->url);
1024 }
1025
1026 int finish_http_pack_request(struct http_pack_request *preq)
1027 {
1028         struct packed_git **lst;
1029         struct packed_git *p = preq->target;
1030         char *tmp_idx;
1031         struct child_process ip;
1032         const char *ip_argv[8];
1033
1034         close_pack_index(p);
1035
1036         fclose(preq->packfile);
1037         preq->packfile = NULL;
1038
1039         lst = preq->lst;
1040         while (*lst != p)
1041                 lst = &((*lst)->next);
1042         *lst = (*lst)->next;
1043
1044         tmp_idx = xstrdup(preq->tmpfile);
1045         strcpy(tmp_idx + strlen(tmp_idx) - strlen(".pack.temp"),
1046                ".idx.temp");
1047
1048         ip_argv[0] = "index-pack";
1049         ip_argv[1] = "-o";
1050         ip_argv[2] = tmp_idx;
1051         ip_argv[3] = preq->tmpfile;
1052         ip_argv[4] = NULL;
1053
1054         memset(&ip, 0, sizeof(ip));
1055         ip.argv = ip_argv;
1056         ip.git_cmd = 1;
1057         ip.no_stdin = 1;
1058         ip.no_stdout = 1;
1059
1060         if (run_command(&ip)) {
1061                 unlink(preq->tmpfile);
1062                 unlink(tmp_idx);
1063                 free(tmp_idx);
1064                 return -1;
1065         }
1066
1067         unlink(sha1_pack_index_name(p->sha1));
1068
1069         if (move_temp_to_file(preq->tmpfile, sha1_pack_name(p->sha1))
1070          || move_temp_to_file(tmp_idx, sha1_pack_index_name(p->sha1))) {
1071                 free(tmp_idx);
1072                 return -1;
1073         }
1074
1075         install_packed_git(p);
1076         free(tmp_idx);
1077         return 0;
1078 }
1079
1080 struct http_pack_request *new_http_pack_request(
1081         struct packed_git *target, const char *base_url)
1082 {
1083         long prev_posn = 0;
1084         char range[RANGE_HEADER_SIZE];
1085         struct strbuf buf = STRBUF_INIT;
1086         struct http_pack_request *preq;
1087
1088         preq = xcalloc(1, sizeof(*preq));
1089         preq->target = target;
1090
1091         end_url_with_slash(&buf, base_url);
1092         strbuf_addf(&buf, "objects/pack/pack-%s.pack",
1093                 sha1_to_hex(target->sha1));
1094         preq->url = strbuf_detach(&buf, NULL);
1095
1096         snprintf(preq->tmpfile, sizeof(preq->tmpfile), "%s.temp",
1097                 sha1_pack_name(target->sha1));
1098         preq->packfile = fopen(preq->tmpfile, "a");
1099         if (!preq->packfile) {
1100                 error("Unable to open local file %s for pack",
1101                       preq->tmpfile);
1102                 goto abort;
1103         }
1104
1105         preq->slot = get_active_slot();
1106         curl_easy_setopt(preq->slot->curl, CURLOPT_FILE, preq->packfile);
1107         curl_easy_setopt(preq->slot->curl, CURLOPT_WRITEFUNCTION, fwrite);
1108         curl_easy_setopt(preq->slot->curl, CURLOPT_URL, preq->url);
1109         curl_easy_setopt(preq->slot->curl, CURLOPT_HTTPHEADER,
1110                 no_pragma_header);
1111
1112         /*
1113          * If there is data present from a previous transfer attempt,
1114          * resume where it left off
1115          */
1116         prev_posn = ftell(preq->packfile);
1117         if (prev_posn>0) {
1118                 if (http_is_verbose)
1119                         fprintf(stderr,
1120                                 "Resuming fetch of pack %s at byte %ld\n",
1121                                 sha1_to_hex(target->sha1), prev_posn);
1122                 sprintf(range, "Range: bytes=%ld-", prev_posn);
1123                 preq->range_header = curl_slist_append(NULL, range);
1124                 curl_easy_setopt(preq->slot->curl, CURLOPT_HTTPHEADER,
1125                         preq->range_header);
1126         }
1127
1128         return preq;
1129
1130 abort:
1131         free(preq->url);
1132         free(preq);
1133         return NULL;
1134 }
1135
1136 /* Helpers for fetching objects (loose) */
1137 static size_t fwrite_sha1_file(char *ptr, size_t eltsize, size_t nmemb,
1138                                void *data)
1139 {
1140         unsigned char expn[4096];
1141         size_t size = eltsize * nmemb;
1142         int posn = 0;
1143         struct http_object_request *freq =
1144                 (struct http_object_request *)data;
1145         do {
1146                 ssize_t retval = xwrite(freq->localfile,
1147                                         (char *) ptr + posn, size - posn);
1148                 if (retval < 0)
1149                         return posn;
1150                 posn += retval;
1151         } while (posn < size);
1152
1153         freq->stream.avail_in = size;
1154         freq->stream.next_in = (void *)ptr;
1155         do {
1156                 freq->stream.next_out = expn;
1157                 freq->stream.avail_out = sizeof(expn);
1158                 freq->zret = git_inflate(&freq->stream, Z_SYNC_FLUSH);
1159                 git_SHA1_Update(&freq->c, expn,
1160                                 sizeof(expn) - freq->stream.avail_out);
1161         } while (freq->stream.avail_in && freq->zret == Z_OK);
1162         return size;
1163 }
1164
1165 struct http_object_request *new_http_object_request(const char *base_url,
1166         unsigned char *sha1)
1167 {
1168         char *hex = sha1_to_hex(sha1);
1169         char *filename;
1170         char prevfile[PATH_MAX];
1171         int prevlocal;
1172         char prev_buf[PREV_BUF_SIZE];
1173         ssize_t prev_read = 0;
1174         long prev_posn = 0;
1175         char range[RANGE_HEADER_SIZE];
1176         struct curl_slist *range_header = NULL;
1177         struct http_object_request *freq;
1178
1179         freq = xcalloc(1, sizeof(*freq));
1180         hashcpy(freq->sha1, sha1);
1181         freq->localfile = -1;
1182
1183         filename = sha1_file_name(sha1);
1184         snprintf(freq->tmpfile, sizeof(freq->tmpfile),
1185                  "%s.temp", filename);
1186
1187         snprintf(prevfile, sizeof(prevfile), "%s.prev", filename);
1188         unlink_or_warn(prevfile);
1189         rename(freq->tmpfile, prevfile);
1190         unlink_or_warn(freq->tmpfile);
1191
1192         if (freq->localfile != -1)
1193                 error("fd leakage in start: %d", freq->localfile);
1194         freq->localfile = open(freq->tmpfile,
1195                                O_WRONLY | O_CREAT | O_EXCL, 0666);
1196         /*
1197          * This could have failed due to the "lazy directory creation";
1198          * try to mkdir the last path component.
1199          */
1200         if (freq->localfile < 0 && errno == ENOENT) {
1201                 char *dir = strrchr(freq->tmpfile, '/');
1202                 if (dir) {
1203                         *dir = 0;
1204                         mkdir(freq->tmpfile, 0777);
1205                         *dir = '/';
1206                 }
1207                 freq->localfile = open(freq->tmpfile,
1208                                        O_WRONLY | O_CREAT | O_EXCL, 0666);
1209         }
1210
1211         if (freq->localfile < 0) {
1212                 error("Couldn't create temporary file %s: %s",
1213                       freq->tmpfile, strerror(errno));
1214                 goto abort;
1215         }
1216
1217         git_inflate_init(&freq->stream);
1218
1219         git_SHA1_Init(&freq->c);
1220
1221         freq->url = get_remote_object_url(base_url, hex, 0);
1222
1223         /*
1224          * If a previous temp file is present, process what was already
1225          * fetched.
1226          */
1227         prevlocal = open(prevfile, O_RDONLY);
1228         if (prevlocal != -1) {
1229                 do {
1230                         prev_read = xread(prevlocal, prev_buf, PREV_BUF_SIZE);
1231                         if (prev_read>0) {
1232                                 if (fwrite_sha1_file(prev_buf,
1233                                                      1,
1234                                                      prev_read,
1235                                                      freq) == prev_read) {
1236                                         prev_posn += prev_read;
1237                                 } else {
1238                                         prev_read = -1;
1239                                 }
1240                         }
1241                 } while (prev_read > 0);
1242                 close(prevlocal);
1243         }
1244         unlink_or_warn(prevfile);
1245
1246         /*
1247          * Reset inflate/SHA1 if there was an error reading the previous temp
1248          * file; also rewind to the beginning of the local file.
1249          */
1250         if (prev_read == -1) {
1251                 memset(&freq->stream, 0, sizeof(freq->stream));
1252                 git_inflate_init(&freq->stream);
1253                 git_SHA1_Init(&freq->c);
1254                 if (prev_posn>0) {
1255                         prev_posn = 0;
1256                         lseek(freq->localfile, 0, SEEK_SET);
1257                         if (ftruncate(freq->localfile, 0) < 0) {
1258                                 error("Couldn't truncate temporary file %s: %s",
1259                                           freq->tmpfile, strerror(errno));
1260                                 goto abort;
1261                         }
1262                 }
1263         }
1264
1265         freq->slot = get_active_slot();
1266
1267         curl_easy_setopt(freq->slot->curl, CURLOPT_FILE, freq);
1268         curl_easy_setopt(freq->slot->curl, CURLOPT_WRITEFUNCTION, fwrite_sha1_file);
1269         curl_easy_setopt(freq->slot->curl, CURLOPT_ERRORBUFFER, freq->errorstr);
1270         curl_easy_setopt(freq->slot->curl, CURLOPT_URL, freq->url);
1271         curl_easy_setopt(freq->slot->curl, CURLOPT_HTTPHEADER, no_pragma_header);
1272
1273         /*
1274          * If we have successfully processed data from a previous fetch
1275          * attempt, only fetch the data we don't already have.
1276          */
1277         if (prev_posn>0) {
1278                 if (http_is_verbose)
1279                         fprintf(stderr,
1280                                 "Resuming fetch of object %s at byte %ld\n",
1281                                 hex, prev_posn);
1282                 sprintf(range, "Range: bytes=%ld-", prev_posn);
1283                 range_header = curl_slist_append(range_header, range);
1284                 curl_easy_setopt(freq->slot->curl,
1285                                  CURLOPT_HTTPHEADER, range_header);
1286         }
1287
1288         return freq;
1289
1290 abort:
1291         free(freq->url);
1292         free(freq);
1293         return NULL;
1294 }
1295
1296 void process_http_object_request(struct http_object_request *freq)
1297 {
1298         if (freq->slot == NULL)
1299                 return;
1300         freq->curl_result = freq->slot->curl_result;
1301         freq->http_code = freq->slot->http_code;
1302         freq->slot = NULL;
1303 }
1304
1305 int finish_http_object_request(struct http_object_request *freq)
1306 {
1307         struct stat st;
1308
1309         close(freq->localfile);
1310         freq->localfile = -1;
1311
1312         process_http_object_request(freq);
1313
1314         if (freq->http_code == 416) {
1315                 warning("requested range invalid; we may already have all the data.");
1316         } else if (freq->curl_result != CURLE_OK) {
1317                 if (stat(freq->tmpfile, &st) == 0)
1318                         if (st.st_size == 0)
1319                                 unlink_or_warn(freq->tmpfile);
1320                 return -1;
1321         }
1322
1323         git_inflate_end(&freq->stream);
1324         git_SHA1_Final(freq->real_sha1, &freq->c);
1325         if (freq->zret != Z_STREAM_END) {
1326                 unlink_or_warn(freq->tmpfile);
1327                 return -1;
1328         }
1329         if (hashcmp(freq->sha1, freq->real_sha1)) {
1330                 unlink_or_warn(freq->tmpfile);
1331                 return -1;
1332         }
1333         freq->rename =
1334                 move_temp_to_file(freq->tmpfile, sha1_file_name(freq->sha1));
1335
1336         return freq->rename;
1337 }
1338
1339 void abort_http_object_request(struct http_object_request *freq)
1340 {
1341         unlink_or_warn(freq->tmpfile);
1342
1343         release_http_object_request(freq);
1344 }
1345
1346 void release_http_object_request(struct http_object_request *freq)
1347 {
1348         if (freq->localfile != -1) {
1349                 close(freq->localfile);
1350                 freq->localfile = -1;
1351         }
1352         if (freq->url != NULL) {
1353                 free(freq->url);
1354                 freq->url = NULL;
1355         }
1356         if (freq->slot != NULL) {
1357                 freq->slot->callback_func = NULL;
1358                 freq->slot->callback_data = NULL;
1359                 release_active_slot(freq->slot);
1360                 freq->slot = NULL;
1361         }
1362 }