Merge branch 'rt/maint-clone-single'
[git.git] / http.c
1 #include "http.h"
2 #include "pack.h"
3 #include "sideband.h"
4 #include "run-command.h"
5 #include "url.h"
6 #include "credential.h"
7 #include "version.h"
8
9 int active_requests;
10 int http_is_verbose;
11 size_t http_post_buffer = 16 * LARGE_PACKET_MAX;
12
13 #if LIBCURL_VERSION_NUM >= 0x070a06
14 #define LIBCURL_CAN_HANDLE_AUTH_ANY
15 #endif
16
17 static int min_curl_sessions = 1;
18 static int curl_session_count;
19 #ifdef USE_CURL_MULTI
20 static int max_requests = -1;
21 static CURLM *curlm;
22 #endif
23 #ifndef NO_CURL_EASY_DUPHANDLE
24 static CURL *curl_default;
25 #endif
26
27 #define PREV_BUF_SIZE 4096
28 #define RANGE_HEADER_SIZE 30
29
30 char curl_errorstr[CURL_ERROR_SIZE];
31
32 static int curl_ssl_verify = -1;
33 static const char *ssl_cert;
34 #if LIBCURL_VERSION_NUM >= 0x070903
35 static const char *ssl_key;
36 #endif
37 #if LIBCURL_VERSION_NUM >= 0x070908
38 static const char *ssl_capath;
39 #endif
40 static const char *ssl_cainfo;
41 static long curl_low_speed_limit = -1;
42 static long curl_low_speed_time = -1;
43 static int curl_ftp_no_epsv;
44 static const char *curl_http_proxy;
45 static const char *curl_cookie_file;
46 static struct credential http_auth = CREDENTIAL_INIT;
47 static int http_proactive_auth;
48 static const char *user_agent;
49
50 #if LIBCURL_VERSION_NUM >= 0x071700
51 /* Use CURLOPT_KEYPASSWD as is */
52 #elif LIBCURL_VERSION_NUM >= 0x070903
53 #define CURLOPT_KEYPASSWD CURLOPT_SSLKEYPASSWD
54 #else
55 #define CURLOPT_KEYPASSWD CURLOPT_SSLCERTPASSWD
56 #endif
57
58 static struct credential cert_auth = CREDENTIAL_INIT;
59 static int ssl_cert_password_required;
60
61 static struct curl_slist *pragma_header;
62 static struct curl_slist *no_pragma_header;
63
64 static struct active_request_slot *active_queue_head;
65
66 size_t fread_buffer(char *ptr, size_t eltsize, size_t nmemb, void *buffer_)
67 {
68         size_t size = eltsize * nmemb;
69         struct buffer *buffer = buffer_;
70
71         if (size > buffer->buf.len - buffer->posn)
72                 size = buffer->buf.len - buffer->posn;
73         memcpy(ptr, buffer->buf.buf + buffer->posn, size);
74         buffer->posn += size;
75
76         return size;
77 }
78
79 #ifndef NO_CURL_IOCTL
80 curlioerr ioctl_buffer(CURL *handle, int cmd, void *clientp)
81 {
82         struct buffer *buffer = clientp;
83
84         switch (cmd) {
85         case CURLIOCMD_NOP:
86                 return CURLIOE_OK;
87
88         case CURLIOCMD_RESTARTREAD:
89                 buffer->posn = 0;
90                 return CURLIOE_OK;
91
92         default:
93                 return CURLIOE_UNKNOWNCMD;
94         }
95 }
96 #endif
97
/*
 * Write callback: append eltsize * nmemb bytes from ptr to the strbuf
 * passed as buffer_ and return that byte count.
 */
size_t fwrite_buffer(char *ptr, size_t eltsize, size_t nmemb, void *buffer_)
{
	struct strbuf *out = buffer_;
	size_t nbytes = eltsize * nmemb;

	strbuf_add(out, ptr, nbytes);
	return nbytes;
}
106
/*
 * Write callback that discards its input: nothing is stored, and the full
 * byte count (eltsize * nmemb) is returned.
 */
size_t fwrite_null(char *ptr, size_t eltsize, size_t nmemb, void *strbuf)
{
	size_t discarded = eltsize * nmemb;

	return discarded;
}
111
112 #ifdef USE_CURL_MULTI
113 static void process_curl_messages(void)
114 {
115         int num_messages;
116         struct active_request_slot *slot;
117         CURLMsg *curl_message = curl_multi_info_read(curlm, &num_messages);
118
119         while (curl_message != NULL) {
120                 if (curl_message->msg == CURLMSG_DONE) {
121                         int curl_result = curl_message->data.result;
122                         slot = active_queue_head;
123                         while (slot != NULL &&
124                                slot->curl != curl_message->easy_handle)
125                                 slot = slot->next;
126                         if (slot != NULL) {
127                                 curl_multi_remove_handle(curlm, slot->curl);
128                                 slot->curl_result = curl_result;
129                                 finish_active_slot(slot);
130                         } else {
131                                 fprintf(stderr, "Received DONE message for unknown request!\n");
132                         }
133                 } else {
134                         fprintf(stderr, "Unknown CURL message received: %d\n",
135                                 (int)curl_message->msg);
136                 }
137                 curl_message = curl_multi_info_read(curlm, &num_messages);
138         }
139 }
140 #endif
141
142 static int http_options(const char *var, const char *value, void *cb)
143 {
144         if (!strcmp("http.sslverify", var)) {
145                 curl_ssl_verify = git_config_bool(var, value);
146                 return 0;
147         }
148         if (!strcmp("http.sslcert", var))
149                 return git_config_string(&ssl_cert, var, value);
150 #if LIBCURL_VERSION_NUM >= 0x070903
151         if (!strcmp("http.sslkey", var))
152                 return git_config_string(&ssl_key, var, value);
153 #endif
154 #if LIBCURL_VERSION_NUM >= 0x070908
155         if (!strcmp("http.sslcapath", var))
156                 return git_config_string(&ssl_capath, var, value);
157 #endif
158         if (!strcmp("http.sslcainfo", var))
159                 return git_config_string(&ssl_cainfo, var, value);
160         if (!strcmp("http.sslcertpasswordprotected", var)) {
161                 if (git_config_bool(var, value))
162                         ssl_cert_password_required = 1;
163                 return 0;
164         }
165         if (!strcmp("http.minsessions", var)) {
166                 min_curl_sessions = git_config_int(var, value);
167 #ifndef USE_CURL_MULTI
168                 if (min_curl_sessions > 1)
169                         min_curl_sessions = 1;
170 #endif
171                 return 0;
172         }
173 #ifdef USE_CURL_MULTI
174         if (!strcmp("http.maxrequests", var)) {
175                 max_requests = git_config_int(var, value);
176                 return 0;
177         }
178 #endif
179         if (!strcmp("http.lowspeedlimit", var)) {
180                 curl_low_speed_limit = (long)git_config_int(var, value);
181                 return 0;
182         }
183         if (!strcmp("http.lowspeedtime", var)) {
184                 curl_low_speed_time = (long)git_config_int(var, value);
185                 return 0;
186         }
187
188         if (!strcmp("http.noepsv", var)) {
189                 curl_ftp_no_epsv = git_config_bool(var, value);
190                 return 0;
191         }
192         if (!strcmp("http.proxy", var))
193                 return git_config_string(&curl_http_proxy, var, value);
194
195         if (!strcmp("http.cookiefile", var))
196                 return git_config_string(&curl_cookie_file, var, value);
197
198         if (!strcmp("http.postbuffer", var)) {
199                 http_post_buffer = git_config_int(var, value);
200                 if (http_post_buffer < LARGE_PACKET_MAX)
201                         http_post_buffer = LARGE_PACKET_MAX;
202                 return 0;
203         }
204
205         if (!strcmp("http.useragent", var))
206                 return git_config_string(&user_agent, var, value);
207
208         /* Fall back on the default ones */
209         return git_default_config(var, value, cb);
210 }
211
212 static void init_curl_http_auth(CURL *result)
213 {
214         if (!http_auth.username)
215                 return;
216
217         credential_fill(&http_auth);
218
219 #if LIBCURL_VERSION_NUM >= 0x071301
220         curl_easy_setopt(result, CURLOPT_USERNAME, http_auth.username);
221         curl_easy_setopt(result, CURLOPT_PASSWORD, http_auth.password);
222 #else
223         {
224                 static struct strbuf up = STRBUF_INIT;
225                 strbuf_reset(&up);
226                 strbuf_addf(&up, "%s:%s",
227                             http_auth.username, http_auth.password);
228                 curl_easy_setopt(result, CURLOPT_USERPWD, up.buf);
229         }
230 #endif
231 }
232
233 static int has_cert_password(void)
234 {
235         if (ssl_cert == NULL || ssl_cert_password_required != 1)
236                 return 0;
237         if (!cert_auth.password) {
238                 cert_auth.protocol = xstrdup("cert");
239                 cert_auth.path = xstrdup(ssl_cert);
240                 credential_fill(&cert_auth);
241         }
242         return 1;
243 }
244
245 static CURL *get_curl_handle(void)
246 {
247         CURL *result = curl_easy_init();
248
249         if (!curl_ssl_verify) {
250                 curl_easy_setopt(result, CURLOPT_SSL_VERIFYPEER, 0);
251                 curl_easy_setopt(result, CURLOPT_SSL_VERIFYHOST, 0);
252         } else {
253                 /* Verify authenticity of the peer's certificate */
254                 curl_easy_setopt(result, CURLOPT_SSL_VERIFYPEER, 1);
255                 /* The name in the cert must match whom we tried to connect */
256                 curl_easy_setopt(result, CURLOPT_SSL_VERIFYHOST, 2);
257         }
258
259 #if LIBCURL_VERSION_NUM >= 0x070907
260         curl_easy_setopt(result, CURLOPT_NETRC, CURL_NETRC_OPTIONAL);
261 #endif
262 #ifdef LIBCURL_CAN_HANDLE_AUTH_ANY
263         curl_easy_setopt(result, CURLOPT_HTTPAUTH, CURLAUTH_ANY);
264 #endif
265
266         if (http_proactive_auth)
267                 init_curl_http_auth(result);
268
269         if (ssl_cert != NULL)
270                 curl_easy_setopt(result, CURLOPT_SSLCERT, ssl_cert);
271         if (has_cert_password())
272                 curl_easy_setopt(result, CURLOPT_KEYPASSWD, cert_auth.password);
273 #if LIBCURL_VERSION_NUM >= 0x070903
274         if (ssl_key != NULL)
275                 curl_easy_setopt(result, CURLOPT_SSLKEY, ssl_key);
276 #endif
277 #if LIBCURL_VERSION_NUM >= 0x070908
278         if (ssl_capath != NULL)
279                 curl_easy_setopt(result, CURLOPT_CAPATH, ssl_capath);
280 #endif
281         if (ssl_cainfo != NULL)
282                 curl_easy_setopt(result, CURLOPT_CAINFO, ssl_cainfo);
283         curl_easy_setopt(result, CURLOPT_FAILONERROR, 1);
284
285         if (curl_low_speed_limit > 0 && curl_low_speed_time > 0) {
286                 curl_easy_setopt(result, CURLOPT_LOW_SPEED_LIMIT,
287                                  curl_low_speed_limit);
288                 curl_easy_setopt(result, CURLOPT_LOW_SPEED_TIME,
289                                  curl_low_speed_time);
290         }
291
292         curl_easy_setopt(result, CURLOPT_FOLLOWLOCATION, 1);
293 #if LIBCURL_VERSION_NUM >= 0x071301
294         curl_easy_setopt(result, CURLOPT_POSTREDIR, CURL_REDIR_POST_ALL);
295 #elif LIBCURL_VERSION_NUM >= 0x071101
296         curl_easy_setopt(result, CURLOPT_POST301, 1);
297 #endif
298
299         if (getenv("GIT_CURL_VERBOSE"))
300                 curl_easy_setopt(result, CURLOPT_VERBOSE, 1);
301
302         curl_easy_setopt(result, CURLOPT_USERAGENT,
303                 user_agent ? user_agent : git_user_agent());
304
305         if (curl_ftp_no_epsv)
306                 curl_easy_setopt(result, CURLOPT_FTP_USE_EPSV, 0);
307
308         if (curl_http_proxy) {
309                 curl_easy_setopt(result, CURLOPT_PROXY, curl_http_proxy);
310                 curl_easy_setopt(result, CURLOPT_PROXYAUTH, CURLAUTH_ANY);
311         }
312
313         return result;
314 }
315
/*
 * Point *var at the value of environment variable envname if it is set;
 * leave *var untouched otherwise.
 */
static void set_from_env(const char **var, const char *envname)
{
	const char *from_env = getenv(envname);

	if (!from_env)
		return;
	*var = from_env;
}
322
323 void http_init(struct remote *remote, const char *url, int proactive_auth)
324 {
325         char *low_speed_limit;
326         char *low_speed_time;
327
328         http_is_verbose = 0;
329
330         git_config(http_options, NULL);
331
332         curl_global_init(CURL_GLOBAL_ALL);
333
334         http_proactive_auth = proactive_auth;
335
336         if (remote && remote->http_proxy)
337                 curl_http_proxy = xstrdup(remote->http_proxy);
338
339         pragma_header = curl_slist_append(pragma_header, "Pragma: no-cache");
340         no_pragma_header = curl_slist_append(no_pragma_header, "Pragma:");
341
342 #ifdef USE_CURL_MULTI
343         {
344                 char *http_max_requests = getenv("GIT_HTTP_MAX_REQUESTS");
345                 if (http_max_requests != NULL)
346                         max_requests = atoi(http_max_requests);
347         }
348
349         curlm = curl_multi_init();
350         if (curlm == NULL) {
351                 fprintf(stderr, "Error creating curl multi handle.\n");
352                 exit(1);
353         }
354 #endif
355
356         if (getenv("GIT_SSL_NO_VERIFY"))
357                 curl_ssl_verify = 0;
358
359         set_from_env(&ssl_cert, "GIT_SSL_CERT");
360 #if LIBCURL_VERSION_NUM >= 0x070903
361         set_from_env(&ssl_key, "GIT_SSL_KEY");
362 #endif
363 #if LIBCURL_VERSION_NUM >= 0x070908
364         set_from_env(&ssl_capath, "GIT_SSL_CAPATH");
365 #endif
366         set_from_env(&ssl_cainfo, "GIT_SSL_CAINFO");
367
368         set_from_env(&user_agent, "GIT_HTTP_USER_AGENT");
369
370         low_speed_limit = getenv("GIT_HTTP_LOW_SPEED_LIMIT");
371         if (low_speed_limit != NULL)
372                 curl_low_speed_limit = strtol(low_speed_limit, NULL, 10);
373         low_speed_time = getenv("GIT_HTTP_LOW_SPEED_TIME");
374         if (low_speed_time != NULL)
375                 curl_low_speed_time = strtol(low_speed_time, NULL, 10);
376
377         if (curl_ssl_verify == -1)
378                 curl_ssl_verify = 1;
379
380         curl_session_count = 0;
381 #ifdef USE_CURL_MULTI
382         if (max_requests < 1)
383                 max_requests = DEFAULT_MAX_REQUESTS;
384 #endif
385
386         if (getenv("GIT_CURL_FTP_NO_EPSV"))
387                 curl_ftp_no_epsv = 1;
388
389         if (url) {
390                 credential_from_url(&http_auth, url);
391                 if (!ssl_cert_password_required &&
392                     getenv("GIT_SSL_CERT_PASSWORD_PROTECTED") &&
393                     !prefixcmp(url, "https://"))
394                         ssl_cert_password_required = 1;
395         }
396
397 #ifndef NO_CURL_EASY_DUPHANDLE
398         curl_default = get_curl_handle();
399 #endif
400 }
401
402 void http_cleanup(void)
403 {
404         struct active_request_slot *slot = active_queue_head;
405
406         while (slot != NULL) {
407                 struct active_request_slot *next = slot->next;
408                 if (slot->curl != NULL) {
409 #ifdef USE_CURL_MULTI
410                         curl_multi_remove_handle(curlm, slot->curl);
411 #endif
412                         curl_easy_cleanup(slot->curl);
413                 }
414                 free(slot);
415                 slot = next;
416         }
417         active_queue_head = NULL;
418
419 #ifndef NO_CURL_EASY_DUPHANDLE
420         curl_easy_cleanup(curl_default);
421 #endif
422
423 #ifdef USE_CURL_MULTI
424         curl_multi_cleanup(curlm);
425 #endif
426         curl_global_cleanup();
427
428         curl_slist_free_all(pragma_header);
429         pragma_header = NULL;
430
431         curl_slist_free_all(no_pragma_header);
432         no_pragma_header = NULL;
433
434         if (curl_http_proxy) {
435                 free((void *)curl_http_proxy);
436                 curl_http_proxy = NULL;
437         }
438
439         if (cert_auth.password != NULL) {
440                 memset(cert_auth.password, 0, strlen(cert_auth.password));
441                 free(cert_auth.password);
442                 cert_auth.password = NULL;
443         }
444         ssl_cert_password_required = 0;
445 }
446
447 struct active_request_slot *get_active_slot(void)
448 {
449         struct active_request_slot *slot = active_queue_head;
450         struct active_request_slot *newslot;
451
452 #ifdef USE_CURL_MULTI
453         int num_transfers;
454
455         /* Wait for a slot to open up if the queue is full */
456         while (active_requests >= max_requests) {
457                 curl_multi_perform(curlm, &num_transfers);
458                 if (num_transfers < active_requests)
459                         process_curl_messages();
460         }
461 #endif
462
463         while (slot != NULL && slot->in_use)
464                 slot = slot->next;
465
466         if (slot == NULL) {
467                 newslot = xmalloc(sizeof(*newslot));
468                 newslot->curl = NULL;
469                 newslot->in_use = 0;
470                 newslot->next = NULL;
471
472                 slot = active_queue_head;
473                 if (slot == NULL) {
474                         active_queue_head = newslot;
475                 } else {
476                         while (slot->next != NULL)
477                                 slot = slot->next;
478                         slot->next = newslot;
479                 }
480                 slot = newslot;
481         }
482
483         if (slot->curl == NULL) {
484 #ifdef NO_CURL_EASY_DUPHANDLE
485                 slot->curl = get_curl_handle();
486 #else
487                 slot->curl = curl_easy_duphandle(curl_default);
488 #endif
489                 curl_session_count++;
490         }
491
492         active_requests++;
493         slot->in_use = 1;
494         slot->results = NULL;
495         slot->finished = NULL;
496         slot->callback_data = NULL;
497         slot->callback_func = NULL;
498         curl_easy_setopt(slot->curl, CURLOPT_COOKIEFILE, curl_cookie_file);
499         curl_easy_setopt(slot->curl, CURLOPT_HTTPHEADER, pragma_header);
500         curl_easy_setopt(slot->curl, CURLOPT_ERRORBUFFER, curl_errorstr);
501         curl_easy_setopt(slot->curl, CURLOPT_CUSTOMREQUEST, NULL);
502         curl_easy_setopt(slot->curl, CURLOPT_READFUNCTION, NULL);
503         curl_easy_setopt(slot->curl, CURLOPT_WRITEFUNCTION, NULL);
504         curl_easy_setopt(slot->curl, CURLOPT_POSTFIELDS, NULL);
505         curl_easy_setopt(slot->curl, CURLOPT_UPLOAD, 0);
506         curl_easy_setopt(slot->curl, CURLOPT_HTTPGET, 1);
507         if (http_auth.password)
508                 init_curl_http_auth(slot->curl);
509
510         return slot;
511 }
512
/*
 * Start the request prepared in slot.  With the multi interface the easy
 * handle is added to the multi handle and curl is driven once; if adding
 * fails the slot is released again and 0 is returned.  Returns 1
 * otherwise (always, when the multi interface is not compiled in).
 */
int start_active_slot(struct active_request_slot *slot)
{
#ifdef USE_CURL_MULTI
	int num_transfers;
	CURLMcode added = curl_multi_add_handle(curlm, slot->curl);

	switch (added) {
	case CURLM_OK:
	case CURLM_CALL_MULTI_PERFORM:
		break;
	default:
		active_requests--;
		slot->in_use = 0;
		return 0;
	}

	/*
	 * We know there must be something to do, since we just added
	 * something.
	 */
	curl_multi_perform(curlm, &num_transfers);
#endif
	return 1;
}
534
535 #ifdef USE_CURL_MULTI
/* One registered fill callback together with its argument. */
struct fill_chain {
	void *data;
	int (*fill)(void *);
	struct fill_chain *next;
};

/* Registered fill callbacks, in registration order. */
static struct fill_chain *fill_cfg;

/*
 * Register fill(data) at the end of the fill callback chain that
 * fill_active_slots() walks.
 */
void add_fill_function(void *data, int (*fill)(void *))
{
	struct fill_chain *entry = xmalloc(sizeof(*entry));

	entry->data = data;
	entry->fill = fill;
	entry->next = NULL;

	if (!fill_cfg) {
		fill_cfg = entry;
	} else {
		struct fill_chain *last = fill_cfg;

		while (last->next)
			last = last->next;
		last->next = entry;
	}
}
555
556 void fill_active_slots(void)
557 {
558         struct active_request_slot *slot = active_queue_head;
559
560         while (active_requests < max_requests) {
561                 struct fill_chain *fill;
562                 for (fill = fill_cfg; fill; fill = fill->next)
563                         if (fill->fill(fill->data))
564                                 break;
565
566                 if (!fill)
567                         break;
568         }
569
570         while (slot != NULL) {
571                 if (!slot->in_use && slot->curl != NULL
572                         && curl_session_count > min_curl_sessions) {
573                         curl_easy_cleanup(slot->curl);
574                         slot->curl = NULL;
575                         curl_session_count--;
576                 }
577                 slot = slot->next;
578         }
579 }
580
581 void step_active_slots(void)
582 {
583         int num_transfers;
584         CURLMcode curlm_result;
585
586         do {
587                 curlm_result = curl_multi_perform(curlm, &num_transfers);
588         } while (curlm_result == CURLM_CALL_MULTI_PERFORM);
589         if (num_transfers < active_requests) {
590                 process_curl_messages();
591                 fill_active_slots();
592         }
593 }
594 #endif
595
596 void run_active_slot(struct active_request_slot *slot)
597 {
598 #ifdef USE_CURL_MULTI
599         fd_set readfds;
600         fd_set writefds;
601         fd_set excfds;
602         int max_fd;
603         struct timeval select_timeout;
604         int finished = 0;
605
606         slot->finished = &finished;
607         while (!finished) {
608                 step_active_slots();
609
610                 if (slot->in_use) {
611 #if LIBCURL_VERSION_NUM >= 0x070f04
612                         long curl_timeout;
613                         curl_multi_timeout(curlm, &curl_timeout);
614                         if (curl_timeout == 0) {
615                                 continue;
616                         } else if (curl_timeout == -1) {
617                                 select_timeout.tv_sec  = 0;
618                                 select_timeout.tv_usec = 50000;
619                         } else {
620                                 select_timeout.tv_sec  =  curl_timeout / 1000;
621                                 select_timeout.tv_usec = (curl_timeout % 1000) * 1000;
622                         }
623 #else
624                         select_timeout.tv_sec  = 0;
625                         select_timeout.tv_usec = 50000;
626 #endif
627
628                         max_fd = -1;
629                         FD_ZERO(&readfds);
630                         FD_ZERO(&writefds);
631                         FD_ZERO(&excfds);
632                         curl_multi_fdset(curlm, &readfds, &writefds, &excfds, &max_fd);
633
634                         select(max_fd+1, &readfds, &writefds, &excfds, &select_timeout);
635                 }
636         }
637 #else
638         while (slot->in_use) {
639                 slot->curl_result = curl_easy_perform(slot->curl);
640                 finish_active_slot(slot);
641         }
642 #endif
643 }
644
645 static void closedown_active_slot(struct active_request_slot *slot)
646 {
647         active_requests--;
648         slot->in_use = 0;
649 }
650
651 static void release_active_slot(struct active_request_slot *slot)
652 {
653         closedown_active_slot(slot);
654         if (slot->curl && curl_session_count > min_curl_sessions) {
655 #ifdef USE_CURL_MULTI
656                 curl_multi_remove_handle(curlm, slot->curl);
657 #endif
658                 curl_easy_cleanup(slot->curl);
659                 slot->curl = NULL;
660                 curl_session_count--;
661         }
662 #ifdef USE_CURL_MULTI
663         fill_active_slots();
664 #endif
665 }
666
667 void finish_active_slot(struct active_request_slot *slot)
668 {
669         closedown_active_slot(slot);
670         curl_easy_getinfo(slot->curl, CURLINFO_HTTP_CODE, &slot->http_code);
671
672         if (slot->finished != NULL)
673                 (*slot->finished) = 1;
674
675         /* Store slot results so they can be read after the slot is reused */
676         if (slot->results != NULL) {
677                 slot->results->curl_result = slot->curl_result;
678                 slot->results->http_code = slot->http_code;
679         }
680
681         /* Run callback if appropriate */
682         if (slot->callback_func != NULL)
683                 slot->callback_func(slot->callback_data);
684 }
685
686 void finish_all_active_slots(void)
687 {
688         struct active_request_slot *slot = active_queue_head;
689
690         while (slot != NULL)
691                 if (slot->in_use) {
692                         run_active_slot(slot);
693                         slot = active_queue_head;
694                 } else {
695                         slot = slot->next;
696                 }
697 }
698
699 /* Helpers for modifying and creating URLs */
/*
 * Return 0 for characters copied into a URL unchanged (ASCII letters,
 * digits, '/', '-' and '.') and 1 for everything else.
 */
static inline int needs_quote(int ch)
{
	if (ch >= 'A' && ch <= 'Z')
		return 0;
	if (ch >= 'a' && ch <= 'z')
		return 0;
	if (ch >= '0' && ch <= '9')
		return 0;

	switch (ch) {
	case '/':
	case '-':
	case '.':
		return 0;
	default:
		return 1;
	}
}
711
712 static char *quote_ref_url(const char *base, const char *ref)
713 {
714         struct strbuf buf = STRBUF_INIT;
715         const char *cp;
716         int ch;
717
718         end_url_with_slash(&buf, base);
719
720         for (cp = ref; (ch = *cp) != 0; cp++)
721                 if (needs_quote(ch))
722                         strbuf_addf(&buf, "%%%02x", ch);
723                 else
724                         strbuf_addch(&buf, *cp);
725
726         return strbuf_detach(&buf, NULL);
727 }
728
/*
 * Append the object location under url to buf: "objects/" plus the first
 * two characters of hex and a slash, followed by the rest of hex unless
 * only_two_digit_prefix is set.
 */
void append_remote_object_url(struct strbuf *buf, const char *url,
			      const char *hex,
			      int only_two_digit_prefix)
{
	end_url_with_slash(buf, url);
	strbuf_addf(buf, "objects/%.*s/", 2, hex);

	if (only_two_digit_prefix)
		return;
	strbuf_addf(buf, "%s", hex+2);
}
739
740 char *get_remote_object_url(const char *url, const char *hex,
741                             int only_two_digit_prefix)
742 {
743         struct strbuf buf = STRBUF_INIT;
744         append_remote_object_url(&buf, url, hex, only_two_digit_prefix);
745         return strbuf_detach(&buf, NULL);
746 }
747
748 int handle_curl_result(struct active_request_slot *slot)
749 {
750         struct slot_results *results = slot->results;
751
752         if (results->curl_result == CURLE_OK) {
753                 credential_approve(&http_auth);
754                 return HTTP_OK;
755         } else if (missing_target(results))
756                 return HTTP_MISSING_TARGET;
757         else if (results->http_code == 401) {
758                 if (http_auth.username && http_auth.password) {
759                         credential_reject(&http_auth);
760                         return HTTP_NOAUTH;
761                 } else {
762                         credential_fill(&http_auth);
763                         init_curl_http_auth(slot->curl);
764                         return HTTP_REAUTH;
765                 }
766         } else {
767 #if LIBCURL_VERSION_NUM >= 0x070c00
768                 if (!curl_errorstr[0])
769                         strlcpy(curl_errorstr,
770                                 curl_easy_strerror(results->curl_result),
771                                 sizeof(curl_errorstr));
772 #endif
773                 return HTTP_ERROR;
774         }
775 }
776
777 /* http_request() targets */
778 #define HTTP_REQUEST_STRBUF     0
779 #define HTTP_REQUEST_FILE       1
780
781 static int http_request(const char *url, void *result, int target, int options)
782 {
783         struct active_request_slot *slot;
784         struct slot_results results;
785         struct curl_slist *headers = NULL;
786         struct strbuf buf = STRBUF_INIT;
787         int ret;
788
789         slot = get_active_slot();
790         slot->results = &results;
791         curl_easy_setopt(slot->curl, CURLOPT_HTTPGET, 1);
792
793         if (result == NULL) {
794                 curl_easy_setopt(slot->curl, CURLOPT_NOBODY, 1);
795         } else {
796                 curl_easy_setopt(slot->curl, CURLOPT_NOBODY, 0);
797                 curl_easy_setopt(slot->curl, CURLOPT_FILE, result);
798
799                 if (target == HTTP_REQUEST_FILE) {
800                         long posn = ftell(result);
801                         curl_easy_setopt(slot->curl, CURLOPT_WRITEFUNCTION,
802                                          fwrite);
803                         if (posn > 0) {
804                                 strbuf_addf(&buf, "Range: bytes=%ld-", posn);
805                                 headers = curl_slist_append(headers, buf.buf);
806                                 strbuf_reset(&buf);
807                         }
808                 } else
809                         curl_easy_setopt(slot->curl, CURLOPT_WRITEFUNCTION,
810                                          fwrite_buffer);
811         }
812
813         strbuf_addstr(&buf, "Pragma:");
814         if (options & HTTP_NO_CACHE)
815                 strbuf_addstr(&buf, " no-cache");
816
817         headers = curl_slist_append(headers, buf.buf);
818
819         curl_easy_setopt(slot->curl, CURLOPT_URL, url);
820         curl_easy_setopt(slot->curl, CURLOPT_HTTPHEADER, headers);
821         curl_easy_setopt(slot->curl, CURLOPT_ENCODING, "gzip");
822
823         if (start_active_slot(slot)) {
824                 run_active_slot(slot);
825                 ret = handle_curl_result(slot);
826         } else {
827                 error("Unable to start HTTP request for %s", url);
828                 ret = HTTP_START_FAILED;
829         }
830
831         curl_slist_free_all(headers);
832         strbuf_release(&buf);
833
834         return ret;
835 }
836
837 static int http_request_reauth(const char *url, void *result, int target,
838                                int options)
839 {
840         int ret = http_request(url, result, target, options);
841         if (ret != HTTP_REAUTH)
842                 return ret;
843         return http_request(url, result, target, options);
844 }
845
846 int http_get_strbuf(const char *url, struct strbuf *result, int options)
847 {
848         return http_request_reauth(url, result, HTTP_REQUEST_STRBUF, options);
849 }
850
851 /*
852  * Downloads a URL and stores the result in the given file.
853  *
854  * If a previous interrupted download is detected (i.e. a previous temporary
855  * file is still around) the download is resumed.
856  */
857 static int http_get_file(const char *url, const char *filename, int options)
858 {
859         int ret;
860         struct strbuf tmpfile = STRBUF_INIT;
861         FILE *result;
862
863         strbuf_addf(&tmpfile, "%s.temp", filename);
864         result = fopen(tmpfile.buf, "a");
865         if (! result) {
866                 error("Unable to open local file %s", tmpfile.buf);
867                 ret = HTTP_ERROR;
868                 goto cleanup;
869         }
870
871         ret = http_request_reauth(url, result, HTTP_REQUEST_FILE, options);
872         fclose(result);
873
874         if ((ret == HTTP_OK) && move_temp_to_file(tmpfile.buf, filename))
875                 ret = HTTP_ERROR;
876 cleanup:
877         strbuf_release(&tmpfile);
878         return ret;
879 }
880
881 int http_error(const char *url, int ret)
882 {
883         /* http_request has already handled HTTP_START_FAILED. */
884         if (ret != HTTP_START_FAILED)
885                 error("%s while accessing %s", curl_errorstr, url);
886
887         return ret;
888 }
889
890 int http_fetch_ref(const char *base, struct ref *ref)
891 {
892         char *url;
893         struct strbuf buffer = STRBUF_INIT;
894         int ret = -1;
895
896         url = quote_ref_url(base, ref->name);
897         if (http_get_strbuf(url, &buffer, HTTP_NO_CACHE) == HTTP_OK) {
898                 strbuf_rtrim(&buffer);
899                 if (buffer.len == 40)
900                         ret = get_sha1_hex(buffer.buf, ref->old_sha1);
901                 else if (!prefixcmp(buffer.buf, "ref: ")) {
902                         ref->symref = xstrdup(buffer.buf + 5);
903                         ret = 0;
904                 }
905         }
906
907         strbuf_release(&buffer);
908         free(url);
909         return ret;
910 }
911
912 /* Helpers for fetching packs */
913 static char *fetch_pack_index(unsigned char *sha1, const char *base_url)
914 {
915         char *url, *tmp;
916         struct strbuf buf = STRBUF_INIT;
917
918         if (http_is_verbose)
919                 fprintf(stderr, "Getting index for pack %s\n", sha1_to_hex(sha1));
920
921         end_url_with_slash(&buf, base_url);
922         strbuf_addf(&buf, "objects/pack/pack-%s.idx", sha1_to_hex(sha1));
923         url = strbuf_detach(&buf, NULL);
924
925         strbuf_addf(&buf, "%s.temp", sha1_pack_index_name(sha1));
926         tmp = strbuf_detach(&buf, NULL);
927
928         if (http_get_file(url, tmp, 0) != HTTP_OK) {
929                 error("Unable to get pack index %s", url);
930                 free(tmp);
931                 tmp = NULL;
932         }
933
934         free(url);
935         return tmp;
936 }
937
938 static int fetch_and_setup_pack_index(struct packed_git **packs_head,
939         unsigned char *sha1, const char *base_url)
940 {
941         struct packed_git *new_pack;
942         char *tmp_idx = NULL;
943         int ret;
944
945         if (has_pack_index(sha1)) {
946                 new_pack = parse_pack_index(sha1, NULL);
947                 if (!new_pack)
948                         return -1; /* parse_pack_index() already issued error message */
949                 goto add_pack;
950         }
951
952         tmp_idx = fetch_pack_index(sha1, base_url);
953         if (!tmp_idx)
954                 return -1;
955
956         new_pack = parse_pack_index(sha1, tmp_idx);
957         if (!new_pack) {
958                 unlink(tmp_idx);
959                 free(tmp_idx);
960
961                 return -1; /* parse_pack_index() already issued error message */
962         }
963
964         ret = verify_pack_index(new_pack);
965         if (!ret) {
966                 close_pack_index(new_pack);
967                 ret = move_temp_to_file(tmp_idx, sha1_pack_index_name(sha1));
968         }
969         free(tmp_idx);
970         if (ret)
971                 return -1;
972
973 add_pack:
974         new_pack->next = *packs_head;
975         *packs_head = new_pack;
976         return 0;
977 }
978
979 int http_get_info_packs(const char *base_url, struct packed_git **packs_head)
980 {
981         int ret = 0, i = 0;
982         char *url, *data;
983         struct strbuf buf = STRBUF_INIT;
984         unsigned char sha1[20];
985
986         end_url_with_slash(&buf, base_url);
987         strbuf_addstr(&buf, "objects/info/packs");
988         url = strbuf_detach(&buf, NULL);
989
990         ret = http_get_strbuf(url, &buf, HTTP_NO_CACHE);
991         if (ret != HTTP_OK)
992                 goto cleanup;
993
994         data = buf.buf;
995         while (i < buf.len) {
996                 switch (data[i]) {
997                 case 'P':
998                         i++;
999                         if (i + 52 <= buf.len &&
1000                             !prefixcmp(data + i, " pack-") &&
1001                             !prefixcmp(data + i + 46, ".pack\n")) {
1002                                 get_sha1_hex(data + i + 6, sha1);
1003                                 fetch_and_setup_pack_index(packs_head, sha1,
1004                                                       base_url);
1005                                 i += 51;
1006                                 break;
1007                         }
1008                 default:
1009                         while (i < buf.len && data[i] != '\n')
1010                                 i++;
1011                 }
1012                 i++;
1013         }
1014
1015 cleanup:
1016         free(url);
1017         return ret;
1018 }
1019
1020 void release_http_pack_request(struct http_pack_request *preq)
1021 {
1022         if (preq->packfile != NULL) {
1023                 fclose(preq->packfile);
1024                 preq->packfile = NULL;
1025         }
1026         if (preq->range_header != NULL) {
1027                 curl_slist_free_all(preq->range_header);
1028                 preq->range_header = NULL;
1029         }
1030         preq->slot = NULL;
1031         free(preq->url);
1032 }
1033
1034 int finish_http_pack_request(struct http_pack_request *preq)
1035 {
1036         struct packed_git **lst;
1037         struct packed_git *p = preq->target;
1038         char *tmp_idx;
1039         struct child_process ip;
1040         const char *ip_argv[8];
1041
1042         close_pack_index(p);
1043
1044         fclose(preq->packfile);
1045         preq->packfile = NULL;
1046
1047         lst = preq->lst;
1048         while (*lst != p)
1049                 lst = &((*lst)->next);
1050         *lst = (*lst)->next;
1051
1052         tmp_idx = xstrdup(preq->tmpfile);
1053         strcpy(tmp_idx + strlen(tmp_idx) - strlen(".pack.temp"),
1054                ".idx.temp");
1055
1056         ip_argv[0] = "index-pack";
1057         ip_argv[1] = "-o";
1058         ip_argv[2] = tmp_idx;
1059         ip_argv[3] = preq->tmpfile;
1060         ip_argv[4] = NULL;
1061
1062         memset(&ip, 0, sizeof(ip));
1063         ip.argv = ip_argv;
1064         ip.git_cmd = 1;
1065         ip.no_stdin = 1;
1066         ip.no_stdout = 1;
1067
1068         if (run_command(&ip)) {
1069                 unlink(preq->tmpfile);
1070                 unlink(tmp_idx);
1071                 free(tmp_idx);
1072                 return -1;
1073         }
1074
1075         unlink(sha1_pack_index_name(p->sha1));
1076
1077         if (move_temp_to_file(preq->tmpfile, sha1_pack_name(p->sha1))
1078          || move_temp_to_file(tmp_idx, sha1_pack_index_name(p->sha1))) {
1079                 free(tmp_idx);
1080                 return -1;
1081         }
1082
1083         install_packed_git(p);
1084         free(tmp_idx);
1085         return 0;
1086 }
1087
1088 struct http_pack_request *new_http_pack_request(
1089         struct packed_git *target, const char *base_url)
1090 {
1091         long prev_posn = 0;
1092         char range[RANGE_HEADER_SIZE];
1093         struct strbuf buf = STRBUF_INIT;
1094         struct http_pack_request *preq;
1095
1096         preq = xcalloc(1, sizeof(*preq));
1097         preq->target = target;
1098
1099         end_url_with_slash(&buf, base_url);
1100         strbuf_addf(&buf, "objects/pack/pack-%s.pack",
1101                 sha1_to_hex(target->sha1));
1102         preq->url = strbuf_detach(&buf, NULL);
1103
1104         snprintf(preq->tmpfile, sizeof(preq->tmpfile), "%s.temp",
1105                 sha1_pack_name(target->sha1));
1106         preq->packfile = fopen(preq->tmpfile, "a");
1107         if (!preq->packfile) {
1108                 error("Unable to open local file %s for pack",
1109                       preq->tmpfile);
1110                 goto abort;
1111         }
1112
1113         preq->slot = get_active_slot();
1114         curl_easy_setopt(preq->slot->curl, CURLOPT_FILE, preq->packfile);
1115         curl_easy_setopt(preq->slot->curl, CURLOPT_WRITEFUNCTION, fwrite);
1116         curl_easy_setopt(preq->slot->curl, CURLOPT_URL, preq->url);
1117         curl_easy_setopt(preq->slot->curl, CURLOPT_HTTPHEADER,
1118                 no_pragma_header);
1119
1120         /*
1121          * If there is data present from a previous transfer attempt,
1122          * resume where it left off
1123          */
1124         prev_posn = ftell(preq->packfile);
1125         if (prev_posn>0) {
1126                 if (http_is_verbose)
1127                         fprintf(stderr,
1128                                 "Resuming fetch of pack %s at byte %ld\n",
1129                                 sha1_to_hex(target->sha1), prev_posn);
1130                 sprintf(range, "Range: bytes=%ld-", prev_posn);
1131                 preq->range_header = curl_slist_append(NULL, range);
1132                 curl_easy_setopt(preq->slot->curl, CURLOPT_HTTPHEADER,
1133                         preq->range_header);
1134         }
1135
1136         return preq;
1137
1138 abort:
1139         free(preq->url);
1140         free(preq);
1141         return NULL;
1142 }
1143
1144 /* Helpers for fetching objects (loose) */
1145 static size_t fwrite_sha1_file(char *ptr, size_t eltsize, size_t nmemb,
1146                                void *data)
1147 {
1148         unsigned char expn[4096];
1149         size_t size = eltsize * nmemb;
1150         int posn = 0;
1151         struct http_object_request *freq =
1152                 (struct http_object_request *)data;
1153         do {
1154                 ssize_t retval = xwrite(freq->localfile,
1155                                         (char *) ptr + posn, size - posn);
1156                 if (retval < 0)
1157                         return posn;
1158                 posn += retval;
1159         } while (posn < size);
1160
1161         freq->stream.avail_in = size;
1162         freq->stream.next_in = (void *)ptr;
1163         do {
1164                 freq->stream.next_out = expn;
1165                 freq->stream.avail_out = sizeof(expn);
1166                 freq->zret = git_inflate(&freq->stream, Z_SYNC_FLUSH);
1167                 git_SHA1_Update(&freq->c, expn,
1168                                 sizeof(expn) - freq->stream.avail_out);
1169         } while (freq->stream.avail_in && freq->zret == Z_OK);
1170         return size;
1171 }
1172
1173 struct http_object_request *new_http_object_request(const char *base_url,
1174         unsigned char *sha1)
1175 {
1176         char *hex = sha1_to_hex(sha1);
1177         char *filename;
1178         char prevfile[PATH_MAX];
1179         int prevlocal;
1180         char prev_buf[PREV_BUF_SIZE];
1181         ssize_t prev_read = 0;
1182         long prev_posn = 0;
1183         char range[RANGE_HEADER_SIZE];
1184         struct curl_slist *range_header = NULL;
1185         struct http_object_request *freq;
1186
1187         freq = xcalloc(1, sizeof(*freq));
1188         hashcpy(freq->sha1, sha1);
1189         freq->localfile = -1;
1190
1191         filename = sha1_file_name(sha1);
1192         snprintf(freq->tmpfile, sizeof(freq->tmpfile),
1193                  "%s.temp", filename);
1194
1195         snprintf(prevfile, sizeof(prevfile), "%s.prev", filename);
1196         unlink_or_warn(prevfile);
1197         rename(freq->tmpfile, prevfile);
1198         unlink_or_warn(freq->tmpfile);
1199
1200         if (freq->localfile != -1)
1201                 error("fd leakage in start: %d", freq->localfile);
1202         freq->localfile = open(freq->tmpfile,
1203                                O_WRONLY | O_CREAT | O_EXCL, 0666);
1204         /*
1205          * This could have failed due to the "lazy directory creation";
1206          * try to mkdir the last path component.
1207          */
1208         if (freq->localfile < 0 && errno == ENOENT) {
1209                 char *dir = strrchr(freq->tmpfile, '/');
1210                 if (dir) {
1211                         *dir = 0;
1212                         mkdir(freq->tmpfile, 0777);
1213                         *dir = '/';
1214                 }
1215                 freq->localfile = open(freq->tmpfile,
1216                                        O_WRONLY | O_CREAT | O_EXCL, 0666);
1217         }
1218
1219         if (freq->localfile < 0) {
1220                 error("Couldn't create temporary file %s: %s",
1221                       freq->tmpfile, strerror(errno));
1222                 goto abort;
1223         }
1224
1225         git_inflate_init(&freq->stream);
1226
1227         git_SHA1_Init(&freq->c);
1228
1229         freq->url = get_remote_object_url(base_url, hex, 0);
1230
1231         /*
1232          * If a previous temp file is present, process what was already
1233          * fetched.
1234          */
1235         prevlocal = open(prevfile, O_RDONLY);
1236         if (prevlocal != -1) {
1237                 do {
1238                         prev_read = xread(prevlocal, prev_buf, PREV_BUF_SIZE);
1239                         if (prev_read>0) {
1240                                 if (fwrite_sha1_file(prev_buf,
1241                                                      1,
1242                                                      prev_read,
1243                                                      freq) == prev_read) {
1244                                         prev_posn += prev_read;
1245                                 } else {
1246                                         prev_read = -1;
1247                                 }
1248                         }
1249                 } while (prev_read > 0);
1250                 close(prevlocal);
1251         }
1252         unlink_or_warn(prevfile);
1253
1254         /*
1255          * Reset inflate/SHA1 if there was an error reading the previous temp
1256          * file; also rewind to the beginning of the local file.
1257          */
1258         if (prev_read == -1) {
1259                 memset(&freq->stream, 0, sizeof(freq->stream));
1260                 git_inflate_init(&freq->stream);
1261                 git_SHA1_Init(&freq->c);
1262                 if (prev_posn>0) {
1263                         prev_posn = 0;
1264                         lseek(freq->localfile, 0, SEEK_SET);
1265                         if (ftruncate(freq->localfile, 0) < 0) {
1266                                 error("Couldn't truncate temporary file %s: %s",
1267                                           freq->tmpfile, strerror(errno));
1268                                 goto abort;
1269                         }
1270                 }
1271         }
1272
1273         freq->slot = get_active_slot();
1274
1275         curl_easy_setopt(freq->slot->curl, CURLOPT_FILE, freq);
1276         curl_easy_setopt(freq->slot->curl, CURLOPT_WRITEFUNCTION, fwrite_sha1_file);
1277         curl_easy_setopt(freq->slot->curl, CURLOPT_ERRORBUFFER, freq->errorstr);
1278         curl_easy_setopt(freq->slot->curl, CURLOPT_URL, freq->url);
1279         curl_easy_setopt(freq->slot->curl, CURLOPT_HTTPHEADER, no_pragma_header);
1280
1281         /*
1282          * If we have successfully processed data from a previous fetch
1283          * attempt, only fetch the data we don't already have.
1284          */
1285         if (prev_posn>0) {
1286                 if (http_is_verbose)
1287                         fprintf(stderr,
1288                                 "Resuming fetch of object %s at byte %ld\n",
1289                                 hex, prev_posn);
1290                 sprintf(range, "Range: bytes=%ld-", prev_posn);
1291                 range_header = curl_slist_append(range_header, range);
1292                 curl_easy_setopt(freq->slot->curl,
1293                                  CURLOPT_HTTPHEADER, range_header);
1294         }
1295
1296         return freq;
1297
1298 abort:
1299         free(freq->url);
1300         free(freq);
1301         return NULL;
1302 }
1303
1304 void process_http_object_request(struct http_object_request *freq)
1305 {
1306         if (freq->slot == NULL)
1307                 return;
1308         freq->curl_result = freq->slot->curl_result;
1309         freq->http_code = freq->slot->http_code;
1310         freq->slot = NULL;
1311 }
1312
1313 int finish_http_object_request(struct http_object_request *freq)
1314 {
1315         struct stat st;
1316
1317         close(freq->localfile);
1318         freq->localfile = -1;
1319
1320         process_http_object_request(freq);
1321
1322         if (freq->http_code == 416) {
1323                 warning("requested range invalid; we may already have all the data.");
1324         } else if (freq->curl_result != CURLE_OK) {
1325                 if (stat(freq->tmpfile, &st) == 0)
1326                         if (st.st_size == 0)
1327                                 unlink_or_warn(freq->tmpfile);
1328                 return -1;
1329         }
1330
1331         git_inflate_end(&freq->stream);
1332         git_SHA1_Final(freq->real_sha1, &freq->c);
1333         if (freq->zret != Z_STREAM_END) {
1334                 unlink_or_warn(freq->tmpfile);
1335                 return -1;
1336         }
1337         if (hashcmp(freq->sha1, freq->real_sha1)) {
1338                 unlink_or_warn(freq->tmpfile);
1339                 return -1;
1340         }
1341         freq->rename =
1342                 move_temp_to_file(freq->tmpfile, sha1_file_name(freq->sha1));
1343
1344         return freq->rename;
1345 }
1346
1347 void abort_http_object_request(struct http_object_request *freq)
1348 {
1349         unlink_or_warn(freq->tmpfile);
1350
1351         release_http_object_request(freq);
1352 }
1353
1354 void release_http_object_request(struct http_object_request *freq)
1355 {
1356         if (freq->localfile != -1) {
1357                 close(freq->localfile);
1358                 freq->localfile = -1;
1359         }
1360         if (freq->url != NULL) {
1361                 free(freq->url);
1362                 freq->url = NULL;
1363         }
1364         if (freq->slot != NULL) {
1365                 freq->slot->callback_func = NULL;
1366                 freq->slot->callback_data = NULL;
1367                 release_active_slot(freq->slot);
1368                 freq->slot = NULL;
1369         }
1370 }