/*
 * gitweb: Fix handling of whitespace in generated links
 * [git/jnareb-git/bp-gitweb.git] / http.c
 * blob 17bcf19c5001d309bdbf524e7d3817cf3482a3c3
 */
1 #include "http.h"
2 #include "pack.h"
3 #include "sideband.h"
4 #include "run-command.h"
6 int data_received;
7 int active_requests;
8 int http_is_verbose;
9 size_t http_post_buffer = 16 * LARGE_PACKET_MAX;
11 #if LIBCURL_VERSION_NUM >= 0x070a06
12 #define LIBCURL_CAN_HANDLE_AUTH_ANY
13 #endif
15 static int min_curl_sessions = 1;
16 static int curl_session_count;
17 #ifdef USE_CURL_MULTI
18 static int max_requests = -1;
19 static CURLM *curlm;
20 #endif
21 #ifndef NO_CURL_EASY_DUPHANDLE
22 static CURL *curl_default;
23 #endif
25 #define PREV_BUF_SIZE 4096
26 #define RANGE_HEADER_SIZE 30
28 char curl_errorstr[CURL_ERROR_SIZE];
30 static int curl_ssl_verify = -1;
31 static const char *ssl_cert;
32 #if LIBCURL_VERSION_NUM >= 0x070903
33 static const char *ssl_key;
34 #endif
35 #if LIBCURL_VERSION_NUM >= 0x070908
36 static const char *ssl_capath;
37 #endif
38 static const char *ssl_cainfo;
39 static long curl_low_speed_limit = -1;
40 static long curl_low_speed_time = -1;
41 static int curl_ftp_no_epsv;
42 static const char *curl_http_proxy;
43 static char *user_name, *user_pass;
44 static const char *user_agent;
46 #if LIBCURL_VERSION_NUM >= 0x071700
47 /* Use CURLOPT_KEYPASSWD as is */
48 #elif LIBCURL_VERSION_NUM >= 0x070903
49 #define CURLOPT_KEYPASSWD CURLOPT_SSLKEYPASSWD
50 #else
51 #define CURLOPT_KEYPASSWD CURLOPT_SSLCERTPASSWD
52 #endif
54 static char *ssl_cert_password;
55 static int ssl_cert_password_required;
57 static struct curl_slist *pragma_header;
58 static struct curl_slist *no_pragma_header;
60 static struct active_request_slot *active_queue_head;
62 size_t fread_buffer(void *ptr, size_t eltsize, size_t nmemb, void *buffer_)
64 size_t size = eltsize * nmemb;
65 struct buffer *buffer = buffer_;
67 if (size > buffer->buf.len - buffer->posn)
68 size = buffer->buf.len - buffer->posn;
69 memcpy(ptr, buffer->buf.buf + buffer->posn, size);
70 buffer->posn += size;
72 return size;
75 #ifndef NO_CURL_IOCTL
76 curlioerr ioctl_buffer(CURL *handle, int cmd, void *clientp)
78 struct buffer *buffer = clientp;
80 switch (cmd) {
81 case CURLIOCMD_NOP:
82 return CURLIOE_OK;
84 case CURLIOCMD_RESTARTREAD:
85 buffer->posn = 0;
86 return CURLIOE_OK;
88 default:
89 return CURLIOE_UNKNOWNCMD;
92 #endif
94 size_t fwrite_buffer(const void *ptr, size_t eltsize, size_t nmemb, void *buffer_)
96 size_t size = eltsize * nmemb;
97 struct strbuf *buffer = buffer_;
99 strbuf_add(buffer, ptr, size);
100 data_received++;
101 return size;
104 size_t fwrite_null(const void *ptr, size_t eltsize, size_t nmemb, void *strbuf)
106 data_received++;
107 return eltsize * nmemb;
#ifdef USE_CURL_MULTI
/*
 * Drain the multi handle's message queue.  For every DONE message the
 * matching slot is looked up by its easy handle, detached from the
 * multi handle, given the transfer result and finished.  Unexpected
 * messages are reported on stderr.
 */
static void process_curl_messages(void)
{
	int num_messages;
	struct active_request_slot *slot;
	CURLMsg *curl_message = curl_multi_info_read(curlm, &num_messages);

	while (curl_message != NULL) {
		if (curl_message->msg == CURLMSG_DONE) {
			int curl_result = curl_message->data.result;
			slot = active_queue_head;
			while (slot != NULL &&
			       slot->curl != curl_message->easy_handle)
				slot = slot->next;
			if (slot != NULL) {
				curl_multi_remove_handle(curlm, slot->curl);
				slot->curl_result = curl_result;
				finish_active_slot(slot);
			} else {
				fprintf(stderr, "Received DONE message for unknown request!\n");
			}
		} else {
			fprintf(stderr, "Unknown CURL message received: %d\n",
				(int)curl_message->msg);
		}
		curl_message = curl_multi_info_read(curlm, &num_messages);
	}
}
#endif
140 static int http_options(const char *var, const char *value, void *cb)
142 if (!strcmp("http.sslverify", var)) {
143 curl_ssl_verify = git_config_bool(var, value);
144 return 0;
146 if (!strcmp("http.sslcert", var))
147 return git_config_string(&ssl_cert, var, value);
148 #if LIBCURL_VERSION_NUM >= 0x070903
149 if (!strcmp("http.sslkey", var))
150 return git_config_string(&ssl_key, var, value);
151 #endif
152 #if LIBCURL_VERSION_NUM >= 0x070908
153 if (!strcmp("http.sslcapath", var))
154 return git_config_string(&ssl_capath, var, value);
155 #endif
156 if (!strcmp("http.sslcainfo", var))
157 return git_config_string(&ssl_cainfo, var, value);
158 if (!strcmp("http.sslcertpasswordprotected", var)) {
159 if (git_config_bool(var, value))
160 ssl_cert_password_required = 1;
161 return 0;
163 if (!strcmp("http.minsessions", var)) {
164 min_curl_sessions = git_config_int(var, value);
165 #ifndef USE_CURL_MULTI
166 if (min_curl_sessions > 1)
167 min_curl_sessions = 1;
168 #endif
169 return 0;
171 #ifdef USE_CURL_MULTI
172 if (!strcmp("http.maxrequests", var)) {
173 max_requests = git_config_int(var, value);
174 return 0;
176 #endif
177 if (!strcmp("http.lowspeedlimit", var)) {
178 curl_low_speed_limit = (long)git_config_int(var, value);
179 return 0;
181 if (!strcmp("http.lowspeedtime", var)) {
182 curl_low_speed_time = (long)git_config_int(var, value);
183 return 0;
186 if (!strcmp("http.noepsv", var)) {
187 curl_ftp_no_epsv = git_config_bool(var, value);
188 return 0;
190 if (!strcmp("http.proxy", var))
191 return git_config_string(&curl_http_proxy, var, value);
193 if (!strcmp("http.postbuffer", var)) {
194 http_post_buffer = git_config_int(var, value);
195 if (http_post_buffer < LARGE_PACKET_MAX)
196 http_post_buffer = LARGE_PACKET_MAX;
197 return 0;
200 if (!strcmp("http.useragent", var))
201 return git_config_string(&user_agent, var, value);
203 /* Fall back on the default ones */
204 return git_default_config(var, value, cb);
207 static void init_curl_http_auth(CURL *result)
209 if (user_name) {
210 struct strbuf up = STRBUF_INIT;
211 if (!user_pass)
212 user_pass = xstrdup(git_getpass("Password: "));
213 strbuf_addf(&up, "%s:%s", user_name, user_pass);
214 curl_easy_setopt(result, CURLOPT_USERPWD,
215 strbuf_detach(&up, NULL));
219 static int has_cert_password(void)
221 if (ssl_cert_password != NULL)
222 return 1;
223 if (ssl_cert == NULL || ssl_cert_password_required != 1)
224 return 0;
225 /* Only prompt the user once. */
226 ssl_cert_password_required = -1;
227 ssl_cert_password = git_getpass("Certificate Password: ");
228 if (ssl_cert_password != NULL) {
229 ssl_cert_password = xstrdup(ssl_cert_password);
230 return 1;
231 } else
232 return 0;
235 static CURL *get_curl_handle(void)
237 CURL *result = curl_easy_init();
239 if (!curl_ssl_verify) {
240 curl_easy_setopt(result, CURLOPT_SSL_VERIFYPEER, 0);
241 curl_easy_setopt(result, CURLOPT_SSL_VERIFYHOST, 0);
242 } else {
243 /* Verify authenticity of the peer's certificate */
244 curl_easy_setopt(result, CURLOPT_SSL_VERIFYPEER, 1);
245 /* The name in the cert must match whom we tried to connect */
246 curl_easy_setopt(result, CURLOPT_SSL_VERIFYHOST, 2);
249 #if LIBCURL_VERSION_NUM >= 0x070907
250 curl_easy_setopt(result, CURLOPT_NETRC, CURL_NETRC_OPTIONAL);
251 #endif
252 #ifdef LIBCURL_CAN_HANDLE_AUTH_ANY
253 curl_easy_setopt(result, CURLOPT_HTTPAUTH, CURLAUTH_ANY);
254 #endif
256 init_curl_http_auth(result);
258 if (ssl_cert != NULL)
259 curl_easy_setopt(result, CURLOPT_SSLCERT, ssl_cert);
260 if (has_cert_password())
261 curl_easy_setopt(result, CURLOPT_KEYPASSWD, ssl_cert_password);
262 #if LIBCURL_VERSION_NUM >= 0x070903
263 if (ssl_key != NULL)
264 curl_easy_setopt(result, CURLOPT_SSLKEY, ssl_key);
265 #endif
266 #if LIBCURL_VERSION_NUM >= 0x070908
267 if (ssl_capath != NULL)
268 curl_easy_setopt(result, CURLOPT_CAPATH, ssl_capath);
269 #endif
270 if (ssl_cainfo != NULL)
271 curl_easy_setopt(result, CURLOPT_CAINFO, ssl_cainfo);
272 curl_easy_setopt(result, CURLOPT_FAILONERROR, 1);
274 if (curl_low_speed_limit > 0 && curl_low_speed_time > 0) {
275 curl_easy_setopt(result, CURLOPT_LOW_SPEED_LIMIT,
276 curl_low_speed_limit);
277 curl_easy_setopt(result, CURLOPT_LOW_SPEED_TIME,
278 curl_low_speed_time);
281 curl_easy_setopt(result, CURLOPT_FOLLOWLOCATION, 1);
282 #if LIBCURL_VERSION_NUM >= 0x071301
283 curl_easy_setopt(result, CURLOPT_POSTREDIR, CURL_REDIR_POST_ALL);
284 #elif LIBCURL_VERSION_NUM >= 0x071101
285 curl_easy_setopt(result, CURLOPT_POST301, 1);
286 #endif
288 if (getenv("GIT_CURL_VERBOSE"))
289 curl_easy_setopt(result, CURLOPT_VERBOSE, 1);
291 curl_easy_setopt(result, CURLOPT_USERAGENT,
292 user_agent ? user_agent : GIT_HTTP_USER_AGENT);
294 if (curl_ftp_no_epsv)
295 curl_easy_setopt(result, CURLOPT_FTP_USE_EPSV, 0);
297 if (curl_http_proxy)
298 curl_easy_setopt(result, CURLOPT_PROXY, curl_http_proxy);
300 return result;
303 static void http_auth_init(const char *url)
305 char *at, *colon, *cp, *slash;
306 int len;
308 cp = strstr(url, "://");
309 if (!cp)
310 return;
313 * Ok, the URL looks like "proto://something". Which one?
314 * "proto://<user>:<pass>@<host>/...",
315 * "proto://<user>@<host>/...", or just
316 * "proto://<host>/..."?
318 cp += 3;
319 at = strchr(cp, '@');
320 colon = strchr(cp, ':');
321 slash = strchrnul(cp, '/');
322 if (!at || slash <= at)
323 return; /* No credentials */
324 if (!colon || at <= colon) {
325 /* Only username */
326 len = at - cp;
327 user_name = xmalloc(len + 1);
328 memcpy(user_name, cp, len);
329 user_name[len] = '\0';
330 user_pass = NULL;
331 } else {
332 len = colon - cp;
333 user_name = xmalloc(len + 1);
334 memcpy(user_name, cp, len);
335 user_name[len] = '\0';
336 len = at - (colon + 1);
337 user_pass = xmalloc(len + 1);
338 memcpy(user_pass, colon + 1, len);
339 user_pass[len] = '\0';
/*
 * Overwrite *var with the value of environment variable envname when
 * that variable is set; otherwise leave *var alone.  The stored
 * pointer is the one returned by getenv(), not a copy.
 */
static void set_from_env(const char **var, const char *envname)
{
	const char *val = getenv(envname);
	if (val)
		*var = val;
}
350 void http_init(struct remote *remote)
352 char *low_speed_limit;
353 char *low_speed_time;
355 http_is_verbose = 0;
357 git_config(http_options, NULL);
359 curl_global_init(CURL_GLOBAL_ALL);
361 if (remote && remote->http_proxy)
362 curl_http_proxy = xstrdup(remote->http_proxy);
364 pragma_header = curl_slist_append(pragma_header, "Pragma: no-cache");
365 no_pragma_header = curl_slist_append(no_pragma_header, "Pragma:");
367 #ifdef USE_CURL_MULTI
369 char *http_max_requests = getenv("GIT_HTTP_MAX_REQUESTS");
370 if (http_max_requests != NULL)
371 max_requests = atoi(http_max_requests);
374 curlm = curl_multi_init();
375 if (curlm == NULL) {
376 fprintf(stderr, "Error creating curl multi handle.\n");
377 exit(1);
379 #endif
381 if (getenv("GIT_SSL_NO_VERIFY"))
382 curl_ssl_verify = 0;
384 set_from_env(&ssl_cert, "GIT_SSL_CERT");
385 #if LIBCURL_VERSION_NUM >= 0x070903
386 set_from_env(&ssl_key, "GIT_SSL_KEY");
387 #endif
388 #if LIBCURL_VERSION_NUM >= 0x070908
389 set_from_env(&ssl_capath, "GIT_SSL_CAPATH");
390 #endif
391 set_from_env(&ssl_cainfo, "GIT_SSL_CAINFO");
393 set_from_env(&user_agent, "GIT_HTTP_USER_AGENT");
395 low_speed_limit = getenv("GIT_HTTP_LOW_SPEED_LIMIT");
396 if (low_speed_limit != NULL)
397 curl_low_speed_limit = strtol(low_speed_limit, NULL, 10);
398 low_speed_time = getenv("GIT_HTTP_LOW_SPEED_TIME");
399 if (low_speed_time != NULL)
400 curl_low_speed_time = strtol(low_speed_time, NULL, 10);
402 if (curl_ssl_verify == -1)
403 curl_ssl_verify = 1;
405 curl_session_count = 0;
406 #ifdef USE_CURL_MULTI
407 if (max_requests < 1)
408 max_requests = DEFAULT_MAX_REQUESTS;
409 #endif
411 if (getenv("GIT_CURL_FTP_NO_EPSV"))
412 curl_ftp_no_epsv = 1;
414 if (remote && remote->url && remote->url[0]) {
415 http_auth_init(remote->url[0]);
416 if (!ssl_cert_password_required &&
417 getenv("GIT_SSL_CERT_PASSWORD_PROTECTED") &&
418 !prefixcmp(remote->url[0], "https://"))
419 ssl_cert_password_required = 1;
422 #ifndef NO_CURL_EASY_DUPHANDLE
423 curl_default = get_curl_handle();
424 #endif
427 void http_cleanup(void)
429 struct active_request_slot *slot = active_queue_head;
431 while (slot != NULL) {
432 struct active_request_slot *next = slot->next;
433 if (slot->curl != NULL) {
434 #ifdef USE_CURL_MULTI
435 curl_multi_remove_handle(curlm, slot->curl);
436 #endif
437 curl_easy_cleanup(slot->curl);
439 free(slot);
440 slot = next;
442 active_queue_head = NULL;
444 #ifndef NO_CURL_EASY_DUPHANDLE
445 curl_easy_cleanup(curl_default);
446 #endif
448 #ifdef USE_CURL_MULTI
449 curl_multi_cleanup(curlm);
450 #endif
451 curl_global_cleanup();
453 curl_slist_free_all(pragma_header);
454 pragma_header = NULL;
456 curl_slist_free_all(no_pragma_header);
457 no_pragma_header = NULL;
459 if (curl_http_proxy) {
460 free((void *)curl_http_proxy);
461 curl_http_proxy = NULL;
464 if (ssl_cert_password != NULL) {
465 memset(ssl_cert_password, 0, strlen(ssl_cert_password));
466 free(ssl_cert_password);
467 ssl_cert_password = NULL;
469 ssl_cert_password_required = 0;
472 struct active_request_slot *get_active_slot(void)
474 struct active_request_slot *slot = active_queue_head;
475 struct active_request_slot *newslot;
477 #ifdef USE_CURL_MULTI
478 int num_transfers;
480 /* Wait for a slot to open up if the queue is full */
481 while (active_requests >= max_requests) {
482 curl_multi_perform(curlm, &num_transfers);
483 if (num_transfers < active_requests)
484 process_curl_messages();
486 #endif
488 while (slot != NULL && slot->in_use)
489 slot = slot->next;
491 if (slot == NULL) {
492 newslot = xmalloc(sizeof(*newslot));
493 newslot->curl = NULL;
494 newslot->in_use = 0;
495 newslot->next = NULL;
497 slot = active_queue_head;
498 if (slot == NULL) {
499 active_queue_head = newslot;
500 } else {
501 while (slot->next != NULL)
502 slot = slot->next;
503 slot->next = newslot;
505 slot = newslot;
508 if (slot->curl == NULL) {
509 #ifdef NO_CURL_EASY_DUPHANDLE
510 slot->curl = get_curl_handle();
511 #else
512 slot->curl = curl_easy_duphandle(curl_default);
513 #endif
514 curl_session_count++;
517 active_requests++;
518 slot->in_use = 1;
519 slot->local = NULL;
520 slot->results = NULL;
521 slot->finished = NULL;
522 slot->callback_data = NULL;
523 slot->callback_func = NULL;
524 curl_easy_setopt(slot->curl, CURLOPT_HTTPHEADER, pragma_header);
525 curl_easy_setopt(slot->curl, CURLOPT_ERRORBUFFER, curl_errorstr);
526 curl_easy_setopt(slot->curl, CURLOPT_CUSTOMREQUEST, NULL);
527 curl_easy_setopt(slot->curl, CURLOPT_READFUNCTION, NULL);
528 curl_easy_setopt(slot->curl, CURLOPT_WRITEFUNCTION, NULL);
529 curl_easy_setopt(slot->curl, CURLOPT_UPLOAD, 0);
530 curl_easy_setopt(slot->curl, CURLOPT_HTTPGET, 1);
532 return slot;
/*
 * Hand the slot's transfer to the multi handle and kick it off.
 * Returns 1 on success.  If the handle cannot be added, the slot is
 * released again and 0 is returned.  Without the multi interface this
 * is a no-op that returns 1; the transfer runs in run_active_slot().
 */
int start_active_slot(struct active_request_slot *slot)
{
#ifdef USE_CURL_MULTI
	CURLMcode curlm_result = curl_multi_add_handle(curlm, slot->curl);
	int num_transfers;

	if (curlm_result != CURLM_OK &&
	    curlm_result != CURLM_CALL_MULTI_PERFORM) {
		active_requests--;
		slot->in_use = 0;
		return 0;
	}

	/*
	 * We know there must be something to do, since we just added
	 * something.
	 */
	curl_multi_perform(curlm, &num_transfers);
#endif
	return 1;
}
#ifdef USE_CURL_MULTI
/* One registered "fill" callback together with its opaque argument. */
struct fill_chain {
	void *data;
	int (*fill)(void *);
	struct fill_chain *next;
};

/* Registered fill callbacks, in registration order. */
static struct fill_chain *fill_cfg;

/*
 * Register a callback that fill_active_slots() may call to start more
 * requests.  Callbacks are appended, so they are tried in the order
 * they were added.
 */
void add_fill_function(void *data, int (*fill)(void *))
{
	struct fill_chain *new = xmalloc(sizeof(*new));
	struct fill_chain **linkp = &fill_cfg;
	new->data = data;
	new->fill = fill;
	new->next = NULL;
	while (*linkp)
		linkp = &(*linkp)->next;
	*linkp = new;
}

/*
 * While there is room for more requests, call the registered fill
 * callbacks until one of them returns non-zero; stop as soon as none
 * of them does.  Afterwards, destroy the curl handles of idle slots
 * while more than min_curl_sessions sessions exist.
 */
void fill_active_slots(void)
{
	struct active_request_slot *slot = active_queue_head;

	while (active_requests < max_requests) {
		struct fill_chain *fill;
		for (fill = fill_cfg; fill; fill = fill->next)
			if (fill->fill(fill->data))
				break;

		/* Every callback returned 0: nothing more to start. */
		if (!fill)
			break;
	}

	while (slot != NULL) {
		if (!slot->in_use && slot->curl != NULL
			&& curl_session_count > min_curl_sessions) {
			curl_easy_cleanup(slot->curl);
			slot->curl = NULL;
			curl_session_count--;
		}
		slot = slot->next;
	}
}

/*
 * Drive all transfers one step.  When curl reports fewer running
 * transfers than we have active requests, at least one has completed:
 * process the completion messages and try to start new requests.
 */
void step_active_slots(void)
{
	int num_transfers;
	CURLMcode curlm_result;

	do {
		curlm_result = curl_multi_perform(curlm, &num_transfers);
	} while (curlm_result == CURLM_CALL_MULTI_PERFORM);
	if (num_transfers < active_requests) {
		process_curl_messages();
		fill_active_slots();
	}
}
#endif
618 void run_active_slot(struct active_request_slot *slot)
620 #ifdef USE_CURL_MULTI
621 long last_pos = 0;
622 long current_pos;
623 fd_set readfds;
624 fd_set writefds;
625 fd_set excfds;
626 int max_fd;
627 struct timeval select_timeout;
628 int finished = 0;
630 slot->finished = &finished;
631 while (!finished) {
632 data_received = 0;
633 step_active_slots();
635 if (!data_received && slot->local != NULL) {
636 current_pos = ftell(slot->local);
637 if (current_pos > last_pos)
638 data_received++;
639 last_pos = current_pos;
642 if (slot->in_use && !data_received) {
643 max_fd = 0;
644 FD_ZERO(&readfds);
645 FD_ZERO(&writefds);
646 FD_ZERO(&excfds);
647 select_timeout.tv_sec = 0;
648 select_timeout.tv_usec = 50000;
649 select(max_fd, &readfds, &writefds,
650 &excfds, &select_timeout);
653 #else
654 while (slot->in_use) {
655 slot->curl_result = curl_easy_perform(slot->curl);
656 finish_active_slot(slot);
658 #endif
661 static void closedown_active_slot(struct active_request_slot *slot)
663 active_requests--;
664 slot->in_use = 0;
667 static void release_active_slot(struct active_request_slot *slot)
669 closedown_active_slot(slot);
670 if (slot->curl && curl_session_count > min_curl_sessions) {
671 #ifdef USE_CURL_MULTI
672 curl_multi_remove_handle(curlm, slot->curl);
673 #endif
674 curl_easy_cleanup(slot->curl);
675 slot->curl = NULL;
676 curl_session_count--;
678 #ifdef USE_CURL_MULTI
679 fill_active_slots();
680 #endif
683 void finish_active_slot(struct active_request_slot *slot)
685 closedown_active_slot(slot);
686 curl_easy_getinfo(slot->curl, CURLINFO_HTTP_CODE, &slot->http_code);
688 if (slot->finished != NULL)
689 (*slot->finished) = 1;
691 /* Store slot results so they can be read after the slot is reused */
692 if (slot->results != NULL) {
693 slot->results->curl_result = slot->curl_result;
694 slot->results->http_code = slot->http_code;
697 /* Run callback if appropriate */
698 if (slot->callback_func != NULL)
699 slot->callback_func(slot->callback_data);
702 void finish_all_active_slots(void)
704 struct active_request_slot *slot = active_queue_head;
706 while (slot != NULL)
707 if (slot->in_use) {
708 run_active_slot(slot);
709 slot = active_queue_head;
710 } else {
711 slot = slot->next;
/* Helpers for modifying and creating URLs */

/*
 * Return 0 if ch may appear unescaped in a URL path built here
 * (ASCII letters, digits, '/', '-' and '.'), and 1 if it has to be
 * percent-encoded.
 */
static inline int needs_quote(int ch)
{
	if (((ch >= 'A') && (ch <= 'Z'))
			|| ((ch >= 'a') && (ch <= 'z'))
			|| ((ch >= '0') && (ch <= '9'))
			|| (ch == '/')
			|| (ch == '-')
			|| (ch == '.'))
		return 0;
	return 1;
}
/*
 * Map a value 0..15 to its upper-case hexadecimal digit character.
 * Values outside that range are not checked.
 */
static inline int hex(int v)
{
	if (v < 10)
		return '0' + v;
	else
		return 'A' + v - 10;
}
736 void end_url_with_slash(struct strbuf *buf, const char *url)
738 strbuf_addstr(buf, url);
739 if (buf->len && buf->buf[buf->len - 1] != '/')
740 strbuf_addstr(buf, "/");
743 static char *quote_ref_url(const char *base, const char *ref)
745 struct strbuf buf = STRBUF_INIT;
746 const char *cp;
747 int ch;
749 end_url_with_slash(&buf, base);
751 for (cp = ref; (ch = *cp) != 0; cp++)
752 if (needs_quote(ch))
753 strbuf_addf(&buf, "%%%02x", ch);
754 else
755 strbuf_addch(&buf, *cp);
757 return strbuf_detach(&buf, NULL);
/*
 * Append the URL of a loose object to buf: "<url>/objects/<xx>/"
 * followed, unless only_two_digit_prefix is set, by the rest of the
 * hex object name.
 */
void append_remote_object_url(struct strbuf *buf, const char *url,
			      const char *hex,
			      int only_two_digit_prefix)
{
	end_url_with_slash(buf, url);

	strbuf_addf(buf, "objects/%.*s/", 2, hex);
	if (!only_two_digit_prefix)
		strbuf_addf(buf, "%s", hex+2);
}
771 char *get_remote_object_url(const char *url, const char *hex,
772 int only_two_digit_prefix)
774 struct strbuf buf = STRBUF_INIT;
775 append_remote_object_url(&buf, url, hex, only_two_digit_prefix);
776 return strbuf_detach(&buf, NULL);
779 /* http_request() targets */
780 #define HTTP_REQUEST_STRBUF 0
781 #define HTTP_REQUEST_FILE 1
783 static int http_request(const char *url, void *result, int target, int options)
785 struct active_request_slot *slot;
786 struct slot_results results;
787 struct curl_slist *headers = NULL;
788 struct strbuf buf = STRBUF_INIT;
789 int ret;
791 slot = get_active_slot();
792 slot->results = &results;
793 curl_easy_setopt(slot->curl, CURLOPT_HTTPGET, 1);
795 if (result == NULL) {
796 curl_easy_setopt(slot->curl, CURLOPT_NOBODY, 1);
797 } else {
798 curl_easy_setopt(slot->curl, CURLOPT_NOBODY, 0);
799 curl_easy_setopt(slot->curl, CURLOPT_FILE, result);
801 if (target == HTTP_REQUEST_FILE) {
802 long posn = ftell(result);
803 curl_easy_setopt(slot->curl, CURLOPT_WRITEFUNCTION,
804 fwrite);
805 if (posn > 0) {
806 strbuf_addf(&buf, "Range: bytes=%ld-", posn);
807 headers = curl_slist_append(headers, buf.buf);
808 strbuf_reset(&buf);
810 slot->local = result;
811 } else
812 curl_easy_setopt(slot->curl, CURLOPT_WRITEFUNCTION,
813 fwrite_buffer);
816 strbuf_addstr(&buf, "Pragma:");
817 if (options & HTTP_NO_CACHE)
818 strbuf_addstr(&buf, " no-cache");
820 headers = curl_slist_append(headers, buf.buf);
822 curl_easy_setopt(slot->curl, CURLOPT_URL, url);
823 curl_easy_setopt(slot->curl, CURLOPT_HTTPHEADER, headers);
825 if (start_active_slot(slot)) {
826 run_active_slot(slot);
827 if (results.curl_result == CURLE_OK)
828 ret = HTTP_OK;
829 else if (missing_target(&results))
830 ret = HTTP_MISSING_TARGET;
831 else if (results.http_code == 401) {
832 if (user_name) {
833 ret = HTTP_NOAUTH;
834 } else {
836 * git_getpass is needed here because its very likely stdin/stdout are
837 * pipes to our parent process. So we instead need to use /dev/tty,
838 * but that is non-portable. Using git_getpass() can at least be stubbed
839 * on other platforms with a different implementation if/when necessary.
841 user_name = xstrdup(git_getpass("Username: "));
842 init_curl_http_auth(slot->curl);
843 ret = HTTP_REAUTH;
845 } else
846 ret = HTTP_ERROR;
847 } else {
848 error("Unable to start HTTP request for %s", url);
849 ret = HTTP_START_FAILED;
852 slot->local = NULL;
853 curl_slist_free_all(headers);
854 strbuf_release(&buf);
856 return ret;
859 int http_get_strbuf(const char *url, struct strbuf *result, int options)
861 int http_ret = http_request(url, result, HTTP_REQUEST_STRBUF, options);
862 if (http_ret == HTTP_REAUTH) {
863 http_ret = http_request(url, result, HTTP_REQUEST_STRBUF, options);
865 return http_ret;
869 * Downloads an url and stores the result in the given file.
871 * If a previous interrupted download is detected (i.e. a previous temporary
872 * file is still around) the download is resumed.
874 static int http_get_file(const char *url, const char *filename, int options)
876 int ret;
877 struct strbuf tmpfile = STRBUF_INIT;
878 FILE *result;
880 strbuf_addf(&tmpfile, "%s.temp", filename);
881 result = fopen(tmpfile.buf, "a");
882 if (! result) {
883 error("Unable to open local file %s", tmpfile.buf);
884 ret = HTTP_ERROR;
885 goto cleanup;
888 ret = http_request(url, result, HTTP_REQUEST_FILE, options);
889 fclose(result);
891 if ((ret == HTTP_OK) && move_temp_to_file(tmpfile.buf, filename))
892 ret = HTTP_ERROR;
893 cleanup:
894 strbuf_release(&tmpfile);
895 return ret;
898 int http_error(const char *url, int ret)
900 /* http_request has already handled HTTP_START_FAILED. */
901 if (ret != HTTP_START_FAILED)
902 error("%s while accessing %s\n", curl_errorstr, url);
904 return ret;
907 int http_fetch_ref(const char *base, struct ref *ref)
909 char *url;
910 struct strbuf buffer = STRBUF_INIT;
911 int ret = -1;
913 url = quote_ref_url(base, ref->name);
914 if (http_get_strbuf(url, &buffer, HTTP_NO_CACHE) == HTTP_OK) {
915 strbuf_rtrim(&buffer);
916 if (buffer.len == 40)
917 ret = get_sha1_hex(buffer.buf, ref->old_sha1);
918 else if (!prefixcmp(buffer.buf, "ref: ")) {
919 ref->symref = xstrdup(buffer.buf + 5);
920 ret = 0;
924 strbuf_release(&buffer);
925 free(url);
926 return ret;
929 /* Helpers for fetching packs */
930 static char *fetch_pack_index(unsigned char *sha1, const char *base_url)
932 char *url, *tmp;
933 struct strbuf buf = STRBUF_INIT;
935 if (http_is_verbose)
936 fprintf(stderr, "Getting index for pack %s\n", sha1_to_hex(sha1));
938 end_url_with_slash(&buf, base_url);
939 strbuf_addf(&buf, "objects/pack/pack-%s.idx", sha1_to_hex(sha1));
940 url = strbuf_detach(&buf, NULL);
942 strbuf_addf(&buf, "%s.temp", sha1_pack_index_name(sha1));
943 tmp = strbuf_detach(&buf, NULL);
945 if (http_get_file(url, tmp, 0) != HTTP_OK) {
946 error("Unable to get pack index %s\n", url);
947 free(tmp);
948 tmp = NULL;
951 free(url);
952 return tmp;
955 static int fetch_and_setup_pack_index(struct packed_git **packs_head,
956 unsigned char *sha1, const char *base_url)
958 struct packed_git *new_pack;
959 char *tmp_idx = NULL;
960 int ret;
962 if (has_pack_index(sha1)) {
963 new_pack = parse_pack_index(sha1, NULL);
964 if (!new_pack)
965 return -1; /* parse_pack_index() already issued error message */
966 goto add_pack;
969 tmp_idx = fetch_pack_index(sha1, base_url);
970 if (!tmp_idx)
971 return -1;
973 new_pack = parse_pack_index(sha1, tmp_idx);
974 if (!new_pack) {
975 unlink(tmp_idx);
976 free(tmp_idx);
978 return -1; /* parse_pack_index() already issued error message */
981 ret = verify_pack_index(new_pack);
982 if (!ret) {
983 close_pack_index(new_pack);
984 ret = move_temp_to_file(tmp_idx, sha1_pack_index_name(sha1));
986 free(tmp_idx);
987 if (ret)
988 return -1;
990 add_pack:
991 new_pack->next = *packs_head;
992 *packs_head = new_pack;
993 return 0;
996 int http_get_info_packs(const char *base_url, struct packed_git **packs_head)
998 int ret = 0, i = 0;
999 char *url, *data;
1000 struct strbuf buf = STRBUF_INIT;
1001 unsigned char sha1[20];
1003 end_url_with_slash(&buf, base_url);
1004 strbuf_addstr(&buf, "objects/info/packs");
1005 url = strbuf_detach(&buf, NULL);
1007 ret = http_get_strbuf(url, &buf, HTTP_NO_CACHE);
1008 if (ret != HTTP_OK)
1009 goto cleanup;
1011 data = buf.buf;
1012 while (i < buf.len) {
1013 switch (data[i]) {
1014 case 'P':
1015 i++;
1016 if (i + 52 <= buf.len &&
1017 !prefixcmp(data + i, " pack-") &&
1018 !prefixcmp(data + i + 46, ".pack\n")) {
1019 get_sha1_hex(data + i + 6, sha1);
1020 fetch_and_setup_pack_index(packs_head, sha1,
1021 base_url);
1022 i += 51;
1023 break;
1025 default:
1026 while (i < buf.len && data[i] != '\n')
1027 i++;
1029 i++;
1032 cleanup:
1033 free(url);
1034 return ret;
1037 void release_http_pack_request(struct http_pack_request *preq)
1039 if (preq->packfile != NULL) {
1040 fclose(preq->packfile);
1041 preq->packfile = NULL;
1042 preq->slot->local = NULL;
1044 if (preq->range_header != NULL) {
1045 curl_slist_free_all(preq->range_header);
1046 preq->range_header = NULL;
1048 preq->slot = NULL;
1049 free(preq->url);
1052 int finish_http_pack_request(struct http_pack_request *preq)
1054 struct packed_git **lst;
1055 struct packed_git *p = preq->target;
1056 char *tmp_idx;
1057 struct child_process ip;
1058 const char *ip_argv[8];
1060 close_pack_index(p);
1062 fclose(preq->packfile);
1063 preq->packfile = NULL;
1064 preq->slot->local = NULL;
1066 lst = preq->lst;
1067 while (*lst != p)
1068 lst = &((*lst)->next);
1069 *lst = (*lst)->next;
1071 tmp_idx = xstrdup(preq->tmpfile);
1072 strcpy(tmp_idx + strlen(tmp_idx) - strlen(".pack.temp"),
1073 ".idx.temp");
1075 ip_argv[0] = "index-pack";
1076 ip_argv[1] = "-o";
1077 ip_argv[2] = tmp_idx;
1078 ip_argv[3] = preq->tmpfile;
1079 ip_argv[4] = NULL;
1081 memset(&ip, 0, sizeof(ip));
1082 ip.argv = ip_argv;
1083 ip.git_cmd = 1;
1084 ip.no_stdin = 1;
1085 ip.no_stdout = 1;
1087 if (run_command(&ip)) {
1088 unlink(preq->tmpfile);
1089 unlink(tmp_idx);
1090 free(tmp_idx);
1091 return -1;
1094 unlink(sha1_pack_index_name(p->sha1));
1096 if (move_temp_to_file(preq->tmpfile, sha1_pack_name(p->sha1))
1097 || move_temp_to_file(tmp_idx, sha1_pack_index_name(p->sha1))) {
1098 free(tmp_idx);
1099 return -1;
1102 install_packed_git(p);
1103 free(tmp_idx);
1104 return 0;
1107 struct http_pack_request *new_http_pack_request(
1108 struct packed_git *target, const char *base_url)
1110 long prev_posn = 0;
1111 char range[RANGE_HEADER_SIZE];
1112 struct strbuf buf = STRBUF_INIT;
1113 struct http_pack_request *preq;
1115 preq = xmalloc(sizeof(*preq));
1116 preq->target = target;
1117 preq->range_header = NULL;
1119 end_url_with_slash(&buf, base_url);
1120 strbuf_addf(&buf, "objects/pack/pack-%s.pack",
1121 sha1_to_hex(target->sha1));
1122 preq->url = strbuf_detach(&buf, NULL);
1124 snprintf(preq->tmpfile, sizeof(preq->tmpfile), "%s.temp",
1125 sha1_pack_name(target->sha1));
1126 preq->packfile = fopen(preq->tmpfile, "a");
1127 if (!preq->packfile) {
1128 error("Unable to open local file %s for pack",
1129 preq->tmpfile);
1130 goto abort;
1133 preq->slot = get_active_slot();
1134 preq->slot->local = preq->packfile;
1135 curl_easy_setopt(preq->slot->curl, CURLOPT_FILE, preq->packfile);
1136 curl_easy_setopt(preq->slot->curl, CURLOPT_WRITEFUNCTION, fwrite);
1137 curl_easy_setopt(preq->slot->curl, CURLOPT_URL, preq->url);
1138 curl_easy_setopt(preq->slot->curl, CURLOPT_HTTPHEADER,
1139 no_pragma_header);
1142 * If there is data present from a previous transfer attempt,
1143 * resume where it left off
1145 prev_posn = ftell(preq->packfile);
1146 if (prev_posn>0) {
1147 if (http_is_verbose)
1148 fprintf(stderr,
1149 "Resuming fetch of pack %s at byte %ld\n",
1150 sha1_to_hex(target->sha1), prev_posn);
1151 sprintf(range, "Range: bytes=%ld-", prev_posn);
1152 preq->range_header = curl_slist_append(NULL, range);
1153 curl_easy_setopt(preq->slot->curl, CURLOPT_HTTPHEADER,
1154 preq->range_header);
1157 return preq;
1159 abort:
1160 free(preq->url);
1161 free(preq);
1162 return NULL;
1165 /* Helpers for fetching objects (loose) */
1166 static size_t fwrite_sha1_file(void *ptr, size_t eltsize, size_t nmemb,
1167 void *data)
1169 unsigned char expn[4096];
1170 size_t size = eltsize * nmemb;
1171 int posn = 0;
1172 struct http_object_request *freq =
1173 (struct http_object_request *)data;
1174 do {
1175 ssize_t retval = xwrite(freq->localfile,
1176 (char *) ptr + posn, size - posn);
1177 if (retval < 0)
1178 return posn;
1179 posn += retval;
1180 } while (posn < size);
1182 freq->stream.avail_in = size;
1183 freq->stream.next_in = ptr;
1184 do {
1185 freq->stream.next_out = expn;
1186 freq->stream.avail_out = sizeof(expn);
1187 freq->zret = git_inflate(&freq->stream, Z_SYNC_FLUSH);
1188 git_SHA1_Update(&freq->c, expn,
1189 sizeof(expn) - freq->stream.avail_out);
1190 } while (freq->stream.avail_in && freq->zret == Z_OK);
1191 data_received++;
1192 return size;
1195 struct http_object_request *new_http_object_request(const char *base_url,
1196 unsigned char *sha1)
1198 char *hex = sha1_to_hex(sha1);
1199 char *filename;
1200 char prevfile[PATH_MAX];
1201 int prevlocal;
1202 unsigned char prev_buf[PREV_BUF_SIZE];
1203 ssize_t prev_read = 0;
1204 long prev_posn = 0;
1205 char range[RANGE_HEADER_SIZE];
1206 struct curl_slist *range_header = NULL;
1207 struct http_object_request *freq;
1209 freq = xmalloc(sizeof(*freq));
1210 hashcpy(freq->sha1, sha1);
1211 freq->localfile = -1;
1213 filename = sha1_file_name(sha1);
1214 snprintf(freq->tmpfile, sizeof(freq->tmpfile),
1215 "%s.temp", filename);
1217 snprintf(prevfile, sizeof(prevfile), "%s.prev", filename);
1218 unlink_or_warn(prevfile);
1219 rename(freq->tmpfile, prevfile);
1220 unlink_or_warn(freq->tmpfile);
1222 if (freq->localfile != -1)
1223 error("fd leakage in start: %d", freq->localfile);
1224 freq->localfile = open(freq->tmpfile,
1225 O_WRONLY | O_CREAT | O_EXCL, 0666);
1227 * This could have failed due to the "lazy directory creation";
1228 * try to mkdir the last path component.
1230 if (freq->localfile < 0 && errno == ENOENT) {
1231 char *dir = strrchr(freq->tmpfile, '/');
1232 if (dir) {
1233 *dir = 0;
1234 mkdir(freq->tmpfile, 0777);
1235 *dir = '/';
1237 freq->localfile = open(freq->tmpfile,
1238 O_WRONLY | O_CREAT | O_EXCL, 0666);
1241 if (freq->localfile < 0) {
1242 error("Couldn't create temporary file %s: %s",
1243 freq->tmpfile, strerror(errno));
1244 goto abort;
1247 memset(&freq->stream, 0, sizeof(freq->stream));
1249 git_inflate_init(&freq->stream);
1251 git_SHA1_Init(&freq->c);
1253 freq->url = get_remote_object_url(base_url, hex, 0);
1256 * If a previous temp file is present, process what was already
1257 * fetched.
1259 prevlocal = open(prevfile, O_RDONLY);
1260 if (prevlocal != -1) {
1261 do {
1262 prev_read = xread(prevlocal, prev_buf, PREV_BUF_SIZE);
1263 if (prev_read>0) {
1264 if (fwrite_sha1_file(prev_buf,
1266 prev_read,
1267 freq) == prev_read) {
1268 prev_posn += prev_read;
1269 } else {
1270 prev_read = -1;
1273 } while (prev_read > 0);
1274 close(prevlocal);
1276 unlink_or_warn(prevfile);
1279 * Reset inflate/SHA1 if there was an error reading the previous temp
1280 * file; also rewind to the beginning of the local file.
1282 if (prev_read == -1) {
1283 memset(&freq->stream, 0, sizeof(freq->stream));
1284 git_inflate_init(&freq->stream);
1285 git_SHA1_Init(&freq->c);
1286 if (prev_posn>0) {
1287 prev_posn = 0;
1288 lseek(freq->localfile, 0, SEEK_SET);
1289 if (ftruncate(freq->localfile, 0) < 0) {
1290 error("Couldn't truncate temporary file %s: %s",
1291 freq->tmpfile, strerror(errno));
1292 goto abort;
1297 freq->slot = get_active_slot();
1299 curl_easy_setopt(freq->slot->curl, CURLOPT_FILE, freq);
1300 curl_easy_setopt(freq->slot->curl, CURLOPT_WRITEFUNCTION, fwrite_sha1_file);
1301 curl_easy_setopt(freq->slot->curl, CURLOPT_ERRORBUFFER, freq->errorstr);
1302 curl_easy_setopt(freq->slot->curl, CURLOPT_URL, freq->url);
1303 curl_easy_setopt(freq->slot->curl, CURLOPT_HTTPHEADER, no_pragma_header);
1306 * If we have successfully processed data from a previous fetch
1307 * attempt, only fetch the data we don't already have.
1309 if (prev_posn>0) {
1310 if (http_is_verbose)
1311 fprintf(stderr,
1312 "Resuming fetch of object %s at byte %ld\n",
1313 hex, prev_posn);
1314 sprintf(range, "Range: bytes=%ld-", prev_posn);
1315 range_header = curl_slist_append(range_header, range);
1316 curl_easy_setopt(freq->slot->curl,
1317 CURLOPT_HTTPHEADER, range_header);
1320 return freq;
1322 abort:
1323 free(filename);
1324 free(freq->url);
1325 free(freq);
1326 return NULL;
1329 void process_http_object_request(struct http_object_request *freq)
1331 if (freq->slot == NULL)
1332 return;
1333 freq->curl_result = freq->slot->curl_result;
1334 freq->http_code = freq->slot->http_code;
1335 freq->slot = NULL;
1338 int finish_http_object_request(struct http_object_request *freq)
1340 struct stat st;
1342 close(freq->localfile);
1343 freq->localfile = -1;
1345 process_http_object_request(freq);
1347 if (freq->http_code == 416) {
1348 warning("requested range invalid; we may already have all the data.");
1349 } else if (freq->curl_result != CURLE_OK) {
1350 if (stat(freq->tmpfile, &st) == 0)
1351 if (st.st_size == 0)
1352 unlink_or_warn(freq->tmpfile);
1353 return -1;
1356 git_inflate_end(&freq->stream);
1357 git_SHA1_Final(freq->real_sha1, &freq->c);
1358 if (freq->zret != Z_STREAM_END) {
1359 unlink_or_warn(freq->tmpfile);
1360 return -1;
1362 if (hashcmp(freq->sha1, freq->real_sha1)) {
1363 unlink_or_warn(freq->tmpfile);
1364 return -1;
1366 freq->rename =
1367 move_temp_to_file(freq->tmpfile, sha1_file_name(freq->sha1));
1369 return freq->rename;
1372 void abort_http_object_request(struct http_object_request *freq)
1374 unlink_or_warn(freq->tmpfile);
1376 release_http_object_request(freq);
1379 void release_http_object_request(struct http_object_request *freq)
1381 if (freq->localfile != -1) {
1382 close(freq->localfile);
1383 freq->localfile = -1;
1385 if (freq->url != NULL) {
1386 free(freq->url);
1387 freq->url = NULL;
1389 if (freq->slot != NULL) {
1390 freq->slot->callback_func = NULL;
1391 freq->slot->callback_data = NULL;
1392 release_active_slot(freq->slot);
1393 freq->slot = NULL;