Update documentation for C-style quoting.
[git/jnareb-git/bp-gitweb.git] / http-fetch.c
blobefa6e82329ad514fc31f7c5d335e9b6ec962d95b
1 #include "cache.h"
2 #include "commit.h"
3 #include "pack.h"
4 #include "fetch.h"
6 #include <curl/curl.h>
7 #include <curl/easy.h>
9 #if LIBCURL_VERSION_NUM >= 0x070908
10 #define USE_CURL_MULTI
11 #define DEFAULT_MAX_REQUESTS 5
12 #endif
14 #if LIBCURL_VERSION_NUM < 0x070704
15 #define curl_global_cleanup() do { /* nothing */ } while(0)
16 #endif
17 #if LIBCURL_VERSION_NUM < 0x070800
18 #define curl_global_init(a) do { /* nothing */ } while(0)
19 #endif
21 #if LIBCURL_VERSION_NUM < 0x070c04
22 #define NO_CURL_EASY_DUPHANDLE
23 #endif
25 #define PREV_BUF_SIZE 4096
26 #define RANGE_HEADER_SIZE 30
28 static int active_requests = 0;
29 static int data_received;
31 #ifdef USE_CURL_MULTI
32 static int max_requests = -1;
33 static CURLM *curlm;
34 #endif
35 #ifndef NO_CURL_EASY_DUPHANDLE
36 static CURL *curl_default;
37 #endif
38 static struct curl_slist *pragma_header;
39 static struct curl_slist *no_pragma_header;
40 static struct curl_slist *no_range_header;
41 static char curl_errorstr[CURL_ERROR_SIZE];
43 struct alt_base
45 char *base;
46 int got_indices;
47 struct packed_git *packs;
48 struct alt_base *next;
51 static struct alt_base *alt = NULL;
53 enum transfer_state {
54 WAITING,
55 ABORTED,
56 ACTIVE,
57 COMPLETE,
60 struct transfer_request
62 unsigned char sha1[20];
63 struct alt_base *repo;
64 char *url;
65 char filename[PATH_MAX];
66 char tmpfile[PATH_MAX];
67 int local;
68 enum transfer_state state;
69 CURLcode curl_result;
70 char errorstr[CURL_ERROR_SIZE];
71 long http_code;
72 unsigned char real_sha1[20];
73 SHA_CTX c;
74 z_stream stream;
75 int zret;
76 int rename;
77 struct active_request_slot *slot;
78 struct transfer_request *next;
81 struct active_request_slot
83 CURL *curl;
84 FILE *local;
85 int in_use;
86 int done;
87 CURLcode curl_result;
88 struct active_request_slot *next;
91 static struct transfer_request *request_queue_head = NULL;
92 static struct active_request_slot *active_queue_head = NULL;
94 static int curl_ssl_verify = -1;
95 static char *ssl_cert = NULL;
96 #if LIBCURL_VERSION_NUM >= 0x070902
97 static char *ssl_key = NULL;
98 #endif
99 #if LIBCURL_VERSION_NUM >= 0x070908
100 static char *ssl_capath = NULL;
101 #endif
102 static char *ssl_cainfo = NULL;
104 struct buffer
106 size_t posn;
107 size_t size;
108 void *buffer;
111 static int http_options(const char *var, const char *value)
113 if (!strcmp("http.sslverify", var)) {
114 if (curl_ssl_verify == -1) {
115 curl_ssl_verify = git_config_bool(var, value);
117 return 0;
120 if (!strcmp("http.sslcert", var)) {
121 if (ssl_cert == NULL) {
122 ssl_cert = xmalloc(strlen(value)+1);
123 strcpy(ssl_cert, value);
125 return 0;
127 #if LIBCURL_VERSION_NUM >= 0x070902
128 if (!strcmp("http.sslkey", var)) {
129 if (ssl_key == NULL) {
130 ssl_key = xmalloc(strlen(value)+1);
131 strcpy(ssl_key, value);
133 return 0;
135 #endif
136 #if LIBCURL_VERSION_NUM >= 0x070908
137 if (!strcmp("http.sslcapath", var)) {
138 if (ssl_capath == NULL) {
139 ssl_capath = xmalloc(strlen(value)+1);
140 strcpy(ssl_capath, value);
142 return 0;
144 #endif
145 if (!strcmp("http.sslcainfo", var)) {
146 if (ssl_cainfo == NULL) {
147 ssl_cainfo = xmalloc(strlen(value)+1);
148 strcpy(ssl_cainfo, value);
150 return 0;
153 #ifdef USE_CURL_MULTI
154 if (!strcmp("http.maxrequests", var)) {
155 if (max_requests == -1)
156 max_requests = git_config_int(var, value);
157 return 0;
159 #endif
161 /* Fall back on the default ones */
162 return git_default_config(var, value);
165 static size_t fwrite_buffer(void *ptr, size_t eltsize, size_t nmemb,
166 struct buffer *buffer)
168 size_t size = eltsize * nmemb;
169 if (size > buffer->size - buffer->posn)
170 size = buffer->size - buffer->posn;
171 memcpy(buffer->buffer + buffer->posn, ptr, size);
172 buffer->posn += size;
173 data_received++;
174 return size;
177 static size_t fwrite_buffer_dynamic(const void *ptr, size_t eltsize,
178 size_t nmemb, struct buffer *buffer)
180 size_t size = eltsize * nmemb;
181 if (size > buffer->size - buffer->posn) {
182 buffer->size = buffer->size * 3 / 2;
183 if (buffer->size < buffer->posn + size)
184 buffer->size = buffer->posn + size;
185 buffer->buffer = xrealloc(buffer->buffer, buffer->size);
187 memcpy(buffer->buffer + buffer->posn, ptr, size);
188 buffer->posn += size;
189 data_received++;
190 return size;
193 static size_t fwrite_sha1_file(void *ptr, size_t eltsize, size_t nmemb,
194 void *data)
196 unsigned char expn[4096];
197 size_t size = eltsize * nmemb;
198 int posn = 0;
199 struct transfer_request *request = (struct transfer_request *)data;
200 do {
201 ssize_t retval = write(request->local,
202 ptr + posn, size - posn);
203 if (retval < 0)
204 return posn;
205 posn += retval;
206 } while (posn < size);
208 request->stream.avail_in = size;
209 request->stream.next_in = ptr;
210 do {
211 request->stream.next_out = expn;
212 request->stream.avail_out = sizeof(expn);
213 request->zret = inflate(&request->stream, Z_SYNC_FLUSH);
214 SHA1_Update(&request->c, expn,
215 sizeof(expn) - request->stream.avail_out);
216 } while (request->stream.avail_in && request->zret == Z_OK);
217 data_received++;
218 return size;
221 #ifdef USE_CURL_MULTI
222 static void process_curl_messages(void);
223 static void process_request_queue(void);
224 #endif
226 static CURL* get_curl_handle(void)
228 CURL* result = curl_easy_init();
230 curl_easy_setopt(result, CURLOPT_SSL_VERIFYPEER, curl_ssl_verify);
231 #if LIBCURL_VERSION_NUM >= 0x070907
232 curl_easy_setopt(result, CURLOPT_NETRC, CURL_NETRC_OPTIONAL);
233 #endif
235 if (ssl_cert != NULL)
236 curl_easy_setopt(result, CURLOPT_SSLCERT, ssl_cert);
237 #if LIBCURL_VERSION_NUM >= 0x070902
238 if (ssl_key != NULL)
239 curl_easy_setopt(result, CURLOPT_SSLKEY, ssl_key);
240 #endif
241 #if LIBCURL_VERSION_NUM >= 0x070908
242 if (ssl_capath != NULL)
243 curl_easy_setopt(result, CURLOPT_CAPATH, ssl_capath);
244 #endif
245 if (ssl_cainfo != NULL)
246 curl_easy_setopt(result, CURLOPT_CAINFO, ssl_cainfo);
247 curl_easy_setopt(result, CURLOPT_FAILONERROR, 1);
249 return result;
252 static struct active_request_slot *get_active_slot(void)
254 struct active_request_slot *slot = active_queue_head;
255 struct active_request_slot *newslot;
257 #ifdef USE_CURL_MULTI
258 int num_transfers;
260 /* Wait for a slot to open up if the queue is full */
261 while (active_requests >= max_requests) {
262 curl_multi_perform(curlm, &num_transfers);
263 if (num_transfers < active_requests) {
264 process_curl_messages();
267 #endif
269 while (slot != NULL && slot->in_use) {
270 slot = slot->next;
272 if (slot == NULL) {
273 newslot = xmalloc(sizeof(*newslot));
274 #ifdef NO_CURL_EASY_DUPHANDLE
275 newslot->curl = get_curl_handle();
276 #else
277 newslot->curl = curl_easy_duphandle(curl_default);
278 #endif
279 newslot->in_use = 0;
280 newslot->next = NULL;
282 slot = active_queue_head;
283 if (slot == NULL) {
284 active_queue_head = newslot;
285 } else {
286 while (slot->next != NULL) {
287 slot = slot->next;
289 slot->next = newslot;
291 slot = newslot;
294 active_requests++;
295 slot->in_use = 1;
296 slot->done = 0;
297 slot->local = NULL;
298 curl_easy_setopt(slot->curl, CURLOPT_HTTPHEADER, pragma_header);
299 curl_easy_setopt(slot->curl, CURLOPT_HTTPHEADER, no_range_header);
300 curl_easy_setopt(slot->curl, CURLOPT_ERRORBUFFER, curl_errorstr);
302 return slot;
305 static int start_active_slot(struct active_request_slot *slot)
307 #ifdef USE_CURL_MULTI
308 CURLMcode curlm_result = curl_multi_add_handle(curlm, slot->curl);
310 if (curlm_result != CURLM_OK &&
311 curlm_result != CURLM_CALL_MULTI_PERFORM) {
312 active_requests--;
313 slot->in_use = 0;
314 return 0;
316 #endif
317 return 1;
320 static void run_active_slot(struct active_request_slot *slot)
322 #ifdef USE_CURL_MULTI
323 int num_transfers;
324 long last_pos = 0;
325 long current_pos;
326 fd_set readfds;
327 fd_set writefds;
328 fd_set excfds;
329 int max_fd;
330 struct timeval select_timeout;
331 CURLMcode curlm_result;
333 while (!slot->done) {
334 data_received = 0;
335 do {
336 curlm_result = curl_multi_perform(curlm,
337 &num_transfers);
338 } while (curlm_result == CURLM_CALL_MULTI_PERFORM);
339 if (num_transfers < active_requests) {
340 process_curl_messages();
341 process_request_queue();
344 if (!data_received && slot->local != NULL) {
345 current_pos = ftell(slot->local);
346 if (current_pos > last_pos)
347 data_received++;
348 last_pos = current_pos;
351 if (!slot->done && !data_received) {
352 max_fd = 0;
353 FD_ZERO(&readfds);
354 FD_ZERO(&writefds);
355 FD_ZERO(&excfds);
356 select_timeout.tv_sec = 0;
357 select_timeout.tv_usec = 50000;
358 select(max_fd, &readfds, &writefds,
359 &excfds, &select_timeout);
362 #else
363 slot->curl_result = curl_easy_perform(slot->curl);
364 active_requests--;
365 #endif
368 static void start_request(struct transfer_request *request)
370 char *hex = sha1_to_hex(request->sha1);
371 char prevfile[PATH_MAX];
372 char *url;
373 char *posn;
374 int prevlocal;
375 unsigned char prev_buf[PREV_BUF_SIZE];
376 ssize_t prev_read = 0;
377 long prev_posn = 0;
378 char range[RANGE_HEADER_SIZE];
379 struct curl_slist *range_header = NULL;
380 struct active_request_slot *slot;
382 snprintf(prevfile, sizeof(prevfile), "%s.prev", request->filename);
383 unlink(prevfile);
384 rename(request->tmpfile, prevfile);
385 unlink(request->tmpfile);
387 request->local = open(request->tmpfile,
388 O_WRONLY | O_CREAT | O_EXCL, 0666);
389 /* This could have failed due to the "lazy directory creation";
390 * try to mkdir the last path component.
392 if (request->local < 0 && errno == ENOENT) {
393 char *dir = strrchr(request->tmpfile, '/');
394 if (dir) {
395 *dir = 0;
396 mkdir(request->tmpfile, 0777);
397 *dir = '/';
399 request->local = open(request->tmpfile,
400 O_WRONLY | O_CREAT | O_EXCL, 0666);
403 if (request->local < 0) {
404 request->state = ABORTED;
405 error("Couldn't create temporary file %s for %s: %s\n",
406 request->tmpfile, request->filename, strerror(errno));
407 return;
410 memset(&request->stream, 0, sizeof(request->stream));
412 inflateInit(&request->stream);
414 SHA1_Init(&request->c);
416 url = xmalloc(strlen(request->repo->base) + 50);
417 request->url = xmalloc(strlen(request->repo->base) + 50);
418 strcpy(url, request->repo->base);
419 posn = url + strlen(request->repo->base);
420 strcpy(posn, "objects/");
421 posn += 8;
422 memcpy(posn, hex, 2);
423 posn += 2;
424 *(posn++) = '/';
425 strcpy(posn, hex + 2);
426 strcpy(request->url, url);
428 /* If a previous temp file is present, process what was already
429 fetched. */
430 prevlocal = open(prevfile, O_RDONLY);
431 if (prevlocal != -1) {
432 do {
433 prev_read = read(prevlocal, prev_buf, PREV_BUF_SIZE);
434 if (prev_read>0) {
435 if (fwrite_sha1_file(prev_buf,
437 prev_read,
438 request) == prev_read) {
439 prev_posn += prev_read;
440 } else {
441 prev_read = -1;
444 } while (prev_read > 0);
445 close(prevlocal);
447 unlink(prevfile);
449 /* Reset inflate/SHA1 if there was an error reading the previous temp
450 file; also rewind to the beginning of the local file. */
451 if (prev_read == -1) {
452 memset(&request->stream, 0, sizeof(request->stream));
453 inflateInit(&request->stream);
454 SHA1_Init(&request->c);
455 if (prev_posn>0) {
456 prev_posn = 0;
457 lseek(request->local, SEEK_SET, 0);
458 ftruncate(request->local, 0);
462 slot = get_active_slot();
463 curl_easy_setopt(slot->curl, CURLOPT_FILE, request);
464 curl_easy_setopt(slot->curl, CURLOPT_WRITEFUNCTION, fwrite_sha1_file);
465 curl_easy_setopt(slot->curl, CURLOPT_ERRORBUFFER, request->errorstr);
466 curl_easy_setopt(slot->curl, CURLOPT_URL, url);
467 curl_easy_setopt(slot->curl, CURLOPT_HTTPHEADER, no_pragma_header);
469 /* If we have successfully processed data from a previous fetch
470 attempt, only fetch the data we don't already have. */
471 if (prev_posn>0) {
472 if (get_verbosely)
473 fprintf(stderr,
474 "Resuming fetch of object %s at byte %ld\n",
475 hex, prev_posn);
476 sprintf(range, "Range: bytes=%ld-", prev_posn);
477 range_header = curl_slist_append(range_header, range);
478 curl_easy_setopt(slot->curl,
479 CURLOPT_HTTPHEADER, range_header);
482 /* Try to get the request started, abort the request on error */
483 if (!start_active_slot(slot)) {
484 request->state = ABORTED;
485 close(request->local);
486 free(request->url);
487 return;
490 request->slot = slot;
491 request->state = ACTIVE;
494 static void finish_request(struct transfer_request *request)
496 fchmod(request->local, 0444);
497 close(request->local);
499 if (request->http_code == 416) {
500 fprintf(stderr, "Warning: requested range invalid; we may already have all the data.\n");
501 } else if (request->curl_result != CURLE_OK) {
502 return;
505 inflateEnd(&request->stream);
506 SHA1_Final(request->real_sha1, &request->c);
507 if (request->zret != Z_STREAM_END) {
508 unlink(request->tmpfile);
509 return;
511 if (memcmp(request->sha1, request->real_sha1, 20)) {
512 unlink(request->tmpfile);
513 return;
515 request->rename =
516 move_temp_to_file(request->tmpfile, request->filename);
518 if (request->rename == 0)
519 pull_say("got %s\n", sha1_to_hex(request->sha1));
522 static void release_request(struct transfer_request *request)
524 struct transfer_request *entry = request_queue_head;
526 if (request == request_queue_head) {
527 request_queue_head = request->next;
528 } else {
529 while (entry->next != NULL && entry->next != request)
530 entry = entry->next;
531 if (entry->next == request)
532 entry->next = entry->next->next;
535 free(request->url);
536 free(request);
539 #ifdef USE_CURL_MULTI
540 void process_curl_messages(void)
542 int num_messages;
543 struct active_request_slot *slot;
544 struct transfer_request *request = NULL;
545 CURLMsg *curl_message = curl_multi_info_read(curlm, &num_messages);
547 while (curl_message != NULL) {
548 if (curl_message->msg == CURLMSG_DONE) {
549 slot = active_queue_head;
550 while (slot != NULL &&
551 slot->curl != curl_message->easy_handle)
552 slot = slot->next;
553 if (slot != NULL) {
554 curl_multi_remove_handle(curlm, slot->curl);
555 active_requests--;
556 slot->done = 1;
557 slot->in_use = 0;
558 slot->curl_result = curl_message->data.result;
559 request = request_queue_head;
560 while (request != NULL &&
561 request->slot != slot)
562 request = request->next;
563 } else {
564 fprintf(stderr, "Received DONE message for unknown request!\n");
566 if (request != NULL) {
567 request->curl_result =
568 curl_message->data.result;
569 curl_easy_getinfo(slot->curl,
570 CURLINFO_HTTP_CODE,
571 &request->http_code);
572 request->slot = NULL;
574 /* Use alternates if necessary */
575 if (request->http_code == 404 &&
576 request->repo->next != NULL) {
577 request->repo = request->repo->next;
578 start_request(request);
579 } else {
580 finish_request(request);
581 request->state = COMPLETE;
584 } else {
585 fprintf(stderr, "Unknown CURL message received: %d\n",
586 (int)curl_message->msg);
588 curl_message = curl_multi_info_read(curlm, &num_messages);
592 void process_request_queue(void)
594 struct transfer_request *request = request_queue_head;
595 int num_transfers;
597 while (active_requests < max_requests && request != NULL) {
598 if (request->state == WAITING) {
599 if (has_sha1_file(request->sha1))
600 release_request(request);
601 else
602 start_request(request);
603 curl_multi_perform(curlm, &num_transfers);
605 request = request->next;
608 #endif
610 void prefetch(unsigned char *sha1)
612 struct transfer_request *newreq;
613 struct transfer_request *tail;
614 char *filename = sha1_file_name(sha1);
616 newreq = xmalloc(sizeof(*newreq));
617 memcpy(newreq->sha1, sha1, 20);
618 newreq->repo = alt;
619 newreq->url = NULL;
620 newreq->local = -1;
621 newreq->state = WAITING;
622 snprintf(newreq->filename, sizeof(newreq->filename), "%s", filename);
623 snprintf(newreq->tmpfile, sizeof(newreq->tmpfile),
624 "%s.temp", filename);
625 newreq->next = NULL;
627 if (request_queue_head == NULL) {
628 request_queue_head = newreq;
629 } else {
630 tail = request_queue_head;
631 while (tail->next != NULL) {
632 tail = tail->next;
634 tail->next = newreq;
636 #ifdef USE_CURL_MULTI
637 process_request_queue();
638 process_curl_messages();
639 #endif
642 static int fetch_index(struct alt_base *repo, unsigned char *sha1)
644 char *hex = sha1_to_hex(sha1);
645 char *filename;
646 char *url;
647 char tmpfile[PATH_MAX];
648 long prev_posn = 0;
649 char range[RANGE_HEADER_SIZE];
650 struct curl_slist *range_header = NULL;
652 FILE *indexfile;
653 struct active_request_slot *slot;
655 if (has_pack_index(sha1))
656 return 0;
658 if (get_verbosely)
659 fprintf(stderr, "Getting index for pack %s\n", hex);
661 url = xmalloc(strlen(repo->base) + 64);
662 sprintf(url, "%s/objects/pack/pack-%s.idx", repo->base, hex);
664 filename = sha1_pack_index_name(sha1);
665 snprintf(tmpfile, sizeof(tmpfile), "%s.temp", filename);
666 indexfile = fopen(tmpfile, "a");
667 if (!indexfile)
668 return error("Unable to open local file %s for pack index",
669 filename);
671 slot = get_active_slot();
672 curl_easy_setopt(slot->curl, CURLOPT_FILE, indexfile);
673 curl_easy_setopt(slot->curl, CURLOPT_WRITEFUNCTION, fwrite);
674 curl_easy_setopt(slot->curl, CURLOPT_URL, url);
675 curl_easy_setopt(slot->curl, CURLOPT_HTTPHEADER, no_pragma_header);
676 slot->local = indexfile;
678 /* If there is data present from a previous transfer attempt,
679 resume where it left off */
680 prev_posn = ftell(indexfile);
681 if (prev_posn>0) {
682 if (get_verbosely)
683 fprintf(stderr,
684 "Resuming fetch of index for pack %s at byte %ld\n",
685 hex, prev_posn);
686 sprintf(range, "Range: bytes=%ld-", prev_posn);
687 range_header = curl_slist_append(range_header, range);
688 curl_easy_setopt(slot->curl, CURLOPT_HTTPHEADER, range_header);
691 if (start_active_slot(slot)) {
692 run_active_slot(slot);
693 if (slot->curl_result != CURLE_OK) {
694 fclose(indexfile);
695 return error("Unable to get pack index %s\n%s", url,
696 curl_errorstr);
698 } else {
699 return error("Unable to start request");
702 fclose(indexfile);
704 return move_temp_to_file(tmpfile, filename);
707 static int setup_index(struct alt_base *repo, unsigned char *sha1)
709 struct packed_git *new_pack;
710 if (has_pack_file(sha1))
711 return 0; // don't list this as something we can get
713 if (fetch_index(repo, sha1))
714 return -1;
716 new_pack = parse_pack_index(sha1);
717 new_pack->next = repo->packs;
718 repo->packs = new_pack;
719 return 0;
722 static int fetch_alternates(char *base)
724 int ret = 0;
725 struct buffer buffer;
726 char *url;
727 char *data;
728 int i = 0;
729 int http_specific = 1;
730 struct alt_base *tail = alt;
731 static const char null_byte = '\0';
733 struct active_request_slot *slot;
735 data = xmalloc(4096);
736 buffer.size = 4096;
737 buffer.posn = 0;
738 buffer.buffer = data;
740 if (get_verbosely)
741 fprintf(stderr, "Getting alternates list\n");
743 url = xmalloc(strlen(base) + 31);
744 sprintf(url, "%s/objects/info/http-alternates", base);
746 slot = get_active_slot();
747 curl_easy_setopt(slot->curl, CURLOPT_FILE, &buffer);
748 curl_easy_setopt(slot->curl, CURLOPT_WRITEFUNCTION,
749 fwrite_buffer_dynamic);
750 curl_easy_setopt(slot->curl, CURLOPT_URL, url);
751 if (start_active_slot(slot)) {
752 run_active_slot(slot);
753 if (slot->curl_result != CURLE_OK || !buffer.posn) {
754 http_specific = 0;
756 sprintf(url, "%s/objects/info/alternates", base);
758 slot = get_active_slot();
759 curl_easy_setopt(slot->curl, CURLOPT_FILE, &buffer);
760 curl_easy_setopt(slot->curl, CURLOPT_WRITEFUNCTION,
761 fwrite_buffer_dynamic);
762 curl_easy_setopt(slot->curl, CURLOPT_URL, url);
763 if (start_active_slot(slot)) {
764 run_active_slot(slot);
765 if (slot->curl_result != CURLE_OK) {
766 free(buffer.buffer);
767 return 0;
771 } else {
772 free(buffer.buffer);
773 return 0;
776 fwrite_buffer_dynamic(&null_byte, 1, 1, &buffer);
777 buffer.posn--;
778 data = buffer.buffer;
780 while (i < buffer.posn) {
781 int posn = i;
782 while (posn < buffer.posn && data[posn] != '\n')
783 posn++;
784 if (data[posn] == '\n') {
785 int okay = 0;
786 int serverlen = 0;
787 struct alt_base *newalt;
788 char *target = NULL;
789 if (data[i] == '/') {
790 serverlen = strchr(base + 8, '/') - base;
791 okay = 1;
792 } else if (!memcmp(data + i, "../", 3)) {
793 i += 3;
794 serverlen = strlen(base);
795 while (i + 2 < posn &&
796 !memcmp(data + i, "../", 3)) {
797 do {
798 serverlen--;
799 } while (serverlen &&
800 base[serverlen - 1] != '/');
801 i += 3;
803 // If the server got removed, give up.
804 okay = strchr(base, ':') - base + 3 <
805 serverlen;
806 } else if (http_specific) {
807 char *colon = strchr(data + i, ':');
808 char *slash = strchr(data + i, '/');
809 if (colon && slash && colon < data + posn &&
810 slash < data + posn && colon < slash) {
811 okay = 1;
814 // skip 'objects' at end
815 if (okay) {
816 target = xmalloc(serverlen + posn - i - 6);
817 strncpy(target, base, serverlen);
818 strncpy(target + serverlen, data + i,
819 posn - i - 7);
820 target[serverlen + posn - i - 7] = '\0';
821 if (get_verbosely)
822 fprintf(stderr,
823 "Also look at %s\n", target);
824 newalt = xmalloc(sizeof(*newalt));
825 newalt->next = NULL;
826 newalt->base = target;
827 newalt->got_indices = 0;
828 newalt->packs = NULL;
829 while (tail->next != NULL)
830 tail = tail->next;
831 tail->next = newalt;
832 ret++;
835 i = posn + 1;
838 free(buffer.buffer);
839 return ret;
842 static int fetch_indices(struct alt_base *repo)
844 unsigned char sha1[20];
845 char *url;
846 struct buffer buffer;
847 char *data;
848 int i = 0;
850 struct active_request_slot *slot;
852 if (repo->got_indices)
853 return 0;
855 data = xmalloc(4096);
856 buffer.size = 4096;
857 buffer.posn = 0;
858 buffer.buffer = data;
860 if (get_verbosely)
861 fprintf(stderr, "Getting pack list\n");
863 url = xmalloc(strlen(repo->base) + 21);
864 sprintf(url, "%s/objects/info/packs", repo->base);
866 slot = get_active_slot();
867 curl_easy_setopt(slot->curl, CURLOPT_FILE, &buffer);
868 curl_easy_setopt(slot->curl, CURLOPT_WRITEFUNCTION,
869 fwrite_buffer_dynamic);
870 curl_easy_setopt(slot->curl, CURLOPT_URL, url);
871 curl_easy_setopt(slot->curl, CURLOPT_HTTPHEADER, NULL);
872 if (start_active_slot(slot)) {
873 run_active_slot(slot);
874 if (slot->curl_result != CURLE_OK) {
875 free(buffer.buffer);
876 return error("%s", curl_errorstr);
878 } else {
879 free(buffer.buffer);
880 return error("Unable to start request");
883 data = buffer.buffer;
884 while (i < buffer.posn) {
885 switch (data[i]) {
886 case 'P':
887 i++;
888 if (i + 52 < buffer.posn &&
889 !strncmp(data + i, " pack-", 6) &&
890 !strncmp(data + i + 46, ".pack\n", 6)) {
891 get_sha1_hex(data + i + 6, sha1);
892 setup_index(repo, sha1);
893 i += 51;
894 break;
896 default:
897 while (data[i] != '\n')
898 i++;
900 i++;
903 free(buffer.buffer);
904 repo->got_indices = 1;
905 return 0;
908 static int fetch_pack(struct alt_base *repo, unsigned char *sha1)
910 char *url;
911 struct packed_git *target;
912 struct packed_git **lst;
913 FILE *packfile;
914 char *filename;
915 char tmpfile[PATH_MAX];
916 int ret;
917 long prev_posn = 0;
918 char range[RANGE_HEADER_SIZE];
919 struct curl_slist *range_header = NULL;
921 struct active_request_slot *slot;
923 if (fetch_indices(repo))
924 return -1;
925 target = find_sha1_pack(sha1, repo->packs);
926 if (!target)
927 return -1;
929 if (get_verbosely) {
930 fprintf(stderr, "Getting pack %s\n",
931 sha1_to_hex(target->sha1));
932 fprintf(stderr, " which contains %s\n",
933 sha1_to_hex(sha1));
936 url = xmalloc(strlen(repo->base) + 65);
937 sprintf(url, "%s/objects/pack/pack-%s.pack",
938 repo->base, sha1_to_hex(target->sha1));
940 filename = sha1_pack_name(target->sha1);
941 snprintf(tmpfile, sizeof(tmpfile), "%s.temp", filename);
942 packfile = fopen(tmpfile, "a");
943 if (!packfile)
944 return error("Unable to open local file %s for pack",
945 filename);
947 slot = get_active_slot();
948 curl_easy_setopt(slot->curl, CURLOPT_FILE, packfile);
949 curl_easy_setopt(slot->curl, CURLOPT_WRITEFUNCTION, fwrite);
950 curl_easy_setopt(slot->curl, CURLOPT_URL, url);
951 curl_easy_setopt(slot->curl, CURLOPT_HTTPHEADER, no_pragma_header);
952 slot->local = packfile;
954 /* If there is data present from a previous transfer attempt,
955 resume where it left off */
956 prev_posn = ftell(packfile);
957 if (prev_posn>0) {
958 if (get_verbosely)
959 fprintf(stderr,
960 "Resuming fetch of pack %s at byte %ld\n",
961 sha1_to_hex(target->sha1), prev_posn);
962 sprintf(range, "Range: bytes=%ld-", prev_posn);
963 range_header = curl_slist_append(range_header, range);
964 curl_easy_setopt(slot->curl, CURLOPT_HTTPHEADER, range_header);
967 if (start_active_slot(slot)) {
968 run_active_slot(slot);
969 if (slot->curl_result != CURLE_OK) {
970 fclose(packfile);
971 return error("Unable to get pack file %s\n%s", url,
972 curl_errorstr);
974 } else {
975 return error("Unable to start request");
978 fclose(packfile);
980 ret = move_temp_to_file(tmpfile, filename);
981 if (ret)
982 return ret;
984 lst = &repo->packs;
985 while (*lst != target)
986 lst = &((*lst)->next);
987 *lst = (*lst)->next;
989 if (verify_pack(target, 0))
990 return -1;
991 install_packed_git(target);
993 return 0;
996 static int fetch_object(struct alt_base *repo, unsigned char *sha1)
998 char *hex = sha1_to_hex(sha1);
999 int ret;
1000 struct transfer_request *request = request_queue_head;
1002 while (request != NULL && memcmp(request->sha1, sha1, 20))
1003 request = request->next;
1004 if (request == NULL)
1005 return error("Couldn't find request for %s in the queue", hex);
1007 if (has_sha1_file(request->sha1)) {
1008 release_request(request);
1009 return 0;
1012 #ifdef USE_CURL_MULTI
1013 while (request->state == WAITING) {
1014 int num_transfers;
1015 curl_multi_perform(curlm, &num_transfers);
1016 if (num_transfers < active_requests) {
1017 process_curl_messages();
1018 process_request_queue();
1021 #else
1022 start_request(request);
1023 #endif
1025 while (request->state == ACTIVE) {
1026 run_active_slot(request->slot);
1027 #ifndef USE_CURL_MULTI
1028 request->curl_result = request->slot->curl_result;
1029 curl_easy_getinfo(request->slot->curl,
1030 CURLINFO_HTTP_CODE,
1031 &request->http_code);
1032 request->slot = NULL;
1034 /* Use alternates if necessary */
1035 if (request->http_code == 404 &&
1036 request->repo->next != NULL) {
1037 request->repo = request->repo->next;
1038 start_request(request);
1039 } else {
1040 finish_request(request);
1041 request->state = COMPLETE;
1043 #endif
1046 if (request->state == ABORTED) {
1047 release_request(request);
1048 return error("Request for %s aborted", hex);
1051 if (request->curl_result != CURLE_OK && request->http_code != 416) {
1052 ret = error("%s (curl_result = %d, http_code = %ld, sha1 = %s)",
1053 request->errorstr, request->curl_result,
1054 request->http_code, hex);
1055 release_request(request);
1056 return ret;
1059 if (request->zret != Z_STREAM_END) {
1060 ret = error("File %s (%s) corrupt\n", hex, request->url);
1061 release_request(request);
1062 return ret;
1065 if (memcmp(request->sha1, request->real_sha1, 20)) {
1066 release_request(request);
1067 return error("File %s has bad hash\n", hex);
1070 if (request->rename < 0) {
1071 ret = error("unable to write sha1 filename %s: %s",
1072 request->filename,
1073 strerror(request->rename));
1074 release_request(request);
1075 return ret;
1078 release_request(request);
1079 return 0;
1082 int fetch(unsigned char *sha1)
1084 struct alt_base *altbase = alt;
1086 if (!fetch_object(altbase, sha1))
1087 return 0;
1088 while (altbase) {
1089 if (!fetch_pack(altbase, sha1))
1090 return 0;
1091 altbase = altbase->next;
1093 return error("Unable to find %s under %s\n", sha1_to_hex(sha1),
1094 alt->base);
1097 static inline int needs_quote(int ch)
1099 switch (ch) {
1100 case '/': case '-': case '.':
1101 case 'A'...'Z': case 'a'...'z': case '0'...'9':
1102 return 0;
1103 default:
1104 return 1;
1108 static inline int hex(int v)
1110 if (v < 10) return '0' + v;
1111 else return 'A' + v - 10;
1114 static char *quote_ref_url(const char *base, const char *ref)
1116 const char *cp;
1117 char *dp, *qref;
1118 int len, baselen, ch;
1120 baselen = strlen(base);
1121 len = baselen + 6; /* "refs/" + NUL */
1122 for (cp = ref; (ch = *cp) != 0; cp++, len++)
1123 if (needs_quote(ch))
1124 len += 2; /* extra two hex plus replacement % */
1125 qref = xmalloc(len);
1126 memcpy(qref, base, baselen);
1127 memcpy(qref + baselen, "refs/", 5);
1128 for (cp = ref, dp = qref + baselen + 5; (ch = *cp) != 0; cp++) {
1129 if (needs_quote(ch)) {
1130 *dp++ = '%';
1131 *dp++ = hex((ch >> 4) & 0xF);
1132 *dp++ = hex(ch & 0xF);
1134 else
1135 *dp++ = ch;
1137 *dp = 0;
1139 return qref;
1142 int fetch_ref(char *ref, unsigned char *sha1)
1144 char *url;
1145 char hex[42];
1146 struct buffer buffer;
1147 char *base = alt->base;
1148 struct active_request_slot *slot;
1149 buffer.size = 41;
1150 buffer.posn = 0;
1151 buffer.buffer = hex;
1152 hex[41] = '\0';
1154 url = quote_ref_url(base, ref);
1155 slot = get_active_slot();
1156 curl_easy_setopt(slot->curl, CURLOPT_FILE, &buffer);
1157 curl_easy_setopt(slot->curl, CURLOPT_WRITEFUNCTION, fwrite_buffer);
1158 curl_easy_setopt(slot->curl, CURLOPT_HTTPHEADER, NULL);
1159 curl_easy_setopt(slot->curl, CURLOPT_URL, url);
1160 if (start_active_slot(slot)) {
1161 run_active_slot(slot);
1162 if (slot->curl_result != CURLE_OK)
1163 return error("Couldn't get %s for %s\n%s",
1164 url, ref, curl_errorstr);
1165 } else {
1166 return error("Unable to start request");
1169 hex[40] = '\0';
1170 get_sha1_hex(hex, sha1);
1171 return 0;
1174 int main(int argc, char **argv)
1176 char *commit_id;
1177 char *url;
1178 int arg = 1;
1179 struct active_request_slot *slot;
1181 while (arg < argc && argv[arg][0] == '-') {
1182 if (argv[arg][1] == 't') {
1183 get_tree = 1;
1184 } else if (argv[arg][1] == 'c') {
1185 get_history = 1;
1186 } else if (argv[arg][1] == 'a') {
1187 get_all = 1;
1188 get_tree = 1;
1189 get_history = 1;
1190 } else if (argv[arg][1] == 'v') {
1191 get_verbosely = 1;
1192 } else if (argv[arg][1] == 'w') {
1193 write_ref = argv[arg + 1];
1194 arg++;
1195 } else if (!strcmp(argv[arg], "--recover")) {
1196 get_recover = 1;
1198 arg++;
1200 if (argc < arg + 2) {
1201 usage("git-http-fetch [-c] [-t] [-a] [-d] [-v] [--recover] [-w ref] commit-id url");
1202 return 1;
1204 commit_id = argv[arg];
1205 url = argv[arg + 1];
1207 curl_global_init(CURL_GLOBAL_ALL);
1209 #ifdef USE_CURL_MULTI
1211 char *http_max_requests = getenv("GIT_HTTP_MAX_REQUESTS");
1212 if (http_max_requests != NULL)
1213 max_requests = atoi(http_max_requests);
1216 curlm = curl_multi_init();
1217 if (curlm == NULL) {
1218 fprintf(stderr, "Error creating curl multi handle.\n");
1219 return 1;
1221 #endif
1223 if (getenv("GIT_SSL_NO_VERIFY"))
1224 curl_ssl_verify = 0;
1226 ssl_cert = getenv("GIT_SSL_CERT");
1227 #if LIBCURL_VERSION_NUM >= 0x070902
1228 ssl_key = getenv("GIT_SSL_KEY");
1229 #endif
1230 #if LIBCURL_VERSION_NUM >= 0x070908
1231 ssl_capath = getenv("GIT_SSL_CAPATH");
1232 #endif
1233 ssl_cainfo = getenv("GIT_SSL_CAINFO");
1235 git_config(http_options);
1237 if (curl_ssl_verify == -1)
1238 curl_ssl_verify = 1;
1240 #ifdef USE_CURL_MULTI
1241 if (max_requests < 1)
1242 max_requests = DEFAULT_MAX_REQUESTS;
1243 #endif
1245 pragma_header = curl_slist_append(pragma_header, "Pragma: no-cache");
1246 no_pragma_header = curl_slist_append(no_pragma_header, "Pragma:");
1247 no_range_header = curl_slist_append(no_range_header, "Range:");
1249 #ifndef NO_CURL_EASY_DUPHANDLE
1250 curl_default = get_curl_handle();
1251 #endif
1253 alt = xmalloc(sizeof(*alt));
1254 alt->base = url;
1255 alt->got_indices = 0;
1256 alt->packs = NULL;
1257 alt->next = NULL;
1258 fetch_alternates(alt->base);
1260 if (pull(commit_id))
1261 return 1;
1263 curl_slist_free_all(pragma_header);
1264 curl_slist_free_all(no_pragma_header);
1265 curl_slist_free_all(no_range_header);
1266 #ifndef NO_CURL_EASY_DUPHANDLE
1267 curl_easy_cleanup(curl_default);
1268 #endif
1269 slot = active_queue_head;
1270 while (slot != NULL) {
1271 curl_easy_cleanup(slot->curl);
1272 slot = slot->next;
1274 #ifdef USE_CURL_MULTI
1275 curl_multi_cleanup(curlm);
1276 #endif
1277 curl_global_cleanup();
1278 return 0;