Merge branch 'tc/http-urls-ends-with-slash' into maint
[git/git.git] / http.c
1 #include "http.h"
2 #include "pack.h"
3 #include "sideband.h"
4 #include "run-command.h"
5 #include "url.h"
6
7 int data_received;
8 int active_requests;
9 int http_is_verbose;
10 size_t http_post_buffer = 16 * LARGE_PACKET_MAX;
11
12 #if LIBCURL_VERSION_NUM >= 0x070a06
13 #define LIBCURL_CAN_HANDLE_AUTH_ANY
14 #endif
15
16 static int min_curl_sessions = 1;
17 static int curl_session_count;
18 #ifdef USE_CURL_MULTI
19 static int max_requests = -1;
20 static CURLM *curlm;
21 #endif
22 #ifndef NO_CURL_EASY_DUPHANDLE
23 static CURL *curl_default;
24 #endif
25
26 #define PREV_BUF_SIZE 4096
27 #define RANGE_HEADER_SIZE 30
28
29 char curl_errorstr[CURL_ERROR_SIZE];
30
31 static int curl_ssl_verify = -1;
32 static const char *ssl_cert;
33 #if LIBCURL_VERSION_NUM >= 0x070903
34 static const char *ssl_key;
35 #endif
36 #if LIBCURL_VERSION_NUM >= 0x070908
37 static const char *ssl_capath;
38 #endif
39 static const char *ssl_cainfo;
40 static long curl_low_speed_limit = -1;
41 static long curl_low_speed_time = -1;
42 static int curl_ftp_no_epsv;
43 static const char *curl_http_proxy;
44 static char *user_name, *user_pass;
45 static const char *user_agent;
46
47 #if LIBCURL_VERSION_NUM >= 0x071700
48 /* Use CURLOPT_KEYPASSWD as is */
49 #elif LIBCURL_VERSION_NUM >= 0x070903
50 #define CURLOPT_KEYPASSWD CURLOPT_SSLKEYPASSWD
51 #else
52 #define CURLOPT_KEYPASSWD CURLOPT_SSLCERTPASSWD
53 #endif
54
55 static char *ssl_cert_password;
56 static int ssl_cert_password_required;
57
58 static struct curl_slist *pragma_header;
59 static struct curl_slist *no_pragma_header;
60
61 static struct active_request_slot *active_queue_head;
62
63 size_t fread_buffer(void *ptr, size_t eltsize, size_t nmemb, void *buffer_)
64 {
65 size_t size = eltsize * nmemb;
66 struct buffer *buffer = buffer_;
67
68 if (size > buffer->buf.len - buffer->posn)
69 size = buffer->buf.len - buffer->posn;
70 memcpy(ptr, buffer->buf.buf + buffer->posn, size);
71 buffer->posn += size;
72
73 return size;
74 }
75
76 #ifndef NO_CURL_IOCTL
77 curlioerr ioctl_buffer(CURL *handle, int cmd, void *clientp)
78 {
79 struct buffer *buffer = clientp;
80
81 switch (cmd) {
82 case CURLIOCMD_NOP:
83 return CURLIOE_OK;
84
85 case CURLIOCMD_RESTARTREAD:
86 buffer->posn = 0;
87 return CURLIOE_OK;
88
89 default:
90 return CURLIOE_UNKNOWNCMD;
91 }
92 }
93 #endif
94
95 size_t fwrite_buffer(const void *ptr, size_t eltsize, size_t nmemb, void *buffer_)
96 {
97 size_t size = eltsize * nmemb;
98 struct strbuf *buffer = buffer_;
99
100 strbuf_add(buffer, ptr, size);
101 data_received++;
102 return size;
103 }
104
105 size_t fwrite_null(const void *ptr, size_t eltsize, size_t nmemb, void *strbuf)
106 {
107 data_received++;
108 return eltsize * nmemb;
109 }
110
#ifdef USE_CURL_MULTI
/*
 * Drain the multi handle's message queue.  For every DONE message the
 * matching slot is looked up by easy handle, detached from the multi
 * handle, given the transfer result, and finished.
 */
static void process_curl_messages(void)
{
	int pending;
	CURLMsg *msg;

	for (msg = curl_multi_info_read(curlm, &pending);
	     msg != NULL;
	     msg = curl_multi_info_read(curlm, &pending)) {
		struct active_request_slot *owner;
		int transfer_result;

		if (msg->msg != CURLMSG_DONE) {
			fprintf(stderr, "Unknown CURL message received: %d\n",
				(int)msg->msg);
			continue;
		}

		/* Read the result before the handle is removed below. */
		transfer_result = msg->data.result;
		for (owner = active_queue_head; owner != NULL; owner = owner->next)
			if (owner->curl == msg->easy_handle)
				break;

		if (owner == NULL) {
			fprintf(stderr, "Received DONE message for unknown request!\n");
			continue;
		}

		curl_multi_remove_handle(curlm, owner->curl);
		owner->curl_result = transfer_result;
		finish_active_slot(owner);
	}
}
#endif
140
141 static int http_options(const char *var, const char *value, void *cb)
142 {
143 if (!strcmp("http.sslverify", var)) {
144 curl_ssl_verify = git_config_bool(var, value);
145 return 0;
146 }
147 if (!strcmp("http.sslcert", var))
148 return git_config_string(&ssl_cert, var, value);
149 #if LIBCURL_VERSION_NUM >= 0x070903
150 if (!strcmp("http.sslkey", var))
151 return git_config_string(&ssl_key, var, value);
152 #endif
153 #if LIBCURL_VERSION_NUM >= 0x070908
154 if (!strcmp("http.sslcapath", var))
155 return git_config_string(&ssl_capath, var, value);
156 #endif
157 if (!strcmp("http.sslcainfo", var))
158 return git_config_string(&ssl_cainfo, var, value);
159 if (!strcmp("http.sslcertpasswordprotected", var)) {
160 if (git_config_bool(var, value))
161 ssl_cert_password_required = 1;
162 return 0;
163 }
164 if (!strcmp("http.minsessions", var)) {
165 min_curl_sessions = git_config_int(var, value);
166 #ifndef USE_CURL_MULTI
167 if (min_curl_sessions > 1)
168 min_curl_sessions = 1;
169 #endif
170 return 0;
171 }
172 #ifdef USE_CURL_MULTI
173 if (!strcmp("http.maxrequests", var)) {
174 max_requests = git_config_int(var, value);
175 return 0;
176 }
177 #endif
178 if (!strcmp("http.lowspeedlimit", var)) {
179 curl_low_speed_limit = (long)git_config_int(var, value);
180 return 0;
181 }
182 if (!strcmp("http.lowspeedtime", var)) {
183 curl_low_speed_time = (long)git_config_int(var, value);
184 return 0;
185 }
186
187 if (!strcmp("http.noepsv", var)) {
188 curl_ftp_no_epsv = git_config_bool(var, value);
189 return 0;
190 }
191 if (!strcmp("http.proxy", var))
192 return git_config_string(&curl_http_proxy, var, value);
193
194 if (!strcmp("http.postbuffer", var)) {
195 http_post_buffer = git_config_int(var, value);
196 if (http_post_buffer < LARGE_PACKET_MAX)
197 http_post_buffer = LARGE_PACKET_MAX;
198 return 0;
199 }
200
201 if (!strcmp("http.useragent", var))
202 return git_config_string(&user_agent, var, value);
203
204 /* Fall back on the default ones */
205 return git_default_config(var, value, cb);
206 }
207
208 static void init_curl_http_auth(CURL *result)
209 {
210 if (user_name) {
211 struct strbuf up = STRBUF_INIT;
212 if (!user_pass)
213 user_pass = xstrdup(git_getpass("Password: "));
214 strbuf_addf(&up, "%s:%s", user_name, user_pass);
215 curl_easy_setopt(result, CURLOPT_USERPWD,
216 strbuf_detach(&up, NULL));
217 }
218 }
219
220 static int has_cert_password(void)
221 {
222 if (ssl_cert_password != NULL)
223 return 1;
224 if (ssl_cert == NULL || ssl_cert_password_required != 1)
225 return 0;
226 /* Only prompt the user once. */
227 ssl_cert_password_required = -1;
228 ssl_cert_password = git_getpass("Certificate Password: ");
229 if (ssl_cert_password != NULL) {
230 ssl_cert_password = xstrdup(ssl_cert_password);
231 return 1;
232 } else
233 return 0;
234 }
235
236 static CURL *get_curl_handle(void)
237 {
238 CURL *result = curl_easy_init();
239
240 if (!curl_ssl_verify) {
241 curl_easy_setopt(result, CURLOPT_SSL_VERIFYPEER, 0);
242 curl_easy_setopt(result, CURLOPT_SSL_VERIFYHOST, 0);
243 } else {
244 /* Verify authenticity of the peer's certificate */
245 curl_easy_setopt(result, CURLOPT_SSL_VERIFYPEER, 1);
246 /* The name in the cert must match whom we tried to connect */
247 curl_easy_setopt(result, CURLOPT_SSL_VERIFYHOST, 2);
248 }
249
250 #if LIBCURL_VERSION_NUM >= 0x070907
251 curl_easy_setopt(result, CURLOPT_NETRC, CURL_NETRC_OPTIONAL);
252 #endif
253 #ifdef LIBCURL_CAN_HANDLE_AUTH_ANY
254 curl_easy_setopt(result, CURLOPT_HTTPAUTH, CURLAUTH_ANY);
255 #endif
256
257 init_curl_http_auth(result);
258
259 if (ssl_cert != NULL)
260 curl_easy_setopt(result, CURLOPT_SSLCERT, ssl_cert);
261 if (has_cert_password())
262 curl_easy_setopt(result, CURLOPT_KEYPASSWD, ssl_cert_password);
263 #if LIBCURL_VERSION_NUM >= 0x070903
264 if (ssl_key != NULL)
265 curl_easy_setopt(result, CURLOPT_SSLKEY, ssl_key);
266 #endif
267 #if LIBCURL_VERSION_NUM >= 0x070908
268 if (ssl_capath != NULL)
269 curl_easy_setopt(result, CURLOPT_CAPATH, ssl_capath);
270 #endif
271 if (ssl_cainfo != NULL)
272 curl_easy_setopt(result, CURLOPT_CAINFO, ssl_cainfo);
273 curl_easy_setopt(result, CURLOPT_FAILONERROR, 1);
274
275 if (curl_low_speed_limit > 0 && curl_low_speed_time > 0) {
276 curl_easy_setopt(result, CURLOPT_LOW_SPEED_LIMIT,
277 curl_low_speed_limit);
278 curl_easy_setopt(result, CURLOPT_LOW_SPEED_TIME,
279 curl_low_speed_time);
280 }
281
282 curl_easy_setopt(result, CURLOPT_FOLLOWLOCATION, 1);
283 #if LIBCURL_VERSION_NUM >= 0x071301
284 curl_easy_setopt(result, CURLOPT_POSTREDIR, CURL_REDIR_POST_ALL);
285 #elif LIBCURL_VERSION_NUM >= 0x071101
286 curl_easy_setopt(result, CURLOPT_POST301, 1);
287 #endif
288
289 if (getenv("GIT_CURL_VERBOSE"))
290 curl_easy_setopt(result, CURLOPT_VERBOSE, 1);
291
292 curl_easy_setopt(result, CURLOPT_USERAGENT,
293 user_agent ? user_agent : GIT_HTTP_USER_AGENT);
294
295 if (curl_ftp_no_epsv)
296 curl_easy_setopt(result, CURLOPT_FTP_USE_EPSV, 0);
297
298 if (curl_http_proxy)
299 curl_easy_setopt(result, CURLOPT_PROXY, curl_http_proxy);
300
301 return result;
302 }
303
304 static void http_auth_init(const char *url)
305 {
306 char *at, *colon, *cp, *slash, *decoded;
307 int len;
308
309 cp = strstr(url, "://");
310 if (!cp)
311 return;
312
313 /*
314 * Ok, the URL looks like "proto://something". Which one?
315 * "proto://<user>:<pass>@<host>/...",
316 * "proto://<user>@<host>/...", or just
317 * "proto://<host>/..."?
318 */
319 cp += 3;
320 at = strchr(cp, '@');
321 colon = strchr(cp, ':');
322 slash = strchrnul(cp, '/');
323 if (!at || slash <= at)
324 return; /* No credentials */
325 if (!colon || at <= colon) {
326 /* Only username */
327 len = at - cp;
328 user_name = xmalloc(len + 1);
329 memcpy(user_name, cp, len);
330 user_name[len] = '\0';
331 decoded = url_decode(user_name);
332 free(user_name);
333 user_name = decoded;
334 user_pass = NULL;
335 } else {
336 len = colon - cp;
337 user_name = xmalloc(len + 1);
338 memcpy(user_name, cp, len);
339 user_name[len] = '\0';
340 decoded = url_decode(user_name);
341 free(user_name);
342 user_name = decoded;
343 len = at - (colon + 1);
344 user_pass = xmalloc(len + 1);
345 memcpy(user_pass, colon + 1, len);
346 user_pass[len] = '\0';
347 decoded = url_decode(user_pass);
348 free(user_pass);
349 user_pass = decoded;
350 }
351 }
352
/*
 * Point *var at the value of the environment variable envname when it
 * is set; otherwise leave *var as it was.
 */
static void set_from_env(const char **var, const char *envname)
{
	const char *from_env = getenv(envname);

	if (!from_env)
		return;
	*var = from_env;
}
359
360 void http_init(struct remote *remote)
361 {
362 char *low_speed_limit;
363 char *low_speed_time;
364
365 http_is_verbose = 0;
366
367 git_config(http_options, NULL);
368
369 curl_global_init(CURL_GLOBAL_ALL);
370
371 if (remote && remote->http_proxy)
372 curl_http_proxy = xstrdup(remote->http_proxy);
373
374 pragma_header = curl_slist_append(pragma_header, "Pragma: no-cache");
375 no_pragma_header = curl_slist_append(no_pragma_header, "Pragma:");
376
377 #ifdef USE_CURL_MULTI
378 {
379 char *http_max_requests = getenv("GIT_HTTP_MAX_REQUESTS");
380 if (http_max_requests != NULL)
381 max_requests = atoi(http_max_requests);
382 }
383
384 curlm = curl_multi_init();
385 if (curlm == NULL) {
386 fprintf(stderr, "Error creating curl multi handle.\n");
387 exit(1);
388 }
389 #endif
390
391 if (getenv("GIT_SSL_NO_VERIFY"))
392 curl_ssl_verify = 0;
393
394 set_from_env(&ssl_cert, "GIT_SSL_CERT");
395 #if LIBCURL_VERSION_NUM >= 0x070903
396 set_from_env(&ssl_key, "GIT_SSL_KEY");
397 #endif
398 #if LIBCURL_VERSION_NUM >= 0x070908
399 set_from_env(&ssl_capath, "GIT_SSL_CAPATH");
400 #endif
401 set_from_env(&ssl_cainfo, "GIT_SSL_CAINFO");
402
403 set_from_env(&user_agent, "GIT_HTTP_USER_AGENT");
404
405 low_speed_limit = getenv("GIT_HTTP_LOW_SPEED_LIMIT");
406 if (low_speed_limit != NULL)
407 curl_low_speed_limit = strtol(low_speed_limit, NULL, 10);
408 low_speed_time = getenv("GIT_HTTP_LOW_SPEED_TIME");
409 if (low_speed_time != NULL)
410 curl_low_speed_time = strtol(low_speed_time, NULL, 10);
411
412 if (curl_ssl_verify == -1)
413 curl_ssl_verify = 1;
414
415 curl_session_count = 0;
416 #ifdef USE_CURL_MULTI
417 if (max_requests < 1)
418 max_requests = DEFAULT_MAX_REQUESTS;
419 #endif
420
421 if (getenv("GIT_CURL_FTP_NO_EPSV"))
422 curl_ftp_no_epsv = 1;
423
424 if (remote && remote->url && remote->url[0]) {
425 http_auth_init(remote->url[0]);
426 if (!ssl_cert_password_required &&
427 getenv("GIT_SSL_CERT_PASSWORD_PROTECTED") &&
428 !prefixcmp(remote->url[0], "https://"))
429 ssl_cert_password_required = 1;
430 }
431
432 #ifndef NO_CURL_EASY_DUPHANDLE
433 curl_default = get_curl_handle();
434 #endif
435 }
436
437 void http_cleanup(void)
438 {
439 struct active_request_slot *slot = active_queue_head;
440
441 while (slot != NULL) {
442 struct active_request_slot *next = slot->next;
443 if (slot->curl != NULL) {
444 #ifdef USE_CURL_MULTI
445 curl_multi_remove_handle(curlm, slot->curl);
446 #endif
447 curl_easy_cleanup(slot->curl);
448 }
449 free(slot);
450 slot = next;
451 }
452 active_queue_head = NULL;
453
454 #ifndef NO_CURL_EASY_DUPHANDLE
455 curl_easy_cleanup(curl_default);
456 #endif
457
458 #ifdef USE_CURL_MULTI
459 curl_multi_cleanup(curlm);
460 #endif
461 curl_global_cleanup();
462
463 curl_slist_free_all(pragma_header);
464 pragma_header = NULL;
465
466 curl_slist_free_all(no_pragma_header);
467 no_pragma_header = NULL;
468
469 if (curl_http_proxy) {
470 free((void *)curl_http_proxy);
471 curl_http_proxy = NULL;
472 }
473
474 if (ssl_cert_password != NULL) {
475 memset(ssl_cert_password, 0, strlen(ssl_cert_password));
476 free(ssl_cert_password);
477 ssl_cert_password = NULL;
478 }
479 ssl_cert_password_required = 0;
480 }
481
482 struct active_request_slot *get_active_slot(void)
483 {
484 struct active_request_slot *slot = active_queue_head;
485 struct active_request_slot *newslot;
486
487 #ifdef USE_CURL_MULTI
488 int num_transfers;
489
490 /* Wait for a slot to open up if the queue is full */
491 while (active_requests >= max_requests) {
492 curl_multi_perform(curlm, &num_transfers);
493 if (num_transfers < active_requests)
494 process_curl_messages();
495 }
496 #endif
497
498 while (slot != NULL && slot->in_use)
499 slot = slot->next;
500
501 if (slot == NULL) {
502 newslot = xmalloc(sizeof(*newslot));
503 newslot->curl = NULL;
504 newslot->in_use = 0;
505 newslot->next = NULL;
506
507 slot = active_queue_head;
508 if (slot == NULL) {
509 active_queue_head = newslot;
510 } else {
511 while (slot->next != NULL)
512 slot = slot->next;
513 slot->next = newslot;
514 }
515 slot = newslot;
516 }
517
518 if (slot->curl == NULL) {
519 #ifdef NO_CURL_EASY_DUPHANDLE
520 slot->curl = get_curl_handle();
521 #else
522 slot->curl = curl_easy_duphandle(curl_default);
523 #endif
524 curl_session_count++;
525 }
526
527 active_requests++;
528 slot->in_use = 1;
529 slot->local = NULL;
530 slot->results = NULL;
531 slot->finished = NULL;
532 slot->callback_data = NULL;
533 slot->callback_func = NULL;
534 curl_easy_setopt(slot->curl, CURLOPT_HTTPHEADER, pragma_header);
535 curl_easy_setopt(slot->curl, CURLOPT_ERRORBUFFER, curl_errorstr);
536 curl_easy_setopt(slot->curl, CURLOPT_CUSTOMREQUEST, NULL);
537 curl_easy_setopt(slot->curl, CURLOPT_READFUNCTION, NULL);
538 curl_easy_setopt(slot->curl, CURLOPT_WRITEFUNCTION, NULL);
539 curl_easy_setopt(slot->curl, CURLOPT_UPLOAD, 0);
540 curl_easy_setopt(slot->curl, CURLOPT_HTTPGET, 1);
541
542 return slot;
543 }
544
/*
 * Start the transfer configured on slot.  With the multi interface the
 * handle is added to the multi handle and driven once; if adding fails
 * the slot is released again and 0 is returned.  Returns 1 otherwise.
 */
int start_active_slot(struct active_request_slot *slot)
{
#ifdef USE_CURL_MULTI
	int running;
	CURLMcode rc = curl_multi_add_handle(curlm, slot->curl);

	if (rc == CURLM_OK || rc == CURLM_CALL_MULTI_PERFORM) {
		/*
		 * We know there must be something to do, since we just added
		 * something.
		 */
		curl_multi_perform(curlm, &running);
		return 1;
	}

	active_requests--;
	slot->in_use = 0;
	return 0;
#else
	return 1;
#endif
}
566
567 #ifdef USE_CURL_MULTI
/* One registered "fill" callback together with its argument. */
struct fill_chain {
	void *data;
	int (*fill)(void *);
	struct fill_chain *next;
};

/* Registered fill callbacks, in registration order. */
static struct fill_chain *fill_cfg;

/*
 * Register fill(data) at the end of the chain that
 * fill_active_slots() walks.
 */
void add_fill_function(void *data, int (*fill)(void *))
{
	struct fill_chain *node = xmalloc(sizeof(*node));
	struct fill_chain *tail;

	node->data = data;
	node->fill = fill;
	node->next = NULL;

	if (fill_cfg == NULL) {
		fill_cfg = node;
		return;
	}
	for (tail = fill_cfg; tail->next != NULL; tail = tail->next)
		; /* walk to the last entry */
	tail->next = node;
}
587
588 void fill_active_slots(void)
589 {
590 struct active_request_slot *slot = active_queue_head;
591
592 while (active_requests < max_requests) {
593 struct fill_chain *fill;
594 for (fill = fill_cfg; fill; fill = fill->next)
595 if (fill->fill(fill->data))
596 break;
597
598 if (!fill)
599 break;
600 }
601
602 while (slot != NULL) {
603 if (!slot->in_use && slot->curl != NULL
604 && curl_session_count > min_curl_sessions) {
605 curl_easy_cleanup(slot->curl);
606 slot->curl = NULL;
607 curl_session_count--;
608 }
609 slot = slot->next;
610 }
611 }
612
613 void step_active_slots(void)
614 {
615 int num_transfers;
616 CURLMcode curlm_result;
617
618 do {
619 curlm_result = curl_multi_perform(curlm, &num_transfers);
620 } while (curlm_result == CURLM_CALL_MULTI_PERFORM);
621 if (num_transfers < active_requests) {
622 process_curl_messages();
623 fill_active_slots();
624 }
625 }
626 #endif
627
628 void run_active_slot(struct active_request_slot *slot)
629 {
630 #ifdef USE_CURL_MULTI
631 long last_pos = 0;
632 long current_pos;
633 fd_set readfds;
634 fd_set writefds;
635 fd_set excfds;
636 int max_fd;
637 struct timeval select_timeout;
638 int finished = 0;
639
640 slot->finished = &finished;
641 while (!finished) {
642 data_received = 0;
643 step_active_slots();
644
645 if (!data_received && slot->local != NULL) {
646 current_pos = ftell(slot->local);
647 if (current_pos > last_pos)
648 data_received++;
649 last_pos = current_pos;
650 }
651
652 if (slot->in_use && !data_received) {
653 max_fd = 0;
654 FD_ZERO(&readfds);
655 FD_ZERO(&writefds);
656 FD_ZERO(&excfds);
657 select_timeout.tv_sec = 0;
658 select_timeout.tv_usec = 50000;
659 select(max_fd, &readfds, &writefds,
660 &excfds, &select_timeout);
661 }
662 }
663 #else
664 while (slot->in_use) {
665 slot->curl_result = curl_easy_perform(slot->curl);
666 finish_active_slot(slot);
667 }
668 #endif
669 }
670
671 static void closedown_active_slot(struct active_request_slot *slot)
672 {
673 active_requests--;
674 slot->in_use = 0;
675 }
676
677 static void release_active_slot(struct active_request_slot *slot)
678 {
679 closedown_active_slot(slot);
680 if (slot->curl && curl_session_count > min_curl_sessions) {
681 #ifdef USE_CURL_MULTI
682 curl_multi_remove_handle(curlm, slot->curl);
683 #endif
684 curl_easy_cleanup(slot->curl);
685 slot->curl = NULL;
686 curl_session_count--;
687 }
688 #ifdef USE_CURL_MULTI
689 fill_active_slots();
690 #endif
691 }
692
693 void finish_active_slot(struct active_request_slot *slot)
694 {
695 closedown_active_slot(slot);
696 curl_easy_getinfo(slot->curl, CURLINFO_HTTP_CODE, &slot->http_code);
697
698 if (slot->finished != NULL)
699 (*slot->finished) = 1;
700
701 /* Store slot results so they can be read after the slot is reused */
702 if (slot->results != NULL) {
703 slot->results->curl_result = slot->curl_result;
704 slot->results->http_code = slot->http_code;
705 }
706
707 /* Run callback if appropriate */
708 if (slot->callback_func != NULL)
709 slot->callback_func(slot->callback_data);
710 }
711
712 void finish_all_active_slots(void)
713 {
714 struct active_request_slot *slot = active_queue_head;
715
716 while (slot != NULL)
717 if (slot->in_use) {
718 run_active_slot(slot);
719 slot = active_queue_head;
720 } else {
721 slot = slot->next;
722 }
723 }
724
725 /* Helpers for modifying and creating URLs */
/*
 * Return 0 for characters copied into a URL unchanged (ASCII letters,
 * digits, '/', '-' and '.'), and 1 for everything else.
 */
static inline int needs_quote(int ch)
{
	if (ch >= 'A' && ch <= 'Z')
		return 0;
	if (ch >= 'a' && ch <= 'z')
		return 0;
	if (ch >= '0' && ch <= '9')
		return 0;

	switch (ch) {
	case '/':
	case '-':
	case '.':
		return 0;
	default:
		return 1;
	}
}
737
/*
 * Map a value to its hexadecimal digit character: '0'..'9' for values
 * below 10, upper-case letters starting at 'A' for 10 and above.
 */
static inline int hex(int v)
{
	return v < 10 ? '0' + v : 'A' + v - 10;
}
745
746 static char *quote_ref_url(const char *base, const char *ref)
747 {
748 struct strbuf buf = STRBUF_INIT;
749 const char *cp;
750 int ch;
751
752 end_url_with_slash(&buf, base);
753
754 for (cp = ref; (ch = *cp) != 0; cp++)
755 if (needs_quote(ch))
756 strbuf_addf(&buf, "%%%02x", ch);
757 else
758 strbuf_addch(&buf, *cp);
759
760 return strbuf_detach(&buf, NULL);
761 }
762
/*
 * Append the URL of a loose object to buf: "<url>/objects/<xx>/"
 * followed, unless only_two_digit_prefix is set, by the rest of the
 * hex name.
 */
void append_remote_object_url(struct strbuf *buf, const char *url,
			      const char *hex,
			      int only_two_digit_prefix)
{
	end_url_with_slash(buf, url);
	strbuf_addf(buf, "objects/%.*s/", 2, hex);

	if (only_two_digit_prefix)
		return;
	strbuf_addf(buf, "%s", hex + 2);
}
773
774 char *get_remote_object_url(const char *url, const char *hex,
775 int only_two_digit_prefix)
776 {
777 struct strbuf buf = STRBUF_INIT;
778 append_remote_object_url(&buf, url, hex, only_two_digit_prefix);
779 return strbuf_detach(&buf, NULL);
780 }
781
782 /* http_request() targets */
783 #define HTTP_REQUEST_STRBUF 0
784 #define HTTP_REQUEST_FILE 1
785
786 static int http_request(const char *url, void *result, int target, int options)
787 {
788 struct active_request_slot *slot;
789 struct slot_results results;
790 struct curl_slist *headers = NULL;
791 struct strbuf buf = STRBUF_INIT;
792 int ret;
793
794 slot = get_active_slot();
795 slot->results = &results;
796 curl_easy_setopt(slot->curl, CURLOPT_HTTPGET, 1);
797
798 if (result == NULL) {
799 curl_easy_setopt(slot->curl, CURLOPT_NOBODY, 1);
800 } else {
801 curl_easy_setopt(slot->curl, CURLOPT_NOBODY, 0);
802 curl_easy_setopt(slot->curl, CURLOPT_FILE, result);
803
804 if (target == HTTP_REQUEST_FILE) {
805 long posn = ftell(result);
806 curl_easy_setopt(slot->curl, CURLOPT_WRITEFUNCTION,
807 fwrite);
808 if (posn > 0) {
809 strbuf_addf(&buf, "Range: bytes=%ld-", posn);
810 headers = curl_slist_append(headers, buf.buf);
811 strbuf_reset(&buf);
812 }
813 slot->local = result;
814 } else
815 curl_easy_setopt(slot->curl, CURLOPT_WRITEFUNCTION,
816 fwrite_buffer);
817 }
818
819 strbuf_addstr(&buf, "Pragma:");
820 if (options & HTTP_NO_CACHE)
821 strbuf_addstr(&buf, " no-cache");
822
823 headers = curl_slist_append(headers, buf.buf);
824
825 curl_easy_setopt(slot->curl, CURLOPT_URL, url);
826 curl_easy_setopt(slot->curl, CURLOPT_HTTPHEADER, headers);
827
828 if (start_active_slot(slot)) {
829 run_active_slot(slot);
830 if (results.curl_result == CURLE_OK)
831 ret = HTTP_OK;
832 else if (missing_target(&results))
833 ret = HTTP_MISSING_TARGET;
834 else if (results.http_code == 401) {
835 if (user_name) {
836 ret = HTTP_NOAUTH;
837 } else {
838 /*
839 * git_getpass is needed here because its very likely stdin/stdout are
840 * pipes to our parent process. So we instead need to use /dev/tty,
841 * but that is non-portable. Using git_getpass() can at least be stubbed
842 * on other platforms with a different implementation if/when necessary.
843 */
844 user_name = xstrdup(git_getpass("Username: "));
845 init_curl_http_auth(slot->curl);
846 ret = HTTP_REAUTH;
847 }
848 } else
849 ret = HTTP_ERROR;
850 } else {
851 error("Unable to start HTTP request for %s", url);
852 ret = HTTP_START_FAILED;
853 }
854
855 slot->local = NULL;
856 curl_slist_free_all(headers);
857 strbuf_release(&buf);
858
859 return ret;
860 }
861
862 int http_get_strbuf(const char *url, struct strbuf *result, int options)
863 {
864 int http_ret = http_request(url, result, HTTP_REQUEST_STRBUF, options);
865 if (http_ret == HTTP_REAUTH) {
866 http_ret = http_request(url, result, HTTP_REQUEST_STRBUF, options);
867 }
868 return http_ret;
869 }
870
871 /*
872 * Downloads an url and stores the result in the given file.
873 *
874 * If a previous interrupted download is detected (i.e. a previous temporary
875 * file is still around) the download is resumed.
876 */
877 static int http_get_file(const char *url, const char *filename, int options)
878 {
879 int ret;
880 struct strbuf tmpfile = STRBUF_INIT;
881 FILE *result;
882
883 strbuf_addf(&tmpfile, "%s.temp", filename);
884 result = fopen(tmpfile.buf, "a");
885 if (! result) {
886 error("Unable to open local file %s", tmpfile.buf);
887 ret = HTTP_ERROR;
888 goto cleanup;
889 }
890
891 ret = http_request(url, result, HTTP_REQUEST_FILE, options);
892 fclose(result);
893
894 if ((ret == HTTP_OK) && move_temp_to_file(tmpfile.buf, filename))
895 ret = HTTP_ERROR;
896 cleanup:
897 strbuf_release(&tmpfile);
898 return ret;
899 }
900
901 int http_error(const char *url, int ret)
902 {
903 /* http_request has already handled HTTP_START_FAILED. */
904 if (ret != HTTP_START_FAILED)
905 error("%s while accessing %s\n", curl_errorstr, url);
906
907 return ret;
908 }
909
910 int http_fetch_ref(const char *base, struct ref *ref)
911 {
912 char *url;
913 struct strbuf buffer = STRBUF_INIT;
914 int ret = -1;
915
916 url = quote_ref_url(base, ref->name);
917 if (http_get_strbuf(url, &buffer, HTTP_NO_CACHE) == HTTP_OK) {
918 strbuf_rtrim(&buffer);
919 if (buffer.len == 40)
920 ret = get_sha1_hex(buffer.buf, ref->old_sha1);
921 else if (!prefixcmp(buffer.buf, "ref: ")) {
922 ref->symref = xstrdup(buffer.buf + 5);
923 ret = 0;
924 }
925 }
926
927 strbuf_release(&buffer);
928 free(url);
929 return ret;
930 }
931
932 /* Helpers for fetching packs */
933 static char *fetch_pack_index(unsigned char *sha1, const char *base_url)
934 {
935 char *url, *tmp;
936 struct strbuf buf = STRBUF_INIT;
937
938 if (http_is_verbose)
939 fprintf(stderr, "Getting index for pack %s\n", sha1_to_hex(sha1));
940
941 end_url_with_slash(&buf, base_url);
942 strbuf_addf(&buf, "objects/pack/pack-%s.idx", sha1_to_hex(sha1));
943 url = strbuf_detach(&buf, NULL);
944
945 strbuf_addf(&buf, "%s.temp", sha1_pack_index_name(sha1));
946 tmp = strbuf_detach(&buf, NULL);
947
948 if (http_get_file(url, tmp, 0) != HTTP_OK) {
949 error("Unable to get pack index %s\n", url);
950 free(tmp);
951 tmp = NULL;
952 }
953
954 free(url);
955 return tmp;
956 }
957
958 static int fetch_and_setup_pack_index(struct packed_git **packs_head,
959 unsigned char *sha1, const char *base_url)
960 {
961 struct packed_git *new_pack;
962 char *tmp_idx = NULL;
963 int ret;
964
965 if (has_pack_index(sha1)) {
966 new_pack = parse_pack_index(sha1, NULL);
967 if (!new_pack)
968 return -1; /* parse_pack_index() already issued error message */
969 goto add_pack;
970 }
971
972 tmp_idx = fetch_pack_index(sha1, base_url);
973 if (!tmp_idx)
974 return -1;
975
976 new_pack = parse_pack_index(sha1, tmp_idx);
977 if (!new_pack) {
978 unlink(tmp_idx);
979 free(tmp_idx);
980
981 return -1; /* parse_pack_index() already issued error message */
982 }
983
984 ret = verify_pack_index(new_pack);
985 if (!ret) {
986 close_pack_index(new_pack);
987 ret = move_temp_to_file(tmp_idx, sha1_pack_index_name(sha1));
988 }
989 free(tmp_idx);
990 if (ret)
991 return -1;
992
993 add_pack:
994 new_pack->next = *packs_head;
995 *packs_head = new_pack;
996 return 0;
997 }
998
999 int http_get_info_packs(const char *base_url, struct packed_git **packs_head)
1000 {
1001 int ret = 0, i = 0;
1002 char *url, *data;
1003 struct strbuf buf = STRBUF_INIT;
1004 unsigned char sha1[20];
1005
1006 end_url_with_slash(&buf, base_url);
1007 strbuf_addstr(&buf, "objects/info/packs");
1008 url = strbuf_detach(&buf, NULL);
1009
1010 ret = http_get_strbuf(url, &buf, HTTP_NO_CACHE);
1011 if (ret != HTTP_OK)
1012 goto cleanup;
1013
1014 data = buf.buf;
1015 while (i < buf.len) {
1016 switch (data[i]) {
1017 case 'P':
1018 i++;
1019 if (i + 52 <= buf.len &&
1020 !prefixcmp(data + i, " pack-") &&
1021 !prefixcmp(data + i + 46, ".pack\n")) {
1022 get_sha1_hex(data + i + 6, sha1);
1023 fetch_and_setup_pack_index(packs_head, sha1,
1024 base_url);
1025 i += 51;
1026 break;
1027 }
1028 default:
1029 while (i < buf.len && data[i] != '\n')
1030 i++;
1031 }
1032 i++;
1033 }
1034
1035 cleanup:
1036 free(url);
1037 return ret;
1038 }
1039
1040 void release_http_pack_request(struct http_pack_request *preq)
1041 {
1042 if (preq->packfile != NULL) {
1043 fclose(preq->packfile);
1044 preq->packfile = NULL;
1045 preq->slot->local = NULL;
1046 }
1047 if (preq->range_header != NULL) {
1048 curl_slist_free_all(preq->range_header);
1049 preq->range_header = NULL;
1050 }
1051 preq->slot = NULL;
1052 free(preq->url);
1053 }
1054
1055 int finish_http_pack_request(struct http_pack_request *preq)
1056 {
1057 struct packed_git **lst;
1058 struct packed_git *p = preq->target;
1059 char *tmp_idx;
1060 struct child_process ip;
1061 const char *ip_argv[8];
1062
1063 close_pack_index(p);
1064
1065 fclose(preq->packfile);
1066 preq->packfile = NULL;
1067 preq->slot->local = NULL;
1068
1069 lst = preq->lst;
1070 while (*lst != p)
1071 lst = &((*lst)->next);
1072 *lst = (*lst)->next;
1073
1074 tmp_idx = xstrdup(preq->tmpfile);
1075 strcpy(tmp_idx + strlen(tmp_idx) - strlen(".pack.temp"),
1076 ".idx.temp");
1077
1078 ip_argv[0] = "index-pack";
1079 ip_argv[1] = "-o";
1080 ip_argv[2] = tmp_idx;
1081 ip_argv[3] = preq->tmpfile;
1082 ip_argv[4] = NULL;
1083
1084 memset(&ip, 0, sizeof(ip));
1085 ip.argv = ip_argv;
1086 ip.git_cmd = 1;
1087 ip.no_stdin = 1;
1088 ip.no_stdout = 1;
1089
1090 if (run_command(&ip)) {
1091 unlink(preq->tmpfile);
1092 unlink(tmp_idx);
1093 free(tmp_idx);
1094 return -1;
1095 }
1096
1097 unlink(sha1_pack_index_name(p->sha1));
1098
1099 if (move_temp_to_file(preq->tmpfile, sha1_pack_name(p->sha1))
1100 || move_temp_to_file(tmp_idx, sha1_pack_index_name(p->sha1))) {
1101 free(tmp_idx);
1102 return -1;
1103 }
1104
1105 install_packed_git(p);
1106 free(tmp_idx);
1107 return 0;
1108 }
1109
1110 struct http_pack_request *new_http_pack_request(
1111 struct packed_git *target, const char *base_url)
1112 {
1113 long prev_posn = 0;
1114 char range[RANGE_HEADER_SIZE];
1115 struct strbuf buf = STRBUF_INIT;
1116 struct http_pack_request *preq;
1117
1118 preq = xmalloc(sizeof(*preq));
1119 preq->target = target;
1120 preq->range_header = NULL;
1121
1122 end_url_with_slash(&buf, base_url);
1123 strbuf_addf(&buf, "objects/pack/pack-%s.pack",
1124 sha1_to_hex(target->sha1));
1125 preq->url = strbuf_detach(&buf, NULL);
1126
1127 snprintf(preq->tmpfile, sizeof(preq->tmpfile), "%s.temp",
1128 sha1_pack_name(target->sha1));
1129 preq->packfile = fopen(preq->tmpfile, "a");
1130 if (!preq->packfile) {
1131 error("Unable to open local file %s for pack",
1132 preq->tmpfile);
1133 goto abort;
1134 }
1135
1136 preq->slot = get_active_slot();
1137 preq->slot->local = preq->packfile;
1138 curl_easy_setopt(preq->slot->curl, CURLOPT_FILE, preq->packfile);
1139 curl_easy_setopt(preq->slot->curl, CURLOPT_WRITEFUNCTION, fwrite);
1140 curl_easy_setopt(preq->slot->curl, CURLOPT_URL, preq->url);
1141 curl_easy_setopt(preq->slot->curl, CURLOPT_HTTPHEADER,
1142 no_pragma_header);
1143
1144 /*
1145 * If there is data present from a previous transfer attempt,
1146 * resume where it left off
1147 */
1148 prev_posn = ftell(preq->packfile);
1149 if (prev_posn>0) {
1150 if (http_is_verbose)
1151 fprintf(stderr,
1152 "Resuming fetch of pack %s at byte %ld\n",
1153 sha1_to_hex(target->sha1), prev_posn);
1154 sprintf(range, "Range: bytes=%ld-", prev_posn);
1155 preq->range_header = curl_slist_append(NULL, range);
1156 curl_easy_setopt(preq->slot->curl, CURLOPT_HTTPHEADER,
1157 preq->range_header);
1158 }
1159
1160 return preq;
1161
1162 abort:
1163 free(preq->url);
1164 free(preq);
1165 return NULL;
1166 }
1167
1168 /* Helpers for fetching objects (loose) */
1169 static size_t fwrite_sha1_file(void *ptr, size_t eltsize, size_t nmemb,
1170 void *data)
1171 {
1172 unsigned char expn[4096];
1173 size_t size = eltsize * nmemb;
1174 int posn = 0;
1175 struct http_object_request *freq =
1176 (struct http_object_request *)data;
1177 do {
1178 ssize_t retval = xwrite(freq->localfile,
1179 (char *) ptr + posn, size - posn);
1180 if (retval < 0)
1181 return posn;
1182 posn += retval;
1183 } while (posn < size);
1184
1185 freq->stream.avail_in = size;
1186 freq->stream.next_in = ptr;
1187 do {
1188 freq->stream.next_out = expn;
1189 freq->stream.avail_out = sizeof(expn);
1190 freq->zret = git_inflate(&freq->stream, Z_SYNC_FLUSH);
1191 git_SHA1_Update(&freq->c, expn,
1192 sizeof(expn) - freq->stream.avail_out);
1193 } while (freq->stream.avail_in && freq->zret == Z_OK);
1194 data_received++;
1195 return size;
1196 }
1197
1198 struct http_object_request *new_http_object_request(const char *base_url,
1199 unsigned char *sha1)
1200 {
1201 char *hex = sha1_to_hex(sha1);
1202 char *filename;
1203 char prevfile[PATH_MAX];
1204 int prevlocal;
1205 unsigned char prev_buf[PREV_BUF_SIZE];
1206 ssize_t prev_read = 0;
1207 long prev_posn = 0;
1208 char range[RANGE_HEADER_SIZE];
1209 struct curl_slist *range_header = NULL;
1210 struct http_object_request *freq;
1211
1212 freq = xmalloc(sizeof(*freq));
1213 hashcpy(freq->sha1, sha1);
1214 freq->localfile = -1;
1215
1216 filename = sha1_file_name(sha1);
1217 snprintf(freq->tmpfile, sizeof(freq->tmpfile),
1218 "%s.temp", filename);
1219
1220 snprintf(prevfile, sizeof(prevfile), "%s.prev", filename);
1221 unlink_or_warn(prevfile);
1222 rename(freq->tmpfile, prevfile);
1223 unlink_or_warn(freq->tmpfile);
1224
1225 if (freq->localfile != -1)
1226 error("fd leakage in start: %d", freq->localfile);
1227 freq->localfile = open(freq->tmpfile,
1228 O_WRONLY | O_CREAT | O_EXCL, 0666);
1229 /*
1230 * This could have failed due to the "lazy directory creation";
1231 * try to mkdir the last path component.
1232 */
1233 if (freq->localfile < 0 && errno == ENOENT) {
1234 char *dir = strrchr(freq->tmpfile, '/');
1235 if (dir) {
1236 *dir = 0;
1237 mkdir(freq->tmpfile, 0777);
1238 *dir = '/';
1239 }
1240 freq->localfile = open(freq->tmpfile,
1241 O_WRONLY | O_CREAT | O_EXCL, 0666);
1242 }
1243
1244 if (freq->localfile < 0) {
1245 error("Couldn't create temporary file %s: %s",
1246 freq->tmpfile, strerror(errno));
1247 goto abort;
1248 }
1249
1250 memset(&freq->stream, 0, sizeof(freq->stream));
1251
1252 git_inflate_init(&freq->stream);
1253
1254 git_SHA1_Init(&freq->c);
1255
1256 freq->url = get_remote_object_url(base_url, hex, 0);
1257
1258 /*
1259 * If a previous temp file is present, process what was already
1260 * fetched.
1261 */
1262 prevlocal = open(prevfile, O_RDONLY);
1263 if (prevlocal != -1) {
1264 do {
1265 prev_read = xread(prevlocal, prev_buf, PREV_BUF_SIZE);
1266 if (prev_read>0) {
1267 if (fwrite_sha1_file(prev_buf,
1268 1,
1269 prev_read,
1270 freq) == prev_read) {
1271 prev_posn += prev_read;
1272 } else {
1273 prev_read = -1;
1274 }
1275 }
1276 } while (prev_read > 0);
1277 close(prevlocal);
1278 }
1279 unlink_or_warn(prevfile);
1280
1281 /*
1282 * Reset inflate/SHA1 if there was an error reading the previous temp
1283 * file; also rewind to the beginning of the local file.
1284 */
1285 if (prev_read == -1) {
1286 memset(&freq->stream, 0, sizeof(freq->stream));
1287 git_inflate_init(&freq->stream);
1288 git_SHA1_Init(&freq->c);
1289 if (prev_posn>0) {
1290 prev_posn = 0;
1291 lseek(freq->localfile, 0, SEEK_SET);
1292 if (ftruncate(freq->localfile, 0) < 0) {
1293 error("Couldn't truncate temporary file %s: %s",
1294 freq->tmpfile, strerror(errno));
1295 goto abort;
1296 }
1297 }
1298 }
1299
1300 freq->slot = get_active_slot();
1301
1302 curl_easy_setopt(freq->slot->curl, CURLOPT_FILE, freq);
1303 curl_easy_setopt(freq->slot->curl, CURLOPT_WRITEFUNCTION, fwrite_sha1_file);
1304 curl_easy_setopt(freq->slot->curl, CURLOPT_ERRORBUFFER, freq->errorstr);
1305 curl_easy_setopt(freq->slot->curl, CURLOPT_URL, freq->url);
1306 curl_easy_setopt(freq->slot->curl, CURLOPT_HTTPHEADER, no_pragma_header);
1307
1308 /*
1309 * If we have successfully processed data from a previous fetch
1310 * attempt, only fetch the data we don't already have.
1311 */
1312 if (prev_posn>0) {
1313 if (http_is_verbose)
1314 fprintf(stderr,
1315 "Resuming fetch of object %s at byte %ld\n",
1316 hex, prev_posn);
1317 sprintf(range, "Range: bytes=%ld-", prev_posn);
1318 range_header = curl_slist_append(range_header, range);
1319 curl_easy_setopt(freq->slot->curl,
1320 CURLOPT_HTTPHEADER, range_header);
1321 }
1322
1323 return freq;
1324
1325 abort:
1326 free(filename);
1327 free(freq->url);
1328 free(freq);
1329 return NULL;
1330 }
1331
1332 void process_http_object_request(struct http_object_request *freq)
1333 {
1334 if (freq->slot == NULL)
1335 return;
1336 freq->curl_result = freq->slot->curl_result;
1337 freq->http_code = freq->slot->http_code;
1338 freq->slot = NULL;
1339 }
1340
1341 int finish_http_object_request(struct http_object_request *freq)
1342 {
1343 struct stat st;
1344
1345 close(freq->localfile);
1346 freq->localfile = -1;
1347
1348 process_http_object_request(freq);
1349
1350 if (freq->http_code == 416) {
1351 warning("requested range invalid; we may already have all the data.");
1352 } else if (freq->curl_result != CURLE_OK) {
1353 if (stat(freq->tmpfile, &st) == 0)
1354 if (st.st_size == 0)
1355 unlink_or_warn(freq->tmpfile);
1356 return -1;
1357 }
1358
1359 git_inflate_end(&freq->stream);
1360 git_SHA1_Final(freq->real_sha1, &freq->c);
1361 if (freq->zret != Z_STREAM_END) {
1362 unlink_or_warn(freq->tmpfile);
1363 return -1;
1364 }
1365 if (hashcmp(freq->sha1, freq->real_sha1)) {
1366 unlink_or_warn(freq->tmpfile);
1367 return -1;
1368 }
1369 freq->rename =
1370 move_temp_to_file(freq->tmpfile, sha1_file_name(freq->sha1));
1371
1372 return freq->rename;
1373 }
1374
1375 void abort_http_object_request(struct http_object_request *freq)
1376 {
1377 unlink_or_warn(freq->tmpfile);
1378
1379 release_http_object_request(freq);
1380 }
1381
1382 void release_http_object_request(struct http_object_request *freq)
1383 {
1384 if (freq->localfile != -1) {
1385 close(freq->localfile);
1386 freq->localfile = -1;
1387 }
1388 if (freq->url != NULL) {
1389 free(freq->url);
1390 freq->url = NULL;
1391 }
1392 if (freq->slot != NULL) {
1393 freq->slot->callback_func = NULL;
1394 freq->slot->callback_data = NULL;
1395 release_active_slot(freq->slot);
1396 freq->slot = NULL;
1397 }
1398 }