Merge branch 'gc/http-with-non-ascii-username-url' into maint
[git/git.git] / http.c
1 #include "http.h"
2 #include "pack.h"
3 #include "sideband.h"
4 #include "run-command.h"
5 #include "url.h"
6
7 int data_received;
8 int active_requests;
9 int http_is_verbose;
10 size_t http_post_buffer = 16 * LARGE_PACKET_MAX;
11
12 #if LIBCURL_VERSION_NUM >= 0x070a06
13 #define LIBCURL_CAN_HANDLE_AUTH_ANY
14 #endif
15
16 static int min_curl_sessions = 1;
17 static int curl_session_count;
18 #ifdef USE_CURL_MULTI
19 static int max_requests = -1;
20 static CURLM *curlm;
21 #endif
22 #ifndef NO_CURL_EASY_DUPHANDLE
23 static CURL *curl_default;
24 #endif
25
26 #define PREV_BUF_SIZE 4096
27 #define RANGE_HEADER_SIZE 30
28
29 char curl_errorstr[CURL_ERROR_SIZE];
30
31 static int curl_ssl_verify = -1;
32 static const char *ssl_cert;
33 #if LIBCURL_VERSION_NUM >= 0x070903
34 static const char *ssl_key;
35 #endif
36 #if LIBCURL_VERSION_NUM >= 0x070908
37 static const char *ssl_capath;
38 #endif
39 static const char *ssl_cainfo;
40 static long curl_low_speed_limit = -1;
41 static long curl_low_speed_time = -1;
42 static int curl_ftp_no_epsv;
43 static const char *curl_http_proxy;
44 static char *user_name, *user_pass;
45 static const char *user_agent;
46
47 #if LIBCURL_VERSION_NUM >= 0x071700
48 /* Use CURLOPT_KEYPASSWD as is */
49 #elif LIBCURL_VERSION_NUM >= 0x070903
50 #define CURLOPT_KEYPASSWD CURLOPT_SSLKEYPASSWD
51 #else
52 #define CURLOPT_KEYPASSWD CURLOPT_SSLCERTPASSWD
53 #endif
54
55 static char *ssl_cert_password;
56 static int ssl_cert_password_required;
57
58 static struct curl_slist *pragma_header;
59 static struct curl_slist *no_pragma_header;
60
61 static struct active_request_slot *active_queue_head;
62
63 size_t fread_buffer(void *ptr, size_t eltsize, size_t nmemb, void *buffer_)
64 {
65 size_t size = eltsize * nmemb;
66 struct buffer *buffer = buffer_;
67
68 if (size > buffer->buf.len - buffer->posn)
69 size = buffer->buf.len - buffer->posn;
70 memcpy(ptr, buffer->buf.buf + buffer->posn, size);
71 buffer->posn += size;
72
73 return size;
74 }
75
76 #ifndef NO_CURL_IOCTL
77 curlioerr ioctl_buffer(CURL *handle, int cmd, void *clientp)
78 {
79 struct buffer *buffer = clientp;
80
81 switch (cmd) {
82 case CURLIOCMD_NOP:
83 return CURLIOE_OK;
84
85 case CURLIOCMD_RESTARTREAD:
86 buffer->posn = 0;
87 return CURLIOE_OK;
88
89 default:
90 return CURLIOE_UNKNOWNCMD;
91 }
92 }
93 #endif
94
95 size_t fwrite_buffer(const void *ptr, size_t eltsize, size_t nmemb, void *buffer_)
96 {
97 size_t size = eltsize * nmemb;
98 struct strbuf *buffer = buffer_;
99
100 strbuf_add(buffer, ptr, size);
101 data_received++;
102 return size;
103 }
104
105 size_t fwrite_null(const void *ptr, size_t eltsize, size_t nmemb, void *strbuf)
106 {
107 data_received++;
108 return eltsize * nmemb;
109 }
110
111 #ifdef USE_CURL_MULTI
112 static void process_curl_messages(void)
113 {
114 int num_messages;
115 struct active_request_slot *slot;
116 CURLMsg *curl_message = curl_multi_info_read(curlm, &num_messages);
117
118 while (curl_message != NULL) {
119 if (curl_message->msg == CURLMSG_DONE) {
120 int curl_result = curl_message->data.result;
121 slot = active_queue_head;
122 while (slot != NULL &&
123 slot->curl != curl_message->easy_handle)
124 slot = slot->next;
125 if (slot != NULL) {
126 curl_multi_remove_handle(curlm, slot->curl);
127 slot->curl_result = curl_result;
128 finish_active_slot(slot);
129 } else {
130 fprintf(stderr, "Received DONE message for unknown request!\n");
131 }
132 } else {
133 fprintf(stderr, "Unknown CURL message received: %d\n",
134 (int)curl_message->msg);
135 }
136 curl_message = curl_multi_info_read(curlm, &num_messages);
137 }
138 }
139 #endif
140
141 static int http_options(const char *var, const char *value, void *cb)
142 {
143 if (!strcmp("http.sslverify", var)) {
144 curl_ssl_verify = git_config_bool(var, value);
145 return 0;
146 }
147 if (!strcmp("http.sslcert", var))
148 return git_config_string(&ssl_cert, var, value);
149 #if LIBCURL_VERSION_NUM >= 0x070903
150 if (!strcmp("http.sslkey", var))
151 return git_config_string(&ssl_key, var, value);
152 #endif
153 #if LIBCURL_VERSION_NUM >= 0x070908
154 if (!strcmp("http.sslcapath", var))
155 return git_config_string(&ssl_capath, var, value);
156 #endif
157 if (!strcmp("http.sslcainfo", var))
158 return git_config_string(&ssl_cainfo, var, value);
159 if (!strcmp("http.sslcertpasswordprotected", var)) {
160 if (git_config_bool(var, value))
161 ssl_cert_password_required = 1;
162 return 0;
163 }
164 if (!strcmp("http.minsessions", var)) {
165 min_curl_sessions = git_config_int(var, value);
166 #ifndef USE_CURL_MULTI
167 if (min_curl_sessions > 1)
168 min_curl_sessions = 1;
169 #endif
170 return 0;
171 }
172 #ifdef USE_CURL_MULTI
173 if (!strcmp("http.maxrequests", var)) {
174 max_requests = git_config_int(var, value);
175 return 0;
176 }
177 #endif
178 if (!strcmp("http.lowspeedlimit", var)) {
179 curl_low_speed_limit = (long)git_config_int(var, value);
180 return 0;
181 }
182 if (!strcmp("http.lowspeedtime", var)) {
183 curl_low_speed_time = (long)git_config_int(var, value);
184 return 0;
185 }
186
187 if (!strcmp("http.noepsv", var)) {
188 curl_ftp_no_epsv = git_config_bool(var, value);
189 return 0;
190 }
191 if (!strcmp("http.proxy", var))
192 return git_config_string(&curl_http_proxy, var, value);
193
194 if (!strcmp("http.postbuffer", var)) {
195 http_post_buffer = git_config_int(var, value);
196 if (http_post_buffer < LARGE_PACKET_MAX)
197 http_post_buffer = LARGE_PACKET_MAX;
198 return 0;
199 }
200
201 if (!strcmp("http.useragent", var))
202 return git_config_string(&user_agent, var, value);
203
204 /* Fall back on the default ones */
205 return git_default_config(var, value, cb);
206 }
207
208 static void init_curl_http_auth(CURL *result)
209 {
210 if (user_name) {
211 struct strbuf up = STRBUF_INIT;
212 if (!user_pass)
213 user_pass = xstrdup(git_getpass("Password: "));
214 strbuf_addf(&up, "%s:%s", user_name, user_pass);
215 curl_easy_setopt(result, CURLOPT_USERPWD,
216 strbuf_detach(&up, NULL));
217 }
218 }
219
220 static int has_cert_password(void)
221 {
222 if (ssl_cert_password != NULL)
223 return 1;
224 if (ssl_cert == NULL || ssl_cert_password_required != 1)
225 return 0;
226 /* Only prompt the user once. */
227 ssl_cert_password_required = -1;
228 ssl_cert_password = git_getpass("Certificate Password: ");
229 if (ssl_cert_password != NULL) {
230 ssl_cert_password = xstrdup(ssl_cert_password);
231 return 1;
232 } else
233 return 0;
234 }
235
236 static CURL *get_curl_handle(void)
237 {
238 CURL *result = curl_easy_init();
239
240 if (!curl_ssl_verify) {
241 curl_easy_setopt(result, CURLOPT_SSL_VERIFYPEER, 0);
242 curl_easy_setopt(result, CURLOPT_SSL_VERIFYHOST, 0);
243 } else {
244 /* Verify authenticity of the peer's certificate */
245 curl_easy_setopt(result, CURLOPT_SSL_VERIFYPEER, 1);
246 /* The name in the cert must match whom we tried to connect */
247 curl_easy_setopt(result, CURLOPT_SSL_VERIFYHOST, 2);
248 }
249
250 #if LIBCURL_VERSION_NUM >= 0x070907
251 curl_easy_setopt(result, CURLOPT_NETRC, CURL_NETRC_OPTIONAL);
252 #endif
253 #ifdef LIBCURL_CAN_HANDLE_AUTH_ANY
254 curl_easy_setopt(result, CURLOPT_HTTPAUTH, CURLAUTH_ANY);
255 #endif
256
257 init_curl_http_auth(result);
258
259 if (ssl_cert != NULL)
260 curl_easy_setopt(result, CURLOPT_SSLCERT, ssl_cert);
261 if (has_cert_password())
262 curl_easy_setopt(result, CURLOPT_KEYPASSWD, ssl_cert_password);
263 #if LIBCURL_VERSION_NUM >= 0x070903
264 if (ssl_key != NULL)
265 curl_easy_setopt(result, CURLOPT_SSLKEY, ssl_key);
266 #endif
267 #if LIBCURL_VERSION_NUM >= 0x070908
268 if (ssl_capath != NULL)
269 curl_easy_setopt(result, CURLOPT_CAPATH, ssl_capath);
270 #endif
271 if (ssl_cainfo != NULL)
272 curl_easy_setopt(result, CURLOPT_CAINFO, ssl_cainfo);
273 curl_easy_setopt(result, CURLOPT_FAILONERROR, 1);
274
275 if (curl_low_speed_limit > 0 && curl_low_speed_time > 0) {
276 curl_easy_setopt(result, CURLOPT_LOW_SPEED_LIMIT,
277 curl_low_speed_limit);
278 curl_easy_setopt(result, CURLOPT_LOW_SPEED_TIME,
279 curl_low_speed_time);
280 }
281
282 curl_easy_setopt(result, CURLOPT_FOLLOWLOCATION, 1);
283 #if LIBCURL_VERSION_NUM >= 0x071301
284 curl_easy_setopt(result, CURLOPT_POSTREDIR, CURL_REDIR_POST_ALL);
285 #elif LIBCURL_VERSION_NUM >= 0x071101
286 curl_easy_setopt(result, CURLOPT_POST301, 1);
287 #endif
288
289 if (getenv("GIT_CURL_VERBOSE"))
290 curl_easy_setopt(result, CURLOPT_VERBOSE, 1);
291
292 curl_easy_setopt(result, CURLOPT_USERAGENT,
293 user_agent ? user_agent : GIT_HTTP_USER_AGENT);
294
295 if (curl_ftp_no_epsv)
296 curl_easy_setopt(result, CURLOPT_FTP_USE_EPSV, 0);
297
298 if (curl_http_proxy)
299 curl_easy_setopt(result, CURLOPT_PROXY, curl_http_proxy);
300
301 return result;
302 }
303
304 static void http_auth_init(const char *url)
305 {
306 char *at, *colon, *cp, *slash, *decoded;
307 int len;
308
309 cp = strstr(url, "://");
310 if (!cp)
311 return;
312
313 /*
314 * Ok, the URL looks like "proto://something". Which one?
315 * "proto://<user>:<pass>@<host>/...",
316 * "proto://<user>@<host>/...", or just
317 * "proto://<host>/..."?
318 */
319 cp += 3;
320 at = strchr(cp, '@');
321 colon = strchr(cp, ':');
322 slash = strchrnul(cp, '/');
323 if (!at || slash <= at)
324 return; /* No credentials */
325 if (!colon || at <= colon) {
326 /* Only username */
327 len = at - cp;
328 user_name = xmalloc(len + 1);
329 memcpy(user_name, cp, len);
330 user_name[len] = '\0';
331 decoded = url_decode(user_name);
332 free(user_name);
333 user_name = decoded;
334 user_pass = NULL;
335 } else {
336 len = colon - cp;
337 user_name = xmalloc(len + 1);
338 memcpy(user_name, cp, len);
339 user_name[len] = '\0';
340 decoded = url_decode(user_name);
341 free(user_name);
342 user_name = decoded;
343 len = at - (colon + 1);
344 user_pass = xmalloc(len + 1);
345 memcpy(user_pass, colon + 1, len);
346 user_pass[len] = '\0';
347 decoded = url_decode(user_pass);
348 free(user_pass);
349 user_pass = decoded;
350 }
351 }
352
/*
 * Point *var at the value of the environment variable envname, if that
 * variable is set; otherwise leave *var unchanged.
 */
static void set_from_env(const char **var, const char *envname)
{
	const char *from_env = getenv(envname);

	if (from_env == NULL)
		return;
	*var = from_env;
}
359
360 void http_init(struct remote *remote)
361 {
362 char *low_speed_limit;
363 char *low_speed_time;
364
365 http_is_verbose = 0;
366
367 git_config(http_options, NULL);
368
369 curl_global_init(CURL_GLOBAL_ALL);
370
371 if (remote && remote->http_proxy)
372 curl_http_proxy = xstrdup(remote->http_proxy);
373
374 pragma_header = curl_slist_append(pragma_header, "Pragma: no-cache");
375 no_pragma_header = curl_slist_append(no_pragma_header, "Pragma:");
376
377 #ifdef USE_CURL_MULTI
378 {
379 char *http_max_requests = getenv("GIT_HTTP_MAX_REQUESTS");
380 if (http_max_requests != NULL)
381 max_requests = atoi(http_max_requests);
382 }
383
384 curlm = curl_multi_init();
385 if (curlm == NULL) {
386 fprintf(stderr, "Error creating curl multi handle.\n");
387 exit(1);
388 }
389 #endif
390
391 if (getenv("GIT_SSL_NO_VERIFY"))
392 curl_ssl_verify = 0;
393
394 set_from_env(&ssl_cert, "GIT_SSL_CERT");
395 #if LIBCURL_VERSION_NUM >= 0x070903
396 set_from_env(&ssl_key, "GIT_SSL_KEY");
397 #endif
398 #if LIBCURL_VERSION_NUM >= 0x070908
399 set_from_env(&ssl_capath, "GIT_SSL_CAPATH");
400 #endif
401 set_from_env(&ssl_cainfo, "GIT_SSL_CAINFO");
402
403 set_from_env(&user_agent, "GIT_HTTP_USER_AGENT");
404
405 low_speed_limit = getenv("GIT_HTTP_LOW_SPEED_LIMIT");
406 if (low_speed_limit != NULL)
407 curl_low_speed_limit = strtol(low_speed_limit, NULL, 10);
408 low_speed_time = getenv("GIT_HTTP_LOW_SPEED_TIME");
409 if (low_speed_time != NULL)
410 curl_low_speed_time = strtol(low_speed_time, NULL, 10);
411
412 if (curl_ssl_verify == -1)
413 curl_ssl_verify = 1;
414
415 curl_session_count = 0;
416 #ifdef USE_CURL_MULTI
417 if (max_requests < 1)
418 max_requests = DEFAULT_MAX_REQUESTS;
419 #endif
420
421 if (getenv("GIT_CURL_FTP_NO_EPSV"))
422 curl_ftp_no_epsv = 1;
423
424 if (remote && remote->url && remote->url[0]) {
425 http_auth_init(remote->url[0]);
426 if (!ssl_cert_password_required &&
427 getenv("GIT_SSL_CERT_PASSWORD_PROTECTED") &&
428 !prefixcmp(remote->url[0], "https://"))
429 ssl_cert_password_required = 1;
430 }
431
432 #ifndef NO_CURL_EASY_DUPHANDLE
433 curl_default = get_curl_handle();
434 #endif
435 }
436
437 void http_cleanup(void)
438 {
439 struct active_request_slot *slot = active_queue_head;
440
441 while (slot != NULL) {
442 struct active_request_slot *next = slot->next;
443 if (slot->curl != NULL) {
444 #ifdef USE_CURL_MULTI
445 curl_multi_remove_handle(curlm, slot->curl);
446 #endif
447 curl_easy_cleanup(slot->curl);
448 }
449 free(slot);
450 slot = next;
451 }
452 active_queue_head = NULL;
453
454 #ifndef NO_CURL_EASY_DUPHANDLE
455 curl_easy_cleanup(curl_default);
456 #endif
457
458 #ifdef USE_CURL_MULTI
459 curl_multi_cleanup(curlm);
460 #endif
461 curl_global_cleanup();
462
463 curl_slist_free_all(pragma_header);
464 pragma_header = NULL;
465
466 curl_slist_free_all(no_pragma_header);
467 no_pragma_header = NULL;
468
469 if (curl_http_proxy) {
470 free((void *)curl_http_proxy);
471 curl_http_proxy = NULL;
472 }
473
474 if (ssl_cert_password != NULL) {
475 memset(ssl_cert_password, 0, strlen(ssl_cert_password));
476 free(ssl_cert_password);
477 ssl_cert_password = NULL;
478 }
479 ssl_cert_password_required = 0;
480 }
481
482 struct active_request_slot *get_active_slot(void)
483 {
484 struct active_request_slot *slot = active_queue_head;
485 struct active_request_slot *newslot;
486
487 #ifdef USE_CURL_MULTI
488 int num_transfers;
489
490 /* Wait for a slot to open up if the queue is full */
491 while (active_requests >= max_requests) {
492 curl_multi_perform(curlm, &num_transfers);
493 if (num_transfers < active_requests)
494 process_curl_messages();
495 }
496 #endif
497
498 while (slot != NULL && slot->in_use)
499 slot = slot->next;
500
501 if (slot == NULL) {
502 newslot = xmalloc(sizeof(*newslot));
503 newslot->curl = NULL;
504 newslot->in_use = 0;
505 newslot->next = NULL;
506
507 slot = active_queue_head;
508 if (slot == NULL) {
509 active_queue_head = newslot;
510 } else {
511 while (slot->next != NULL)
512 slot = slot->next;
513 slot->next = newslot;
514 }
515 slot = newslot;
516 }
517
518 if (slot->curl == NULL) {
519 #ifdef NO_CURL_EASY_DUPHANDLE
520 slot->curl = get_curl_handle();
521 #else
522 slot->curl = curl_easy_duphandle(curl_default);
523 #endif
524 curl_session_count++;
525 }
526
527 active_requests++;
528 slot->in_use = 1;
529 slot->local = NULL;
530 slot->results = NULL;
531 slot->finished = NULL;
532 slot->callback_data = NULL;
533 slot->callback_func = NULL;
534 curl_easy_setopt(slot->curl, CURLOPT_HTTPHEADER, pragma_header);
535 curl_easy_setopt(slot->curl, CURLOPT_ERRORBUFFER, curl_errorstr);
536 curl_easy_setopt(slot->curl, CURLOPT_CUSTOMREQUEST, NULL);
537 curl_easy_setopt(slot->curl, CURLOPT_READFUNCTION, NULL);
538 curl_easy_setopt(slot->curl, CURLOPT_WRITEFUNCTION, NULL);
539 curl_easy_setopt(slot->curl, CURLOPT_UPLOAD, 0);
540 curl_easy_setopt(slot->curl, CURLOPT_HTTPGET, 1);
541
542 return slot;
543 }
544
/*
 * Hand a prepared slot to the multi handle and kick off processing.
 * Returns 1 on success.  If the handle cannot be added, the slot is
 * marked idle again and 0 is returned.  Without curl-multi there is
 * nothing to start and the function always returns 1.
 */
int start_active_slot(struct active_request_slot *slot)
{
#ifdef USE_CURL_MULTI
	int running;
	CURLMcode added = curl_multi_add_handle(curlm, slot->curl);

	if (added == CURLM_OK || added == CURLM_CALL_MULTI_PERFORM) {
		/*
		 * We know there must be something to do, since we just
		 * added something.
		 */
		curl_multi_perform(curlm, &running);
		return 1;
	}

	active_requests--;
	slot->in_use = 0;
	return 0;
#else
	return 1;
#endif
}
566
567 #ifdef USE_CURL_MULTI
/* One registered "fill" callback together with its opaque argument. */
struct fill_chain {
	void *data;
	int (*fill)(void *);
	struct fill_chain *next;
};

/* Registered fill callbacks, in registration order. */
static struct fill_chain *fill_cfg;

/*
 * Register a callback that fill_active_slots() may call to queue more
 * requests.  New entries go to the end of the chain.
 */
void add_fill_function(void *data, int (*fill)(void *))
{
	struct fill_chain *entry = xmalloc(sizeof(*entry));
	struct fill_chain *last;

	entry->data = data;
	entry->fill = fill;
	entry->next = NULL;

	if (fill_cfg == NULL) {
		fill_cfg = entry;
		return;
	}

	for (last = fill_cfg; last->next != NULL; last = last->next)
		; /* walk to the tail */
	last->next = entry;
}
587
588 void fill_active_slots(void)
589 {
590 struct active_request_slot *slot = active_queue_head;
591
592 while (active_requests < max_requests) {
593 struct fill_chain *fill;
594 for (fill = fill_cfg; fill; fill = fill->next)
595 if (fill->fill(fill->data))
596 break;
597
598 if (!fill)
599 break;
600 }
601
602 while (slot != NULL) {
603 if (!slot->in_use && slot->curl != NULL
604 && curl_session_count > min_curl_sessions) {
605 curl_easy_cleanup(slot->curl);
606 slot->curl = NULL;
607 curl_session_count--;
608 }
609 slot = slot->next;
610 }
611 }
612
613 void step_active_slots(void)
614 {
615 int num_transfers;
616 CURLMcode curlm_result;
617
618 do {
619 curlm_result = curl_multi_perform(curlm, &num_transfers);
620 } while (curlm_result == CURLM_CALL_MULTI_PERFORM);
621 if (num_transfers < active_requests) {
622 process_curl_messages();
623 fill_active_slots();
624 }
625 }
626 #endif
627
628 void run_active_slot(struct active_request_slot *slot)
629 {
630 #ifdef USE_CURL_MULTI
631 long last_pos = 0;
632 long current_pos;
633 fd_set readfds;
634 fd_set writefds;
635 fd_set excfds;
636 int max_fd;
637 struct timeval select_timeout;
638 int finished = 0;
639
640 slot->finished = &finished;
641 while (!finished) {
642 data_received = 0;
643 step_active_slots();
644
645 if (!data_received && slot->local != NULL) {
646 current_pos = ftell(slot->local);
647 if (current_pos > last_pos)
648 data_received++;
649 last_pos = current_pos;
650 }
651
652 if (slot->in_use && !data_received) {
653 max_fd = 0;
654 FD_ZERO(&readfds);
655 FD_ZERO(&writefds);
656 FD_ZERO(&excfds);
657 select_timeout.tv_sec = 0;
658 select_timeout.tv_usec = 50000;
659 select(max_fd, &readfds, &writefds,
660 &excfds, &select_timeout);
661 }
662 }
663 #else
664 while (slot->in_use) {
665 slot->curl_result = curl_easy_perform(slot->curl);
666 finish_active_slot(slot);
667 }
668 #endif
669 }
670
671 static void closedown_active_slot(struct active_request_slot *slot)
672 {
673 active_requests--;
674 slot->in_use = 0;
675 }
676
677 static void release_active_slot(struct active_request_slot *slot)
678 {
679 closedown_active_slot(slot);
680 if (slot->curl && curl_session_count > min_curl_sessions) {
681 #ifdef USE_CURL_MULTI
682 curl_multi_remove_handle(curlm, slot->curl);
683 #endif
684 curl_easy_cleanup(slot->curl);
685 slot->curl = NULL;
686 curl_session_count--;
687 }
688 #ifdef USE_CURL_MULTI
689 fill_active_slots();
690 #endif
691 }
692
693 void finish_active_slot(struct active_request_slot *slot)
694 {
695 closedown_active_slot(slot);
696 curl_easy_getinfo(slot->curl, CURLINFO_HTTP_CODE, &slot->http_code);
697
698 if (slot->finished != NULL)
699 (*slot->finished) = 1;
700
701 /* Store slot results so they can be read after the slot is reused */
702 if (slot->results != NULL) {
703 slot->results->curl_result = slot->curl_result;
704 slot->results->http_code = slot->http_code;
705 }
706
707 /* Run callback if appropriate */
708 if (slot->callback_func != NULL)
709 slot->callback_func(slot->callback_data);
710 }
711
712 void finish_all_active_slots(void)
713 {
714 struct active_request_slot *slot = active_queue_head;
715
716 while (slot != NULL)
717 if (slot->in_use) {
718 run_active_slot(slot);
719 slot = active_queue_head;
720 } else {
721 slot = slot->next;
722 }
723 }
724
725 /* Helpers for modifying and creating URLs */
/*
 * Return 0 for characters that may appear verbatim in a ref URL
 * (ASCII letters, digits, '/', '-' and '.') and 1 for everything else.
 */
static inline int needs_quote(int ch)
{
	if (ch >= 'A' && ch <= 'Z')
		return 0;
	if (ch >= 'a' && ch <= 'z')
		return 0;
	if (ch >= '0' && ch <= '9')
		return 0;

	switch (ch) {
	case '/':
	case '-':
	case '.':
		return 0;
	default:
		return 1;
	}
}
737
/*
 * Map a value to its hexadecimal digit character: '0'..'9' for values
 * below 10, 'A' upwards for 10 and above.
 */
static inline int hex(int v)
{
	return v < 10 ? '0' + v : 'A' + v - 10;
}
745
746 void end_url_with_slash(struct strbuf *buf, const char *url)
747 {
748 strbuf_addstr(buf, url);
749 if (buf->len && buf->buf[buf->len - 1] != '/')
750 strbuf_addstr(buf, "/");
751 }
752
753 static char *quote_ref_url(const char *base, const char *ref)
754 {
755 struct strbuf buf = STRBUF_INIT;
756 const char *cp;
757 int ch;
758
759 end_url_with_slash(&buf, base);
760
761 for (cp = ref; (ch = *cp) != 0; cp++)
762 if (needs_quote(ch))
763 strbuf_addf(&buf, "%%%02x", ch);
764 else
765 strbuf_addch(&buf, *cp);
766
767 return strbuf_detach(&buf, NULL);
768 }
769
/*
 * Append the URL of a loose object to buf: "<url>/objects/<xx>/" built
 * from the first two characters of hex, followed by the rest of hex
 * unless only_two_digit_prefix is set.
 */
void append_remote_object_url(struct strbuf *buf, const char *url,
			      const char *hex,
			      int only_two_digit_prefix)
{
	end_url_with_slash(buf, url);
	strbuf_addf(buf, "objects/%.*s/", 2, hex);

	if (only_two_digit_prefix)
		return;
	strbuf_addf(buf, "%s", hex + 2);
}
780
781 char *get_remote_object_url(const char *url, const char *hex,
782 int only_two_digit_prefix)
783 {
784 struct strbuf buf = STRBUF_INIT;
785 append_remote_object_url(&buf, url, hex, only_two_digit_prefix);
786 return strbuf_detach(&buf, NULL);
787 }
788
789 /* http_request() targets */
790 #define HTTP_REQUEST_STRBUF 0
791 #define HTTP_REQUEST_FILE 1
792
793 static int http_request(const char *url, void *result, int target, int options)
794 {
795 struct active_request_slot *slot;
796 struct slot_results results;
797 struct curl_slist *headers = NULL;
798 struct strbuf buf = STRBUF_INIT;
799 int ret;
800
801 slot = get_active_slot();
802 slot->results = &results;
803 curl_easy_setopt(slot->curl, CURLOPT_HTTPGET, 1);
804
805 if (result == NULL) {
806 curl_easy_setopt(slot->curl, CURLOPT_NOBODY, 1);
807 } else {
808 curl_easy_setopt(slot->curl, CURLOPT_NOBODY, 0);
809 curl_easy_setopt(slot->curl, CURLOPT_FILE, result);
810
811 if (target == HTTP_REQUEST_FILE) {
812 long posn = ftell(result);
813 curl_easy_setopt(slot->curl, CURLOPT_WRITEFUNCTION,
814 fwrite);
815 if (posn > 0) {
816 strbuf_addf(&buf, "Range: bytes=%ld-", posn);
817 headers = curl_slist_append(headers, buf.buf);
818 strbuf_reset(&buf);
819 }
820 slot->local = result;
821 } else
822 curl_easy_setopt(slot->curl, CURLOPT_WRITEFUNCTION,
823 fwrite_buffer);
824 }
825
826 strbuf_addstr(&buf, "Pragma:");
827 if (options & HTTP_NO_CACHE)
828 strbuf_addstr(&buf, " no-cache");
829
830 headers = curl_slist_append(headers, buf.buf);
831
832 curl_easy_setopt(slot->curl, CURLOPT_URL, url);
833 curl_easy_setopt(slot->curl, CURLOPT_HTTPHEADER, headers);
834
835 if (start_active_slot(slot)) {
836 run_active_slot(slot);
837 if (results.curl_result == CURLE_OK)
838 ret = HTTP_OK;
839 else if (missing_target(&results))
840 ret = HTTP_MISSING_TARGET;
841 else if (results.http_code == 401) {
842 if (user_name) {
843 ret = HTTP_NOAUTH;
844 } else {
845 /*
846 * git_getpass is needed here because its very likely stdin/stdout are
847 * pipes to our parent process. So we instead need to use /dev/tty,
848 * but that is non-portable. Using git_getpass() can at least be stubbed
849 * on other platforms with a different implementation if/when necessary.
850 */
851 user_name = xstrdup(git_getpass("Username: "));
852 init_curl_http_auth(slot->curl);
853 ret = HTTP_REAUTH;
854 }
855 } else
856 ret = HTTP_ERROR;
857 } else {
858 error("Unable to start HTTP request for %s", url);
859 ret = HTTP_START_FAILED;
860 }
861
862 slot->local = NULL;
863 curl_slist_free_all(headers);
864 strbuf_release(&buf);
865
866 return ret;
867 }
868
869 int http_get_strbuf(const char *url, struct strbuf *result, int options)
870 {
871 int http_ret = http_request(url, result, HTTP_REQUEST_STRBUF, options);
872 if (http_ret == HTTP_REAUTH) {
873 http_ret = http_request(url, result, HTTP_REQUEST_STRBUF, options);
874 }
875 return http_ret;
876 }
877
878 /*
879 * Downloads an url and stores the result in the given file.
880 *
881 * If a previous interrupted download is detected (i.e. a previous temporary
882 * file is still around) the download is resumed.
883 */
884 static int http_get_file(const char *url, const char *filename, int options)
885 {
886 int ret;
887 struct strbuf tmpfile = STRBUF_INIT;
888 FILE *result;
889
890 strbuf_addf(&tmpfile, "%s.temp", filename);
891 result = fopen(tmpfile.buf, "a");
892 if (! result) {
893 error("Unable to open local file %s", tmpfile.buf);
894 ret = HTTP_ERROR;
895 goto cleanup;
896 }
897
898 ret = http_request(url, result, HTTP_REQUEST_FILE, options);
899 fclose(result);
900
901 if ((ret == HTTP_OK) && move_temp_to_file(tmpfile.buf, filename))
902 ret = HTTP_ERROR;
903 cleanup:
904 strbuf_release(&tmpfile);
905 return ret;
906 }
907
908 int http_error(const char *url, int ret)
909 {
910 /* http_request has already handled HTTP_START_FAILED. */
911 if (ret != HTTP_START_FAILED)
912 error("%s while accessing %s\n", curl_errorstr, url);
913
914 return ret;
915 }
916
917 int http_fetch_ref(const char *base, struct ref *ref)
918 {
919 char *url;
920 struct strbuf buffer = STRBUF_INIT;
921 int ret = -1;
922
923 url = quote_ref_url(base, ref->name);
924 if (http_get_strbuf(url, &buffer, HTTP_NO_CACHE) == HTTP_OK) {
925 strbuf_rtrim(&buffer);
926 if (buffer.len == 40)
927 ret = get_sha1_hex(buffer.buf, ref->old_sha1);
928 else if (!prefixcmp(buffer.buf, "ref: ")) {
929 ref->symref = xstrdup(buffer.buf + 5);
930 ret = 0;
931 }
932 }
933
934 strbuf_release(&buffer);
935 free(url);
936 return ret;
937 }
938
939 /* Helpers for fetching packs */
940 static char *fetch_pack_index(unsigned char *sha1, const char *base_url)
941 {
942 char *url, *tmp;
943 struct strbuf buf = STRBUF_INIT;
944
945 if (http_is_verbose)
946 fprintf(stderr, "Getting index for pack %s\n", sha1_to_hex(sha1));
947
948 end_url_with_slash(&buf, base_url);
949 strbuf_addf(&buf, "objects/pack/pack-%s.idx", sha1_to_hex(sha1));
950 url = strbuf_detach(&buf, NULL);
951
952 strbuf_addf(&buf, "%s.temp", sha1_pack_index_name(sha1));
953 tmp = strbuf_detach(&buf, NULL);
954
955 if (http_get_file(url, tmp, 0) != HTTP_OK) {
956 error("Unable to get pack index %s\n", url);
957 free(tmp);
958 tmp = NULL;
959 }
960
961 free(url);
962 return tmp;
963 }
964
965 static int fetch_and_setup_pack_index(struct packed_git **packs_head,
966 unsigned char *sha1, const char *base_url)
967 {
968 struct packed_git *new_pack;
969 char *tmp_idx = NULL;
970 int ret;
971
972 if (has_pack_index(sha1)) {
973 new_pack = parse_pack_index(sha1, NULL);
974 if (!new_pack)
975 return -1; /* parse_pack_index() already issued error message */
976 goto add_pack;
977 }
978
979 tmp_idx = fetch_pack_index(sha1, base_url);
980 if (!tmp_idx)
981 return -1;
982
983 new_pack = parse_pack_index(sha1, tmp_idx);
984 if (!new_pack) {
985 unlink(tmp_idx);
986 free(tmp_idx);
987
988 return -1; /* parse_pack_index() already issued error message */
989 }
990
991 ret = verify_pack_index(new_pack);
992 if (!ret) {
993 close_pack_index(new_pack);
994 ret = move_temp_to_file(tmp_idx, sha1_pack_index_name(sha1));
995 }
996 free(tmp_idx);
997 if (ret)
998 return -1;
999
1000 add_pack:
1001 new_pack->next = *packs_head;
1002 *packs_head = new_pack;
1003 return 0;
1004 }
1005
1006 int http_get_info_packs(const char *base_url, struct packed_git **packs_head)
1007 {
1008 int ret = 0, i = 0;
1009 char *url, *data;
1010 struct strbuf buf = STRBUF_INIT;
1011 unsigned char sha1[20];
1012
1013 end_url_with_slash(&buf, base_url);
1014 strbuf_addstr(&buf, "objects/info/packs");
1015 url = strbuf_detach(&buf, NULL);
1016
1017 ret = http_get_strbuf(url, &buf, HTTP_NO_CACHE);
1018 if (ret != HTTP_OK)
1019 goto cleanup;
1020
1021 data = buf.buf;
1022 while (i < buf.len) {
1023 switch (data[i]) {
1024 case 'P':
1025 i++;
1026 if (i + 52 <= buf.len &&
1027 !prefixcmp(data + i, " pack-") &&
1028 !prefixcmp(data + i + 46, ".pack\n")) {
1029 get_sha1_hex(data + i + 6, sha1);
1030 fetch_and_setup_pack_index(packs_head, sha1,
1031 base_url);
1032 i += 51;
1033 break;
1034 }
1035 default:
1036 while (i < buf.len && data[i] != '\n')
1037 i++;
1038 }
1039 i++;
1040 }
1041
1042 cleanup:
1043 free(url);
1044 return ret;
1045 }
1046
1047 void release_http_pack_request(struct http_pack_request *preq)
1048 {
1049 if (preq->packfile != NULL) {
1050 fclose(preq->packfile);
1051 preq->packfile = NULL;
1052 preq->slot->local = NULL;
1053 }
1054 if (preq->range_header != NULL) {
1055 curl_slist_free_all(preq->range_header);
1056 preq->range_header = NULL;
1057 }
1058 preq->slot = NULL;
1059 free(preq->url);
1060 }
1061
1062 int finish_http_pack_request(struct http_pack_request *preq)
1063 {
1064 struct packed_git **lst;
1065 struct packed_git *p = preq->target;
1066 char *tmp_idx;
1067 struct child_process ip;
1068 const char *ip_argv[8];
1069
1070 close_pack_index(p);
1071
1072 fclose(preq->packfile);
1073 preq->packfile = NULL;
1074 preq->slot->local = NULL;
1075
1076 lst = preq->lst;
1077 while (*lst != p)
1078 lst = &((*lst)->next);
1079 *lst = (*lst)->next;
1080
1081 tmp_idx = xstrdup(preq->tmpfile);
1082 strcpy(tmp_idx + strlen(tmp_idx) - strlen(".pack.temp"),
1083 ".idx.temp");
1084
1085 ip_argv[0] = "index-pack";
1086 ip_argv[1] = "-o";
1087 ip_argv[2] = tmp_idx;
1088 ip_argv[3] = preq->tmpfile;
1089 ip_argv[4] = NULL;
1090
1091 memset(&ip, 0, sizeof(ip));
1092 ip.argv = ip_argv;
1093 ip.git_cmd = 1;
1094 ip.no_stdin = 1;
1095 ip.no_stdout = 1;
1096
1097 if (run_command(&ip)) {
1098 unlink(preq->tmpfile);
1099 unlink(tmp_idx);
1100 free(tmp_idx);
1101 return -1;
1102 }
1103
1104 unlink(sha1_pack_index_name(p->sha1));
1105
1106 if (move_temp_to_file(preq->tmpfile, sha1_pack_name(p->sha1))
1107 || move_temp_to_file(tmp_idx, sha1_pack_index_name(p->sha1))) {
1108 free(tmp_idx);
1109 return -1;
1110 }
1111
1112 install_packed_git(p);
1113 free(tmp_idx);
1114 return 0;
1115 }
1116
1117 struct http_pack_request *new_http_pack_request(
1118 struct packed_git *target, const char *base_url)
1119 {
1120 long prev_posn = 0;
1121 char range[RANGE_HEADER_SIZE];
1122 struct strbuf buf = STRBUF_INIT;
1123 struct http_pack_request *preq;
1124
1125 preq = xmalloc(sizeof(*preq));
1126 preq->target = target;
1127 preq->range_header = NULL;
1128
1129 end_url_with_slash(&buf, base_url);
1130 strbuf_addf(&buf, "objects/pack/pack-%s.pack",
1131 sha1_to_hex(target->sha1));
1132 preq->url = strbuf_detach(&buf, NULL);
1133
1134 snprintf(preq->tmpfile, sizeof(preq->tmpfile), "%s.temp",
1135 sha1_pack_name(target->sha1));
1136 preq->packfile = fopen(preq->tmpfile, "a");
1137 if (!preq->packfile) {
1138 error("Unable to open local file %s for pack",
1139 preq->tmpfile);
1140 goto abort;
1141 }
1142
1143 preq->slot = get_active_slot();
1144 preq->slot->local = preq->packfile;
1145 curl_easy_setopt(preq->slot->curl, CURLOPT_FILE, preq->packfile);
1146 curl_easy_setopt(preq->slot->curl, CURLOPT_WRITEFUNCTION, fwrite);
1147 curl_easy_setopt(preq->slot->curl, CURLOPT_URL, preq->url);
1148 curl_easy_setopt(preq->slot->curl, CURLOPT_HTTPHEADER,
1149 no_pragma_header);
1150
1151 /*
1152 * If there is data present from a previous transfer attempt,
1153 * resume where it left off
1154 */
1155 prev_posn = ftell(preq->packfile);
1156 if (prev_posn>0) {
1157 if (http_is_verbose)
1158 fprintf(stderr,
1159 "Resuming fetch of pack %s at byte %ld\n",
1160 sha1_to_hex(target->sha1), prev_posn);
1161 sprintf(range, "Range: bytes=%ld-", prev_posn);
1162 preq->range_header = curl_slist_append(NULL, range);
1163 curl_easy_setopt(preq->slot->curl, CURLOPT_HTTPHEADER,
1164 preq->range_header);
1165 }
1166
1167 return preq;
1168
1169 abort:
1170 free(preq->url);
1171 free(preq);
1172 return NULL;
1173 }
1174
1175 /* Helpers for fetching objects (loose) */
1176 static size_t fwrite_sha1_file(void *ptr, size_t eltsize, size_t nmemb,
1177 void *data)
1178 {
1179 unsigned char expn[4096];
1180 size_t size = eltsize * nmemb;
1181 int posn = 0;
1182 struct http_object_request *freq =
1183 (struct http_object_request *)data;
1184 do {
1185 ssize_t retval = xwrite(freq->localfile,
1186 (char *) ptr + posn, size - posn);
1187 if (retval < 0)
1188 return posn;
1189 posn += retval;
1190 } while (posn < size);
1191
1192 freq->stream.avail_in = size;
1193 freq->stream.next_in = ptr;
1194 do {
1195 freq->stream.next_out = expn;
1196 freq->stream.avail_out = sizeof(expn);
1197 freq->zret = git_inflate(&freq->stream, Z_SYNC_FLUSH);
1198 git_SHA1_Update(&freq->c, expn,
1199 sizeof(expn) - freq->stream.avail_out);
1200 } while (freq->stream.avail_in && freq->zret == Z_OK);
1201 data_received++;
1202 return size;
1203 }
1204
1205 struct http_object_request *new_http_object_request(const char *base_url,
1206 unsigned char *sha1)
1207 {
1208 char *hex = sha1_to_hex(sha1);
1209 char *filename;
1210 char prevfile[PATH_MAX];
1211 int prevlocal;
1212 unsigned char prev_buf[PREV_BUF_SIZE];
1213 ssize_t prev_read = 0;
1214 long prev_posn = 0;
1215 char range[RANGE_HEADER_SIZE];
1216 struct curl_slist *range_header = NULL;
1217 struct http_object_request *freq;
1218
1219 freq = xmalloc(sizeof(*freq));
1220 hashcpy(freq->sha1, sha1);
1221 freq->localfile = -1;
1222
1223 filename = sha1_file_name(sha1);
1224 snprintf(freq->tmpfile, sizeof(freq->tmpfile),
1225 "%s.temp", filename);
1226
1227 snprintf(prevfile, sizeof(prevfile), "%s.prev", filename);
1228 unlink_or_warn(prevfile);
1229 rename(freq->tmpfile, prevfile);
1230 unlink_or_warn(freq->tmpfile);
1231
1232 if (freq->localfile != -1)
1233 error("fd leakage in start: %d", freq->localfile);
1234 freq->localfile = open(freq->tmpfile,
1235 O_WRONLY | O_CREAT | O_EXCL, 0666);
1236 /*
1237 * This could have failed due to the "lazy directory creation";
1238 * try to mkdir the last path component.
1239 */
1240 if (freq->localfile < 0 && errno == ENOENT) {
1241 char *dir = strrchr(freq->tmpfile, '/');
1242 if (dir) {
1243 *dir = 0;
1244 mkdir(freq->tmpfile, 0777);
1245 *dir = '/';
1246 }
1247 freq->localfile = open(freq->tmpfile,
1248 O_WRONLY | O_CREAT | O_EXCL, 0666);
1249 }
1250
1251 if (freq->localfile < 0) {
1252 error("Couldn't create temporary file %s: %s",
1253 freq->tmpfile, strerror(errno));
1254 goto abort;
1255 }
1256
1257 memset(&freq->stream, 0, sizeof(freq->stream));
1258
1259 git_inflate_init(&freq->stream);
1260
1261 git_SHA1_Init(&freq->c);
1262
1263 freq->url = get_remote_object_url(base_url, hex, 0);
1264
1265 /*
1266 * If a previous temp file is present, process what was already
1267 * fetched.
1268 */
1269 prevlocal = open(prevfile, O_RDONLY);
1270 if (prevlocal != -1) {
1271 do {
1272 prev_read = xread(prevlocal, prev_buf, PREV_BUF_SIZE);
1273 if (prev_read>0) {
1274 if (fwrite_sha1_file(prev_buf,
1275 1,
1276 prev_read,
1277 freq) == prev_read) {
1278 prev_posn += prev_read;
1279 } else {
1280 prev_read = -1;
1281 }
1282 }
1283 } while (prev_read > 0);
1284 close(prevlocal);
1285 }
1286 unlink_or_warn(prevfile);
1287
1288 /*
1289 * Reset inflate/SHA1 if there was an error reading the previous temp
1290 * file; also rewind to the beginning of the local file.
1291 */
1292 if (prev_read == -1) {
1293 memset(&freq->stream, 0, sizeof(freq->stream));
1294 git_inflate_init(&freq->stream);
1295 git_SHA1_Init(&freq->c);
1296 if (prev_posn>0) {
1297 prev_posn = 0;
1298 lseek(freq->localfile, 0, SEEK_SET);
1299 if (ftruncate(freq->localfile, 0) < 0) {
1300 error("Couldn't truncate temporary file %s: %s",
1301 freq->tmpfile, strerror(errno));
1302 goto abort;
1303 }
1304 }
1305 }
1306
1307 freq->slot = get_active_slot();
1308
1309 curl_easy_setopt(freq->slot->curl, CURLOPT_FILE, freq);
1310 curl_easy_setopt(freq->slot->curl, CURLOPT_WRITEFUNCTION, fwrite_sha1_file);
1311 curl_easy_setopt(freq->slot->curl, CURLOPT_ERRORBUFFER, freq->errorstr);
1312 curl_easy_setopt(freq->slot->curl, CURLOPT_URL, freq->url);
1313 curl_easy_setopt(freq->slot->curl, CURLOPT_HTTPHEADER, no_pragma_header);
1314
1315 /*
1316 * If we have successfully processed data from a previous fetch
1317 * attempt, only fetch the data we don't already have.
1318 */
1319 if (prev_posn>0) {
1320 if (http_is_verbose)
1321 fprintf(stderr,
1322 "Resuming fetch of object %s at byte %ld\n",
1323 hex, prev_posn);
1324 sprintf(range, "Range: bytes=%ld-", prev_posn);
1325 range_header = curl_slist_append(range_header, range);
1326 curl_easy_setopt(freq->slot->curl,
1327 CURLOPT_HTTPHEADER, range_header);
1328 }
1329
1330 return freq;
1331
1332 abort:
1333 free(filename);
1334 free(freq->url);
1335 free(freq);
1336 return NULL;
1337 }
1338
1339 void process_http_object_request(struct http_object_request *freq)
1340 {
1341 if (freq->slot == NULL)
1342 return;
1343 freq->curl_result = freq->slot->curl_result;
1344 freq->http_code = freq->slot->http_code;
1345 freq->slot = NULL;
1346 }
1347
1348 int finish_http_object_request(struct http_object_request *freq)
1349 {
1350 struct stat st;
1351
1352 close(freq->localfile);
1353 freq->localfile = -1;
1354
1355 process_http_object_request(freq);
1356
1357 if (freq->http_code == 416) {
1358 warning("requested range invalid; we may already have all the data.");
1359 } else if (freq->curl_result != CURLE_OK) {
1360 if (stat(freq->tmpfile, &st) == 0)
1361 if (st.st_size == 0)
1362 unlink_or_warn(freq->tmpfile);
1363 return -1;
1364 }
1365
1366 git_inflate_end(&freq->stream);
1367 git_SHA1_Final(freq->real_sha1, &freq->c);
1368 if (freq->zret != Z_STREAM_END) {
1369 unlink_or_warn(freq->tmpfile);
1370 return -1;
1371 }
1372 if (hashcmp(freq->sha1, freq->real_sha1)) {
1373 unlink_or_warn(freq->tmpfile);
1374 return -1;
1375 }
1376 freq->rename =
1377 move_temp_to_file(freq->tmpfile, sha1_file_name(freq->sha1));
1378
1379 return freq->rename;
1380 }
1381
1382 void abort_http_object_request(struct http_object_request *freq)
1383 {
1384 unlink_or_warn(freq->tmpfile);
1385
1386 release_http_object_request(freq);
1387 }
1388
1389 void release_http_object_request(struct http_object_request *freq)
1390 {
1391 if (freq->localfile != -1) {
1392 close(freq->localfile);
1393 freq->localfile = -1;
1394 }
1395 if (freq->url != NULL) {
1396 free(freq->url);
1397 freq->url = NULL;
1398 }
1399 if (freq->slot != NULL) {
1400 freq->slot->callback_func = NULL;
1401 freq->slot->callback_data = NULL;
1402 release_active_slot(freq->slot);
1403 freq->slot = NULL;
1404 }
1405 }