]> git.proxmox.com Git - qemu.git/blame - block/curl.c
block/curl: only restrict protocols with libcurl>=7.19.4
[qemu.git] / block / curl.c
CommitLineData
769ce76d
AG
1/*
2 * QEMU Block driver for CURL images
3 *
4 * Copyright (c) 2009 Alexander Graf <agraf@suse.de>
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a copy
7 * of this software and associated documentation files (the "Software"), to deal
8 * in the Software without restriction, including without limitation the rights
9 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
10 * copies of the Software, and to permit persons to whom the Software is
11 * furnished to do so, subject to the following conditions:
12 *
13 * The above copyright notice and this permission notice shall be included in
14 * all copies or substantial portions of the Software.
15 *
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
19 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
21 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
22 * THE SOFTWARE.
23 */
24#include "qemu-common.h"
737e150e 25#include "block/block_int.h"
769ce76d
AG
26#include <curl/curl.h>
27
28// #define DEBUG
29// #define DEBUG_VERBOSE
30
31#ifdef DEBUG_CURL
d0f2c4c6 32#define DPRINTF(fmt, ...) do { printf(fmt, ## __VA_ARGS__); } while (0)
769ce76d 33#else
d0f2c4c6 34#define DPRINTF(fmt, ...) do { } while (0)
769ce76d
AG
35#endif
36
fb6d1bbd
SH
37#define PROTOCOLS (CURLPROTO_HTTP | CURLPROTO_HTTPS | \
38 CURLPROTO_FTP | CURLPROTO_FTPS | \
39 CURLPROTO_TFTP)
40
769ce76d
AG
41#define CURL_NUM_STATES 8
42#define CURL_NUM_ACB 8
43#define SECTOR_SIZE 512
44#define READ_AHEAD_SIZE (256 * 1024)
45
46#define FIND_RET_NONE 0
47#define FIND_RET_OK 1
48#define FIND_RET_WAIT 2
49
50struct BDRVCURLState;
51
52typedef struct CURLAIOCB {
53 BlockDriverAIOCB common;
363c3c85 54 QEMUBH *bh;
769ce76d 55 QEMUIOVector *qiov;
363c3c85
NT
56
57 int64_t sector_num;
58 int nb_sectors;
59
769ce76d
AG
60 size_t start;
61 size_t end;
62} CURLAIOCB;
63
64typedef struct CURLState
65{
66 struct BDRVCURLState *s;
67 CURLAIOCB *acb[CURL_NUM_ACB];
68 CURL *curl;
69 char *orig_buf;
70 size_t buf_start;
71 size_t buf_off;
72 size_t buf_len;
73 char range[128];
74 char errmsg[CURL_ERROR_SIZE];
75 char in_use;
76} CURLState;
77
78typedef struct BDRVCURLState {
79 CURLM *multi;
80 size_t len;
81 CURLState states[CURL_NUM_STATES];
82 char *url;
c76f4952 83 size_t readahead_size;
769ce76d
AG
84} BDRVCURLState;
85
86static void curl_clean_state(CURLState *s);
87static void curl_multi_do(void *arg);
c84dcdc1 88static int curl_aio_flush(void *opaque);
769ce76d
AG
89
90static int curl_sock_cb(CURL *curl, curl_socket_t fd, int action,
91 void *s, void *sp)
92{
d0f2c4c6 93 DPRINTF("CURL (AIO): Sock action %d on fd %d\n", action, fd);
769ce76d
AG
94 switch (action) {
95 case CURL_POLL_IN:
bafbd6a1 96 qemu_aio_set_fd_handler(fd, curl_multi_do, NULL, curl_aio_flush, s);
769ce76d
AG
97 break;
98 case CURL_POLL_OUT:
bafbd6a1 99 qemu_aio_set_fd_handler(fd, NULL, curl_multi_do, curl_aio_flush, s);
769ce76d
AG
100 break;
101 case CURL_POLL_INOUT:
c84dcdc1 102 qemu_aio_set_fd_handler(fd, curl_multi_do, curl_multi_do,
bafbd6a1 103 curl_aio_flush, s);
769ce76d
AG
104 break;
105 case CURL_POLL_REMOVE:
bafbd6a1 106 qemu_aio_set_fd_handler(fd, NULL, NULL, NULL, NULL);
769ce76d
AG
107 break;
108 }
109
110 return 0;
111}
112
113static size_t curl_size_cb(void *ptr, size_t size, size_t nmemb, void *opaque)
114{
115 CURLState *s = ((CURLState*)opaque);
116 size_t realsize = size * nmemb;
0bfcd599 117 size_t fsize;
769ce76d 118
0bfcd599 119 if(sscanf(ptr, "Content-Length: %zd", &fsize) == 1) {
769ce76d 120 s->s->len = fsize;
0bfcd599 121 }
769ce76d
AG
122
123 return realsize;
124}
125
126static size_t curl_read_cb(void *ptr, size_t size, size_t nmemb, void *opaque)
127{
128 CURLState *s = ((CURLState*)opaque);
129 size_t realsize = size * nmemb;
130 int i;
131
0bfcd599 132 DPRINTF("CURL: Just reading %zd bytes\n", realsize);
769ce76d
AG
133
134 if (!s || !s->orig_buf)
135 goto read_end;
136
137 memcpy(s->orig_buf + s->buf_off, ptr, realsize);
138 s->buf_off += realsize;
139
140 for(i=0; i<CURL_NUM_ACB; i++) {
141 CURLAIOCB *acb = s->acb[i];
142
143 if (!acb)
144 continue;
145
146 if ((s->buf_off >= acb->end)) {
03396148
MT
147 qemu_iovec_from_buf(acb->qiov, 0, s->orig_buf + acb->start,
148 acb->end - acb->start);
769ce76d
AG
149 acb->common.cb(acb->common.opaque, 0);
150 qemu_aio_release(acb);
151 s->acb[i] = NULL;
152 }
153 }
154
155read_end:
156 return realsize;
157}
158
159static int curl_find_buf(BDRVCURLState *s, size_t start, size_t len,
160 CURLAIOCB *acb)
161{
162 int i;
163 size_t end = start + len;
164
165 for (i=0; i<CURL_NUM_STATES; i++) {
166 CURLState *state = &s->states[i];
167 size_t buf_end = (state->buf_start + state->buf_off);
168 size_t buf_fend = (state->buf_start + state->buf_len);
169
170 if (!state->orig_buf)
171 continue;
172 if (!state->buf_off)
173 continue;
174
175 // Does the existing buffer cover our section?
176 if ((start >= state->buf_start) &&
177 (start <= buf_end) &&
178 (end >= state->buf_start) &&
179 (end <= buf_end))
180 {
181 char *buf = state->orig_buf + (start - state->buf_start);
182
03396148 183 qemu_iovec_from_buf(acb->qiov, 0, buf, len);
769ce76d
AG
184 acb->common.cb(acb->common.opaque, 0);
185
186 return FIND_RET_OK;
187 }
188
189 // Wait for unfinished chunks
190 if ((start >= state->buf_start) &&
191 (start <= buf_fend) &&
192 (end >= state->buf_start) &&
193 (end <= buf_fend))
194 {
195 int j;
196
197 acb->start = start - state->buf_start;
198 acb->end = acb->start + len;
199
200 for (j=0; j<CURL_NUM_ACB; j++) {
201 if (!state->acb[j]) {
202 state->acb[j] = acb;
203 return FIND_RET_WAIT;
204 }
205 }
206 }
207 }
208
209 return FIND_RET_NONE;
210}
211
212static void curl_multi_do(void *arg)
213{
214 BDRVCURLState *s = (BDRVCURLState *)arg;
215 int running;
216 int r;
217 int msgs_in_queue;
218
219 if (!s->multi)
220 return;
221
222 do {
223 r = curl_multi_socket_all(s->multi, &running);
224 } while(r == CURLM_CALL_MULTI_PERFORM);
225
226 /* Try to find done transfers, so we can free the easy
227 * handle again. */
228 do {
229 CURLMsg *msg;
230 msg = curl_multi_info_read(s->multi, &msgs_in_queue);
231
232 if (!msg)
233 break;
234 if (msg->msg == CURLMSG_NONE)
235 break;
236
237 switch (msg->msg) {
238 case CURLMSG_DONE:
239 {
240 CURLState *state = NULL;
241 curl_easy_getinfo(msg->easy_handle, CURLINFO_PRIVATE, (char**)&state);
f785a5ae
NT
242
243 /* ACBs for successful messages get completed in curl_read_cb */
244 if (msg->data.result != CURLE_OK) {
245 int i;
246 for (i = 0; i < CURL_NUM_ACB; i++) {
247 CURLAIOCB *acb = state->acb[i];
248
249 if (acb == NULL) {
250 continue;
251 }
252
253 acb->common.cb(acb->common.opaque, -EIO);
254 qemu_aio_release(acb);
255 state->acb[i] = NULL;
256 }
257 }
258
769ce76d
AG
259 curl_clean_state(state);
260 break;
261 }
262 default:
263 msgs_in_queue = 0;
264 break;
265 }
266 } while(msgs_in_queue);
267}
268
269static CURLState *curl_init_state(BDRVCURLState *s)
270{
271 CURLState *state = NULL;
272 int i, j;
273
274 do {
275 for (i=0; i<CURL_NUM_STATES; i++) {
276 for (j=0; j<CURL_NUM_ACB; j++)
277 if (s->states[i].acb[j])
278 continue;
279 if (s->states[i].in_use)
280 continue;
281
282 state = &s->states[i];
283 state->in_use = 1;
284 break;
285 }
286 if (!state) {
fb7c8e8a 287 g_usleep(100);
769ce76d
AG
288 curl_multi_do(s);
289 }
290 } while(!state);
291
292 if (state->curl)
293 goto has_curl;
294
295 state->curl = curl_easy_init();
296 if (!state->curl)
297 return NULL;
298 curl_easy_setopt(state->curl, CURLOPT_URL, s->url);
299 curl_easy_setopt(state->curl, CURLOPT_TIMEOUT, 5);
df3cee1a 300 curl_easy_setopt(state->curl, CURLOPT_WRITEFUNCTION, (void *)curl_read_cb);
769ce76d
AG
301 curl_easy_setopt(state->curl, CURLOPT_WRITEDATA, (void *)state);
302 curl_easy_setopt(state->curl, CURLOPT_PRIVATE, (void *)state);
303 curl_easy_setopt(state->curl, CURLOPT_AUTOREFERER, 1);
304 curl_easy_setopt(state->curl, CURLOPT_FOLLOWLOCATION, 1);
305 curl_easy_setopt(state->curl, CURLOPT_NOSIGNAL, 1);
306 curl_easy_setopt(state->curl, CURLOPT_ERRORBUFFER, state->errmsg);
f785a5ae
NT
307 curl_easy_setopt(state->curl, CURLOPT_FAILONERROR, 1);
308
fb6d1bbd
SH
309 /* Restrict supported protocols to avoid security issues in the more
310 * obscure protocols. For example, do not allow POP3/SMTP/IMAP see
311 * CVE-2013-0249.
8a8f5840
SH
312 *
313 * Restricting protocols is only supported from 7.19.4 upwards.
fb6d1bbd 314 */
8a8f5840 315#if LIBCURL_VERSION_NUM >= 0x071304
fb6d1bbd
SH
316 curl_easy_setopt(state->curl, CURLOPT_PROTOCOLS, PROTOCOLS);
317 curl_easy_setopt(state->curl, CURLOPT_REDIR_PROTOCOLS, PROTOCOLS);
8a8f5840 318#endif
fb6d1bbd 319
769ce76d
AG
320#ifdef DEBUG_VERBOSE
321 curl_easy_setopt(state->curl, CURLOPT_VERBOSE, 1);
322#endif
323
324has_curl:
325
326 state->s = s;
327
328 return state;
329}
330
331static void curl_clean_state(CURLState *s)
332{
333 if (s->s->multi)
334 curl_multi_remove_handle(s->s->multi, s->curl);
335 s->in_use = 0;
336}
337
338static int curl_open(BlockDriverState *bs, const char *filename, int flags)
339{
340 BDRVCURLState *s = bs->opaque;
341 CURLState *state = NULL;
342 double d;
c76f4952
N
343
344 #define RA_OPTSTR ":readahead="
345 char *file;
346 char *ra;
347 const char *ra_val;
348 int parse_state = 0;
349
769ce76d
AG
350 static int inited = 0;
351
7267c094 352 file = g_strdup(filename);
c76f4952
N
353 s->readahead_size = READ_AHEAD_SIZE;
354
355 /* Parse a trailing ":readahead=#:" param, if present. */
356 ra = file + strlen(file) - 1;
357 while (ra >= file) {
358 if (parse_state == 0) {
359 if (*ra == ':')
360 parse_state++;
361 else
362 break;
363 } else if (parse_state == 1) {
364 if (*ra > '9' || *ra < '0') {
365 char *opt_start = ra - strlen(RA_OPTSTR) + 1;
366 if (opt_start > file &&
367 strncmp(opt_start, RA_OPTSTR, strlen(RA_OPTSTR)) == 0) {
368 ra_val = ra + 1;
369 ra -= strlen(RA_OPTSTR) - 1;
370 *ra = '\0';
371 s->readahead_size = atoi(ra_val);
372 break;
373 } else {
374 break;
375 }
376 }
377 }
378 ra--;
379 }
380
381 if ((s->readahead_size & 0x1ff) != 0) {
48a402e6 382 fprintf(stderr, "HTTP_READAHEAD_SIZE %zd is not a multiple of 512\n",
c76f4952
N
383 s->readahead_size);
384 goto out_noclean;
385 }
386
769ce76d
AG
387 if (!inited) {
388 curl_global_init(CURL_GLOBAL_ALL);
389 inited = 1;
390 }
391
d0f2c4c6 392 DPRINTF("CURL: Opening %s\n", file);
c76f4952 393 s->url = file;
769ce76d
AG
394 state = curl_init_state(s);
395 if (!state)
396 goto out_noclean;
397
398 // Get file size
399
400 curl_easy_setopt(state->curl, CURLOPT_NOBODY, 1);
df3cee1a 401 curl_easy_setopt(state->curl, CURLOPT_WRITEFUNCTION, (void *)curl_size_cb);
769ce76d
AG
402 if (curl_easy_perform(state->curl))
403 goto out;
404 curl_easy_getinfo(state->curl, CURLINFO_CONTENT_LENGTH_DOWNLOAD, &d);
df3cee1a 405 curl_easy_setopt(state->curl, CURLOPT_WRITEFUNCTION, (void *)curl_read_cb);
769ce76d
AG
406 curl_easy_setopt(state->curl, CURLOPT_NOBODY, 0);
407 if (d)
408 s->len = (size_t)d;
409 else if(!s->len)
410 goto out;
0bfcd599 411 DPRINTF("CURL: Size = %zd\n", s->len);
769ce76d
AG
412
413 curl_clean_state(state);
414 curl_easy_cleanup(state->curl);
415 state->curl = NULL;
416
417 // Now we know the file exists and its size, so let's
418 // initialize the multi interface!
419
420 s->multi = curl_multi_init();
421 curl_multi_setopt( s->multi, CURLMOPT_SOCKETDATA, s);
422 curl_multi_setopt( s->multi, CURLMOPT_SOCKETFUNCTION, curl_sock_cb );
423 curl_multi_do(s);
424
425 return 0;
426
427out:
428 fprintf(stderr, "CURL: Error opening file: %s\n", state->errmsg);
429 curl_easy_cleanup(state->curl);
430 state->curl = NULL;
431out_noclean:
7267c094 432 g_free(file);
769ce76d
AG
433 return -EINVAL;
434}
435
c84dcdc1
NT
436static int curl_aio_flush(void *opaque)
437{
438 BDRVCURLState *s = opaque;
439 int i, j;
440
441 for (i=0; i < CURL_NUM_STATES; i++) {
442 for(j=0; j < CURL_NUM_ACB; j++) {
443 if (s->states[i].acb[j]) {
444 return 1;
445 }
446 }
447 }
448 return 0;
449}
450
c16b5a2c
CH
451static void curl_aio_cancel(BlockDriverAIOCB *blockacb)
452{
453 // Do we have to implement canceling? Seems to work without...
454}
455
d7331bed 456static const AIOCBInfo curl_aiocb_info = {
c16b5a2c
CH
457 .aiocb_size = sizeof(CURLAIOCB),
458 .cancel = curl_aio_cancel,
459};
460
363c3c85
NT
461
462static void curl_readv_bh_cb(void *p)
769ce76d 463{
769ce76d
AG
464 CURLState *state;
465
363c3c85
NT
466 CURLAIOCB *acb = p;
467 BDRVCURLState *s = acb->common.bs->opaque;
769ce76d 468
363c3c85
NT
469 qemu_bh_delete(acb->bh);
470 acb->bh = NULL;
471
472 size_t start = acb->sector_num * SECTOR_SIZE;
473 size_t end;
769ce76d
AG
474
475 // In case we have the requested data already (e.g. read-ahead),
476 // we can just call the callback and be done.
363c3c85 477 switch (curl_find_buf(s, start, acb->nb_sectors * SECTOR_SIZE, acb)) {
769ce76d
AG
478 case FIND_RET_OK:
479 qemu_aio_release(acb);
480 // fall through
481 case FIND_RET_WAIT:
363c3c85 482 return;
769ce76d
AG
483 default:
484 break;
485 }
486
487 // No cache found, so let's start a new request
769ce76d 488 state = curl_init_state(s);
363c3c85
NT
489 if (!state) {
490 acb->common.cb(acb->common.opaque, -EIO);
491 qemu_aio_release(acb);
492 return;
493 }
769ce76d
AG
494
495 acb->start = 0;
363c3c85 496 acb->end = (acb->nb_sectors * SECTOR_SIZE);
769ce76d
AG
497
498 state->buf_off = 0;
499 if (state->orig_buf)
7267c094 500 g_free(state->orig_buf);
769ce76d 501 state->buf_start = start;
c76f4952 502 state->buf_len = acb->end + s->readahead_size;
769ce76d 503 end = MIN(start + state->buf_len, s->len) - 1;
7267c094 504 state->orig_buf = g_malloc(state->buf_len);
769ce76d
AG
505 state->acb[0] = acb;
506
0bfcd599
BS
507 snprintf(state->range, 127, "%zd-%zd", start, end);
508 DPRINTF("CURL (AIO): Reading %d at %zd (%s)\n",
363c3c85 509 (acb->nb_sectors * SECTOR_SIZE), start, state->range);
769ce76d
AG
510 curl_easy_setopt(state->curl, CURLOPT_RANGE, state->range);
511
512 curl_multi_add_handle(s->multi, state->curl);
513 curl_multi_do(s);
514
363c3c85
NT
515}
516
517static BlockDriverAIOCB *curl_aio_readv(BlockDriverState *bs,
518 int64_t sector_num, QEMUIOVector *qiov, int nb_sectors,
519 BlockDriverCompletionFunc *cb, void *opaque)
520{
521 CURLAIOCB *acb;
522
d7331bed 523 acb = qemu_aio_get(&curl_aiocb_info, bs, cb, opaque);
363c3c85 524
363c3c85
NT
525 acb->qiov = qiov;
526 acb->sector_num = sector_num;
527 acb->nb_sectors = nb_sectors;
528
529 acb->bh = qemu_bh_new(curl_readv_bh_cb, acb);
530
531 if (!acb->bh) {
532 DPRINTF("CURL: qemu_bh_new failed\n");
533 return NULL;
534 }
535
536 qemu_bh_schedule(acb->bh);
769ce76d
AG
537 return &acb->common;
538}
539
769ce76d
AG
540static void curl_close(BlockDriverState *bs)
541{
542 BDRVCURLState *s = bs->opaque;
543 int i;
544
d0f2c4c6 545 DPRINTF("CURL: Close\n");
769ce76d
AG
546 for (i=0; i<CURL_NUM_STATES; i++) {
547 if (s->states[i].in_use)
548 curl_clean_state(&s->states[i]);
549 if (s->states[i].curl) {
550 curl_easy_cleanup(s->states[i].curl);
551 s->states[i].curl = NULL;
552 }
553 if (s->states[i].orig_buf) {
7267c094 554 g_free(s->states[i].orig_buf);
769ce76d
AG
555 s->states[i].orig_buf = NULL;
556 }
557 }
558 if (s->multi)
559 curl_multi_cleanup(s->multi);
45724d6d 560 g_free(s->url);
769ce76d
AG
561}
562
563static int64_t curl_getlength(BlockDriverState *bs)
564{
565 BDRVCURLState *s = bs->opaque;
566 return s->len;
567}
568
569static BlockDriver bdrv_http = {
570 .format_name = "http",
571 .protocol_name = "http",
572
573 .instance_size = sizeof(BDRVCURLState),
66f82cee 574 .bdrv_file_open = curl_open,
769ce76d
AG
575 .bdrv_close = curl_close,
576 .bdrv_getlength = curl_getlength,
577
769ce76d 578 .bdrv_aio_readv = curl_aio_readv,
769ce76d
AG
579};
580
581static BlockDriver bdrv_https = {
582 .format_name = "https",
583 .protocol_name = "https",
584
585 .instance_size = sizeof(BDRVCURLState),
66f82cee 586 .bdrv_file_open = curl_open,
769ce76d
AG
587 .bdrv_close = curl_close,
588 .bdrv_getlength = curl_getlength,
589
769ce76d 590 .bdrv_aio_readv = curl_aio_readv,
769ce76d
AG
591};
592
593static BlockDriver bdrv_ftp = {
594 .format_name = "ftp",
595 .protocol_name = "ftp",
596
597 .instance_size = sizeof(BDRVCURLState),
66f82cee 598 .bdrv_file_open = curl_open,
769ce76d
AG
599 .bdrv_close = curl_close,
600 .bdrv_getlength = curl_getlength,
601
769ce76d 602 .bdrv_aio_readv = curl_aio_readv,
769ce76d
AG
603};
604
605static BlockDriver bdrv_ftps = {
606 .format_name = "ftps",
607 .protocol_name = "ftps",
608
609 .instance_size = sizeof(BDRVCURLState),
66f82cee 610 .bdrv_file_open = curl_open,
769ce76d
AG
611 .bdrv_close = curl_close,
612 .bdrv_getlength = curl_getlength,
613
769ce76d 614 .bdrv_aio_readv = curl_aio_readv,
769ce76d
AG
615};
616
617static BlockDriver bdrv_tftp = {
618 .format_name = "tftp",
619 .protocol_name = "tftp",
620
621 .instance_size = sizeof(BDRVCURLState),
66f82cee 622 .bdrv_file_open = curl_open,
769ce76d
AG
623 .bdrv_close = curl_close,
624 .bdrv_getlength = curl_getlength,
625
769ce76d 626 .bdrv_aio_readv = curl_aio_readv,
769ce76d
AG
627};
628
629static void curl_block_init(void)
630{
631 bdrv_register(&bdrv_http);
632 bdrv_register(&bdrv_https);
633 bdrv_register(&bdrv_ftp);
634 bdrv_register(&bdrv_ftps);
635 bdrv_register(&bdrv_tftp);
636}
637
638block_init(curl_block_init);