]> git.proxmox.com Git - mirror_qemu.git/blame - block/nfs.c
block/gluster: add support for SEEK_DATA/SEEK_HOLE
[mirror_qemu.git] / block / nfs.c
CommitLineData
6542aa9c
PL
1/*
2 * QEMU Block driver for native access to files on NFS shares
3 *
4 * Copyright (c) 2014 Peter Lieven <pl@kamp.de>
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a copy
7 * of this software and associated documentation files (the "Software"), to deal
8 * in the Software without restriction, including without limitation the rights
9 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
10 * copies of the Software, and to permit persons to whom the Software is
11 * furnished to do so, subject to the following conditions:
12 *
13 * The above copyright notice and this permission notice shall be included in
14 * all copies or substantial portions of the Software.
15 *
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
19 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
21 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
22 * THE SOFTWARE.
23 */
24
80c71a24 25#include "qemu/osdep.h"
6542aa9c
PL
26
27#include <poll.h>
28#include "qemu-common.h"
29#include "qemu/config-file.h"
30#include "qemu/error-report.h"
d165b8cb 31#include "qapi/error.h"
6542aa9c
PL
32#include "block/block_int.h"
33#include "trace.h"
34#include "qemu/iov.h"
35#include "qemu/uri.h"
0d94b746 36#include "qemu/cutils.h"
6542aa9c
PL
37#include "sysemu/sysemu.h"
38#include <nfsc/libnfs.h>
39
29c838cd 40#define QEMU_NFS_MAX_READAHEAD_SIZE 1048576
7725b8bf 41#define QEMU_NFS_MAX_DEBUG_LEVEL 2
29c838cd 42
6542aa9c
PL
43typedef struct NFSClient {
44 struct nfs_context *context;
45 struct nfsfh *fh;
46 int events;
47 bool has_zero_init;
471799d1 48 AioContext *aio_context;
18a8056e 49 blkcnt_t st_blocks;
6542aa9c
PL
50} NFSClient;
51
52typedef struct NFSRPC {
53 int ret;
54 int complete;
55 QEMUIOVector *iov;
56 struct stat *st;
57 Coroutine *co;
58 QEMUBH *bh;
471799d1 59 NFSClient *client;
6542aa9c
PL
60} NFSRPC;
61
62static void nfs_process_read(void *arg);
63static void nfs_process_write(void *arg);
64
65static void nfs_set_events(NFSClient *client)
66{
67 int ev = nfs_which_events(client->context);
68 if (ev != client->events) {
dca21ef2
FZ
69 aio_set_fd_handler(client->aio_context, nfs_get_fd(client->context),
70 false,
471799d1 71 (ev & POLLIN) ? nfs_process_read : NULL,
dca21ef2 72 (ev & POLLOUT) ? nfs_process_write : NULL, client);
6542aa9c
PL
73
74 }
75 client->events = ev;
76}
77
78static void nfs_process_read(void *arg)
79{
80 NFSClient *client = arg;
81 nfs_service(client->context, POLLIN);
82 nfs_set_events(client);
83}
84
85static void nfs_process_write(void *arg)
86{
87 NFSClient *client = arg;
88 nfs_service(client->context, POLLOUT);
89 nfs_set_events(client);
90}
91
92static void nfs_co_init_task(NFSClient *client, NFSRPC *task)
93{
94 *task = (NFSRPC) {
471799d1
SH
95 .co = qemu_coroutine_self(),
96 .client = client,
6542aa9c
PL
97 };
98}
99
100static void nfs_co_generic_bh_cb(void *opaque)
101{
102 NFSRPC *task = opaque;
a2c0fe2f 103 task->complete = 1;
6542aa9c
PL
104 qemu_bh_delete(task->bh);
105 qemu_coroutine_enter(task->co, NULL);
106}
107
108static void
109nfs_co_generic_cb(int ret, struct nfs_context *nfs, void *data,
110 void *private_data)
111{
112 NFSRPC *task = private_data;
6542aa9c
PL
113 task->ret = ret;
114 if (task->ret > 0 && task->iov) {
115 if (task->ret <= task->iov->size) {
116 qemu_iovec_from_buf(task->iov, 0, data, task->ret);
117 } else {
118 task->ret = -EIO;
119 }
120 }
121 if (task->ret == 0 && task->st) {
122 memcpy(task->st, data, sizeof(struct stat));
123 }
20fccb18
PL
124 if (task->ret < 0) {
125 error_report("NFS Error: %s", nfs_get_error(nfs));
126 }
6542aa9c 127 if (task->co) {
471799d1
SH
128 task->bh = aio_bh_new(task->client->aio_context,
129 nfs_co_generic_bh_cb, task);
6542aa9c 130 qemu_bh_schedule(task->bh);
a2c0fe2f
PL
131 } else {
132 task->complete = 1;
6542aa9c
PL
133 }
134}
135
136static int coroutine_fn nfs_co_readv(BlockDriverState *bs,
137 int64_t sector_num, int nb_sectors,
138 QEMUIOVector *iov)
139{
140 NFSClient *client = bs->opaque;
141 NFSRPC task;
142
143 nfs_co_init_task(client, &task);
144 task.iov = iov;
145
146 if (nfs_pread_async(client->context, client->fh,
147 sector_num * BDRV_SECTOR_SIZE,
148 nb_sectors * BDRV_SECTOR_SIZE,
149 nfs_co_generic_cb, &task) != 0) {
150 return -ENOMEM;
151 }
152
153 while (!task.complete) {
154 nfs_set_events(client);
155 qemu_coroutine_yield();
156 }
157
158 if (task.ret < 0) {
159 return task.ret;
160 }
161
162 /* zero pad short reads */
163 if (task.ret < iov->size) {
164 qemu_iovec_memset(iov, task.ret, 0, iov->size - task.ret);
165 }
166
167 return 0;
168}
169
170static int coroutine_fn nfs_co_writev(BlockDriverState *bs,
171 int64_t sector_num, int nb_sectors,
172 QEMUIOVector *iov)
173{
174 NFSClient *client = bs->opaque;
175 NFSRPC task;
176 char *buf = NULL;
177
178 nfs_co_init_task(client, &task);
179
2347dd7b
KW
180 buf = g_try_malloc(nb_sectors * BDRV_SECTOR_SIZE);
181 if (nb_sectors && buf == NULL) {
182 return -ENOMEM;
183 }
184
6542aa9c
PL
185 qemu_iovec_to_buf(iov, 0, buf, nb_sectors * BDRV_SECTOR_SIZE);
186
187 if (nfs_pwrite_async(client->context, client->fh,
188 sector_num * BDRV_SECTOR_SIZE,
189 nb_sectors * BDRV_SECTOR_SIZE,
190 buf, nfs_co_generic_cb, &task) != 0) {
191 g_free(buf);
192 return -ENOMEM;
193 }
194
195 while (!task.complete) {
196 nfs_set_events(client);
197 qemu_coroutine_yield();
198 }
199
200 g_free(buf);
201
202 if (task.ret != nb_sectors * BDRV_SECTOR_SIZE) {
203 return task.ret < 0 ? task.ret : -EIO;
204 }
205
206 return 0;
207}
208
209static int coroutine_fn nfs_co_flush(BlockDriverState *bs)
210{
211 NFSClient *client = bs->opaque;
212 NFSRPC task;
213
214 nfs_co_init_task(client, &task);
215
216 if (nfs_fsync_async(client->context, client->fh, nfs_co_generic_cb,
217 &task) != 0) {
218 return -ENOMEM;
219 }
220
221 while (!task.complete) {
222 nfs_set_events(client);
223 qemu_coroutine_yield();
224 }
225
226 return task.ret;
227}
228
229/* TODO Convert to fine grained options */
230static QemuOptsList runtime_opts = {
231 .name = "nfs",
232 .head = QTAILQ_HEAD_INITIALIZER(runtime_opts.head),
233 .desc = {
234 {
235 .name = "filename",
236 .type = QEMU_OPT_STRING,
237 .help = "URL to the NFS file",
238 },
239 { /* end of list */ }
240 },
241};
242
471799d1
SH
243static void nfs_detach_aio_context(BlockDriverState *bs)
244{
245 NFSClient *client = bs->opaque;
246
dca21ef2
FZ
247 aio_set_fd_handler(client->aio_context, nfs_get_fd(client->context),
248 false, NULL, NULL, NULL);
471799d1
SH
249 client->events = 0;
250}
251
252static void nfs_attach_aio_context(BlockDriverState *bs,
253 AioContext *new_context)
254{
255 NFSClient *client = bs->opaque;
256
257 client->aio_context = new_context;
258 nfs_set_events(client);
259}
260
6542aa9c
PL
261static void nfs_client_close(NFSClient *client)
262{
263 if (client->context) {
264 if (client->fh) {
265 nfs_close(client->context, client->fh);
266 }
dca21ef2
FZ
267 aio_set_fd_handler(client->aio_context, nfs_get_fd(client->context),
268 false, NULL, NULL, NULL);
6542aa9c
PL
269 nfs_destroy_context(client->context);
270 }
271 memset(client, 0, sizeof(NFSClient));
272}
273
274static void nfs_file_close(BlockDriverState *bs)
275{
276 NFSClient *client = bs->opaque;
277 nfs_client_close(client);
278}
279
280static int64_t nfs_client_open(NFSClient *client, const char *filename,
281 int flags, Error **errp)
282{
283 int ret = -EINVAL, i;
284 struct stat st;
285 URI *uri;
286 QueryParams *qp = NULL;
287 char *file = NULL, *strp = NULL;
288
289 uri = uri_parse(filename);
290 if (!uri) {
291 error_setg(errp, "Invalid URL specified");
5f4d5e1a
HR
292 goto fail;
293 }
294 if (!uri->server) {
295 error_setg(errp, "Invalid URL specified");
6542aa9c
PL
296 goto fail;
297 }
298 strp = strrchr(uri->path, '/');
299 if (strp == NULL) {
300 error_setg(errp, "Invalid URL specified");
301 goto fail;
302 }
303 file = g_strdup(strp);
304 *strp = 0;
305
306 client->context = nfs_init_context();
307 if (client->context == NULL) {
308 error_setg(errp, "Failed to init NFS context");
309 goto fail;
310 }
311
312 qp = query_params_parse(uri->query);
313 for (i = 0; i < qp->n; i++) {
7c24384b 314 unsigned long long val;
6542aa9c
PL
315 if (!qp->p[i].value) {
316 error_setg(errp, "Value for NFS parameter expected: %s",
317 qp->p[i].name);
318 goto fail;
319 }
7c24384b
PL
320 if (parse_uint_full(qp->p[i].value, &val, 0)) {
321 error_setg(errp, "Illegal value for NFS parameter: %s",
322 qp->p[i].name);
323 goto fail;
324 }
325 if (!strcmp(qp->p[i].name, "uid")) {
326 nfs_set_uid(client->context, val);
327 } else if (!strcmp(qp->p[i].name, "gid")) {
328 nfs_set_gid(client->context, val);
329 } else if (!strcmp(qp->p[i].name, "tcp-syncnt")) {
330 nfs_set_tcp_syncnt(client->context, val);
f42ca3ca
PL
331#ifdef LIBNFS_FEATURE_READAHEAD
332 } else if (!strcmp(qp->p[i].name, "readahead")) {
29c838cd
PL
333 if (val > QEMU_NFS_MAX_READAHEAD_SIZE) {
334 error_report("NFS Warning: Truncating NFS readahead"
335 " size to %d", QEMU_NFS_MAX_READAHEAD_SIZE);
336 val = QEMU_NFS_MAX_READAHEAD_SIZE;
337 }
f42ca3ca 338 nfs_set_readahead(client->context, val);
7725b8bf
PL
339#endif
340#ifdef LIBNFS_FEATURE_DEBUG
341 } else if (!strcmp(qp->p[i].name, "debug")) {
342 /* limit the maximum debug level to avoid potential flooding
343 * of our log files. */
344 if (val > QEMU_NFS_MAX_DEBUG_LEVEL) {
345 error_report("NFS Warning: Limiting NFS debug level"
346 " to %d", QEMU_NFS_MAX_DEBUG_LEVEL);
347 val = QEMU_NFS_MAX_DEBUG_LEVEL;
348 }
349 nfs_set_debug(client->context, val);
f42ca3ca 350#endif
6542aa9c
PL
351 } else {
352 error_setg(errp, "Unknown NFS parameter name: %s",
353 qp->p[i].name);
354 goto fail;
355 }
356 }
357
358 ret = nfs_mount(client->context, uri->server, uri->path);
359 if (ret < 0) {
360 error_setg(errp, "Failed to mount nfs share: %s",
361 nfs_get_error(client->context));
362 goto fail;
363 }
364
365 if (flags & O_CREAT) {
366 ret = nfs_creat(client->context, file, 0600, &client->fh);
367 if (ret < 0) {
368 error_setg(errp, "Failed to create file: %s",
369 nfs_get_error(client->context));
370 goto fail;
371 }
372 } else {
373 ret = nfs_open(client->context, file, flags, &client->fh);
374 if (ret < 0) {
375 error_setg(errp, "Failed to open file : %s",
376 nfs_get_error(client->context));
377 goto fail;
378 }
379 }
380
381 ret = nfs_fstat(client->context, client->fh, &st);
382 if (ret < 0) {
383 error_setg(errp, "Failed to fstat file: %s",
384 nfs_get_error(client->context));
385 goto fail;
386 }
387
388 ret = DIV_ROUND_UP(st.st_size, BDRV_SECTOR_SIZE);
18a8056e 389 client->st_blocks = st.st_blocks;
6542aa9c
PL
390 client->has_zero_init = S_ISREG(st.st_mode);
391 goto out;
392fail:
393 nfs_client_close(client);
394out:
395 if (qp) {
396 query_params_free(qp);
397 }
398 uri_free(uri);
399 g_free(file);
400 return ret;
401}
402
403static int nfs_file_open(BlockDriverState *bs, QDict *options, int flags,
404 Error **errp) {
405 NFSClient *client = bs->opaque;
406 int64_t ret;
407 QemuOpts *opts;
408 Error *local_err = NULL;
409
471799d1
SH
410 client->aio_context = bdrv_get_aio_context(bs);
411
6542aa9c
PL
412 opts = qemu_opts_create(&runtime_opts, NULL, 0, &error_abort);
413 qemu_opts_absorb_qdict(opts, options, &local_err);
0fb6395c 414 if (local_err) {
6542aa9c 415 error_propagate(errp, local_err);
810f4f86
FZ
416 ret = -EINVAL;
417 goto out;
6542aa9c
PL
418 }
419 ret = nfs_client_open(client, qemu_opt_get(opts, "filename"),
420 (flags & BDRV_O_RDWR) ? O_RDWR : O_RDONLY,
421 errp);
422 if (ret < 0) {
810f4f86 423 goto out;
6542aa9c
PL
424 }
425 bs->total_sectors = ret;
810f4f86
FZ
426 ret = 0;
427out:
428 qemu_opts_del(opts);
429 return ret;
6542aa9c
PL
430}
431
fd752801
HR
432static QemuOptsList nfs_create_opts = {
433 .name = "nfs-create-opts",
434 .head = QTAILQ_HEAD_INITIALIZER(nfs_create_opts.head),
435 .desc = {
436 {
437 .name = BLOCK_OPT_SIZE,
438 .type = QEMU_OPT_SIZE,
439 .help = "Virtual disk size"
440 },
441 { /* end of list */ }
442 }
443};
444
98c10b81 445static int nfs_file_create(const char *url, QemuOpts *opts, Error **errp)
6542aa9c
PL
446{
447 int ret = 0;
448 int64_t total_size = 0;
5839e53b 449 NFSClient *client = g_new0(NFSClient, 1);
6542aa9c 450
471799d1
SH
451 client->aio_context = qemu_get_aio_context();
452
6542aa9c 453 /* Read out options */
c2eb918e
HT
454 total_size = ROUND_UP(qemu_opt_get_size_del(opts, BLOCK_OPT_SIZE, 0),
455 BDRV_SECTOR_SIZE);
6542aa9c
PL
456
457 ret = nfs_client_open(client, url, O_CREAT, errp);
458 if (ret < 0) {
459 goto out;
460 }
461 ret = nfs_ftruncate(client->context, client->fh, total_size);
462 nfs_client_close(client);
463out:
464 g_free(client);
465 return ret;
466}
467
468static int nfs_has_zero_init(BlockDriverState *bs)
469{
470 NFSClient *client = bs->opaque;
471 return client->has_zero_init;
472}
473
474static int64_t nfs_get_allocated_file_size(BlockDriverState *bs)
475{
476 NFSClient *client = bs->opaque;
477 NFSRPC task = {0};
478 struct stat st;
479
18a8056e
PL
480 if (bdrv_is_read_only(bs) &&
481 !(bs->open_flags & BDRV_O_NOCACHE)) {
482 return client->st_blocks * 512;
483 }
484
6542aa9c
PL
485 task.st = &st;
486 if (nfs_fstat_async(client->context, client->fh, nfs_co_generic_cb,
487 &task) != 0) {
488 return -ENOMEM;
489 }
490
491 while (!task.complete) {
492 nfs_set_events(client);
471799d1 493 aio_poll(client->aio_context, true);
6542aa9c
PL
494 }
495
055c6f91 496 return (task.ret < 0 ? task.ret : st.st_blocks * 512);
6542aa9c
PL
497}
498
499static int nfs_file_truncate(BlockDriverState *bs, int64_t offset)
500{
501 NFSClient *client = bs->opaque;
502 return nfs_ftruncate(client->context, client->fh, offset);
503}
504
18a8056e
PL
505/* Note that this will not re-establish a connection with the NFS server
506 * - it is effectively a NOP. */
507static int nfs_reopen_prepare(BDRVReopenState *state,
508 BlockReopenQueue *queue, Error **errp)
509{
510 NFSClient *client = state->bs->opaque;
511 struct stat st;
512 int ret = 0;
513
514 if (state->flags & BDRV_O_RDWR && bdrv_is_read_only(state->bs)) {
515 error_setg(errp, "Cannot open a read-only mount as read-write");
516 return -EACCES;
517 }
518
519 /* Update cache for read-only reopens */
520 if (!(state->flags & BDRV_O_RDWR)) {
521 ret = nfs_fstat(client->context, client->fh, &st);
522 if (ret < 0) {
523 error_setg(errp, "Failed to fstat file: %s",
524 nfs_get_error(client->context));
525 return ret;
526 }
527 client->st_blocks = st.st_blocks;
528 }
529
530 return 0;
531}
532
6542aa9c 533static BlockDriver bdrv_nfs = {
471799d1
SH
534 .format_name = "nfs",
535 .protocol_name = "nfs",
536
537 .instance_size = sizeof(NFSClient),
538 .bdrv_needs_filename = true,
fd752801
HR
539 .create_opts = &nfs_create_opts,
540
471799d1
SH
541 .bdrv_has_zero_init = nfs_has_zero_init,
542 .bdrv_get_allocated_file_size = nfs_get_allocated_file_size,
543 .bdrv_truncate = nfs_file_truncate,
544
545 .bdrv_file_open = nfs_file_open,
546 .bdrv_close = nfs_file_close,
c282e1fd 547 .bdrv_create = nfs_file_create,
18a8056e 548 .bdrv_reopen_prepare = nfs_reopen_prepare,
471799d1
SH
549
550 .bdrv_co_readv = nfs_co_readv,
551 .bdrv_co_writev = nfs_co_writev,
552 .bdrv_co_flush_to_disk = nfs_co_flush,
553
554 .bdrv_detach_aio_context = nfs_detach_aio_context,
555 .bdrv_attach_aio_context = nfs_attach_aio_context,
6542aa9c
PL
556};
557
558static void nfs_block_init(void)
559{
560 bdrv_register(&bdrv_nfs);
561}
562
563block_init(nfs_block_init);