2 * QEMU Block driver for native access to files on NFS shares
6 * Permission is hereby granted, free of charge, to any person obtaining a copy
7 * of this software and associated documentation files (the "Software"), to deal
8 * in the Software without restriction, including without limitation the rights
9 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
10 * copies of the Software, and to permit persons to whom the Software is
11 * furnished to do so, subject to the following conditions:
13 * The above copyright notice and this permission notice shall be included in
14 * all copies or substantial portions of the Software.
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
19 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
21 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
25 #include "qemu/osdep.h"
28 #include "qemu-common.h"
29 #include "qemu/config-file.h"
30 #include "qemu/error-report.h"
31 #include "qapi/error.h"
32 #include "block/block_int.h"
36 #include "qemu/cutils.h"
37 #include "sysemu/sysemu.h"
38 #include "qapi/qmp/qdict.h"
39 #include "qapi/qmp/qint.h"
40 #include "qapi/qmp/qstring.h"
41 #include "qapi-visit.h"
42 #include "qapi/qobject-input-visitor.h"
43 #include "qapi/qobject-output-visitor.h"
44 #include <nfsc/libnfs.h>
/*
 * Upper limits for user-supplied tuning options.  nfs_client_open() clamps
 * readahead-size, page-cache-size and debug to these values and reports a
 * warning when it does so.
 */
47 #define QEMU_NFS_MAX_READAHEAD_SIZE 1048576
/* 8388608 bytes expressed as a count of NFS_BLKSIZE-sized units. */
48 #define QEMU_NFS_MAX_PAGECACHE_SIZE (8388608 / NFS_BLKSIZE)
49 #define QEMU_NFS_MAX_DEBUG_LEVEL 2
/*
 * Driver state for one NFS-backed image; this is what bs->opaque points to
 * (bdrv_nfs.instance_size is sizeof(NFSClient)).  Only part of the member
 * list is visible in this excerpt.
 */
51 typedef struct NFSClient {
52 struct nfs_context *context;
/* AioContext on which the fd handlers and completion BHs are registered. */
56 AioContext *aio_context;
/* Values of the optional tuning options; assigned in nfs_client_open(). */
62 int64_t uid, gid, tcp_syncnt, readahead, pagecache, debug;
/*
 * State of one asynchronous libnfs request issued by this driver.  The
 * member list is not visible in this excerpt; code in this file accesses
 * co, client, ret, iov, complete, st and bs.
 */
65 typedef struct NFSRPC {
/*
 * Parse the nfs:// URI in @filename and store its components in @options:
 * "server.host", "server.type" (always "inet") and "path", plus one entry
 * per recognised query parameter (uid -> "user", gid -> "group",
 * tcp-syncnt -> "tcp-syn-count", readahead -> "readahead-size",
 * pagecache -> "page-cache-size", debug -> "debug").
 *
 * Every query parameter needs a value that parse_uint_full() accepts; the
 * value is nevertheless stored as a string.  Failures are reported through
 * @errp.  The return statements are not visible in this excerpt;
 * nfs_file_create() stores the result in its own ret variable.
 */
75 static int nfs_parse_uri(const char *filename, QDict *options, Error **errp)
78 QueryParams *qp = NULL;
81 uri = uri_parse(filename);
83 error_setg(errp, "Invalid URI specified");
86 if (strcmp(uri->scheme, "nfs") != 0) {
87 error_setg(errp, "URI scheme must be 'nfs'");
92 error_setg(errp, "missing hostname in URI");
97 error_setg(errp, "missing file path in URI");
101 qp = query_params_parse(uri->query);
103 error_setg(errp, "could not parse query parameters");
/* Mandatory components taken straight from the URI. */
107 qdict_put(options, "server.host", qstring_from_str(uri->server));
108 qdict_put(options, "server.type", qstring_from_str("inet"));
109 qdict_put(options, "path", qstring_from_str(uri->path));
111 for (i = 0; i < qp->n; i++) {
112 unsigned long long val;
113 if (!qp->p[i].value) {
114 error_setg(errp, "Value for NFS parameter expected: %s",
/* Numeric validation only; the original string is what gets stored below. */
118 if (parse_uint_full(qp->p[i].value, &val, 0)) {
119 error_setg(errp, "Illegal value for NFS parameter: %s",
/* Map the URI parameter name onto the runtime option name. */
123 if (!strcmp(qp->p[i].name, "uid")) {
124 qdict_put(options, "user",
125 qstring_from_str(qp->p[i].value));
126 } else if (!strcmp(qp->p[i].name, "gid")) {
127 qdict_put(options, "group",
128 qstring_from_str(qp->p[i].value));
129 } else if (!strcmp(qp->p[i].name, "tcp-syncnt")) {
130 qdict_put(options, "tcp-syn-count",
131 qstring_from_str(qp->p[i].value));
132 } else if (!strcmp(qp->p[i].name, "readahead")) {
133 qdict_put(options, "readahead-size",
134 qstring_from_str(qp->p[i].value));
135 } else if (!strcmp(qp->p[i].name, "pagecache")) {
136 qdict_put(options, "page-cache-size",
137 qstring_from_str(qp->p[i].value));
138 } else if (!strcmp(qp->p[i].name, "debug")) {
139 qdict_put(options, "debug",
140 qstring_from_str(qp->p[i].value));
142 error_setg(errp, "Unknown NFS parameter name: %s",
150 query_params_free(qp);
/*
 * Walk @options looking for a key that nfs_parse_uri() would also derive
 * from a filename ("host", "path", "user", "group", "tcp-syn-count",
 * "readahead-size", "page-cache-size", "debug", or anything starting with
 * "server.").  For such a key an error naming the option is set in @errp.
 *
 * NOTE(review): presumably returns true when a conflicting key was found;
 * the return statements are not visible in this excerpt.
 */
158 static bool nfs_has_filename_options_conflict(QDict *options, Error **errp)
160 const QDictEntry *qe;
162 for (qe = qdict_first(options); qe; qe = qdict_next(options, qe)) {
163 if (!strcmp(qe->key, "host") ||
164 !strcmp(qe->key, "path") ||
165 !strcmp(qe->key, "user") ||
166 !strcmp(qe->key, "group") ||
167 !strcmp(qe->key, "tcp-syn-count") ||
168 !strcmp(qe->key, "readahead-size") ||
169 !strcmp(qe->key, "page-cache-size") ||
170 !strcmp(qe->key, "debug") ||
171 strstart(qe->key, "server.", NULL))
173 error_setg(errp, "Option %s cannot be used with a filename",
/*
 * .bdrv_parse_filename callback (see bdrv_nfs): checks @options for keys
 * that conflict with a filename, then converts @filename into entries of
 * @options via nfs_parse_uri().  Errors are reported through @errp.
 */
182 static void nfs_parse_filename(const char *filename, QDict *options,
185 if (nfs_has_filename_options_conflict(options, errp)) {
189 nfs_parse_uri(filename, options, errp);
/* Forward declarations: nfs_set_events() refers to both handlers. */
192 static void nfs_process_read(void *arg);
193 static void nfs_process_write(void *arg);
/*
 * Synchronise the registered fd handlers with what libnfs currently wants
 * to poll for.  When nfs_which_events() differs from client->events, the
 * handlers on the libnfs socket are re-registered: a read handler if POLLIN
 * is requested and a write handler if POLLOUT is requested.
 */
195 /* Called with QemuMutex held. */
196 static void nfs_set_events(NFSClient *client)
198 int ev = nfs_which_events(client->context);
199 if (ev != client->events) {
200 aio_set_fd_handler(client->aio_context, nfs_get_fd(client->context),
202 (ev & POLLIN) ? nfs_process_read : NULL,
203 (ev & POLLOUT) ? nfs_process_write : NULL,
/*
 * fd read handler; @arg is the NFSClient.  Lets libnfs process readable
 * data (POLLIN) under client->mutex, then refreshes the handler set.
 */
210 static void nfs_process_read(void *arg)
212 NFSClient *client = arg;
214 qemu_mutex_lock(&client->mutex);
215 nfs_service(client->context, POLLIN);
216 nfs_set_events(client);
217 qemu_mutex_unlock(&client->mutex);
/*
 * fd write handler; @arg is the NFSClient.  Lets libnfs make progress on
 * output (POLLOUT) under client->mutex, then refreshes the handler set.
 */
220 static void nfs_process_write(void *arg)
222 NFSClient *client = arg;
224 qemu_mutex_lock(&client->mutex);
225 nfs_service(client->context, POLLOUT);
226 nfs_set_events(client);
227 qemu_mutex_unlock(&client->mutex);
/*
 * Initialise @task for a request issued from the calling coroutine: records
 * qemu_coroutine_self() and the NFSClient taken from bs->opaque.  Any other
 * initialisers are on lines not visible in this excerpt.
 */
230 static void nfs_co_init_task(BlockDriverState *bs, NFSRPC *task)
233 .co = qemu_coroutine_self(),
235 .client = bs->opaque,
/*
 * Bottom half scheduled by nfs_co_generic_cb(); @opaque is the NFSRPC.
 * Wakes the coroutine that is waiting for the request.
 */
239 static void nfs_co_generic_bh_cb(void *opaque)
241 NFSRPC *task = opaque;
244 aio_co_wake(task->co);
/*
 * Completion callback handed to nfs_pread_async(), nfs_pwrite_async() and
 * nfs_fsync_async(); @private_data is the NFSRPC of the request.
 *
 * For a positive result with an iovec attached, the returned bytes are
 * copied from @data into that iovec when they fit.  The libnfs error text
 * is reported with error_report() (the guarding condition is on a line not
 * visible here).  Finally a one-shot bottom half is scheduled in the
 * client's AioContext to wake the waiting coroutine.
 */
247 /* Called (via nfs_service) with QemuMutex held. */
249 nfs_co_generic_cb(int ret, struct nfs_context *nfs, void *data,
252 NFSRPC *task = private_data;
255 if (task->ret > 0 && task->iov) {
256 if (task->ret <= task->iov->size) {
257 qemu_iovec_from_buf(task->iov, 0, data, task->ret);
263 error_report("NFS Error: %s", nfs_get_error(nfs));
265 aio_bh_schedule_oneshot(task->client->aio_context,
266 nfs_co_generic_bh_cb, task);
/*
 * .bdrv_co_preadv callback: read @bytes at @offset into @iov.
 *
 * The request is submitted with nfs_pread_async() while holding
 * client->mutex; the coroutine then yields until the completion callback
 * has marked the task complete.  A read that returned fewer bytes than
 * iov->size is zero-padded.  The return statements are not visible in this
 * excerpt.
 */
269 static int coroutine_fn nfs_co_preadv(BlockDriverState *bs, uint64_t offset,
270 uint64_t bytes, QEMUIOVector *iov,
273 NFSClient *client = bs->opaque;
276 nfs_co_init_task(bs, &task);
279 qemu_mutex_lock(&client->mutex);
280 if (nfs_pread_async(client->context, client->fh,
281 offset, bytes, nfs_co_generic_cb, &task) != 0) {
/* Submission failed: drop the lock before leaving. */
282 qemu_mutex_unlock(&client->mutex);
286 nfs_set_events(client);
287 qemu_mutex_unlock(&client->mutex);
288 while (!task.complete) {
289 qemu_coroutine_yield();
296 /* zero pad short reads */
297 if (task.ret < iov->size) {
298 qemu_iovec_memset(iov, task.ret, 0, iov->size - task.ret);
/*
 * .bdrv_co_pwritev callback: write @bytes from @iov at @offset.
 *
 * A multi-element @iov is first linearised into a temporary buffer obtained
 * with g_try_malloc(); a single-element @iov is written straight from its
 * base pointer.  The request is submitted with nfs_pwrite_async() under
 * client->mutex and the coroutine yields until completion.  When the
 * completed byte count differs from @bytes, the result is task.ret if that
 * is negative and -EIO otherwise.
 */
304 static int coroutine_fn nfs_co_pwritev(BlockDriverState *bs, uint64_t offset,
305 uint64_t bytes, QEMUIOVector *iov,
308 NFSClient *client = bs->opaque;
311 bool my_buffer = false;
313 nfs_co_init_task(bs, &task);
315 if (iov->niov != 1) {
316 buf = g_try_malloc(bytes);
/* A NULL result is only a failure when a non-zero size was requested. */
317 if (bytes && buf == NULL) {
320 qemu_iovec_to_buf(iov, 0, buf, bytes);
323 buf = iov->iov[0].iov_base;
326 qemu_mutex_lock(&client->mutex);
327 if (nfs_pwrite_async(client->context, client->fh,
329 nfs_co_generic_cb, &task) != 0) {
330 qemu_mutex_unlock(&client->mutex);
337 nfs_set_events(client);
338 qemu_mutex_unlock(&client->mutex);
339 while (!task.complete) {
340 qemu_coroutine_yield();
347 if (task.ret != bytes) {
348 return task.ret < 0 ? task.ret : -EIO;
/*
 * .bdrv_co_flush_to_disk callback: submits nfs_fsync_async() for the open
 * file under client->mutex and yields until the completion callback has
 * marked the task complete.  The return statements are not visible in this
 * excerpt.
 */
354 static int coroutine_fn nfs_co_flush(BlockDriverState *bs)
356 NFSClient *client = bs->opaque;
359 nfs_co_init_task(bs, &task);
361 qemu_mutex_lock(&client->mutex);
362 if (nfs_fsync_async(client->context, client->fh, nfs_co_generic_cb,
364 qemu_mutex_unlock(&client->mutex);
368 nfs_set_events(client);
369 qemu_mutex_unlock(&client->mutex);
370 while (!task.complete) {
371 qemu_coroutine_yield();
/*
 * Runtime options absorbed from the options QDict by nfs_client_open().
 * Several .name lines are not visible in this excerpt; nfs_client_open()
 * reads "path", "user", "group", "tcp-syn-count", "readahead-size",
 * "page-cache-size" and "debug" from this list.
 */
377 static QemuOptsList runtime_opts = {
379 .head = QTAILQ_HEAD_INITIALIZER(runtime_opts.head),
383 .type = QEMU_OPT_STRING,
384 .help = "Path of the image on the host",
388 .type = QEMU_OPT_NUMBER,
389 .help = "UID value to use when talking to the server",
393 .type = QEMU_OPT_NUMBER,
394 .help = "GID value to use when talking to the server",
397 .name = "tcp-syn-count",
398 .type = QEMU_OPT_NUMBER,
399 .help = "Number of SYNs to send during the session establish",
402 .name = "readahead-size",
403 .type = QEMU_OPT_NUMBER,
404 .help = "Set the readahead size in bytes",
/*
 * NOTE(review): the help text says bytes, but nfs_client_open() clamps this
 * value against QEMU_NFS_MAX_PAGECACHE_SIZE (8388608 / NFS_BLKSIZE) and its
 * warning speaks of pages -- confirm the intended unit.
 */
407 .name = "page-cache-size",
408 .type = QEMU_OPT_NUMBER,
409 .help = "Set the pagecache size in bytes",
413 .type = QEMU_OPT_NUMBER,
414 .help = "Set the NFS debug level (max 2)",
416 { /* end of list */ }
/*
 * .bdrv_detach_aio_context callback: removes the handlers registered for
 * the libnfs socket from the client's current AioContext by registering
 * NULL handlers.
 */
420 static void nfs_detach_aio_context(BlockDriverState *bs)
422 NFSClient *client = bs->opaque;
424 aio_set_fd_handler(client->aio_context, nfs_get_fd(client->context),
425 false, NULL, NULL, NULL, NULL);
/*
 * .bdrv_attach_aio_context callback: remembers @new_context as the client's
 * AioContext and lets nfs_set_events() register the fd handlers there.
 */
429 static void nfs_attach_aio_context(BlockDriverState *bs,
430 AioContext *new_context)
432 NFSClient *client = bs->opaque;
434 client->aio_context = new_context;
435 nfs_set_events(client);
/*
 * Tear down the libnfs side of @client.  With a context present, the file
 * handle is closed with nfs_close(), the fd handlers are removed and the
 * context is destroyed.  The whole NFSClient is zeroed with memset(), which
 * also wipes every other member of the structure.
 */
438 static void nfs_client_close(NFSClient *client)
440 if (client->context) {
442 nfs_close(client->context, client->fh);
444 aio_set_fd_handler(client->aio_context, nfs_get_fd(client->context),
445 false, NULL, NULL, NULL, NULL);
446 nfs_destroy_context(client->context);
448 memset(client, 0, sizeof(NFSClient));
/*
 * .bdrv_close callback: closes the NFS client state and destroys its mutex.
 *
 * NOTE(review): nfs_client_close() memsets the entire NFSClient, so
 * client->mutex has already been overwritten with zeroes when it is
 * destroyed here -- confirm this ordering is intended.
 */
451 static void nfs_file_close(BlockDriverState *bs)
453 NFSClient *client = bs->opaque;
454 nfs_client_close(client);
455 qemu_mutex_destroy(&client->mutex);
/*
 * Build an NFSServer from the "server.*" entries of @options.
 *
 * The entries are moved into a separate dict with qdict_extract_subqdict(),
 * crumpled into a nested QObject and fed to the QAPI input visitor.  An
 * empty "server." set produces the error "NFS server address missing".
 * Errors are reported through @errp; nfs_client_open() treats a NULL result
 * as failure.
 */
458 static NFSServer *nfs_config(QDict *options, Error **errp)
460 NFSServer *server = NULL;
462 QObject *crumpled_addr = NULL;
464 Error *local_error = NULL;
466 qdict_extract_subqdict(options, &addr, "server.");
467 if (!qdict_size(addr)) {
468 error_setg(errp, "NFS server address missing");
472 crumpled_addr = qdict_crumple(addr, errp);
473 if (!crumpled_addr) {
478 * Caution: this works only because all scalar members of
479 * NFSServer are QString in @crumpled_addr. The visitor expects
480 * @crumpled_addr to be typed according to the QAPI schema. It
481 * is when @options come from -blockdev or blockdev_add. But when
482 * they come from -drive, they're all QString.
484 iv = qobject_input_visitor_new(crumpled_addr);
485 visit_type_NFSServer(iv, NULL, &server, &local_error);
487 error_propagate(errp, local_error);
493 qobject_decref(crumpled_addr);
/*
 * Connect @client to the export described by @options and open (or, with
 * O_CREAT in @flags, create) the image file.
 *
 * Steps visible in this excerpt:
 *  - absorb @options into runtime_opts and take a copy of "path";
 *  - locate the last '/' in the path (the file name is duplicated from
 *    there) and build the server address with nfs_config();
 *  - create a libnfs context and apply the optional user, group,
 *    tcp-syn-count, readahead-size, page-cache-size and debug settings,
 *    the latter three only when libnfs advertises the feature and each
 *    clamped to its QEMU_NFS_MAX_* limit;
 *  - mount client->path on client->server->host, create/open the file and
 *    fstat it.
 *
 * readahead-size and page-cache-size are rejected when @open_flags contains
 * BDRV_O_NOCACHE.  After a successful fstat, ret holds the file size in
 * BDRV_SECTOR_SIZE units, rounded up (nfs_file_open() stores the return
 * value in bs->total_sectors), and st_blocks / has_zero_init are cached in
 * @client.  Errors are reported through @errp.
 */
499 static int64_t nfs_client_open(NFSClient *client, QDict *options,
500 int flags, int open_flags, Error **errp)
503 QemuOpts *opts = NULL;
504 Error *local_err = NULL;
506 char *file = NULL, *strp = NULL;
508 opts = qemu_opts_create(&runtime_opts, NULL, 0, &error_abort);
509 qemu_opts_absorb_qdict(opts, options, &local_err);
511 error_propagate(errp, local_err);
516 client->path = g_strdup(qemu_opt_get(opts, "path"));
519 error_setg(errp, "No path was specified");
523 strp = strrchr(client->path, '/');
525 error_setg(errp, "Invalid URL specified");
528 file = g_strdup(strp);
531 /* Pop the config into our state object, Exit if invalid */
532 client->server = nfs_config(options, errp);
533 if (!client->server) {
538 client->context = nfs_init_context();
539 if (client->context == NULL) {
540 error_setg(errp, "Failed to init NFS context");
544 if (qemu_opt_get(opts, "user")) {
545 client->uid = qemu_opt_get_number(opts, "user", 0);
546 nfs_set_uid(client->context, client->uid);
549 if (qemu_opt_get(opts, "group")) {
550 client->gid = qemu_opt_get_number(opts, "group", 0);
551 nfs_set_gid(client->context, client->gid);
554 if (qemu_opt_get(opts, "tcp-syn-count")) {
555 client->tcp_syncnt = qemu_opt_get_number(opts, "tcp-syn-count", 0);
556 nfs_set_tcp_syncnt(client->context, client->tcp_syncnt);
559 #ifdef LIBNFS_FEATURE_READAHEAD
560 if (qemu_opt_get(opts, "readahead-size")) {
561 if (open_flags & BDRV_O_NOCACHE) {
562 error_setg(errp, "Cannot enable NFS readahead "
563 "if cache.direct = on");
566 client->readahead = qemu_opt_get_number(opts, "readahead-size", 0);
567 if (client->readahead > QEMU_NFS_MAX_READAHEAD_SIZE) {
568 error_report("NFS Warning: Truncating NFS readahead "
569 "size to %d", QEMU_NFS_MAX_READAHEAD_SIZE);
570 client->readahead = QEMU_NFS_MAX_READAHEAD_SIZE;
572 nfs_set_readahead(client->context, client->readahead);
573 #ifdef LIBNFS_FEATURE_PAGECACHE
574 nfs_set_pagecache_ttl(client->context, 0);
/* Remembered so nfs_reopen_prepare() can refuse switching to O_NOCACHE. */
576 client->cache_used = true;
580 #ifdef LIBNFS_FEATURE_PAGECACHE
581 if (qemu_opt_get(opts, "page-cache-size")) {
582 if (open_flags & BDRV_O_NOCACHE) {
583 error_setg(errp, "Cannot enable NFS pagecache "
584 "if cache.direct = on");
587 client->pagecache = qemu_opt_get_number(opts, "page-cache-size", 0);
588 if (client->pagecache > QEMU_NFS_MAX_PAGECACHE_SIZE) {
589 error_report("NFS Warning: Truncating NFS pagecache "
590 "size to %d pages", QEMU_NFS_MAX_PAGECACHE_SIZE);
591 client->pagecache = QEMU_NFS_MAX_PAGECACHE_SIZE;
593 nfs_set_pagecache(client->context, client->pagecache);
594 nfs_set_pagecache_ttl(client->context, 0);
595 client->cache_used = true;
599 #ifdef LIBNFS_FEATURE_DEBUG
600 if (qemu_opt_get(opts, "debug")) {
601 client->debug = qemu_opt_get_number(opts, "debug", 0);
602 /* limit the maximum debug level to avoid potential flooding
603 * of our log files. */
604 if (client->debug > QEMU_NFS_MAX_DEBUG_LEVEL) {
605 error_report("NFS Warning: Limiting NFS debug level "
606 "to %d", QEMU_NFS_MAX_DEBUG_LEVEL);
607 client->debug = QEMU_NFS_MAX_DEBUG_LEVEL;
609 nfs_set_debug(client->context, client->debug);
613 ret = nfs_mount(client->context, client->server->host, client->path);
615 error_setg(errp, "Failed to mount nfs share: %s",
616 nfs_get_error(client->context));
620 if (flags & O_CREAT) {
621 ret = nfs_creat(client->context, file, 0600, &client->fh);
623 error_setg(errp, "Failed to create file: %s",
624 nfs_get_error(client->context));
628 ret = nfs_open(client->context, file, flags, &client->fh);
630 error_setg(errp, "Failed to open file : %s",
631 nfs_get_error(client->context));
636 ret = nfs_fstat(client->context, client->fh, &st);
638 error_setg(errp, "Failed to fstat file: %s",
639 nfs_get_error(client->context));
/* Size in sectors, rounded up; plus values cached for later queries. */
643 ret = DIV_ROUND_UP(st.st_size, BDRV_SECTOR_SIZE);
644 client->st_blocks = st.st_blocks;
645 client->has_zero_init = S_ISREG(st.st_mode);
650 nfs_client_close(client);
/*
 * .bdrv_file_open callback: opens the image through nfs_client_open() with
 * O_RDWR when BDRV_O_RDWR is set in @flags and O_RDONLY otherwise, then
 * initialises the client mutex and stores the value returned by
 * nfs_client_open() as bs->total_sectors.
 */
657 static int nfs_file_open(BlockDriverState *bs, QDict *options, int flags,
659 NFSClient *client = bs->opaque;
662 client->aio_context = bdrv_get_aio_context(bs);
664 ret = nfs_client_open(client, options,
665 (flags & BDRV_O_RDWR) ? O_RDWR : O_RDONLY,
666 bs->open_flags, errp);
670 qemu_mutex_init(&client->mutex);
671 bs->total_sectors = ret;
/*
 * Image creation options (referenced from bdrv_nfs.create_opts); the
 * visible entry is the virtual disk size, read by nfs_file_create().
 */
676 static QemuOptsList nfs_create_opts = {
677 .name = "nfs-create-opts",
678 .head = QTAILQ_HEAD_INITIALIZER(nfs_create_opts.head),
681 .name = BLOCK_OPT_SIZE,
682 .type = QEMU_OPT_SIZE,
683 .help = "Virtual disk size"
685 { /* end of list */ }
/*
 * .bdrv_create callback: creates the image file named by @url.
 *
 * Uses a temporary, heap-allocated NFSClient bound to the main AioContext.
 * The requested size is taken (and removed) from @opts and rounded up; the
 * alignment argument is on a line not visible in this excerpt.  @url is
 * parsed into a fresh QDict, the file is opened with O_CREAT, truncated to
 * the computed size and the client is closed again.
 */
689 static int nfs_file_create(const char *url, QemuOpts *opts, Error **errp)
692 int64_t total_size = 0;
693 NFSClient *client = g_new0(NFSClient, 1);
694 QDict *options = NULL;
696 client->aio_context = qemu_get_aio_context();
698 /* Read out options */
699 total_size = ROUND_UP(qemu_opt_get_size_del(opts, BLOCK_OPT_SIZE, 0),
702 options = qdict_new();
703 ret = nfs_parse_uri(url, options, errp);
708 ret = nfs_client_open(client, options, O_CREAT, 0, errp);
712 ret = nfs_ftruncate(client->context, client->fh, total_size);
713 nfs_client_close(client);
/*
 * .bdrv_has_zero_init callback: returns the flag cached by
 * nfs_client_open(), which is S_ISREG() of the opened file's mode.
 */
720 static int nfs_has_zero_init(BlockDriverState *bs)
722 NFSClient *client = bs->opaque;
723 return client->has_zero_init;
/*
 * Completion callback for the nfs_fstat_async() call issued by
 * nfs_get_allocated_file_size(); @private_data is the NFSRPC.  On a zero
 * result the returned struct stat is copied into task->st.  The libnfs
 * error text is reported with error_report() (guarding condition not
 * visible here), and the BlockDriverState polling on the task is woken.
 */
726 /* Called (via nfs_service) with QemuMutex held. */
728 nfs_get_allocated_file_size_cb(int ret, struct nfs_context *nfs, void *data,
731 NFSRPC *task = private_data;
733 if (task->ret == 0) {
734 memcpy(task->st, data, sizeof(struct stat));
737 error_report("NFS Error: %s", nfs_get_error(nfs));
740 bdrv_wakeup(task->bs);
/*
 * .bdrv_get_allocated_file_size callback.
 *
 * For a read-only node opened without BDRV_O_NOCACHE the cached st_blocks
 * value is used.  Otherwise a fresh fstat is requested asynchronously and
 * the function polls until it completes.  Returns the block count times
 * 512, or the negative task result on failure.
 */
743 static int64_t nfs_get_allocated_file_size(BlockDriverState *bs)
745 NFSClient *client = bs->opaque;
749 if (bdrv_is_read_only(bs) &&
750 !(bs->open_flags & BDRV_O_NOCACHE)) {
751 return client->st_blocks * 512;
756 if (nfs_fstat_async(client->context, client->fh, nfs_get_allocated_file_size_cb,
761 nfs_set_events(client);
762 BDRV_POLL_WHILE(bs, !task.complete);
764 return (task.ret < 0 ? task.ret : st.st_blocks * 512);
/*
 * .bdrv_truncate callback: resizes the open file to @offset bytes with
 * nfs_ftruncate().  A failure is reported through @errp as "Failed to
 * truncate file" with -ret as the errno value; the guarding condition and
 * return statements are not visible in this excerpt.
 */
767 static int nfs_file_truncate(BlockDriverState *bs, int64_t offset, Error **errp)
769 NFSClient *client = bs->opaque;
772 ret = nfs_ftruncate(client->context, client->fh, offset);
774 error_setg_errno(errp, -ret, "Failed to truncate file");
/*
 * .bdrv_reopen_prepare callback.  Rejects two transitions: read-only to
 * read-write, and enabling BDRV_O_NOCACHE while libnfs readahead or
 * pagecache is in use (client->cache_used).  For a reopen without
 * BDRV_O_RDWR the cached st_blocks value is refreshed with nfs_fstat().
 * Errors are reported through @errp.
 */
781 /* Note that this will not re-establish a connection with the NFS server
782 * - it is effectively a NOP. */
783 static int nfs_reopen_prepare(BDRVReopenState *state,
784 BlockReopenQueue *queue, Error **errp)
786 NFSClient *client = state->bs->opaque;
790 if (state->flags & BDRV_O_RDWR && bdrv_is_read_only(state->bs)) {
791 error_setg(errp, "Cannot open a read-only mount as read-write");
795 if ((state->flags & BDRV_O_NOCACHE) && client->cache_used) {
796 error_setg(errp, "Cannot disable cache if libnfs readahead or"
797 " pagecache is enabled");
801 /* Update cache for read-only reopens */
802 if (!(state->flags & BDRV_O_RDWR)) {
803 ret = nfs_fstat(client->context, client->fh, &st);
805 error_setg(errp, "Failed to fstat file: %s",
806 nfs_get_error(client->context));
809 client->st_blocks = st.st_blocks;
/*
 * .bdrv_refresh_filename callback: regenerates bs->exact_filename and
 * bs->full_open_options from the current client state.
 *
 * exact_filename is an nfs:// URI built from the server host and path, with
 * uid and/or gid appended as query parameters when they are non-zero.
 * full_open_options receives "driver", the visited "server" object, "path"
 * and the tuning values held in @client.
 *
 * The option keys emitted here must be the ones the driver accepts when
 * opening, i.e. the names used by runtime_opts and nfs_parse_uri().  The SYN
 * count was previously emitted as "tcp-syn-cnt", a key the driver does not
 * know; it is now "tcp-syn-count".
 */
815 static void nfs_refresh_filename(BlockDriverState *bs, QDict *options)
817 NFSClient *client = bs->opaque;
818 QDict *opts = qdict_new();
819 QObject *server_qdict;
822 qdict_put(opts, "driver", qstring_from_str("nfs"));
824 if (client->uid && !client->gid) {
825 snprintf(bs->exact_filename, sizeof(bs->exact_filename),
826 "nfs://%s%s?uid=%" PRId64, client->server->host, client->path,
828 } else if (!client->uid && client->gid) {
829 snprintf(bs->exact_filename, sizeof(bs->exact_filename),
830 "nfs://%s%s?gid=%" PRId64, client->server->host, client->path,
832 } else if (client->uid && client->gid) {
833 snprintf(bs->exact_filename, sizeof(bs->exact_filename),
834 "nfs://%s%s?uid=%" PRId64 "&gid=%" PRId64,
835 client->server->host, client->path, client->uid, client->gid);
837 snprintf(bs->exact_filename, sizeof(bs->exact_filename),
838 "nfs://%s%s", client->server->host, client->path);
/* Serialise the server address through the QAPI output visitor. */
841 ov = qobject_output_visitor_new(&server_qdict);
842 visit_type_NFSServer(ov, NULL, &client->server, &error_abort);
843 visit_complete(ov, &server_qdict);
844 qdict_put_obj(opts, "server", server_qdict);
845 qdict_put(opts, "path", qstring_from_str(client->path));
848 qdict_put(opts, "user", qint_from_int(client->uid));
851 qdict_put(opts, "group", qint_from_int(client->gid));
853 if (client->tcp_syncnt) {
/* Same key as runtime_opts / nfs_parse_uri(): "tcp-syn-count". */
854 qdict_put(opts, "tcp-syn-count",
855 qint_from_int(client->tcp_syncnt));
857 if (client->readahead) {
858 qdict_put(opts, "readahead-size",
859 qint_from_int(client->readahead));
861 if (client->pagecache) {
862 qdict_put(opts, "page-cache-size",
863 qint_from_int(client->pagecache));
866 qdict_put(opts, "debug", qint_from_int(client->debug));
871 bs->full_open_options = opts;
/*
 * .bdrv_invalidate_cache callback, compiled only when libnfs advertises
 * LIBNFS_FEATURE_PAGECACHE: asks libnfs to invalidate its page cache for
 * the open file handle.
 */
874 #ifdef LIBNFS_FEATURE_PAGECACHE
875 static void nfs_invalidate_cache(BlockDriverState *bs,
878 NFSClient *client = bs->opaque;
879 nfs_pagecache_invalidate(client->context, client->fh);
/*
 * Driver table for the "nfs" protocol, wiring the callbacks defined in this
 * file into the block layer.  Each driver instance gets sizeof(NFSClient)
 * bytes of state.  The cache invalidation hook is only present when libnfs
 * advertises LIBNFS_FEATURE_PAGECACHE.
 */
883 static BlockDriver bdrv_nfs = {
884 .format_name = "nfs",
885 .protocol_name = "nfs",
887 .instance_size = sizeof(NFSClient),
888 .bdrv_parse_filename = nfs_parse_filename,
889 .create_opts = &nfs_create_opts,
891 .bdrv_has_zero_init = nfs_has_zero_init,
892 .bdrv_get_allocated_file_size = nfs_get_allocated_file_size,
893 .bdrv_truncate = nfs_file_truncate,
895 .bdrv_file_open = nfs_file_open,
896 .bdrv_close = nfs_file_close,
897 .bdrv_create = nfs_file_create,
898 .bdrv_reopen_prepare = nfs_reopen_prepare,
900 .bdrv_co_preadv = nfs_co_preadv,
901 .bdrv_co_pwritev = nfs_co_pwritev,
902 .bdrv_co_flush_to_disk = nfs_co_flush,
904 .bdrv_detach_aio_context = nfs_detach_aio_context,
905 .bdrv_attach_aio_context = nfs_attach_aio_context,
906 .bdrv_refresh_filename = nfs_refresh_filename,
908 #ifdef LIBNFS_FEATURE_PAGECACHE
909 .bdrv_invalidate_cache = nfs_invalidate_cache,
/* Registers the NFS driver table with the block layer. */
913 static void nfs_block_init(void)
915 bdrv_register(&bdrv_nfs);
/* Hook nfs_block_init() into block-driver initialisation. */
918 block_init(nfs_block_init);