2 * QEMU block full disk encryption
4 * Copyright (c) 2015-2016 Red Hat, Inc.
6 * This library is free software; you can redistribute it and/or
7 * modify it under the terms of the GNU Lesser General Public
8 * License as published by the Free Software Foundation; either
9 * version 2 of the License, or (at your option) any later version.
11 * This library is distributed in the hope that it will be useful,
12 * but WITHOUT ANY WARRANTY; without even the implied warranty of
13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14 * Lesser General Public License for more details.
16 * You should have received a copy of the GNU Lesser General Public
17 * License along with this library; if not, see <http://www.gnu.org/licenses/>.
21 #include "qemu/osdep.h"
23 #include "block/block_int.h"
24 #include "block/qdict.h"
25 #include "sysemu/block-backend.h"
26 #include "crypto/block.h"
27 #include "qapi/opts-visitor.h"
28 #include "qapi/qapi-visit-crypto.h"
29 #include "qapi/qobject-input-visitor.h"
30 #include "qapi/error.h"
31 #include "qemu/module.h"
32 #include "qemu/option.h"
33 #include "qemu/cutils.h"
36 typedef struct BlockCrypto BlockCrypto;
/*
 * Generic probe helper: asks qcrypto_block_has_format() whether the
 * probe buffer (buf, buf_size) carries a header of @format.
 * NOTE(review): the values returned for a match / mismatch are not
 * visible in this excerpt.
 */
44 static int block_crypto_probe_generic(QCryptoBlockFormat format,
49 if (qcrypto_block_has_format(format, buf, buf_size)) {
/*
 * Header read callback given to the crypto layer (it is passed to
 * qcrypto_block_open() and qcrypto_block_amend_options() in this file).
 *
 * @opaque is the BlockDriverState; buflen bytes at @offset are read from
 * bs->file with bdrv_pread().  A read error is reported through @errp as
 * "Could not read encryption header" with the errno taken from -ret.
 * NOTE(review): the return statements are not visible in this excerpt.
 */
57 static ssize_t block_crypto_read_func(QCryptoBlock *block,
64 BlockDriverState *bs = opaque;
67 ret = bdrv_pread(bs->file, offset, buf, buflen);
69 error_setg_errno(errp, -ret, "Could not read encryption header");
/*
 * Header write callback given to the crypto layer (it is passed to
 * qcrypto_block_amend_options() in this file).
 *
 * @opaque is the BlockDriverState; buflen bytes are written at @offset
 * to bs->file with bdrv_pwrite().  A write error is reported through
 * @errp as "Could not write encryption header" with the errno taken
 * from -ret.
 * NOTE(review): the return statements are not visible in this excerpt.
 */
75 static ssize_t block_crypto_write_func(QCryptoBlock *block,
82 BlockDriverState *bs = opaque;
85 ret = bdrv_pwrite(bs->file, offset, buf, buflen);
87 error_setg_errno(errp, -ret, "Could not write encryption header");
/*
 * State handed as the opaque pointer to the image-creation callbacks
 * block_crypto_create_init_func() and block_crypto_create_write_func().
 * Those callbacks also read ->blk and ->size; only ->prealloc is visible
 * in this excerpt.
 */
94 struct BlockCryptoCreateData {
97 PreallocMode prealloc;
/*
 * Header write callback used while creating an image.
 *
 * @opaque is a struct BlockCryptoCreateData; the header bytes are written
 * through its BlockBackend with blk_pwrite().  A write error is reported
 * through @errp as "Could not write encryption header" with the errno
 * taken from -ret.
 */
101 static ssize_t block_crypto_create_write_func(QCryptoBlock *block,
108 struct BlockCryptoCreateData *data = opaque;
111 ret = blk_pwrite(data->blk, offset, buf, buflen, 0);
113 error_setg_errno(errp, -ret, "Could not write encryption header");
/*
 * Creation callback invoked once the header length is known.
 *
 * Checks that data->size + headerlen fits in INT64_MAX, then resizes the
 * image to data->size + headerlen with blk_truncate(), using the
 * requested preallocation mode, so that the size asked for by the user
 * remains fully available to the guest.
 *
 * A truncate failure is either rewritten to "The requested file size is
 * too large" or propagated unchanged.
 * NOTE(review): the condition that selects between the two is not
 * visible in this excerpt.
 */
119 static ssize_t block_crypto_create_init_func(QCryptoBlock *block,
124 struct BlockCryptoCreateData *data = opaque;
125 Error *local_error = NULL;
128 if (data->size > INT64_MAX || headerlen > INT64_MAX - data->size) {
133 /* User provided size should reflect amount of space made
134 * available to the guest, so we must take account of that
135 * which will be used by the crypto header
137 ret = blk_truncate(data->blk, data->size + headerlen, false,
138 data->prealloc, 0, &local_error);
146 /* Replace the error message with a better one */
147 error_free(local_error);
148 error_setg(errp, "The requested file size is too large");
150 error_propagate(errp, local_error);
/*
 * Options accepted when opening a LUKS image; only the key secret is
 * listed.  This list is passed to block_crypto_open_generic() by
 * block_crypto_open_luks().
 */
157 static QemuOptsList block_crypto_runtime_opts_luks = {
159 .head = QTAILQ_HEAD_INITIALIZER(block_crypto_runtime_opts_luks.head),
161 BLOCK_CRYPTO_OPT_DEF_LUKS_KEY_SECRET(""),
162 { /* end of list */ }
/*
 * Options accepted when creating a LUKS image: the virtual disk size
 * plus the LUKS key secret, cipher, IV generator, hash and iteration
 * time settings.  Also used as the filter when converting QemuOpts to a
 * QDict in the create and measure paths of this file.
 */
167 static QemuOptsList block_crypto_create_opts_luks = {
169 .head = QTAILQ_HEAD_INITIALIZER(block_crypto_create_opts_luks.head),
172 .name = BLOCK_OPT_SIZE,
173 .type = QEMU_OPT_SIZE,
174 .help = "Virtual disk size"
176 BLOCK_CRYPTO_OPT_DEF_LUKS_KEY_SECRET(""),
177 BLOCK_CRYPTO_OPT_DEF_LUKS_CIPHER_ALG(""),
178 BLOCK_CRYPTO_OPT_DEF_LUKS_CIPHER_MODE(""),
179 BLOCK_CRYPTO_OPT_DEF_LUKS_IVGEN_ALG(""),
180 BLOCK_CRYPTO_OPT_DEF_LUKS_IVGEN_HASH_ALG(""),
181 BLOCK_CRYPTO_OPT_DEF_LUKS_HASH_ALG(""),
182 BLOCK_CRYPTO_OPT_DEF_LUKS_ITER_TIME(""),
183 { /* end of list */ }
/*
 * Options accepted when amending an existing LUKS image: key slot state,
 * key slot number, old/new secret and iteration time.
 *
 * The list head must be initialised from this list's own head:
 * QTAILQ_HEAD_INITIALIZER() records the address of the head it is given,
 * so naming block_crypto_create_opts_luks here would make the empty
 * amend list point into the create list.
 */
188 static QemuOptsList block_crypto_amend_opts_luks = {
190 .head = QTAILQ_HEAD_INITIALIZER(block_crypto_amend_opts_luks.head),
192 BLOCK_CRYPTO_OPT_DEF_LUKS_STATE(""),
193 BLOCK_CRYPTO_OPT_DEF_LUKS_KEYSLOT(""),
194 BLOCK_CRYPTO_OPT_DEF_LUKS_OLD_SECRET(""),
195 BLOCK_CRYPTO_OPT_DEF_LUKS_NEW_SECRET(""),
196 BLOCK_CRYPTO_OPT_DEF_LUKS_ITER_TIME(""),
197 { /* end of list */ }
/*
 * Build a QCryptoBlockOpenOptions from the flat QDict @opts using a
 * QObject input visitor (qobject_input_visitor_new_flat_confused() +
 * visit_type_QCryptoBlockOpenOptions()).  Errors are reported via @errp.
 */
201 QCryptoBlockOpenOptions *
202 block_crypto_open_opts_init(QDict *opts, Error **errp)
205 QCryptoBlockOpenOptions *ret;
207 v = qobject_input_visitor_new_flat_confused(opts, errp);
212 visit_type_QCryptoBlockOpenOptions(v, NULL, &ret, errp);
/*
 * Build a QCryptoBlockCreateOptions from the flat QDict @opts using a
 * QObject input visitor (qobject_input_visitor_new_flat_confused() +
 * visit_type_QCryptoBlockCreateOptions()).  Errors are reported via
 * @errp.
 */
219 QCryptoBlockCreateOptions *
220 block_crypto_create_opts_init(QDict *opts, Error **errp)
223 QCryptoBlockCreateOptions *ret;
225 v = qobject_input_visitor_new_flat_confused(opts, errp);
230 visit_type_QCryptoBlockCreateOptions(v, NULL, &ret, errp);
/*
 * Build a QCryptoBlockAmendOptions from the flat QDict @opts using a
 * QObject input visitor (qobject_input_visitor_new_flat_confused() +
 * visit_type_QCryptoBlockAmendOptions()).  Errors are reported via
 * @errp.
 */
236 QCryptoBlockAmendOptions *
237 block_crypto_amend_opts_init(QDict *opts, Error **errp)
240 QCryptoBlockAmendOptions *ret;
242 v = qobject_input_visitor_new_flat_confused(opts, errp);
247 visit_type_QCryptoBlockAmendOptions(v, NULL, &ret, errp);
/*
 * Shared open path for crypto block drivers.
 *
 * - opens the "file" child of @bs;
 * - advertises BDRV_REQ_FUA as a supported write flag only if the child
 *   supports it;
 * - absorbs the options described by @opts_spec from the options dict,
 *   converts them to QCryptoBlockOpenOptions (with "format" set from
 *   @format) and opens the crypto block, using block_crypto_read_func()
 *   to read the header;
 * - maps BDRV_O_NO_IO in the open flags to QCRYPTO_BLOCK_OPEN_NO_IO.
 *
 * bs->encrypted is set once the crypto block exists.  The temporary
 * QDict and the open options are released at the end of the function.
 */
254 static int block_crypto_open_generic(QCryptoBlockFormat format,
255 QemuOptsList *opts_spec,
256 BlockDriverState *bs,
261 BlockCrypto *crypto = bs->opaque;
262 QemuOpts *opts = NULL;
263 Error *local_err = NULL;
265 QCryptoBlockOpenOptions *open_opts = NULL;
266 unsigned int cflags = 0;
267 QDict *cryptoopts = NULL;
269 bs->file = bdrv_open_child(NULL, options, "file", bs, &child_of_bds,
270 BDRV_CHILD_IMAGE, false, errp);
275 bs->supported_write_flags = BDRV_REQ_FUA &
276 bs->file->bs->supported_write_flags;
278 opts = qemu_opts_create(opts_spec, NULL, 0, &error_abort);
279 qemu_opts_absorb_qdict(opts, options, &local_err);
281 error_propagate(errp, local_err);
285 cryptoopts = qemu_opts_to_qdict(opts, NULL);
286 qdict_put_str(cryptoopts, "format", QCryptoBlockFormat_str(format));
288 open_opts = block_crypto_open_opts_init(cryptoopts, errp);
293 if (flags & BDRV_O_NO_IO) {
294 cflags |= QCRYPTO_BLOCK_OPEN_NO_IO;
296 crypto->block = qcrypto_block_open(open_opts, NULL,
297 block_crypto_read_func,
303 if (!crypto->block) {
308 bs->encrypted = true;
312 qobject_unref(cryptoopts);
313 qapi_free_QCryptoBlockOpenOptions(open_opts);
/*
 * Write the crypto format layer onto the already opened node @bs.
 *
 * A BlockBackend with write and resize permissions is attached to @bs.
 * PREALLOC_MODE_METADATA is downgraded to PREALLOC_MODE_OFF before the
 * mode is stored in the callback data.  qcrypto_block_create() then
 * drives block_crypto_create_init_func() (sizing) and
 * block_crypto_create_write_func() (header output).  The QCryptoBlock
 * created for this purpose is freed before returning.
 */
318 static int block_crypto_co_create_generic(BlockDriverState *bs,
320 QCryptoBlockCreateOptions *opts,
321 PreallocMode prealloc,
326 QCryptoBlock *crypto = NULL;
327 struct BlockCryptoCreateData data;
329 blk = blk_new_with_bs(bs, BLK_PERM_WRITE | BLK_PERM_RESIZE, BLK_PERM_ALL,
336 if (prealloc == PREALLOC_MODE_METADATA) {
337 prealloc = PREALLOC_MODE_OFF;
340 data = (struct BlockCryptoCreateData) {
343 .prealloc = prealloc,
346 crypto = qcrypto_block_create(opts, NULL,
347 block_crypto_create_init_func,
348 block_crypto_create_write_func,
359 qcrypto_block_free(crypto);
/*
 * Resize the image so that the guest-visible payload is @offset bytes.
 *
 * The payload offset reported by the crypto layer is added to @offset
 * and the underlying file is truncated to that total.  If the sum would
 * exceed INT64_MAX, @errp is set to "The requested file size is too
 * large".
 *
 * Note: @flags is not forwarded; bdrv_co_truncate() on the child is
 * called with request flags 0.
 */
364 static int coroutine_fn
365 block_crypto_co_truncate(BlockDriverState *bs, int64_t offset, bool exact,
366 PreallocMode prealloc, BdrvRequestFlags flags,
369 BlockCrypto *crypto = bs->opaque;
370 uint64_t payload_offset =
371 qcrypto_block_get_payload_offset(crypto->block);
373 if (payload_offset > INT64_MAX - offset) {
374 error_setg(errp, "The requested file size is too large");
378 offset += payload_offset;
380 return bdrv_co_truncate(bs->file, offset, exact, prealloc, 0, errp);
383 static void block_crypto_close(BlockDriverState *bs)
385 BlockCrypto *crypto = bs->opaque;
386 qcrypto_block_free(crypto->block);
389 static int block_crypto_reopen_prepare(BDRVReopenState *state,
390 BlockReopenQueue *queue, Error **errp)
392 /* nothing needs checking */
397 * 1 MB bounce buffer gives good performance / memory tradeoff
398 * when using cache=none|directsync.
400 #define BLOCK_CRYPTO_MAX_IO_SIZE (1024 * 1024)
/*
 * Read and decrypt @bytes bytes starting at guest offset @offset.
 *
 * @offset and @bytes must be multiples of the crypto sector size
 * (asserted).  Cipher text is read from bs->file at
 * payload_offset + offset into a bounce buffer, at most
 * BLOCK_CRYPTO_MAX_IO_SIZE bytes per iteration, decrypted in place with
 * qcrypto_block_decrypt() and then copied into @qiov at the matching
 * position.  The temporary iovec and the bounce buffer are released at
 * the end.
 */
402 static coroutine_fn int
403 block_crypto_co_preadv(BlockDriverState *bs, uint64_t offset, uint64_t bytes,
404 QEMUIOVector *qiov, int flags)
406 BlockCrypto *crypto = bs->opaque;
407 uint64_t cur_bytes; /* number of bytes in current iteration */
408 uint64_t bytes_done = 0;
409 uint8_t *cipher_data = NULL;
410 QEMUIOVector hd_qiov;
412 uint64_t sector_size = qcrypto_block_get_sector_size(crypto->block);
413 uint64_t payload_offset = qcrypto_block_get_payload_offset(crypto->block);
416 assert(payload_offset < INT64_MAX);
417 assert(QEMU_IS_ALIGNED(offset, sector_size));
418 assert(QEMU_IS_ALIGNED(bytes, sector_size));
420 qemu_iovec_init(&hd_qiov, qiov->niov);
422 /* Bounce buffer because we don't wish to expose cipher text
423 * in qiov which points to guest memory.
426 qemu_try_blockalign(bs->file->bs, MIN(BLOCK_CRYPTO_MAX_IO_SIZE,
428 if (cipher_data == NULL) {
434 cur_bytes = MIN(bytes, BLOCK_CRYPTO_MAX_IO_SIZE);
436 qemu_iovec_reset(&hd_qiov);
437 qemu_iovec_add(&hd_qiov, cipher_data, cur_bytes);
439 ret = bdrv_co_preadv(bs->file, payload_offset + offset + bytes_done,
440 cur_bytes, &hd_qiov, 0);
445 if (qcrypto_block_decrypt(crypto->block, offset + bytes_done,
446 cipher_data, cur_bytes, NULL) < 0) {
451 qemu_iovec_from_buf(qiov, bytes_done, cipher_data, cur_bytes);
454 bytes_done += cur_bytes;
458 qemu_iovec_destroy(&hd_qiov);
459 qemu_vfree(cipher_data);
/*
 * Encrypt and write @bytes bytes starting at guest offset @offset.
 *
 * @offset and @bytes must be multiples of the crypto sector size and
 * @flags may contain nothing but BDRV_REQ_FUA (all asserted).  Plain
 * text is copied out of @qiov into a bounce buffer, at most
 * BLOCK_CRYPTO_MAX_IO_SIZE bytes per iteration, encrypted in place with
 * qcrypto_block_encrypt() and written to bs->file at
 * payload_offset + offset, forwarding @flags.  The temporary iovec and
 * the bounce buffer are released at the end.
 */
465 static coroutine_fn int
466 block_crypto_co_pwritev(BlockDriverState *bs, uint64_t offset, uint64_t bytes,
467 QEMUIOVector *qiov, int flags)
469 BlockCrypto *crypto = bs->opaque;
470 uint64_t cur_bytes; /* number of bytes in current iteration */
471 uint64_t bytes_done = 0;
472 uint8_t *cipher_data = NULL;
473 QEMUIOVector hd_qiov;
475 uint64_t sector_size = qcrypto_block_get_sector_size(crypto->block);
476 uint64_t payload_offset = qcrypto_block_get_payload_offset(crypto->block);
478 assert(!(flags & ~BDRV_REQ_FUA));
479 assert(payload_offset < INT64_MAX);
480 assert(QEMU_IS_ALIGNED(offset, sector_size));
481 assert(QEMU_IS_ALIGNED(bytes, sector_size));
483 qemu_iovec_init(&hd_qiov, qiov->niov);
485 /* Bounce buffer because we're not permitted to touch
486 * contents of qiov - it points to guest memory.
489 qemu_try_blockalign(bs->file->bs, MIN(BLOCK_CRYPTO_MAX_IO_SIZE,
491 if (cipher_data == NULL) {
497 cur_bytes = MIN(bytes, BLOCK_CRYPTO_MAX_IO_SIZE);
499 qemu_iovec_to_buf(qiov, bytes_done, cipher_data, cur_bytes);
501 if (qcrypto_block_encrypt(crypto->block, offset + bytes_done,
502 cipher_data, cur_bytes, NULL) < 0) {
507 qemu_iovec_reset(&hd_qiov);
508 qemu_iovec_add(&hd_qiov, cipher_data, cur_bytes);
510 ret = bdrv_co_pwritev(bs->file, payload_offset + offset + bytes_done,
511 cur_bytes, &hd_qiov, flags);
517 bytes_done += cur_bytes;
521 qemu_iovec_destroy(&hd_qiov);
522 qemu_vfree(cipher_data);
/*
 * Set the request alignment of @bs to the crypto sector size, so that
 * the read/write paths only ever see whole sectors.
 */
527 static void block_crypto_refresh_limits(BlockDriverState *bs, Error **errp)
529 BlockCrypto *crypto = bs->opaque;
530 uint64_t sector_size = qcrypto_block_get_sector_size(crypto->block);
531 bs->bl.request_alignment = sector_size; /* No sub-sector I/O */
/*
 * Report the length of the image as seen through the crypto layer.
 * Reads the length of the underlying file and the crypto payload offset.
 * NOTE(review): how the two are combined is not visible in this
 * excerpt; presumably the payload offset is subtracted - verify.
 */
535 static int64_t block_crypto_getlength(BlockDriverState *bs)
537 BlockCrypto *crypto = bs->opaque;
538 int64_t len = bdrv_getlength(bs->file->bs);
540 uint64_t offset = qcrypto_block_get_payload_offset(crypto->block);
541 assert(offset < INT64_MAX);
/*
 * Compute the file size needed for a LUKS image.
 *
 * The preallocation option is consumed and discarded.  The virtual size
 * comes from BLOCK_OPT_SIZE; the length of @in_bs is also queried, and a
 * failure there is reported as "Unable to get image virtual_size".
 * NOTE(review): the condition choosing between the two size sources is
 * not visible in this excerpt.
 *
 * The remaining creation options are converted to
 * QCryptoBlockCreateOptions (format "luks") and used to calculate the
 * LUKS payload offset.  Both ->required and ->fully_allocated are set to
 * payload offset + size.  Errors are propagated through @errp.
 */
553 static BlockMeasureInfo *block_crypto_measure(QemuOpts *opts,
554 BlockDriverState *in_bs,
557 g_autoptr(QCryptoBlockCreateOptions) create_opts = NULL;
558 Error *local_err = NULL;
559 BlockMeasureInfo *info;
561 size_t luks_payload_size;
565 * Preallocation mode doesn't affect size requirements but we must consume
568 g_free(qemu_opt_get_del(opts, BLOCK_OPT_PREALLOC));
570 size = qemu_opt_get_size_del(opts, BLOCK_OPT_SIZE, 0);
573 int64_t ssize = bdrv_getlength(in_bs);
576 error_setg_errno(&local_err, -ssize,
577 "Unable to get image virtual_size");
584 cryptoopts = qemu_opts_to_qdict_filtered(opts, NULL,
585 &block_crypto_create_opts_luks, true);
586 qdict_put_str(cryptoopts, "format", "luks");
587 create_opts = block_crypto_create_opts_init(cryptoopts, &local_err);
588 qobject_unref(cryptoopts);
593 if (!qcrypto_block_calculate_payload_offset(create_opts, NULL,
600 * Unallocated blocks are still encrypted so allocation status makes no
601 * difference to the file size.
603 info = g_new0(BlockMeasureInfo, 1);
604 info->fully_allocated = luks_payload_size + size;
605 info->required = luks_payload_size + size;
609 error_propagate(errp, local_err);
/*
 * LUKS probe entry point: delegates to block_crypto_probe_generic() with
 * Q_CRYPTO_BLOCK_FORMAT_LUKS.
 */
614 static int block_crypto_probe_luks(const uint8_t *buf,
616 const char *filename) {
617 return block_crypto_probe_generic(Q_CRYPTO_BLOCK_FORMAT_LUKS,
618 buf, buf_size, filename);
/*
 * LUKS open entry point: delegates to block_crypto_open_generic() with
 * Q_CRYPTO_BLOCK_FORMAT_LUKS and the LUKS runtime option list.
 */
621 static int block_crypto_open_luks(BlockDriverState *bs,
626 return block_crypto_open_generic(Q_CRYPTO_BLOCK_FORMAT_LUKS,
627 &block_crypto_runtime_opts_luks,
628 bs, options, flags, errp);
/*
 * Create a LUKS image from QAPI BlockdevCreateOptions.
 *
 * @create_options must be for the LUKS driver (asserted).  The target
 * node is opened from luks_opts->file, the LUKS base options are copied
 * into a QCryptoBlockCreateOptions, and the preallocation mode defaults
 * to PREALLOC_MODE_OFF unless given.  The actual work is done by
 * block_crypto_co_create_generic().
 */
631 static int coroutine_fn
632 block_crypto_co_create_luks(BlockdevCreateOptions *create_options, Error **errp)
634 BlockdevCreateOptionsLUKS *luks_opts;
635 BlockDriverState *bs = NULL;
636 QCryptoBlockCreateOptions create_opts;
637 PreallocMode preallocation = PREALLOC_MODE_OFF;
640 assert(create_options->driver == BLOCKDEV_DRIVER_LUKS);
641 luks_opts = &create_options->u.luks;
643 bs = bdrv_open_blockdev_ref(luks_opts->file, errp);
648 create_opts = (QCryptoBlockCreateOptions) {
649 .format = Q_CRYPTO_BLOCK_FORMAT_LUKS,
650 .u.luks = *qapi_BlockdevCreateOptionsLUKS_base(luks_opts),
653 if (luks_opts->has_preallocation) {
654 preallocation = luks_opts->preallocation;
657 ret = block_crypto_co_create_generic(bs, luks_opts->size, &create_opts,
658 preallocation, errp);
/*
 * Create a LUKS image from legacy QemuOpts.
 *
 * Steps visible here:
 *  - take the size and preallocation mode out of @opts (the mode
 *    defaults to PREALLOC_MODE_OFF);
 *  - convert the remaining LUKS options to QCryptoBlockCreateOptions;
 *  - create the protocol-level file, open it read/write and resizable;
 *  - write the format layer via block_crypto_co_create_generic().
 *
 * On failure the file is deleted with bdrv_co_delete_file(); a deletion
 * error other than -ENOTSUP is reported with error_report_err().  The
 * create options and the temporary QDict are released at the end.
 */
669 static int coroutine_fn block_crypto_co_create_opts_luks(BlockDriver *drv,
670 const char *filename,
674 QCryptoBlockCreateOptions *create_opts = NULL;
675 BlockDriverState *bs = NULL;
677 PreallocMode prealloc;
681 Error *local_err = NULL;
684 size = qemu_opt_get_size_del(opts, BLOCK_OPT_SIZE, 0);
686 buf = qemu_opt_get_del(opts, BLOCK_OPT_PREALLOC);
687 prealloc = qapi_enum_parse(&PreallocMode_lookup, buf,
688 PREALLOC_MODE_OFF, &local_err);
691 error_propagate(errp, local_err);
695 cryptoopts = qemu_opts_to_qdict_filtered(opts, NULL,
696 &block_crypto_create_opts_luks,
699 qdict_put_str(cryptoopts, "format", "luks");
700 create_opts = block_crypto_create_opts_init(cryptoopts, errp);
706 /* Create protocol layer */
707 ret = bdrv_create_file(filename, opts, errp);
712 bs = bdrv_open(filename, NULL, NULL,
713 BDRV_O_RDWR | BDRV_O_RESIZE | BDRV_O_PROTOCOL, errp);
719 /* Create format layer */
720 ret = block_crypto_co_create_generic(bs, size, create_opts, prealloc, errp);
728 * If an error occurred, delete 'filename'. Even if the file existed
729 * beforehand, it has been truncated and corrupted in the process.
732 Error *local_delete_err = NULL;
733 int r_del = bdrv_co_delete_file(bs, &local_delete_err);
735 * ENOTSUP will happen if the block driver doesn't support
736 * the 'bdrv_co_delete_file' interface. This is a predictable
737 * scenario and shouldn't be reported back to the user.
739 if ((r_del < 0) && (r_del != -ENOTSUP)) {
740 error_report_err(local_delete_err);
745 qapi_free_QCryptoBlockCreateOptions(create_opts);
746 qobject_unref(cryptoopts);
/*
 * Fill @bdi from the underlying file: the child's BlockDriverInfo is
 * queried with bdrv_get_info() and its cluster_size is copied.
 */
750 static int block_crypto_get_info_luks(BlockDriverState *bs,
751 BlockDriverInfo *bdi)
753 BlockDriverInfo subbdi;
756 ret = bdrv_get_info(bs->file->bs, &subbdi);
761 bdi->cluster_size = subbdi.cluster_size;
/*
 * Return LUKS-specific image information.
 *
 * The crypto layer's info (which must be of LUKS format, asserted) is
 * moved into a freshly allocated ImageInfoSpecific of kind LUKS.  The
 * LUKS payload is copied by value and then zeroed in the source, so that
 * freeing the source does not also free pointers now owned by the
 * result.
 */
766 static ImageInfoSpecific *
767 block_crypto_get_specific_info_luks(BlockDriverState *bs, Error **errp)
769 BlockCrypto *crypto = bs->opaque;
770 ImageInfoSpecific *spec_info;
771 QCryptoBlockInfo *info;
773 info = qcrypto_block_get_info(crypto->block, errp);
777 assert(info->format == Q_CRYPTO_BLOCK_FORMAT_LUKS);
779 spec_info = g_new(ImageInfoSpecific, 1);
780 spec_info->type = IMAGE_INFO_SPECIFIC_KIND_LUKS;
781 spec_info->u.luks.data = g_new(QCryptoBlockInfoLUKS, 1);
782 *spec_info->u.luks.data = info->u.luks;
784 /* Blank out pointers we've just stolen to avoid double free */
785 memset(&info->u.luks, 0, sizeof(info->u.luks));
787 qapi_free_QCryptoBlockInfo(info);
/*
 * Common implementation of LUKS key amendment.
 *
 * Sets crypto->updating_keys and refreshes the permissions on bs->file
 * so that block_crypto_child_perms() can request exclusive access, runs
 * qcrypto_block_amend_options() with the header read/write callbacks,
 * then clears the flag and refreshes the permissions again.
 *
 * Errors from acquiring the permissions or from the amend operation are
 * reported through the caller's Error pointer.
 */
793 block_crypto_amend_options_generic_luks(BlockDriverState *bs,
794 QCryptoBlockAmendOptions *amend_options,
798 BlockCrypto *crypto = bs->opaque;
802 assert(crypto->block);
804 /* apply for exclusive read/write permissions to the underlying file */
805 crypto->updating_keys = true;
806 ret = bdrv_child_refresh_perms(bs, bs->file, errp);
811 ret = qcrypto_block_amend_options(crypto->block,
812 block_crypto_read_func,
813 block_crypto_write_func,
819 /* release exclusive read/write permissions to the underlying file */
820 crypto->updating_keys = false;
/*
 * Do not reuse errp here: it may already carry the error of a failed
 * step above, and an Error object must not be set twice.  Giving
 * permissions back is not expected to fail, so abort if it does.
 */
821 bdrv_child_refresh_perms(bs, bs->file, &error_abort);
/*
 * Amend entry point for legacy QemuOpts.
 *
 * Requires an open crypto block (asserted).  @opts is converted to a
 * QDict, tagged with format "luks" and parsed into
 * QCryptoBlockAmendOptions; the work is then done by
 * block_crypto_amend_options_generic_luks().  The parsed options are
 * freed afterwards.
 */
826 block_crypto_amend_options_luks(BlockDriverState *bs,
828 BlockDriverAmendStatusCB *status_cb,
833 BlockCrypto *crypto = bs->opaque;
834 QDict *cryptoopts = NULL;
835 QCryptoBlockAmendOptions *amend_options = NULL;
839 assert(crypto->block);
841 cryptoopts = qemu_opts_to_qdict(opts, NULL);
842 qdict_put_str(cryptoopts, "format", "luks");
843 amend_options = block_crypto_amend_opts_init(cryptoopts, errp);
844 qobject_unref(cryptoopts);
845 if (!amend_options) {
848 ret = block_crypto_amend_options_generic_luks(bs, amend_options,
851 qapi_free_QCryptoBlockAmendOptions(amend_options);
/*
 * Amend entry point for QAPI BlockdevAmendOptions: copies the LUKS base
 * options into a QCryptoBlockAmendOptions on the stack and delegates to
 * block_crypto_amend_options_generic_luks().
 */
856 coroutine_fn block_crypto_co_amend_luks(BlockDriverState *bs,
857 BlockdevAmendOptions *opts,
861 QCryptoBlockAmendOptions amend_opts;
863 amend_opts = (QCryptoBlockAmendOptions) {
864 .format = Q_CRYPTO_BLOCK_FORMAT_LUKS,
865 .u.luks = *qapi_BlockdevAmendOptionsLUKS_base(&opts->u.luks),
867 return block_crypto_amend_options_generic_luks(bs, &amend_opts,
872 block_crypto_child_perms(BlockDriverState *bs, BdrvChild *c,
873 const BdrvChildRole role,
874 BlockReopenQueue *reopen_queue,
875 uint64_t perm, uint64_t shared,
876 uint64_t *nperm, uint64_t *nshared)
879 BlockCrypto *crypto = bs->opaque;
881 bdrv_default_perms(bs, c, role, reopen_queue, perm, shared, nperm, nshared);
884 * For backward compatibility, manually share the write
885 * and resize permission
887 *nshared |= (BLK_PERM_WRITE | BLK_PERM_RESIZE);
889 * Since we are not fully a format driver, don't always request
890 * the write/resize permission but only when explicitly
893 *nperm &= ~(BLK_PERM_WRITE | BLK_PERM_RESIZE);
894 *nperm |= perm & (BLK_PERM_WRITE | BLK_PERM_RESIZE);
897 * This driver doesn't modify LUKS metadata except
898 * when updating the encryption slots.
899 * Thus unlike a proper format driver we don't ask for
900 * shared write/read permission. However we need it
901 * when we are updating the keys, to ensure that only we
902 * have access to the device.
904 * Encryption update will set the crypto->updating_keys
905 * during that period and refresh permissions
908 if (crypto->updating_keys) {
909 /* need exclusive write access for header update */
910 *nperm |= BLK_PERM_WRITE;
911 /* unshare read and write permission */
912 *nshared &= ~(BLK_PERM_CONSISTENT_READ | BLK_PERM_WRITE);
917 static const char *const block_crypto_strong_runtime_opts[] = {
918 BLOCK_CRYPTO_OPT_LUKS_KEY_SECRET,
/*
 * BlockDriver description for the "luks" format.  Wires up the probe,
 * open/close, create, truncate, I/O, measure, info and amend callbacks
 * defined in this file; the per-node state is a BlockCrypto.
 */
923 static BlockDriver bdrv_crypto_luks = {
924 .format_name = "luks",
925 .instance_size = sizeof(BlockCrypto),
926 .bdrv_probe = block_crypto_probe_luks,
927 .bdrv_open = block_crypto_open_luks,
928 .bdrv_close = block_crypto_close,
929 .bdrv_child_perm = block_crypto_child_perms,
930 .bdrv_co_create = block_crypto_co_create_luks,
931 .bdrv_co_create_opts = block_crypto_co_create_opts_luks,
932 .bdrv_co_truncate = block_crypto_co_truncate,
933 .create_opts = &block_crypto_create_opts_luks,
934 .amend_opts = &block_crypto_amend_opts_luks,
936 .bdrv_reopen_prepare = block_crypto_reopen_prepare,
937 .bdrv_refresh_limits = block_crypto_refresh_limits,
938 .bdrv_co_preadv = block_crypto_co_preadv,
939 .bdrv_co_pwritev = block_crypto_co_pwritev,
940 .bdrv_getlength = block_crypto_getlength,
941 .bdrv_measure = block_crypto_measure,
942 .bdrv_get_info = block_crypto_get_info_luks,
943 .bdrv_get_specific_info = block_crypto_get_specific_info_luks,
944 .bdrv_amend_options = block_crypto_amend_options_luks,
945 .bdrv_co_amend = block_crypto_co_amend_luks,
949 .strong_runtime_opts = block_crypto_strong_runtime_opts,
/*
 * Module initialiser: registers the "luks" block driver.  Hooked up
 * through block_init().
 */
952 static void block_crypto_init(void)
954 bdrv_register(&bdrv_crypto_luks);
957 block_init(block_crypto_init);