]>
Commit | Line | Data |
---|---|---|
2e6fc7eb | 1 | /* BlockDriver implementation for "raw" format driver |
e1c66c6d | 2 | * |
ad82be2f | 3 | * Copyright (C) 2010-2016 Red Hat, Inc. |
ff369a48 | 4 | * Copyright (C) 2010, Blue Swirl <[email protected]> |
775d6afd | 5 | * Copyright (C) 2009, Anthony Liguori <[email protected]> |
e1c66c6d LE |
6 | * |
7 | * Author: | |
8 | * Laszlo Ersek <[email protected]> | |
9 | * | |
10 | * Permission is hereby granted, free of charge, to any person obtaining a copy | |
11 | * of this software and associated documentation files (the "Software"), to | |
12 | * deal in the Software without restriction, including without limitation the | |
13 | * rights to use, copy, modify, merge, publish, distribute, sublicense, and/or | |
14 | * sell copies of the Software, and to permit persons to whom the Software is | |
15 | * furnished to do so, subject to the following conditions: | |
16 | * | |
17 | * The above copyright notice and this permission notice shall be included in | |
18 | * all copies or substantial portions of the Software. | |
19 | * | |
20 | * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR | |
21 | * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, | |
22 | * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE | |
23 | * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER | |
24 | * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING | |
25 | * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS | |
26 | * IN THE SOFTWARE. | |
27 | */ | |
28 | ||
80c71a24 | 29 | #include "qemu/osdep.h" |
e1c66c6d | 30 | #include "block/block_int.h" |
da34e65c | 31 | #include "qapi/error.h" |
ff369a48 LE |
32 | #include "qemu/option.h" |
33 | ||
2fdc7045 TG |
/* Per-node state of the "raw" format driver. */
typedef struct BDRVRawState {
    /* Byte offset added to every request before it reaches the file below */
    uint64_t offset;
    /* Length in bytes of the window exposed on top of the underlying file */
    uint64_t size;
    /* True when "size" was given as an option instead of being derived */
    bool has_size;
} BDRVRawState;
39 | ||
40 | static QemuOptsList raw_runtime_opts = { | |
41 | .name = "raw", | |
42 | .head = QTAILQ_HEAD_INITIALIZER(raw_runtime_opts.head), | |
43 | .desc = { | |
44 | { | |
45 | .name = "offset", | |
46 | .type = QEMU_OPT_SIZE, | |
47 | .help = "offset in the disk where the image starts", | |
48 | }, | |
49 | { | |
50 | .name = "size", | |
51 | .type = QEMU_OPT_SIZE, | |
52 | .help = "virtual disk size", | |
53 | }, | |
54 | { /* end of list */ } | |
55 | }, | |
56 | }; | |
57 | ||
cd3a4cf6 CL |
58 | static QemuOptsList raw_create_opts = { |
59 | .name = "raw-create-opts", | |
60 | .head = QTAILQ_HEAD_INITIALIZER(raw_create_opts.head), | |
61 | .desc = { | |
62 | { | |
63 | .name = BLOCK_OPT_SIZE, | |
64 | .type = QEMU_OPT_SIZE, | |
65 | .help = "Virtual disk size" | |
66 | }, | |
67 | { /* end of list */ } | |
68 | } | |
ff369a48 | 69 | }; |
e1c66c6d | 70 | |
2fdc7045 TG |
71 | static int raw_read_options(QDict *options, BlockDriverState *bs, |
72 | BDRVRawState *s, Error **errp) | |
73 | { | |
74 | Error *local_err = NULL; | |
75 | QemuOpts *opts = NULL; | |
76 | int64_t real_size = 0; | |
77 | int ret; | |
78 | ||
79 | real_size = bdrv_getlength(bs->file->bs); | |
80 | if (real_size < 0) { | |
81 | error_setg_errno(errp, -real_size, "Could not get image size"); | |
82 | return real_size; | |
83 | } | |
84 | ||
85 | opts = qemu_opts_create(&raw_runtime_opts, NULL, 0, &error_abort); | |
86 | qemu_opts_absorb_qdict(opts, options, &local_err); | |
87 | if (local_err) { | |
88 | error_propagate(errp, local_err); | |
89 | ret = -EINVAL; | |
90 | goto end; | |
91 | } | |
92 | ||
93 | s->offset = qemu_opt_get_size(opts, "offset", 0); | |
40332872 TG |
94 | if (s->offset > real_size) { |
95 | error_setg(errp, "Offset (%" PRIu64 ") cannot be greater than " | |
96 | "size of the containing file (%" PRId64 ")", | |
97 | s->offset, real_size); | |
98 | ret = -EINVAL; | |
99 | goto end; | |
100 | } | |
101 | ||
2fdc7045 TG |
102 | if (qemu_opt_find(opts, "size") != NULL) { |
103 | s->size = qemu_opt_get_size(opts, "size", 0); | |
104 | s->has_size = true; | |
105 | } else { | |
106 | s->has_size = false; | |
107 | s->size = real_size - s->offset; | |
108 | } | |
109 | ||
110 | /* Check size and offset */ | |
40332872 | 111 | if ((real_size - s->offset) < s->size) { |
2fdc7045 TG |
112 | error_setg(errp, "The sum of offset (%" PRIu64 ") and size " |
113 | "(%" PRIu64 ") has to be smaller or equal to the " | |
114 | " actual size of the containing file (%" PRId64 ")", | |
115 | s->offset, s->size, real_size); | |
116 | ret = -EINVAL; | |
117 | goto end; | |
118 | } | |
119 | ||
120 | /* Make sure size is multiple of BDRV_SECTOR_SIZE to prevent rounding | |
121 | * up and leaking out of the specified area. */ | |
80a15e3e | 122 | if (s->has_size && !QEMU_IS_ALIGNED(s->size, BDRV_SECTOR_SIZE)) { |
2fdc7045 TG |
123 | error_setg(errp, "Specified size is not multiple of %llu", |
124 | BDRV_SECTOR_SIZE); | |
125 | ret = -EINVAL; | |
126 | goto end; | |
127 | } | |
128 | ||
129 | ret = 0; | |
130 | ||
131 | end: | |
132 | ||
133 | qemu_opts_del(opts); | |
134 | ||
135 | return ret; | |
136 | } | |
137 | ||
7a6d3fc5 LE |
138 | static int raw_reopen_prepare(BDRVReopenState *reopen_state, |
139 | BlockReopenQueue *queue, Error **errp) | |
e1c66c6d | 140 | { |
2fdc7045 TG |
141 | assert(reopen_state != NULL); |
142 | assert(reopen_state->bs != NULL); | |
143 | ||
144 | reopen_state->opaque = g_new0(BDRVRawState, 1); | |
145 | ||
146 | return raw_read_options( | |
147 | reopen_state->options, | |
148 | reopen_state->bs, | |
149 | reopen_state->opaque, | |
150 | errp); | |
151 | } | |
152 | ||
153 | static void raw_reopen_commit(BDRVReopenState *state) | |
154 | { | |
155 | BDRVRawState *new_s = state->opaque; | |
156 | BDRVRawState *s = state->bs->opaque; | |
157 | ||
158 | memcpy(s, new_s, sizeof(BDRVRawState)); | |
159 | ||
160 | g_free(state->opaque); | |
161 | state->opaque = NULL; | |
162 | } | |
163 | ||
164 | static void raw_reopen_abort(BDRVReopenState *state) | |
165 | { | |
166 | g_free(state->opaque); | |
167 | state->opaque = NULL; | |
e1c66c6d LE |
168 | } |
169 | ||
decaeed7 EB |
170 | static int coroutine_fn raw_co_preadv(BlockDriverState *bs, uint64_t offset, |
171 | uint64_t bytes, QEMUIOVector *qiov, | |
172 | int flags) | |
e1c66c6d | 173 | { |
2fdc7045 TG |
174 | BDRVRawState *s = bs->opaque; |
175 | ||
176 | if (offset > UINT64_MAX - s->offset) { | |
177 | return -EINVAL; | |
178 | } | |
179 | offset += s->offset; | |
180 | ||
9eaafd90 | 181 | BLKDBG_EVENT(bs->file, BLKDBG_READ_AIO); |
decaeed7 | 182 | return bdrv_co_preadv(bs->file, offset, bytes, qiov, flags); |
e1c66c6d LE |
183 | } |
184 | ||
decaeed7 EB |
185 | static int coroutine_fn raw_co_pwritev(BlockDriverState *bs, uint64_t offset, |
186 | uint64_t bytes, QEMUIOVector *qiov, | |
187 | int flags) | |
e1c66c6d | 188 | { |
2fdc7045 | 189 | BDRVRawState *s = bs->opaque; |
38f3ef57 KW |
190 | void *buf = NULL; |
191 | BlockDriver *drv; | |
192 | QEMUIOVector local_qiov; | |
193 | int ret; | |
194 | ||
2fdc7045 TG |
195 | if (s->has_size && (offset > s->size || bytes > (s->size - offset))) { |
196 | /* There's not enough space for the data. Don't write anything and just | |
197 | * fail to prevent leaking out of the size specified in options. */ | |
198 | return -ENOSPC; | |
199 | } | |
200 | ||
201 | if (offset > UINT64_MAX - s->offset) { | |
202 | ret = -EINVAL; | |
203 | goto fail; | |
204 | } | |
205 | ||
decaeed7 EB |
206 | if (bs->probed && offset < BLOCK_PROBE_BUF_SIZE && bytes) { |
207 | /* Handling partial writes would be a pain - so we just | |
208 | * require that guests have 512-byte request alignment if | |
209 | * probing occurred */ | |
38f3ef57 KW |
210 | QEMU_BUILD_BUG_ON(BLOCK_PROBE_BUF_SIZE != 512); |
211 | QEMU_BUILD_BUG_ON(BDRV_SECTOR_SIZE != 512); | |
decaeed7 | 212 | assert(offset == 0 && bytes >= BLOCK_PROBE_BUF_SIZE); |
38f3ef57 | 213 | |
9a4f4c31 | 214 | buf = qemu_try_blockalign(bs->file->bs, 512); |
38f3ef57 KW |
215 | if (!buf) { |
216 | ret = -ENOMEM; | |
217 | goto fail; | |
218 | } | |
219 | ||
220 | ret = qemu_iovec_to_buf(qiov, 0, buf, 512); | |
221 | if (ret != 512) { | |
222 | ret = -EINVAL; | |
223 | goto fail; | |
224 | } | |
225 | ||
226 | drv = bdrv_probe_all(buf, 512, NULL); | |
227 | if (drv != bs->drv) { | |
228 | ret = -EPERM; | |
229 | goto fail; | |
230 | } | |
231 | ||
232 | /* Use the checked buffer, a malicious guest might be overwriting its | |
233 | * original buffer in the background. */ | |
234 | qemu_iovec_init(&local_qiov, qiov->niov + 1); | |
235 | qemu_iovec_add(&local_qiov, buf, 512); | |
236 | qemu_iovec_concat(&local_qiov, qiov, 512, qiov->size - 512); | |
237 | qiov = &local_qiov; | |
238 | } | |
239 | ||
2fdc7045 TG |
240 | offset += s->offset; |
241 | ||
9eaafd90 | 242 | BLKDBG_EVENT(bs->file, BLKDBG_WRITE_AIO); |
decaeed7 | 243 | ret = bdrv_co_pwritev(bs->file, offset, bytes, qiov, flags); |
38f3ef57 KW |
244 | |
245 | fail: | |
246 | if (qiov == &local_qiov) { | |
247 | qemu_iovec_destroy(&local_qiov); | |
248 | } | |
249 | qemu_vfree(buf); | |
250 | return ret; | |
e1c66c6d LE |
251 | } |
252 | ||
b6b8a333 PB |
253 | static int64_t coroutine_fn raw_co_get_block_status(BlockDriverState *bs, |
254 | int64_t sector_num, | |
67a0fd2a FZ |
255 | int nb_sectors, int *pnum, |
256 | BlockDriverState **file) | |
e1c66c6d | 257 | { |
2fdc7045 | 258 | BDRVRawState *s = bs->opaque; |
92bc50a5 | 259 | *pnum = nb_sectors; |
02650acb | 260 | *file = bs->file->bs; |
2fdc7045 | 261 | sector_num += s->offset / BDRV_SECTOR_SIZE; |
92bc50a5 PL |
262 | return BDRV_BLOCK_RAW | BDRV_BLOCK_OFFSET_VALID | BDRV_BLOCK_DATA | |
263 | (sector_num << BDRV_SECTOR_BITS); | |
e1c66c6d LE |
264 | } |
265 | ||
39ad937e EB |
266 | static int coroutine_fn raw_co_pwrite_zeroes(BlockDriverState *bs, |
267 | int64_t offset, int count, | |
268 | BdrvRequestFlags flags) | |
e1c66c6d | 269 | { |
2fdc7045 TG |
270 | BDRVRawState *s = bs->opaque; |
271 | if (offset > UINT64_MAX - s->offset) { | |
272 | return -EINVAL; | |
273 | } | |
274 | offset += s->offset; | |
a03ef88f | 275 | return bdrv_co_pwrite_zeroes(bs->file, offset, count, flags); |
e1c66c6d LE |
276 | } |
277 | ||
5f61ad07 EB |
278 | static int coroutine_fn raw_co_pdiscard(BlockDriverState *bs, |
279 | int64_t offset, int count) | |
e1c66c6d | 280 | { |
2fdc7045 TG |
281 | BDRVRawState *s = bs->opaque; |
282 | if (offset > UINT64_MAX - s->offset) { | |
283 | return -EINVAL; | |
284 | } | |
285 | offset += s->offset; | |
5f61ad07 | 286 | return bdrv_co_pdiscard(bs->file->bs, offset, count); |
e1c66c6d LE |
287 | } |
288 | ||
7a6d3fc5 | 289 | static int64_t raw_getlength(BlockDriverState *bs) |
e1c66c6d | 290 | { |
2fdc7045 TG |
291 | int64_t len; |
292 | BDRVRawState *s = bs->opaque; | |
293 | ||
294 | /* Update size. It should not change unless the file was externally | |
295 | * modified. */ | |
296 | len = bdrv_getlength(bs->file->bs); | |
297 | if (len < 0) { | |
298 | return len; | |
299 | } | |
300 | ||
301 | if (len < s->offset) { | |
302 | s->size = 0; | |
303 | } else { | |
304 | if (s->has_size) { | |
305 | /* Try to honour the size */ | |
306 | s->size = MIN(s->size, len - s->offset); | |
307 | } else { | |
308 | s->size = len - s->offset; | |
309 | } | |
310 | } | |
311 | ||
312 | return s->size; | |
e1c66c6d LE |
313 | } |
314 | ||
7a6d3fc5 | 315 | static int raw_get_info(BlockDriverState *bs, BlockDriverInfo *bdi) |
e1c66c6d | 316 | { |
9a4f4c31 | 317 | return bdrv_get_info(bs->file->bs, bdi); |
e1c66c6d LE |
318 | } |
319 | ||
decaeed7 EB |
320 | static void raw_refresh_limits(BlockDriverState *bs, Error **errp) |
321 | { | |
322 | if (bs->probed) { | |
323 | /* To make it easier to protect the first sector, any probed | |
324 | * image is restricted to read-modify-write on sub-sector | |
325 | * operations. */ | |
326 | bs->bl.request_alignment = BDRV_SECTOR_SIZE; | |
327 | } | |
328 | } | |
329 | ||
4bff28b8 | 330 | static int raw_truncate(BlockDriverState *bs, int64_t offset, Error **errp) |
e1c66c6d | 331 | { |
2fdc7045 TG |
332 | BDRVRawState *s = bs->opaque; |
333 | ||
334 | if (s->has_size) { | |
f59adb32 | 335 | error_setg(errp, "Cannot resize fixed-size raw disks"); |
2fdc7045 TG |
336 | return -ENOTSUP; |
337 | } | |
338 | ||
339 | if (INT64_MAX - offset < s->offset) { | |
f59adb32 | 340 | error_setg(errp, "Disk size too large for the chosen offset"); |
2fdc7045 TG |
341 | return -EINVAL; |
342 | } | |
343 | ||
344 | s->size = offset; | |
345 | offset += s->offset; | |
4bff28b8 | 346 | return bdrv_truncate(bs->file, offset, errp); |
e1c66c6d LE |
347 | } |
348 | ||
7a6d3fc5 | 349 | static int raw_media_changed(BlockDriverState *bs) |
e1c66c6d | 350 | { |
9a4f4c31 | 351 | return bdrv_media_changed(bs->file->bs); |
e1c66c6d LE |
352 | } |
353 | ||
7a6d3fc5 | 354 | static void raw_eject(BlockDriverState *bs, bool eject_flag) |
e1c66c6d | 355 | { |
9a4f4c31 | 356 | bdrv_eject(bs->file->bs, eject_flag); |
e1c66c6d LE |
357 | } |
358 | ||
7a6d3fc5 | 359 | static void raw_lock_medium(BlockDriverState *bs, bool locked) |
e1c66c6d | 360 | { |
9a4f4c31 | 361 | bdrv_lock_medium(bs->file->bs, locked); |
e1c66c6d LE |
362 | } |
363 | ||
151a2930 | 364 | static int raw_co_ioctl(BlockDriverState *bs, unsigned long int req, void *buf) |
e1c66c6d | 365 | { |
2fdc7045 TG |
366 | BDRVRawState *s = bs->opaque; |
367 | if (s->offset || s->has_size) { | |
368 | return -ENOTSUP; | |
369 | } | |
151a2930 | 370 | return bdrv_co_ioctl(bs->file->bs, req, buf); |
e1c66c6d LE |
371 | } |
372 | ||
7a6d3fc5 | 373 | static int raw_has_zero_init(BlockDriverState *bs) |
e1c66c6d | 374 | { |
9a4f4c31 | 375 | return bdrv_has_zero_init(bs->file->bs); |
e1c66c6d LE |
376 | } |
377 | ||
cd3a4cf6 | 378 | static int raw_create(const char *filename, QemuOpts *opts, Error **errp) |
1565262c | 379 | { |
9be38598 | 380 | return bdrv_create_file(filename, opts, errp); |
1565262c | 381 | } |
01dd96d8 | 382 | |
015a1036 HR |
383 | static int raw_open(BlockDriverState *bs, QDict *options, int flags, |
384 | Error **errp) | |
01dd96d8 | 385 | { |
2fdc7045 TG |
386 | BDRVRawState *s = bs->opaque; |
387 | int ret; | |
388 | ||
4e4bf5c4 KW |
389 | bs->file = bdrv_open_child(NULL, options, "file", bs, &child_file, |
390 | false, errp); | |
391 | if (!bs->file) { | |
392 | return -EINVAL; | |
393 | } | |
394 | ||
9a4f4c31 | 395 | bs->sg = bs->file->bs->sg; |
8a39b4d6 EB |
396 | bs->supported_write_flags = BDRV_REQ_FUA & |
397 | bs->file->bs->supported_write_flags; | |
398 | bs->supported_zero_flags = (BDRV_REQ_FUA | BDRV_REQ_MAY_UNMAP) & | |
399 | bs->file->bs->supported_zero_flags; | |
38f3ef57 KW |
400 | |
401 | if (bs->probed && !bdrv_is_read_only(bs)) { | |
402 | fprintf(stderr, | |
403 | "WARNING: Image format was not specified for '%s' and probing " | |
404 | "guessed raw.\n" | |
405 | " Automatically detecting the format is dangerous for " | |
406 | "raw images, write operations on block 0 will be restricted.\n" | |
407 | " Specify the 'raw' format explicitly to remove the " | |
408 | "restrictions.\n", | |
9a4f4c31 | 409 | bs->file->bs->filename); |
38f3ef57 KW |
410 | } |
411 | ||
2fdc7045 TG |
412 | ret = raw_read_options(options, bs, s, errp); |
413 | if (ret < 0) { | |
414 | return ret; | |
415 | } | |
416 | ||
417 | if (bs->sg && (s->offset || s->has_size)) { | |
418 | error_setg(errp, "Cannot use offset/size with SCSI generic devices"); | |
419 | return -EINVAL; | |
420 | } | |
421 | ||
01dd96d8 LE |
422 | return 0; |
423 | } | |
424 | ||
7a6d3fc5 | 425 | static void raw_close(BlockDriverState *bs) |
01dd96d8 LE |
426 | { |
427 | } | |
428 | ||
/*
 * Probe callback.  The arguments are ignored and the score is constant:
 * the smallest possible positive score, so that raw is used if and only if
 * no other block driver works.
 */
static int raw_probe(const uint8_t *buf, int buf_size, const char *filename)
{
    const int lowest_positive_score = 1;

    return lowest_positive_score;
}
775d6afd | 436 | |
1a9335e4 ET |
437 | static int raw_probe_blocksizes(BlockDriverState *bs, BlockSizes *bsz) |
438 | { | |
2fdc7045 TG |
439 | BDRVRawState *s = bs->opaque; |
440 | int ret; | |
441 | ||
442 | ret = bdrv_probe_blocksizes(bs->file->bs, bsz); | |
443 | if (ret < 0) { | |
444 | return ret; | |
445 | } | |
446 | ||
447 | if (!QEMU_IS_ALIGNED(s->offset, MAX(bsz->log, bsz->phys))) { | |
448 | return -ENOTSUP; | |
449 | } | |
450 | ||
451 | return 0; | |
1a9335e4 ET |
452 | } |
453 | ||
454 | static int raw_probe_geometry(BlockDriverState *bs, HDGeometry *geo) | |
455 | { | |
2fdc7045 TG |
456 | BDRVRawState *s = bs->opaque; |
457 | if (s->offset || s->has_size) { | |
458 | return -ENOTSUP; | |
459 | } | |
9a4f4c31 | 460 | return bdrv_probe_geometry(bs->file->bs, geo); |
1a9335e4 ET |
461 | } |
462 | ||
5f535a94 | 463 | BlockDriver bdrv_raw = { |
775d6afd | 464 | .format_name = "raw", |
2fdc7045 | 465 | .instance_size = sizeof(BDRVRawState), |
775d6afd LE |
466 | .bdrv_probe = &raw_probe, |
467 | .bdrv_reopen_prepare = &raw_reopen_prepare, | |
2fdc7045 TG |
468 | .bdrv_reopen_commit = &raw_reopen_commit, |
469 | .bdrv_reopen_abort = &raw_reopen_abort, | |
775d6afd LE |
470 | .bdrv_open = &raw_open, |
471 | .bdrv_close = &raw_close, | |
d7010dfb | 472 | .bdrv_child_perm = bdrv_filter_default_perms, |
c282e1fd | 473 | .bdrv_create = &raw_create, |
decaeed7 EB |
474 | .bdrv_co_preadv = &raw_co_preadv, |
475 | .bdrv_co_pwritev = &raw_co_pwritev, | |
39ad937e | 476 | .bdrv_co_pwrite_zeroes = &raw_co_pwrite_zeroes, |
5f61ad07 | 477 | .bdrv_co_pdiscard = &raw_co_pdiscard, |
b6b8a333 | 478 | .bdrv_co_get_block_status = &raw_co_get_block_status, |
775d6afd LE |
479 | .bdrv_truncate = &raw_truncate, |
480 | .bdrv_getlength = &raw_getlength, | |
b94a2610 | 481 | .has_variable_length = true, |
775d6afd | 482 | .bdrv_get_info = &raw_get_info, |
decaeed7 | 483 | .bdrv_refresh_limits = &raw_refresh_limits, |
1a9335e4 ET |
484 | .bdrv_probe_blocksizes = &raw_probe_blocksizes, |
485 | .bdrv_probe_geometry = &raw_probe_geometry, | |
775d6afd LE |
486 | .bdrv_media_changed = &raw_media_changed, |
487 | .bdrv_eject = &raw_eject, | |
488 | .bdrv_lock_medium = &raw_lock_medium, | |
151a2930 | 489 | .bdrv_co_ioctl = &raw_co_ioctl, |
cd3a4cf6 | 490 | .create_opts = &raw_create_opts, |
775d6afd LE |
491 | .bdrv_has_zero_init = &raw_has_zero_init |
492 | }; | |
493 | ||
494 | static void bdrv_raw_init(void) | |
495 | { | |
496 | bdrv_register(&bdrv_raw); | |
497 | } | |
498 | ||
499 | block_init(bdrv_raw_init); |