]>
Commit | Line | Data |
---|---|---|
ea2384d3 FB |
1 | /* |
2 | * QEMU System Emulator block driver | |
5fafdf24 | 3 | * |
ea2384d3 | 4 | * Copyright (c) 2003 Fabrice Bellard |
5fafdf24 | 5 | * |
ea2384d3 FB |
6 | * Permission is hereby granted, free of charge, to any person obtaining a copy |
7 | * of this software and associated documentation files (the "Software"), to deal | |
8 | * in the Software without restriction, including without limitation the rights | |
9 | * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell | |
10 | * copies of the Software, and to permit persons to whom the Software is | |
11 | * furnished to do so, subject to the following conditions: | |
12 | * | |
13 | * The above copyright notice and this permission notice shall be included in | |
14 | * all copies or substantial portions of the Software. | |
15 | * | |
16 | * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR | |
17 | * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, | |
18 | * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL | |
19 | * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER | |
20 | * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, | |
21 | * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN | |
22 | * THE SOFTWARE. | |
23 | */ | |
24 | #ifndef BLOCK_INT_H | |
25 | #define BLOCK_INT_H | |
26 | ||
5e5a94b6 | 27 | #include "block/accounting.h" |
737e150e | 28 | #include "block/block.h" |
281d22d8 | 29 | #include "block/throttle-groups.h" |
1de7afc9 PB |
30 | #include "qemu/option.h" |
31 | #include "qemu/queue.h" | |
10817bf0 | 32 | #include "qemu/coroutine.h" |
1de7afc9 | 33 | #include "qemu/timer.h" |
b2023818 | 34 | #include "qapi-types.h" |
8f0720ec | 35 | #include "qemu/hbitmap.h" |
f364ec65 | 36 | #include "block/snapshot.h" |
6a1751b7 | 37 | #include "qemu/main-loop.h" |
cc0681c4 | 38 | #include "qemu/throttle.h" |
faf07963 | 39 | |
bfe8043e SH |
40 | #define BLOCK_FLAG_ENCRYPT 1 |
41 | #define BLOCK_FLAG_COMPAT6 4 | |
42 | #define BLOCK_FLAG_LAZY_REFCOUNTS 8 | |
ec36ba14 | 43 | |
bfe8043e SH |
44 | #define BLOCK_OPT_SIZE "size" |
45 | #define BLOCK_OPT_ENCRYPT "encryption" | |
46 | #define BLOCK_OPT_COMPAT6 "compat6" | |
47 | #define BLOCK_OPT_BACKING_FILE "backing_file" | |
48 | #define BLOCK_OPT_BACKING_FMT "backing_fmt" | |
49 | #define BLOCK_OPT_CLUSTER_SIZE "cluster_size" | |
50 | #define BLOCK_OPT_TABLE_SIZE "table_size" | |
51 | #define BLOCK_OPT_PREALLOC "preallocation" | |
52 | #define BLOCK_OPT_SUBFMT "subformat" | |
53 | #define BLOCK_OPT_COMPAT_LEVEL "compat" | |
54 | #define BLOCK_OPT_LAZY_REFCOUNTS "lazy_refcounts" | |
7f2039f6 | 55 | #define BLOCK_OPT_ADAPTER_TYPE "adapter_type" |
b3af018f | 56 | #define BLOCK_OPT_REDUNDANCY "redundancy" |
4ab15590 | 57 | #define BLOCK_OPT_NOCOW "nocow" |
876eb1b0 | 58 | #define BLOCK_OPT_OBJECT_SIZE "object_size" |
06d05fa7 | 59 | #define BLOCK_OPT_REFCOUNT_BITS "refcount_bits" |
0e7e1989 | 60 | |
7cddd372 KW |
61 | #define BLOCK_PROBE_BUF_SIZE 512 |
62 | ||
d616b224 SH |
63 | typedef struct BdrvTrackedRequest { |
64 | BlockDriverState *bs; | |
793ed47a KW |
65 | int64_t offset; |
66 | unsigned int bytes; | |
d616b224 | 67 | bool is_write; |
7327145f | 68 | |
2dbafdc0 | 69 | bool serialising; |
7327145f KW |
70 | int64_t overlap_offset; |
71 | unsigned int overlap_bytes; | |
72 | ||
d616b224 SH |
73 | QLIST_ENTRY(BdrvTrackedRequest) list; |
74 | Coroutine *co; /* owner, used for deadlock detection */ | |
75 | CoQueue wait_queue; /* coroutines blocked on this request */ | |
6460440f KW |
76 | |
77 | struct BdrvTrackedRequest *waiting_for; | |
d616b224 SH |
78 | } BdrvTrackedRequest; |
79 | ||
ea2384d3 FB |
80 | struct BlockDriver { |
81 | const char *format_name; | |
82 | int instance_size; | |
f6186f49 | 83 | |
b5042a36 BC |
84 | /* set to true if the BlockDriver is a block filter */ |
85 | bool is_filter; | |
86 | /* For snapshots, block filters like Quorum can implement the | |
87 | * following recursive callback. | |
212a5a8f BC |
88 | * Its purpose is to recurse on the filter children while calling |
89 | * bdrv_recurse_is_first_non_filter on them. | |
90 | * For a sample implementation look in the future Quorum block filter. | |
f6186f49 | 91 | */ |
212a5a8f BC |
92 | bool (*bdrv_recurse_is_first_non_filter)(BlockDriverState *bs, |
93 | BlockDriverState *candidate); | |
f6186f49 | 94 | |
ea2384d3 | 95 | int (*bdrv_probe)(const uint8_t *buf, int buf_size, const char *filename); |
508c7cb3 | 96 | int (*bdrv_probe_device)(const char *filename); |
c2ad1b0c KW |
97 | |
98 | /* Any driver implementing this callback is expected to be able to handle | |
99 | * NULL file names in its .bdrv_open() implementation */ | |
6963a30d | 100 | void (*bdrv_parse_filename)(const char *filename, QDict *options, Error **errp); |
030be321 BC |
101 | /* Drivers not implementing bdrv_parse_filename nor bdrv_open should have |
102 | * this field set to true, except ones that are defined only by their | |
103 | * child's bs. | |
104 | * An example of the last type will be the quorum block driver. | |
105 | */ | |
106 | bool bdrv_needs_filename; | |
e971aa12 | 107 | |
8ee79e70 KW |
108 | /* Set if a driver can support backing files */ |
109 | bool supports_backing; | |
110 | ||
e971aa12 JC |
111 | /* For handling image reopen for split or non-split files */ |
112 | int (*bdrv_reopen_prepare)(BDRVReopenState *reopen_state, | |
113 | BlockReopenQueue *queue, Error **errp); | |
114 | void (*bdrv_reopen_commit)(BDRVReopenState *reopen_state); | |
115 | void (*bdrv_reopen_abort)(BDRVReopenState *reopen_state); | |
116 | ||
015a1036 HR |
117 | int (*bdrv_open)(BlockDriverState *bs, QDict *options, int flags, |
118 | Error **errp); | |
119 | int (*bdrv_file_open)(BlockDriverState *bs, QDict *options, int flags, | |
120 | Error **errp); | |
5fafdf24 | 121 | int (*bdrv_read)(BlockDriverState *bs, int64_t sector_num, |
ea2384d3 | 122 | uint8_t *buf, int nb_sectors); |
5fafdf24 | 123 | int (*bdrv_write)(BlockDriverState *bs, int64_t sector_num, |
ea2384d3 | 124 | const uint8_t *buf, int nb_sectors); |
e2731add | 125 | void (*bdrv_close)(BlockDriverState *bs); |
c282e1fd | 126 | int (*bdrv_create)(const char *filename, QemuOpts *opts, Error **errp); |
ea2384d3 | 127 | int (*bdrv_set_key)(BlockDriverState *bs, const char *key); |
95389c86 | 128 | int (*bdrv_make_empty)(BlockDriverState *bs); |
91af7014 HR |
129 | |
130 | void (*bdrv_refresh_filename)(BlockDriverState *bs); | |
131 | ||
83f64091 | 132 | /* aio */ |
7c84b1b8 | 133 | BlockAIOCB *(*bdrv_aio_readv)(BlockDriverState *bs, |
f141eafe | 134 | int64_t sector_num, QEMUIOVector *qiov, int nb_sectors, |
097310b5 | 135 | BlockCompletionFunc *cb, void *opaque); |
7c84b1b8 | 136 | BlockAIOCB *(*bdrv_aio_writev)(BlockDriverState *bs, |
f141eafe | 137 | int64_t sector_num, QEMUIOVector *qiov, int nb_sectors, |
097310b5 | 138 | BlockCompletionFunc *cb, void *opaque); |
7c84b1b8 | 139 | BlockAIOCB *(*bdrv_aio_flush)(BlockDriverState *bs, |
097310b5 | 140 | BlockCompletionFunc *cb, void *opaque); |
7c84b1b8 | 141 | BlockAIOCB *(*bdrv_aio_discard)(BlockDriverState *bs, |
4265d620 | 142 | int64_t sector_num, int nb_sectors, |
097310b5 | 143 | BlockCompletionFunc *cb, void *opaque); |
83f64091 | 144 | |
da1fa91d KW |
145 | int coroutine_fn (*bdrv_co_readv)(BlockDriverState *bs, |
146 | int64_t sector_num, int nb_sectors, QEMUIOVector *qiov); | |
147 | int coroutine_fn (*bdrv_co_writev)(BlockDriverState *bs, | |
148 | int64_t sector_num, int nb_sectors, QEMUIOVector *qiov); | |
f08f2dda SH |
149 | /* |
150 | * Efficiently zero a region of the disk image. Typically an image format | |
151 | * would use a compact metadata representation to implement this. This | |
152 | * function pointer may be NULL and .bdrv_co_writev() will be called | |
153 | * instead. | |
154 | */ | |
155 | int coroutine_fn (*bdrv_co_write_zeroes)(BlockDriverState *bs, | |
aa7bfbff | 156 | int64_t sector_num, int nb_sectors, BdrvRequestFlags flags); |
4265d620 PB |
157 | int coroutine_fn (*bdrv_co_discard)(BlockDriverState *bs, |
158 | int64_t sector_num, int nb_sectors); | |
b6b8a333 | 159 | int64_t coroutine_fn (*bdrv_co_get_block_status)(BlockDriverState *bs, |
376ae3f1 | 160 | int64_t sector_num, int nb_sectors, int *pnum); |
da1fa91d | 161 | |
0f15423c AL |
162 | /* |
163 | * Invalidate any cached meta-data. | |
164 | */ | |
5a8a30db | 165 | void (*bdrv_invalidate_cache)(BlockDriverState *bs, Error **errp); |
0f15423c | 166 | |
c68b89ac KW |
167 | /* |
168 | * Flushes all data that was already written to the OS all the way down to | |
169 | * the disk (for example raw-posix calls fsync()). | |
170 | */ | |
171 | int coroutine_fn (*bdrv_co_flush_to_disk)(BlockDriverState *bs); | |
172 | ||
eb489bb1 KW |
173 | /* |
174 | * Flushes all internal caches to the OS. The data may still sit in a | |
175 | * writeback cache of the host OS, but it will survive a crash of the qemu | |
176 | * process. | |
177 | */ | |
178 | int coroutine_fn (*bdrv_co_flush_to_os)(BlockDriverState *bs); | |
179 | ||
83f64091 | 180 | const char *protocol_name; |
83f64091 | 181 | int (*bdrv_truncate)(BlockDriverState *bs, int64_t offset); |
b94a2610 | 182 | |
83f64091 | 183 | int64_t (*bdrv_getlength)(BlockDriverState *bs); |
b94a2610 | 184 | bool has_variable_length; |
4a1d5e1f | 185 | int64_t (*bdrv_get_allocated_file_size)(BlockDriverState *bs); |
b94a2610 | 186 | |
5fafdf24 | 187 | int (*bdrv_write_compressed)(BlockDriverState *bs, int64_t sector_num, |
faea38e7 FB |
188 | const uint8_t *buf, int nb_sectors); |
189 | ||
5fafdf24 | 190 | int (*bdrv_snapshot_create)(BlockDriverState *bs, |
faea38e7 | 191 | QEMUSnapshotInfo *sn_info); |
5fafdf24 | 192 | int (*bdrv_snapshot_goto)(BlockDriverState *bs, |
faea38e7 | 193 | const char *snapshot_id); |
a89d89d3 WX |
194 | int (*bdrv_snapshot_delete)(BlockDriverState *bs, |
195 | const char *snapshot_id, | |
196 | const char *name, | |
197 | Error **errp); | |
5fafdf24 | 198 | int (*bdrv_snapshot_list)(BlockDriverState *bs, |
faea38e7 | 199 | QEMUSnapshotInfo **psn_info); |
51ef6727 | 200 | int (*bdrv_snapshot_load_tmp)(BlockDriverState *bs, |
7b4c4781 WX |
201 | const char *snapshot_id, |
202 | const char *name, | |
203 | Error **errp); | |
faea38e7 | 204 | int (*bdrv_get_info)(BlockDriverState *bs, BlockDriverInfo *bdi); |
eae041fe | 205 | ImageInfoSpecific *(*bdrv_get_specific_info)(BlockDriverState *bs); |
83f64091 | 206 | |
cf8074b3 KW |
207 | int (*bdrv_save_vmstate)(BlockDriverState *bs, QEMUIOVector *qiov, |
208 | int64_t pos); | |
45566e9c CH |
209 | int (*bdrv_load_vmstate)(BlockDriverState *bs, uint8_t *buf, |
210 | int64_t pos, int size); | |
178e08a5 | 211 | |
756e6736 KW |
212 | int (*bdrv_change_backing_file)(BlockDriverState *bs, |
213 | const char *backing_file, const char *backing_fmt); | |
214 | ||
19cb3738 | 215 | /* removable device specific */ |
e031f750 | 216 | bool (*bdrv_is_inserted)(BlockDriverState *bs); |
19cb3738 | 217 | int (*bdrv_media_changed)(BlockDriverState *bs); |
f36f3949 | 218 | void (*bdrv_eject)(BlockDriverState *bs, bool eject_flag); |
025e849a | 219 | void (*bdrv_lock_medium)(BlockDriverState *bs, bool locked); |
3b46e624 | 220 | |
985a03b0 TS |
221 | /* to control generic scsi devices */ |
222 | int (*bdrv_ioctl)(BlockDriverState *bs, unsigned long int req, void *buf); | |
7c84b1b8 | 223 | BlockAIOCB *(*bdrv_aio_ioctl)(BlockDriverState *bs, |
221f715d | 224 | unsigned long int req, void *buf, |
097310b5 | 225 | BlockCompletionFunc *cb, void *opaque); |
985a03b0 | 226 | |
0e7e1989 | 227 | /* List of options for creating images, terminated by name == NULL */ |
83d0521a | 228 | QemuOptsList *create_opts; |
5eb45639 | 229 | |
9ac228e0 KW |
230 | /* |
231 | * Returns 0 for completed check, -errno for internal errors. | |
232 | * The check results are stored in result. | |
233 | */ | |
4534ff54 KW |
234 | int (*bdrv_check)(BlockDriverState* bs, BdrvCheckResult *result, |
235 | BdrvCheckMode fix); | |
e97fc193 | 236 | |
77485434 HR |
237 | int (*bdrv_amend_options)(BlockDriverState *bs, QemuOpts *opts, |
238 | BlockDriverAmendStatusCB *status_cb); | |
6f176b48 | 239 | |
8b9b0cc2 KW |
240 | void (*bdrv_debug_event)(BlockDriverState *bs, BlkDebugEvent event); |
241 | ||
41c695c7 KW |
242 | /* TODO Better pass an option string/QDict/QemuOpts to add any rule? */ |
243 | int (*bdrv_debug_breakpoint)(BlockDriverState *bs, const char *event, | |
244 | const char *tag); | |
4cc70e93 FZ |
245 | int (*bdrv_debug_remove_breakpoint)(BlockDriverState *bs, |
246 | const char *tag); | |
41c695c7 KW |
247 | int (*bdrv_debug_resume)(BlockDriverState *bs, const char *tag); |
248 | bool (*bdrv_debug_is_suspended)(BlockDriverState *bs, const char *tag); | |
249 | ||
3baca891 | 250 | void (*bdrv_refresh_limits)(BlockDriverState *bs, Error **errp); |
d34682cd | 251 | |
336c1c12 KW |
252 | /* |
253 | * Returns 1 if newly created images are guaranteed to contain only | |
254 | * zeros, 0 otherwise. | |
255 | */ | |
256 | int (*bdrv_has_zero_init)(BlockDriverState *bs); | |
12c09b8c | 257 | |
dcd04228 SH |
258 | /* Remove fd handlers, timers, and other event loop callbacks so the event |
259 | * loop is no longer in use. Called with no in-flight requests and in | |
260 | * depth-first traversal order with parents before child nodes. | |
261 | */ | |
262 | void (*bdrv_detach_aio_context)(BlockDriverState *bs); | |
263 | ||
264 | /* Add fd handlers, timers, and other event loop callbacks so I/O requests | |
265 | * can be processed again. Called with no in-flight requests and in | |
266 | * depth-first traversal order with child nodes before parent nodes. | |
267 | */ | |
268 | void (*bdrv_attach_aio_context)(BlockDriverState *bs, | |
269 | AioContext *new_context); | |
270 | ||
448ad91d ML |
271 | /* io queue for linux-aio */ |
272 | void (*bdrv_io_plug)(BlockDriverState *bs); | |
273 | void (*bdrv_io_unplug)(BlockDriverState *bs); | |
274 | void (*bdrv_flush_io_queue)(BlockDriverState *bs); | |
275 | ||
892b7de8 ET |
276 | /** |
277 | * Try to get @bs's logical and physical block size. | |
278 | * On success, store them in @bsz and return zero. | |
279 | * On failure, return negative errno. | |
280 | */ | |
281 | int (*bdrv_probe_blocksizes)(BlockDriverState *bs, BlockSizes *bsz); | |
282 | /** | |
283 | * Try to get @bs's geometry (cyls, heads, sectors) | |
284 | * On success, store them in @geo and return 0. | |
285 | * On failure return -errno. | |
286 | * Only drivers that want to override guest geometry implement this | |
287 | * callback; see hd_geometry_guess(). | |
288 | */ | |
289 | int (*bdrv_probe_geometry)(BlockDriverState *bs, HDGeometry *geo); | |
290 | ||
8a22f02a | 291 | QLIST_ENTRY(BlockDriver) list; |
ea2384d3 FB |
292 | }; |
293 | ||
fe81c2cc PL |
294 | typedef struct BlockLimits { |
295 | /* maximum number of sectors that can be discarded at once */ | |
296 | int max_discard; | |
297 | ||
298 | /* optimal alignment for discard requests in sectors */ | |
299 | int64_t discard_alignment; | |
300 | ||
301 | /* maximum number of sectors that can be zeroized at once */ | |
302 | int max_write_zeroes; | |
303 | ||
304 | /* optimal alignment for write zeroes requests in sectors */ | |
305 | int64_t write_zeroes_alignment; | |
7337acaf PL |
306 | |
307 | /* optimal transfer length in sectors */ | |
308 | int opt_transfer_length; | |
339064d5 | 309 | |
2647fab5 PL |
310 | /* maximal transfer length in sectors */ |
311 | int max_transfer_length; | |
312 | ||
339064d5 | 313 | /* memory alignment so that no bounce buffer is needed */ |
4196d2f0 DL |
314 | size_t min_mem_alignment; |
315 | ||
316 | /* memory alignment for bounce buffer */ | |
339064d5 | 317 | size_t opt_mem_alignment; |
fe81c2cc PL |
318 | } BlockLimits; |
319 | ||
fbe40ff7 FZ |
320 | typedef struct BdrvOpBlocker BdrvOpBlocker; |
321 | ||
33384421 HR |
322 | typedef struct BdrvAioNotifier { |
323 | void (*attached_aio_context)(AioContext *new_context, void *opaque); | |
324 | void (*detach_aio_context)(void *opaque); | |
325 | ||
326 | void *opaque; | |
327 | ||
328 | QLIST_ENTRY(BdrvAioNotifier) list; | |
329 | } BdrvAioNotifier; | |
330 | ||
f3930ed0 KW |
331 | struct BdrvChildRole { |
332 | int (*inherit_flags)(int parent_flags); | |
333 | }; | |
334 | ||
335 | extern const BdrvChildRole child_file; | |
336 | extern const BdrvChildRole child_format; | |
337 | ||
b4b059f6 | 338 | struct BdrvChild { |
6e93e7c4 KW |
339 | BlockDriverState *bs; |
340 | const BdrvChildRole *role; | |
341 | QLIST_ENTRY(BdrvChild) next; | |
d42a8a93 | 342 | QLIST_ENTRY(BdrvChild) next_parent; |
b4b059f6 | 343 | }; |
6e93e7c4 | 344 | |
8802d1fd JC |
345 | /* |
346 | * Note: the function bdrv_append() copies and swaps contents of | |
347 | * BlockDriverStates, so if you add new fields to this struct, please | |
348 | * inspect bdrv_append() to determine if the new fields need to be | |
349 | * copied as well. | |
350 | */ | |
ea2384d3 | 351 | struct BlockDriverState { |
d15a771d FB |
352 | int64_t total_sectors; /* if we are reading a disk image, give its |
353 | size in sectors */ | |
ea2384d3 | 354 | int read_only; /* if true, the media is read only */ |
4dca4b63 | 355 | int open_flags; /* flags used to open the file, re-used for re-open */ |
ea2384d3 | 356 | int encrypted; /* if true, the media is encrypted */ |
c0f4ce77 | 357 | int valid_key; /* if true, a valid encryption key has been set */ |
985a03b0 | 358 | int sg; /* if true, the device is a /dev/sg* */ |
53fec9d3 SH |
359 | int copy_on_read; /* if true, copy read backing sectors into image |
360 | note this is a reference count */ | |
38f3ef57 | 361 | bool probed; |
ea2384d3 | 362 | |
19cb3738 | 363 | BlockDriver *drv; /* NULL means no media */ |
ea2384d3 FB |
364 | void *opaque; |
365 | ||
7e7d56d9 MA |
366 | BlockBackend *blk; /* owning backend, if any */ |
367 | ||
dcd04228 | 368 | AioContext *aio_context; /* event loop used for fd handlers, timers, etc */ |
33384421 HR |
369 | /* long-running tasks intended to always use the same AioContext as this |
370 | * BDS may register themselves in this list to be notified of changes | |
371 | * regarding this BDS's context */ | |
372 | QLIST_HEAD(, BdrvAioNotifier) aio_notifiers; | |
dcd04228 | 373 | |
9a29e18f JC |
374 | char filename[PATH_MAX]; |
375 | char backing_file[PATH_MAX]; /* if non zero, the image is a diff of | |
376 | this file image */ | |
5eb45639 | 377 | char backing_format[16]; /* if non-zero and backing_file exists */ |
19cb3738 | 378 | |
91af7014 | 379 | QDict *full_open_options; |
9a29e18f | 380 | char exact_filename[PATH_MAX]; |
91af7014 | 381 | |
760e0063 | 382 | BdrvChild *backing; |
9a4f4c31 | 383 | BdrvChild *file; |
66f82cee | 384 | |
d7d512f6 PB |
385 | NotifierList close_notifiers; |
386 | ||
d616b224 SH |
387 | /* Callback before write request is processed */ |
388 | NotifierWithReturnList before_write_notifiers; | |
389 | ||
2dbafdc0 KW |
390 | /* number of in-flight serialising requests */ |
391 | unsigned int serialising_in_flight; | |
470c0504 | 392 | |
cc0681c4 | 393 | /* I/O throttling */ |
cc0681c4 | 394 | CoQueue throttled_reqs[2]; |
0563e191 | 395 | bool io_limits_enabled; |
76f4afb4 AG |
396 | /* The following fields are protected by the ThrottleGroup lock. |
397 | * See the ThrottleGroup documentation for details. */ | |
398 | ThrottleState *throttle_state; | |
399 | ThrottleTimers throttle_timers; | |
400 | unsigned pending_reqs[2]; | |
2ff1f2e3 | 401 | QLIST_ENTRY(BlockDriverState) round_robin; |
0563e191 | 402 | |
53d8f9d8 HR |
403 | /* Offset after the highest byte written to */ |
404 | uint64_t wr_highest_offset; | |
405 | ||
fe81c2cc PL |
406 | /* I/O Limits */ |
407 | BlockLimits bl; | |
408 | ||
0d51b4de AH |
409 | /* Whether reads beyond EOF produce zeros */ |
410 | bool zero_beyond_eof; | |
411 | ||
c25f53b0 PB |
412 | /* Alignment requirement for offset/length of I/O requests */ |
413 | unsigned int request_alignment; | |
414 | ||
e900a7b7 CH |
415 | /* do we need to tell the guest if we have a volatile write cache? */ |
416 | int enable_write_cache; | |
417 | ||
dc364f4c BC |
418 | /* the following member gives a name to every node on the bs graph. */ |
419 | char node_name[32]; | |
420 | /* element of the list of named nodes building the graph */ | |
421 | QTAILQ_ENTRY(BlockDriverState) node_list; | |
dc364f4c BC |
422 | /* element of the list of "drives" the guest sees */ |
423 | QTAILQ_ENTRY(BlockDriverState) device_list; | |
e4654d2d | 424 | QLIST_HEAD(, BdrvDirtyBitmap) dirty_bitmaps; |
9fcb0251 | 425 | int refcnt; |
dbffbdcf SH |
426 | |
427 | QLIST_HEAD(, BdrvTrackedRequest) tracked_requests; | |
eeec61f2 | 428 | |
fbe40ff7 FZ |
429 | /* operation blockers */ |
430 | QLIST_HEAD(, BdrvOpBlocker) op_blockers[BLOCK_OP_TYPE_MAX]; | |
431 | ||
eeec61f2 SH |
432 | /* long-running background operation */ |
433 | BlockJob *job; | |
e971aa12 | 434 | |
bddcec37 KW |
435 | /* The node that this node inherited default options from (and a reopen on |
436 | * which can affect this node by changing these defaults). This is always a | |
437 | * parent node of this node. */ | |
438 | BlockDriverState *inherits_from; | |
6e93e7c4 | 439 | QLIST_HEAD(, BdrvChild) children; |
d42a8a93 | 440 | QLIST_HEAD(, BdrvChild) parents; |
6e93e7c4 | 441 | |
de9c0cec | 442 | QDict *options; |
465bee1d | 443 | BlockdevDetectZeroesOptions detect_zeroes; |
826b6ca0 FZ |
444 | |
445 | /* The error object in use for blocking operations on backing_hd */ | |
446 | Error *backing_blocker; | |
e2462113 FR |
447 | |
448 | /* threshold limit for writes, in bytes. "High water mark". */ | |
449 | uint64_t write_threshold_offset; | |
450 | NotifierWithReturn write_threshold_notifier; | |
51288d79 FZ |
451 | |
452 | int quiesce_counter; | |
ea2384d3 FB |
453 | }; |
454 | ||
281d22d8 HR |
455 | struct BlockBackendRootState { |
456 | int open_flags; | |
457 | bool read_only; | |
458 | BlockdevDetectZeroesOptions detect_zeroes; | |
459 | ||
460 | char *throttle_group; | |
461 | ThrottleState *throttle_state; | |
462 | }; | |
463 | ||
760e0063 KW |
464 | static inline BlockDriverState *backing_bs(BlockDriverState *bs) |
465 | { | |
466 | return bs->backing ? bs->backing->bs : NULL; | |
467 | } | |
468 | ||
5f535a94 HR |
469 | |
470 | /* Essential block drivers which must always be statically linked into qemu, and | |
471 | * which therefore can be accessed without using bdrv_find_format() */ | |
472 | extern BlockDriver bdrv_file; | |
473 | extern BlockDriver bdrv_raw; | |
474 | extern BlockDriver bdrv_qcow2; | |
475 | ||
c69a4dd8 HR |
476 | extern QTAILQ_HEAD(BdrvStates, BlockDriverState) bdrv_states; |
477 | ||
0eb7217e SH |
478 | /** |
479 | * bdrv_setup_io_funcs: | |
480 | * | |
481 | * Prepare a #BlockDriver for I/O request processing by populating | |
482 | * unimplemented coroutine and AIO interfaces with generic wrapper functions | |
483 | * that fall back to implemented interfaces. | |
484 | */ | |
485 | void bdrv_setup_io_funcs(BlockDriver *bdrv); | |
5f535a94 | 486 | |
eba25057 | 487 | int get_tmp_filename(char *filename, int size); |
38f3ef57 KW |
488 | BlockDriver *bdrv_probe_all(const uint8_t *buf, int buf_size, |
489 | const char *filename); | |
95389c86 | 490 | |
0563e191 | 491 | void bdrv_set_io_limits(BlockDriverState *bs, |
cc0681c4 BC |
492 | ThrottleConfig *cfg); |
493 | ||
0563e191 | 494 | |
d616b224 SH |
495 | /** |
496 | * bdrv_add_before_write_notifier: | |
497 | * | |
498 | * Register a callback that is invoked before write requests are processed but | |
499 | * after any throttling or waiting for overlapping requests. | |
500 | */ | |
501 | void bdrv_add_before_write_notifier(BlockDriverState *bs, | |
502 | NotifierWithReturn *notifier); | |
503 | ||
dcd04228 SH |
504 | /** |
505 | * bdrv_detach_aio_context: | |
506 | * | |
507 | * May be called from .bdrv_detach_aio_context() to detach children from the | |
508 | * current #AioContext. This is only needed by block drivers that manage their | |
760e0063 | 509 | * own children. Both ->file and ->backing are automatically handled and |
dcd04228 SH |
510 | * block drivers should not call this function on them explicitly. |
511 | */ | |
512 | void bdrv_detach_aio_context(BlockDriverState *bs); | |
513 | ||
514 | /** | |
515 | * bdrv_attach_aio_context: | |
516 | * | |
517 | * May be called from .bdrv_attach_aio_context() to attach children to the new | |
518 | * #AioContext. This is only needed by block drivers that manage their own | |
760e0063 | 519 | * children. Both ->file and ->backing are automatically handled and block |
dcd04228 SH |
520 | * drivers should not call this function on them explicitly. |
521 | */ | |
522 | void bdrv_attach_aio_context(BlockDriverState *bs, | |
523 | AioContext *new_context); | |
524 | ||
33384421 HR |
525 | /** |
526 | * bdrv_add_aio_context_notifier: | |
527 | * | |
528 | * If a long-running job intends to be always run in the same AioContext as a | |
529 | * certain BDS, it may use this function to be notified of changes regarding the | |
530 | * association of the BDS to an AioContext. | |
531 | * | |
532 | * attached_aio_context() is called after the target BDS has been attached to a | |
533 | * new AioContext; detach_aio_context() is called before the target BDS is being | |
534 | * detached from its old AioContext. | |
535 | */ | |
536 | void bdrv_add_aio_context_notifier(BlockDriverState *bs, | |
537 | void (*attached_aio_context)(AioContext *new_context, void *opaque), | |
538 | void (*detach_aio_context)(void *opaque), void *opaque); | |
539 | ||
540 | /** | |
541 | * bdrv_remove_aio_context_notifier: | |
542 | * | |
543 | * Unsubscribe from change notifications regarding the BDS's AioContext. The | |
544 | * parameters given here have to be the same as those given to | |
545 | * bdrv_add_aio_context_notifier(). | |
546 | */ | |
547 | void bdrv_remove_aio_context_notifier(BlockDriverState *bs, | |
548 | void (*aio_context_attached)(AioContext *, | |
549 | void *), | |
550 | void (*aio_context_detached)(void *), | |
551 | void *opaque); | |
552 | ||
508c7cb3 CH |
553 | #ifdef _WIN32 |
554 | int is_windows_drive(const char *filename); | |
555 | #endif | |
556 | ||
dc534f8f PB |
557 | /** |
558 | * stream_start: | |
559 | * @bs: Block device to operate on. | |
560 | * @base: Block device that will become the new base, or %NULL to | |
561 | * flatten the whole backing file chain onto @bs. | |
562 | * @base_id: The file name that will be written to @bs as the new | |
563 | * backing file if the job completes. Ignored if @base is %NULL. | |
c83c66c3 | 564 | * @speed: The maximum speed, in bytes per second, or 0 for unlimited. |
1d809098 | 565 | * @on_error: The action to take upon error. |
dc534f8f PB |
566 | * @cb: Completion function for the job. |
567 | * @opaque: Opaque pointer value passed to @cb. | |
fd7f8c65 | 568 | * @errp: Error object. |
dc534f8f PB |
569 | * |
570 | * Start a streaming operation on @bs. Clusters that are unallocated | |
571 | * in @bs, but allocated in any image between @base and @bs (both | |
572 | * exclusive) will be written to @bs. At the end of a successful | |
573 | * streaming job, the backing file of @bs will be changed to | |
574 | * @base_id in the written image and to @base in the live BlockDriverState. | |
575 | */ | |
fd7f8c65 | 576 | void stream_start(BlockDriverState *bs, BlockDriverState *base, |
1d809098 | 577 | const char *base_id, int64_t speed, BlockdevOnError on_error, |
097310b5 | 578 | BlockCompletionFunc *cb, |
fd7f8c65 | 579 | void *opaque, Error **errp); |
4f1043b4 | 580 | |
747ff602 JC |
581 | /** |
582 | * commit_start: | |
03544a6e FZ |
583 | * @bs: Active block device. |
584 | * @top: Top block device to be committed. | |
585 | * @base: Block device that will be written into, and become the new top. | |
747ff602 JC |
586 | * @speed: The maximum speed, in bytes per second, or 0 for unlimited. |
587 | * @on_error: The action to take upon error. | |
588 | * @cb: Completion function for the job. | |
589 | * @opaque: Opaque pointer value passed to @cb. | |
54e26900 | 590 | * @backing_file_str: String to use as the backing file in @top's overlay |
747ff602 JC |
591 | * @errp: Error object. |
592 | * | |
593 | */ | |
594 | void commit_start(BlockDriverState *bs, BlockDriverState *base, | |
595 | BlockDriverState *top, int64_t speed, | |
097310b5 | 596 | BlockdevOnError on_error, BlockCompletionFunc *cb, |
54e26900 | 597 | void *opaque, const char *backing_file_str, Error **errp); |
03544a6e FZ |
598 | /** |
599 | * commit_active_start: | |
600 | * @bs: Active block device to be committed. | |
601 | * @base: Block device that will be written into, and become the new top. | |
602 | * @speed: The maximum speed, in bytes per second, or 0 for unlimited. | |
603 | * @on_error: The action to take upon error. | |
604 | * @cb: Completion function for the job. | |
605 | * @opaque: Opaque pointer value passed to @cb. | |
606 | * @errp: Error object. | |
607 | * | |
608 | */ | |
609 | void commit_active_start(BlockDriverState *bs, BlockDriverState *base, | |
610 | int64_t speed, | |
611 | BlockdevOnError on_error, | |
097310b5 | 612 | BlockCompletionFunc *cb, |
03544a6e | 613 | void *opaque, Error **errp); |
893f7eba PB |
614 | /* |
615 | * mirror_start: | |
616 | * @bs: Block device to operate on. | |
617 | * @target: Block device to write to. | |
09158f00 BC |
618 | * @replaces: Block graph node name to replace once the mirror is done. Can |
619 | * only be used when full mirroring is selected. | |
893f7eba | 620 | * @speed: The maximum speed, in bytes per second, or 0 for unlimited. |
eee13dfe | 621 | * @granularity: The chosen granularity for the dirty bitmap. |
08e4ed6c | 622 | * @buf_size: The amount of data that can be in flight at one time. |
893f7eba | 623 | * @mode: Whether to collapse all images in the chain to the target. |
b952b558 PB |
624 | * @on_source_error: The action to take upon error reading from the source. |
625 | * @on_target_error: The action to take upon error writing to the target. | |
0fc9f8ea | 626 | * @unmap: Whether to unmap target where source sectors only contain zeroes. |
893f7eba PB |
627 | * @cb: Completion function for the job. |
628 | * @opaque: Opaque pointer value passed to @cb. | |
629 | * @errp: Error object. | |
630 | * | |
631 | * Start a mirroring operation on @bs. Clusters that are allocated | |
632 | * in @bs will be written to @target until the job is cancelled or | |
633 | * manually completed. At the end of a successful mirroring job, | |
634 | * @bs will be switched to read from @target. | |
635 | */ | |
636 | void mirror_start(BlockDriverState *bs, BlockDriverState *target, | |
09158f00 | 637 | const char *replaces, |
5fba6c0e | 638 | int64_t speed, uint32_t granularity, int64_t buf_size, |
08e4ed6c | 639 | MirrorSyncMode mode, BlockdevOnError on_source_error, |
b952b558 | 640 | BlockdevOnError on_target_error, |
0fc9f8ea | 641 | bool unmap, |
097310b5 | 642 | BlockCompletionFunc *cb, |
893f7eba PB |
643 | void *opaque, Error **errp); |
644 | ||
98d2c6f2 DM |
645 | /* |
646 | * backup_start: | |
647 | * @bs: Block device to operate on. | |
648 | * @target: Block device to write to. | |
649 | * @speed: The maximum speed, in bytes per second, or 0 for unlimited. | |
fc5d3f84 | 650 | * @sync_mode: What parts of the disk image should be copied to the destination. |
4b80ab2b | 651 | * @sync_bitmap: The dirty bitmap if sync_mode is MIRROR_SYNC_MODE_INCREMENTAL. |
98d2c6f2 DM |
652 | * @on_source_error: The action to take upon error reading from the source. |
653 | * @on_target_error: The action to take upon error writing to the target. | |
654 | * @cb: Completion function for the job. | |
655 | * @opaque: Opaque pointer value passed to @cb. | |
656 | * | |
657 | * Start a backup operation on @bs. Clusters in @bs are written to @target | |
658 | * until the job is cancelled or manually completed. | |
659 | */ | |
660 | void backup_start(BlockDriverState *bs, BlockDriverState *target, | |
fc5d3f84 | 661 | int64_t speed, MirrorSyncMode sync_mode, |
d58d8453 | 662 | BdrvDirtyBitmap *sync_bitmap, |
fc5d3f84 | 663 | BlockdevOnError on_source_error, |
98d2c6f2 | 664 | BlockdevOnError on_target_error, |
097310b5 | 665 | BlockCompletionFunc *cb, void *opaque, |
98d2c6f2 DM |
666 | Error **errp); |
667 | ||
a2d61900 KW |
668 | void blk_set_bs(BlockBackend *blk, BlockDriverState *bs); |
669 | ||
a7f53e26 MA |
670 | void blk_dev_change_media_cb(BlockBackend *blk, bool load); |
671 | bool blk_dev_has_removable_media(BlockBackend *blk); | |
672 | void blk_dev_eject_request(BlockBackend *blk, bool force); | |
673 | bool blk_dev_is_tray_open(BlockBackend *blk); | |
674 | bool blk_dev_is_medium_locked(BlockBackend *blk); | |
675 | void blk_dev_resize_cb(BlockBackend *blk); | |
676 | ||
e0c47b6c | 677 | void bdrv_set_dirty(BlockDriverState *bs, int64_t cur_sector, int nr_sectors); |
439db28c | 678 | bool bdrv_requests_pending(BlockDriverState *bs); |
e0c47b6c | 679 | |
ea2384d3 | 680 | #endif /* BLOCK_INT_H */ |