/*
 * QEMU System Emulator block driver
 *
 * Copyright (c) 2003 Fabrice Bellard
 *
 * Permission is hereby granted, free of charge, to any person obtaining a copy
 * of this software and associated documentation files (the "Software"), to deal
 * in the Software without restriction, including without limitation the rights
 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
 * copies of the Software, and to permit persons to whom the Software is
 * furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
 * THE SOFTWARE.
 */
#ifndef BLOCK_INT_H
#define BLOCK_INT_H

27
#include "block/accounting.h"
28
#include "block/block.h"
29
#include "block/aio-wait.h"
30
#include "qemu/queue.h"
31
#include "qemu/coroutine.h"
32
#include "qemu/stats64.h"
33
#include "qemu/timer.h"
34
#include "qemu/hbitmap.h"
35
#include "block/snapshot.h"
36
#include "qemu/main-loop.h"
37
#include "qemu/throttle.h"
P
pbrook 已提交
38

39
/* Flag bit for lazy refcounts.
 * NOTE(review): presumably passed as an image-creation flag -- confirm. */
#define BLOCK_FLAG_LAZY_REFCOUNTS   8

/* Names (string keys) of block driver options. */
#define BLOCK_OPT_SIZE              "size"
#define BLOCK_OPT_ENCRYPT           "encryption"
#define BLOCK_OPT_ENCRYPT_FORMAT    "encrypt.format"
#define BLOCK_OPT_COMPAT6           "compat6"
#define BLOCK_OPT_HWVERSION         "hwversion"
#define BLOCK_OPT_BACKING_FILE      "backing_file"
#define BLOCK_OPT_BACKING_FMT       "backing_fmt"
#define BLOCK_OPT_CLUSTER_SIZE      "cluster_size"
#define BLOCK_OPT_TABLE_SIZE        "table_size"
#define BLOCK_OPT_PREALLOC          "preallocation"
#define BLOCK_OPT_SUBFMT            "subformat"
#define BLOCK_OPT_COMPAT_LEVEL      "compat"
#define BLOCK_OPT_LAZY_REFCOUNTS    "lazy_refcounts"
#define BLOCK_OPT_ADAPTER_TYPE      "adapter_type"
#define BLOCK_OPT_REDUNDANCY        "redundancy"
#define BLOCK_OPT_NOCOW             "nocow"
#define BLOCK_OPT_OBJECT_SIZE       "object_size"
#define BLOCK_OPT_REFCOUNT_BITS     "refcount_bits"

/* NOTE(review): presumably the size in bytes of the buffer handed to
 * BlockDriver.bdrv_probe -- confirm against the caller. */
#define BLOCK_PROBE_BUF_SIZE        512

62 63 64 65 66 67
/* Kind of operation recorded in BdrvTrackedRequest.type. */
enum BdrvTrackedRequestType {
    BDRV_TRACKED_READ    = 0,
    BDRV_TRACKED_WRITE   = 1,
    BDRV_TRACKED_DISCARD = 2
};

68 69
typedef struct BdrvTrackedRequest {
    BlockDriverState *bs;
70 71
    int64_t offset;
    unsigned int bytes;
72
    enum BdrvTrackedRequestType type;
73

74
    bool serialising;
75 76 77
    int64_t overlap_offset;
    unsigned int overlap_bytes;

78 79 80
    QLIST_ENTRY(BdrvTrackedRequest) list;
    Coroutine *co; /* owner, used for deadlock detection */
    CoQueue wait_queue; /* coroutines blocked on this request */
81 82

    struct BdrvTrackedRequest *waiting_for;
83 84
} BdrvTrackedRequest;

B
bellard 已提交
85 86 87
struct BlockDriver {
    const char *format_name;
    int instance_size;
88

89 90 91 92 93
    /* set to true if the BlockDriver is a block filter. Block filters pass
     * certain callbacks that refer to data (see block.c) to their bs->file if
     * the driver doesn't implement them. Drivers that do not wish to forward
     * must implement them and return -ENOTSUP.
     */
94 95 96
    bool is_filter;
    /* for snapshots block filter like Quorum can implement the
     * following recursive callback.
97 98 99
     * It's purpose is to recurse on the filter children while calling
     * bdrv_recurse_is_first_non_filter on them.
     * For a sample implementation look in the future Quorum block filter.
100
     */
101 102
    bool (*bdrv_recurse_is_first_non_filter)(BlockDriverState *bs,
                                             BlockDriverState *candidate);
103

B
bellard 已提交
104
    int (*bdrv_probe)(const uint8_t *buf, int buf_size, const char *filename);
105
    int (*bdrv_probe_device)(const char *filename);
106 107 108

    /* Any driver implementing this callback is expected to be able to handle
     * NULL file names in its .bdrv_open() implementation */
109
    void (*bdrv_parse_filename)(const char *filename, QDict *options, Error **errp);
110 111 112 113 114 115
    /* Drivers not implementing bdrv_parse_filename nor bdrv_open should have
     * this field set to true, except ones that are defined only by their
     * child's bs.
     * An example of the last type will be the quorum block driver.
     */
    bool bdrv_needs_filename;
116

117 118 119
    /* Set if a driver can support backing files */
    bool supports_backing;

120 121 122 123 124
    /* For handling image reopen for split or non-split files */
    int (*bdrv_reopen_prepare)(BDRVReopenState *reopen_state,
                               BlockReopenQueue *queue, Error **errp);
    void (*bdrv_reopen_commit)(BDRVReopenState *reopen_state);
    void (*bdrv_reopen_abort)(BDRVReopenState *reopen_state);
125
    void (*bdrv_join_options)(QDict *options, QDict *old_options);
126

M
Max Reitz 已提交
127 128
    int (*bdrv_open)(BlockDriverState *bs, QDict *options, int flags,
                     Error **errp);
129 130

    /* Protocol drivers should implement this instead of bdrv_open */
M
Max Reitz 已提交
131 132
    int (*bdrv_file_open)(BlockDriverState *bs, QDict *options, int flags,
                          Error **errp);
B
bellard 已提交
133
    void (*bdrv_close)(BlockDriverState *bs);
134
    int coroutine_fn (*bdrv_co_create)(BlockdevCreateOptions *opts,
135
                                       Error **errp);
136 137 138
    int coroutine_fn (*bdrv_co_create_opts)(const char *filename,
                                            QemuOpts *opts,
                                            Error **errp);
139
    int (*bdrv_make_empty)(BlockDriverState *bs);
M
Max Reitz 已提交
140

141
    void (*bdrv_refresh_filename)(BlockDriverState *bs, QDict *options);
M
Max Reitz 已提交
142

B
bellard 已提交
143
    /* aio */
144
    BlockAIOCB *(*bdrv_aio_readv)(BlockDriverState *bs,
145
        int64_t sector_num, QEMUIOVector *qiov, int nb_sectors,
146
        BlockCompletionFunc *cb, void *opaque);
147
    BlockAIOCB *(*bdrv_aio_writev)(BlockDriverState *bs,
148
        int64_t sector_num, QEMUIOVector *qiov, int nb_sectors,
149
        BlockCompletionFunc *cb, void *opaque);
150
    BlockAIOCB *(*bdrv_aio_flush)(BlockDriverState *bs,
151
        BlockCompletionFunc *cb, void *opaque);
152
    BlockAIOCB *(*bdrv_aio_pdiscard)(BlockDriverState *bs,
153
        int64_t offset, int bytes,
154
        BlockCompletionFunc *cb, void *opaque);
B
bellard 已提交
155

K
Kevin Wolf 已提交
156 157
    int coroutine_fn (*bdrv_co_readv)(BlockDriverState *bs,
        int64_t sector_num, int nb_sectors, QEMUIOVector *qiov);
158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173

    /**
     * @offset: position in bytes to read at
     * @bytes: number of bytes to read
     * @qiov: the buffers to fill with read data
     * @flags: currently unused, always 0
     *
     * @offset and @bytes will be a multiple of 'request_alignment',
     * but the length of individual @qiov elements does not have to
     * be a multiple.
     *
     * @bytes will always equal the total size of @qiov, and will be
     * no larger than 'max_transfer'.
     *
     * The buffer in @qiov may point directly to guest memory.
     */
174 175
    int coroutine_fn (*bdrv_co_preadv)(BlockDriverState *bs,
        uint64_t offset, uint64_t bytes, QEMUIOVector *qiov, int flags);
K
Kevin Wolf 已提交
176 177
    int coroutine_fn (*bdrv_co_writev)(BlockDriverState *bs,
        int64_t sector_num, int nb_sectors, QEMUIOVector *qiov);
178 179
    int coroutine_fn (*bdrv_co_writev_flags)(BlockDriverState *bs,
        int64_t sector_num, int nb_sectors, QEMUIOVector *qiov, int flags);
180 181 182 183 184 185 186 187 188 189 190 191 192 193 194
    /**
     * @offset: position in bytes to write at
     * @bytes: number of bytes to write
     * @qiov: the buffers containing data to write
     * @flags: zero or more bits allowed by 'supported_write_flags'
     *
     * @offset and @bytes will be a multiple of 'request_alignment',
     * but the length of individual @qiov elements does not have to
     * be a multiple.
     *
     * @bytes will always equal the total size of @qiov, and will be
     * no larger than 'max_transfer'.
     *
     * The buffer in @qiov may point directly to guest memory.
     */
195 196
    int coroutine_fn (*bdrv_co_pwritev)(BlockDriverState *bs,
        uint64_t offset, uint64_t bytes, QEMUIOVector *qiov, int flags);
197

198 199 200
    /*
     * Efficiently zero a region of the disk image.  Typically an image format
     * would use a compact metadata representation to implement this.  This
201 202
     * function pointer may be NULL or return -ENOSUP and .bdrv_co_writev()
     * will be called instead.
203
     */
E
Eric Blake 已提交
204
    int coroutine_fn (*bdrv_co_pwrite_zeroes)(BlockDriverState *bs,
205
        int64_t offset, int bytes, BdrvRequestFlags flags);
206
    int coroutine_fn (*bdrv_co_pdiscard)(BlockDriverState *bs,
207
        int64_t offset, int bytes);
208 209

    /*
210 211
     * Building block for bdrv_block_status[_above] and
     * bdrv_is_allocated[_above].  The driver should answer only
212 213 214 215 216 217 218 219 220 221 222 223
     * according to the current layer, and should only need to set
     * BDRV_BLOCK_DATA, BDRV_BLOCK_ZERO, BDRV_BLOCK_OFFSET_VALID,
     * and/or BDRV_BLOCK_RAW; if the current layer defers to a backing
     * layer, the result should be 0 (and not BDRV_BLOCK_ZERO).  See
     * block.h for the overall meaning of the bits.  As a hint, the
     * flag want_zero is true if the caller cares more about precise
     * mappings (favor accurate _OFFSET_VALID/_ZERO) or false for
     * overall allocation (favor larger *pnum, perhaps by reporting
     * _DATA instead of _ZERO).  The block layer guarantees input
     * clamped to bdrv_getlength() and aligned to request_alignment,
     * as well as non-NULL pnum, map, and file; in turn, the driver
     * must return an error or set pnum to an aligned non-zero value.
224
     */
225 226 227
    int coroutine_fn (*bdrv_co_block_status)(BlockDriverState *bs,
        bool want_zero, int64_t offset, int64_t bytes, int64_t *pnum,
        int64_t *map, BlockDriverState **file);
K
Kevin Wolf 已提交
228

229 230 231
    /*
     * Invalidate any cached meta-data.
     */
232 233
    void coroutine_fn (*bdrv_co_invalidate_cache)(BlockDriverState *bs,
                                                  Error **errp);
234
    int (*bdrv_inactivate)(BlockDriverState *bs);
235

P
Pavel Dovgalyuk 已提交
236 237 238 239 240 241 242
    /*
     * Flushes all data for all layers by calling bdrv_co_flush for underlying
     * layers, if needed. This function is needed for deterministic
     * synchronization of the flush finishing callback.
     */
    int coroutine_fn (*bdrv_co_flush)(BlockDriverState *bs);

243 244
    /*
     * Flushes all data that was already written to the OS all the way down to
245
     * the disk (for example file-posix.c calls fsync()).
246 247 248
     */
    int coroutine_fn (*bdrv_co_flush_to_disk)(BlockDriverState *bs);

K
Kevin Wolf 已提交
249 250 251 252 253 254 255
    /*
     * Flushes all internal caches to the OS. The data may still sit in a
     * writeback cache of the host OS, but it will survive a crash of the qemu
     * process.
     */
    int coroutine_fn (*bdrv_co_flush_to_os)(BlockDriverState *bs);

256 257 258 259 260 261
    /*
     * Drivers setting this field must be able to work with just a plain
     * filename with '<protocol_name>:' as a prefix, and no other options.
     * Options may be extracted from the filename by implementing
     * bdrv_parse_filename.
     */
B
bellard 已提交
262
    const char *protocol_name;
263 264
    int (*bdrv_truncate)(BlockDriverState *bs, int64_t offset,
                         PreallocMode prealloc, Error **errp);
265

B
bellard 已提交
266
    int64_t (*bdrv_getlength)(BlockDriverState *bs);
267
    bool has_variable_length;
268
    int64_t (*bdrv_get_allocated_file_size)(BlockDriverState *bs);
S
Stefan Hajnoczi 已提交
269 270
    BlockMeasureInfo *(*bdrv_measure)(QemuOpts *opts, BlockDriverState *in_bs,
                                      Error **errp);
271

272 273 274
    int coroutine_fn (*bdrv_co_pwritev_compressed)(BlockDriverState *bs,
        uint64_t offset, uint64_t bytes, QEMUIOVector *qiov);

275
    int (*bdrv_snapshot_create)(BlockDriverState *bs,
B
bellard 已提交
276
                                QEMUSnapshotInfo *sn_info);
277
    int (*bdrv_snapshot_goto)(BlockDriverState *bs,
B
bellard 已提交
278
                              const char *snapshot_id);
279 280 281 282
    int (*bdrv_snapshot_delete)(BlockDriverState *bs,
                                const char *snapshot_id,
                                const char *name,
                                Error **errp);
283
    int (*bdrv_snapshot_list)(BlockDriverState *bs,
B
bellard 已提交
284
                              QEMUSnapshotInfo **psn_info);
E
edison 已提交
285
    int (*bdrv_snapshot_load_tmp)(BlockDriverState *bs,
286 287 288
                                  const char *snapshot_id,
                                  const char *name,
                                  Error **errp);
B
bellard 已提交
289
    int (*bdrv_get_info)(BlockDriverState *bs, BlockDriverInfo *bdi);
M
Max Reitz 已提交
290
    ImageInfoSpecific *(*bdrv_get_specific_info)(BlockDriverState *bs);
B
bellard 已提交
291

292 293 294 295 296 297
    int coroutine_fn (*bdrv_save_vmstate)(BlockDriverState *bs,
                                          QEMUIOVector *qiov,
                                          int64_t pos);
    int coroutine_fn (*bdrv_load_vmstate)(BlockDriverState *bs,
                                          QEMUIOVector *qiov,
                                          int64_t pos);
298

K
Kevin Wolf 已提交
299 300 301
    int (*bdrv_change_backing_file)(BlockDriverState *bs,
        const char *backing_file, const char *backing_fmt);

B
bellard 已提交
302
    /* removable device specific */
303
    bool (*bdrv_is_inserted)(BlockDriverState *bs);
304
    void (*bdrv_eject)(BlockDriverState *bs, bool eject_flag);
305
    void (*bdrv_lock_medium)(BlockDriverState *bs, bool locked);
306

307
    /* to control generic scsi devices */
308
    BlockAIOCB *(*bdrv_aio_ioctl)(BlockDriverState *bs,
309
        unsigned long int req, void *buf,
310
        BlockCompletionFunc *cb, void *opaque);
311 312
    int coroutine_fn (*bdrv_co_ioctl)(BlockDriverState *bs,
                                      unsigned long int req, void *buf);
313

314
    /* List of options for creating images, terminated by name == NULL */
315
    QemuOptsList *create_opts;
316

317 318 319 320
    /*
     * Returns 0 for completed check, -errno for internal errors.
     * The check results are stored in result.
     */
321 322 323
    int coroutine_fn (*bdrv_co_check)(BlockDriverState *bs,
                                      BdrvCheckResult *result,
                                      BdrvCheckMode fix);
A
aliguori 已提交
324

325
    int (*bdrv_amend_options)(BlockDriverState *bs, QemuOpts *opts,
326 327
                              BlockDriverAmendStatusCB *status_cb,
                              void *cb_opaque);
M
Max Reitz 已提交
328

329
    void (*bdrv_debug_event)(BlockDriverState *bs, BlkdebugEvent event);
K
Kevin Wolf 已提交
330

K
Kevin Wolf 已提交
331 332 333
    /* TODO Better pass a option string/QDict/QemuOpts to add any rule? */
    int (*bdrv_debug_breakpoint)(BlockDriverState *bs, const char *event,
        const char *tag);
F
Fam Zheng 已提交
334 335
    int (*bdrv_debug_remove_breakpoint)(BlockDriverState *bs,
        const char *tag);
K
Kevin Wolf 已提交
336 337 338
    int (*bdrv_debug_resume)(BlockDriverState *bs, const char *tag);
    bool (*bdrv_debug_is_suspended)(BlockDriverState *bs, const char *tag);

339
    void (*bdrv_refresh_limits)(BlockDriverState *bs, Error **errp);
340

K
Kevin Wolf 已提交
341 342 343 344 345
    /*
     * Returns 1 if newly created images are guaranteed to contain only
     * zeros, 0 otherwise.
     */
    int (*bdrv_has_zero_init)(BlockDriverState *bs);
346

347 348 349 350 351 352 353 354 355 356 357 358 359
    /* Remove fd handlers, timers, and other event loop callbacks so the event
     * loop is no longer in use.  Called with no in-flight requests and in
     * depth-first traversal order with parents before child nodes.
     */
    void (*bdrv_detach_aio_context)(BlockDriverState *bs);

    /* Add fd handlers, timers, and other event loop callbacks so I/O requests
     * can be processed again.  Called with no in-flight requests and in
     * depth-first traversal order with child nodes before parent nodes.
     */
    void (*bdrv_attach_aio_context)(BlockDriverState *bs,
                                    AioContext *new_context);

360 361 362 363
    /* io queue for linux-aio */
    void (*bdrv_io_plug)(BlockDriverState *bs);
    void (*bdrv_io_unplug)(BlockDriverState *bs);

364 365 366 367 368 369 370 371 372 373 374 375 376 377 378
    /**
     * Try to get @bs's logical and physical block size.
     * On success, store them in @bsz and return zero.
     * On failure, return negative errno.
     */
    int (*bdrv_probe_blocksizes)(BlockDriverState *bs, BlockSizes *bsz);
    /**
     * Try to get @bs's geometry (cyls, heads, sectors)
     * On success, store them in @geo and return 0.
     * On failure return -errno.
     * Only drivers that want to override guest geometry implement this
     * callback; see hd_geometry_guess().
     */
    int (*bdrv_probe_geometry)(BlockDriverState *bs, HDGeometry *geo);

379
    /**
380
     * bdrv_co_drain_begin is called if implemented in the beginning of a
381 382 383 384 385 386 387
     * drain operation to drain and stop any internal sources of requests in
     * the driver.
     * bdrv_co_drain_end is called if implemented at the end of the drain.
     *
     * They should be used by the driver to e.g. manage scheduled I/O
     * requests, or toggle an internal state. After the end of the drain new
     * requests will continue normally.
388
     */
389
    void coroutine_fn (*bdrv_co_drain_begin)(BlockDriverState *bs);
390
    void coroutine_fn (*bdrv_co_drain_end)(BlockDriverState *bs);
391

392 393 394 395 396
    void (*bdrv_add_child)(BlockDriverState *parent, BlockDriverState *child,
                           Error **errp);
    void (*bdrv_del_child)(BlockDriverState *parent, BdrvChild *child,
                           Error **errp);

397 398 399 400 401 402 403 404 405 406 407 408 409 410 411 412 413 414 415 416 417 418 419 420 421 422 423 424 425 426 427 428 429 430 431 432 433 434 435 436 437 438 439 440 441 442 443
    /**
     * Informs the block driver that a permission change is intended. The
     * driver checks whether the change is permissible and may take other
     * preparations for the change (e.g. get file system locks). This operation
     * is always followed either by a call to either .bdrv_set_perm or
     * .bdrv_abort_perm_update.
     *
     * Checks whether the requested set of cumulative permissions in @perm
     * can be granted for accessing @bs and whether no other users are using
     * permissions other than those given in @shared (both arguments take
     * BLK_PERM_* bitmasks).
     *
     * If both conditions are met, 0 is returned. Otherwise, -errno is returned
     * and errp is set to an error describing the conflict.
     */
    int (*bdrv_check_perm)(BlockDriverState *bs, uint64_t perm,
                           uint64_t shared, Error **errp);

    /**
     * Called to inform the driver that the set of cumulative set of used
     * permissions for @bs has changed to @perm, and the set of sharable
     * permission to @shared. The driver can use this to propagate changes to
     * its children (i.e. request permissions only if a parent actually needs
     * them).
     *
     * This function is only invoked after bdrv_check_perm(), so block drivers
     * may rely on preparations made in their .bdrv_check_perm implementation.
     */
    void (*bdrv_set_perm)(BlockDriverState *bs, uint64_t perm, uint64_t shared);

    /*
     * Called to inform the driver that after a previous bdrv_check_perm()
     * call, the permission update is not performed and any preparations made
     * for it (e.g. taken file locks) need to be undone.
     *
     * This function can be called even for nodes that never saw a
     * bdrv_check_perm() call. It is a no-op then.
     */
    void (*bdrv_abort_perm_update)(BlockDriverState *bs);

    /**
     * Returns in @nperm and @nshared the permissions that the driver for @bs
     * needs on its child @c, based on the cumulative permissions requested by
     * the parents in @parent_perm and @parent_shared.
     *
     * If @c is NULL, return the permissions for attaching a new child for the
     * given @role.
444 445 446 447
     *
     * If @reopen_queue is non-NULL, don't return the currently needed
     * permissions, but those that will be needed after applying the
     * @reopen_queue.
448 449 450
     */
     void (*bdrv_child_perm)(BlockDriverState *bs, BdrvChild *c,
                             const BdrvChildRole *role,
451
                             BlockReopenQueue *reopen_queue,
452 453 454
                             uint64_t parent_perm, uint64_t parent_shared,
                             uint64_t *nperm, uint64_t *nshared);

455 456 457 458 459 460
    /**
     * Bitmaps should be marked as 'IN_USE' in the image on reopening image
     * as rw. This handler should realize it. It also should unset readonly
     * field of BlockDirtyBitmap's in case of success.
     */
    int (*bdrv_reopen_bitmaps_rw)(BlockDriverState *bs, Error **errp);
461 462 463 464
    bool (*bdrv_can_store_new_dirty_bitmap)(BlockDriverState *bs,
                                            const char *name,
                                            uint32_t granularity,
                                            Error **errp);
465 466 467
    void (*bdrv_remove_persistent_dirty_bitmap)(BlockDriverState *bs,
                                                const char *name,
                                                Error **errp);
468

F
Fam Zheng 已提交
469 470 471 472 473 474 475 476 477
    /**
     * Register/unregister a buffer for I/O. For example, when the driver is
     * interested to know the memory areas that will later be used in iovs, so
     * that it can do IOMMU mapping with VFIO etc., in order to get better
     * performance. In the case of VFIO drivers, this callback is used to do
     * DMA mapping for hot buffers.
     */
    void (*bdrv_register_buf)(BlockDriverState *bs, void *host, size_t size);
    void (*bdrv_unregister_buf)(BlockDriverState *bs, void *host);
478
    QLIST_ENTRY(BlockDriver) list;
B
bellard 已提交
479 480
};

481
/*
 * I/O limits and alignment hints.  Per the member comments, a value of 0
 * means "no limit" or "no preference" where that is stated.
 */
typedef struct BlockLimits {
    /* Alignment requirement, in bytes, for offset/length of I/O
     * requests. Must be a power of 2 less than INT_MAX; defaults to
     * 1 for drivers with modern byte interfaces, and to 512
     * otherwise. */
    uint32_t request_alignment;

    /* Maximum number of bytes that can be discarded at once (since it
     * is signed, it must be < 2G, if set). Must be multiple of
     * pdiscard_alignment, but need not be power of 2. May be 0 if no
     * inherent 32-bit limit */
    int32_t max_pdiscard;

    /* Optimal alignment for discard requests in bytes. A power of 2
     * is best but not mandatory.  Must be a multiple of
     * bl.request_alignment, and must be less than max_pdiscard if
     * that is set. May be 0 if bl.request_alignment is good enough */
    uint32_t pdiscard_alignment;

    /* Maximum number of bytes that can be zeroized at once (since it is
     * signed, it must be < 2G, if set). Must be multiple of
     * pwrite_zeroes_alignment. May be 0 if no inherent 32-bit limit */
    int32_t max_pwrite_zeroes;

    /* Optimal alignment for write zeroes requests in bytes. A power
     * of 2 is best but not mandatory.  Must be a multiple of
     * bl.request_alignment, and must be less than max_pwrite_zeroes
     * if that is set. May be 0 if bl.request_alignment is good
     * enough */
    uint32_t pwrite_zeroes_alignment;

    /* Optimal transfer length in bytes.  A power of 2 is best but not
     * mandatory.  Must be a multiple of bl.request_alignment, or 0 if
     * no preferred size */
    uint32_t opt_transfer;

    /* Maximal transfer length in bytes.  Need not be power of 2, but
     * must be multiple of opt_transfer and bl.request_alignment, or 0
     * for no 32-bit limit.  For now, anything larger than INT_MAX is
     * clamped down. */
    uint32_t max_transfer;

    /* memory alignment, in bytes so that no bounce buffer is needed */
    size_t min_mem_alignment;

    /* memory alignment, in bytes, for bounce buffer */
    size_t opt_mem_alignment;

    /* maximum number of iovec elements */
    int max_iov;
} BlockLimits;

533 534
/* Forward declaration only; the struct body is not defined at this point in
 * the header. */
typedef struct BdrvOpBlocker BdrvOpBlocker;

M
Max Reitz 已提交
535 536 537 538 539
typedef struct BdrvAioNotifier {
    void (*attached_aio_context)(AioContext *new_context, void *opaque);
    void (*detach_aio_context)(void *opaque);

    void *opaque;
540
    bool deleted;
M
Max Reitz 已提交
541 542 543 544

    QLIST_ENTRY(BdrvAioNotifier) list;
} BdrvAioNotifier;

545
struct BdrvChildRole {
546 547
    /* If true, bdrv_replace_node() doesn't change the node this BdrvChild
     * points to. */
548 549
    bool stay_at_node;

550 551
    void (*inherit_options)(int *child_flags, QDict *child_options,
                            int parent_flags, QDict *parent_options);
552

553 554 555
    void (*change_media)(BdrvChild *child, bool load);
    void (*resize)(BdrvChild *child);

556 557 558
    /* Returns a name that is supposedly more useful for human users than the
     * node name for identifying the node in question (in particular, a BB
     * name), or NULL if the parent can't provide a better name. */
559
    const char *(*get_name)(BdrvChild *child);
560

561 562 563 564
    /* Returns a malloced string that describes the parent of the child for a
     * human reader. This could be a node-name, BlockBackend name, qdev ID or
     * QOM path of the device owning the BlockBackend, job type and ID etc. The
     * caller is responsible for freeing the memory. */
565
    char *(*get_parent_desc)(BdrvChild *child);
566

567 568 569 570 571 572 573 574 575 576
    /*
     * If this pair of functions is implemented, the parent doesn't issue new
     * requests after returning from .drained_begin() until .drained_end() is
     * called.
     *
     * Note that this can be nested. If drained_begin() was called twice, new
     * I/O is allowed only after drained_end() was called twice, too.
     */
    void (*drained_begin)(BdrvChild *child);
    void (*drained_end)(BdrvChild *child);
577

578 579 580
    /* Notifies the parent that the child has been activated/inactivated (e.g.
     * when migration is completing) and it can start/stop requesting
     * permissions and doing I/O on it. */
581
    void (*activate)(BdrvChild *child, Error **errp);
582
    int (*inactivate)(BdrvChild *child);
583

584 585
    void (*attach)(BdrvChild *child);
    void (*detach)(BdrvChild *child);
586 587 588 589 590 591

    /* Notifies the parent that the filename of its child has changed (e.g.
     * because the direct child was removed from the backing chain), so that it
     * can update its reference. */
    int (*update_filename)(BdrvChild *child, BlockDriverState *new_base,
                           const char *filename, Error **errp);
592 593 594 595
};

/* Child role descriptors; declared here, defined outside this header. */
extern const BdrvChildRole child_file;
extern const BdrvChildRole child_format;
extern const BdrvChildRole child_backing;
597

K
Kevin Wolf 已提交
598
struct BdrvChild {
599
    BlockDriverState *bs;
600
    char *name;
601
    const BdrvChildRole *role;
K
Kevin Wolf 已提交
602
    void *opaque;
603 604 605 606 607 608 609 610 611 612 613 614

    /**
     * Granted permissions for operating on this BdrvChild (BLK_PERM_* bitmask)
     */
    uint64_t perm;

    /**
     * Permissions that can still be granted to other users of @bs while this
     * BdrvChild is still attached to it. (BLK_PERM_* bitmask)
     */
    uint64_t shared_perm;

615
    QLIST_ENTRY(BdrvChild) next;
K
Kevin Wolf 已提交
616
    QLIST_ENTRY(BdrvChild) next_parent;
K
Kevin Wolf 已提交
617
};
618

619 620 621 622 623 624
/*
 * Note: the function bdrv_append() copies and swaps contents of
 * BlockDriverStates, so if you add new fields to this struct, please
 * inspect bdrv_append() to determine if the new fields need to be
 * copied as well.
 */
B
bellard 已提交
625
struct BlockDriverState {
626 627 628
    /* Protected by big QEMU lock or read-only after opening.  No special
     * locking needed during I/O...
     */
629
    int open_flags; /* flags used to open the file, re-used for re-open */
630 631 632 633
    bool read_only; /* if true, the media is read only */
    bool encrypted; /* if true, the media is encrypted */
    bool sg;        /* if true, the device is a /dev/sg* */
    bool probed;    /* if true, format was probed rather than specified */
634
    bool force_share; /* if true, always allow all shared permissions */
635
    bool implicit;  /* if true, this filter node was automatically inserted */
636

B
bellard 已提交
637
    BlockDriver *drv; /* NULL means no media */
B
bellard 已提交
638 639
    void *opaque;

640
    AioContext *aio_context; /* event loop used for fd handlers, timers, etc */
M
Max Reitz 已提交
641 642 643 644
    /* long-running tasks intended to always use the same AioContext as this
     * BDS may register themselves in this list to be notified of changes
     * regarding this BDS's context */
    QLIST_HEAD(, BdrvAioNotifier) aio_notifiers;
645
    bool walking_aio_notifiers; /* to make removal during iteration safe */
646

647 648 649
    char filename[PATH_MAX];
    char backing_file[PATH_MAX]; /* if non zero, the image is a diff of
                                    this file image */
650
    char backing_format[16]; /* if non-zero and backing_file exists */
B
bellard 已提交
651

M
Max Reitz 已提交
652
    QDict *full_open_options;
653
    char exact_filename[PATH_MAX];
M
Max Reitz 已提交
654

655
    BdrvChild *backing;
K
Kevin Wolf 已提交
656
    BdrvChild *file;
657

658 659 660
    /* I/O Limits */
    BlockLimits bl;

661 662
    /* Flags honored during pwrite (so far: BDRV_REQ_FUA) */
    unsigned int supported_write_flags;
E
Eric Blake 已提交
663
    /* Flags honored during pwrite_zeroes (so far: BDRV_REQ_FUA,
664 665
     * BDRV_REQ_MAY_UNMAP) */
    unsigned int supported_zero_flags;
666

667 668 669 670
    /* the following member gives a name to every node on the bs graph. */
    char node_name[32];
    /* element of the list of named nodes building the graph */
    QTAILQ_ENTRY(BlockDriverState) node_list;
671 672
    /* element of the list of all BlockDriverStates (all_bdrv_states) */
    QTAILQ_ENTRY(BlockDriverState) bs_list;
673 674
    /* element of the list of monitor-owned BDS */
    QTAILQ_ENTRY(BlockDriverState) monitor_list;
675
    int refcnt;
S
Stefan Hajnoczi 已提交
676

677 678 679
    /* operation blockers */
    QLIST_HEAD(, BdrvOpBlocker) op_blockers[BLOCK_OP_TYPE_MAX];

680 681
    /* long-running background operation */
    BlockJob *job;
682

683 684 685 686
    /* The node that this node inherited default options from (and a reopen on
     * which can affect this node by changing these defaults). This is always a
     * parent node of this node. */
    BlockDriverState *inherits_from;
687
    QLIST_HEAD(, BdrvChild) children;
K
Kevin Wolf 已提交
688
    QLIST_HEAD(, BdrvChild) parents;
689

690
    QDict *options;
K
Kevin Wolf 已提交
691
    QDict *explicit_options;
692
    BlockdevDetectZeroesOptions detect_zeroes;
693 694 695

    /* The error object in use for blocking operations on backing_hd */
    Error *backing_blocker;
696

697 698 699
    /* Protected by AioContext lock */

    /* If we are reading a disk image, give its size in sectors.
700 701
     * Generally read-only; it is written to by load_snapshot and
     * save_snaphost, but the block layer is quiescent during those.
702 703 704 705 706 707
     */
    int64_t total_sectors;

    /* Callback before write request is processed */
    NotifierWithReturnList before_write_notifiers;

708 709 710
    /* threshold limit for writes, in bytes. "High water mark". */
    uint64_t write_threshold_offset;
    NotifierWithReturn write_threshold_notifier;
711

712 713
    /* Writing to the list requires the BQL _and_ the dirty_bitmap_mutex.
     * Reading from the list can be done with either the BQL or the
714 715
     * dirty_bitmap_mutex.  Modifying a bitmap only requires
     * dirty_bitmap_mutex.  */
716
    QemuMutex dirty_bitmap_mutex;
717 718
    QLIST_HEAD(, BdrvDirtyBitmap) dirty_bitmaps;

719 720 721
    /* Offset after the highest byte written to */
    Stat64 wr_highest_offset;

722 723 724 725 726 727
    /* If true, copy read backing sectors into image.  Can be >1 if more
     * than one client has requested copy-on-read.  Accessed with atomic
     * ops.
     */
    int copy_on_read;

728 729 730 731 732 733
    /* number of in-flight requests; overall and serialising.
     * Accessed with atomic ops.
     */
    unsigned int in_flight;
    unsigned int serialising_in_flight;

734 735
    /* Kicked to signal main loop when a request completes. */
    AioWait wait;
736

737 738 739 740 741
    /* counter for nested bdrv_io_plug.
     * Accessed with atomic ops.
    */
    unsigned io_plugged;

742 743 744
    /* do we need to tell the quest if we have a volatile write cache? */
    int enable_write_cache;

745
    /* Accessed with atomic ops.  */
746
    int quiesce_counter;
747 748
    int recursive_quiesce_counter;

749
    unsigned int write_gen;               /* Current data generation */
750 751 752 753 754 755 756 757 758

    /* Protected by reqs_lock.  */
    CoMutex reqs_lock;
    QLIST_HEAD(, BdrvTrackedRequest) tracked_requests;
    CoQueue flush_queue;                  /* Serializing flush queue */
    bool active_flush_req;                /* Flush request in flight? */

    /* Only read/written by whoever has set active_flush_req to true.  */
    unsigned int flushed_gen;             /* Flushed write generation */
B
bellard 已提交
759 760
};

M
Max Reitz 已提交
761 762 763 764 765 766
/*
 * Bundle of open flags, read-only state and zero-detection mode.  The three
 * members have the same names and types as the corresponding
 * BlockDriverState fields.
 * NOTE(review): presumably the state a BlockBackend keeps for its root node
 * while no BlockDriverState is attached -- confirm against block-backend.c.
 */
struct BlockBackendRootState {
    int open_flags;
    bool read_only;
    BlockdevDetectZeroesOptions detect_zeroes;
};

M
Max Reitz 已提交
767 768 769 770 771 772 773 774 775 776 777 778 779 780
/*
 * Selects how the target's backing chain is established after a mirror job
 * completes; passed to mirror_start() as @backing_mode.
 */
typedef enum BlockMirrorBackingMode {
    /* Reuse the existing backing chain from the source for the target.
     * - sync=full: Set backing BDS to NULL.
     * - sync=top:  Use source's backing BDS.
     * - sync=none: Use source as the backing BDS. */
    MIRROR_SOURCE_BACKING_CHAIN,

    /* Open the target's backing chain completely anew */
    MIRROR_OPEN_BACKING_CHAIN,

    /* Do not change the target's backing BDS after job completion */
    MIRROR_LEAVE_BACKING_CHAIN,
} BlockMirrorBackingMode;

781 782 783 784 785
/*
 * Return the node referenced by @bs's backing child, or NULL when @bs has no
 * backing child.  @bs itself must not be NULL.
 */
static inline BlockDriverState *backing_bs(BlockDriverState *bs)
{
    BdrvChild *backing_child = bs->backing;

    if (!backing_child) {
        return NULL;
    }
    return backing_child->bs;
}

786 787 788 789 790 791 792

/*
 * Essential block drivers which must always be statically linked into qemu,
 * and which therefore can be accessed without using bdrv_find_format().
 * Only declared here; the definitions live in the respective drivers.
 */
extern BlockDriver bdrv_file;
extern BlockDriver bdrv_raw;
extern BlockDriver bdrv_qcow2;

793
int coroutine_fn bdrv_co_preadv(BdrvChild *child,
794 795
    int64_t offset, unsigned int bytes, QEMUIOVector *qiov,
    BdrvRequestFlags flags);
796
int coroutine_fn bdrv_co_pwritev(BdrvChild *child,
797 798
    int64_t offset, unsigned int bytes, QEMUIOVector *qiov,
    BdrvRequestFlags flags);
799

800 801 802
/*
 * NOTE(review): judging by the names, these apply (respectively undo) on
 * @child the subtree drain sections currently in effect on the parent node
 * when a child is attached to / detached from it -- confirm against
 * block/io.c before relying on this.
 */
void bdrv_apply_subtree_drain(BdrvChild *child, BlockDriverState *new_parent);
void bdrv_unapply_subtree_drain(BdrvChild *child, BlockDriverState *old_parent);

803
int get_tmp_filename(char *filename, int size);
804 805
BlockDriver *bdrv_probe_all(const uint8_t *buf, int buf_size,
                            const char *filename);
806

807 808 809
/*
 * NOTE(review): judging by the name, strips @prefix from @filename and
 * stores the result in @options -- confirm which option key is written.
 */
void bdrv_parse_filename_strip_prefix(const char *filename, const char *prefix,
                                      QDict *options);

810

811 812 813 814 815 816 817 818 819
/**
 * bdrv_add_before_write_notifier:
 * @bs: The node whose write requests should be observed.
 * @notifier: The callback to register (presumably added to
 * @bs->before_write_notifiers -- confirm).
 *
 * Register a callback that is invoked before write requests are processed but
 * after any throttling or waiting for overlapping requests.
 */
void bdrv_add_before_write_notifier(BlockDriverState *bs,
                                    NotifierWithReturn *notifier);

820 821 822 823 824
/**
 * bdrv_detach_aio_context:
 * @bs: The node whose children are to be detached.
 *
 * May be called from .bdrv_detach_aio_context() to detach children from the
 * current #AioContext.  This is only needed by block drivers that manage their
 * own children.  Both ->file and ->backing are automatically handled and
 * block drivers should not call this function on them explicitly.
 */
void bdrv_detach_aio_context(BlockDriverState *bs);

/**
 * bdrv_attach_aio_context:
 * @bs: The node whose children are to be attached.
 * @new_context: The #AioContext to attach to.
 *
 * May be called from .bdrv_attach_aio_context() to attach children to the new
 * #AioContext.  This is only needed by block drivers that manage their own
 * children.  Both ->file and ->backing are automatically handled and block
 * drivers should not call this function on them explicitly.
 */
void bdrv_attach_aio_context(BlockDriverState *bs,
                             AioContext *new_context);

M
Max Reitz 已提交
841 842 843 844 845 846 847 848 849 850 851 852 853 854 855 856 857 858 859 860 861 862 863 864 865 866 867 868
/**
 * bdrv_add_aio_context_notifier:
 * @bs: The BDS whose AioContext association should be watched.
 * @attached_aio_context: Callback for the "attached" event, see below.
 * @detach_aio_context: Callback for the "detach" event, see below.
 * @opaque: Pointer handed to both callbacks.
 *
 * If a long-running job intends to be always run in the same AioContext as a
 * certain BDS, it may use this function to be notified of changes regarding the
 * association of the BDS to an AioContext.
 *
 * attached_aio_context() is called after the target BDS has been attached to a
 * new AioContext; detach_aio_context() is called before the target BDS is being
 * detached from its old AioContext.
 *
 * The same three values must be passed to bdrv_remove_aio_context_notifier()
 * to unregister again.
 */
void bdrv_add_aio_context_notifier(BlockDriverState *bs,
        void (*attached_aio_context)(AioContext *new_context, void *opaque),
        void (*detach_aio_context)(void *opaque), void *opaque);

/**
 * bdrv_remove_aio_context_notifier:
 *
 * Unsubscribe from change notifications regarding the BDS's AioContext. The
 * parameters given here have to be the same as those given to
 * bdrv_add_aio_context_notifier().
 */
void bdrv_remove_aio_context_notifier(BlockDriverState *bs,
                                      void (*aio_context_attached)(AioContext *,
                                                                   void *),
                                      void (*aio_context_detached)(void *),
                                      void *opaque);

869 870 871 872 873 874 875 876 877 878 879 880 881 882 883
/**
 * bdrv_wakeup:
 * @bs: The BlockDriverState for which an I/O operation has been completed.
 *
 * Wake up the main thread if it is waiting on BDRV_POLL_WHILE.  During
 * synchronous I/O on a BlockDriverState that is attached to another
 * I/O thread, the main thread lets the I/O thread's event loop run,
 * waiting for the I/O operation to complete.  A bdrv_wakeup will wake
 * up the main thread if necessary.
 *
 * Manual calls to bdrv_wakeup are rarely necessary, because
 * bdrv_dec_in_flight already calls it.
 *
 * NOTE(review): presumably implemented by kicking @bs->wait, which is
 * documented as "kicked to signal main loop when a request completes" --
 * confirm against block/io.c.
 */
void bdrv_wakeup(BlockDriverState *bs);

884 885 886 887
#ifdef _WIN32
/*
 * Only declared for Windows builds.
 * NOTE(review): presumably returns non-zero when @filename names a Windows
 * drive rather than a regular file -- confirm against block.c.
 */
int is_windows_drive(const char *filename);
#endif

P
Paolo Bonzini 已提交
888 889
/**
 * stream_start:
890 891
 * @job_id: The id of the newly-created job, or %NULL to use the
 * device name of @bs.
P
Paolo Bonzini 已提交
892 893 894
 * @bs: Block device to operate on.
 * @base: Block device that will become the new base, or %NULL to
 * flatten the whole backing file chain onto @bs.
895 896
 * @backing_file_str: The file name that will be written to @bs as the
 * the new backing file if the job completes. Ignored if @base is %NULL.
897
 * @speed: The maximum speed, in bytes per second, or 0 for unlimited.
P
Paolo Bonzini 已提交
898
 * @on_error: The action to take upon error.
899
 * @errp: Error object.
P
Paolo Bonzini 已提交
900 901 902 903 904
 *
 * Start a streaming operation on @bs.  Clusters that are unallocated
 * in @bs, but allocated in any image between @base and @bs (both
 * exclusive) will be written to @bs.  At the end of a successful
 * streaming job, the backing file of @bs will be changed to
905 906
 * @backing_file_str in the written image and to @base in the live
 * BlockDriverState.
P
Paolo Bonzini 已提交
907
 */
908 909
void stream_start(const char *job_id, BlockDriverState *bs,
                  BlockDriverState *base, const char *backing_file_str,
910
                  int64_t speed, BlockdevOnError on_error, Error **errp);
911

912 913
/**
 * commit_start:
914 915
 * @job_id: The id of the newly-created job, or %NULL to use the
 * device name of @bs.
F
Fam Zheng 已提交
916 917 918
 * @bs: Active block device.
 * @top: Top block device to be committed.
 * @base: Block device that will be written into, and become the new top.
919 920
 * @speed: The maximum speed, in bytes per second, or 0 for unlimited.
 * @on_error: The action to take upon error.
921
 * @backing_file_str: String to use as the backing file in @top's overlay
922 923 924
 * @filter_node_name: The node name that should be assigned to the filter
 * driver that the commit job inserts into the graph above @top. NULL means
 * that a node name should be autogenerated.
925 926 927
 * @errp: Error object.
 *
 */
928 929
void commit_start(const char *job_id, BlockDriverState *bs,
                  BlockDriverState *base, BlockDriverState *top, int64_t speed,
930
                  BlockdevOnError on_error, const char *backing_file_str,
931
                  const char *filter_node_name, Error **errp);
F
Fam Zheng 已提交
932 933
/**
 * commit_active_start:
934 935
 * @job_id: The id of the newly-created job, or %NULL to use the
 * device name of @bs.
F
Fam Zheng 已提交
936 937
 * @bs: Active block device to be committed.
 * @base: Block device that will be written into, and become the new top.
938 939
 * @creation_flags: Flags that control the behavior of the Job lifetime.
 *                  See @BlockJobCreateFlags
F
Fam Zheng 已提交
940 941
 * @speed: The maximum speed, in bytes per second, or 0 for unlimited.
 * @on_error: The action to take upon error.
942 943 944
 * @filter_node_name: The node name that should be assigned to the filter
 * driver that the commit job inserts into the graph above @bs. NULL means that
 * a node name should be autogenerated.
F
Fam Zheng 已提交
945 946
 * @cb: Completion function for the job.
 * @opaque: Opaque pointer value passed to @cb.
947
 * @auto_complete: Auto complete the job.
948
 * @errp: Error object.
F
Fam Zheng 已提交
949 950
 *
 */
951
void commit_active_start(const char *job_id, BlockDriverState *bs,
952 953
                         BlockDriverState *base, int creation_flags,
                         int64_t speed, BlockdevOnError on_error,
954
                         const char *filter_node_name,
955 956
                         BlockCompletionFunc *cb, void *opaque,
                         bool auto_complete, Error **errp);
P
Paolo Bonzini 已提交
957 958
/*
 * mirror_start:
959 960
 * @job_id: The id of the newly-created job, or %NULL to use the
 * device name of @bs.
P
Paolo Bonzini 已提交
961 962
 * @bs: Block device to operate on.
 * @target: Block device to write to.
963 964
 * @replaces: Block graph node name to replace once the mirror is done. Can
 *            only be used when full mirroring is selected.
P
Paolo Bonzini 已提交
965
 * @speed: The maximum speed, in bytes per second, or 0 for unlimited.
966
 * @granularity: The chosen granularity for the dirty bitmap.
967
 * @buf_size: The amount of data that can be in flight at one time.
P
Paolo Bonzini 已提交
968
 * @mode: Whether to collapse all images in the chain to the target.
M
Max Reitz 已提交
969
 * @backing_mode: How to establish the target's backing chain after completion.
970 971
 * @on_source_error: The action to take upon error reading from the source.
 * @on_target_error: The action to take upon error writing to the target.
972
 * @unmap: Whether to unmap target where source sectors only contain zeroes.
973 974 975
 * @filter_node_name: The node name that should be assigned to the filter
 * driver that the mirror job inserts into the graph above @bs. NULL means that
 * a node name should be autogenerated.
P
Paolo Bonzini 已提交
976 977 978
 * @errp: Error object.
 *
 * Start a mirroring operation on @bs.  Clusters that are allocated
979
 * in @bs will be written to @target until the job is cancelled or
P
Paolo Bonzini 已提交
980 981 982
 * manually completed.  At the end of a successful mirroring job,
 * @bs will be switched to read from @target.
 */
983 984
void mirror_start(const char *job_id, BlockDriverState *bs,
                  BlockDriverState *target, const char *replaces,
985
                  int64_t speed, uint32_t granularity, int64_t buf_size,
M
Max Reitz 已提交
986 987
                  MirrorSyncMode mode, BlockMirrorBackingMode backing_mode,
                  BlockdevOnError on_source_error,
988
                  BlockdevOnError on_target_error,
989
                  bool unmap, const char *filter_node_name, Error **errp);
P
Paolo Bonzini 已提交
990

991
/*
992
 * backup_job_create:
993 994
 * @job_id: The id of the newly-created job, or %NULL to use the
 * device name of @bs.
995 996 997
 * @bs: Block device to operate on.
 * @target: Block device to write to.
 * @speed: The maximum speed, in bytes per second, or 0 for unlimited.
998
 * @sync_mode: What parts of the disk image should be copied to the destination.
999
 * @sync_bitmap: The dirty bitmap if sync_mode is MIRROR_SYNC_MODE_INCREMENTAL.
1000 1001
 * @on_source_error: The action to take upon error reading from the source.
 * @on_target_error: The action to take upon error writing to the target.
1002 1003
 * @creation_flags: Flags that control the behavior of the Job lifetime.
 *                  See @BlockJobCreateFlags
1004 1005
 * @cb: Completion function for the job.
 * @opaque: Opaque pointer value passed to @cb.
1006
 * @txn: Transaction that this job is part of (may be NULL).
1007
 *
1008
 * Create a backup operation on @bs.  Clusters in @bs are written to @target
1009 1010
 * until the job is cancelled or manually completed.
 */
1011 1012 1013 1014 1015 1016 1017 1018 1019 1020
BlockJob *backup_job_create(const char *job_id, BlockDriverState *bs,
                            BlockDriverState *target, int64_t speed,
                            MirrorSyncMode sync_mode,
                            BdrvDirtyBitmap *sync_bitmap,
                            bool compress,
                            BlockdevOnError on_source_error,
                            BlockdevOnError on_target_error,
                            int creation_flags,
                            BlockCompletionFunc *cb, void *opaque,
                            BlockJobTxn *txn, Error **errp);
1021

1022 1023
/*
 * NOTE(review): presumably the HMP helper that creates a block node from the
 * option string @optstr on behalf of monitor @mon -- confirm against
 * blockdev.c.
 */
void hmp_drive_add_node(Monitor *mon, const char *optstr);

1024 1025
BdrvChild *bdrv_root_attach_child(BlockDriverState *child_bs,
                                  const char *child_name,
1026
                                  const BdrvChildRole *child_role,
1027 1028
                                  uint64_t perm, uint64_t shared_perm,
                                  void *opaque, Error **errp);
1029 1030
void bdrv_root_unref_child(BdrvChild *child);

1031 1032 1033
/*
 * @perm and @shared are BLK_PERM_* bitmasks, like BdrvChild.perm and
 * BdrvChild.shared_perm.
 * NOTE(review): presumably tries to change the permissions held through @c
 * and returns 0 on success or a negative errno with @errp set -- confirm
 * against block.c.
 */
int bdrv_child_try_set_perm(BdrvChild *c, uint64_t perm, uint64_t shared,
                            Error **errp);

1034 1035 1036 1037 1038
/* Default implementation for BlockDriver.bdrv_child_perm() that can be used by
 * block filters: Forward CONSISTENT_READ, WRITE, WRITE_UNCHANGED and RESIZE to
 * all children */
void bdrv_filter_default_perms(BlockDriverState *bs, BdrvChild *c,
                               const BdrvChildRole *role,
1039
                               BlockReopenQueue *reopen_queue,
1040 1041 1042
                               uint64_t perm, uint64_t shared,
                               uint64_t *nperm, uint64_t *nshared);

1043 1044 1045 1046 1047 1048
/* Default implementation for BlockDriver.bdrv_child_perm() that can be used by
 * (non-raw) image formats: Like above for bs->backing, but for bs->file it
 * requires WRITE | RESIZE for read-write images, always requires
 * CONSISTENT_READ and doesn't share WRITE. */
void bdrv_format_default_perms(BlockDriverState *bs, BdrvChild *c,
                               const BdrvChildRole *role,
1049
                               BlockReopenQueue *reopen_queue,
1050 1051
                               uint64_t perm, uint64_t shared,
                               uint64_t *nperm, uint64_t *nshared);
1052

1053
/*
1054
 * Default implementation for drivers to pass bdrv_co_block_status() to
1055 1056
 * their file.
 */
1057 1058 1059 1060 1061 1062 1063
int coroutine_fn bdrv_co_block_status_from_file(BlockDriverState *bs,
                                                bool want_zero,
                                                int64_t offset,
                                                int64_t bytes,
                                                int64_t *pnum,
                                                int64_t *map,
                                                BlockDriverState **file);
1064
/*
1065
 * Default implementation for drivers to pass bdrv_co_block_status() to
1066 1067
 * their backing file.
 */
1068 1069 1070 1071 1072 1073 1074
int coroutine_fn bdrv_co_block_status_from_backing(BlockDriverState *bs,
                                                   bool want_zero,
                                                   int64_t offset,
                                                   int64_t bytes,
                                                   int64_t *pnum,
                                                   int64_t *map,
                                                   BlockDriverState **file);
K
Kevin Wolf 已提交
1075
const char *bdrv_get_parent_name(const BlockDriverState *bs);
1076
void blk_dev_change_media_cb(BlockBackend *blk, bool load, Error **errp);
1077
bool blk_dev_has_removable_media(BlockBackend *blk);
M
Max Reitz 已提交
1078
bool blk_dev_has_tray(BlockBackend *blk);
1079 1080 1081 1082
void blk_dev_eject_request(BlockBackend *blk, bool force);
bool blk_dev_is_tray_open(BlockBackend *blk);
bool blk_dev_is_medium_locked(BlockBackend *blk);

1083
/*
 * NOTE(review): presumably marks the range [@offset, @offset + @bytes) dirty
 * in the dirty bitmaps of @bs -- confirm against block/dirty-bitmap.c.
 */
void bdrv_set_dirty(BlockDriverState *bs, int64_t offset, int64_t bytes);

/*
 * NOTE(review): presumably bdrv_clear_dirty_bitmap() clears @bitmap and, via
 * @out, hands back the previous contents so that
 * bdrv_undo_clear_dirty_bitmap() can restore them from @in -- confirm.
 */
void bdrv_clear_dirty_bitmap(BdrvDirtyBitmap *bitmap, HBitmap **out);
void bdrv_undo_clear_dirty_bitmap(BdrvDirtyBitmap *bitmap, HBitmap *in);

/*
 * In-flight request accounting for @bs.  bdrv_dec_in_flight() also calls
 * bdrv_wakeup(), as stated in the bdrv_wakeup() documentation.
 * NOTE(review): presumably these adjust BlockDriverState.in_flight with
 * atomic operations -- confirm against block/io.c.
 */
void bdrv_inc_in_flight(BlockDriverState *bs);
void bdrv_dec_in_flight(BlockDriverState *bs);

/*
 * NOTE(review): presumably closes the monitor-owned BlockDriverStates --
 * confirm against blockdev.c.
 */
void blockdev_close_all_bdrv_states(void);

B
bellard 已提交
1093
#endif /* BLOCK_INT_H */