/*
 * QEMU System Emulator block driver
 *
 * Copyright (c) 2003 Fabrice Bellard
 *
 * Permission is hereby granted, free of charge, to any person obtaining a copy
 * of this software and associated documentation files (the "Software"), to deal
 * in the Software without restriction, including without limitation the rights
 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
 * copies of the Software, and to permit persons to whom the Software is
 * furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
 * THE SOFTWARE.
 */
#ifndef BLOCK_INT_H
#define BLOCK_INT_H

27
#include "block/accounting.h"
28
#include "block/block.h"
29 30
#include "qemu/option.h"
#include "qemu/queue.h"
31
#include "block/coroutine.h"
32
#include "qemu/timer.h"
L
Luiz Capitulino 已提交
33
#include "qapi-types.h"
34
#include "qemu/hbitmap.h"
35
#include "block/snapshot.h"
36
#include "qemu/main-loop.h"
37
#include "qemu/throttle.h"
P
pbrook 已提交
38

39 40 41
/* Image flag values.  Each value is a distinct single bit.
 * NOTE(review): presumably OR-ed together into a flags word -- confirm
 * against the users of these macros. */
#define BLOCK_FLAG_ENCRYPT          1
#define BLOCK_FLAG_COMPAT6          4
#define BLOCK_FLAG_LAZY_REFCOUNTS   8

/* Option name strings.
 * NOTE(review): presumably the keys used in a driver's create_opts list --
 * confirm against the individual drivers. */
#define BLOCK_OPT_SIZE              "size"
#define BLOCK_OPT_ENCRYPT           "encryption"
#define BLOCK_OPT_COMPAT6           "compat6"
#define BLOCK_OPT_BACKING_FILE      "backing_file"
#define BLOCK_OPT_BACKING_FMT       "backing_fmt"
#define BLOCK_OPT_CLUSTER_SIZE      "cluster_size"
#define BLOCK_OPT_TABLE_SIZE        "table_size"
#define BLOCK_OPT_PREALLOC          "preallocation"
#define BLOCK_OPT_SUBFMT            "subformat"
#define BLOCK_OPT_COMPAT_LEVEL      "compat"
#define BLOCK_OPT_LAZY_REFCOUNTS    "lazy_refcounts"
#define BLOCK_OPT_ADAPTER_TYPE      "adapter_type"
#define BLOCK_OPT_REDUNDANCY        "redundancy"
#define BLOCK_OPT_NOCOW             "nocow"
#define BLOCK_OPT_OBJECT_SIZE       "object_size"
#define BLOCK_OPT_REFCOUNT_BITS     "refcount_bits"

/* NOTE(review): presumably the size in bytes of the buffer handed to the
 * .bdrv_probe() callbacks -- confirm against bdrv_probe_all() callers. */
#define BLOCK_PROBE_BUF_SIZE        512

62 63
typedef struct BdrvTrackedRequest {
    BlockDriverState *bs;
64 65
    int64_t offset;
    unsigned int bytes;
66
    bool is_write;
67

68
    bool serialising;
69 70 71
    int64_t overlap_offset;
    unsigned int overlap_bytes;

72 73 74
    QLIST_ENTRY(BdrvTrackedRequest) list;
    Coroutine *co; /* owner, used for deadlock detection */
    CoQueue wait_queue; /* coroutines blocked on this request */
75 76

    struct BdrvTrackedRequest *waiting_for;
77 78
} BdrvTrackedRequest;

B
bellard 已提交
79 80 81
struct BlockDriver {
    const char *format_name;
    int instance_size;
82

83 84 85 86
    /* set to true if the BlockDriver is a block filter */
    bool is_filter;
    /* for snapshots block filter like Quorum can implement the
     * following recursive callback.
87 88 89
     * It's purpose is to recurse on the filter children while calling
     * bdrv_recurse_is_first_non_filter on them.
     * For a sample implementation look in the future Quorum block filter.
90
     */
91 92
    bool (*bdrv_recurse_is_first_non_filter)(BlockDriverState *bs,
                                             BlockDriverState *candidate);
93

B
bellard 已提交
94
    int (*bdrv_probe)(const uint8_t *buf, int buf_size, const char *filename);
95
    int (*bdrv_probe_device)(const char *filename);
96 97 98

    /* Any driver implementing this callback is expected to be able to handle
     * NULL file names in its .bdrv_open() implementation */
99
    void (*bdrv_parse_filename)(const char *filename, QDict *options, Error **errp);
100 101 102 103 104 105
    /* Drivers not implementing bdrv_parse_filename nor bdrv_open should have
     * this field set to true, except ones that are defined only by their
     * child's bs.
     * An example of the last type will be the quorum block driver.
     */
    bool bdrv_needs_filename;
106

107 108 109
    /* Set if a driver can support backing files */
    bool supports_backing;

110 111 112 113 114 115
    /* For handling image reopen for split or non-split files */
    int (*bdrv_reopen_prepare)(BDRVReopenState *reopen_state,
                               BlockReopenQueue *queue, Error **errp);
    void (*bdrv_reopen_commit)(BDRVReopenState *reopen_state);
    void (*bdrv_reopen_abort)(BDRVReopenState *reopen_state);

M
Max Reitz 已提交
116 117 118 119
    int (*bdrv_open)(BlockDriverState *bs, QDict *options, int flags,
                     Error **errp);
    int (*bdrv_file_open)(BlockDriverState *bs, QDict *options, int flags,
                          Error **errp);
120
    int (*bdrv_read)(BlockDriverState *bs, int64_t sector_num,
B
bellard 已提交
121
                     uint8_t *buf, int nb_sectors);
122
    int (*bdrv_write)(BlockDriverState *bs, int64_t sector_num,
B
bellard 已提交
123
                      const uint8_t *buf, int nb_sectors);
B
bellard 已提交
124
    void (*bdrv_close)(BlockDriverState *bs);
P
Paolo Bonzini 已提交
125
    void (*bdrv_rebind)(BlockDriverState *bs);
C
Chunyan Liu 已提交
126
    int (*bdrv_create)(const char *filename, QemuOpts *opts, Error **errp);
B
bellard 已提交
127
    int (*bdrv_set_key)(BlockDriverState *bs, const char *key);
128
    int (*bdrv_make_empty)(BlockDriverState *bs);
M
Max Reitz 已提交
129 130 131

    void (*bdrv_refresh_filename)(BlockDriverState *bs);

B
bellard 已提交
132
    /* aio */
133
    BlockAIOCB *(*bdrv_aio_readv)(BlockDriverState *bs,
134
        int64_t sector_num, QEMUIOVector *qiov, int nb_sectors,
135
        BlockCompletionFunc *cb, void *opaque);
136
    BlockAIOCB *(*bdrv_aio_writev)(BlockDriverState *bs,
137
        int64_t sector_num, QEMUIOVector *qiov, int nb_sectors,
138
        BlockCompletionFunc *cb, void *opaque);
139
    BlockAIOCB *(*bdrv_aio_flush)(BlockDriverState *bs,
140
        BlockCompletionFunc *cb, void *opaque);
141
    BlockAIOCB *(*bdrv_aio_discard)(BlockDriverState *bs,
142
        int64_t sector_num, int nb_sectors,
143
        BlockCompletionFunc *cb, void *opaque);
B
bellard 已提交
144

K
Kevin Wolf 已提交
145 146 147 148
    int coroutine_fn (*bdrv_co_readv)(BlockDriverState *bs,
        int64_t sector_num, int nb_sectors, QEMUIOVector *qiov);
    int coroutine_fn (*bdrv_co_writev)(BlockDriverState *bs,
        int64_t sector_num, int nb_sectors, QEMUIOVector *qiov);
149 150 151 152 153 154 155
    /*
     * Efficiently zero a region of the disk image.  Typically an image format
     * would use a compact metadata representation to implement this.  This
     * function pointer may be NULL and .bdrv_co_writev() will be called
     * instead.
     */
    int coroutine_fn (*bdrv_co_write_zeroes)(BlockDriverState *bs,
156
        int64_t sector_num, int nb_sectors, BdrvRequestFlags flags);
157 158
    int coroutine_fn (*bdrv_co_discard)(BlockDriverState *bs,
        int64_t sector_num, int nb_sectors);
159
    int64_t coroutine_fn (*bdrv_co_get_block_status)(BlockDriverState *bs,
160
        int64_t sector_num, int nb_sectors, int *pnum);
K
Kevin Wolf 已提交
161

162 163 164
    /*
     * Invalidate any cached meta-data.
     */
165
    void (*bdrv_invalidate_cache)(BlockDriverState *bs, Error **errp);
166

167 168 169 170 171 172
    /*
     * Flushes all data that was already written to the OS all the way down to
     * the disk (for example raw-posix calls fsync()).
     */
    int coroutine_fn (*bdrv_co_flush_to_disk)(BlockDriverState *bs);

K
Kevin Wolf 已提交
173 174 175 176 177 178 179
    /*
     * Flushes all internal caches to the OS. The data may still sit in a
     * writeback cache of the host OS, but it will survive a crash of the qemu
     * process.
     */
    int coroutine_fn (*bdrv_co_flush_to_os)(BlockDriverState *bs);

B
bellard 已提交
180 181
    const char *protocol_name;
    int (*bdrv_truncate)(BlockDriverState *bs, int64_t offset);
182

B
bellard 已提交
183
    int64_t (*bdrv_getlength)(BlockDriverState *bs);
184
    bool has_variable_length;
185
    int64_t (*bdrv_get_allocated_file_size)(BlockDriverState *bs);
186

187
    int (*bdrv_write_compressed)(BlockDriverState *bs, int64_t sector_num,
B
bellard 已提交
188 189
                                 const uint8_t *buf, int nb_sectors);

190
    int (*bdrv_snapshot_create)(BlockDriverState *bs,
B
bellard 已提交
191
                                QEMUSnapshotInfo *sn_info);
192
    int (*bdrv_snapshot_goto)(BlockDriverState *bs,
B
bellard 已提交
193
                              const char *snapshot_id);
194 195 196 197
    int (*bdrv_snapshot_delete)(BlockDriverState *bs,
                                const char *snapshot_id,
                                const char *name,
                                Error **errp);
198
    int (*bdrv_snapshot_list)(BlockDriverState *bs,
B
bellard 已提交
199
                              QEMUSnapshotInfo **psn_info);
E
edison 已提交
200
    int (*bdrv_snapshot_load_tmp)(BlockDriverState *bs,
201 202 203
                                  const char *snapshot_id,
                                  const char *name,
                                  Error **errp);
B
bellard 已提交
204
    int (*bdrv_get_info)(BlockDriverState *bs, BlockDriverInfo *bdi);
M
Max Reitz 已提交
205
    ImageInfoSpecific *(*bdrv_get_specific_info)(BlockDriverState *bs);
B
bellard 已提交
206

207 208
    int (*bdrv_save_vmstate)(BlockDriverState *bs, QEMUIOVector *qiov,
                             int64_t pos);
209 210
    int (*bdrv_load_vmstate)(BlockDriverState *bs, uint8_t *buf,
                             int64_t pos, int size);
211

K
Kevin Wolf 已提交
212 213 214
    int (*bdrv_change_backing_file)(BlockDriverState *bs,
        const char *backing_file, const char *backing_fmt);

B
bellard 已提交
215 216 217
    /* removable device specific */
    int (*bdrv_is_inserted)(BlockDriverState *bs);
    int (*bdrv_media_changed)(BlockDriverState *bs);
218
    void (*bdrv_eject)(BlockDriverState *bs, bool eject_flag);
219
    void (*bdrv_lock_medium)(BlockDriverState *bs, bool locked);
220

221 222
    /* to control generic scsi devices */
    int (*bdrv_ioctl)(BlockDriverState *bs, unsigned long int req, void *buf);
223
    BlockAIOCB *(*bdrv_aio_ioctl)(BlockDriverState *bs,
224
        unsigned long int req, void *buf,
225
        BlockCompletionFunc *cb, void *opaque);
226

227
    /* List of options for creating images, terminated by name == NULL */
228
    QemuOptsList *create_opts;
229

230 231 232 233
    /*
     * Returns 0 for completed check, -errno for internal errors.
     * The check results are stored in result.
     */
234 235
    int (*bdrv_check)(BlockDriverState* bs, BdrvCheckResult *result,
        BdrvCheckMode fix);
A
aliguori 已提交
236

237 238
    int (*bdrv_amend_options)(BlockDriverState *bs, QemuOpts *opts,
                              BlockDriverAmendStatusCB *status_cb);
M
Max Reitz 已提交
239

K
Kevin Wolf 已提交
240 241
    void (*bdrv_debug_event)(BlockDriverState *bs, BlkDebugEvent event);

K
Kevin Wolf 已提交
242 243 244
    /* TODO Better pass a option string/QDict/QemuOpts to add any rule? */
    int (*bdrv_debug_breakpoint)(BlockDriverState *bs, const char *event,
        const char *tag);
F
Fam Zheng 已提交
245 246
    int (*bdrv_debug_remove_breakpoint)(BlockDriverState *bs,
        const char *tag);
K
Kevin Wolf 已提交
247 248 249
    int (*bdrv_debug_resume)(BlockDriverState *bs, const char *tag);
    bool (*bdrv_debug_is_suspended)(BlockDriverState *bs, const char *tag);

250
    void (*bdrv_refresh_limits)(BlockDriverState *bs, Error **errp);
251

K
Kevin Wolf 已提交
252 253 254 255 256
    /*
     * Returns 1 if newly created images are guaranteed to contain only
     * zeros, 0 otherwise.
     */
    int (*bdrv_has_zero_init)(BlockDriverState *bs);
257

258 259 260 261 262 263 264 265 266 267 268 269 270
    /* Remove fd handlers, timers, and other event loop callbacks so the event
     * loop is no longer in use.  Called with no in-flight requests and in
     * depth-first traversal order with parents before child nodes.
     */
    void (*bdrv_detach_aio_context)(BlockDriverState *bs);

    /* Add fd handlers, timers, and other event loop callbacks so I/O requests
     * can be processed again.  Called with no in-flight requests and in
     * depth-first traversal order with child nodes before parent nodes.
     */
    void (*bdrv_attach_aio_context)(BlockDriverState *bs,
                                    AioContext *new_context);

271 272 273 274 275
    /* io queue for linux-aio */
    void (*bdrv_io_plug)(BlockDriverState *bs);
    void (*bdrv_io_unplug)(BlockDriverState *bs);
    void (*bdrv_flush_io_queue)(BlockDriverState *bs);

276 277 278 279 280 281 282 283 284 285 286 287 288 289 290
    /**
     * Try to get @bs's logical and physical block size.
     * On success, store them in @bsz and return zero.
     * On failure, return negative errno.
     */
    int (*bdrv_probe_blocksizes)(BlockDriverState *bs, BlockSizes *bsz);
    /**
     * Try to get @bs's geometry (cyls, heads, sectors)
     * On success, store them in @geo and return 0.
     * On failure return -errno.
     * Only drivers that want to override guest geometry implement this
     * callback; see hd_geometry_guess().
     */
    int (*bdrv_probe_geometry)(BlockDriverState *bs, HDGeometry *geo);

291
    QLIST_ENTRY(BlockDriver) list;
B
bellard 已提交
292 293
};

294 295 296 297 298 299 300 301 302 303 304 305
/*
 * I/O limits and alignment hints of a block device.  Sector-based fields are
 * expressed in sectors, memory alignments in bytes of size_t.
 */
typedef struct BlockLimits {
    /* maximum number of sectors that can be discarded at once */
    int max_discard;

    /* optimal alignment for discard requests in sectors */
    int64_t discard_alignment;

    /* maximum number of sectors that can be zeroized at once */
    int max_write_zeroes;

    /* optimal alignment for write zeroes requests in sectors */
    int64_t write_zeroes_alignment;

    /* optimal transfer length in sectors */
    int opt_transfer_length;

    /* maximal transfer length in sectors */
    int max_transfer_length;

    /* memory alignment so that no bounce buffer is needed */
    size_t min_mem_alignment;

    /* memory alignment for bounce buffer */
    size_t opt_mem_alignment;
} BlockLimits;

320 321
/* Forward declaration only; the struct body is not defined in the part of
 * this header visible here.  Used as the element type of
 * BlockDriverState.op_blockers. */
typedef struct BdrvOpBlocker BdrvOpBlocker;

M
Max Reitz 已提交
322 323 324 325 326 327 328 329 330
/*
 * One entry of BlockDriverState.aio_notifiers: a pair of callbacks plus the
 * opaque pointer handed back to them.
 * NOTE(review): presumably filled in from the arguments of
 * bdrv_add_aio_context_notifier() -- confirm in the implementation.
 */
typedef struct BdrvAioNotifier {
    /* takes the new AioContext and @opaque */
    void (*attached_aio_context)(AioContext *new_context, void *opaque);
    /* takes only @opaque */
    void (*detach_aio_context)(void *opaque);

    /* caller-supplied value passed to both callbacks */
    void *opaque;

    /* list linkage */
    QLIST_ENTRY(BdrvAioNotifier) list;
} BdrvAioNotifier;

331 332 333 334 335 336 337
/*
 * Role of a child node, referenced from BdrvChild.role.
 * NOTE(review): inherit_flags presumably derives the flags a child is opened
 * with from its parent's flags -- confirm against the callers.
 */
struct BdrvChildRole {
    int (*inherit_flags)(int parent_flags);
};

/* Role objects defined outside this header. */
extern const BdrvChildRole child_file;
extern const BdrvChildRole child_format;

K
Kevin Wolf 已提交
338
struct BdrvChild {
339 340 341
    BlockDriverState *bs;
    const BdrvChildRole *role;
    QLIST_ENTRY(BdrvChild) next;
K
Kevin Wolf 已提交
342
};
343

344 345 346 347 348 349
/*
 * Note: the function bdrv_append() copies and swaps contents of
 * BlockDriverStates, so if you add new fields to this struct, please
 * inspect bdrv_append() to determine if the new fields need to be
 * copied as well.
 */
B
bellard 已提交
350
struct BlockDriverState {
351 352
    int64_t total_sectors; /* if we are reading a disk image, give its
                              size in sectors */
B
bellard 已提交
353
    int read_only; /* if true, the media is read only */
354
    int open_flags; /* flags used to open the file, re-used for re-open */
B
bellard 已提交
355
    int encrypted; /* if true, the media is encrypted */
356
    int valid_key; /* if true, a valid encryption key has been set */
357
    int sg;        /* if true, the device is a /dev/sg* */
358 359
    int copy_on_read; /* if true, copy read backing sectors into image
                         note this is a reference count */
360
    bool probed;
B
bellard 已提交
361

B
bellard 已提交
362
    BlockDriver *drv; /* NULL means no media */
B
bellard 已提交
363 364
    void *opaque;

365 366
    BlockBackend *blk;          /* owning backend, if any */

367
    AioContext *aio_context; /* event loop used for fd handlers, timers, etc */
M
Max Reitz 已提交
368 369 370 371
    /* long-running tasks intended to always use the same AioContext as this
     * BDS may register themselves in this list to be notified of changes
     * regarding this BDS's context */
    QLIST_HEAD(, BdrvAioNotifier) aio_notifiers;
372

373 374 375
    char filename[PATH_MAX];
    char backing_file[PATH_MAX]; /* if non zero, the image is a diff of
                                    this file image */
376
    char backing_format[16]; /* if non-zero and backing_file exists */
B
bellard 已提交
377

M
Max Reitz 已提交
378
    QDict *full_open_options;
379
    char exact_filename[PATH_MAX];
M
Max Reitz 已提交
380

381
    BdrvChild *backing;
K
Kevin Wolf 已提交
382
    BdrvChild *file;
383

P
Paolo Bonzini 已提交
384 385
    NotifierList close_notifiers;

386 387 388
    /* Callback before write request is processed */
    NotifierWithReturnList before_write_notifiers;

389 390
    /* number of in-flight serialising requests */
    unsigned int serialising_in_flight;
391

392 393
    /* I/O throttling */
    CoQueue      throttled_reqs[2];
394
    bool         io_limits_enabled;
395 396 397 398 399
    /* The following fields are protected by the ThrottleGroup lock.
     * See the ThrottleGroup documentation for details. */
    ThrottleState *throttle_state;
    ThrottleTimers throttle_timers;
    unsigned       pending_reqs[2];
400
    QLIST_ENTRY(BlockDriverState) round_robin;
401

402
    /* I/O stats (display with "info blockstats"). */
403
    BlockAcctStats stats;
404

405 406 407
    /* I/O Limits */
    BlockLimits bl;

A
Asias He 已提交
408 409 410
    /* Whether produces zeros when read beyond eof */
    bool zero_beyond_eof;

411 412 413
    /* Alignment requirement for offset/length of I/O requests */
    unsigned int request_alignment;

414 415
    /* the block size for which the guest device expects atomicity */
    int guest_block_size;
416

417 418 419
    /* do we need to tell the quest if we have a volatile write cache? */
    int enable_write_cache;

B
bellard 已提交
420 421
    /* NOTE: the following infos are only hints for real hardware
       drivers. They are not used by the block driver */
422
    BlockdevOnError on_read_error, on_write_error;
423
    bool iostatus_enabled;
L
Luiz Capitulino 已提交
424
    BlockDeviceIoStatus iostatus;
425 426 427 428 429 430 431

    /* the following member gives a name to every node on the bs graph. */
    char node_name[32];
    /* element of the list of named nodes building the graph */
    QTAILQ_ENTRY(BlockDriverState) node_list;
    /* element of the list of "drives" the guest sees */
    QTAILQ_ENTRY(BlockDriverState) device_list;
F
Fam Zheng 已提交
432
    QLIST_HEAD(, BdrvDirtyBitmap) dirty_bitmaps;
433
    int refcnt;
S
Stefan Hajnoczi 已提交
434 435

    QLIST_HEAD(, BdrvTrackedRequest) tracked_requests;
436

437 438 439
    /* operation blockers */
    QLIST_HEAD(, BdrvOpBlocker) op_blockers[BLOCK_OP_TYPE_MAX];

440 441
    /* long-running background operation */
    BlockJob *job;
442

443 444 445 446
    /* The node that this node inherited default options from (and a reopen on
     * which can affect this node by changing these defaults). This is always a
     * parent node of this node. */
    BlockDriverState *inherits_from;
447 448
    QLIST_HEAD(, BdrvChild) children;

449
    QDict *options;
450
    BlockdevDetectZeroesOptions detect_zeroes;
451 452 453

    /* The error object in use for blocking operations on backing_hd */
    Error *backing_blocker;
454 455 456 457

    /* threshold limit for writes, in bytes. "High water mark". */
    uint64_t write_threshold_offset;
    NotifierWithReturn write_threshold_notifier;
B
bellard 已提交
458 459
};

460 461 462 463 464
/*
 * Return the node behind @bs's backing child link, or NULL when @bs has no
 * backing child.  @bs itself must not be NULL.
 */
static inline BlockDriverState *backing_bs(BlockDriverState *bs)
{
    BdrvChild *backing_child = bs->backing;

    if (!backing_child) {
        return NULL;
    }
    return backing_child->bs;
}

465 466 467 468 469 470 471

/* Essential block drivers which must always be statically linked into qemu, and
 * which therefore can be accessed without using bdrv_find_format() */
extern BlockDriver bdrv_file;
extern BlockDriver bdrv_raw;
extern BlockDriver bdrv_qcow2;

472 473 474 475 476 477 478 479
/**
 * bdrv_setup_io_funcs:
 *
 * Prepare a #BlockDriver for I/O request processing by populating
 * unimplemented coroutine and AIO interfaces with generic wrapper functions
 * that fall back to implemented interfaces.
 */
void bdrv_setup_io_funcs(BlockDriver *bdrv);
480

481
int get_tmp_filename(char *filename, int size);
482 483
BlockDriver *bdrv_probe_all(const uint8_t *buf, int buf_size,
                            const char *filename);
484

485
void bdrv_set_io_limits(BlockDriverState *bs,
486 487
                        ThrottleConfig *cfg);

488

489 490 491 492 493 494 495 496 497
/**
 * bdrv_add_before_write_notifier:
 *
 * Register a callback that is invoked before write requests are processed but
 * after any throttling or waiting for overlapping requests.
 */
void bdrv_add_before_write_notifier(BlockDriverState *bs,
                                    NotifierWithReturn *notifier);

498 499 500 501 502
/**
 * bdrv_detach_aio_context:
 *
 * May be called from .bdrv_detach_aio_context() to detach children from the
 * current #AioContext.  This is only needed by block drivers that manage their
 * own children.  Both ->file and ->backing are automatically handled and
 * block drivers should not call this function on them explicitly.
 */
void bdrv_detach_aio_context(BlockDriverState *bs);

/**
 * bdrv_attach_aio_context:
 *
 * May be called from .bdrv_attach_aio_context() to attach children to the new
 * #AioContext.  This is only needed by block drivers that manage their own
 * children.  Both ->file and ->backing are automatically handled and block
 * drivers should not call this function on them explicitly.
 */
void bdrv_attach_aio_context(BlockDriverState *bs,
                             AioContext *new_context);

M
Max Reitz 已提交
519 520 521 522 523 524 525 526 527 528 529 530 531 532 533 534 535 536 537 538 539 540 541 542 543 544 545 546
/**
 * bdrv_add_aio_context_notifier:
 *
 * If a long-running job intends to be always run in the same AioContext as a
 * certain BDS, it may use this function to be notified of changes regarding the
 * association of the BDS to an AioContext.
 *
 * attached_aio_context() is called after the target BDS has been attached to a
 * new AioContext; detach_aio_context() is called before the target BDS is being
 * detached from its old AioContext.
 */
void bdrv_add_aio_context_notifier(BlockDriverState *bs,
        void (*attached_aio_context)(AioContext *new_context, void *opaque),
        void (*detach_aio_context)(void *opaque), void *opaque);

/**
 * bdrv_remove_aio_context_notifier:
 *
 * Unsubscribe of change notifications regarding the BDS's AioContext. The
 * parameters given here have to be the same as those given to
 * bdrv_add_aio_context_notifier().
 */
void bdrv_remove_aio_context_notifier(BlockDriverState *bs,
                                      void (*aio_context_attached)(AioContext *,
                                                                   void *),
                                      void (*aio_context_detached)(void *),
                                      void *opaque);

547 548 549 550
#ifdef _WIN32
int is_windows_drive(const char *filename);
#endif

P
Paolo Bonzini 已提交
551 552 553 554 555 556 557
/**
 * stream_start:
 * @bs: Block device to operate on.
 * @base: Block device that will become the new base, or %NULL to
 * flatten the whole backing file chain onto @bs.
 * @base_id: The file name that will be written to @bs as the new
 * backing file if the job completes.  Ignored if @base is %NULL.
558
 * @speed: The maximum speed, in bytes per second, or 0 for unlimited.
P
Paolo Bonzini 已提交
559
 * @on_error: The action to take upon error.
P
Paolo Bonzini 已提交
560 561
 * @cb: Completion function for the job.
 * @opaque: Opaque pointer value passed to @cb.
562
 * @errp: Error object.
P
Paolo Bonzini 已提交
563 564 565 566 567 568 569
 *
 * Start a streaming operation on @bs.  Clusters that are unallocated
 * in @bs, but allocated in any image between @base and @bs (both
 * exclusive) will be written to @bs.  At the end of a successful
 * streaming job, the backing file of @bs will be changed to
 * @base_id in the written image and to @base in the live BlockDriverState.
 */
570
void stream_start(BlockDriverState *bs, BlockDriverState *base,
P
Paolo Bonzini 已提交
571
                  const char *base_id, int64_t speed, BlockdevOnError on_error,
572
                  BlockCompletionFunc *cb,
573
                  void *opaque, Error **errp);
574

575 576
/**
 * commit_start:
F
Fam Zheng 已提交
577 578 579
 * @bs: Active block device.
 * @top: Top block device to be committed.
 * @base: Block device that will be written into, and become the new top.
580 581 582 583
 * @speed: The maximum speed, in bytes per second, or 0 for unlimited.
 * @on_error: The action to take upon error.
 * @cb: Completion function for the job.
 * @opaque: Opaque pointer value passed to @cb.
584
 * @backing_file_str: String to use as the backing file in @top's overlay
585 586 587 588 589
 * @errp: Error object.
 *
 */
void commit_start(BlockDriverState *bs, BlockDriverState *base,
                 BlockDriverState *top, int64_t speed,
590
                 BlockdevOnError on_error, BlockCompletionFunc *cb,
591
                 void *opaque, const char *backing_file_str, Error **errp);
F
Fam Zheng 已提交
592 593 594 595 596 597 598 599 600 601 602 603 604 605
/**
 * commit_active_start:
 * @bs: Active block device to be committed.
 * @base: Block device that will be written into, and become the new top.
 * @speed: The maximum speed, in bytes per second, or 0 for unlimited.
 * @on_error: The action to take upon error.
 * @cb: Completion function for the job.
 * @opaque: Opaque pointer value passed to @cb.
 * @errp: Error object.
 *
 */
void commit_active_start(BlockDriverState *bs, BlockDriverState *base,
                         int64_t speed,
                         BlockdevOnError on_error,
606
                         BlockCompletionFunc *cb,
F
Fam Zheng 已提交
607
                         void *opaque, Error **errp);
P
Paolo Bonzini 已提交
608 609 610 611
/*
 * mirror_start:
 * @bs: Block device to operate on.
 * @target: Block device to write to.
612 613
 * @replaces: Block graph node name to replace once the mirror is done. Can
 *            only be used when full mirroring is selected.
P
Paolo Bonzini 已提交
614
 * @speed: The maximum speed, in bytes per second, or 0 for unlimited.
615
 * @granularity: The chosen granularity for the dirty bitmap.
616
 * @buf_size: The amount of data that can be in flight at one time.
P
Paolo Bonzini 已提交
617
 * @mode: Whether to collapse all images in the chain to the target.
618 619
 * @on_source_error: The action to take upon error reading from the source.
 * @on_target_error: The action to take upon error writing to the target.
620
 * @unmap: Whether to unmap target where source sectors only contain zeroes.
P
Paolo Bonzini 已提交
621 622 623 624 625 626 627 628 629 630
 * @cb: Completion function for the job.
 * @opaque: Opaque pointer value passed to @cb.
 * @errp: Error object.
 *
 * Start a mirroring operation on @bs.  Clusters that are allocated
 * in @bs will be written to @bs until the job is cancelled or
 * manually completed.  At the end of a successful mirroring job,
 * @bs will be switched to read from @target.
 */
void mirror_start(BlockDriverState *bs, BlockDriverState *target,
631
                  const char *replaces,
632
                  int64_t speed, uint32_t granularity, int64_t buf_size,
633
                  MirrorSyncMode mode, BlockdevOnError on_source_error,
634
                  BlockdevOnError on_target_error,
635
                  bool unmap,
636
                  BlockCompletionFunc *cb,
P
Paolo Bonzini 已提交
637 638
                  void *opaque, Error **errp);

639 640 641 642 643
/*
 * backup_start:
 * @bs: Block device to operate on.
 * @target: Block device to write to.
 * @speed: The maximum speed, in bytes per second, or 0 for unlimited.
644
 * @sync_mode: What parts of the disk image should be copied to the destination.
645
 * @sync_bitmap: The dirty bitmap if sync_mode is MIRROR_SYNC_MODE_INCREMENTAL.
646 647 648 649 650 651 652 653 654
 * @on_source_error: The action to take upon error reading from the source.
 * @on_target_error: The action to take upon error writing to the target.
 * @cb: Completion function for the job.
 * @opaque: Opaque pointer value passed to @cb.
 *
 * Start a backup operation on @bs.  Clusters in @bs are written to @target
 * until the job is cancelled or manually completed.
 */
void backup_start(BlockDriverState *bs, BlockDriverState *target,
655
                  int64_t speed, MirrorSyncMode sync_mode,
656
                  BdrvDirtyBitmap *sync_bitmap,
657
                  BlockdevOnError on_source_error,
658
                  BlockdevOnError on_target_error,
659
                  BlockCompletionFunc *cb, void *opaque,
660 661
                  Error **errp);

662 663 664 665 666 667 668
void blk_dev_change_media_cb(BlockBackend *blk, bool load);
bool blk_dev_has_removable_media(BlockBackend *blk);
void blk_dev_eject_request(BlockBackend *blk, bool force);
bool blk_dev_is_tray_open(BlockBackend *blk);
bool blk_dev_is_medium_locked(BlockBackend *blk);
void blk_dev_resize_cb(BlockBackend *blk);

669 670
void bdrv_set_dirty(BlockDriverState *bs, int64_t cur_sector, int nr_sectors);

B
bellard 已提交
671
#endif /* BLOCK_INT_H */