block.c 39.6 KB
Newer Older
B
bellard 已提交
1 2
/*
 * QEMU System Emulator block driver
3
 *
B
bellard 已提交
4
 * Copyright (c) 2003 Fabrice Bellard
5
 *
B
bellard 已提交
6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23
 * Permission is hereby granted, free of charge, to any person obtaining a copy
 * of this software and associated documentation files (the "Software"), to deal
 * in the Software without restriction, including without limitation the rights
 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
 * copies of the Software, and to permit persons to whom the Software is
 * furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
 * THE SOFTWARE.
 */
P
pbrook 已提交
24
#include "qemu-common.h"
P
pbrook 已提交
25
#include "console.h"
B
bellard 已提交
26
#include "block_int.h"
B
bellard 已提交
27

B
bellard 已提交
28 29 30 31 32 33 34 35
#ifdef _BSD
#include <sys/types.h>
#include <sys/stat.h>
#include <sys/ioctl.h>
#include <sys/queue.h>
#include <sys/disk.h>
#endif

B
bellard 已提交
36 37 38
#define SECTOR_BITS 9
#define SECTOR_SIZE (1 << SECTOR_BITS)

B
bellard 已提交
39 40 41 42 43 44
/* AIO control block for drivers that receive the AIO emulation layer:
   bdrv_register() sets the driver's aiocb_size to the size of this
   structure when it installs the bdrv_aio_*_em entry points. */
typedef struct BlockDriverAIOCBSync {
    BlockDriverAIOCB common;    /* common AIOCB part, placed first */
    QEMUBH *bh;                 /* NOTE(review): presumably the bottom half used to report completion -- confirm */
    int ret;                    /* NOTE(review): presumably the result of the emulated request -- confirm */
} BlockDriverAIOCBSync;

45 46 47 48 49 50
static BlockDriverAIOCB *bdrv_aio_read_em(BlockDriverState *bs,
        int64_t sector_num, uint8_t *buf, int nb_sectors,
        BlockDriverCompletionFunc *cb, void *opaque);
static BlockDriverAIOCB *bdrv_aio_write_em(BlockDriverState *bs,
        int64_t sector_num, const uint8_t *buf, int nb_sectors,
        BlockDriverCompletionFunc *cb, void *opaque);
B
bellard 已提交
51
static void bdrv_aio_cancel_em(BlockDriverAIOCB *acb);
52
static int bdrv_read_em(BlockDriverState *bs, int64_t sector_num,
B
bellard 已提交
53 54 55
                        uint8_t *buf, int nb_sectors);
static int bdrv_write_em(BlockDriverState *bs, int64_t sector_num,
                         const uint8_t *buf, int nb_sectors);
B
bellard 已提交
56

57 58
BlockDriverState *bdrv_first;

B
bellard 已提交
59 60
static BlockDriver *first_drv;

B
bellard 已提交
61
/* Return 1 if 'path' is absolute, 0 otherwise. Everything up to and
   including the first ':' is skipped (protocol prefix) before the
   leading path separator is tested. */
int path_is_absolute(const char *path)
{
    const char *colon;
    const char *start;

#ifdef _WIN32
    /* specific case for names like: "\\.\d:" */
    if (*path == '/' || *path == '\\')
        return 1;
#endif
    colon = strchr(path, ':');
    start = colon ? colon + 1 : path;
#ifdef _WIN32
    return (*start == '/' || *start == '\\');
#else
    return (*start == '/');
#endif
}

B
bellard 已提交
81 82 83 84 85 86
/* Store in 'dest' (at most dest_size bytes, terminator included) the
   location of 'filename'. An absolute filename is copied unchanged;
   otherwise it is appended to the leading part of 'base_path', i.e.
   everything up to the last path separator or, failing that, up to the
   protocol ':'. URL are supported. Nothing is written when dest_size
   is not positive. */
void path_combine(char *dest, int dest_size,
                  const char *base_path,
                  const char *filename)
{
    const char *prefix_end, *after_sep;
    int prefix_len;

    if (dest_size <= 0)
        return;
    if (path_is_absolute(filename)) {
        pstrcpy(dest, dest_size, filename);
        return;
    }

    /* end of the optional "protocol:" prefix */
    prefix_end = strchr(base_path, ':');
    prefix_end = prefix_end ? prefix_end + 1 : base_path;

    /* one past the last directory separator, if there is one */
    after_sep = strrchr(base_path, '/');
#ifdef _WIN32
    {
        const char *backslash = strrchr(base_path, '\\');
        if (!after_sep || backslash > after_sep)
            after_sep = backslash;
    }
#endif
    after_sep = after_sep ? after_sep + 1 : base_path;

    /* keep whichever of the two candidates reaches further */
    if (after_sep > prefix_end)
        prefix_end = after_sep;

    prefix_len = prefix_end - base_path;
    if (prefix_len > dest_size - 1)
        prefix_len = dest_size - 1;
    memcpy(dest, base_path, prefix_len);
    dest[prefix_len] = '\0';
    pstrcat(dest, dest_size, filename);
}


126
/* Put 'bdrv' at the head of the driver list. A driver without
   bdrv_aio_read gets the emulated AIO entry points; otherwise a driver
   with neither bdrv_read nor bdrv_pread gets the emulated synchronous
   ones. */
static void bdrv_register(BlockDriver *bdrv)
{
    int has_aio = (bdrv->bdrv_aio_read != NULL);

    if (!has_aio) {
        /* add AIO emulation layer */
        bdrv->aiocb_size = sizeof(BlockDriverAIOCBSync);
        bdrv->bdrv_aio_read = bdrv_aio_read_em;
        bdrv->bdrv_aio_write = bdrv_aio_write_em;
        bdrv->bdrv_aio_cancel = bdrv_aio_cancel_em;
    } else if (bdrv->bdrv_read == NULL && bdrv->bdrv_pread == NULL) {
        /* add synchronous IO emulation layer */
        bdrv->bdrv_read = bdrv_read_em;
        bdrv->bdrv_write = bdrv_write_em;
    }

    bdrv->next = first_drv;
    first_drv = bdrv;
}
B
bellard 已提交
142 143 144 145 146 147 148 149 150 151

/* create a new block device (by default it is empty) */
BlockDriverState *bdrv_new(const char *device_name)
{
    BlockDriverState **pbs, *bs;

    bs = qemu_mallocz(sizeof(BlockDriverState));
    if(!bs)
        return NULL;
    pstrcpy(bs->device_name, sizeof(bs->device_name), device_name);
B
bellard 已提交
152 153 154 155 156 157 158
    if (device_name[0] != '\0') {
        /* insert at the end */
        pbs = &bdrv_first;
        while (*pbs != NULL)
            pbs = &(*pbs)->next;
        *pbs = bs;
    }
B
bellard 已提交
159 160 161
    return bs;
}

B
bellard 已提交
162 163 164 165 166 167 168 169 170 171
/* Return the registered driver whose format_name equals 'format_name',
   or NULL if there is none. */
BlockDriver *bdrv_find_format(const char *format_name)
{
    BlockDriver *drv = first_drv;

    while (drv != NULL && strcmp(drv->format_name, format_name) != 0)
        drv = drv->next;
    return drv;
}

172
/* Forward an image creation request to 'drv'. Returns the driver's
   result, or -ENOTSUP if the driver has no bdrv_create callback. */
int bdrv_create(BlockDriver *drv,
                const char *filename, int64_t size_in_sectors,
                const char *backing_file, int flags)
{
    if (drv->bdrv_create)
        return drv->bdrv_create(filename, size_in_sectors,
                                backing_file, flags);
    return -ENOTSUP;
}

B
bellard 已提交
181
#ifdef _WIN32
182
void get_tmp_filename(char *filename, int size)
B
bellard 已提交
183
{
184
    char temp_dir[MAX_PATH];
185

186 187
    GetTempPath(MAX_PATH, temp_dir);
    GetTempFileName(temp_dir, "qem", 0, filename);
B
bellard 已提交
188 189
}
#else
190
/* Store in 'filename' (capacity 'size' bytes) the name of a freshly
   created temporary file located in $TMPDIR, or in /tmp when TMPDIR is
   unset. The file is created by mkstemp() and closed again. On any
   failure 'filename' is set to the empty string so that callers cannot
   go on to use a predictable, uncreated template name. Nothing is
   written when 'size' is not positive. */
void get_tmp_filename(char *filename, int size)
{
    const char *tmpdir;
    int fd, n;

    if (size <= 0)
        return;

    /* XXX: race condition possible */
    tmpdir = getenv("TMPDIR");
    if (!tmpdir)
        tmpdir = "/tmp";
    n = snprintf(filename, size, "%s/vl.XXXXXX", tmpdir);
    if (n < 0 || n >= size) {
        /* a truncated template no longer ends in "XXXXXX" */
        filename[0] = '\0';
        return;
    }

    fd = mkstemp(filename);
    if (fd < 0) {
        filename[0] = '\0';
        return;
    }
    close(fd);
}
B
bellard 已提交
202
#endif
B
bellard 已提交
203

B
bellard 已提交
204
#ifdef _WIN32
B
bellard 已提交
205 206 207 208 209 210
/* Return 1 if 'filename' starts with an ASCII letter immediately
   followed by ':' (e.g. "c:"), 0 otherwise. */
static int is_windows_drive_prefix(const char *filename)
{
    char letter = filename[0];
    int is_letter = (letter >= 'a' && letter <= 'z') ||
                    (letter >= 'A' && letter <= 'Z');

    return is_letter && filename[1] == ':';
}
211

B
bellard 已提交
212 213
/* Return 1 if 'filename' is a bare drive name ("d:") or starts with
   one of the two device prefixes tested below, 0 otherwise. */
static int is_windows_drive(const char *filename)
{
    int bare_drive = is_windows_drive_prefix(filename) &&
                     filename[2] == '\0';

    if (bare_drive)
        return 1;
    if (strstart(filename, "\\\\.\\", NULL))
        return 1;
    if (strstart(filename, "//./", NULL))
        return 1;
    return 0;
}
#endif

B
bellard 已提交
224 225 226 227 228 229
static BlockDriver *find_protocol(const char *filename)
{
    BlockDriver *drv1;
    char protocol[128];
    int len;
    const char *p;
B
bellard 已提交
230 231

#ifdef _WIN32
B
bellard 已提交
232 233
    if (is_windows_drive(filename) ||
        is_windows_drive_prefix(filename))
B
bellard 已提交
234 235
        return &bdrv_raw;
#endif
B
bellard 已提交
236 237 238 239 240 241 242 243 244
    p = strchr(filename, ':');
    if (!p)
        return &bdrv_raw;
    len = p - filename;
    if (len > sizeof(protocol) - 1)
        len = sizeof(protocol) - 1;
    memcpy(protocol, filename, len);
    protocol[len] = '\0';
    for(drv1 = first_drv; drv1 != NULL; drv1 = drv1->next) {
245
        if (drv1->protocol_name &&
B
bellard 已提交
246 247 248 249 250 251
            !strcmp(drv1->protocol_name, protocol))
            return drv1;
    }
    return NULL;
}

B
bellard 已提交
252 253
/* XXX: force raw format if block or character device ? It would
   simplify the BSD case */
B
bellard 已提交
254 255
static BlockDriver *find_image_format(const char *filename)
{
B
bellard 已提交
256
    int ret, score, score_max;
B
bellard 已提交
257
    BlockDriver *drv1, *drv;
B
bellard 已提交
258 259
    uint8_t buf[2048];
    BlockDriverState *bs;
260

B
bellard 已提交
261 262 263 264 265 266 267 268 269 270
    /* detect host devices. By convention, /dev/cdrom[N] is always
       recognized as a host CDROM */
    if (strstart(filename, "/dev/cdrom", NULL))
        return &bdrv_host_device;
#ifdef _WIN32
    if (is_windows_drive(filename))
        return &bdrv_host_device;
#else
    {
        struct stat st;
271
        if (stat(filename, &st) >= 0 &&
B
bellard 已提交
272 273 274 275 276
            (S_ISCHR(st.st_mode) || S_ISBLK(st.st_mode))) {
            return &bdrv_host_device;
        }
    }
#endif
277

B
bellard 已提交
278
    drv = find_protocol(filename);
B
bellard 已提交
279
    /* no need to test disk image formats for vvfat */
B
bellard 已提交
280 281
    if (drv == &bdrv_vvfat)
        return drv;
B
bellard 已提交
282

B
bellard 已提交
283 284 285 286 287 288 289 290 291
    ret = bdrv_file_open(&bs, filename, BDRV_O_RDONLY);
    if (ret < 0)
        return NULL;
    ret = bdrv_pread(bs, 0, buf, sizeof(buf));
    bdrv_delete(bs);
    if (ret < 0) {
        return NULL;
    }

B
bellard 已提交
292 293
    score_max = 0;
    for(drv1 = first_drv; drv1 != NULL; drv1 = drv1->next) {
B
bellard 已提交
294 295 296 297 298 299
        if (drv1->bdrv_probe) {
            score = drv1->bdrv_probe(buf, ret, filename);
            if (score > score_max) {
                score_max = score;
                drv = drv1;
            }
B
bellard 已提交
300
        }
B
bellard 已提交
301
    }
B
bellard 已提交
302 303 304
    return drv;
}

B
bellard 已提交
305
/* Allocate an unnamed device and open 'filename' on it with
   BDRV_O_FILE added to 'flags'. On success the new device is stored in
   *pbs and 0 is returned; on failure the device is deleted, *pbs is
   left untouched and a negative value is returned. */
int bdrv_file_open(BlockDriverState **pbs, const char *filename, int flags)
{
    BlockDriverState *bs = bdrv_new("");
    int ret;

    if (bs == NULL)
        return -ENOMEM;

    ret = bdrv_open2(bs, filename, flags | BDRV_O_FILE, NULL);
    if (ret >= 0) {
        *pbs = bs;
        return 0;
    }
    bdrv_delete(bs);
    return ret;
}

/* Open 'filename' on 'bs' without forcing a driver: equivalent to
   bdrv_open2() with a NULL driver argument. */
int bdrv_open(BlockDriverState *bs, const char *filename, int flags)
{
    BlockDriver *no_forced_driver = NULL;

    return bdrv_open2(bs, filename, flags, no_forced_driver);
}

B
bellard 已提交
327
int bdrv_open2(BlockDriverState *bs, const char *filename, int flags,
B
bellard 已提交
328 329
               BlockDriver *drv)
{
B
bellard 已提交
330
    int ret, open_flags;
331 332
    char tmp_filename[PATH_MAX];
    char backing_filename[PATH_MAX];
333

B
bellard 已提交
334 335 336
    bs->read_only = 0;
    bs->is_temporary = 0;
    bs->encrypted = 0;
B
bellard 已提交
337

B
bellard 已提交
338
    if (flags & BDRV_O_SNAPSHOT) {
B
bellard 已提交
339 340
        BlockDriverState *bs1;
        int64_t total_size;
A
aliguori 已提交
341
        int is_protocol = 0;
342

B
bellard 已提交
343 344
        /* if snapshot, we create a temporary backing file and open it
           instead of opening 'filename' directly */
345

B
bellard 已提交
346 347 348
        /* if there is a backing file, use it */
        bs1 = bdrv_new("");
        if (!bs1) {
B
bellard 已提交
349
            return -ENOMEM;
B
bellard 已提交
350 351 352 353 354
        }
        if (bdrv_open(bs1, filename, 0) < 0) {
            bdrv_delete(bs1);
            return -1;
        }
B
bellard 已提交
355
        total_size = bdrv_getlength(bs1) >> SECTOR_BITS;
A
aliguori 已提交
356 357 358 359

        if (bs1->drv && bs1->drv->protocol_name)
            is_protocol = 1;

B
bellard 已提交
360
        bdrv_delete(bs1);
361

B
bellard 已提交
362
        get_tmp_filename(tmp_filename, sizeof(tmp_filename));
A
aliguori 已提交
363 364 365 366 367 368 369 370

        /* Real path is meaningless for protocols */
        if (is_protocol)
            snprintf(backing_filename, sizeof(backing_filename),
                     "%s", filename);
        else
            realpath(filename, backing_filename);

371
        if (bdrv_create(&bdrv_qcow2, tmp_filename,
372
                        total_size, backing_filename, 0) < 0) {
B
bellard 已提交
373 374 375 376 377
            return -1;
        }
        filename = tmp_filename;
        bs->is_temporary = 1;
    }
B
bellard 已提交
378

B
bellard 已提交
379
    pstrcpy(bs->filename, sizeof(bs->filename), filename);
B
bellard 已提交
380 381
    if (flags & BDRV_O_FILE) {
        drv = find_protocol(filename);
B
bellard 已提交
382
        if (!drv)
B
bellard 已提交
383 384 385 386 387 388 389
            return -ENOENT;
    } else {
        if (!drv) {
            drv = find_image_format(filename);
            if (!drv)
                return -1;
        }
B
bellard 已提交
390 391 392 393 394
    }
    bs->drv = drv;
    bs->opaque = qemu_mallocz(drv->instance_size);
    if (bs->opaque == NULL && drv->instance_size > 0)
        return -1;
B
bellard 已提交
395 396 397
    /* Note: for compatibility, we open disk image files as RDWR, and
       RDONLY as fallback */
    if (!(flags & BDRV_O_FILE))
398
        open_flags = BDRV_O_RDWR | (flags & BDRV_O_CACHE_MASK);
B
bellard 已提交
399 400 401
    else
        open_flags = flags & ~(BDRV_O_FILE | BDRV_O_SNAPSHOT);
    ret = drv->bdrv_open(bs, filename, open_flags);
402
    if ((ret == -EACCES || ret == -EPERM) && !(flags & BDRV_O_FILE)) {
403
        ret = drv->bdrv_open(bs, filename, open_flags & ~BDRV_O_RDWR);
B
bellard 已提交
404 405
        bs->read_only = 1;
    }
B
bellard 已提交
406 407
    if (ret < 0) {
        qemu_free(bs->opaque);
B
bellard 已提交
408 409
        bs->opaque = NULL;
        bs->drv = NULL;
B
bellard 已提交
410
        return ret;
411
    }
412 413 414
    if (drv->bdrv_getlength) {
        bs->total_sectors = bdrv_getlength(bs) >> SECTOR_BITS;
    }
B
bellard 已提交
415
#ifndef _WIN32
B
bellard 已提交
416 417 418 419
    if (bs->is_temporary) {
        unlink(filename);
    }
#endif
B
bellard 已提交
420
    if (bs->backing_file[0] != '\0') {
B
bellard 已提交
421 422 423 424 425
        /* if there is a backing file, use it */
        bs->backing_hd = bdrv_new("");
        if (!bs->backing_hd) {
        fail:
            bdrv_close(bs);
B
bellard 已提交
426
            return -ENOMEM;
427
        }
B
bellard 已提交
428 429
        path_combine(backing_filename, sizeof(backing_filename),
                     filename, bs->backing_file);
430
        if (bdrv_open(bs->backing_hd, backing_filename, open_flags) < 0)
431 432 433
            goto fail;
    }

B
bellard 已提交
434
    /* call the change callback */
B
bellard 已提交
435
    bs->media_changed = 1;
B
bellard 已提交
436 437 438 439
    if (bs->change_cb)
        bs->change_cb(bs->change_opaque);

    return 0;
B
bellard 已提交
440 441 442 443
}

/* Close the image opened on 'bs', if any: delete the backing device,
   call the driver's close callback, free the driver state and invoke
   the change callback. Does nothing when no driver is attached. The
   BlockDriverState itself stays allocated and can be opened again. */
void bdrv_close(BlockDriverState *bs)
{
    if (!bs->drv)
        return;

    if (bs->backing_hd) {
        bdrv_delete(bs->backing_hd);
        /* 'bs' outlives this call: do not keep a pointer to freed
           memory that a later close would delete a second time */
        bs->backing_hd = NULL;
    }
    bs->drv->bdrv_close(bs);
    qemu_free(bs->opaque);
#ifdef _WIN32
    if (bs->is_temporary) {
        unlink(bs->filename);
    }
#endif
    bs->opaque = NULL;
    bs->drv = NULL;

    /* call the change callback */
    bs->media_changed = 1;
    if (bs->change_cb)
        bs->change_cb(bs->change_opaque);
}

/* Remove 'bs' from the global device list (if it is listed), close it
   and free it. */
void bdrv_delete(BlockDriverState *bs)
{
    BlockDriverState **link;

    for (link = &bdrv_first; *link != NULL; link = &(*link)->next) {
        if (*link == bs) {
            *link = bs->next;
            break;
        }
    }

    bdrv_close(bs);
    qemu_free(bs);
}

478 479 480
/* Commit COW file into the raw image: every sector the driver reports
   as allocated in 'bs' is copied to bs->backing_hd, then the driver's
   bdrv_make_empty callback (if any) is called.

   Returns 0 on success, or a negative value:
     -ENOMEDIUM  no driver attached
     -EACCES     'bs' is read-only
     -ENOTSUP    no backing device, or the driver cannot report
                 allocation
     -EIO        a sector could not be copied
   or the error reported by bdrv_getlength() / bdrv_make_empty(). */
int bdrv_commit(BlockDriverState *bs)
{
    BlockDriver *drv = bs->drv;
    int64_t i, total_sectors, length;
    int n, j;
    unsigned char sector[SECTOR_SIZE];

    if (!drv)
        return -ENOMEDIUM;

    if (bs->read_only) {
        return -EACCES;
    }

    if (!bs->backing_hd || !drv->bdrv_is_allocated) {
        return -ENOTSUP;
    }

    /* An unknown length must abort the commit: falling through would
       skip the copy loop and still empty the COW image below. */
    length = bdrv_getlength(bs);
    if (length < 0)
        return (int)length;
    total_sectors = length >> SECTOR_BITS;

    for (i = 0; i < total_sectors;) {
        int allocated = drv->bdrv_is_allocated(bs, i, 65536, &n);

        /* without forward progress the loop would never end */
        if (n <= 0)
            return -EIO;

        if (!allocated) {
            i += n;
            continue;
        }
        for (j = 0; j < n; j++) {
            if (bdrv_read(bs, i, sector, 1) != 0) {
                return -EIO;
            }

            if (bdrv_write(bs->backing_hd, i, sector, 1) != 0) {
                return -EIO;
            }
            i++;
        }
    }

    if (drv->bdrv_make_empty)
        return drv->bdrv_make_empty(bs);

    return 0;
}

B
bellard 已提交
521
/* return < 0 if error. See bdrv_write() for the return codes */
522
int bdrv_read(BlockDriverState *bs, int64_t sector_num,
B
bellard 已提交
523 524
              uint8_t *buf, int nb_sectors)
{
B
bellard 已提交
525 526
    BlockDriver *drv = bs->drv;

B
bellard 已提交
527 528
    if (!drv)
        return -ENOMEDIUM;
B
bellard 已提交
529

B
bellard 已提交
530 531 532 533 534 535 536
    if (drv->bdrv_pread) {
        int ret, len;
        len = nb_sectors * 512;
        ret = drv->bdrv_pread(bs, sector_num * 512, buf, len);
        if (ret < 0)
            return ret;
        else if (ret != len)
B
bellard 已提交
537
            return -EINVAL;
538 539 540
        else {
	    bs->rd_bytes += (unsigned) len;
	    bs->rd_ops ++;
B
bellard 已提交
541
            return 0;
542
	}
B
bellard 已提交
543 544
    } else {
        return drv->bdrv_read(bs, sector_num, buf, nb_sectors);
545
    }
B
bellard 已提交
546 547
}

548
/* Return < 0 if error. Important errors are:
B
bellard 已提交
549 550 551 552 553
  -EIO         generic I/O error (may happen for all errors)
  -ENOMEDIUM   No media inserted.
  -EINVAL      Invalid sector number or nb_sectors
  -EACCES      Trying to write a read-only device
*/
554
int bdrv_write(BlockDriverState *bs, int64_t sector_num,
B
bellard 已提交
555 556
               const uint8_t *buf, int nb_sectors)
{
B
bellard 已提交
557
    BlockDriver *drv = bs->drv;
B
bellard 已提交
558 559
    if (!bs->drv)
        return -ENOMEDIUM;
B
bellard 已提交
560
    if (bs->read_only)
B
bellard 已提交
561
        return -EACCES;
B
bellard 已提交
562 563 564 565 566 567 568 569
    if (drv->bdrv_pwrite) {
        int ret, len;
        len = nb_sectors * 512;
        ret = drv->bdrv_pwrite(bs, sector_num * 512, buf, len);
        if (ret < 0)
            return ret;
        else if (ret != len)
            return -EIO;
570 571 572
        else {
	    bs->wr_bytes += (unsigned) len;
	    bs->wr_ops ++;
B
bellard 已提交
573
            return 0;
574
	}
B
bellard 已提交
575 576 577 578 579
    } else {
        return drv->bdrv_write(bs, sector_num, buf, nb_sectors);
    }
}

580
/* Byte granular read built on top of bdrv_read(): an unaligned head
   and tail go through a one-sector bounce buffer, whole sectors in
   between are read directly into 'buf'. Returns 'count1' on success
   and -EIO if any sector read fails. */
static int bdrv_pread_em(BlockDriverState *bs, int64_t offset,
                         uint8_t *buf, int count1)
{
    uint8_t bounce[SECTOR_SIZE];
    int64_t sector = offset >> SECTOR_BITS;
    int remaining = count1;
    int head, whole, whole_bytes;

    /* first read to align to sector start */
    head = (SECTOR_SIZE - offset) & (SECTOR_SIZE - 1);
    if (head > remaining)
        head = remaining;
    if (head > 0) {
        if (bdrv_read(bs, sector, bounce, 1) < 0)
            return -EIO;
        memcpy(buf, bounce + (offset & (SECTOR_SIZE - 1)), head);
        remaining -= head;
        if (remaining == 0)
            return count1;
        sector++;
        buf += head;
    }

    /* read the sectors "in place" */
    whole = remaining >> SECTOR_BITS;
    if (whole > 0) {
        if (bdrv_read(bs, sector, buf, whole) < 0)
            return -EIO;
        whole_bytes = whole << SECTOR_BITS;
        sector += whole;
        buf += whole_bytes;
        remaining -= whole_bytes;
    }

    /* add data from the last sector */
    if (remaining > 0) {
        if (bdrv_read(bs, sector, bounce, 1) < 0)
            return -EIO;
        memcpy(buf, bounce, remaining);
    }
    return count1;
}

624
/* Byte granular write built on top of bdrv_read()/bdrv_write(): an
   unaligned head and tail are merged into the existing sector through
   a one-sector bounce buffer (read, patch, write back), whole sectors
   in between are written directly from 'buf'. Returns 'count1' on
   success and -EIO if any sector access fails. */
static int bdrv_pwrite_em(BlockDriverState *bs, int64_t offset,
                          const uint8_t *buf, int count1)
{
    uint8_t bounce[SECTOR_SIZE];
    int64_t sector = offset >> SECTOR_BITS;
    int remaining = count1;
    int head, whole, whole_bytes;

    /* first write to align to sector start */
    head = (SECTOR_SIZE - offset) & (SECTOR_SIZE - 1);
    if (head > remaining)
        head = remaining;
    if (head > 0) {
        if (bdrv_read(bs, sector, bounce, 1) < 0)
            return -EIO;
        memcpy(bounce + (offset & (SECTOR_SIZE - 1)), buf, head);
        if (bdrv_write(bs, sector, bounce, 1) < 0)
            return -EIO;
        remaining -= head;
        if (remaining == 0)
            return count1;
        sector++;
        buf += head;
    }

    /* write the sectors "in place" */
    whole = remaining >> SECTOR_BITS;
    if (whole > 0) {
        if (bdrv_write(bs, sector, buf, whole) < 0)
            return -EIO;
        whole_bytes = whole << SECTOR_BITS;
        sector += whole;
        buf += whole_bytes;
        remaining -= whole_bytes;
    }

    /* add data from the last sector */
    if (remaining > 0) {
        if (bdrv_read(bs, sector, bounce, 1) < 0)
            return -EIO;
        memcpy(bounce, buf, remaining);
        if (bdrv_write(bs, sector, bounce, 1) < 0)
            return -EIO;
    }
    return count1;
}

/**
673
 * Read with byte offsets (needed only for file protocols)
B
bellard 已提交
674
 */
675
int bdrv_pread(BlockDriverState *bs, int64_t offset,
B
bellard 已提交
676 677 678 679 680
               void *buf1, int count1)
{
    BlockDriver *drv = bs->drv;

    if (!drv)
B
bellard 已提交
681
        return -ENOMEDIUM;
B
bellard 已提交
682
    if (!drv->bdrv_pread)
B
bellard 已提交
683
        return bdrv_pread_em(bs, offset, buf1, count1);
B
bellard 已提交
684 685 686
    return drv->bdrv_pread(bs, offset, buf1, count1);
}

687 688
/**
 * Write with byte offsets (needed only for file protocols)
B
bellard 已提交
689
 */
690
int bdrv_pwrite(BlockDriverState *bs, int64_t offset,
B
bellard 已提交
691 692 693 694 695
                const void *buf1, int count1)
{
    BlockDriver *drv = bs->drv;

    if (!drv)
B
bellard 已提交
696
        return -ENOMEDIUM;
B
bellard 已提交
697
    if (!drv->bdrv_pwrite)
B
bellard 已提交
698
        return bdrv_pwrite_em(bs, offset, buf1, count1);
B
bellard 已提交
699 700 701 702 703 704 705 706 707 708
    return drv->bdrv_pwrite(bs, offset, buf1, count1);
}

/**
 * Truncate file to 'offset' bytes (needed only for file protocols).
 *
 * Returns -ENOMEDIUM when no driver is attached, -ENOTSUP when the
 * driver has no bdrv_truncate callback, and the callback's result
 * otherwise.
 */
int bdrv_truncate(BlockDriverState *bs, int64_t offset)
{
    BlockDriver *drv = bs->drv;

    if (drv == NULL)
        return -ENOMEDIUM;
    if (drv->bdrv_truncate)
        return drv->bdrv_truncate(bs, offset);
    return -ENOTSUP;
}

/**
 * Length of a file in bytes. Return < 0 if error or unknown.
 *
 * Drivers without a bdrv_getlength callback are handled in legacy
 * mode: the length is derived from bs->total_sectors.
 */
int64_t bdrv_getlength(BlockDriverState *bs)
{
    BlockDriver *drv = bs->drv;

    if (drv == NULL)
        return -ENOMEDIUM;
    if (drv->bdrv_getlength)
        return drv->bdrv_getlength(bs);
    /* legacy mode */
    return bs->total_sectors * SECTOR_SIZE;
}

B
bellard 已提交
730
/* return 0 as number of sectors if no device present or error */
731
void bdrv_get_geometry(BlockDriverState *bs, uint64_t *nb_sectors_ptr)
B
bellard 已提交
732
{
B
bellard 已提交
733 734 735 736 737 738 739
    int64_t length;
    length = bdrv_getlength(bs);
    if (length < 0)
        length = 0;
    else
        length = length >> SECTOR_BITS;
    *nb_sectors_ptr = length;
B
bellard 已提交
740
}
B
bellard 已提交
741

742 743 744 745 746 747 748 749 750 751 752 753 754 755 756 757 758 759 760 761 762 763 764 765 766 767 768 769 770 771 772 773 774 775 776 777 778 779 780 781 782 783 784 785 786 787 788 789 790 791 792 793 794 795 796 797 798 799 800 801 802 803 804 805 806 807 808 809 810 811 812 813 814 815 816 817 818 819 820 821 822 823 824 825 826 827 828 829 830 831 832 833 834 835 836 837 838 839 840 841 842 843 844 845 846 847 848 849 850 851 852 853 854 855 856 857
/* One entry of the MSDOS partition table. guess_disk_lchs() overlays
   this structure on the boot sector starting at byte 0x1be, hence the
   packed attribute; the 32-bit fields are little-endian on disk
   (nr_sects is read through le32_to_cpu()). */
struct partition {
        uint8_t boot_ind;           /* 0x80 - active */
        uint8_t head;               /* starting head */
        uint8_t sector;             /* starting sector */
        uint8_t cyl;                /* starting cylinder */
        uint8_t sys_ind;            /* What partition type */
        uint8_t end_head;           /* end head */
        uint8_t end_sector;         /* end sector */
        uint8_t end_cyl;            /* end cylinder */
        uint32_t start_sect;        /* starting sector counting from 0 */
        uint32_t nr_sects;          /* nr of sectors in partition */
} __attribute__((packed));

/* Try to guess the disk logical geometry from the MSDOS partition
   table. The first of the four entries with a non-zero sector count
   and a non-zero end head that yields between 1 and 16383 cylinders is
   used. Return 0 if OK (outputs written), -1 if could not guess
   (outputs untouched). */
static int guess_disk_lchs(BlockDriverState *bs,
                           int *pcylinders, int *pheads, int *psectors)
{
    uint8_t buf[512];
    int i, heads, sectors;
    struct partition *p;
    /* unsigned 64-bit: matches the bdrv_get_geometry() prototype and
       keeps the cylinder count from being truncated before it is
       range checked */
    uint64_t nb_sectors, cylinders;

    bdrv_get_geometry(bs, &nb_sectors);

    if (bdrv_read(bs, 0, buf, 1) < 0)
        return -1;
    /* test msdos magic */
    if (buf[510] != 0x55 || buf[511] != 0xaa)
        return -1;

    for (i = 0; i < 4; i++) {
        p = ((struct partition *)(buf + 0x1be)) + i;
        if (le32_to_cpu(p->nr_sects) == 0 || p->end_head == 0)
            continue;
        /* We make the assumption that the partition terminates on
           a cylinder boundary */
        heads = p->end_head + 1;
        sectors = p->end_sector & 63;
        if (sectors == 0)
            continue;
        cylinders = nb_sectors / (heads * sectors);
        if (cylinders < 1 || cylinders > 16383)
            continue;
        *pheads = heads;
        *psectors = sectors;
        *pcylinders = (int)cylinders;
        return 0;
    }
    return -1;
}

/* Determine the CHS geometry to expose for 'bs'.

   A geometry hint already stored on the device is returned as is.
   Otherwise the geometry is guessed from the partition table; if that
   fails, or the guess has more than 16 heads (a BIOS LBA translation
   was active), a standard 16 heads / 63 sectors geometry is derived
   from the device size, with the cylinder count clamped to
   [2, 16383]. A translation hint left at BIOS_ATA_TRANSLATION_AUTO is
   updated to match, and the resulting geometry is stored back as the
   device's geometry hint. */
void bdrv_guess_geometry(BlockDriverState *bs, int *pcyls, int *pheads, int *psecs)
{
    int translation, lba_detected = 0;
    int cylinders, heads, secs;
    /* unsigned 64-bit: matches the bdrv_get_geometry() prototype and
       lets the cylinder count be clamped before it is narrowed */
    uint64_t nb_sectors, std_cylinders;

    /* if a geometry hint is available, use it */
    bdrv_get_geometry(bs, &nb_sectors);
    bdrv_get_geometry_hint(bs, &cylinders, &heads, &secs);
    translation = bdrv_get_translation_hint(bs);
    if (cylinders != 0) {
        *pcyls = cylinders;
        *pheads = heads;
        *psecs = secs;
    } else {
        if (guess_disk_lchs(bs, &cylinders, &heads, &secs) == 0) {
            if (heads > 16) {
                /* if heads > 16, it means that a BIOS LBA
                   translation was active, so the default
                   hardware geometry is OK */
                lba_detected = 1;
                goto default_geometry;
            } else {
                *pcyls = cylinders;
                *pheads = heads;
                *psecs = secs;
                /* disable any translation to be in sync with
                   the logical geometry */
                if (translation == BIOS_ATA_TRANSLATION_AUTO) {
                    bdrv_set_translation_hint(bs,
                                              BIOS_ATA_TRANSLATION_NONE);
                }
            }
        } else {
        default_geometry:
            /* if no geometry, use a standard physical disk geometry */
            std_cylinders = nb_sectors / (16 * 63);

            if (std_cylinders > 16383)
                std_cylinders = 16383;
            else if (std_cylinders < 2)
                std_cylinders = 2;
            *pcyls = (int)std_cylinders;
            *pheads = 16;
            *psecs = 63;
            if ((lba_detected == 1) && (translation == BIOS_ATA_TRANSLATION_AUTO)) {
                if ((*pcyls * *pheads) <= 131072) {
                    bdrv_set_translation_hint(bs,
                                              BIOS_ATA_TRANSLATION_LARGE);
                } else {
                    bdrv_set_translation_hint(bs,
                                              BIOS_ATA_TRANSLATION_LBA);
                }
            }
        }
        bdrv_set_geometry_hint(bs, *pcyls, *pheads, *psecs);
    }
}

858
/* Record a cylinders/heads/sectors geometry hint on the device. */
void bdrv_set_geometry_hint(BlockDriverState *bs,
                            int cyls, int heads, int secs)
{
    bs->secs = secs;
    bs->heads = heads;
    bs->cyls = cyls;
}

/* Record the device type; CDROM and floppy types also mark the device
   as removable, any other type clears that flag. */
void bdrv_set_type_hint(BlockDriverState *bs, int type)
{
    int is_cdrom = (type == BDRV_TYPE_CDROM);
    int is_floppy = (type == BDRV_TYPE_FLOPPY);

    bs->type = type;
    bs->removable = (is_cdrom || is_floppy);
}

B
bellard 已提交
873 874 875 876 877
/* Record the BIOS translation hint for the device; bdrv_guess_geometry()
   passes BIOS_ATA_TRANSLATION_* values here. */
void bdrv_set_translation_hint(BlockDriverState *bs, int translation)
{
    bs->translation = translation;
}

878
/* Copy the stored cylinders/heads/sectors geometry hint into the three
   output parameters. bdrv_guess_geometry() treats a cylinder count of
   0 as "no hint". */
void bdrv_get_geometry_hint(BlockDriverState *bs,
                            int *pcyls, int *pheads, int *psecs)
{
    *psecs = bs->secs;
    *pheads = bs->heads;
    *pcyls = bs->cyls;
}

/* Return the device type recorded by bdrv_set_type_hint(). */
int bdrv_get_type_hint(BlockDriverState *bs)
{
    return bs->type;
}

B
bellard 已提交
891 892 893 894 895
/* Return the translation hint recorded by bdrv_set_translation_hint(). */
int bdrv_get_translation_hint(BlockDriverState *bs)
{
    return bs->translation;
}

B
bellard 已提交
896 897 898 899 900 901 902 903 904 905
/* Return the removable flag, which bdrv_set_type_hint() sets for CDROM
   and floppy device types. */
int bdrv_is_removable(BlockDriverState *bs)
{
    return bs->removable;
}

/* Return the read-only flag; bdrv_open2() sets it when it falls back
   from a read-write to a read-only open. */
int bdrv_is_read_only(BlockDriverState *bs)
{
    return bs->read_only;
}

906 907 908 909 910
/* Return the device's 'sg' flag.
   NOTE(review): presumably marks a SCSI generic device -- confirm
   against the code that sets bs->sg. */
int bdrv_is_sg(BlockDriverState *bs)
{
    return bs->sg;
}

B
bellard 已提交
911
/* XXX: no longer used */
912
void bdrv_set_change_cb(BlockDriverState *bs,
B
bellard 已提交
913 914 915 916 917 918
                        void (*change_cb)(void *opaque), void *opaque)
{
    bs->change_cb = change_cb;
    bs->change_opaque = opaque;
}

B
bellard 已提交
919 920 921 922 923 924 925 926 927 928 929 930 931 932 933 934 935 936 937 938 939 940 941 942
/* Return 1 if the backing device is encrypted; otherwise return the
   device's own 'encrypted' flag. */
int bdrv_is_encrypted(BlockDriverState *bs)
{
    int backing_encrypted = bs->backing_hd && bs->backing_hd->encrypted;

    return backing_encrypted ? 1 : bs->encrypted;
}

/* Set the encryption key. An encrypted backing device receives the key
   first; if only the backing device is encrypted that result is final.
   Returns the driver's result, a negative error from the backing
   device, or -1 if 'bs' is not encrypted or its driver cannot take a
   key. */
int bdrv_set_key(BlockDriverState *bs, const char *key)
{
    BlockDriverState *backing = bs->backing_hd;

    if (backing && backing->encrypted) {
        int ret = bdrv_set_key(backing, key);

        if (ret < 0)
            return ret;
        if (!bs->encrypted)
            return 0;
    }

    if (bs->encrypted && bs->drv && bs->drv->bdrv_set_key)
        return bs->drv->bdrv_set_key(bs, key);
    return -1;
}

/*
 * Copy the format name of the driver attached to 'bs' into 'buf' (bounded by
 * 'buf_size' via pstrcpy). Without a driver, 'buf' becomes the empty string.
 */
void bdrv_get_format(BlockDriverState *bs, char *buf, int buf_size)
{
    BlockDriver *drv = bs->drv;

    if (drv != NULL) {
        pstrcpy(buf, buf_size, drv->format_name);
        return;
    }
    buf[0] = '\0';
}

950
void bdrv_iterate_format(void (*it)(void *opaque, const char *name),
B
bellard 已提交
951 952 953 954 955 956 957 958 959
                         void *opaque)
{
    BlockDriver *drv;

    for (drv = first_drv; drv != NULL; drv = drv->next) {
        it(opaque, drv->format_name);
    }
}

B
bellard 已提交
960 961 962 963 964 965 966 967 968 969 970
/*
 * Look up a block device by name. Walks the list starting at bdrv_first and
 * returns the first entry whose device_name equals 'name', or NULL when no
 * entry matches.
 */
BlockDriverState *bdrv_find(const char *name)
{
    BlockDriverState *cur = bdrv_first;

    while (cur != NULL) {
        if (strcmp(name, cur->device_name) == 0) {
            return cur;
        }
        cur = cur->next;
    }
    return NULL;
}

B
bellard 已提交
971 972 973 974 975 976 977 978 979
/*
 * Call 'it' once per block device, in list order starting at bdrv_first,
 * passing 'opaque' and the device name.
 */
void bdrv_iterate(void (*it)(void *opaque, const char *name), void *opaque)
{
    BlockDriverState *cur = bdrv_first;

    while (cur != NULL) {
        it(opaque, cur->device_name);
        cur = cur->next;
    }
}

B
bellard 已提交
980 981 982 983 984
/*
 * Return the device name of 'bs'. The returned pointer refers to storage
 * inside 'bs'; no copy is made.
 */
const char *bdrv_get_device_name(BlockDriverState *bs)
{
    return bs->device_name;
}

P
pbrook 已提交
985 986 987 988 989 990 991 992
/*
 * Flush 'bs' through its driver's bdrv_flush hook (when the driver provides
 * one), then recursively flush its backing image, if any.
 *
 * A device without a driver is a normal state in this file (bdrv_info()
 * reports it as "[not inserted]"), so it is treated as having nothing to
 * flush instead of dereferencing a NULL driver pointer.
 */
void bdrv_flush(BlockDriverState *bs)
{
    BlockDriver *drv = bs->drv;

    if (!drv)
        return;
    if (drv->bdrv_flush)
        drv->bdrv_flush(bs);
    if (bs->backing_hd)
        bdrv_flush(bs->backing_hd);
}

A
aliguori 已提交
993 994 995 996 997 998 999 1000 1001 1002
/*
 * Flush every block device that can hold pending writes: it must have a
 * driver, must not be read-only and, if removable, must have media inserted.
 */
void bdrv_flush_all(void)
{
    BlockDriverState *cur;

    for (cur = bdrv_first; cur != NULL; cur = cur->next) {
        if (!cur->drv) {
            continue;
        }
        if (bdrv_is_read_only(cur)) {
            continue;
        }
        if (bdrv_is_removable(cur) && !bdrv_is_inserted(cur)) {
            continue;
        }
        bdrv_flush(cur);
    }
}

1003 1004 1005 1006 1007 1008 1009 1010 1011 1012 1013 1014 1015 1016 1017 1018 1019 1020 1021 1022 1023 1024 1025 1026 1027 1028 1029
/*
 * Returns true iff the specified sector is present in the disk image.
 *
 * Drivers that do not implement bdrv_is_allocated are assumed not to support
 * backing files, so every sector below total_sectors is reported as
 * allocated; a sector at or past total_sectors yields 0 with *pnum = 0.
 *
 * 'pnum' receives the number of sectors (the specified sector and those
 * immediately following it) known to share the same allocated/unallocated
 * state.
 *
 * 'nb_sectors' is the largest value 'pnum' should be set to.
 */
int bdrv_is_allocated(BlockDriverState *bs, int64_t sector_num, int nb_sectors,
                      int *pnum)
{
    int64_t remaining;

    if (bs->drv->bdrv_is_allocated) {
        return bs->drv->bdrv_is_allocated(bs, sector_num, nb_sectors, pnum);
    }

    if (sector_num >= bs->total_sectors) {
        *pnum = 0;
        return 0;
    }

    /* Clamp the run length to what is left of the device. */
    remaining = bs->total_sectors - sector_num;
    if (remaining < nb_sectors) {
        *pnum = remaining;
    } else {
        *pnum = nb_sectors;
    }
    return 1;
}

B
bellard 已提交
1030 1031 1032 1033 1034 1035 1036 1037 1038 1039 1040 1041 1042 1043 1044 1045 1046 1047 1048 1049 1050 1051
void bdrv_info(void)
{
    BlockDriverState *bs;

    for (bs = bdrv_first; bs != NULL; bs = bs->next) {
        term_printf("%s:", bs->device_name);
        term_printf(" type=");
        switch(bs->type) {
        case BDRV_TYPE_HD:
            term_printf("hd");
            break;
        case BDRV_TYPE_CDROM:
            term_printf("cdrom");
            break;
        case BDRV_TYPE_FLOPPY:
            term_printf("floppy");
            break;
        }
        term_printf(" removable=%d", bs->removable);
        if (bs->removable) {
            term_printf(" locked=%d", bs->locked);
        }
B
bellard 已提交
1052
        if (bs->drv) {
1053 1054 1055 1056 1057 1058
            term_printf(" file=");
	    term_print_filename(bs->filename);
            if (bs->backing_file[0] != '\0') {
                term_printf(" backing_file=");
		term_print_filename(bs->backing_file);
	    }
B
bellard 已提交
1059
            term_printf(" ro=%d", bs->read_only);
B
bellard 已提交
1060 1061 1062
            term_printf(" drv=%s", bs->drv->format_name);
            if (bs->encrypted)
                term_printf(" encrypted");
B
bellard 已提交
1063 1064 1065 1066 1067 1068
        } else {
            term_printf(" [not inserted]");
        }
        term_printf("\n");
    }
}
1069 1070 1071 1072 1073 1074 1075 1076 1077 1078 1079 1080 1081 1082 1083 1084 1085 1086

/*
 * The "info blockstats" command: print the read/write byte and operation
 * counters of every block device, one line per device.
 */
void bdrv_info_stats (void)
{
    BlockDriverState *cur = bdrv_first;

    while (cur != NULL) {
        term_printf("%s:"
                    " rd_bytes=%" PRIu64
                    " wr_bytes=%" PRIu64
                    " rd_operations=%" PRIu64
                    " wr_operations=%" PRIu64
                    "\n",
                    cur->device_name,
                    cur->rd_bytes, cur->wr_bytes,
                    cur->rd_ops, cur->wr_ops);
        cur = cur->next;
    }
}
B
bellard 已提交
1087

1088
/*
 * Copy the backing file name of 'bs' into 'filename' (bounded by
 * 'filename_size' via pstrcpy). When 'bs' has no backing_hd, the result is
 * the empty string.
 */
void bdrv_get_backing_filename(BlockDriverState *bs,
                               char *filename, int filename_size)
{
    const char *src = bs->backing_hd ? bs->backing_file : "";

    pstrcpy(filename, filename_size, src);
}

1098
/*
 * Forward a compressed write to the driver of 'bs'.
 *
 * Returns -ENOMEDIUM when 'bs' has no driver, -ENOTSUP when the driver has
 * no bdrv_write_compressed hook, otherwise the hook's return value.
 */
int bdrv_write_compressed(BlockDriverState *bs, int64_t sector_num,
                          const uint8_t *buf, int nb_sectors)
{
    BlockDriver *drv = bs->drv;

    if (drv == NULL) {
        return -ENOMEDIUM;
    }
    if (drv->bdrv_write_compressed == NULL) {
        return -ENOTSUP;
    }
    return drv->bdrv_write_compressed(bs, sector_num, buf, nb_sectors);
}
1108

B
bellard 已提交
1109 1110 1111 1112
/*
 * Fill '*bdi' with driver-provided information about 'bs'.
 *
 * Returns -ENOMEDIUM when 'bs' has no driver and -ENOTSUP when the driver
 * has no bdrv_get_info hook; '*bdi' is left untouched in both cases.
 * Otherwise '*bdi' is zeroed first and the hook's return value is returned.
 */
int bdrv_get_info(BlockDriverState *bs, BlockDriverInfo *bdi)
{
    BlockDriver *drv = bs->drv;

    if (drv == NULL) {
        return -ENOMEDIUM;
    }
    if (drv->bdrv_get_info == NULL) {
        return -ENOTSUP;
    }
    memset(bdi, 0, sizeof(*bdi));
    return drv->bdrv_get_info(bs, bdi);
}

/**************************************************************/
/* handling of snapshots */

1123
int bdrv_snapshot_create(BlockDriverState *bs,
B
bellard 已提交
1124 1125 1126 1127
                         QEMUSnapshotInfo *sn_info)
{
    BlockDriver *drv = bs->drv;
    if (!drv)
B
bellard 已提交
1128
        return -ENOMEDIUM;
B
bellard 已提交
1129 1130 1131 1132 1133
    if (!drv->bdrv_snapshot_create)
        return -ENOTSUP;
    return drv->bdrv_snapshot_create(bs, sn_info);
}

1134
/*
 * Ask the driver of 'bs' to switch to the snapshot named by 'snapshot_id'.
 *
 * Returns -ENOMEDIUM when 'bs' has no driver, -ENOTSUP when the driver has
 * no bdrv_snapshot_goto hook, otherwise the hook's return value.
 */
int bdrv_snapshot_goto(BlockDriverState *bs,
                       const char *snapshot_id)
{
    BlockDriver *drv = bs->drv;

    if (drv == NULL) {
        return -ENOMEDIUM;
    }
    if (drv->bdrv_snapshot_goto == NULL) {
        return -ENOTSUP;
    }
    return drv->bdrv_snapshot_goto(bs, snapshot_id);
}

/*
 * Ask the driver of 'bs' to delete the snapshot named by 'snapshot_id'.
 *
 * Returns -ENOMEDIUM when 'bs' has no driver, -ENOTSUP when the driver has
 * no bdrv_snapshot_delete hook, otherwise the hook's return value.
 */
int bdrv_snapshot_delete(BlockDriverState *bs, const char *snapshot_id)
{
    BlockDriver *drv = bs->drv;

    if (drv == NULL) {
        return -ENOMEDIUM;
    }
    if (drv->bdrv_snapshot_delete == NULL) {
        return -ENOTSUP;
    }
    return drv->bdrv_snapshot_delete(bs, snapshot_id);
}

1155
int bdrv_snapshot_list(BlockDriverState *bs,
B
bellard 已提交
1156 1157 1158 1159
                       QEMUSnapshotInfo **psn_info)
{
    BlockDriver *drv = bs->drv;
    if (!drv)
B
bellard 已提交
1160
        return -ENOMEDIUM;
B
bellard 已提交
1161 1162 1163 1164 1165 1166 1167 1168 1169 1170 1171 1172 1173 1174 1175 1176 1177 1178 1179
    if (!drv->bdrv_snapshot_list)
        return -ENOTSUP;
    return drv->bdrv_snapshot_list(bs, psn_info);
}

#define NB_SUFFIXES 4

/*
 * Format 'size' as a short human-readable string in 'buf' (at most
 * 'buf_size' bytes, including the terminating NUL) and return 'buf'.
 *
 * Values up to 999 (including negative values) are printed as plain
 * integers. Larger values are scaled by successive powers of 1024 and tagged
 * with K, M, G or T: one decimal place while the value is below 10 units of
 * the current scale, otherwise an integer rounded to nearest. Values too
 * large for the biggest suffix are still printed in T.
 */
char *get_human_readable_size(char *buf, int buf_size, int64_t size)
{
    /* Exactly NB_SUFFIXES characters; deliberately not NUL-terminated. */
    static const char suffixes[NB_SUFFIXES] = "KMGT";
    int64_t base;
    int64_t rounded;
    int i;

    if (size <= 999) {
        snprintf(buf, buf_size, "%" PRId64, size);
        return buf;
    }

    base = 1024;
    for (i = 0; i < NB_SUFFIXES; i++) {
        if (size < (10 * base)) {
            snprintf(buf, buf_size, "%0.1f%c",
                     (double)size / base,
                     suffixes[i]);
            break;
        }
        if (size < (1000 * base) || i == (NB_SUFFIXES - 1)) {
            /*
             * Round to nearest using quotient and remainder. Computing
             * size + base / 2 would be signed overflow (undefined
             * behaviour) for sizes close to INT64_MAX.
             */
            rounded = size / base;
            if ((size % base) >= (base >> 1)) {
                rounded++;
            }
            snprintf(buf, buf_size, "%" PRId64 "%c",
                     rounded,
                     suffixes[i]);
            break;
        }
        base = base * 1024;
    }
    return buf;
}

/*
 * Format one line of the snapshot table into 'buf' (bounded by 'buf_size')
 * and return 'buf'.
 *
 * With sn == NULL the column header line is produced. Otherwise the line
 * holds the snapshot id, name, human-readable VM state size, local date of
 * sn->date_sec, and the VM clock as hh:mm:ss.mmm.
 */
char *bdrv_snapshot_dump(char *buf, int buf_size, QEMUSnapshotInfo *sn)
{
    char size_buf[128], date_buf[128], clock_buf[128];
#ifdef _WIN32
    struct tm *ptm;
#else
    struct tm tm;
#endif
    time_t ti;
    int64_t secs;

    if (!sn) {
        snprintf(buf, buf_size,
                 "%-10s%-20s%7s%20s%15s",
                 "ID", "TAG", "VM SIZE", "DATE", "VM CLOCK");
        return buf;
    }

    /* Date column: local time of the snapshot's creation timestamp. */
    ti = sn->date_sec;
#ifdef _WIN32
    ptm = localtime(&ti);
    strftime(date_buf, sizeof(date_buf),
             "%Y-%m-%d %H:%M:%S", ptm);
#else
    localtime_r(&ti, &tm);
    strftime(date_buf, sizeof(date_buf),
             "%Y-%m-%d %H:%M:%S", &tm);
#endif

    /* VM clock column: nanoseconds split into h:m:s and milliseconds. */
    secs = sn->vm_clock_nsec / 1000000000;
    snprintf(clock_buf, sizeof(clock_buf),
             "%02d:%02d:%02d.%03d",
             (int)(secs / 3600),
             (int)((secs / 60) % 60),
             (int)(secs % 60),
             (int)((sn->vm_clock_nsec / 1000000) % 1000));

    get_human_readable_size(size_buf, sizeof(size_buf), sn->vm_state_size);

    snprintf(buf, buf_size,
             "%-10s%-20s%7s%20s%15s",
             sn->id_str, sn->name,
             size_buf,
             date_buf,
             clock_buf);
    return buf;
}

B
bellard 已提交
1239

B
bellard 已提交
1240
/**************************************************************/
B
bellard 已提交
1241
/* async I/Os */
B
bellard 已提交
1242

1243 1244 1245
/*
 * Submit an asynchronous read of 'nb_sectors' sectors starting at
 * 'sector_num' through the driver's bdrv_aio_read hook.
 *
 * Returns the request handle produced by the driver, or NULL when 'bs' has
 * no driver or the driver returned NULL. The read statistics of 'bs' are
 * bumped as soon as the request is accepted.
 */
BlockDriverAIOCB *bdrv_aio_read(BlockDriverState *bs, int64_t sector_num,
                                uint8_t *buf, int nb_sectors,
                                BlockDriverCompletionFunc *cb, void *opaque)
{
    BlockDriver *drv = bs->drv;
    BlockDriverAIOCB *acb;

    if (drv == NULL) {
        return NULL;
    }

    acb = drv->bdrv_aio_read(bs, sector_num, buf, nb_sectors, cb, opaque);
    if (acb == NULL) {
        return NULL;
    }

    /* Account for the request now, although no data has moved yet. */
    bs->rd_bytes += (unsigned) nb_sectors * SECTOR_SIZE;
    bs->rd_ops++;
    return acb;
}

1264 1265 1266
/*
 * Submit an asynchronous write of 'nb_sectors' sectors starting at
 * 'sector_num' through the driver's bdrv_aio_write hook.
 *
 * Returns the request handle produced by the driver, or NULL when 'bs' has
 * no driver, is read-only, or the driver returned NULL. The write statistics
 * of 'bs' are bumped as soon as the request is accepted.
 */
BlockDriverAIOCB *bdrv_aio_write(BlockDriverState *bs, int64_t sector_num,
                                 const uint8_t *buf, int nb_sectors,
                                 BlockDriverCompletionFunc *cb, void *opaque)
{
    BlockDriver *drv = bs->drv;
    BlockDriverAIOCB *acb;

    if (drv == NULL || bs->read_only) {
        return NULL;
    }

    acb = drv->bdrv_aio_write(bs, sector_num, buf, nb_sectors, cb, opaque);
    if (acb == NULL) {
        return NULL;
    }

    /* Account for the request now, although no data has moved yet. */
    bs->wr_bytes += (unsigned) nb_sectors * SECTOR_SIZE;
    bs->wr_ops++;
    return acb;
}

/*
 * Cancel the asynchronous request 'acb' by handing it to the bdrv_aio_cancel
 * hook of the driver attached to the request's BlockDriverState.
 */
void bdrv_aio_cancel(BlockDriverAIOCB *acb)
{
    acb->bs->drv->bdrv_aio_cancel(acb);
}

1294

B
bellard 已提交
1295 1296 1297
/**************************************************************/
/* async block device emulation */

1298
static void bdrv_aio_bh_cb(void *opaque)
B
bellard 已提交
1299
{
1300 1301 1302
    BlockDriverAIOCBSync *acb = opaque;
    acb->common.cb(acb->common.opaque, acb->ret);
    qemu_aio_release(acb);
B
bellard 已提交
1303
}
1304

1305 1306 1307
/*
 * Emulate an asynchronous read on top of the synchronous bdrv_read().
 *
 * The read is performed immediately; its result is stored in the request and
 * reported to 'cb' later, from bdrv_aio_bh_cb(), which is scheduled with
 * qemu_bh_schedule().
 *
 * Returns the request handle, or NULL when no request could be obtained
 * from qemu_aio_get(). In that case nothing is read and 'cb' is never
 * called.
 */
static BlockDriverAIOCB *bdrv_aio_read_em(BlockDriverState *bs,
        int64_t sector_num, uint8_t *buf, int nb_sectors,
        BlockDriverCompletionFunc *cb, void *opaque)
{
    BlockDriverAIOCBSync *acb;
    int ret;

    acb = qemu_aio_get(bs, cb, opaque);
    /* qemu_aio_get() returns NULL when allocating a new request fails. */
    if (!acb)
        return NULL;
    /* Requests taken from the free list keep the bh created earlier. */
    if (!acb->bh)
        acb->bh = qemu_bh_new(bdrv_aio_bh_cb, acb);
    ret = bdrv_read(bs, sector_num, buf, nb_sectors);
    acb->ret = ret;
    qemu_bh_schedule(acb->bh);
    return &acb->common;
}

1321 1322 1323
/*
 * Emulate an asynchronous write on top of the synchronous bdrv_write().
 *
 * The write is performed immediately; its result is stored in the request
 * and reported to 'cb' later, from bdrv_aio_bh_cb(), which is scheduled with
 * qemu_bh_schedule().
 *
 * Returns the request handle, or NULL when no request could be obtained
 * from qemu_aio_get(). In that case nothing is written and 'cb' is never
 * called.
 */
static BlockDriverAIOCB *bdrv_aio_write_em(BlockDriverState *bs,
        int64_t sector_num, const uint8_t *buf, int nb_sectors,
        BlockDriverCompletionFunc *cb, void *opaque)
{
    BlockDriverAIOCBSync *acb;
    int ret;

    acb = qemu_aio_get(bs, cb, opaque);
    /* qemu_aio_get() returns NULL when allocating a new request fails. */
    if (!acb)
        return NULL;
    /* Requests taken from the free list keep the bh created earlier. */
    if (!acb->bh)
        acb->bh = qemu_bh_new(bdrv_aio_bh_cb, acb);
    ret = bdrv_write(bs, sector_num, buf, nb_sectors);
    acb->ret = ret;
    qemu_bh_schedule(acb->bh);
    return &acb->common;
}

1337
/*
 * Cancel an emulated asynchronous request: cancel its scheduled bh so the
 * completion callback is not delivered through it, then release the request.
 */
static void bdrv_aio_cancel_em(BlockDriverAIOCB *blockacb)
{
    BlockDriverAIOCBSync *sync_acb = (BlockDriverAIOCBSync *)blockacb;

    qemu_bh_cancel(sync_acb->bh);
    qemu_aio_release(sync_acb);
}
B
bellard 已提交
1343

B
bellard 已提交
1344 1345
/**************************************************************/
/* sync block device emulation */
B
bellard 已提交
1346

B
bellard 已提交
1347 1348 1349
/*
 * Completion callback for the synchronous emulation: 'opaque' points to the
 * caller's int result slot, which receives 'ret'.
 */
static void bdrv_rw_em_cb(void *opaque, int ret)
{
    int *result = opaque;

    *result = ret;
}

B
bellard 已提交
1352 1353
#define NOT_DONE 0x7fffffff

1354
/*
 * Emulate a synchronous read on top of bdrv_aio_read(): submit the request,
 * then call qemu_aio_wait() until the completion callback has replaced the
 * NOT_DONE sentinel with the real result.
 *
 * Returns -1 when the request could not be submitted, otherwise the value
 * delivered to the completion callback.
 */
static int bdrv_read_em(BlockDriverState *bs, int64_t sector_num,
                        uint8_t *buf, int nb_sectors)
{
    int async_ret = NOT_DONE;
    BlockDriverAIOCB *acb = bdrv_aio_read(bs, sector_num, buf, nb_sectors,
                                          bdrv_rw_em_cb, &async_ret);

    if (!acb) {
        return -1;
    }
    while (async_ret == NOT_DONE) {
        qemu_aio_wait();
    }
    return async_ret;
}

B
bellard 已提交
1373 1374 1375
/*
 * Emulate a synchronous write on top of bdrv_aio_write(): submit the
 * request, then call qemu_aio_wait() until the completion callback has
 * replaced the NOT_DONE sentinel with the real result.
 *
 * Returns -1 when the request could not be submitted, otherwise the value
 * delivered to the completion callback.
 */
static int bdrv_write_em(BlockDriverState *bs, int64_t sector_num,
                         const uint8_t *buf, int nb_sectors)
{
    int async_ret = NOT_DONE;
    BlockDriverAIOCB *acb = bdrv_aio_write(bs, sector_num, buf, nb_sectors,
                                           bdrv_rw_em_cb, &async_ret);

    if (!acb) {
        return -1;
    }
    while (async_ret == NOT_DONE) {
        qemu_aio_wait();
    }
    return async_ret;
}
B
bellard 已提交
1389 1390 1391 1392

void bdrv_init(void)
{
    bdrv_register(&bdrv_raw);
B
bellard 已提交
1393
    bdrv_register(&bdrv_host_device);
B
bellard 已提交
1394 1395 1396 1397 1398
#ifndef _WIN32
    bdrv_register(&bdrv_cow);
#endif
    bdrv_register(&bdrv_qcow);
    bdrv_register(&bdrv_vmdk);
B
bellard 已提交
1399
    bdrv_register(&bdrv_cloop);
1400
    bdrv_register(&bdrv_dmg);
1401
    bdrv_register(&bdrv_bochs);
1402
    bdrv_register(&bdrv_vpc);
B
bellard 已提交
1403
    bdrv_register(&bdrv_vvfat);
B
bellard 已提交
1404
    bdrv_register(&bdrv_qcow2);
1405
    bdrv_register(&bdrv_parallels);
1406
    bdrv_register(&bdrv_nbd);
B
bellard 已提交
1407
}
1408 1409 1410 1411 1412 1413 1414 1415 1416 1417 1418 1419 1420 1421 1422 1423 1424 1425 1426 1427 1428 1429 1430 1431 1432 1433 1434 1435 1436

/*
 * Obtain an AIO request for 'bs': reuse the head of the driver's free list
 * when there is one, otherwise allocate a zeroed request of the driver's
 * aiocb_size. The request's bs, cb and opaque fields are then filled in.
 *
 * Returns the request, or NULL when the allocation fails.
 */
void *qemu_aio_get(BlockDriverState *bs, BlockDriverCompletionFunc *cb,
                   void *opaque)
{
    BlockDriver *drv = bs->drv;
    BlockDriverAIOCB *acb = drv->free_aiocb;

    if (acb != NULL) {
        /* Pop the recycled request off the free list. */
        drv->free_aiocb = acb->next;
    } else {
        acb = qemu_mallocz(drv->aiocb_size);
        if (acb == NULL) {
            return NULL;
        }
    }

    acb->bs = bs;
    acb->cb = cb;
    acb->opaque = opaque;
    return acb;
}

/*
 * Return the AIO request 'p' to its driver by pushing it onto the head of
 * the driver's free list, where qemu_aio_get() can reuse it. The memory is
 * not freed.
 */
void qemu_aio_release(void *p)
{
    BlockDriverAIOCB *released = p;
    BlockDriver *owner = released->bs->drv;

    released->next = owner->free_aiocb;
    owner->free_aiocb = released;
}
B
bellard 已提交
1437 1438 1439 1440 1441 1442 1443 1444 1445 1446 1447 1448 1449 1450 1451 1452 1453 1454 1455 1456 1457

/**************************************************************/
/* removable device support */

/**
 * Return TRUE if the media is present.
 *
 * A device without a driver reports 0. A driver without a bdrv_is_inserted
 * hook reports 1. Otherwise the hook's answer is returned.
 */
int bdrv_is_inserted(BlockDriverState *bs)
{
    BlockDriver *drv = bs->drv;

    if (drv == NULL) {
        return 0;
    }
    if (drv->bdrv_is_inserted == NULL) {
        return 1;
    }
    return drv->bdrv_is_inserted(bs);
}

/**
 * Return TRUE if the media changed since the last call to this
 * function. It is currently only used for floppy disks.
 *
 * The driver's bdrv_media_changed hook is consulted first; when there is no
 * driver, no hook, or the hook answers -ENOTSUP, the media_changed flag of
 * 'bs' is used instead. That flag is cleared on every call.
 */
int bdrv_media_changed(BlockDriverState *bs)
{
    BlockDriver *drv = bs->drv;
    int changed = -ENOTSUP;

    if (drv != NULL && drv->bdrv_media_changed != NULL) {
        changed = drv->bdrv_media_changed(bs);
    }
    if (changed == -ENOTSUP) {
        changed = bs->media_changed;
    }
    bs->media_changed = 0;
    return changed;
}

/**
 * If eject_flag is TRUE, eject the media. Otherwise, close the tray.
 *
 * The driver's bdrv_eject hook is used when available. When there is no
 * driver, no hook, or the hook answers -ENOTSUP, an eject request falls back
 * to bdrv_close() and a close-tray request does nothing.
 */
void bdrv_eject(BlockDriverState *bs, int eject_flag)
{
    BlockDriver *drv = bs->drv;
    int ret = -ENOTSUP;

    if (drv != NULL && drv->bdrv_eject != NULL) {
        ret = drv->bdrv_eject(bs, eject_flag);
    }
    if (ret == -ENOTSUP && eject_flag) {
        bdrv_close(bs);
    }
}

/* Return the 'locked' flag of 'bs' (see bdrv_set_locked()). */
int bdrv_is_locked(BlockDriverState *bs)
{
    return bs->locked;
}

/**
 * Lock or unlock the media (if it is locked, the user won't be able
 * to eject it manually).
 *
 * The new state is always recorded in 'bs'; it is also forwarded to the
 * driver's bdrv_set_locked hook when a driver with that hook is attached.
 */
void bdrv_set_locked(BlockDriverState *bs, int locked)
{
    BlockDriver *drv = bs->drv;

    bs->locked = locked;
    if (drv == NULL || drv->bdrv_set_locked == NULL) {
        return;
    }
    drv->bdrv_set_locked(bs, locked);
}
1512 1513 1514 1515 1516 1517 1518 1519 1520 1521 1522

/*
 * Needed for the generic scsi interface.
 *
 * Pass request 'req' with argument 'buf' to the driver's bdrv_ioctl hook and
 * return its result. Returns -ENOTSUP when 'bs' has no driver or the driver
 * has no such hook.
 */
int bdrv_ioctl(BlockDriverState *bs, unsigned long int req, void *buf)
{
    BlockDriver *drv = bs->drv;

    if (drv == NULL || drv->bdrv_ioctl == NULL) {
        return -ENOTSUP;
    }
    return drv->bdrv_ioctl(bs, req, buf);
}