cow.c 8.8 KB
Newer Older
B
bellard 已提交
1 2
/*
 * Block driver for the COW format
 *
 * Copyright (c) 2004 Fabrice Bellard
 *
 * Permission is hereby granted, free of charge, to any person obtaining a copy
 * of this software and associated documentation files (the "Software"), to deal
 * in the Software without restriction, including without limitation the rights
 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
 * copies of the Software, and to permit persons to whom the Software is
 * furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
 * THE SOFTWARE.
 */
#ifndef _WIN32
P
pbrook 已提交
25
#include "qemu-common.h"
#include "block_int.h"
#include "module.h"
#include <limits.h>
#include <sys/mman.h>

/**************************************************************/
/* COW block driver using file system holes */

/* user mode linux compatible COW file */
#define COW_MAGIC 0x4f4f4f4d  /* MOOO */
#define COW_VERSION 2

/*
 * Header stored at offset 0 of a COW image.  The integer fields are kept
 * big-endian in the file: this driver converts them with be32_to_cpu /
 * be64_to_cpu when reading and cpu_to_be32 / cpu_to_be64 when writing.
 * The field order is the file layout and must not be changed.
 */
struct cow_header_v2 {
    uint32_t magic;             /* compared against COW_MAGIC */
    uint32_t version;           /* compared against COW_VERSION */
    char backing_file[1024];    /* name of the base image; all zero if none */
    int32_t mtime;              /* st_mtime of the base image, or 0 */
    uint64_t size;              /* virtual disk size in bytes */
    uint32_t sectorsize;        /* cow_create always stores 512 here */
};

/* Per-image driver state, stored in BlockDriverState.opaque. */
typedef struct BDRVCowState {
    int fd;                   /* descriptor of the opened COW image file */
    uint8_t *cow_bitmap; /* if non NULL, COW mappings are used first */
    uint8_t *cow_bitmap_addr; /* mmap address of cow_bitmap */
    int cow_bitmap_size;      /* length of the mapping: header plus bitmap bytes */
    int64_t cow_sectors_offset; /* file offset of sector 0's data (512-aligned) */
} BDRVCowState;

static int cow_probe(const uint8_t *buf, int buf_size, const char *filename)
{
    const struct cow_header_v2 *cow_header = (const void *)buf;

B
bellard 已提交
58 59
    if (buf_size >= sizeof(struct cow_header_v2) &&
        be32_to_cpu(cow_header->magic) == COW_MAGIC &&
60
        be32_to_cpu(cow_header->version) == COW_VERSION)
B
bellard 已提交
61 62 63 64 65
        return 100;
    else
        return 0;
}

B
bellard 已提交
66
/*
 * Open a COW image: validate its header and map the allocation bitmap.
 *
 * bs:       block device whose opaque BDRVCowState is filled in; its
 *           total_sectors and backing_file are set from the header.
 * filename: path of the COW image.
 * flags:    not used by this function.
 *
 * The file is opened read/write, falling back to read-only.
 * NOTE(review): the bitmap is mapped MAP_SHARED with PROT_WRITE, which
 * POSIX mmap() refuses (EACCES) for a descriptor that is not open for
 * reading and writing, so the read-only fallback presumably cannot get
 * past the mmap() -- confirm.
 *
 * Returns 0 on success and -1 on any failure (the file is closed again).
 */
static int cow_open(BlockDriverState *bs, const char *filename, int flags)
{
    BDRVCowState *s = bs->opaque;
    int fd;
    struct cow_header_v2 cow_header;
    int64_t size;
    int64_t total_sectors;
    int64_t bitmap_size;

    fd = open(filename, O_RDWR | O_BINARY | O_LARGEFILE);
    if (fd < 0) {
        fd = open(filename, O_RDONLY | O_BINARY | O_LARGEFILE);
        if (fd < 0)
            return -1;
    }
    s->fd = fd;

    /* see if it is a cow image */
    if (pread(fd, &cow_header, sizeof(cow_header), 0) != sizeof(cow_header)) {
        goto fail;
    }

    if (be32_to_cpu(cow_header.magic) != COW_MAGIC ||
        be32_to_cpu(cow_header.version) != COW_VERSION) {
        goto fail;
    }

    /* cow image found */
    size = be64_to_cpu(cow_header.size);
    if (size < 0) {
        /* The header field is unsigned; a value with the top bit set
         * cannot be represented as a sector count. */
        goto fail;
    }
    total_sectors = size / 512;

    /* The mapping covers the header followed by one bit per sector.  The
     * size comes from the file, so compute it in 64 bits and refuse images
     * whose mapping length would not fit the int kept in BDRVCowState
     * instead of silently truncating it. */
    bitmap_size = ((total_sectors + 7) >> 3) + (int64_t)sizeof(cow_header);
    if (bitmap_size > INT_MAX) {
        goto fail;
    }

    bs->total_sectors = total_sectors;
    pstrcpy(bs->backing_file, sizeof(bs->backing_file),
            cow_header.backing_file);

    /* mmap the bitmap */
    s->cow_bitmap_size = (int)bitmap_size;
    s->cow_bitmap_addr = (void *)mmap(get_mmap_addr(s->cow_bitmap_size),
                                      s->cow_bitmap_size,
                                      PROT_READ | PROT_WRITE,
                                      MAP_SHARED, s->fd, 0);
    if (s->cow_bitmap_addr == MAP_FAILED)
        goto fail;
    s->cow_bitmap = s->cow_bitmap_addr + sizeof(cow_header);

    /* Sector data starts at the next 512-byte boundary after the bitmap;
     * round up in 64 bits so a size close to INT_MAX cannot overflow. */
    s->cow_sectors_offset = (bitmap_size + 511) & ~(int64_t)511;
    return 0;

 fail:
    close(fd);
    return -1;
}

113
/* Set bit number bitnum in bitmap: bit (bitnum % 8) of byte (bitnum / 8),
 * counting from the least significant bit of each byte. */
static inline void cow_set_bit(uint8_t *bitmap, int64_t bitnum)
{
    uint8_t *byte = &bitmap[bitnum / 8];

    *byte |= (1 << (bitnum % 8));
}

/* Return 1 if bit number bitnum is set in bitmap, 0 otherwise.  Bits are
 * numbered from the least significant bit of each byte. */
static inline int is_bit_set(const uint8_t *bitmap, int64_t bitnum)
{
    const uint8_t byte = bitmap[bitnum / 8];
    const int mask = 1 << (bitnum % 8);

    return (byte & mask) != 0;
}


/* Report whether the sector at sector_num has been changed, i.e. whether
 * its bit is set in bitmap and its current contents live in the COW file.
 * *num_same receives the length of the run of consecutive sectors,
 * starting at sector_num and limited to nb_sectors, that share that state.
 * With no bitmap, or nb_sectors == 0, the answer is "unchanged" and
 * *num_same is nb_sectors. */
static inline int is_changed(uint8_t *bitmap,
                             int64_t sector_num, int nb_sectors,
                             int *num_same)
{
    int first_state;
    int run;

    if (!bitmap || nb_sectors == 0) {
        *num_same = nb_sectors;
        return 0;
    }

    first_state = is_bit_set(bitmap, sector_num);

    /* Extend the run while the following sectors agree with the first. */
    run = 1;
    while (run < nb_sectors &&
           is_bit_set(bitmap, sector_num + run) == first_state) {
        run++;
    }
    *num_same = run;

    return first_state;
}

147
/* Block-driver callback: tell whether sector_num is stored in the COW file.
 * Returns the is_changed() result for the image's bitmap; *pnum receives
 * the number of following sectors (up to nb_sectors) in the same state. */
static int cow_is_allocated(BlockDriverState *bs, int64_t sector_num,
                            int nb_sectors, int *pnum)
{
    BDRVCowState *state = bs->opaque;
    uint8_t *bitmap = state->cow_bitmap;

    return is_changed(bitmap, sector_num, nb_sectors, pnum);
}

154
/* Read nb_sectors 512-byte sectors starting at sector_num into buf.
 * The request is handled one run at a time: runs marked in the bitmap are
 * read from the COW file, other runs come from the backing image when
 * there is one and are zero-filled when there is none.
 * Returns 0 on success, -1 if any read fails or comes back short. */
static int cow_read(BlockDriverState *bs, int64_t sector_num,
                    uint8_t *buf, int nb_sectors)
{
    BDRVCowState *s = bs->opaque;
    int run;    /* sectors in the current run, set by is_changed() */

    while (nb_sectors > 0) {
        int in_cow = is_changed(s->cow_bitmap, sector_num, nb_sectors, &run);

        if (in_cow) {
            int got = pread(s->fd, buf, run * 512,
                            s->cow_sectors_offset + sector_num * 512);
            if (got != run * 512)
                return -1;
        } else if (bs->backing_hd) {
            /* read from the base image */
            if (bdrv_read(bs->backing_hd, sector_num, buf, run) < 0)
                return -1;
        } else {
            memset(buf, 0, run * 512);
        }

        nb_sectors -= run;
        sector_num += run;
        buf += run * 512;
    }
    return 0;
}

183
/* Write nb_sectors 512-byte sectors from buf at sector_num into the COW
 * file, then set the bitmap bit of every sector written.
 * Returns 0 on success, -1 if the write fails or is short (in which case
 * the bitmap is left untouched). */
static int cow_write(BlockDriverState *bs, int64_t sector_num,
                     const uint8_t *buf, int nb_sectors)
{
    BDRVCowState *s = bs->opaque;
    const int nbytes = nb_sectors * 512;
    int written;
    int done;

    written = pwrite(s->fd, buf, nbytes,
                     s->cow_sectors_offset + sector_num * 512);
    if (written != nbytes)
        return -1;

    done = 0;
    while (done < nb_sectors) {
        cow_set_bit(s->cow_bitmap, sector_num + done);
        done++;
    }
    return 0;
}

B
bellard 已提交
198
/* Release the image: unmap the header/bitmap mapping and close the file. */
static void cow_close(BlockDriverState *bs)
{
    BDRVCowState *state = bs->opaque;
    void *mapping = state->cow_bitmap_addr;

    munmap(mapping, state->cow_bitmap_size);
    close(state->fd);
}

205
/*
 * Create a new, empty COW image.
 *
 * filename: path of the image to create (truncated if it already exists).
 * options:  option list terminated by an entry with a NULL name.
 *           BLOCK_OPT_SIZE gives the virtual size in bytes and
 *           BLOCK_OPT_BACKING_FILE the optional base image name.
 *
 * The header is written and the file is extended so that it holds at least
 * the header plus one bitmap bit per sector.  If a backing file is named
 * but cannot be opened or stat'ed, its name is still recorded and the
 * header keeps a dummy mtime of 0.
 *
 * Returns 0 on success or a negative errno value on failure.
 */
static int cow_create(const char *filename, QEMUOptionParameter *options)
{
    int fd, cow_fd;
    struct cow_header_v2 cow_header;
    struct stat st;
    int64_t image_sectors = 0;
    const char *image_filename = NULL;
    int ret;

    /* Read out options */
    while (options && options->name) {
        if (!strcmp(options->name, BLOCK_OPT_SIZE)) {
            image_sectors = options->value.n / 512;
        } else if (!strcmp(options->name, BLOCK_OPT_BACKING_FILE)) {
            image_filename = options->value.s;
        }
        options++;
    }

    cow_fd = open(filename, O_WRONLY | O_CREAT | O_TRUNC | O_BINARY,
              0644);
    if (cow_fd < 0)
        return -errno;

    memset(&cow_header, 0, sizeof(cow_header));
    cow_header.magic = cpu_to_be32(COW_MAGIC);
    cow_header.version = cpu_to_be32(COW_VERSION);
    if (image_filename) {
        /* Note: if no file, we put a dummy mtime */
        cow_header.mtime = cpu_to_be32(0);

        /* A backing file that cannot be opened or stat'ed is not fatal.
         * cow_fd must stay open here: the header is still written to it
         * below and it is closed exactly once at the exit label. */
        fd = open(image_filename, O_RDONLY | O_BINARY);
        if (fd >= 0) {
            if (fstat(fd, &st) == 0) {
                cow_header.mtime = cpu_to_be32(st.st_mtime);
            }
            close(fd);
        }

        pstrcpy(cow_header.backing_file, sizeof(cow_header.backing_file),
                image_filename);
    }
    cow_header.sectorsize = cpu_to_be32(512);
    cow_header.size = cpu_to_be64(image_sectors * 512);

    ret = qemu_write_full(cow_fd, &cow_header, sizeof(cow_header));
    if (ret != sizeof(cow_header)) {
        ret = -errno;
        goto exit;
    }

    /* resize to include at least all the bitmap */
    ret = ftruncate(cow_fd, sizeof(cow_header) + ((image_sectors + 7) >> 3));
    if (ret) {
        ret = -errno;
        goto exit;
    }

exit:
    close(cow_fd);
    return ret;
}

P
pbrook 已提交
270 271 272
/* Block-driver flush callback: calls qemu_fdatasync() on the image's file
 * descriptor.  The result of that call is not checked. */
static void cow_flush(BlockDriverState *bs)
{
    BDRVCowState *state = bs->opaque;
    int image_fd = state->fd;

    qemu_fdatasync(image_fd);
}

276
static QEMUOptionParameter cow_create_options[] = {
277 278 279 280 281 282 283 284 285 286
    {
        .name = BLOCK_OPT_SIZE,
        .type = OPT_SIZE,
        .help = "Virtual disk size"
    },
    {
        .name = BLOCK_OPT_BACKING_FILE,
        .type = OPT_STRING,
        .help = "File name of a base image"
    },
287 288 289
    { NULL }
};

290
static BlockDriver bdrv_cow = {
291 292 293
    .format_name	= "cow",
    .instance_size	= sizeof(BDRVCowState),
    .bdrv_probe		= cow_probe,
294
    .bdrv_file_open	= cow_open,
295 296 297 298 299 300
    .bdrv_read		= cow_read,
    .bdrv_write		= cow_write,
    .bdrv_close		= cow_close,
    .bdrv_create	= cow_create,
    .bdrv_flush		= cow_flush,
    .bdrv_is_allocated	= cow_is_allocated,
301 302

    .create_options = cow_create_options,
B
bellard 已提交
303
};
304 305 306 307 308 309 310

/* Register the COW driver description (bdrv_cow) with bdrv_register(). */
static void bdrv_cow_init(void)
{
    bdrv_register(&bdrv_cow);
}

/* NOTE(review): block_init() is not defined in this file; presumably it
 * arranges for bdrv_cow_init() to be run during start-up -- confirm. */
block_init(bdrv_cow_init);
B
bellard 已提交
311
#endif