savevm.c 62.0 KB
Newer Older
A
aliguori 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
/*
 * QEMU System Emulator
 *
 * Copyright (c) 2003-2008 Fabrice Bellard
 *
 * Permission is hereby granted, free of charge, to any person obtaining a copy
 * of this software and associated documentation files (the "Software"), to deal
 * in the Software without restriction, including without limitation the rights
 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
 * copies of the Software, and to permit persons to whom the Software is
 * furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
 * THE SOFTWARE.
 */

B
blueswir1 已提交
25
#include "config-host.h"
26 27
#include "qemu-common.h"
#include "hw/hw.h"
28
#include "hw/qdev.h"
P
Paolo Bonzini 已提交
29
#include "net/net.h"
30
#include "monitor/monitor.h"
31
#include "sysemu/sysemu.h"
32
#include "qemu/timer.h"
33
#include "audio/audio.h"
34
#include "migration/migration.h"
35 36
#include "qemu/sockets.h"
#include "qemu/queue.h"
37
#include "sysemu/cpus.h"
38
#include "exec/memory.h"
39
#include "qmp-commands.h"
40
#include "trace.h"
41
#include "qemu/bitops.h"
42
#include "qemu/iov.h"
43

A
aliguori 已提交
44 45
#define SELF_ANNOUNCE_ROUNDS 5

N
Nolan 已提交
46
#ifndef ETH_P_RARP
#define ETH_P_RARP 0x8035
#endif
#define ARP_HTYPE_ETH 0x0001
#define ARP_PTYPE_IP 0x0800
#define ARP_OP_REQUEST_REV 0x3

/*
 * Store @v at @p in network (big-endian) byte order.
 *
 * Written byte by byte so that @p needs no particular alignment and the
 * byte buffer is never accessed through a uint16_t lvalue.
 */
static void announce_put_be16(uint8_t *p, uint16_t v)
{
    p[0] = (uint8_t)(v >> 8);
    p[1] = (uint8_t)(v & 0xff);
}

/*
 * Build the self-announcement frame for @mac_addr in @buf.
 *
 * The frame is a broadcast Ethernet frame carrying a RARP "reverse request"
 * whose source and target hardware addresses are both @mac_addr and whose
 * protocol addresses are zero.
 *
 * @buf:      output buffer, must have room for at least 60 bytes
 * @mac_addr: 6-byte MAC address to announce
 *
 * Returns the frame length in bytes (always 60).
 */
static int announce_self_create(uint8_t *buf,
                                uint8_t *mac_addr)
{
    /* Ethernet header. */
    memset(buf, 0xff, 6);                       /* destination MAC addr */
    memcpy(buf + 6, mac_addr, 6);               /* source MAC addr */
    announce_put_be16(buf + 12, ETH_P_RARP);    /* ethertype */

    /* RARP header. */
    announce_put_be16(buf + 14, ARP_HTYPE_ETH); /* hardware addr space */
    announce_put_be16(buf + 16, ARP_PTYPE_IP);  /* protocol addr space */
    buf[18] = 6;                                /* hardware addr length (ethernet) */
    buf[19] = 4;                                /* protocol addr length (IPv4) */
    announce_put_be16(buf + 20, ARP_OP_REQUEST_REV); /* opcode */
    memcpy(buf + 22, mac_addr, 6);              /* source hw addr */
    memset(buf + 28, 0x00, 4);                  /* source protocol addr */
    memcpy(buf + 32, mac_addr, 6);              /* target hw addr */
    memset(buf + 38, 0x00, 4);                  /* target protocol addr */

    /* Padding to get up to 60 bytes (ethernet min packet size, minus FCS). */
    memset(buf + 42, 0x00, 18);

    return 60; /* len (FCS will be added by hardware) */
}

M
Mark McLoughlin 已提交
78
/*
 * qemu_foreach_nic() callback: build the announcement frame for @nic's
 * configured MAC address and send it raw on the NIC's queue.
 * @opaque is not used.
 */
static void qemu_announce_self_iter(NICState *nic, void *opaque)
{
    uint8_t frame[60];
    int frame_len = announce_self_create(frame, nic->conf->macaddr.a);

    qemu_send_packet_raw(qemu_get_queue(nic), frame, frame_len);
}


static void qemu_announce_self_once(void *opaque)
{
91 92
    static int count = SELF_ANNOUNCE_ROUNDS;
    QEMUTimer *timer = *(QEMUTimer **)opaque;
A
aliguori 已提交
93

M
Mark McLoughlin 已提交
94 95
    qemu_foreach_nic(qemu_announce_self_iter, NULL);

N
Nolan 已提交
96 97
    if (--count) {
        /* delay 50ms, 150ms, 250ms, ... */
98
        qemu_mod_timer(timer, qemu_get_clock_ms(rt_clock) +
N
Nolan 已提交
99
                       50 + (SELF_ANNOUNCE_ROUNDS - count - 1) * 100);
100 101 102 103 104 105 106 107 108
    } else {
	    qemu_del_timer(timer);
	    qemu_free_timer(timer);
    }
}

void qemu_announce_self(void)
{
	static QEMUTimer *timer;
109
	timer = qemu_new_timer_ms(rt_clock, qemu_announce_self_once, &timer);
110
	qemu_announce_self_once(&timer);
A
aliguori 已提交
111 112 113 114 115 116
}

/***********************************************************/
/* savevm/loadvm support */

#define IO_BUF_SIZE 32768
117
#define MAX_IOV_SIZE MIN(IOV_MAX, 64)
A
aliguori 已提交
118 119

struct QEMUFile {
120
    const QEMUFileOps *ops;
A
aliguori 已提交
121 122 123
    void *opaque;
    int is_write;

124 125 126
    int64_t bytes_xfer;
    int64_t xfer_limit;

127 128
    int64_t pos; /* start of buffer when writing, end of buffer
                    when reading */
A
aliguori 已提交
129 130 131 132
    int buf_index;
    int buf_size; /* 0 when writing */
    uint8_t buf[IO_BUF_SIZE];

133 134 135
    struct iovec iov[MAX_IOV_SIZE];
    unsigned int iovcnt;

136
    int last_error;
A
aliguori 已提交
137 138
};

P
Paolo Bonzini 已提交
139
typedef struct QEMUFileStdio
A
aliguori 已提交
140
{
P
Paolo Bonzini 已提交
141
    FILE *stdio_file;
A
aliguori 已提交
142
    QEMUFile *file;
P
Paolo Bonzini 已提交
143
} QEMUFileStdio;
A
aliguori 已提交
144 145 146 147 148 149 150

/* Backend state for a QEMUFile that wraps a socket descriptor. */
typedef struct QEMUFileSocket
{
    int fd;             /* socket descriptor used for send/recv */
    QEMUFile *file;     /* QEMUFile created on top of this state */
} QEMUFileSocket;

151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178
/* Context handed to fd_coroutine_enter() by yield_until_fd_readable(). */
typedef struct {
    Coroutine *co;      /* coroutine to re-enter once fd is readable */
    int fd;             /* descriptor whose handler is being used */
} FDYieldUntilData;

/*
 * fd read handler installed by yield_until_fd_readable(): removes the
 * handlers for the descriptor, then re-enters the waiting coroutine.
 */
static void fd_coroutine_enter(void *opaque)
{
    FDYieldUntilData *waiter = opaque;

    qemu_set_fd_handler(waiter->fd, NULL, NULL, NULL);
    qemu_coroutine_enter(waiter->co, NULL);
}

/**
 * Suspend the current coroutine until @fd becomes readable.
 *
 * Must be called from coroutine context.  Note that this function clobbers
 * the handlers for the file descriptor.
 */
static void coroutine_fn yield_until_fd_readable(int fd)
{
    FDYieldUntilData waiter;

    assert(qemu_in_coroutine());

    waiter.fd = fd;
    waiter.co = qemu_coroutine_self();
    qemu_set_fd_handler(fd, fd_coroutine_enter, NULL, &waiter);
    qemu_coroutine_yield();
}

179 180 181 182 183 184 185 186 187 188 189 190 191
/*
 * writev_buffer callback for sockets: send the whole iovec.
 * Returns the number of bytes sent, or the negated socket error when fewer
 * bytes than requested went out.
 */
static ssize_t socket_writev_buffer(void *opaque, struct iovec *iov, int iovcnt)
{
    QEMUFileSocket *sock = opaque;
    ssize_t wanted = iov_size(iov, iovcnt);
    ssize_t sent = iov_send(sock->fd, iov, iovcnt, 0, wanted);

    if (sent < wanted) {
        sent = -socket_error();
    }
    return sent;
}

P
Paolo Bonzini 已提交
192 193 194 195 196 197 198
static int socket_get_fd(void *opaque)
{
    QEMUFileSocket *s = opaque;

    return s->fd;
}

A
aliguori 已提交
199 200 201 202 203
/*
 * get_buffer callback for sockets.
 *
 * Receives up to @size bytes into @buf.  EINTR is retried; on EAGAIN the
 * coroutine yields until the socket is readable and then retries.
 * Returns the qemu_recv() result, or the negated socket error on failure.
 * @pos is not used.
 */
static int socket_get_buffer(void *opaque, uint8_t *buf, int64_t pos, int size)
{
    QEMUFileSocket *sock = opaque;
    ssize_t got;

    while ((got = qemu_recv(sock->fd, buf, size, 0)) == -1) {
        if (socket_error() == EAGAIN) {
            yield_until_fd_readable(sock->fd);
            continue;
        }
        if (socket_error() != EINTR) {
            break;
        }
    }

    if (got == -1) {
        got = -socket_error();
    }
    return got;
}

222 223 224 225 226 227 228 229 230 231 232 233
/*
 * put_buffer callback for sockets: send all @size bytes of @buf.
 * Returns the byte count, or the negated socket error on a short send.
 * @pos is not used.
 */
static int socket_put_buffer(void *opaque, const uint8_t *buf, int64_t pos, int size)
{
    QEMUFileSocket *sock = opaque;
    ssize_t sent = qemu_send_full(sock->fd, buf, size, 0);

    if (sent < size) {
        sent = -socket_error();
    }
    return sent;
}

A
aliguori 已提交
234 235 236
static int socket_close(void *opaque)
{
    QEMUFileSocket *s = opaque;
237
    closesocket(s->fd);
238
    g_free(s);
A
aliguori 已提交
239 240 241
    return 0;
}

P
Paolo Bonzini 已提交
242 243 244 245 246 247 248
/* get_fd callback for stdio streams: descriptor behind the FILE. */
static int stdio_get_fd(void *opaque)
{
    QEMUFileStdio *stdio = opaque;
    FILE *stream = stdio->stdio_file;

    return fileno(stream);
}

P
Paolo Bonzini 已提交
249
/*
 * put_buffer callback for stdio streams: fwrite() @size bytes of @buf and
 * return the number of bytes fwrite() reports as written.
 * @pos is not used.
 */
static int stdio_put_buffer(void *opaque, const uint8_t *buf, int64_t pos, int size)
{
    FILE *stream = ((QEMUFileStdio *)opaque)->stdio_file;

    return fwrite(buf, 1, size, stream);
}

P
Paolo Bonzini 已提交
255
/*
 * get_buffer callback for stdio streams.
 *
 * Reads up to @size bytes into @buf.  A read that returns nothing because of
 * an error is retried on EINTR, and on EAGAIN after yielding until the
 * descriptor is readable; any other outcome ends the loop.
 * Returns the number of bytes read.  @pos is not used.
 */
static int stdio_get_buffer(void *opaque, uint8_t *buf, int64_t pos, int size)
{
    QEMUFileStdio *stdio = opaque;
    FILE *stream = stdio->stdio_file;
    int nread;

    for (;;) {
        clearerr(stream);
        nread = fread(buf, 1, size, stream);
        if (nread != 0 || !ferror(stream)) {
            return nread;
        }
        switch (errno) {
        case EAGAIN:
            yield_until_fd_readable(fileno(stream));
            break;
        case EINTR:
            break;
        default:
            return nread;
        }
    }
}

P
Paolo Bonzini 已提交
276 277 278
/*
 * close callback for popen()ed streams.
 *
 * Returns -errno when pclose() fails, -EIO when the child did not exit
 * normally with status 0, and the pclose() status otherwise.  The backend
 * state is freed in every case.
 */
static int stdio_pclose(void *opaque)
{
    QEMUFileStdio *stdio = opaque;
    int status = pclose(stdio->stdio_file);

    if (status == -1) {
        status = -errno;
    } else if (!(WIFEXITED(status) && WEXITSTATUS(status) == 0)) {
        /* close succeeded, but non-zero exit code: */
        status = -EIO; /* fake errno value */
    }
    g_free(stdio);
    return status;
}

static int stdio_fclose(void *opaque)
A
aliguori 已提交
292
{
P
Paolo Bonzini 已提交
293
    QEMUFileStdio *s = opaque;
294
    int ret = 0;
295 296 297 298 299 300 301 302 303 304 305 306 307 308 309 310 311 312

    if (s->file->ops->put_buffer) {
        int fd = fileno(s->stdio_file);
        struct stat st;

        ret = fstat(fd, &st);
        if (ret == 0 && S_ISREG(st.st_mode)) {
            /*
             * If the file handle is a regular file make sure the
             * data is flushed to disk before signaling success.
             */
            ret = fsync(fd);
            if (ret != 0) {
                ret = -errno;
                return ret;
            }
        }
    }
313 314 315
    if (fclose(s->stdio_file) == EOF) {
        ret = -errno;
    }
316
    g_free(s);
317
    return ret;
A
aliguori 已提交
318 319
}

320
static const QEMUFileOps stdio_pipe_read_ops = {
P
Paolo Bonzini 已提交
321
    .get_fd =     stdio_get_fd,
322 323 324 325 326
    .get_buffer = stdio_get_buffer,
    .close =      stdio_pclose
};

static const QEMUFileOps stdio_pipe_write_ops = {
P
Paolo Bonzini 已提交
327
    .get_fd =     stdio_get_fd,
328 329 330 331
    .put_buffer = stdio_put_buffer,
    .close =      stdio_pclose
};

332
QEMUFile *qemu_popen_cmd(const char *command, const char *mode)
A
aliguori 已提交
333
{
334
    FILE *stdio_file;
P
Paolo Bonzini 已提交
335
    QEMUFileStdio *s;
A
aliguori 已提交
336

337 338 339 340 341 342
    stdio_file = popen(command, mode);
    if (stdio_file == NULL) {
        return NULL;
    }

    if (mode == NULL || (mode[0] != 'r' && mode[0] != 'w') || mode[1] != 0) {
A
aliguori 已提交
343 344 345 346
        fprintf(stderr, "qemu_popen: Argument validity check failed\n");
        return NULL;
    }

347
    s = g_malloc0(sizeof(QEMUFileStdio));
A
aliguori 已提交
348

P
Paolo Bonzini 已提交
349
    s->stdio_file = stdio_file;
A
aliguori 已提交
350 351

    if(mode[0] == 'r') {
352
        s->file = qemu_fopen_ops(s, &stdio_pipe_read_ops);
A
aliguori 已提交
353
    } else {
354
        s->file = qemu_fopen_ops(s, &stdio_pipe_write_ops);
A
aliguori 已提交
355 356 357 358
    }
    return s->file;
}

359
static const QEMUFileOps stdio_file_read_ops = {
P
Paolo Bonzini 已提交
360
    .get_fd =     stdio_get_fd,
361 362 363 364 365
    .get_buffer = stdio_get_buffer,
    .close =      stdio_fclose
};

static const QEMUFileOps stdio_file_write_ops = {
P
Paolo Bonzini 已提交
366
    .get_fd =     stdio_get_fd,
367 368 369 370
    .put_buffer = stdio_put_buffer,
    .close =      stdio_fclose
};

P
Paolo Bonzini 已提交
371 372 373 374 375 376 377 378 379 380 381
QEMUFile *qemu_fdopen(int fd, const char *mode)
{
    QEMUFileStdio *s;

    if (mode == NULL ||
	(mode[0] != 'r' && mode[0] != 'w') ||
	mode[1] != 'b' || mode[2] != 0) {
        fprintf(stderr, "qemu_fdopen: Argument validity check failed\n");
        return NULL;
    }

382
    s = g_malloc0(sizeof(QEMUFileStdio));
P
Paolo Bonzini 已提交
383 384 385 386 387
    s->stdio_file = fdopen(fd, mode);
    if (!s->stdio_file)
        goto fail;

    if(mode[0] == 'r') {
388
        s->file = qemu_fopen_ops(s, &stdio_file_read_ops);
P
Paolo Bonzini 已提交
389
    } else {
390
        s->file = qemu_fopen_ops(s, &stdio_file_write_ops);
P
Paolo Bonzini 已提交
391 392 393 394
    }
    return s->file;

fail:
395
    g_free(s);
P
Paolo Bonzini 已提交
396 397 398
    return NULL;
}

399
static const QEMUFileOps socket_read_ops = {
P
Paolo Bonzini 已提交
400
    .get_fd =     socket_get_fd,
401 402 403 404
    .get_buffer = socket_get_buffer,
    .close =      socket_close
};

405 406 407
static const QEMUFileOps socket_write_ops = {
    .get_fd =     socket_get_fd,
    .put_buffer = socket_put_buffer,
408
    .writev_buffer = socket_writev_buffer,
409 410 411 412
    .close =      socket_close
};

QEMUFile *qemu_fopen_socket(int fd, const char *mode)
A
aliguori 已提交
413
{
414
    QEMUFileSocket *s = g_malloc0(sizeof(QEMUFileSocket));
A
aliguori 已提交
415

416 417 418 419 420 421 422
    if (mode == NULL ||
        (mode[0] != 'r' && mode[0] != 'w') ||
        mode[1] != 'b' || mode[2] != 0) {
        fprintf(stderr, "qemu_fopen: Argument validity check failed\n");
        return NULL;
    }

A
aliguori 已提交
423
    s->fd = fd;
424
    if (mode[0] == 'w') {
425
        socket_set_block(s->fd);
426 427 428 429
        s->file = qemu_fopen_ops(s, &socket_write_ops);
    } else {
        s->file = qemu_fopen_ops(s, &socket_read_ops);
    }
A
aliguori 已提交
430 431 432 433 434 435 436
    return s->file;
}

QEMUFile *qemu_fopen(const char *filename, const char *mode)
{
    QEMUFileStdio *s;

P
Paolo Bonzini 已提交
437 438 439
    if (mode == NULL ||
	(mode[0] != 'r' && mode[0] != 'w') ||
	mode[1] != 'b' || mode[2] != 0) {
B
Blue Swirl 已提交
440
        fprintf(stderr, "qemu_fopen: Argument validity check failed\n");
P
Paolo Bonzini 已提交
441 442 443
        return NULL;
    }

444
    s = g_malloc0(sizeof(QEMUFileStdio));
A
aliguori 已提交
445

P
Paolo Bonzini 已提交
446 447
    s->stdio_file = fopen(filename, mode);
    if (!s->stdio_file)
A
aliguori 已提交
448
        goto fail;
L
lirans@il.ibm.com 已提交
449
    
P
Paolo Bonzini 已提交
450
    if(mode[0] == 'w') {
451
        s->file = qemu_fopen_ops(s, &stdio_file_write_ops);
P
Paolo Bonzini 已提交
452
    } else {
453
        s->file = qemu_fopen_ops(s, &stdio_file_read_ops);
P
Paolo Bonzini 已提交
454 455
    }
    return s->file;
A
aliguori 已提交
456
fail:
457
    g_free(s);
A
aliguori 已提交
458 459 460
    return NULL;
}

461
static int block_put_buffer(void *opaque, const uint8_t *buf,
A
aliguori 已提交
462 463
                           int64_t pos, int size)
{
464
    bdrv_save_vmstate(opaque, buf, pos, size);
A
aliguori 已提交
465 466 467
    return size;
}

468
/*
 * get_buffer callback for block-device backed files: forwards to
 * bdrv_load_vmstate() and returns its result unchanged.
 */
static int block_get_buffer(void *opaque, uint8_t *buf, int64_t pos, int size)
{
    int loaded = bdrv_load_vmstate(opaque, buf, pos, size);

    return loaded;
}

/* close callback for block-device backed files: flush the device. */
static int bdrv_fclose(void *opaque)
{
    int flushed = bdrv_flush(opaque);

    return flushed;
}

478 479 480 481 482 483 484 485 486 487
/* Callbacks used by qemu_fopen_bdrv() for a read-only QEMUFile. */
static const QEMUFileOps bdrv_read_ops = {
    .get_buffer = block_get_buffer,
    .close =      bdrv_fclose
};

/* Callbacks used by qemu_fopen_bdrv() for a writable QEMUFile. */
static const QEMUFileOps bdrv_write_ops = {
    .put_buffer = block_put_buffer,
    .close =      bdrv_fclose
};

488
/*
 * Create a QEMUFile on top of block device @bs, using the write callbacks
 * when @is_writable is non-zero and the read callbacks otherwise.
 */
static QEMUFile *qemu_fopen_bdrv(BlockDriverState *bs, int is_writable)
{
    const QEMUFileOps *ops = is_writable ? &bdrv_write_ops : &bdrv_read_ops;

    return qemu_fopen_ops(bs, ops);
}

495
QEMUFile *qemu_fopen_ops(void *opaque, const QEMUFileOps *ops)
A
aliguori 已提交
496 497 498
{
    QEMUFile *f;

499
    f = g_malloc0(sizeof(QEMUFile));
A
aliguori 已提交
500 501

    f->opaque = opaque;
502
    f->ops = ops;
A
aliguori 已提交
503 504 505 506
    f->is_write = 0;
    return f;
}

507
/* Return the error recorded on @f, or 0 if none has been recorded. */
int qemu_file_get_error(QEMUFile *f)
{
    int err = f->last_error;

    return err;
}

512
/* Record @ret as the error of @f unless an error is already recorded. */
static void qemu_file_set_error(QEMUFile *f, int ret)
{
    if (f->last_error != 0) {
        return;
    }
    f->last_error = ret;
}

519 520 521
/** Flushes QEMUFile buffer
 *
 */
522
static void qemu_fflush(QEMUFile *f)
A
aliguori 已提交
523
{
524 525
    int ret = 0;

526 527 528
    if (!f->ops->put_buffer) {
        return;
    }
A
aliguori 已提交
529
    if (f->is_write && f->buf_index > 0) {
530
        ret = f->ops->put_buffer(f->opaque, f->buf, f->pos, f->buf_index);
531
        if (ret >= 0) {
532
            f->pos += f->buf_index;
533
        }
A
aliguori 已提交
534
        f->buf_index = 0;
535
        f->iovcnt = 0;
A
aliguori 已提交
536
    }
537 538 539
    if (ret < 0) {
        qemu_file_set_error(f, ret);
    }
A
aliguori 已提交
540 541 542 543 544
}

/*
 * Refill the read buffer of @f.
 *
 * Unread bytes are moved to the front of the buffer and the backend is
 * asked to fill the remaining space.  A zero-length read is recorded as
 * -EIO; any negative result other than -EAGAIN is recorded as the file's
 * error.  Aborts if @f has been used for writing.
 */
static void qemu_fill_buffer(QEMUFile *f)
{
    int unread;
    int got;

    if (!f->ops->get_buffer) {
        return;
    }

    if (f->is_write) {
        abort();
    }

    unread = f->buf_size - f->buf_index;
    if (unread > 0) {
        memmove(f->buf, f->buf + f->buf_index, unread);
    }
    f->buf_size = unread;
    f->buf_index = 0;

    got = f->ops->get_buffer(f->opaque, f->buf + unread, f->pos,
                             IO_BUF_SIZE - unread);
    if (got > 0) {
        f->buf_size += got;
        f->pos += got;
    } else if (got == 0) {
        qemu_file_set_error(f, -EIO);
    } else if (got != -EAGAIN) {
        qemu_file_set_error(f, got);
    }
}

P
Paolo Bonzini 已提交
571 572 573 574 575 576 577 578
/*
 * Return the descriptor behind @f, or -1 when the backend has no get_fd
 * callback.
 */
int qemu_get_fd(QEMUFile *f)
{
    if (!f->ops->get_fd) {
        return -1;
    }
    return f->ops->get_fd(f->opaque);
}

579 580 581 582 583 584 585 586 587 588
/** Closes the file
 *
 * Flushes pending data, invokes the backend close callback (if any) and
 * frees @f.
 *
 * Returns negative error value if any error happened on previous operations
 * or while closing the file. Returns 0 or positive number on success.
 *
 * The meaning of return value on success depends on the specific backend
 * being used.
 */
int qemu_fclose(QEMUFile *f)
{
    int result;

    qemu_fflush(f);
    result = qemu_file_get_error(f);

    if (f->ops->close) {
        int close_result = f->ops->close(f->opaque);

        if (result >= 0) {
            result = close_result;
        }
    }

    /* If any error was spotted before closing, we should report it
     * instead of the close() return value.
     */
    if (f->last_error) {
        result = f->last_error;
    }

    g_free(f);
    return result;
}

609 610 611 612 613 614 615 616 617 618 619 620
/*
 * Queue @size bytes at @buf in the iovec of @f.  When @buf starts exactly
 * where the last queued entry ends, that entry is extended instead of a new
 * one being added.
 */
static void add_to_iovec(QEMUFile *f, const uint8_t *buf, int size)
{
    struct iovec *slot;

    /* check for adjacent buffer and coalesce them */
    if (f->iovcnt > 0) {
        struct iovec *last = &f->iov[f->iovcnt - 1];

        if (buf == (uint8_t *)last->iov_base + last->iov_len) {
            last->iov_len += size;
            return;
        }
    }

    slot = &f->iov[f->iovcnt];
    slot->iov_base = (uint8_t *)buf;
    slot->iov_len = size;
    f->iovcnt++;
}

A
aliguori 已提交
621 622 623 624
/*
 * Append @size bytes from @buf to @f.
 *
 * Data is copied into the internal buffer in chunks; the buffer is flushed
 * whenever it or the iovec fills up.  Nothing is written once an error has
 * been recorded on @f, and copying stops as soon as a flush records one.
 * Aborts if unread data is still buffered on a file used for reading.
 */
void qemu_put_buffer(QEMUFile *f, const uint8_t *buf, int size)
{
    if (f->last_error) {
        return;
    }

    if (f->is_write == 0 && f->buf_index > 0) {
        fprintf(stderr,
                "Attempted to write to buffer while read buffer is not empty\n");
        abort();
    }

    while (size > 0) {
        int chunk = IO_BUF_SIZE - f->buf_index;

        if (chunk > size) {
            chunk = size;
        }

        memcpy(f->buf + f->buf_index, buf, chunk);
        add_to_iovec(f, f->buf + f->buf_index, chunk);
        f->is_write = 1;
        f->buf_index += chunk;
        f->bytes_xfer += chunk;

        buf += chunk;
        size -= chunk;

        if (f->buf_index >= IO_BUF_SIZE || f->iovcnt >= MAX_IOV_SIZE) {
            qemu_fflush(f);
            if (qemu_file_get_error(f)) {
                return;
            }
        }
    }
}

/*
 * Append the single byte @v to @f, flushing when the buffer or the iovec
 * is full.  Does nothing once an error has been recorded on @f.  Aborts if
 * unread data is still buffered on a file used for reading.
 */
void qemu_put_byte(QEMUFile *f, int v)
{
    uint8_t *slot;

    if (f->last_error) {
        return;
    }

    if (f->is_write == 0 && f->buf_index > 0) {
        fprintf(stderr,
                "Attempted to write to buffer while read buffer is not empty\n");
        abort();
    }

    slot = f->buf + f->buf_index;
    *slot = v;
    f->buf_index++;
    f->is_write = 1;
    f->bytes_xfer++;

    add_to_iovec(f, slot, 1);

    if (f->buf_index >= IO_BUF_SIZE || f->iovcnt >= MAX_IOV_SIZE) {
        qemu_fflush(f);
    }
}

678
/*
 * Advance the read index of @f by @size bytes.  The request is ignored when
 * it would move past the data currently buffered.
 */
static void qemu_file_skip(QEMUFile *f, int size)
{
    int target = f->buf_index + size;

    if (target <= f->buf_size) {
        f->buf_index = target;
    }
}

/*
 * Copy up to @size buffered bytes, starting @offset bytes past the current
 * read index, into @buf without consuming them.  The buffer is refilled
 * once if it holds fewer than @size bytes at that position.
 *
 * Returns the number of bytes copied, 0 when none are available.
 * Aborts if @f has been used for writing.
 */
static int qemu_peek_buffer(QEMUFile *f, uint8_t *buf, int size, size_t offset)
{
    int start;
    int avail;
    int count;

    if (f->is_write) {
        abort();
    }

    start = f->buf_index + offset;
    avail = f->buf_size - start;
    if (avail < size) {
        qemu_fill_buffer(f);
        start = f->buf_index + offset;
        avail = f->buf_size - start;
    }

    if (avail <= 0) {
        return 0;
    }

    count = (size > avail) ? avail : size;
    memcpy(buf, f->buf + start, count);
    return count;
}

/*
 * Read up to @size bytes from @f into @buf, consuming them.
 * Returns the number of bytes actually read, which is smaller than @size
 * when no more data could be obtained.
 */
int qemu_get_buffer(QEMUFile *f, uint8_t *buf, int size)
{
    int done = 0;

    while (done < size) {
        int got = qemu_peek_buffer(f, buf + done, size - done, 0);

        if (got == 0) {
            break;
        }
        qemu_file_skip(f, got);
        done += got;
    }
    return done;
}

733
/*
 * Return the byte @offset positions past the current read index without
 * consuming it, refilling the buffer once if needed.  Returns 0 when the
 * byte is not available.  Aborts if @f has been used for writing.
 */
static int qemu_peek_byte(QEMUFile *f, int offset)
{
    int where = f->buf_index + offset;

    if (f->is_write) {
        abort();
    }

    if (where < f->buf_size) {
        return f->buf[where];
    }

    qemu_fill_buffer(f);
    where = f->buf_index + offset;
    if (where >= f->buf_size) {
        return 0;
    }
    return f->buf[where];
}

A
aliguori 已提交
751 752
/* Read and consume one byte from @f (0 when none is available). */
int qemu_get_byte(QEMUFile *f)
{
    int byte = qemu_peek_byte(f, 0);

    qemu_file_skip(f, 1);
    return byte;
}

760
/* Flush pending writes and return the current position of @f. */
int64_t qemu_ftell(QEMUFile *f)
{
    int64_t where;

    qemu_fflush(f);
    where = f->pos;
    return where;
}

/*
 * Return 1 when the caller should stop sending for now: either an error is
 * recorded on @f, or a positive transfer limit has been exceeded.
 * Returns 0 otherwise.
 */
int qemu_file_rate_limit(QEMUFile *f)
{
    int over_limit;

    if (qemu_file_get_error(f)) {
        return 1;
    }
    over_limit = f->xfer_limit > 0 && f->bytes_xfer > f->xfer_limit;
    return over_limit ? 1 : 0;
}

M
Michael S. Tsirkin 已提交
777
/* Return the transfer limit currently set on @f. */
int64_t qemu_file_get_rate_limit(QEMUFile *f)
{
    int64_t limit = f->xfer_limit;

    return limit;
}

782
/* Set the transfer limit of @f to @limit. */
void qemu_file_set_rate_limit(QEMUFile *f, int64_t limit)
{
    QEMUFile *file = f;

    file->xfer_limit = limit;
}
786

787 788 789
/* Restart transfer accounting on @f by zeroing the byte counter. */
void qemu_file_reset_rate_limit(QEMUFile *f)
{
    QEMUFile *file = f;

    file->bytes_xfer = 0;
}

A
aliguori 已提交
792 793 794 795 796 797 798 799 800 801 802 803 804 805 806 807 808 809 810 811 812 813 814 815 816 817 818 819 820 821 822 823 824 825 826 827 828 829 830 831 832 833 834 835 836 837
/* Write the low 16 bits of @v to @f, most significant byte first. */
void qemu_put_be16(QEMUFile *f, unsigned int v)
{
    int shift;

    for (shift = 8; shift >= 0; shift -= 8) {
        qemu_put_byte(f, v >> shift);
    }
}

/* Write the low 32 bits of @v to @f, most significant byte first. */
void qemu_put_be32(QEMUFile *f, unsigned int v)
{
    int shift;

    for (shift = 24; shift >= 0; shift -= 8) {
        qemu_put_byte(f, v >> shift);
    }
}

/* Write @v to @f as two big-endian 32-bit words, high word first. */
void qemu_put_be64(QEMUFile *f, uint64_t v)
{
    uint64_t high = v >> 32;

    qemu_put_be32(f, high);
    qemu_put_be32(f, v);
}

/* Read a big-endian 16-bit value from @f. */
unsigned int qemu_get_be16(QEMUFile *f)
{
    unsigned int high = qemu_get_byte(f);
    unsigned int low = qemu_get_byte(f);

    return (high << 8) | low;
}

/*
 * Read a big-endian 32-bit value from @f.
 *
 * Each byte is converted to unsigned before shifting: qemu_get_byte()
 * returns int, and shifting a value of 0x80 or more left by 24 bits as a
 * signed int would overflow.
 */
unsigned int qemu_get_be32(QEMUFile *f)
{
    unsigned int v;
    v = (unsigned int)qemu_get_byte(f) << 24;
    v |= (unsigned int)qemu_get_byte(f) << 16;
    v |= (unsigned int)qemu_get_byte(f) << 8;
    v |= (unsigned int)qemu_get_byte(f);
    return v;
}

/* Read a big-endian 64-bit value from @f (high 32-bit word first). */
uint64_t qemu_get_be64(QEMUFile *f)
{
    uint64_t high = qemu_get_be32(f);
    uint64_t low = qemu_get_be32(f);

    return (high << 32) | low;
}

838 839 840 841 842 843 844 845 846 847 848 849 850 851 852 853 854 855 856 857 858 859 860 861

/* timer */

/*
 * Save timer @ts to @f: the value of qemu_timer_expire_time_ns() is
 * written as a big-endian 64-bit integer.
 */
void qemu_put_timer(QEMUFile *f, QEMUTimer *ts)
{
    uint64_t deadline = qemu_timer_expire_time_ns(ts);

    qemu_put_be64(f, deadline);
}

/*
 * Restore timer @ts from @f.  An all-ones expiry value deletes the timer;
 * any other value re-arms it at that time in nanoseconds.
 */
void qemu_get_timer(QEMUFile *f, QEMUTimer *ts)
{
    uint64_t deadline = qemu_get_be64(f);

    if (deadline == (uint64_t)-1) {
        qemu_del_timer(ts);
    } else {
        qemu_mod_timer_ns(ts, deadline);
    }
}


G
Gerd Hoffmann 已提交
862 863 864 865 866 867 868 869 870 871 872 873 874 875 876 877 878 879 880 881 882
/* bool: stored as a single byte */

static int get_bool(QEMUFile *f, void *pv, size_t size)
{
    bool *field = pv;

    *field = qemu_get_byte(f);
    return 0;
}

static void put_bool(QEMUFile *f, void *pv, size_t size)
{
    bool *field = pv;

    qemu_put_byte(f, *field);
}

const VMStateInfo vmstate_info_bool = {
    .name = "bool",
    .get  = get_bool,
    .put  = put_bool,
};

883 884 885 886 887 888 889 890 891
/* 8 bit signed int */

static int get_int8(QEMUFile *f, void *pv, size_t size)
{
    int8_t *field = pv;

    qemu_get_s8s(f, field);
    return 0;
}

static void put_int8(QEMUFile *f, void *pv, size_t size)
{
    int8_t *field = pv;

    qemu_put_s8s(f, field);
}

const VMStateInfo vmstate_info_int8 = {
    .name = "int8",
    .get  = get_int8,
    .put  = put_int8,
};

/* 16 bit signed int */

static int get_int16(QEMUFile *f, void *pv, size_t size)
{
    int16_t *field = pv;

    qemu_get_sbe16s(f, field);
    return 0;
}

static void put_int16(QEMUFile *f, void *pv, size_t size)
{
    int16_t *field = pv;

    qemu_put_sbe16s(f, field);
}

const VMStateInfo vmstate_info_int16 = {
    .name = "int16",
    .get  = get_int16,
    .put  = put_int16,
};

/* 32 bit signed int */

static int get_int32(QEMUFile *f, void *pv, size_t size)
{
    int32_t *field = pv;

    qemu_get_sbe32s(f, field);
    return 0;
}

static void put_int32(QEMUFile *f, void *pv, size_t size)
{
    int32_t *field = pv;

    qemu_put_sbe32s(f, field);
}

const VMStateInfo vmstate_info_int32 = {
    .name = "int32",
    .get  = get_int32,
    .put  = put_int32,
};

946 947 948 949 950 951 952 953 954 955 956 957 958 959 960 961 962 963 964 965
/* 32 bit int. Check that the received value is the same as the one
   in the field; the field itself is left untouched. */

static int get_int32_equal(QEMUFile *f, void *pv, size_t size)
{
    int32_t *field = pv;
    int32_t received;

    qemu_get_sbe32s(f, &received);
    return (*field == received) ? 0 : -EINVAL;
}

const VMStateInfo vmstate_info_int32_equal = {
    .name = "int32 equal",
    .get  = get_int32_equal,
    .put  = put_int32,
};

966 967 968 969 970 971 972 973 974 975 976 977 978 979 980 981 982 983 984 985
/* 32 bit int. Check that the received value is less than or equal to
   the one in the field.

   Returns 0 when received <= field and -EINVAL otherwise.  The previous
   comparison was reversed (it accepted received >= field), contradicting
   this contract.
   NOTE(review): the received value is only validated, not stored into the
   field - confirm that callers do not expect the field to be updated. */

static int get_int32_le(QEMUFile *f, void *pv, size_t size)
{
    int32_t *cur = pv;
    int32_t loaded;
    qemu_get_sbe32s(f, &loaded);

    if (loaded <= *cur) {
        return 0;
    }
    return -EINVAL;
}

const VMStateInfo vmstate_info_int32_le = {
    /* Distinct from vmstate_info_int32_equal's "int32 equal". */
    .name = "int32 le",
    .get  = get_int32_le,
    .put  = put_int32,
};

986 987 988 989 990 991 992 993 994
/* 64 bit signed int */

static int get_int64(QEMUFile *f, void *pv, size_t size)
{
    int64_t *field = pv;

    qemu_get_sbe64s(f, field);
    return 0;
}

static void put_int64(QEMUFile *f, void *pv, size_t size)
{
    int64_t *field = pv;

    qemu_put_sbe64s(f, field);
}

const VMStateInfo vmstate_info_int64 = {
    .name = "int64",
    .get  = get_int64,
    .put  = put_int64,
};

/* 8 bit unsigned int */

static int get_uint8(QEMUFile *f, void *pv, size_t size)
{
    uint8_t *field = pv;

    qemu_get_8s(f, field);
    return 0;
}

static void put_uint8(QEMUFile *f, void *pv, size_t size)
{
    uint8_t *field = pv;

    qemu_put_8s(f, field);
}

const VMStateInfo vmstate_info_uint8 = {
    .name = "uint8",
    .get  = get_uint8,
    .put  = put_uint8,
};

/* 16 bit unsigned int */

static int get_uint16(QEMUFile *f, void *pv, size_t size)
{
    uint16_t *field = pv;

    qemu_get_be16s(f, field);
    return 0;
}

static void put_uint16(QEMUFile *f, void *pv, size_t size)
{
    uint16_t *field = pv;

    qemu_put_be16s(f, field);
}

const VMStateInfo vmstate_info_uint16 = {
    .name = "uint16",
    .get  = get_uint16,
    .put  = put_uint16,
};

/* 32 bit unsigned int */

static int get_uint32(QEMUFile *f, void *pv, size_t size)
{
    uint32_t *field = pv;

    qemu_get_be32s(f, field);
    return 0;
}

static void put_uint32(QEMUFile *f, void *pv, size_t size)
{
    uint32_t *field = pv;

    qemu_put_be32s(f, field);
}

const VMStateInfo vmstate_info_uint32 = {
    .name = "uint32",
    .get  = get_uint32,
    .put  = put_uint32,
};

1070 1071 1072 1073 1074 1075 1076 1077 1078 1079 1080 1081 1082 1083 1084 1085 1086 1087 1088 1089 1090
/* 32 bit uint. Check that the received value is the same as the one
   in the field; the field itself is left untouched. */

static int get_uint32_equal(QEMUFile *f, void *pv, size_t size)
{
    uint32_t *field = pv;
    uint32_t received;

    qemu_get_be32s(f, &received);
    return (*field == received) ? 0 : -EINVAL;
}

const VMStateInfo vmstate_info_uint32_equal = {
    .name = "uint32 equal",
    .get  = get_uint32_equal,
    .put  = put_uint32,
};

1091 1092 1093 1094 1095 1096 1097 1098 1099
/* 64 bit unsigned int */

static int get_uint64(QEMUFile *f, void *pv, size_t size)
{
    uint64_t *field = pv;

    qemu_get_be64s(f, field);
    return 0;
}

static void put_uint64(QEMUFile *f, void *pv, size_t size)
{
    uint64_t *field = pv;

    qemu_put_be64s(f, field);
}

const VMStateInfo vmstate_info_uint64 = {
    .name = "uint64",
    .get  = get_uint64,
    .put  = put_uint64,
};

1112 1113 1114 1115 1116 1117 1118 1119 1120 1121 1122 1123 1124 1125 1126 1127 1128 1129 1130 1131 1132
/* 64 bit unsigned int. Check that the received value is the same as the
   one in the field; the field itself is left untouched. */

static int get_uint64_equal(QEMUFile *f, void *pv, size_t size)
{
    uint64_t *field = pv;
    uint64_t received;

    qemu_get_be64s(f, &received);
    return (*field == received) ? 0 : -EINVAL;
}

/* NOTE(review): the name says "int64" although the type is unsigned;
   kept as is because the string is visible at runtime - confirm before
   renaming. */
const VMStateInfo vmstate_info_uint64_equal = {
    .name = "int64 equal",
    .get  = get_uint64_equal,
    .put  = put_uint64,
};

1133 1134 1135 1136 1137 1138 1139 1140 1141 1142 1143 1144 1145 1146 1147
/* 8 bit unsigned int. Check that the received value is the same as the
   one already in the field; the field itself is never written. */

static int get_uint8_equal(QEMUFile *f, void *pv, size_t size)
{
    const uint8_t *expected = pv;
    uint8_t received;

    qemu_get_8s(f, &received);

    /* 0 on match, -EINVAL on mismatch */
    return (*expected == received) ? 0 : -EINVAL;
}

const VMStateInfo vmstate_info_uint8_equal = {
J
Juan Quintela 已提交
1148
    .name = "uint8 equal",
1149 1150 1151 1152
    .get  = get_uint8_equal,
    .put  = put_uint8,
};

1153 1154 1155 1156 1157 1158 1159 1160 1161 1162 1163 1164 1165 1166 1167 1168 1169 1170 1171 1172
/* 16 bit unsigned int. Check that the received value is the same as the
   one already in the field; the field itself is never written. */

static int get_uint16_equal(QEMUFile *f, void *pv, size_t size)
{
    const uint16_t *expected = pv;
    uint16_t received;

    qemu_get_be16s(f, &received);

    /* 0 on match, -EINVAL on mismatch */
    return (*expected == received) ? 0 : -EINVAL;
}

/* VMStateInfo for a 16 bit unsigned field that must match on load */
const VMStateInfo vmstate_info_uint16_equal = {
    .name = "uint16 equal",
    .get = get_uint16_equal,
    .put = put_uint16,
};

1173 1174 1175 1176 1177 1178 1179 1180 1181 1182 1183 1184 1185 1186 1187 1188 1189 1190 1191 1192 1193 1194 1195
/* floating point */

/* Read a 64 bit word from f and store it in the float64 field at pv
   via make_float64(). size is not used; always returns 0. */
static int get_float64(QEMUFile *f, void *pv, size_t size)
{
    float64 *field = pv;
    uint64_t raw = qemu_get_be64(f);

    *field = make_float64(raw);
    return 0;
}

/* Write the float64 field at pv to f as a 64 bit word.
   The field is read through a float64 pointer so that float64_val()
   receives the type it is declared for (mirrors get_float64()).
   size is not used. */
static void put_float64(QEMUFile *f, void *pv, size_t size)
{
    float64 *v = pv;

    qemu_put_be64(f, float64_val(*v));
}

/* VMStateInfo binding the float64 get/put helpers */
const VMStateInfo vmstate_info_float64 = {
    .name = "float64",
    .get = get_float64,
    .put = put_float64,
};

J
Juan Quintela 已提交
1196 1197 1198 1199 1200 1201 1202 1203 1204
/* timers */

/* Load the QEMUTimer at pv from f via qemu_get_timer().
   size is not used; always returns 0. */
static int get_timer(QEMUFile *f, void *pv, size_t size)
{
    QEMUTimer *timer = pv;

    qemu_get_timer(f, timer);
    return 0;
}

1205
/* Save the QEMUTimer at pv to f via qemu_put_timer(). size is not used. */
static void put_timer(QEMUFile *f, void *pv, size_t size)
{
    QEMUTimer *timer = pv;

    qemu_put_timer(f, timer);
}

/* VMStateInfo binding the timer get/put helpers */
const VMStateInfo vmstate_info_timer = {
    .name = "timer",
    .get = get_timer,
    .put = put_timer,
};

1217 1218 1219 1220 1221 1222 1223 1224 1225
/* uint8_t buffers */

/* Read size bytes from f into the buffer at pv; always returns 0. */
static int get_buffer(QEMUFile *f, void *pv, size_t size)
{
    uint8_t *dst = pv;

    qemu_get_buffer(f, dst, size);
    return 0;
}

1226
/* Write size bytes from the buffer at pv to f. */
static void put_buffer(QEMUFile *f, void *pv, size_t size)
{
    uint8_t *src = pv;

    qemu_put_buffer(f, src, size);
}

/* VMStateInfo binding the raw byte buffer get/put helpers */
const VMStateInfo vmstate_info_buffer = {
    .name = "buffer",
    .get = get_buffer,
    .put = put_buffer,
};

J
Juan Quintela 已提交
1238
/* unused buffers: space that was used for some fields that are
1239
   not useful anymore */
J
Juan Quintela 已提交
1240 1241 1242

static int get_unused_buffer(QEMUFile *f, void *pv, size_t size)
{
J
Jan Kiszka 已提交
1243 1244 1245 1246 1247 1248 1249 1250 1251
    uint8_t buf[1024];
    int block_len;

    while (size > 0) {
        block_len = MIN(sizeof(buf), size);
        size -= block_len;
        qemu_get_buffer(f, buf, block_len);
    }
   return 0;
J
Juan Quintela 已提交
1252 1253 1254 1255
}

/* Emit size zero bytes to f as a placeholder. pv is not read.
   The zeros come from a static (hence zero-initialised) buffer, written
   in chunks of at most sizeof(zeros) bytes. */
static void put_unused_buffer(QEMUFile *f, void *pv, size_t size)
{
    static const uint8_t zeros[1024];

    while (size > 0) {
        int chunk = MIN(sizeof(zeros), size);

        qemu_put_buffer(f, zeros, chunk);
        size -= chunk;
    }
}

/* VMStateInfo for padding that is skipped on load and zero-filled on save */
const VMStateInfo vmstate_info_unused_buffer = {
    .name = "unused_buffer",
    .get = get_unused_buffer,
    .put = put_unused_buffer,
};

1272 1273 1274 1275 1276 1277 1278 1279 1280 1281 1282 1283 1284 1285 1286 1287 1288 1289 1290 1291 1292 1293 1294 1295 1296 1297 1298 1299 1300 1301 1302 1303 1304 1305 1306 1307 1308 1309 1310 1311
/* bitmaps (as defined by bitmap.h). Note that size here is the size
 * of the bitmap in bits. The on-the-wire format of a bitmap is 64
 * bit words with the bits in big endian order. The in-memory format
 * is an array of 'unsigned long', which may be either 32 or 64 bits.
 */
/* This is the number of 64 bit words sent over the wire */
#define BITS_TO_U64S(nr) DIV_ROUND_UP(nr, 64)

/* Load a bitmap of size bits from f into the 'unsigned long' array at pv.
   Always returns 0. */
static int get_bitmap(QEMUFile *f, void *pv, size_t size)
{
    unsigned long *words = pv;
    int n, pos = 0;

    for (n = 0; n < BITS_TO_U64S(size); n++) {
        uint64_t wire = qemu_get_be64(f);

        /* Low half on 32 bit hosts, the whole word on 64 bit hosts */
        words[pos++] = wire;
        /* 32 bit hosts: also store the high half, unless the bitmap
           ends before that 'unsigned long' */
        if (sizeof(unsigned long) == 4 && pos < BITS_TO_LONGS(size)) {
            words[pos++] = wire >> 32;
        }
    }
    return 0;
}

/* Save a bitmap of size bits from the 'unsigned long' array at pv to f
   as a sequence of 64 bit words. */
static void put_bitmap(QEMUFile *f, void *pv, size_t size)
{
    unsigned long *words = pv;
    int n, pos = 0;

    for (n = 0; n < BITS_TO_U64S(size); n++) {
        uint64_t wire = words[pos++];

        /* 32 bit hosts: merge the next 'unsigned long' in as the high
           half, unless the bitmap ends before it */
        if (sizeof(unsigned long) == 4 && pos < BITS_TO_LONGS(size)) {
            wire |= ((uint64_t)words[pos++]) << 32;
        }
        qemu_put_be64(f, wire);
    }
}

/* VMStateInfo binding the bitmap get/put helpers */
const VMStateInfo vmstate_info_bitmap = {
    .name = "bitmap",
    .get  = get_bitmap,
    .put  = put_bitmap,
};

1312 1313 1314 1315 1316
/* Legacy identity of a handler registered with a device path: the bare
   id string (no path prefix) and its instance number. find_se() falls
   back to it when looking up sections from an older stream. */
typedef struct CompatEntry {
    char idstr[256];    /* id string without the device path prefix */
    int instance_id;    /* instance number within that bare id string */
} CompatEntry;

A
aliguori 已提交
1317
typedef struct SaveStateEntry {
B
Blue Swirl 已提交
1318
    QTAILQ_ENTRY(SaveStateEntry) entry;
A
aliguori 已提交
1319 1320
    char idstr[256];
    int instance_id;
J
Jan Kiszka 已提交
1321
    int alias_id;
A
aliguori 已提交
1322 1323
    int version_id;
    int section_id;
1324
    SaveVMHandlers *ops;
1325
    const VMStateDescription *vmsd;
A
aliguori 已提交
1326
    void *opaque;
1327
    CompatEntry *compat;
1328
    int no_migrate;
1329
    int is_ram;
A
aliguori 已提交
1330 1331
} SaveStateEntry;

L
lirans@il.ibm.com 已提交
1332

B
Blue Swirl 已提交
1333 1334
static QTAILQ_HEAD(savevm_handlers, SaveStateEntry) savevm_handlers =
    QTAILQ_HEAD_INITIALIZER(savevm_handlers);
1335
static int global_section_id;
A
aliguori 已提交
1336

1337 1338 1339 1340 1341
static int calculate_new_instance_id(const char *idstr)
{
    SaveStateEntry *se;
    int instance_id = 0;

B
Blue Swirl 已提交
1342
    QTAILQ_FOREACH(se, &savevm_handlers, entry) {
1343 1344 1345 1346 1347 1348 1349 1350
        if (strcmp(idstr, se->idstr) == 0
            && instance_id <= se->instance_id) {
            instance_id = se->instance_id + 1;
        }
    }
    return instance_id;
}

1351 1352 1353 1354 1355 1356 1357 1358 1359 1360 1361 1362 1363 1364 1365 1366 1367
/* Same as calculate_new_instance_id(), but computed over the legacy
   (compat) id strings; entries without a compat record are ignored. */
static int calculate_compat_instance_id(const char *idstr)
{
    SaveStateEntry *cur;
    int next_id = 0;

    QTAILQ_FOREACH(cur, &savevm_handlers, entry) {
        const CompatEntry *legacy = cur->compat;

        if (!legacy || strcmp(idstr, legacy->idstr) != 0) {
            continue;
        }
        if (legacy->instance_id >= next_id) {
            next_id = legacy->instance_id + 1;
        }
    }
    return next_id;
}

A
aliguori 已提交
1368 1369 1370 1371
/* TODO: Individual devices generally have very little idea about the rest
   of the system, so instance_id should be removed/replaced.
   Meanwhile pass -1 as instance_id if you do not already have a clearly
   distinguishing id for all instances of your device class. */
A
Alex Williamson 已提交
1372 1373
int register_savevm_live(DeviceState *dev,
                         const char *idstr,
A
aliguori 已提交
1374 1375
                         int instance_id,
                         int version_id,
1376
                         SaveVMHandlers *ops,
A
aliguori 已提交
1377 1378
                         void *opaque)
{
1379
    SaveStateEntry *se;
A
aliguori 已提交
1380

1381
    se = g_malloc0(sizeof(SaveStateEntry));
A
aliguori 已提交
1382 1383
    se->version_id = version_id;
    se->section_id = global_section_id++;
1384
    se->ops = ops;
A
aliguori 已提交
1385
    se->opaque = opaque;
1386
    se->vmsd = NULL;
1387
    se->no_migrate = 0;
1388
    /* if this is a live_savem then set is_ram */
1389
    if (ops->save_live_setup != NULL) {
1390 1391
        se->is_ram = 1;
    }
A
aliguori 已提交
1392

1393 1394
    if (dev) {
        char *id = qdev_get_dev_path(dev);
1395 1396 1397
        if (id) {
            pstrcpy(se->idstr, sizeof(se->idstr), id);
            pstrcat(se->idstr, sizeof(se->idstr), "/");
1398
            g_free(id);
1399

1400
            se->compat = g_malloc0(sizeof(CompatEntry));
1401 1402 1403 1404 1405 1406 1407 1408
            pstrcpy(se->compat->idstr, sizeof(se->compat->idstr), idstr);
            se->compat->instance_id = instance_id == -1 ?
                         calculate_compat_instance_id(idstr) : instance_id;
            instance_id = -1;
        }
    }
    pstrcat(se->idstr, sizeof(se->idstr), idstr);

1409
    if (instance_id == -1) {
1410
        se->instance_id = calculate_new_instance_id(se->idstr);
1411 1412
    } else {
        se->instance_id = instance_id;
A
aliguori 已提交
1413
    }
1414
    assert(!se->compat || se->instance_id == 0);
1415
    /* add at the end of list */
B
Blue Swirl 已提交
1416
    QTAILQ_INSERT_TAIL(&savevm_handlers, se, entry);
A
aliguori 已提交
1417 1418 1419
    return 0;
}

A
Alex Williamson 已提交
1420 1421
/* Convenience wrapper around register_savevm_live() for handlers that
   only provide save_state/load_state callbacks. A zeroed SaveVMHandlers
   is allocated here and handed to the new entry. Returns the result of
   register_savevm_live(). */
int register_savevm(DeviceState *dev,
                    const char *idstr,
                    int instance_id,
                    int version_id,
                    SaveStateHandler *save_state,
                    LoadStateHandler *load_state,
                    void *opaque)
{
    SaveVMHandlers *handlers = g_malloc0(sizeof(SaveVMHandlers));

    handlers->save_state = save_state;
    handlers->load_state = load_state;

    return register_savevm_live(dev, idstr, instance_id, version_id,
                                handlers, opaque);
}

A
Alex Williamson 已提交
1435
/* Remove and free every entry whose id string is "<device path>/<idstr>"
   (or just idstr when no device path is available) and whose opaque
   pointer equals opaque. The entry's compat record and ops table are
   freed along with it. */
void unregister_savevm(DeviceState *dev, const char *idstr, void *opaque)
{
    SaveStateEntry *se, *next;
    char id[256] = "";
    char *path = dev ? qdev_get_dev_path(dev) : NULL;

    if (path) {
        pstrcpy(id, sizeof(id), path);
        pstrcat(id, sizeof(id), "/");
        g_free(path);
    }
    pstrcat(id, sizeof(id), idstr);

    QTAILQ_FOREACH_SAFE(se, &savevm_handlers, entry, next) {
        if (se->opaque != opaque || strcmp(se->idstr, id) != 0) {
            continue;
        }
        QTAILQ_REMOVE(&savevm_handlers, se, entry);
        /* g_free() ignores NULL, so compat needs no guard */
        g_free(se->compat);
        g_free(se->ops);
        g_free(se);
    }
}

A
Alex Williamson 已提交
1462
int vmstate_register_with_alias_id(DeviceState *dev, int instance_id,
J
Jan Kiszka 已提交
1463 1464 1465
                                   const VMStateDescription *vmsd,
                                   void *opaque, int alias_id,
                                   int required_for_version)
1466
{
1467
    SaveStateEntry *se;
1468

J
Jan Kiszka 已提交
1469 1470 1471
    /* If this triggers, alias support can be dropped for the vmsd. */
    assert(alias_id == -1 || required_for_version >= vmsd->minimum_version_id);

1472
    se = g_malloc0(sizeof(SaveStateEntry));
1473 1474 1475 1476
    se->version_id = vmsd->version_id;
    se->section_id = global_section_id++;
    se->opaque = opaque;
    se->vmsd = vmsd;
J
Jan Kiszka 已提交
1477
    se->alias_id = alias_id;
1478
    se->no_migrate = vmsd->unmigratable;
1479

1480 1481
    if (dev) {
        char *id = qdev_get_dev_path(dev);
1482 1483 1484
        if (id) {
            pstrcpy(se->idstr, sizeof(se->idstr), id);
            pstrcat(se->idstr, sizeof(se->idstr), "/");
1485
            g_free(id);
1486

1487
            se->compat = g_malloc0(sizeof(CompatEntry));
1488 1489 1490 1491 1492 1493 1494 1495
            pstrcpy(se->compat->idstr, sizeof(se->compat->idstr), vmsd->name);
            se->compat->instance_id = instance_id == -1 ?
                         calculate_compat_instance_id(vmsd->name) : instance_id;
            instance_id = -1;
        }
    }
    pstrcat(se->idstr, sizeof(se->idstr), vmsd->name);

1496
    if (instance_id == -1) {
1497
        se->instance_id = calculate_new_instance_id(se->idstr);
1498 1499
    } else {
        se->instance_id = instance_id;
1500
    }
1501
    assert(!se->compat || se->instance_id == 0);
1502
    /* add at the end of list */
B
Blue Swirl 已提交
1503
    QTAILQ_INSERT_TAIL(&savevm_handlers, se, entry);
1504 1505 1506
    return 0;
}

A
Alex Williamson 已提交
1507 1508
/* Remove and free every entry registered with this vmsd/opaque pair.
   dev is not consulted. */
void vmstate_unregister(DeviceState *dev, const VMStateDescription *vmsd,
                        void *opaque)
{
    SaveStateEntry *se, *next;

    QTAILQ_FOREACH_SAFE(se, &savevm_handlers, entry, next) {
        if (se->vmsd != vmsd || se->opaque != opaque) {
            continue;
        }
        QTAILQ_REMOVE(&savevm_handlers, se, entry);
        /* g_free() ignores NULL, so compat needs no guard */
        g_free(se->compat);
        g_free(se);
    }
}

J
Juan Quintela 已提交
1523 1524 1525 1526 1527
/* Forward declarations: the subsection helpers are defined further down
   but are called from vmstate_load_state()/vmstate_save_state(). */
static void vmstate_subsection_save(QEMUFile *f, const VMStateDescription *vmsd,
                                    void *opaque);
static int vmstate_subsection_load(QEMUFile *f, const VMStateDescription *vmsd,
                                   void *opaque);

1528 1529 1530 1531
/* Load the state described by vmsd from f into the structure at opaque.
 *
 * version_id is the version found in the stream:
 *   - newer than vmsd->version_id, or older than
 *     vmsd->minimum_version_id_old: rejected with -EINVAL;
 *   - older than vmsd->minimum_version_id: handed to
 *     vmsd->load_state_old, or rejected with -EINVAL when no such
 *     handler is provided;
 *   - otherwise every field that exists for this version is loaded,
 *     followed by any subsections.
 *
 * Returns 0 on success, the first non-zero pre_load result or negative
 * field/subsection error otherwise, or the result of vmsd->post_load
 * when that hook is set.
 */
int vmstate_load_state(QEMUFile *f, const VMStateDescription *vmsd,
                       void *opaque, int version_id)
{
    VMStateField *field = vmsd->fields;
    int ret;

    if (version_id > vmsd->version_id) {
        return -EINVAL;
    }
    if (version_id < vmsd->minimum_version_id_old) {
        return -EINVAL;
    }
    if (version_id < vmsd->minimum_version_id) {
        /* Do not call through a NULL legacy loader */
        if (!vmsd->load_state_old) {
            return -EINVAL;
        }
        return vmsd->load_state_old(f, opaque, version_id);
    }
    if (vmsd->pre_load) {
        ret = vmsd->pre_load(opaque);
        if (ret) {
            return ret;
        }
    }
    while (field->name) {
        if ((field->field_exists &&
             field->field_exists(opaque, version_id)) ||
            (!field->field_exists &&
             field->version_id <= version_id)) {
            void *base_addr = opaque + field->offset;
            int i, n_elems = 1;
            int size = field->size;

            /* Variable sized buffer: size lives in the structure */
            if (field->flags & VMS_VBUFFER) {
                size = *(int32_t *)(opaque+field->size_offset);
                if (field->flags & VMS_MULTIPLY) {
                    size *= field->size;
                }
            }
            /* Element count: fixed, or read from the structure */
            if (field->flags & VMS_ARRAY) {
                n_elems = field->num;
            } else if (field->flags & VMS_VARRAY_INT32) {
                n_elems = *(int32_t *)(opaque+field->num_offset);
            } else if (field->flags & VMS_VARRAY_UINT32) {
                n_elems = *(uint32_t *)(opaque+field->num_offset);
            } else if (field->flags & VMS_VARRAY_UINT16) {
                n_elems = *(uint16_t *)(opaque+field->num_offset);
            } else if (field->flags & VMS_VARRAY_UINT8) {
                n_elems = *(uint8_t *)(opaque+field->num_offset);
            }
            /* The field holds a pointer to the data, not the data */
            if (field->flags & VMS_POINTER) {
                base_addr = *(void **)base_addr + field->start;
            }
            for (i = 0; i < n_elems; i++) {
                void *addr = base_addr + size * i;

                if (field->flags & VMS_ARRAY_OF_POINTER) {
                    addr = *(void **)addr;
                }
                if (field->flags & VMS_STRUCT) {
                    ret = vmstate_load_state(f, field->vmsd, addr,
                                             field->vmsd->version_id);
                } else {
                    ret = field->info->get(f, addr, size);
                }
                if (ret < 0) {
                    return ret;
                }
            }
        }
        field++;
    }
    ret = vmstate_subsection_load(f, vmsd, opaque);
    if (ret != 0) {
        return ret;
    }
    if (vmsd->post_load) {
        return vmsd->post_load(opaque, version_id);
    }
    return 0;
}

/* Save the structure at opaque to f as described by vmsd.
 *
 * Calls vmsd->pre_save first (when set), then writes every field whose
 * field_exists hook is absent or returns true for vmsd->version_id, and
 * finally writes the subsections.
 */
void vmstate_save_state(QEMUFile *f, const VMStateDescription *vmsd,
                        void *opaque)
{
    VMStateField *field = vmsd->fields;

    if (vmsd->pre_save) {
        vmsd->pre_save(opaque);
    }
    for (; field->name; field++) {
        void *base_addr;
        int i, n_elems = 1;
        int size;

        /* Skip fields that report themselves as absent */
        if (field->field_exists &&
            !field->field_exists(opaque, vmsd->version_id)) {
            continue;
        }

        base_addr = opaque + field->offset;
        size = field->size;

        /* Variable sized buffer: size lives in the structure */
        if (field->flags & VMS_VBUFFER) {
            size = *(int32_t *)(opaque + field->size_offset);
            if (field->flags & VMS_MULTIPLY) {
                size *= field->size;
            }
        }
        /* Element count: fixed, or read from the structure */
        if (field->flags & VMS_ARRAY) {
            n_elems = field->num;
        } else if (field->flags & VMS_VARRAY_INT32) {
            n_elems = *(int32_t *)(opaque + field->num_offset);
        } else if (field->flags & VMS_VARRAY_UINT32) {
            n_elems = *(uint32_t *)(opaque + field->num_offset);
        } else if (field->flags & VMS_VARRAY_UINT16) {
            n_elems = *(uint16_t *)(opaque + field->num_offset);
        } else if (field->flags & VMS_VARRAY_UINT8) {
            n_elems = *(uint8_t *)(opaque + field->num_offset);
        }
        /* The field holds a pointer to the data, not the data */
        if (field->flags & VMS_POINTER) {
            base_addr = *(void **)base_addr + field->start;
        }
        for (i = 0; i < n_elems; i++) {
            void *addr = base_addr + size * i;

            if (field->flags & VMS_ARRAY_OF_POINTER) {
                addr = *(void **)addr;
            }
            if (field->flags & VMS_STRUCT) {
                vmstate_save_state(f, field->vmsd, addr);
            } else {
                field->info->put(f, addr, size);
            }
        }
    }
    vmstate_subsection_save(f, vmsd, opaque);
}

1659 1660
/* Load one entry: through its VMStateDescription when it has one,
   otherwise through the old style load_state callback. Returns the
   result of whichever loader was used. */
static int vmstate_load(QEMUFile *f, SaveStateEntry *se, int version_id)
{
    if (se->vmsd) {
        return vmstate_load_state(f, se->vmsd, se->opaque, version_id);
    }
    /* Old style */
    return se->ops->load_state(f, se->opaque, version_id);
}

A
Alex Williamson 已提交
1667
/* Save one entry: through its VMStateDescription when it has one,
   otherwise through the old style save_state callback. */
static void vmstate_save(QEMUFile *f, SaveStateEntry *se)
{
    if (se->vmsd) {
        vmstate_save_state(f, se->vmsd, se->opaque);
    } else {
        /* Old style */
        se->ops->save_state(f, se->opaque);
    }
}

A
aliguori 已提交
1676 1677 1678 1679 1680 1681 1682 1683 1684
/* Stream header: magic ("QEVM" in ASCII) followed by the format version */
#define QEMU_VM_FILE_MAGIC           0x5145564d
#define QEMU_VM_FILE_VERSION_COMPAT  0x00000002
#define QEMU_VM_FILE_VERSION         0x00000003

/* Section type bytes */
#define QEMU_VM_EOF                  0x00
#define QEMU_VM_SECTION_START        0x01
#define QEMU_VM_SECTION_PART         0x02
#define QEMU_VM_SECTION_END          0x03
#define QEMU_VM_SECTION_FULL         0x04
#define QEMU_VM_SUBSECTION           0x05
A
aliguori 已提交
1686

L
Luiz Capitulino 已提交
1687
/* Return true, and set errp to QERR_MIGRATION_NOT_SUPPORTED naming the
   first offending entry, when any registered entry is marked
   no_migrate; return false otherwise. */
bool qemu_savevm_state_blocked(Error **errp)
{
    SaveStateEntry *se;

    QTAILQ_FOREACH(se, &savevm_handlers, entry) {
        if (!se->no_migrate) {
            continue;
        }
        error_set(errp, QERR_MIGRATION_NOT_SUPPORTED, se->idstr);
        return true;
    }
    return false;
}

1700 1701
/* Start a save: pass params to every handler that has set_params, write
 * the stream header, then emit a SECTION_START section for every active
 * handler that has save_live_setup.
 *
 * If a save_live_setup callback fails, the error is recorded on f and
 * the remaining handlers are not processed.
 */
void qemu_savevm_state_begin(QEMUFile *f,
                             const MigrationParams *params)
{
    SaveStateEntry *se;
    int ret;

    QTAILQ_FOREACH(se, &savevm_handlers, entry) {
        if (se->ops && se->ops->set_params) {
            se->ops->set_params(params, se->opaque);
        }
    }

    qemu_put_be32(f, QEMU_VM_FILE_MAGIC);
    qemu_put_be32(f, QEMU_VM_FILE_VERSION);

    QTAILQ_FOREACH(se, &savevm_handlers, entry) {
        int len;

        if (!se->ops || !se->ops->save_live_setup) {
            continue;
        }
        if (se->ops->is_active && !se->ops->is_active(se->opaque)) {
            continue;
        }

        /* Section type */
        qemu_put_byte(f, QEMU_VM_SECTION_START);
        qemu_put_be32(f, se->section_id);

        /* ID string */
        len = strlen(se->idstr);
        qemu_put_byte(f, len);
        qemu_put_buffer(f, (uint8_t *)se->idstr, len);

        qemu_put_be32(f, se->instance_id);
        qemu_put_be32(f, se->version_id);

        ret = se->ops->save_live_setup(f, se->opaque);
        if (ret < 0) {
            qemu_file_set_error(f, ret);
            break;
        }
    }
}

J
Juan Quintela 已提交
1747
/*
D
Dong Xu Wang 已提交
1748
 * this function has three return values:
J
Juan Quintela 已提交
1749 1750 1751 1752
 *   negative: there was one error, and we have -errno.
 *   0 : We haven't finished, caller have to go again
 *   1 : We have finished, we can go to complete phase
 */
1753
int qemu_savevm_state_iterate(QEMUFile *f)
A
aliguori 已提交
1754 1755 1756 1757
{
    SaveStateEntry *se;
    int ret = 1;

B
Blue Swirl 已提交
1758
    QTAILQ_FOREACH(se, &savevm_handlers, entry) {
1759
        if (!se->ops || !se->ops->save_live_iterate) {
A
aliguori 已提交
1760
            continue;
1761
        }
1762 1763 1764 1765 1766
        if (se->ops && se->ops->is_active) {
            if (!se->ops->is_active(se->opaque)) {
                continue;
            }
        }
1767 1768 1769
        if (qemu_file_rate_limit(f)) {
            return 0;
        }
1770
        trace_savevm_section_start();
A
aliguori 已提交
1771 1772 1773 1774
        /* Section type */
        qemu_put_byte(f, QEMU_VM_SECTION_PART);
        qemu_put_be32(f, se->section_id);

1775
        ret = se->ops->save_live_iterate(f, se->opaque);
1776 1777
        trace_savevm_section_end(se->section_id);

1778 1779 1780
        if (ret < 0) {
            qemu_file_set_error(f, ret);
        }
1781
        if (ret <= 0) {
1782 1783 1784 1785 1786 1787
            /* Do not proceed to the next vmstate before this one reported
               completion of the current stage. This serializes the migration
               and reduces the probability that a faster changing state is
               synchronized over and over again. */
            break;
        }
A
aliguori 已提交
1788
    }
J
Juan Quintela 已提交
1789
    return ret;
A
aliguori 已提交
1790 1791
}

1792
/* Finish a save.
 *
 * After synchronizing CPU state, emits a SECTION_END section for every
 * active handler that has save_live_complete, then a SECTION_FULL
 * section for every entry that has a vmsd or a save_state callback,
 * then the EOF marker, and flushes f.
 *
 * If a save_live_complete callback fails, the error is recorded on f
 * and the function returns immediately, without writing anything else.
 */
void qemu_savevm_state_complete(QEMUFile *f)
{
    SaveStateEntry *se;
    int ret;

    cpu_synchronize_all_states();

    QTAILQ_FOREACH(se, &savevm_handlers, entry) {
        if (!se->ops || !se->ops->save_live_complete) {
            continue;
        }
        if (se->ops->is_active && !se->ops->is_active(se->opaque)) {
            continue;
        }
        trace_savevm_section_start();
        /* Section type */
        qemu_put_byte(f, QEMU_VM_SECTION_END);
        qemu_put_be32(f, se->section_id);

        ret = se->ops->save_live_complete(f, se->opaque);
        trace_savevm_section_end(se->section_id);
        if (ret < 0) {
            qemu_file_set_error(f, ret);
            return;
        }
    }

    QTAILQ_FOREACH(se, &savevm_handlers, entry) {
        int len;

        /* Nothing to save without a vmsd or a save_state callback */
        if (!se->vmsd && !(se->ops && se->ops->save_state)) {
            continue;
        }
        trace_savevm_section_start();
        /* Section type */
        qemu_put_byte(f, QEMU_VM_SECTION_FULL);
        qemu_put_be32(f, se->section_id);

        /* ID string */
        len = strlen(se->idstr);
        qemu_put_byte(f, len);
        qemu_put_buffer(f, (uint8_t *)se->idstr, len);

        qemu_put_be32(f, se->instance_id);
        qemu_put_be32(f, se->version_id);

        vmstate_save(f, se);
        trace_savevm_section_end(se->section_id);
    }

    qemu_put_byte(f, QEMU_VM_EOF);
    qemu_fflush(f);
}

1848 1849 1850 1851 1852 1853 1854 1855 1856 1857 1858 1859 1860 1861 1862 1863 1864 1865 1866
/* Return the sum of save_live_pending() over every active handler that
   provides it; max_size is passed through to each callback. */
uint64_t qemu_savevm_state_pending(QEMUFile *f, uint64_t max_size)
{
    SaveStateEntry *se;
    uint64_t total = 0;

    QTAILQ_FOREACH(se, &savevm_handlers, entry) {
        if (!se->ops || !se->ops->save_live_pending) {
            continue;
        }
        if (se->ops->is_active && !se->ops->is_active(se->opaque)) {
            continue;
        }
        total += se->ops->save_live_pending(f, se->opaque, max_size);
    }
    return total;
}

1867
void qemu_savevm_state_cancel(void)
1868 1869 1870 1871
{
    SaveStateEntry *se;

    QTAILQ_FOREACH(se, &savevm_handlers, entry) {
1872 1873
        if (se->ops && se->ops->cancel) {
            se->ops->cancel(se->opaque);
1874 1875 1876 1877
        }
    }
}

L
Luiz Capitulino 已提交
1878
/* Run a complete save to f: begin, iterate until done or until f
 * reports an error, then complete.
 *
 * Returns -EINVAL when saving is blocked, otherwise the error state of
 * f (0 on success). On failure the handlers' cancel callbacks are run.
 */
static int qemu_savevm_state(QEMUFile *f)
{
    MigrationParams params = {
        .blk = 0,
        .shared = 0
    };
    int ret;

    if (qemu_savevm_state_blocked(NULL)) {
        return -EINVAL;
    }

    /* the begin phase runs with the iothread mutex released */
    qemu_mutex_unlock_iothread();
    qemu_savevm_state_begin(f, &params);
    qemu_mutex_lock_iothread();

    /* keep iterating while there is no error and work remains */
    while (qemu_file_get_error(f) == 0 &&
           qemu_savevm_state_iterate(f) <= 0) {
        continue;
    }

    ret = qemu_file_get_error(f);
    if (ret == 0) {
        qemu_savevm_state_complete(f);
        ret = qemu_file_get_error(f);
    }
    if (ret != 0) {
        qemu_savevm_state_cancel();
    }
    return ret;
}

1911 1912 1913 1914 1915 1916 1917 1918 1919 1920 1921 1922 1923 1924 1925
/* Write the stream header followed by a SECTION_FULL section for every
   entry that is not flagged is_ram and has a vmsd or a save_state
   callback, then the EOF marker. Returns the error state of f. */
static int qemu_save_device_state(QEMUFile *f)
{
    SaveStateEntry *se;

    qemu_put_be32(f, QEMU_VM_FILE_MAGIC);
    qemu_put_be32(f, QEMU_VM_FILE_VERSION);

    cpu_synchronize_all_states();

    QTAILQ_FOREACH(se, &savevm_handlers, entry) {
        int len;

        if (se->is_ram) {
            continue;
        }
        /* Nothing to save without a vmsd or a save_state callback */
        if (!se->vmsd && !(se->ops && se->ops->save_state)) {
            continue;
        }

        /* Section type */
        qemu_put_byte(f, QEMU_VM_SECTION_FULL);
        qemu_put_be32(f, se->section_id);

        /* ID string */
        len = strlen(se->idstr);
        qemu_put_byte(f, len);
        qemu_put_buffer(f, (uint8_t *)se->idstr, len);

        qemu_put_be32(f, se->instance_id);
        qemu_put_be32(f, se->version_id);

        vmstate_save(f, se);
    }

    qemu_put_byte(f, QEMU_VM_EOF);

    return qemu_file_get_error(f);
}

A
aliguori 已提交
1950 1951 1952 1953
static SaveStateEntry *find_se(const char *idstr, int instance_id)
{
    SaveStateEntry *se;

B
Blue Swirl 已提交
1954
    QTAILQ_FOREACH(se, &savevm_handlers, entry) {
A
aliguori 已提交
1955
        if (!strcmp(se->idstr, idstr) &&
J
Jan Kiszka 已提交
1956 1957
            (instance_id == se->instance_id ||
             instance_id == se->alias_id))
A
aliguori 已提交
1958
            return se;
1959 1960 1961 1962 1963 1964 1965
        /* Migrating from an older version? */
        if (strstr(se->idstr, idstr) && se->compat) {
            if (!strcmp(se->compat->idstr, idstr) &&
                (instance_id == se->compat->instance_id ||
                 instance_id == se->alias_id))
                return se;
        }
A
aliguori 已提交
1966 1967 1968 1969
    }
    return NULL;
}

J
Juan Quintela 已提交
1970 1971 1972 1973 1974 1975 1976 1977 1978 1979 1980 1981 1982 1983
/* Scan the subsection table (terminated by an entry without a 'needed'
   hook) for a description named idstr. Returns it, or NULL when the
   table is NULL or has no such entry. */
static const VMStateDescription *vmstate_get_subsection(const VMStateSubsection *sub, char *idstr)
{
    if (!sub) {
        return NULL;
    }
    for (; sub->needed; sub++) {
        if (strcmp(idstr, sub->vmsd->name) == 0) {
            return sub->vmsd;
        }
    }
    return NULL;
}

/* Load every subsection of vmsd that follows at the current position
 * of f.
 *
 * The stream is only peeked until a subsection is positively identified
 * as belonging to vmsd, so anything else is left unread for the caller.
 *
 * Returns 0 when there is nothing (more) to load, -ENOENT when the
 * stream names a subsection of vmsd that is not in vmsd->subsections,
 * or the non-zero result of loading a subsection.
 */
static int vmstate_subsection_load(QEMUFile *f, const VMStateDescription *vmsd,
                                   void *opaque)
{
    while (qemu_peek_byte(f, 0) == QEMU_VM_SUBSECTION) {
        char idstr[256];
        int ret;
        /* Full width: the stream carries a 32 bit version id, which a
           uint8_t would silently truncate */
        int version_id;
        uint8_t len, size;
        const VMStateDescription *sub_vmsd;

        len = qemu_peek_byte(f, 1);
        if (len < strlen(vmsd->name) + 1) {
            /* subsection name has to be "section_name/a" */
            return 0;
        }
        size = qemu_peek_buffer(f, (uint8_t *)idstr, len, 2);
        if (size != len) {
            return 0;
        }
        idstr[size] = 0;

        if (strncmp(vmsd->name, idstr, strlen(vmsd->name)) != 0) {
            /* it doesn't have a valid subsection name */
            return 0;
        }
        sub_vmsd = vmstate_get_subsection(vmsd->subsections, idstr);
        if (sub_vmsd == NULL) {
            return -ENOENT;
        }
        /* Now consume what was only peeked so far */
        qemu_file_skip(f, 1); /* subsection */
        qemu_file_skip(f, 1); /* len */
        qemu_file_skip(f, len); /* idstr */
        version_id = qemu_get_be32(f);

        ret = vmstate_load_state(f, sub_vmsd, opaque, version_id);
        if (ret) {
            return ret;
        }
    }
    return 0;
}

/*
 * Write out the subsections of @vmsd whose 'needed' callback returns
 * non-zero for @opaque.
 *
 * For each such subsection the following is emitted to @f: a
 * QEMU_VM_SUBSECTION byte, the name length as one byte, the name (without
 * terminator), the version id via qemu_put_be32(), and then the state
 * itself via vmstate_save_state().
 */
static void vmstate_subsection_save(QEMUFile *f, const VMStateDescription *vmsd,
                                    void *opaque)
{
    const VMStateSubsection *sub;

    for (sub = vmsd->subsections; sub != NULL && sub->needed != NULL; sub++) {
        const VMStateDescription *sub_vmsd;
        uint8_t name_len;

        if (!sub->needed(opaque)) {
            continue;
        }

        sub_vmsd = sub->vmsd;
        name_len = strlen(sub_vmsd->name);

        qemu_put_byte(f, QEMU_VM_SUBSECTION);
        qemu_put_byte(f, name_len);
        qemu_put_buffer(f, (uint8_t *)sub_vmsd->name, name_len);
        qemu_put_be32(f, sub_vmsd->version_id);
        vmstate_save_state(f, sub_vmsd, opaque);
    }
}

A
aliguori 已提交
2043
typedef struct LoadStateEntry {
B
Blue Swirl 已提交
2044
    QLIST_ENTRY(LoadStateEntry) entry;
A
aliguori 已提交
2045 2046 2047 2048 2049 2050 2051
    SaveStateEntry *se;
    int section_id;
    int version_id;
} LoadStateEntry;

/*
 * Read a VM state stream from @f and hand each section to vmstate_load().
 *
 * The stream must start with QEMU_VM_FILE_MAGIC and QEMU_VM_FILE_VERSION.
 * START/FULL sections carry a full header (section id, id string, instance
 * id, version id); the entry found for them is remembered so that later
 * PART/END sections, which only carry the section id, can be matched.
 *
 * Returns:
 *   -EINVAL   loading is blocked, bad magic, truncated or unknown section,
 *             unsupported section version, unknown section type
 *   -ENOTSUP  unsupported file version
 *   < 0       whatever vmstate_load() reported
 *   otherwise the value of qemu_file_get_error(f) once the stream is read
 */
int qemu_loadvm_state(QEMUFile *f)
{
    QLIST_HEAD(, LoadStateEntry) loadvm_handlers =
        QLIST_HEAD_INITIALIZER(loadvm_handlers);
    LoadStateEntry *le, *new_le;
    uint8_t section_type;
    unsigned int v;
    int ret;

    if (qemu_savevm_state_blocked(NULL)) {
        return -EINVAL;
    }

    v = qemu_get_be32(f);
    if (v != QEMU_VM_FILE_MAGIC) {
        return -EINVAL;
    }

    v = qemu_get_be32(f);
    if (v == QEMU_VM_FILE_VERSION_COMPAT) {
        fprintf(stderr, "SaveVM v2 format is obsolete and don't work anymore\n");
        return -ENOTSUP;
    }
    if (v != QEMU_VM_FILE_VERSION) {
        return -ENOTSUP;
    }

    while ((section_type = qemu_get_byte(f)) != QEMU_VM_EOF) {
        uint32_t instance_id, version_id, section_id;
        SaveStateEntry *se;
        char idstr[257];
        int len;

        switch (section_type) {
        case QEMU_VM_SECTION_START:
        case QEMU_VM_SECTION_FULL:
            /* Read section start */
            section_id = qemu_get_be32(f);
            len = qemu_get_byte(f);
            /*
             * A short read would leave part of idstr uninitialised and
             * then use it for the lookup and the error message below.
             */
            if (qemu_get_buffer(f, (uint8_t *)idstr, len) != len) {
                fprintf(stderr, "Unable to read ID string for section %u\n",
                        section_id);
                ret = -EINVAL;
                goto out;
            }
            idstr[len] = 0;
            instance_id = qemu_get_be32(f);
            version_id = qemu_get_be32(f);

            /* Find savevm section */
            se = find_se(idstr, instance_id);
            if (se == NULL) {
                fprintf(stderr, "Unknown savevm section or instance '%s' %d\n", idstr, instance_id);
                ret = -EINVAL;
                goto out;
            }

            /* Validate version */
            if (version_id > se->version_id) {
                fprintf(stderr, "savevm: unsupported version %d for '%s' v%d\n",
                        version_id, idstr, se->version_id);
                ret = -EINVAL;
                goto out;
            }

            /* Add entry; it is released at 'out' together with all others */
            le = g_malloc0(sizeof(*le));

            le->se = se;
            le->section_id = section_id;
            le->version_id = version_id;
            QLIST_INSERT_HEAD(&loadvm_handlers, le, entry);

            ret = vmstate_load(f, le->se, le->version_id);
            if (ret < 0) {
                fprintf(stderr, "qemu: warning: error while loading state for instance 0x%x of device '%s'\n",
                        instance_id, idstr);
                goto out;
            }
            break;
        case QEMU_VM_SECTION_PART:
        case QEMU_VM_SECTION_END:
            section_id = qemu_get_be32(f);

            /* Look for the entry recorded by the matching START section */
            QLIST_FOREACH(le, &loadvm_handlers, entry) {
                if (le->section_id == section_id) {
                    break;
                }
            }
            if (le == NULL) {
                fprintf(stderr, "Unknown savevm section %d\n", section_id);
                ret = -EINVAL;
                goto out;
            }

            ret = vmstate_load(f, le->se, le->version_id);
            if (ret < 0) {
                fprintf(stderr, "qemu: warning: error while loading state section id %d\n",
                        section_id);
                goto out;
            }
            break;
        default:
            fprintf(stderr, "Unknown savevm section type %d\n", section_type);
            ret = -EINVAL;
            goto out;
        }
    }

    cpu_synchronize_all_post_init();

    ret = 0;

out:
    QLIST_FOREACH_SAFE(le, &loadvm_handlers, entry, new_le) {
        QLIST_REMOVE(le, entry);
        g_free(le);
    }

    /* A clean parse can still hide an error recorded on the file itself. */
    if (ret == 0) {
        ret = qemu_file_get_error(f);
    }

    return ret;
}

/*
 * Search the snapshot list of @bs for an entry whose id string or name
 * equals @name.
 *
 * On a match the entry is copied into @sn_info and 0 is returned.
 * Returns -ENOENT when nothing matches or when bdrv_snapshot_list()
 * reports a negative count.
 */
static int bdrv_snapshot_find(BlockDriverState *bs, QEMUSnapshotInfo *sn_info,
                              const char *name)
{
    QEMUSnapshotInfo *sn_tab;
    int count, idx;
    int ret = -ENOENT;

    count = bdrv_snapshot_list(bs, &sn_tab);
    if (count < 0) {
        return ret;
    }

    for (idx = 0; idx < count; idx++) {
        QEMUSnapshotInfo *cand = &sn_tab[idx];

        if (strcmp(cand->id_str, name) == 0 || strcmp(cand->name, name) == 0) {
            *sn_info = *cand;
            ret = 0;
            break;
        }
    }

    g_free(sn_tab);
    return ret;
}

2191 2192 2193 2194 2195 2196 2197 2198 2199
/*
 * Delete the snapshot called @name from every block device returned by
 * bdrv_next() that supports snapshots and actually has such a snapshot.
 *
 * Returns 0 on success.  On the first failed deletion a message is printed
 * on @mon and -1 is returned; remaining devices are not visited.
 */
static int del_existing_snapshots(Monitor *mon, const char *name)
{
    BlockDriverState *bs;
    QEMUSnapshotInfo found;

    for (bs = bdrv_next(NULL); bs != NULL; bs = bdrv_next(bs)) {
        if (!bdrv_can_snapshot(bs)) {
            continue;
        }
        if (bdrv_snapshot_find(bs, &found, name) < 0) {
            continue;
        }
        if (bdrv_snapshot_delete(bs, name) < 0) {
            monitor_printf(mon,
                           "Error while deleting snapshot on '%s'\n",
                           bdrv_get_device_name(bs));
            return -1;
        }
    }

    return 0;
}

2218
/*
 * Save the VM state plus a snapshot of every snapshot-capable block device.
 *
 * The optional "name" entry of @qdict selects the snapshot name; without it
 * a name of the form "vm-YYYYmmddHHMMSS" is generated from the current time.
 * Existing snapshots with the given name are deleted first.  The VM is
 * stopped for the duration and restarted afterwards if it was running.
 * Failures are reported with monitor_printf() on @mon.
 */
void do_savevm(Monitor *mon, const QDict *qdict)
{
    BlockDriverState *bs, *bs1;
    QEMUSnapshotInfo sn1, *sn = &sn1, old_sn1, *old_sn = &old_sn1;
    int ret;
    QEMUFile *f;
    int saved_vm_running;
    uint64_t vm_state_size;
    qemu_timeval tv;
    struct tm tm;
    const char *name = qdict_get_try_str(qdict, "name");

    /* Verify if there is a device that doesn't support snapshots and is writable */
    bs = NULL;
    while ((bs = bdrv_next(bs))) {

        if (!bdrv_is_inserted(bs) || bdrv_is_read_only(bs)) {
            continue;
        }

        if (!bdrv_can_snapshot(bs)) {
            monitor_printf(mon, "Device '%s' is writable but does not support snapshots.\n",
                               bdrv_get_device_name(bs));
            return;
        }
    }

    /* Device that will hold the VM state itself */
    bs = bdrv_snapshots();
    if (!bs) {
        monitor_printf(mon, "No block device can accept snapshots\n");
        return;
    }

    saved_vm_running = runstate_is_running();
    vm_stop(RUN_STATE_SAVE_VM);

    memset(sn, 0, sizeof(*sn));

    /* fill auxiliary fields */
    qemu_gettimeofday(&tv);
    sn->date_sec = tv.tv_sec;
    sn->date_nsec = tv.tv_usec * 1000;
    sn->vm_clock_nsec = qemu_get_clock_ns(vm_clock);

    if (name) {
        /* Reuse name and id of an existing snapshot that matches @name */
        ret = bdrv_snapshot_find(bs, old_sn, name);
        if (ret >= 0) {
            pstrcpy(sn->name, sizeof(sn->name), old_sn->name);
            pstrcpy(sn->id_str, sizeof(sn->id_str), old_sn->id_str);
        } else {
            pstrcpy(sn->name, sizeof(sn->name), name);
        }
    } else {
        /*
         * tv.tv_sec is not a time_t on every host (e.g. 'long' on OpenBSD),
         * so convert it by value instead of reinterpreting its storage
         * through a pointer cast.
         */
        time_t now = tv.tv_sec;

        localtime_r(&now, &tm);
        strftime(sn->name, sizeof(sn->name), "vm-%Y%m%d%H%M%S", &tm);
    }

    /* Delete old snapshots of the same name */
    if (name && del_existing_snapshots(mon, name) < 0) {
        goto the_end;
    }

    /* save the VM state */
    f = qemu_fopen_bdrv(bs, 1);
    if (!f) {
        monitor_printf(mon, "Could not open VM state file\n");
        goto the_end;
    }
    ret = qemu_savevm_state(f);
    vm_state_size = qemu_ftell(f);
    qemu_fclose(f);
    if (ret < 0) {
        monitor_printf(mon, "Error %d while writing VM\n", ret);
        goto the_end;
    }

    /* create the snapshots */

    bs1 = NULL;
    while ((bs1 = bdrv_next(bs1))) {
        if (bdrv_can_snapshot(bs1)) {
            /* Write VM state size only to the image that contains the state */
            sn->vm_state_size = (bs == bs1 ? vm_state_size : 0);
            ret = bdrv_snapshot_create(bs1, sn);
            if (ret < 0) {
                monitor_printf(mon, "Error while creating snapshot on '%s'\n",
                               bdrv_get_device_name(bs1));
            }
        }
    }

 the_end:
    if (saved_vm_running) {
        vm_start();
    }
}

2315 2316 2317 2318 2319 2320 2321 2322 2323 2324 2325 2326 2327 2328 2329 2330 2331 2332 2333 2334 2335 2336 2337 2338 2339
/*
 * Write the device state to the file called @filename.
 *
 * The VM is stopped while saving and restarted afterwards if it was running
 * on entry.  An error is stored in @errp when the file cannot be opened or
 * when qemu_save_device_state() returns a negative value.
 */
void qmp_xen_save_devices_state(const char *filename, Error **errp)
{
    int was_running = runstate_is_running();
    QEMUFile *f;

    vm_stop(RUN_STATE_SAVE_VM);

    f = qemu_fopen(filename, "wb");
    if (f) {
        int ret = qemu_save_device_state(f);

        qemu_fclose(f);
        if (ret < 0) {
            error_set(errp, QERR_IO_ERROR);
        }
    } else {
        error_set(errp, QERR_OPEN_FILE_FAILED, filename);
    }

    if (was_running) {
        vm_start();
    }
}

2340
int load_vmstate(const char *name)
A
aliguori 已提交
2341
{
2342
    BlockDriverState *bs, *bs_vm_state;
2343
    QEMUSnapshotInfo sn;
A
aliguori 已提交
2344
    QEMUFile *f;
G
Gerd Hoffmann 已提交
2345
    int ret;
A
aliguori 已提交
2346

2347 2348 2349 2350 2351 2352 2353 2354 2355 2356 2357
    bs_vm_state = bdrv_snapshots();
    if (!bs_vm_state) {
        error_report("No block device supports snapshots");
        return -ENOTSUP;
    }

    /* Don't even try to load empty VM states */
    ret = bdrv_snapshot_find(bs_vm_state, &sn, name);
    if (ret < 0) {
        return ret;
    } else if (sn.vm_state_size == 0) {
2358 2359
        error_report("This is a disk-only snapshot. Revert to it offline "
            "using qemu-img.");
2360 2361 2362 2363 2364
        return -EINVAL;
    }

    /* Verify if there is any device that doesn't support snapshots and is
    writable and check if the requested snapshot is available too. */
2365 2366
    bs = NULL;
    while ((bs = bdrv_next(bs))) {
2367

2368
        if (!bdrv_is_inserted(bs) || bdrv_is_read_only(bs)) {
2369 2370 2371 2372 2373 2374 2375 2376 2377
            continue;
        }

        if (!bdrv_can_snapshot(bs)) {
            error_report("Device '%s' is writable but does not support snapshots.",
                               bdrv_get_device_name(bs));
            return -ENOTSUP;
        }

2378 2379 2380 2381 2382 2383
        ret = bdrv_snapshot_find(bs, &sn, name);
        if (ret < 0) {
            error_report("Device '%s' does not have the requested snapshot '%s'",
                           bdrv_get_device_name(bs), name);
            return ret;
        }
A
aliguori 已提交
2384 2385 2386
    }

    /* Flush all IO requests so they don't interfere with the new state.  */
2387
    bdrv_drain_all();
A
aliguori 已提交
2388

2389 2390 2391 2392
    bs = NULL;
    while ((bs = bdrv_next(bs))) {
        if (bdrv_can_snapshot(bs)) {
            ret = bdrv_snapshot_goto(bs, name);
A
aliguori 已提交
2393
            if (ret < 0) {
2394 2395 2396
                error_report("Error %d while activating snapshot '%s' on '%s'",
                             ret, name, bdrv_get_device_name(bs));
                return ret;
A
aliguori 已提交
2397 2398 2399 2400 2401
            }
        }
    }

    /* restore the VM state */
2402
    f = qemu_fopen_bdrv(bs_vm_state, 0);
A
aliguori 已提交
2403
    if (!f) {
2404
        error_report("Could not open VM state file");
2405
        return -EINVAL;
A
aliguori 已提交
2406
    }
2407

J
Jan Kiszka 已提交
2408
    qemu_system_reset(VMRESET_SILENT);
A
aliguori 已提交
2409
    ret = qemu_loadvm_state(f);
2410

A
aliguori 已提交
2411 2412
    qemu_fclose(f);
    if (ret < 0) {
2413
        error_report("Error %d while loading VM state", ret);
2414
        return ret;
A
aliguori 已提交
2415
    }
2416

2417
    return 0;
2418 2419
}

2420
/*
 * Delete the snapshot named by the "name" entry of @qdict from every block
 * device that supports snapshots.
 *
 * A failure on one device is reported on @mon and does not stop the loop.
 */
void do_delvm(Monitor *mon, const QDict *qdict)
{
    const char *name = qdict_get_str(qdict, "name");
    BlockDriverState *bs;
    int ret;

    if (bdrv_snapshots() == NULL) {
        monitor_printf(mon, "No block device supports snapshots\n");
        return;
    }

    for (bs = bdrv_next(NULL); bs != NULL; bs = bdrv_next(bs)) {
        if (!bdrv_can_snapshot(bs)) {
            continue;
        }

        ret = bdrv_snapshot_delete(bs, name);
        if (ret >= 0) {
            continue;
        }

        if (ret == -ENOTSUP) {
            monitor_printf(mon,
                           "Snapshots not supported on device '%s'\n",
                           bdrv_get_device_name(bs));
        } else {
            monitor_printf(mon, "Error %d while deleting snapshot on "
                           "'%s'\n", ret, bdrv_get_device_name(bs));
        }
    }
}

2449
/*
 * Print on @mon the snapshots of the device returned by bdrv_snapshots()
 * that are also present (looked up by id string) on every other
 * snapshot-capable block device.
 *
 * @qdict is not used.
 */
void do_info_snapshots(Monitor *mon, const QDict *qdict)
{
    BlockDriverState *bs, *bs1;
    /* NULL so that the table can be freed on every path after the listing */
    QEMUSnapshotInfo *sn_tab = NULL, *sn, s, *sn_info = &s;
    int nb_sns, i, ret, available;
    int total;
    int *available_snapshots;
    char buf[256];

    bs = bdrv_snapshots();
    if (!bs) {
        monitor_printf(mon, "No available block device supports snapshots\n");
        return;
    }

    nb_sns = bdrv_snapshot_list(bs, &sn_tab);
    if (nb_sns < 0) {
        monitor_printf(mon, "bdrv_snapshot_list: error %d\n", nb_sns);
        return;
    }

    if (nb_sns == 0) {
        monitor_printf(mon, "There is no snapshot available.\n");
        /* Release the table here too, as bdrv_snapshot_find() does */
        g_free(sn_tab);
        return;
    }

    /* Indices into sn_tab of the snapshots available on all devices */
    available_snapshots = g_malloc0(sizeof(int) * nb_sns);
    total = 0;
    for (i = 0; i < nb_sns; i++) {
        sn = &sn_tab[i];
        available = 1;
        bs1 = NULL;

        while ((bs1 = bdrv_next(bs1))) {
            if (bdrv_can_snapshot(bs1) && bs1 != bs) {
                ret = bdrv_snapshot_find(bs1, sn_info, sn->id_str);
                if (ret < 0) {
                    available = 0;
                    break;
                }
            }
        }

        if (available) {
            available_snapshots[total] = i;
            total++;
        }
    }

    if (total > 0) {
        /* The dump is called with a NULL snapshot before the per-snapshot lines */
        monitor_printf(mon, "%s\n", bdrv_snapshot_dump(buf, sizeof(buf), NULL));
        for (i = 0; i < total; i++) {
            sn = &sn_tab[available_snapshots[i]];
            monitor_printf(mon, "%s\n", bdrv_snapshot_dump(buf, sizeof(buf), sn));
        }
    } else {
        monitor_printf(mon, "There is no suitable snapshot available\n");
    }

    g_free(sn_tab);
    g_free(available_snapshots);
}
2512 2513 2514

/*
 * Set the id string of the RAM behind @mr, using the region's name and @dev.
 * The RAM address is masked with TARGET_PAGE_MASK before it is passed on.
 */
void vmstate_register_ram(MemoryRegion *mr, DeviceState *dev)
{
    qemu_ram_set_idstr(
        memory_region_get_ram_addr(mr) & TARGET_PAGE_MASK,
        memory_region_name(mr),
        dev);
}

void vmstate_unregister_ram(MemoryRegion *mr, DeviceState *dev)
{
    /*
     * Intentionally empty: there is nothing to do while the implementation
     * is in RAMBlock.  Both parameters are unused.
     */
}

/* Register the RAM of @mr without an owning device (dev == NULL). */
void vmstate_register_ram_global(MemoryRegion *mr)
{
    vmstate_register_ram(mr, NULL);
}