migration.c 12.3 KB
Newer Older
A
aliguori 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15
/*
 * QEMU live migration
 *
 * Copyright IBM, Corp. 2008
 *
 * Authors:
 *  Anthony Liguori   <aliguori@us.ibm.com>
 *
 * This work is licensed under the terms of the GNU GPL, version 2.  See
 * the COPYING file in the top-level directory.
 *
 */

#include "qemu-common.h"
#include "migration.h"
A
aliguori 已提交
16
#include "monitor.h"
17 18 19 20
#include "buffered_file.h"
#include "sysemu.h"
#include "block.h"
#include "qemu_socket.h"
21
#include "block-migration.h"
22
#include "qemu-objects.h"
23 24 25 26

//#define DEBUG_MIGRATION

#ifdef DEBUG_MIGRATION
M
malc 已提交
27
#define DPRINTF(fmt, ...) \
28 29
    do { printf("migration: " fmt, ## __VA_ARGS__); } while (0)
#else
M
malc 已提交
30
#define DPRINTF(fmt, ...) \
31 32
    do { } while (0)
#endif
A
aliguori 已提交
33 34

/* Migration speed throttling */
M
Michael S. Tsirkin 已提交
35
static int64_t max_throttle = (32 << 20);
A
aliguori 已提交
36 37 38

static MigrationState *current_migration;

39 40 41
static NotifierList migration_state_notifiers =
    NOTIFIER_LIST_INITIALIZER(migration_state_notifiers);

J
Juan Quintela 已提交
42
int qemu_start_incoming_migration(const char *uri)
A
aliguori 已提交
43
{
A
aliguori 已提交
44
    const char *p;
J
Juan Quintela 已提交
45
    int ret;
A
aliguori 已提交
46 47

    if (strstart(uri, "tcp:", &p))
J
Juan Quintela 已提交
48
        ret = tcp_start_incoming_migration(p);
49 50
#if !defined(WIN32)
    else if (strstart(uri, "exec:", &p))
J
Juan Quintela 已提交
51
        ret =  exec_start_incoming_migration(p);
C
Chris Lalancette 已提交
52
    else if (strstart(uri, "unix:", &p))
J
Juan Quintela 已提交
53
        ret = unix_start_incoming_migration(p);
P
Paolo Bonzini 已提交
54
    else if (strstart(uri, "fd:", &p))
J
Juan Quintela 已提交
55
        ret = fd_start_incoming_migration(p);
56
#endif
J
Juan Quintela 已提交
57
    else {
A
aliguori 已提交
58
        fprintf(stderr, "unknown migration protocol: %s\n", uri);
J
Juan Quintela 已提交
59 60 61
        ret = -EPROTONOSUPPORT;
    }
    return ret;
A
aliguori 已提交
62 63
}

64 65 66 67 68 69 70 71 72
void process_incoming_migration(QEMUFile *f)
{
    if (qemu_loadvm_state(f) < 0) {
        fprintf(stderr, "load of migration failed\n");
        exit(0);
    }
    qemu_announce_self();
    DPRINTF("successfully loaded vm state\n");

73 74
    incoming_expected = false;

75
    if (autostart) {
76
        vm_start();
77 78 79
    } else {
        runstate_set(RSTATE_PRE_LAUNCH);
    }
80 81
}

82
int do_migrate(Monitor *mon, const QDict *qdict, QObject **ret_data)
A
aliguori 已提交
83
{
A
aliguori 已提交
84 85
    MigrationState *s = NULL;
    const char *p;
86 87 88
    int detach = qdict_get_try_bool(qdict, "detach", 0);
    int blk = qdict_get_try_bool(qdict, "blk", 0);
    int inc = qdict_get_try_bool(qdict, "inc", 0);
89
    const char *uri = qdict_get_str(qdict, "uri");
90 91 92 93

    if (current_migration &&
        current_migration->get_status(current_migration) == MIG_STATE_ACTIVE) {
        monitor_printf(mon, "migration already in progress\n");
94
        return -1;
95 96
    }

A
Alex Williamson 已提交
97 98 99 100
    if (qemu_savevm_state_blocked(mon)) {
        return -1;
    }

101
    if (strstart(uri, "tcp:", &p)) {
102
        s = tcp_start_outgoing_migration(mon, p, max_throttle, detach,
103
                                         blk, inc);
104
#if !defined(WIN32)
105
    } else if (strstart(uri, "exec:", &p)) {
106
        s = exec_start_outgoing_migration(mon, p, max_throttle, detach,
107
                                          blk, inc);
108
    } else if (strstart(uri, "unix:", &p)) {
109
        s = unix_start_outgoing_migration(mon, p, max_throttle, detach,
110
                                          blk, inc);
111
    } else if (strstart(uri, "fd:", &p)) {
L
lirans@il.ibm.com 已提交
112
        s = fd_start_outgoing_migration(mon, p, max_throttle, detach, 
113
                                        blk, inc);
114
#endif
115
    } else {
A
aliguori 已提交
116
        monitor_printf(mon, "unknown migration protocol: %s\n", uri);
117 118
        return -1;
    }
A
aliguori 已提交
119

120
    if (s == NULL) {
A
aliguori 已提交
121
        monitor_printf(mon, "migration failed\n");
122 123
        return -1;
    }
A
aliguori 已提交
124

125 126
    if (current_migration) {
        current_migration->release(current_migration);
A
aliguori 已提交
127
    }
128 129

    current_migration = s;
130
    notifier_list_notify(&migration_state_notifiers, NULL);
131
    return 0;
A
aliguori 已提交
132 133
}

134
int do_migrate_cancel(Monitor *mon, const QDict *qdict, QObject **ret_data)
A
aliguori 已提交
135 136 137 138
{
    MigrationState *s = current_migration;

    if (s)
A
aliguori 已提交
139
        s->cancel(s);
140 141

    return 0;
A
aliguori 已提交
142 143
}

144
int do_migrate_set_speed(Monitor *mon, const QDict *qdict, QObject **ret_data)
A
aliguori 已提交
145
{
146
    int64_t d;
147
    FdMigrationState *s;
A
aliguori 已提交
148

149
    d = qdict_get_int(qdict, "value");
M
Michael S. Tsirkin 已提交
150 151 152
    if (d < 0) {
        d = 0;
    }
153
    max_throttle = d;
154

155 156
    s = migrate_to_fms(current_migration);
    if (s && s->file) {
157 158
        qemu_file_set_rate_limit(s->file, max_throttle);
    }
159 160

    return 0;
A
aliguori 已提交
161 162
}

163 164 165 166 167 168 169 170 171 172 173
/* amount of nanoseconds we are willing to wait for migration to be down.
 * the choice of nanoseconds is because it is the maximum resolution that
 * get_clock() can achieve. It is an internal measure. All user-visible
 * units must be in seconds */
static uint64_t max_downtime = 30000000;

uint64_t migrate_max_downtime(void)
{
    return max_downtime;
}

174 175
int do_migrate_set_downtime(Monitor *mon, const QDict *qdict,
                            QObject **ret_data)
G
Glauber Costa 已提交
176 177 178
{
    double d;

179 180
    d = qdict_get_double(qdict, "value") * 1e9;
    d = MAX(0, MIN(UINT64_MAX, d));
G
Glauber Costa 已提交
181
    max_downtime = (uint64_t)d;
182 183

    return 0;
G
Glauber Costa 已提交
184 185
}

186 187
static void migrate_print_status(Monitor *mon, const char *name,
                                 const QDict *status_dict)
A
aliguori 已提交
188
{
189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232
    QDict *qdict;

    qdict = qobject_to_qdict(qdict_get(status_dict, name));

    monitor_printf(mon, "transferred %s: %" PRIu64 " kbytes\n", name,
                        qdict_get_int(qdict, "transferred") >> 10);
    monitor_printf(mon, "remaining %s: %" PRIu64 " kbytes\n", name,
                        qdict_get_int(qdict, "remaining") >> 10);
    monitor_printf(mon, "total %s: %" PRIu64 " kbytes\n", name,
                        qdict_get_int(qdict, "total") >> 10);
}

void do_info_migrate_print(Monitor *mon, const QObject *data)
{
    QDict *qdict;

    qdict = qobject_to_qdict(data);

    monitor_printf(mon, "Migration status: %s\n",
                   qdict_get_str(qdict, "status"));

    if (qdict_haskey(qdict, "ram")) {
        migrate_print_status(mon, "ram", qdict);
    }

    if (qdict_haskey(qdict, "disk")) {
        migrate_print_status(mon, "disk", qdict);
    }
}

static void migrate_put_status(QDict *qdict, const char *name,
                               uint64_t trans, uint64_t rem, uint64_t total)
{
    QObject *obj;

    obj = qobject_from_jsonf("{ 'transferred': %" PRId64 ", "
                               "'remaining': %" PRId64 ", "
                               "'total': %" PRId64 " }", trans, rem, total);
    qdict_put_obj(qdict, name, obj);
}

void do_info_migrate(Monitor *mon, QObject **ret_data)
{
    QDict *qdict;
A
aliguori 已提交
233
    MigrationState *s = current_migration;
A
aliguori 已提交
234

A
aliguori 已提交
235
    if (s) {
A
aliguori 已提交
236 237
        switch (s->get_status(s)) {
        case MIG_STATE_ACTIVE:
238 239 240 241 242 243
            qdict = qdict_new();
            qdict_put(qdict, "status", qstring_from_str("active"));

            migrate_put_status(qdict, "ram", ram_bytes_transferred(),
                               ram_bytes_remaining(), ram_bytes_total());

244
            if (blk_mig_active()) {
245 246 247
                migrate_put_status(qdict, "disk", blk_mig_bytes_transferred(),
                                   blk_mig_bytes_remaining(),
                                   blk_mig_bytes_total());
248
            }
249 250

            *ret_data = QOBJECT(qdict);
A
aliguori 已提交
251 252
            break;
        case MIG_STATE_COMPLETED:
253
            *ret_data = qobject_from_jsonf("{ 'status': 'completed' }");
A
aliguori 已提交
254 255
            break;
        case MIG_STATE_ERROR:
256
            *ret_data = qobject_from_jsonf("{ 'status': 'failed' }");
A
aliguori 已提交
257 258
            break;
        case MIG_STATE_CANCELLED:
259
            *ret_data = qobject_from_jsonf("{ 'status': 'cancelled' }");
A
aliguori 已提交
260 261
            break;
        }
A
aliguori 已提交
262 263 264
    }
}

265 266
/* shared migration helpers */

267
void migrate_fd_monitor_suspend(FdMigrationState *s, Monitor *mon)
268
{
269 270
    s->mon = mon;
    if (monitor_suspend(mon) == 0) {
M
malc 已提交
271
        DPRINTF("suspending monitor\n");
272 273
    } else {
        monitor_printf(mon, "terminal does not allow synchronous "
274
                       "migration, continuing detached\n");
275
    }
276 277
}

278 279
void migrate_fd_error(FdMigrationState *s)
{
M
malc 已提交
280
    DPRINTF("setting error state\n");
281
    s->state = MIG_STATE_ERROR;
282
    notifier_list_notify(&migration_state_notifiers, NULL);
283 284 285
    migrate_fd_cleanup(s);
}

286
int migrate_fd_cleanup(FdMigrationState *s)
287
{
288 289
    int ret = 0;

290 291 292
    qemu_set_fd_handler2(s->fd, NULL, NULL, NULL, NULL);

    if (s->file) {
M
malc 已提交
293
        DPRINTF("closing file\n");
294 295 296
        if (qemu_fclose(s->file) != 0) {
            ret = -1;
        }
297
        s->file = NULL;
298 299 300 301
    } else {
        if (s->mon) {
            monitor_resume(s->mon);
        }
302 303
    }

304
    if (s->fd != -1) {
305
        close(s->fd);
306
        s->fd = -1;
307
    }
308

309
    return ret;
310 311 312 313 314 315 316 317 318 319 320 321 322 323 324 325 326
}

void migrate_fd_put_notify(void *opaque)
{
    FdMigrationState *s = opaque;

    qemu_set_fd_handler2(s->fd, NULL, NULL, NULL, NULL);
    qemu_file_put_notify(s->file);
}

ssize_t migrate_fd_put_buffer(void *opaque, const void *data, size_t size)
{
    FdMigrationState *s = opaque;
    ssize_t ret;

    do {
        ret = s->write(s, data, size);
327
    } while (ret == -1 && ((s->get_error(s)) == EINTR));
328 329 330 331

    if (ret == -1)
        ret = -(s->get_error(s));

332
    if (ret == -EAGAIN) {
333
        qemu_set_fd_handler2(s->fd, NULL, NULL, migrate_fd_put_notify, s);
334 335
    } else if (ret < 0) {
        s->state = MIG_STATE_ERROR;
336
        notifier_list_notify(&migration_state_notifiers, NULL);
337
    }
338 339 340 341 342 343 344 345 346 347 348 349 350 351 352

    return ret;
}

void migrate_fd_connect(FdMigrationState *s)
{
    int ret;

    s->file = qemu_fopen_ops_buffered(s,
                                      s->bandwidth_limit,
                                      migrate_fd_put_buffer,
                                      migrate_fd_put_ready,
                                      migrate_fd_wait_for_unfreeze,
                                      migrate_fd_close);

M
malc 已提交
353
    DPRINTF("beginning savevm\n");
354
    ret = qemu_savevm_state_begin(s->mon, s->file, s->mig_state.blk,
L
lirans@il.ibm.com 已提交
355
                                  s->mig_state.shared);
356
    if (ret < 0) {
M
malc 已提交
357
        DPRINTF("failed, %d\n", ret);
358 359 360
        migrate_fd_error(s);
        return;
    }
L
lirans@il.ibm.com 已提交
361
    
362 363 364 365 366 367 368 369
    migrate_fd_put_ready(s);
}

void migrate_fd_put_ready(void *opaque)
{
    FdMigrationState *s = opaque;

    if (s->state != MIG_STATE_ACTIVE) {
M
malc 已提交
370
        DPRINTF("put_ready returning because of non-active state\n");
371 372 373
        return;
    }

M
malc 已提交
374
    DPRINTF("iterate\n");
375
    if (qemu_savevm_state_iterate(s->mon, s->file) == 1) {
376
        int state;
377 378
        int old_vm_running = vm_running;

M
malc 已提交
379
        DPRINTF("done iterating\n");
380
        vm_stop(RSTATE_PRE_MIGRATE);
381

382
        if ((qemu_savevm_state_complete(s->mon, s->file)) < 0) {
383 384 385
            if (old_vm_running) {
                vm_start();
            }
386 387 388 389
            state = MIG_STATE_ERROR;
        } else {
            state = MIG_STATE_COMPLETED;
        }
390 391 392 393 394 395
        if (migrate_fd_cleanup(s) < 0) {
            if (old_vm_running) {
                vm_start();
            }
            state = MIG_STATE_ERROR;
        }
396 397 398
        if (state == MIG_STATE_COMPLETED) {
            runstate_set(RSTATE_POST_MIGRATE);
        }
399
        s->state = state;
400
        notifier_list_notify(&migration_state_notifiers, NULL);
401 402 403 404 405 406 407 408 409 410 411 412 413 414 415 416
    }
}

int migrate_fd_get_status(MigrationState *mig_state)
{
    FdMigrationState *s = migrate_to_fms(mig_state);
    return s->state;
}

void migrate_fd_cancel(MigrationState *mig_state)
{
    FdMigrationState *s = migrate_to_fms(mig_state);

    if (s->state != MIG_STATE_ACTIVE)
        return;

M
malc 已提交
417
    DPRINTF("cancelling migration\n");
418 419

    s->state = MIG_STATE_CANCELLED;
420
    notifier_list_notify(&migration_state_notifiers, NULL);
421
    qemu_savevm_state_cancel(s->mon, s->file);
422 423 424 425 426 427 428 429

    migrate_fd_cleanup(s);
}

void migrate_fd_release(MigrationState *mig_state)
{
    FdMigrationState *s = migrate_to_fms(mig_state);

M
malc 已提交
430
    DPRINTF("releasing state\n");
431 432 433
   
    if (s->state == MIG_STATE_ACTIVE) {
        s->state = MIG_STATE_CANCELLED;
434
        notifier_list_notify(&migration_state_notifiers, NULL);
435 436
        migrate_fd_cleanup(s);
    }
437
    g_free(s);
438 439 440 441 442 443 444
}

void migrate_fd_wait_for_unfreeze(void *opaque)
{
    FdMigrationState *s = opaque;
    int ret;

M
malc 已提交
445
    DPRINTF("wait for unfreeze\n");
446 447 448 449 450 451 452 453 454 455 456 457 458 459 460 461
    if (s->state != MIG_STATE_ACTIVE)
        return;

    do {
        fd_set wfds;

        FD_ZERO(&wfds);
        FD_SET(s->fd, &wfds);

        ret = select(s->fd + 1, NULL, &wfds, NULL, NULL);
    } while (ret == -1 && (s->get_error(s)) == EINTR);
}

int migrate_fd_close(void *opaque)
{
    FdMigrationState *s = opaque;
462

463 464 465
    if (s->mon) {
        monitor_resume(s->mon);
    }
466
    qemu_set_fd_handler2(s->fd, NULL, NULL, NULL, NULL);
467 468
    return s->close(s);
}
469 470 471 472 473 474 475 476 477 478 479 480 481 482 483 484 485 486 487

void add_migration_state_change_notifier(Notifier *notify)
{
    notifier_list_add(&migration_state_notifiers, notify);
}

void remove_migration_state_change_notifier(Notifier *notify)
{
    notifier_list_remove(&migration_state_notifiers, notify);
}

int get_migration_state(void)
{
    if (current_migration) {
        return migrate_fd_get_status(current_migration);
    } else {
        return MIG_STATE_ERROR;
    }
}