migration.c 12.2 KB
Newer Older
A
aliguori 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15
/*
 * QEMU live migration
 *
 * Copyright IBM, Corp. 2008
 *
 * Authors:
 *  Anthony Liguori   <aliguori@us.ibm.com>
 *
 * This work is licensed under the terms of the GNU GPL, version 2.  See
 * the COPYING file in the top-level directory.
 *
 */

#include "qemu-common.h"
#include "migration.h"
A
aliguori 已提交
16
#include "monitor.h"
17 18 19 20
#include "buffered_file.h"
#include "sysemu.h"
#include "block.h"
#include "qemu_socket.h"
21
#include "block-migration.h"
22
#include "qemu-objects.h"
23 24 25 26

//#define DEBUG_MIGRATION

#ifdef DEBUG_MIGRATION
M
malc 已提交
27
#define DPRINTF(fmt, ...) \
28 29
    do { printf("migration: " fmt, ## __VA_ARGS__); } while (0)
#else
M
malc 已提交
30
#define DPRINTF(fmt, ...) \
31 32
    do { } while (0)
#endif
A
aliguori 已提交
33 34

/* Migration speed throttling */
M
Michael S. Tsirkin 已提交
35
static int64_t max_throttle = (32 << 20);
A
aliguori 已提交
36 37 38

static MigrationState *current_migration;

39 40 41
static NotifierList migration_state_notifiers =
    NOTIFIER_LIST_INITIALIZER(migration_state_notifiers);

J
Juan Quintela 已提交
42
int qemu_start_incoming_migration(const char *uri)
A
aliguori 已提交
43
{
A
aliguori 已提交
44
    const char *p;
J
Juan Quintela 已提交
45
    int ret;
A
aliguori 已提交
46 47

    if (strstart(uri, "tcp:", &p))
J
Juan Quintela 已提交
48
        ret = tcp_start_incoming_migration(p);
49 50
#if !defined(WIN32)
    else if (strstart(uri, "exec:", &p))
J
Juan Quintela 已提交
51
        ret =  exec_start_incoming_migration(p);
C
Chris Lalancette 已提交
52
    else if (strstart(uri, "unix:", &p))
J
Juan Quintela 已提交
53
        ret = unix_start_incoming_migration(p);
P
Paolo Bonzini 已提交
54
    else if (strstart(uri, "fd:", &p))
J
Juan Quintela 已提交
55
        ret = fd_start_incoming_migration(p);
56
#endif
J
Juan Quintela 已提交
57
    else {
A
aliguori 已提交
58
        fprintf(stderr, "unknown migration protocol: %s\n", uri);
J
Juan Quintela 已提交
59 60 61
        ret = -EPROTONOSUPPORT;
    }
    return ret;
A
aliguori 已提交
62 63
}

64 65 66 67 68 69 70 71 72
void process_incoming_migration(QEMUFile *f)
{
    if (qemu_loadvm_state(f) < 0) {
        fprintf(stderr, "load of migration failed\n");
        exit(0);
    }
    qemu_announce_self();
    DPRINTF("successfully loaded vm state\n");

73 74
    incoming_expected = false;

75 76 77 78
    if (autostart)
        vm_start();
}

79
int do_migrate(Monitor *mon, const QDict *qdict, QObject **ret_data)
A
aliguori 已提交
80
{
A
aliguori 已提交
81 82
    MigrationState *s = NULL;
    const char *p;
83 84 85
    int detach = qdict_get_try_bool(qdict, "detach", 0);
    int blk = qdict_get_try_bool(qdict, "blk", 0);
    int inc = qdict_get_try_bool(qdict, "inc", 0);
86
    const char *uri = qdict_get_str(qdict, "uri");
87 88 89 90

    if (current_migration &&
        current_migration->get_status(current_migration) == MIG_STATE_ACTIVE) {
        monitor_printf(mon, "migration already in progress\n");
91
        return -1;
92 93
    }

A
Alex Williamson 已提交
94 95 96 97
    if (qemu_savevm_state_blocked(mon)) {
        return -1;
    }

98
    if (strstart(uri, "tcp:", &p)) {
99
        s = tcp_start_outgoing_migration(mon, p, max_throttle, detach,
100
                                         blk, inc);
101
#if !defined(WIN32)
102
    } else if (strstart(uri, "exec:", &p)) {
103
        s = exec_start_outgoing_migration(mon, p, max_throttle, detach,
104
                                          blk, inc);
105
    } else if (strstart(uri, "unix:", &p)) {
106
        s = unix_start_outgoing_migration(mon, p, max_throttle, detach,
107
                                          blk, inc);
108
    } else if (strstart(uri, "fd:", &p)) {
L
lirans@il.ibm.com 已提交
109
        s = fd_start_outgoing_migration(mon, p, max_throttle, detach, 
110
                                        blk, inc);
111
#endif
112
    } else {
A
aliguori 已提交
113
        monitor_printf(mon, "unknown migration protocol: %s\n", uri);
114 115
        return -1;
    }
A
aliguori 已提交
116

117
    if (s == NULL) {
A
aliguori 已提交
118
        monitor_printf(mon, "migration failed\n");
119 120
        return -1;
    }
A
aliguori 已提交
121

122 123
    if (current_migration) {
        current_migration->release(current_migration);
A
aliguori 已提交
124
    }
125 126

    current_migration = s;
127
    notifier_list_notify(&migration_state_notifiers, NULL);
128
    return 0;
A
aliguori 已提交
129 130
}

131
int do_migrate_cancel(Monitor *mon, const QDict *qdict, QObject **ret_data)
A
aliguori 已提交
132 133 134 135
{
    MigrationState *s = current_migration;

    if (s)
A
aliguori 已提交
136
        s->cancel(s);
137 138

    return 0;
A
aliguori 已提交
139 140
}

141
int do_migrate_set_speed(Monitor *mon, const QDict *qdict, QObject **ret_data)
A
aliguori 已提交
142
{
143
    int64_t d;
144
    FdMigrationState *s;
A
aliguori 已提交
145

146
    d = qdict_get_int(qdict, "value");
M
Michael S. Tsirkin 已提交
147 148 149
    if (d < 0) {
        d = 0;
    }
150
    max_throttle = d;
151

152 153
    s = migrate_to_fms(current_migration);
    if (s && s->file) {
154 155
        qemu_file_set_rate_limit(s->file, max_throttle);
    }
156 157

    return 0;
A
aliguori 已提交
158 159
}

160 161 162 163 164 165 166 167 168 169 170
/* amount of nanoseconds we are willing to wait for migration to be down.
 * the choice of nanoseconds is because it is the maximum resolution that
 * get_clock() can achieve. It is an internal measure. All user-visible
 * units must be in seconds */
static uint64_t max_downtime = 30000000;

uint64_t migrate_max_downtime(void)
{
    return max_downtime;
}

171 172
int do_migrate_set_downtime(Monitor *mon, const QDict *qdict,
                            QObject **ret_data)
G
Glauber Costa 已提交
173 174 175
{
    double d;

176 177
    d = qdict_get_double(qdict, "value") * 1e9;
    d = MAX(0, MIN(UINT64_MAX, d));
G
Glauber Costa 已提交
178
    max_downtime = (uint64_t)d;
179 180

    return 0;
G
Glauber Costa 已提交
181 182
}

183 184
static void migrate_print_status(Monitor *mon, const char *name,
                                 const QDict *status_dict)
A
aliguori 已提交
185
{
186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229
    QDict *qdict;

    qdict = qobject_to_qdict(qdict_get(status_dict, name));

    monitor_printf(mon, "transferred %s: %" PRIu64 " kbytes\n", name,
                        qdict_get_int(qdict, "transferred") >> 10);
    monitor_printf(mon, "remaining %s: %" PRIu64 " kbytes\n", name,
                        qdict_get_int(qdict, "remaining") >> 10);
    monitor_printf(mon, "total %s: %" PRIu64 " kbytes\n", name,
                        qdict_get_int(qdict, "total") >> 10);
}

void do_info_migrate_print(Monitor *mon, const QObject *data)
{
    QDict *qdict;

    qdict = qobject_to_qdict(data);

    monitor_printf(mon, "Migration status: %s\n",
                   qdict_get_str(qdict, "status"));

    if (qdict_haskey(qdict, "ram")) {
        migrate_print_status(mon, "ram", qdict);
    }

    if (qdict_haskey(qdict, "disk")) {
        migrate_print_status(mon, "disk", qdict);
    }
}

static void migrate_put_status(QDict *qdict, const char *name,
                               uint64_t trans, uint64_t rem, uint64_t total)
{
    QObject *obj;

    obj = qobject_from_jsonf("{ 'transferred': %" PRId64 ", "
                               "'remaining': %" PRId64 ", "
                               "'total': %" PRId64 " }", trans, rem, total);
    qdict_put_obj(qdict, name, obj);
}

void do_info_migrate(Monitor *mon, QObject **ret_data)
{
    QDict *qdict;
A
aliguori 已提交
230
    MigrationState *s = current_migration;
A
aliguori 已提交
231

A
aliguori 已提交
232
    if (s) {
A
aliguori 已提交
233 234
        switch (s->get_status(s)) {
        case MIG_STATE_ACTIVE:
235 236 237 238 239 240
            qdict = qdict_new();
            qdict_put(qdict, "status", qstring_from_str("active"));

            migrate_put_status(qdict, "ram", ram_bytes_transferred(),
                               ram_bytes_remaining(), ram_bytes_total());

241
            if (blk_mig_active()) {
242 243 244
                migrate_put_status(qdict, "disk", blk_mig_bytes_transferred(),
                                   blk_mig_bytes_remaining(),
                                   blk_mig_bytes_total());
245
            }
246 247

            *ret_data = QOBJECT(qdict);
A
aliguori 已提交
248 249
            break;
        case MIG_STATE_COMPLETED:
250
            *ret_data = qobject_from_jsonf("{ 'status': 'completed' }");
A
aliguori 已提交
251 252
            break;
        case MIG_STATE_ERROR:
253
            *ret_data = qobject_from_jsonf("{ 'status': 'failed' }");
A
aliguori 已提交
254 255
            break;
        case MIG_STATE_CANCELLED:
256
            *ret_data = qobject_from_jsonf("{ 'status': 'cancelled' }");
A
aliguori 已提交
257 258
            break;
        }
A
aliguori 已提交
259 260 261
    }
}

262 263
/* shared migration helpers */

264
void migrate_fd_monitor_suspend(FdMigrationState *s, Monitor *mon)
265
{
266 267
    s->mon = mon;
    if (monitor_suspend(mon) == 0) {
M
malc 已提交
268
        DPRINTF("suspending monitor\n");
269 270
    } else {
        monitor_printf(mon, "terminal does not allow synchronous "
271
                       "migration, continuing detached\n");
272
    }
273 274
}

275 276
void migrate_fd_error(FdMigrationState *s)
{
M
malc 已提交
277
    DPRINTF("setting error state\n");
278
    s->state = MIG_STATE_ERROR;
279
    notifier_list_notify(&migration_state_notifiers, NULL);
280 281 282
    migrate_fd_cleanup(s);
}

283
int migrate_fd_cleanup(FdMigrationState *s)
284
{
285 286
    int ret = 0;

287 288 289
    qemu_set_fd_handler2(s->fd, NULL, NULL, NULL, NULL);

    if (s->file) {
M
malc 已提交
290
        DPRINTF("closing file\n");
291 292 293
        if (qemu_fclose(s->file) != 0) {
            ret = -1;
        }
294
        s->file = NULL;
295 296 297 298
    } else {
        if (s->mon) {
            monitor_resume(s->mon);
        }
299 300
    }

301
    if (s->fd != -1) {
302
        close(s->fd);
303
        s->fd = -1;
304
    }
305

306
    return ret;
307 308 309 310 311 312 313 314 315 316 317 318 319 320 321 322 323
}

void migrate_fd_put_notify(void *opaque)
{
    FdMigrationState *s = opaque;

    qemu_set_fd_handler2(s->fd, NULL, NULL, NULL, NULL);
    qemu_file_put_notify(s->file);
}

ssize_t migrate_fd_put_buffer(void *opaque, const void *data, size_t size)
{
    FdMigrationState *s = opaque;
    ssize_t ret;

    do {
        ret = s->write(s, data, size);
324
    } while (ret == -1 && ((s->get_error(s)) == EINTR));
325 326 327 328

    if (ret == -1)
        ret = -(s->get_error(s));

329
    if (ret == -EAGAIN) {
330
        qemu_set_fd_handler2(s->fd, NULL, NULL, migrate_fd_put_notify, s);
331 332
    } else if (ret < 0) {
        s->state = MIG_STATE_ERROR;
333
        notifier_list_notify(&migration_state_notifiers, NULL);
334
    }
335 336 337 338 339 340 341 342 343 344 345 346 347 348 349

    return ret;
}

void migrate_fd_connect(FdMigrationState *s)
{
    int ret;

    s->file = qemu_fopen_ops_buffered(s,
                                      s->bandwidth_limit,
                                      migrate_fd_put_buffer,
                                      migrate_fd_put_ready,
                                      migrate_fd_wait_for_unfreeze,
                                      migrate_fd_close);

M
malc 已提交
350
    DPRINTF("beginning savevm\n");
351
    ret = qemu_savevm_state_begin(s->mon, s->file, s->mig_state.blk,
L
lirans@il.ibm.com 已提交
352
                                  s->mig_state.shared);
353
    if (ret < 0) {
M
malc 已提交
354
        DPRINTF("failed, %d\n", ret);
355 356 357
        migrate_fd_error(s);
        return;
    }
L
lirans@il.ibm.com 已提交
358
    
359 360 361 362 363 364 365 366
    migrate_fd_put_ready(s);
}

void migrate_fd_put_ready(void *opaque)
{
    FdMigrationState *s = opaque;

    if (s->state != MIG_STATE_ACTIVE) {
M
malc 已提交
367
        DPRINTF("put_ready returning because of non-active state\n");
368 369 370
        return;
    }

M
malc 已提交
371
    DPRINTF("iterate\n");
372
    if (qemu_savevm_state_iterate(s->mon, s->file) == 1) {
373
        int state;
374 375
        int old_vm_running = vm_running;

M
malc 已提交
376
        DPRINTF("done iterating\n");
377
        vm_stop(RSTATE_PRE_MIGRATE);
378

379
        if ((qemu_savevm_state_complete(s->mon, s->file)) < 0) {
380 381 382
            if (old_vm_running) {
                vm_start();
            }
383 384 385 386
            state = MIG_STATE_ERROR;
        } else {
            state = MIG_STATE_COMPLETED;
        }
387 388 389 390 391 392
        if (migrate_fd_cleanup(s) < 0) {
            if (old_vm_running) {
                vm_start();
            }
            state = MIG_STATE_ERROR;
        }
393
        s->state = state;
394
        notifier_list_notify(&migration_state_notifiers, NULL);
395 396 397 398 399 400 401 402 403 404 405 406 407 408 409 410
    }
}

int migrate_fd_get_status(MigrationState *mig_state)
{
    FdMigrationState *s = migrate_to_fms(mig_state);
    return s->state;
}

void migrate_fd_cancel(MigrationState *mig_state)
{
    FdMigrationState *s = migrate_to_fms(mig_state);

    if (s->state != MIG_STATE_ACTIVE)
        return;

M
malc 已提交
411
    DPRINTF("cancelling migration\n");
412 413

    s->state = MIG_STATE_CANCELLED;
414
    notifier_list_notify(&migration_state_notifiers, NULL);
415
    qemu_savevm_state_cancel(s->mon, s->file);
416 417 418 419 420 421 422 423

    migrate_fd_cleanup(s);
}

void migrate_fd_release(MigrationState *mig_state)
{
    FdMigrationState *s = migrate_to_fms(mig_state);

M
malc 已提交
424
    DPRINTF("releasing state\n");
425 426 427
   
    if (s->state == MIG_STATE_ACTIVE) {
        s->state = MIG_STATE_CANCELLED;
428
        notifier_list_notify(&migration_state_notifiers, NULL);
429 430
        migrate_fd_cleanup(s);
    }
431
    g_free(s);
432 433 434 435 436 437 438
}

void migrate_fd_wait_for_unfreeze(void *opaque)
{
    FdMigrationState *s = opaque;
    int ret;

M
malc 已提交
439
    DPRINTF("wait for unfreeze\n");
440 441 442 443 444 445 446 447 448 449 450 451 452 453 454 455
    if (s->state != MIG_STATE_ACTIVE)
        return;

    do {
        fd_set wfds;

        FD_ZERO(&wfds);
        FD_SET(s->fd, &wfds);

        ret = select(s->fd + 1, NULL, &wfds, NULL, NULL);
    } while (ret == -1 && (s->get_error(s)) == EINTR);
}

int migrate_fd_close(void *opaque)
{
    FdMigrationState *s = opaque;
456

457 458 459
    if (s->mon) {
        monitor_resume(s->mon);
    }
460
    qemu_set_fd_handler2(s->fd, NULL, NULL, NULL, NULL);
461 462
    return s->close(s);
}
463 464 465 466 467 468 469 470 471 472 473 474 475 476 477 478 479 480 481

void add_migration_state_change_notifier(Notifier *notify)
{
    notifier_list_add(&migration_state_notifiers, notify);
}

void remove_migration_state_change_notifier(Notifier *notify)
{
    notifier_list_remove(&migration_state_notifiers, notify);
}

int get_migration_state(void)
{
    if (current_migration) {
        return migrate_fd_get_status(current_migration);
    } else {
        return MIG_STATE_ERROR;
    }
}