qemu_migration.c 200.1 KB
Newer Older
1 2 3
/*
 * qemu_migration.c: QEMU migration handling
 *
 * Copyright (C) 2006-2015 Red Hat, Inc.
 *
 * This library is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * This library is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with this library.  If not, see
 * <http://www.gnu.org/licenses/>.
 *
 */

#include <config.h>

J
Ján Tomko 已提交
24 25
#include <netdb.h>
#include <sys/socket.h>
26
#include <sys/time.h>
27
#include <fcntl.h>
28
#include <poll.h>
29 30

#include "qemu_migration.h"
31
#include "qemu_migration_cookie.h"
32 33 34 35
#include "qemu_monitor.h"
#include "qemu_domain.h"
#include "qemu_process.h"
#include "qemu_capabilities.h"
36
#include "qemu_alias.h"
37
#include "qemu_cgroup.h"
38
#include "qemu_hotplug.h"
39
#include "qemu_blockjob.h"
40
#include "qemu_security.h"
41

42
#include "domain_audit.h"
43
#include "virlog.h"
44
#include "virerror.h"
45
#include "viralloc.h"
E
Eric Blake 已提交
46
#include "virfile.h"
47
#include "virnetdevopenvswitch.h"
48
#include "datatypes.h"
49
#include "virfdstream.h"
50
#include "viruuid.h"
51
#include "virtime.h"
52
#include "locking/domain_lock.h"
53
#include "rpc/virnetsocket.h"
54
#include "virstoragefile.h"
M
Martin Kletzander 已提交
55
#include "viruri.h"
56
#include "virhook.h"
57
#include "virstring.h"
58
#include "virtypedparam.h"
M
Michael R. Hines 已提交
59
#include "virprocess.h"
60
#include "nwfilter_conf.h"
61
#include "storage/storage_driver.h"
62 63 64

#define VIR_FROM_THIS VIR_FROM_QEMU

65 66
VIR_LOG_INIT("qemu.qemu_migration");

67 68 69 70 71 72 73 74 75 76 77 78 79
/* String names for the migration job phases.
 * NOTE(review): presumably the order must match the declaration of the
 * qemuMigrationJobPhase enum (not visible here), ending right before
 * QEMU_MIGRATION_PHASE_LAST -- confirm against the header. */
VIR_ENUM_IMPL(qemuMigrationJobPhase, QEMU_MIGRATION_PHASE_LAST,
              "none",
              "perform2",
              "begin3",
              "perform3",
              "perform3_done",
              "confirm3_cancelled",
              "confirm3",
              "prepare",
              "finish2",
              "finish3",
);

80 81 82 83 84
/* String names for the supported migration compression methods.
 * NOTE(review): presumably the order must match the
 * qemuMigrationCompressMethod enum declared elsewhere -- confirm. */
VIR_ENUM_IMPL(qemuMigrationCompressMethod, QEMU_MIGRATION_COMPRESS_LAST,
              "xbzrle",
              "mt",
);

85 86
/* Base name handed to qemuDomainSecretInfoTLSNew() and
 * qemuDomainGetTLSObjects() when setting up TLS for migration. */
#define QEMU_MIGRATION_TLS_ALIAS_BASE "libvirt_migrate"

87

88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110
/* qemuMigrationCheckTLSCreds
 * @driver: pointer to qemu driver
 * @vm: domain object
 * @asyncJob: migration job to join
 *
 * Query the migration parameters looking for the 'tls-creds' parameter.
 * If found, then we can support setting or clearing the parameters and thus
 * can support TLS for migration.
 *
 * Any alias stored in the private domain structure by an earlier call is
 * released before the freshly queried value (which may be NULL) replaces
 * it, so repeated calls do not leak the previous string.
 *
 * Returns 0 if we were able to successfully fetch the params and
 * additionally if the tls-creds parameter exists, saves it in the
 * private domain structure. Returns -1 on failure.
 */
static int
qemuMigrationCheckTLSCreds(virQEMUDriverPtr driver,
                           virDomainObjPtr vm,
                           qemuDomainAsyncJob asyncJob)
{
    int ret = -1;
    qemuDomainObjPrivatePtr priv = vm->privateData;
    qemuMonitorMigrationParams migParams = { 0 };

    if (qemuDomainObjEnterMonitorAsync(driver, vm, asyncJob) < 0)
        return -1;

    if (qemuMonitorGetMigrationParams(priv->mon, &migParams) < 0)
        goto cleanup;

    /* Drop a stale alias left by a previous query; VIR_STEAL_PTR below
     * simply overwrites the destination pointer. */
    VIR_FREE(priv->migTLSAlias);

    /* NB: Could steal NULL pointer too! Let caller decide what to do. */
    VIR_STEAL_PTR(priv->migTLSAlias, migParams.migrateTLSAlias);

    ret = 0;

 cleanup:
    /* The monitor must be left even when the query failed. */
    if (qemuDomainObjExitMonitor(driver, vm) < 0)
        ret = -1;

    qemuMigrationParamsClear(&migParams);

    return ret;
}


/* qemuMigrationCheckSetupTLS
 * @conn: Connection pointer
 * @driver: pointer to qemu driver
 * @cfg: configuration pointer
 * @vm: domain object
 * @asyncJob: migration job to join
 *
 * Verify that a TLS migration can be performed and prepare for it. The
 * caller is expected to have already decided that TLS is wanted (e.g. it
 * saw the VIR_MIGRATE_TLS flag).
 *
 * The checks are, in order: qemu.conf must provide
 * "migrate_tls_x509_cert_dir", the migration parameters must be
 * retrievable, and the "tls-creds" parameter must have been found by
 * that query. If a secret UUID is configured, the matching secret info
 * is created and stored in the domain private data.
 *
 * Returns 0 on success, -1 on error/failure
 */
static int
qemuMigrationCheckSetupTLS(virConnectPtr conn,
                           virQEMUDriverPtr driver,
                           virQEMUDriverConfigPtr cfg,
                           virDomainObjPtr vm,
                           qemuDomainAsyncJob asyncJob)
{
    qemuDomainObjPrivatePtr priv = vm->privateData;

    if (!cfg->migrateTLSx509certdir) {
        virReportError(VIR_ERR_OPERATION_INVALID, "%s",
                       _("host migration TLS directory not configured"));
        return -1;
    }

    if (qemuMigrationCheckTLSCreds(driver, vm, asyncJob) < 0)
        return -1;

    if (!priv->migTLSAlias) {
        virReportError(VIR_ERR_OPERATION_UNSUPPORTED, "%s",
                       _("TLS migration is not supported with this "
                         "QEMU binary"));
        return -1;
    }

    /* Without a configured secret there is nothing more to set up. */
    if (!cfg->migrateTLSx509secretUUID)
        return 0;

    /* Fetch and remember the secret now, while the connection is at hand. */
    priv->migSecinfo = qemuDomainSecretInfoTLSNew(conn, priv,
                                                  QEMU_MIGRATION_TLS_ALIAS_BASE,
                                                  cfg->migrateTLSx509secretUUID);
    if (!priv->migSecinfo)
        return -1;

    return 0;
}


/* qemuMigrationAddTLSObjects
 * @driver: pointer to qemu driver
 * @vm: domain object
 * @cfg: configuration pointer
 * @tlsListen: server or client
 * @asyncJob: Migration job to join
 * @tlsAlias: alias to be generated for TLS object
 * @secAlias: alias to be generated for a secinfo object
 * @migParams: migration parameters to set
 *
 * Build the TLS (and optional secret) object properties, add the objects
 * to the domain and record a copy of the TLS alias in @migParams.
 *
 * Returns 0 on success, -1 on failure
 */
static int
qemuMigrationAddTLSObjects(virQEMUDriverPtr driver,
                           virDomainObjPtr vm,
                           virQEMUDriverConfigPtr cfg,
                           bool tlsListen,
                           qemuDomainAsyncJob asyncJob,
                           char **tlsAlias,
                           char **secAlias,
                           qemuMonitorMigrationParamsPtr migParams)
{
    virJSONValuePtr secObjProps = NULL;
    virJSONValuePtr tlsObjProps = NULL;
    qemuDomainObjPrivatePtr priv = vm->privateData;

    if (qemuDomainGetTLSObjects(priv->qemuCaps, priv->migSecinfo,
                                cfg->migrateTLSx509certdir, tlsListen,
                                cfg->migrateTLSx509verify,
                                QEMU_MIGRATION_TLS_ALIAS_BASE,
                                &tlsObjProps, tlsAlias,
                                &secObjProps, secAlias) < 0)
        goto failure;

    /* Remove any objects of the same name that may still be around,
     * e.g. because an earlier cleanup did not finish (source and
     * destination share the alias) or some error path was taken before
     * the perform phase. The result is deliberately not checked. */
    qemuDomainDelTLSObjects(driver, vm, asyncJob, *secAlias, *tlsAlias);

    /* Add the objects, then remember the alias in the migration params;
     * the copy is attempted only if adding succeeded. */
    if (qemuDomainAddTLSObjects(driver, vm, asyncJob, *secAlias, &secObjProps,
                                *tlsAlias, &tlsObjProps) < 0 ||
        VIR_STRDUP(migParams->migrateTLSAlias, *tlsAlias) < 0)
        goto failure;

    return 0;

 failure:
    virJSONValueFree(tlsObjProps);
    virJSONValueFree(secObjProps);
    return -1;
}


240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255
/* Remember the current domain state in the private data so that it can
 * be consulted after a failed migration. */
static void
qemuMigrationStoreDomainState(virDomainObjPtr vm)
{
    qemuDomainObjPrivatePtr priv = vm->privateData;
    virDomainState current = virDomainObjGetState(vm, NULL);

    priv->preMigrationState = current;

    VIR_DEBUG("Storing pre-migration state=%d domain=%p",
              priv->preMigrationState, vm);
}

/* Try to bring the domain back to the state it had before migration.
 *
 * CPUs are restarted only when the domain is currently paused (for a
 * reason other than a failed post-copy) and it was running before the
 * migration started. The stored pre-migration state is reset in every
 * case.
 *
 * Returns true if the domain was resumed, false otherwise */
static bool
qemuMigrationRestoreDomainState(virConnectPtr conn, virDomainObjPtr vm)
{
    virQEMUDriverPtr driver = conn->privateData;
    qemuDomainObjPrivatePtr priv = vm->privateData;
    int reason;
    virDomainState state = virDomainObjGetState(vm, &reason);
    bool resumed = false;

    VIR_DEBUG("driver=%p, vm=%p, pre-mig-state=%s, state=%s, reason=%s",
              driver, vm,
              virDomainStateTypeToString(priv->preMigrationState),
              virDomainStateTypeToString(state),
              virDomainStateReasonToString(state, reason));

    /* Resuming a domain that was running is the only restore that is
     * considered safe to attempt. */
    if (state == VIR_DOMAIN_PAUSED &&
        reason != VIR_DOMAIN_PAUSED_POSTCOPY_FAILED &&
        priv->preMigrationState == VIR_DOMAIN_RUNNING) {

        VIR_DEBUG("Restoring pre-migration state due to migration error");

        /* We only get here after a failure, so start the guest again. */
        if (qemuProcessStartCPUs(driver, vm, conn,
                                 VIR_DOMAIN_RUNNING_MIGRATION_CANCELED,
                                 QEMU_ASYNC_JOB_MIGRATION_OUT) < 0) {
            /* An error has already been reported by the caller's failure
             * path; keep it intact and only leave a trace in the logs. */
            VIR_ERROR(_("Failed to resume guest %s after failure"), vm->def->name);
        } else {
            resumed = true;
        }
    }

    priv->preMigrationState = VIR_DOMAIN_NOSTATE;
    return resumed;
}

294 295 296 297 298 299 300 301 302 303 304 305 306 307 308 309 310 311 312 313 314 315 316 317 318 319 320 321 322 323 324 325 326 327 328 329 330 331 332 333 334 335 336 337 338 339 340 341 342 343 344 345 346 347

/* Create the storage volume backing @disk with the given @capacity,
 * unless a volume of that name already exists in the pool.
 *
 * File backed disks are mapped to a pool by the directory part of their
 * path; volume backed disks name their pool and volume directly. Network
 * disks and file disks without a source are skipped. Other disk types
 * are rejected with an error.
 *
 * Returns 0 on success (including the skipped cases), -1 on failure.
 */
static int
qemuMigrationPrecreateDisk(virConnectPtr conn,
                           virDomainDiskDefPtr disk,
                           unsigned long long capacity)
{
    virBuffer xml = VIR_BUFFER_INITIALIZER;
    virStoragePoolPtr pool = NULL;
    virStorageVolPtr vol = NULL;
    char *poolPath = NULL;
    char *volName = NULL;
    char *volXML = NULL;
    const char *format = NULL;
    unsigned int createFlags = 0;
    int ret = -1;

    VIR_DEBUG("Precreate disk type=%s", virStorageTypeToString(disk->src->type));

    switch ((virStorageType) disk->src->type) {
    case VIR_STORAGE_TYPE_FILE:
        if (!virDomainDiskGetSource(disk)) {
            VIR_DEBUG("Dropping sourceless disk '%s'",
                      disk->dst);
            return 0;
        }

        if (VIR_STRDUP(poolPath, disk->src->path) < 0)
            goto cleanup;

        volName = strrchr(poolPath, '/');
        if (!volName) {
            virReportError(VIR_ERR_INVALID_ARG,
                           _("malformed disk path: %s"),
                           disk->src->path);
            goto cleanup;
        }

        /* Cut the copy at the last slash: the directory part stays in
         * poolPath, the file name that follows is the volume name. */
        *volName++ = '\0';

        if (!(pool = storagePoolLookupByTargetPath(conn, poolPath)))
            goto cleanup;
        break;

    case VIR_STORAGE_TYPE_VOLUME:
        if (!(pool = virStoragePoolLookupByName(conn, disk->src->srcpool->pool)))
            goto cleanup;
        volName = disk->src->srcpool->volume;
        break;

    case VIR_STORAGE_TYPE_NETWORK:
        VIR_DEBUG("Skipping creation of network disk '%s'",
                  disk->dst);
        return 0;

    case VIR_STORAGE_TYPE_BLOCK:
    case VIR_STORAGE_TYPE_DIR:
    case VIR_STORAGE_TYPE_NONE:
    case VIR_STORAGE_TYPE_LAST:
        virReportError(VIR_ERR_INTERNAL_ERROR,
                       _("cannot precreate storage for disk type '%s'"),
                       virStorageTypeToString(disk->src->type));
        goto cleanup;
    }

    /* Only the file and volume cases get here, both with a pool. */
    format = virStorageFileFormatTypeToString(disk->src->format);
    if (disk->src->format == VIR_STORAGE_FILE_QCOW2)
        createFlags |= VIR_STORAGE_VOL_CREATE_PREALLOC_METADATA;

    vol = virStorageVolLookupByName(pool, volName);
    if (vol) {
        VIR_DEBUG("Skipping creation of already existing volume of name '%s'",
                  volName);
        ret = 0;
        goto cleanup;
    }

    /* Assemble the volume XML passed to virStorageVolCreateXML(). */
    virBufferAddLit(&xml, "<volume>\n");
    virBufferAdjustIndent(&xml, 2);
    virBufferEscapeString(&xml, "<name>%s</name>\n", volName);
    virBufferAsprintf(&xml, "<capacity>%llu</capacity>\n", capacity);
    virBufferAddLit(&xml, "<target>\n");
    virBufferAdjustIndent(&xml, 2);
    virBufferAsprintf(&xml, "<format type='%s'/>\n", format);
    virBufferAdjustIndent(&xml, -2);
    virBufferAddLit(&xml, "</target>\n");
    virBufferAdjustIndent(&xml, -2);
    virBufferAddLit(&xml, "</volume>\n");

    volXML = virBufferContentAndReset(&xml);
    if (!volXML) {
        virReportError(VIR_ERR_INTERNAL_ERROR, "%s",
                       _("unable to create volume XML"));
        goto cleanup;
    }

    vol = virStorageVolCreateXML(pool, volXML, createFlags);
    if (!vol)
        goto cleanup;

    ret = 0;

 cleanup:
    VIR_FREE(poolPath);
    VIR_FREE(volXML);
    virObjectUnref(vol);
    virObjectUnref(pool);
    return ret;
}

400 401 402 403 404 405 406 407 408 409 410 411 412 413 414 415 416 417
/* Decide whether @disk takes part in storage migration.
 *
 * With a non-empty @migrate_disks list, the disk is migrated exactly
 * when its target name (disk->dst) appears in the list. With an empty
 * list the default applies: migrate disks that are neither shared nor
 * read-only and that have a source.
 */
static bool
qemuMigrateDisk(virDomainDiskDef const *disk,
                size_t nmigrate_disks, const char **migrate_disks)
{
    size_t idx;

    if (nmigrate_disks == 0) {
        /* No explicit list: fall back to the default policy. */
        if (disk->src->shared || disk->src->readonly)
            return false;

        return !virStorageSourceIsEmpty(disk->src);
    }

    for (idx = 0; idx < nmigrate_disks; idx++) {
        if (STREQ(disk->dst, migrate_disks[idx]))
            return true;
    }

    return false;
}

421 422 423 424 425

static int
qemuMigrationPrecreateStorage(virConnectPtr conn,
                              virQEMUDriverPtr driver ATTRIBUTE_UNUSED,
                              virDomainObjPtr vm,
426 427
                              qemuMigrationCookieNBDPtr nbd,
                              size_t nmigrate_disks,
428 429
                              const char **migrate_disks,
                              bool incremental)
430 431 432 433 434 435 436 437 438 439 440
{
    int ret = -1;
    size_t i = 0;

    if (!nbd || !nbd->ndisks)
        return 0;

    for (i = 0; i < nbd->ndisks; i++) {
        virDomainDiskDefPtr disk;
        const char *diskSrcPath;

441
        VIR_DEBUG("Looking up disk target '%s' (capacity=%llu)",
442 443
                  nbd->disks[i].target, nbd->disks[i].capacity);

444 445
        if (!(disk = virDomainDiskByName(vm->def, nbd->disks[i].target,
                                         false))) {
446 447 448 449 450 451 452 453
            virReportError(VIR_ERR_INTERNAL_ERROR,
                           _("unable to find disk by target: %s"),
                           nbd->disks[i].target);
            goto cleanup;
        }

        diskSrcPath = virDomainDiskGetSource(disk);

454 455
        /* Skip disks we don't want to migrate and already existing disks. */
        if (!qemuMigrateDisk(disk, nmigrate_disks, migrate_disks) ||
456 457 458 459
            (diskSrcPath && virFileExists(diskSrcPath))) {
            continue;
        }

460 461 462 463 464 465 466
        if (incremental) {
            virReportError(VIR_ERR_OPERATION_UNSUPPORTED, "%s",
                           _("pre-creation of storage targets for incremental "
                             "storage migration is not supported"));
            goto cleanup;
        }

467 468 469 470 471 472 473 474 475 476 477 478
        VIR_DEBUG("Proceeding with disk source %s", NULLSTR(diskSrcPath));

        if (qemuMigrationPrecreateDisk(conn, disk, nbd->disks[i].capacity) < 0)
            goto cleanup;
    }

    ret = 0;
 cleanup:
    return ret;
}


479 480 481 482 483 484 485 486 487 488 489 490 491 492
/**
 * qemuMigrationStartNBDServer:
 * @driver: qemu driver
 * @vm: domain
 *
 * Starts NBD server. This is a newer method to copy
 * storage during migration than using 'blk' and 'inc'
 * arguments in 'migrate' monitor command.
 * Error is reported here.
 *
 * Returns 0 on success, -1 otherwise.
 */
static int
qemuMigrationStartNBDServer(virQEMUDriverPtr driver,
J
Ján Tomko 已提交
493
                            virDomainObjPtr vm,
494 495
                            const char *listenAddr,
                            size_t nmigrate_disks,
496 497
                            const char **migrate_disks,
                            int nbdPort)
498 499 500 501 502 503 504
{
    int ret = -1;
    qemuDomainObjPrivatePtr priv = vm->privateData;
    unsigned short port = 0;
    char *diskAlias = NULL;
    size_t i;

505 506 507 508 509 510
    if (nbdPort < 0 || nbdPort > USHRT_MAX) {
        virReportError(VIR_ERR_INVALID_ARG, "%s",
                       _("nbd port must be in range 0-65535"));
        return -1;
    }

511 512 513
    for (i = 0; i < vm->def->ndisks; i++) {
        virDomainDiskDefPtr disk = vm->def->disks[i];

514 515
        /* check whether disk should be migrated */
        if (!qemuMigrateDisk(disk, nmigrate_disks, migrate_disks))
516 517
            continue;

518
        if (disk->src->readonly || virStorageSourceIsEmpty(disk->src)) {
519
            virReportError(VIR_ERR_OPERATION_UNSUPPORTED,
520 521
                           _("Cannot migrate empty or read-only disk %s"),
                           disk->dst);
522 523 524
            goto cleanup;
        }

525
        VIR_FREE(diskAlias);
526
        if (!(diskAlias = qemuAliasFromDisk(disk)))
527 528 529 530 531 532
            goto cleanup;

        if (qemuDomainObjEnterMonitorAsync(driver, vm,
                                           QEMU_ASYNC_JOB_MIGRATION_IN) < 0)
            goto cleanup;

533 534 535 536 537 538 539 540
        if (port == 0) {
            if (nbdPort)
                port = nbdPort;
            else if (virPortAllocatorAcquire(driver->migrationPorts, &port) < 0)
                goto exit_monitor;

            if (qemuMonitorNBDServerStart(priv->mon, listenAddr, port) < 0)
                goto exit_monitor;
541 542
        }

543 544 545
        if (qemuMonitorNBDServerAdd(priv->mon, diskAlias, true) < 0)
            goto exit_monitor;
        if (qemuDomainObjExitMonitor(driver, vm) < 0)
546 547 548 549 550 551
            goto cleanup;
    }

    priv->nbdPort = port;
    ret = 0;

552
 cleanup:
553
    VIR_FREE(diskAlias);
554
    if (ret < 0 && nbdPort == 0)
555
        virPortAllocatorRelease(driver->migrationPorts, port);
556
    return ret;
557 558 559 560

 exit_monitor:
    ignore_value(qemuDomainObjExitMonitor(driver, vm));
    goto cleanup;
561 562
}

563 564 565 566 567 568 569 570 571 572 573 574 575 576 577 578 579 580 581 582 583 584 585 586 587 588 589

/* Stop the NBD server used for storage migration and give back its port.
 *
 * Nothing is done when the migration cookie carries no NBD data. A
 * failure to stop the server is only logged as a warning.
 *
 * Returns 0 on success, -1 if the monitor could not be entered or left.
 */
static int
qemuMigrationStopNBDServer(virQEMUDriverPtr driver,
                           virDomainObjPtr vm,
                           qemuMigrationCookiePtr mig)
{
    qemuDomainObjPrivatePtr priv;

    if (!mig->nbd)
        return 0;

    priv = vm->privateData;

    if (qemuDomainObjEnterMonitorAsync(driver, vm,
                                       QEMU_ASYNC_JOB_MIGRATION_IN) < 0)
        return -1;

    if (qemuMonitorNBDServerStop(priv->mon) < 0)
        VIR_WARN("Unable to stop NBD server");

    if (qemuDomainObjExitMonitor(driver, vm) < 0)
        return -1;

    virPortAllocatorRelease(driver->migrationPorts, priv->nbdPort);
    priv->nbdPort = 0;

    return 0;
}


/**
590
 * qemuMigrationDriveMirrorReady:
591 592 593 594 595 596 597 598 599 600 601 602
 * @driver: qemu driver
 * @vm: domain
 *
 * Check the status of all drive-mirrors started by
 * qemuMigrationDriveMirror. Any pending block job events
 * for the mirrored disks will be processed.
 *
 * Returns 1 if all mirrors are "ready",
 *         0 if some mirrors are still performing initial sync,
 *        -1 on error.
 */
static int
603
qemuMigrationDriveMirrorReady(virQEMUDriverPtr driver,
604 605
                              virDomainObjPtr vm,
                              qemuDomainAsyncJob asyncJob)
606 607
{
    size_t i;
608 609
    size_t notReady = 0;
    int status;
610 611 612

    for (i = 0; i < vm->def->ndisks; i++) {
        virDomainDiskDefPtr disk = vm->def->disks[i];
613
        qemuDomainDiskPrivatePtr diskPriv = QEMU_DOMAIN_DISK_PRIVATE(disk);
614

615
        if (!diskPriv->migrating)
616 617
            continue;

618
        status = qemuBlockJobUpdate(driver, vm, asyncJob, disk);
619
        if (status == VIR_DOMAIN_BLOCK_JOB_FAILED) {
620 621 622 623 624
            virReportError(VIR_ERR_OPERATION_FAILED,
                           _("migration of disk %s failed"),
                           disk->dst);
            return -1;
        }
625 626 627

        if (disk->mirrorState != VIR_DOMAIN_DISK_MIRROR_STATE_READY)
            notReady++;
628 629
    }

630 631 632 633 634 635 636
    if (notReady) {
        VIR_DEBUG("Waiting for %zu disk mirrors to get ready", notReady);
        return 0;
    } else {
        VIR_DEBUG("All disk mirrors are ready");
        return 1;
    }
637 638 639
}


640 641 642 643
/*
 * If @check is true, the function will report an error and return a different
 * code in case a block job fails. This way we can properly abort migration in
 * case some block jobs failed once all memory has already been transferred.
644
 *
645 646 647 648
 * Returns 1 if all mirrors are gone,
 *         0 if some mirrors are still active,
 *         -1 some mirrors failed but some are still active,
 *         -2 all mirrors are gone but some of them failed.
649 650
 */
static int
651
qemuMigrationDriveMirrorCancelled(virQEMUDriverPtr driver,
652
                                  virDomainObjPtr vm,
653
                                  qemuDomainAsyncJob asyncJob,
654
                                  bool check)
655
{
656 657
    size_t i;
    size_t active = 0;
658
    size_t completed = 0;
659 660
    int status;
    bool failed = false;
661

662
 retry:
663 664 665
    for (i = 0; i < vm->def->ndisks; i++) {
        virDomainDiskDefPtr disk = vm->def->disks[i];
        qemuDomainDiskPrivatePtr diskPriv = QEMU_DOMAIN_DISK_PRIVATE(disk);
666

667 668
        if (!diskPriv->migrating)
            continue;
669

670
        status = qemuBlockJobUpdate(driver, vm, asyncJob, disk);
671 672 673
        switch (status) {
        case VIR_DOMAIN_BLOCK_JOB_FAILED:
            if (check) {
674
                virReportError(VIR_ERR_OPERATION_FAILED,
675
                               _("migration of disk %s failed"),
676
                               disk->dst);
677
                failed = true;
678
            }
M
Marc Hartmayer 已提交
679
            ATTRIBUTE_FALLTHROUGH;
680 681
        case VIR_DOMAIN_BLOCK_JOB_CANCELED:
        case VIR_DOMAIN_BLOCK_JOB_COMPLETED:
682
            qemuBlockJobSyncEnd(driver, vm, asyncJob, disk);
683 684
            diskPriv->migrating = false;
            break;
685

686 687
        default:
            active++;
688
        }
689 690 691 692 693 694 695 696 697 698 699 700 701

        if (status == VIR_DOMAIN_BLOCK_JOB_COMPLETED)
            completed++;
    }

    /* Updating completed block job drops the lock thus we have to recheck
     * block jobs for disks that reside before the disk(s) with completed
     * block job.
     */
    if (completed > 0) {
        completed = 0;
        active = 0;
        goto retry;
702
    }
703

704 705 706 707 708 709 710 711 712 713 714 715 716 717 718 719
    if (failed) {
        if (active) {
            VIR_DEBUG("Some disk mirrors failed; still waiting for %zu "
                      "disk mirrors to finish", active);
            return -1;
        } else {
            VIR_DEBUG("All disk mirrors are gone; some of them failed");
            return -2;
        }
    } else {
        if (active) {
            VIR_DEBUG("Waiting for %zu disk mirrors to finish", active);
            return 0;
        } else {
            VIR_DEBUG("All disk mirrors are gone");
            return 1;
720
        }
721
    }
722
}
723 724


725 726 727 728 729 730 731 732 733
/*
 * Ask qemu to cancel the block job of a single migrating @disk.
 *
 * The job state is refreshed first; a cancel request is sent over the
 * monitor only if the job has neither completed, failed nor been
 * cancelled already.
 *
 * Returns 0 on success,
 *         1 when job is already completed or it failed and failNoJob is false,
 *         -1 on error or when job failed and failNoJob is true.
 */
static int
qemuMigrationCancelOneDriveMirror(virQEMUDriverPtr driver,
                                  virDomainObjPtr vm,
                                  virDomainDiskDefPtr disk,
                                  bool failNoJob,
                                  qemuDomainAsyncJob asyncJob)
{
    qemuDomainObjPrivatePtr priv = vm->privateData;
    char *alias = NULL;
    int status;
    int ret = -1;

    status = qemuBlockJobUpdate(driver, vm, asyncJob, disk);

    if (status == VIR_DOMAIN_BLOCK_JOB_FAILED ||
        status == VIR_DOMAIN_BLOCK_JOB_CANCELED) {
        if (!failNoJob)
            return 1;

        virReportError(VIR_ERR_OPERATION_FAILED,
                       _("migration of disk %s failed"),
                       disk->dst);
        return -1;
    }

    if (status == VIR_DOMAIN_BLOCK_JOB_COMPLETED)
        return 1;

    alias = qemuAliasFromDisk(disk);
    if (!alias)
        return -1;

    if (qemuDomainObjEnterMonitorAsync(driver, vm, asyncJob) >= 0) {
        int cancelRet = qemuMonitorBlockJobCancel(priv->mon, alias);

        /* The monitor has to be left before the cancel result counts. */
        if (qemuDomainObjExitMonitor(driver, vm) >= 0 && cancelRet >= 0)
            ret = 0;
    }

    VIR_FREE(alias);
    return ret;
}


/**
 * qemuMigrationCancelDriveMirror:
 * @driver: qemu driver
 * @vm: domain
782
 * @check: if true report an error when some of the mirrors fails
783 784 785 786 787 788 789 790 791
 *
 * Cancel all drive-mirrors started by qemuMigrationDriveMirror.
 * Any pending block job events for the affected disks will be
 * processed.
 *
 * Returns 0 on success, -1 otherwise.
 */
static int
qemuMigrationCancelDriveMirror(virQEMUDriverPtr driver,
792
                               virDomainObjPtr vm,
793
                               bool check,
794 795
                               qemuDomainAsyncJob asyncJob,
                               virConnectPtr dconn)
796
{
797
    virErrorPtr err = NULL;
798
    int ret = -1;
799
    size_t i;
800 801 802 803
    int rv;
    bool failed = false;

    VIR_DEBUG("Cancelling drive mirrors for domain %s", vm->def->name);
804 805 806

    for (i = 0; i < vm->def->ndisks; i++) {
        virDomainDiskDefPtr disk = vm->def->disks[i];
807
        qemuDomainDiskPrivatePtr diskPriv = QEMU_DOMAIN_DISK_PRIVATE(disk);
808

809
        if (!diskPriv->migrating)
810 811
            continue;

812 813
        rv = qemuMigrationCancelOneDriveMirror(driver, vm, disk,
                                               check, asyncJob);
814 815 816 817 818 819
        if (rv != 0) {
            if (rv < 0) {
                if (!err)
                    err = virSaveLastError();
                failed = true;
            }
820
            qemuBlockJobSyncEnd(driver, vm, asyncJob, disk);
821 822 823 824
            diskPriv->migrating = false;
        }
    }

825 826
    while ((rv = qemuMigrationDriveMirrorCancelled(driver, vm, asyncJob,
                                                   check)) != 1) {
827 828 829 830 831 832 833
        if (check && !failed &&
            dconn && virConnectIsAlive(dconn) <= 0) {
            virReportError(VIR_ERR_OPERATION_FAILED, "%s",
                           _("Lost connection to destination host"));
            failed = true;
        }

834 835 836 837
        if (rv < 0) {
            failed = true;
            if (rv == -2)
                break;
838
        }
839

840 841 842 843 844
        if (failed && !err)
            err = virSaveLastError();

        if (virDomainObjWait(vm) < 0)
            goto cleanup;
845 846
    }

847 848 849
    ret = failed ? -1 : 0;

 cleanup:
850 851 852 853 854
    if (err) {
        virSetError(err);
        virFreeError(err);
    }
    return ret;
855 856 857
}


858 859 860 861 862 863
/**
 * qemuMigrationDriveMirror:
 * @driver: qemu driver
 * @vm: domain
 * @mig: migration cookie
 * @host: where are we migrating to
 * @speed: bandwidth limit in MiB/s
 * @migrate_flags: migrate monitor command flags
 * @nmigrate_disks: number of entries in @migrate_disks
 * @migrate_disks: disk selection handed to qemuMigrateDisk to decide which
 *                 disks get mirrored
 * @dconn: connection to the destination; when non-NULL the wait is aborted
 *         as soon as the connection is no longer alive
 *
 * Run drive-mirror to feed NBD server running on dst and wait
 * till the process switches into another phase where writes go
 * simultaneously to both source and destination. On success,
 * update @migrate_flags so we don't tell 'migrate' command
 * to do the very same operation. On failure, the caller is
 * expected to call qemuMigrationCancelDriveMirror to stop all
 * running mirrors.
 *
 * The NBD port is taken from @mig and reset to 0 there so that it is not
 * propagated back to the destination.
 *
 * Returns 0 on success (@migrate_flags updated),
 *        -1 otherwise.
 */
static int
qemuMigrationDriveMirror(virQEMUDriverPtr driver,
                         virDomainObjPtr vm,
                         qemuMigrationCookiePtr mig,
                         const char *host,
                         unsigned long speed,
                         unsigned int *migrate_flags,
                         size_t nmigrate_disks,
                         const char **migrate_disks,
                         virConnectPtr dconn)
{
    qemuDomainObjPrivatePtr priv = vm->privateData;
    int ret = -1;
    int port;
    size_t i;
    char *diskAlias = NULL;
    char *nbd_dest = NULL;
    char *hoststr = NULL;
    unsigned long long mirror_speed = speed;
    unsigned int mirror_flags = VIR_DOMAIN_BLOCK_REBASE_REUSE_EXT;
    int rv;
    virQEMUDriverConfigPtr cfg = virQEMUDriverGetConfig(driver);

    VIR_DEBUG("Starting drive mirrors for domain %s", vm->def->name);

    /* @speed is in MiB/s and is converted to bytes/s below; refuse values
     * that would not survive the shift. */
    if (mirror_speed > LLONG_MAX >> 20) {
        /* Report the first rejected value so that "less than" is exact, and
         * pass an unsigned long long to match the %llu conversion. */
        virReportError(VIR_ERR_OVERFLOW,
                       _("bandwidth must be less than %llu"),
                       (LLONG_MAX >> 20) + 1ULL);
        goto cleanup;
    }
    mirror_speed <<= 20;

    /* steal NBD port and thus prevent its propagation back to destination */
    port = mig->nbd->port;
    mig->nbd->port = 0;

    /* escape literal IPv6 address */
    if (strchr(host, ':')) {
        if (virAsprintf(&hoststr, "[%s]", host) < 0)
            goto cleanup;
    } else if (VIR_STRDUP(hoststr, host) < 0) {
        goto cleanup;
    }

    if (*migrate_flags & QEMU_MONITOR_MIGRATE_NON_SHARED_INC)
        mirror_flags |= VIR_DOMAIN_BLOCK_REBASE_SHALLOW;

    for (i = 0; i < vm->def->ndisks; i++) {
        virDomainDiskDefPtr disk = vm->def->disks[i];
        qemuDomainDiskPrivatePtr diskPriv = QEMU_DOMAIN_DISK_PRIVATE(disk);
        int mon_ret;

        /* check whether disk should be migrated */
        if (!qemuMigrateDisk(disk, nmigrate_disks, migrate_disks))
            continue;

        if (!(diskAlias = qemuAliasFromDisk(disk)) ||
            (virAsprintf(&nbd_dest, "nbd:%s:%d:exportname=%s",
                         hoststr, port, diskAlias) < 0))
            goto cleanup;

        if (qemuDomainObjEnterMonitorAsync(driver, vm,
                                           QEMU_ASYNC_JOB_MIGRATION_OUT) < 0)
            goto cleanup;

        qemuBlockJobSyncBegin(disk);
        /* Force "raw" format for NBD export */
        mon_ret = qemuMonitorDriveMirror(priv->mon, diskAlias, nbd_dest,
                                         "raw", mirror_speed, 0, 0, mirror_flags);
        VIR_FREE(diskAlias);
        VIR_FREE(nbd_dest);

        /* The monitor must be left even when the command failed; undo the
         * block job sync started above if either step went wrong. */
        if (qemuDomainObjExitMonitor(driver, vm) < 0 || mon_ret < 0) {
            qemuBlockJobSyncEnd(driver, vm, QEMU_ASYNC_JOB_MIGRATION_OUT, disk);
            goto cleanup;
        }
        diskPriv->migrating = true;

        if (virDomainSaveStatus(driver->xmlopt, cfg->stateDir, vm, driver->caps) < 0) {
            VIR_WARN("Failed to save status on vm %s", vm->def->name);
            goto cleanup;
        }
    }

    /* Wait until every started mirror is reported ready, bailing out on
     * mirror failure, a client abort request or a lost destination. */
    while ((rv = qemuMigrationDriveMirrorReady(driver, vm,
                                               QEMU_ASYNC_JOB_MIGRATION_OUT)) != 1) {
        if (rv < 0)
            goto cleanup;

        if (priv->job.abortJob) {
            priv->job.current->status = QEMU_DOMAIN_JOB_STATUS_CANCELED;
            virReportError(VIR_ERR_OPERATION_ABORTED, _("%s: %s"),
                           qemuDomainAsyncJobTypeToString(priv->job.asyncJob),
                           _("canceled by client"));
            goto cleanup;
        }

        if (dconn && virConnectIsAlive(dconn) <= 0) {
            virReportError(VIR_ERR_OPERATION_FAILED, "%s",
                           _("Lost connection to destination host"));
            goto cleanup;
        }

        if (virDomainObjWait(vm) < 0)
            goto cleanup;
    }

    qemuMigrationFetchMirrorStats(driver, vm, QEMU_ASYNC_JOB_MIGRATION_OUT,
                                  priv->job.current);

    /* Okay, all disks are ready. Modify migrate_flags */
    *migrate_flags &= ~(QEMU_MONITOR_MIGRATE_NON_SHARED_DISK |
                        QEMU_MONITOR_MIGRATE_NON_SHARED_INC);
    ret = 0;

 cleanup:
    virObjectUnref(cfg);
    VIR_FREE(diskAlias);
    VIR_FREE(nbd_dest);
    VIR_FREE(hoststr);
    return ret;
}
1001

1002

1003 1004 1005 1006 1007 1008 1009 1010 1011 1012 1013 1014 1015 1016 1017 1018 1019 1020 1021 1022 1023 1024 1025 1026 1027 1028 1029 1030
/**
 * qemuMigrationIsAllowedHostdev:
 * @def: domain definition
 *
 * Checks that @def does not contain any host devices unsupported across
 * migrations. Only USB subsystem host devices are accepted; an error is
 * reported for the first device of any other kind.
 *
 * Returns true if the vm is allowed to migrate, false otherwise.
 */
static bool
qemuMigrationIsAllowedHostdev(const virDomainDef *def)
{
    size_t idx = 0;

    while (idx < def->nhostdevs) {
        virDomainHostdevDefPtr dev = def->hostdevs[idx++];
        bool isUSB = dev->mode == VIR_DOMAIN_HOSTDEV_MODE_SUBSYS &&
                     dev->source.subsys.type == VIR_DOMAIN_HOSTDEV_SUBSYS_TYPE_USB;

        if (isUSB)
            continue;

        /* anything that is not a USB host device blocks migration */
        virReportError(VIR_ERR_OPERATION_INVALID, "%s",
                       _("domain has assigned non-USB host devices"));
        return false;
    }

    return true;
}


1031 1032 1033 1034 1035 1036 1037 1038 1039 1040 1041 1042 1043 1044
/**
 * qemuMigrationIsAllowed:
 * @driver: qemu driver struct
 * @vm: domain object
 * @remote: migration is remote
 * @flags: migration flags (see struct virDomainMigrateFlags)
 *
 * Validates that the configuration of @vm can be migrated in various
 * situations. If @remote is true, the migration happens to remote host. @flags
 * is used to check various special migration types according to the request.
 *
 * Returns true if migration is supported. Reports libvirt error and returns
 * false otherwise.
 */
1045
bool
1046 1047 1048
qemuMigrationIsAllowed(virQEMUDriverPtr driver,
                       virDomainObjPtr vm,
                       bool remote,
1049
                       unsigned int flags)
1050
{
1051
    int nsnapshots;
1052
    int pauseReason;
1053
    size_t i;
1054

1055 1056 1057 1058 1059
    /* perform these checks only when migrating to remote hosts */
    if (remote) {
        nsnapshots = virDomainSnapshotObjListNum(vm->snapshots, NULL, 0);
        if (nsnapshots < 0)
            return false;
1060

1061 1062 1063 1064 1065
        if (nsnapshots > 0) {
            virReportError(VIR_ERR_OPERATION_INVALID,
                           _("cannot migrate domain with %d snapshots"),
                           nsnapshots);
            return false;
1066
        }
1067

1068
        /* cancel migration if disk I/O error is emitted while migrating */
1069
        if (flags & VIR_MIGRATE_ABORT_ON_ERROR &&
1070
            !(flags & VIR_MIGRATE_OFFLINE) &&
1071 1072
            virDomainObjGetState(vm, &pauseReason) == VIR_DOMAIN_PAUSED &&
            pauseReason == VIR_DOMAIN_PAUSED_IOERROR) {
E
Eric Blake 已提交
1073
            virReportError(VIR_ERR_OPERATION_INVALID, "%s",
1074
                           _("cannot migrate domain with I/O error"));
E
Eric Blake 已提交
1075 1076
            return false;
        }
1077 1078

    }
1079

1080 1081 1082 1083 1084 1085 1086
    /* following checks don't make sense for offline migration */
    if (!(flags & VIR_MIGRATE_OFFLINE)) {
        if (qemuProcessAutoDestroyActive(driver, vm)) {
            virReportError(VIR_ERR_OPERATION_INVALID,
                           "%s", _("domain is marked for auto destroy"));
            return false;
        }
1087

1088

1089 1090
        if (qemuDomainHasBlockjob(vm, false)) {
            virReportError(VIR_ERR_OPERATION_INVALID, "%s",
1091
                           _("domain has active block job"));
1092 1093 1094 1095 1096 1097
            return false;
        }

        if (!qemuMigrationIsAllowedHostdev(vm->def))
            return false;

1098
        if (vm->def->cpu) {
1099 1100 1101
            /* QEMU blocks migration and save with invariant TSC enabled
             * unless TSC frequency is explicitly set.
             */
1102 1103
            if (virCPUCheckFeature(vm->def->os.arch, vm->def->cpu,
                                   "invtsc") == 1) {
1104 1105 1106 1107 1108 1109 1110 1111 1112 1113 1114 1115 1116 1117 1118 1119 1120 1121
                bool block = true;

                for (i = 0; i < vm->def->clock.ntimers; i++) {
                    virDomainTimerDefPtr timer = vm->def->clock.timers[i];

                    if (timer->name == VIR_DOMAIN_TIMER_NAME_TSC &&
                        timer->frequency > 0) {
                        block = false;
                        break;
                    }
                }

                if (block) {
                    virReportError(VIR_ERR_OPERATION_INVALID, "%s",
                                   _("domain has 'invtsc' CPU feature but "
                                     "TSC frequency is not specified"));
                    return false;
                }
1122
            }
J
Ján Tomko 已提交
1123 1124
        }

1125 1126 1127
        /* Verify that memory device config can be transferred reliably */
        for (i = 0; i < vm->def->nmems; i++) {
            virDomainMemoryDefPtr mem = vm->def->mems[i];
1128

1129 1130 1131 1132 1133
            if (mem->model == VIR_DOMAIN_MEMORY_MODEL_DIMM &&
                mem->info.type != VIR_DOMAIN_DEVICE_ADDRESS_TYPE_DIMM) {
                virReportError(VIR_ERR_OPERATION_INVALID, "%s",
                               _("domain's dimm info lacks slot ID "
                                 "or base address"));
1134

1135 1136
                return false;
            }
1137
        }
1138 1139 1140 1141 1142 1143

        if (vm->def->nshmems) {
            virReportError(VIR_ERR_OPERATION_INVALID, "%s",
                           _("migration with shmem device is not supported"));
            return false;
        }
1144 1145
    }

1146 1147 1148
    return true;
}

1149
static bool
1150 1151
qemuMigrationIsSafe(virDomainDefPtr def,
                    size_t nmigrate_disks,
1152 1153 1154
                    const char **migrate_disks,
                    unsigned int flags)

1155
{
1156 1157
    bool storagemigration = flags & (VIR_MIGRATE_NON_SHARED_DISK |
                                     VIR_MIGRATE_NON_SHARED_INC);
1158
    size_t i;
1159
    int rc;
1160

1161
    for (i = 0; i < def->ndisks; i++) {
1162
        virDomainDiskDefPtr disk = def->disks[i];
1163
        const char *src = virDomainDiskGetSource(disk);
1164

1165
        /* Our code elsewhere guarantees shared disks are either readonly (in
1166
         * which case cache mode doesn't matter) or used with cache=none or used with cache=directsync */
1167 1168 1169
        if (virStorageSourceIsEmpty(disk->src) ||
            disk->src->readonly ||
            disk->src->shared ||
1170 1171
            disk->cachemode == VIR_DOMAIN_DISK_CACHE_DISABLE ||
            disk->cachemode == VIR_DOMAIN_DISK_CACHE_DIRECTSYNC)
1172
            continue;
1173

1174 1175 1176 1177
        /* disks which are migrated by qemu are safe too */
        if (storagemigration &&
            qemuMigrateDisk(disk, nmigrate_disks, migrate_disks))
            continue;
1178

1179 1180 1181 1182 1183 1184 1185 1186 1187 1188 1189 1190
        if (virDomainDiskGetType(disk) == VIR_STORAGE_TYPE_FILE) {
            if ((rc = virFileIsSharedFS(src)) < 0)
                return false;
            else if (rc == 0)
                continue;
            if ((rc = virStorageFileIsClusterFS(src)) < 0)
                return false;
            else if (rc == 1)
                continue;
        } else if (disk->src->type == VIR_STORAGE_TYPE_NETWORK &&
                   disk->src->protocol == VIR_STORAGE_NET_PROTOCOL_RBD) {
            continue;
1191
        }
1192 1193 1194

        virReportError(VIR_ERR_MIGRATE_UNSAFE, "%s",
                       _("Migration may lead to data corruption if disks"
1195
                         " use cache != none or cache != directsync"));
1196
        return false;
1197 1198 1199 1200 1201
    }

    return true;
}

1202 1203 1204 1205
/** qemuMigrationSetOffline
 * Pause domain for non-live migration.
 */
int
1206
qemuMigrationSetOffline(virQEMUDriverPtr driver,
1207 1208 1209
                        virDomainObjPtr vm)
{
    int ret;
1210
    VIR_DEBUG("driver=%p vm=%p", driver, vm);
1211 1212
    ret = qemuProcessStopCPUs(driver, vm, VIR_DOMAIN_PAUSED_MIGRATION,
                              QEMU_ASYNC_JOB_MIGRATION_OUT);
1213
    if (ret == 0) {
1214
        virObjectEventPtr event;
1215

1216
        event = virDomainEventLifecycleNewFromObj(vm,
1217 1218
                                         VIR_DOMAIN_EVENT_SUSPENDED,
                                         VIR_DOMAIN_EVENT_SUSPENDED_MIGRATED);
1219
        qemuDomainEventQueue(driver, event);
1220 1221 1222 1223 1224
    }

    return ret;
}

1225 1226 1227 1228 1229 1230 1231 1232 1233 1234 1235 1236 1237 1238 1239 1240 1241 1242 1243 1244 1245 1246 1247 1248 1249 1250 1251 1252 1253 1254 1255 1256 1257 1258 1259 1260 1261 1262 1263 1264 1265 1266

/**
 * qemuMigrationPostcopyFailed:
 * @driver: qemu driver
 * @vm: domain object
 *
 * Marks @vm as paused with the "post-copy failed" reason. Domains that are
 * neither running nor paused, and domains already paused for that reason,
 * are left untouched. A running domain has its CPUs stopped and a
 * lifecycle event queued; a paused one only has its state reason replaced.
 */
void
qemuMigrationPostcopyFailed(virQEMUDriverPtr driver,
                            virDomainObjPtr vm)
{
    virObjectEventPtr suspended;
    virDomainState cur;
    int why;
    bool running;
    bool paused;

    cur = virDomainObjGetState(vm, &why);
    running = cur == VIR_DOMAIN_RUNNING;
    paused = cur == VIR_DOMAIN_PAUSED;

    if (!running && !paused)
        return;

    /* nothing to do if the failure has already been recorded */
    if (paused && why == VIR_DOMAIN_PAUSED_POSTCOPY_FAILED)
        return;

    VIR_WARN("Migration of domain %s failed during post-copy; "
             "leaving the domain paused", vm->def->name);

    if (!running) {
        virDomainObjSetState(vm, VIR_DOMAIN_PAUSED,
                             VIR_DOMAIN_PAUSED_POSTCOPY_FAILED);
        return;
    }

    if (qemuProcessStopCPUs(driver, vm,
                            VIR_DOMAIN_PAUSED_POSTCOPY_FAILED,
                            QEMU_ASYNC_JOB_MIGRATION_IN) < 0) {
        VIR_WARN("Unable to pause guest CPUs for %s", vm->def->name);
        return;
    }

    suspended = virDomainEventLifecycleNewFromObj(vm,
                            VIR_DOMAIN_EVENT_SUSPENDED,
                            VIR_DOMAIN_EVENT_SUSPENDED_POSTCOPY_FAILED);
    qemuDomainEventQueue(driver, suspended);
}


1267
static int
1268
qemuMigrationSetOption(virQEMUDriverPtr driver,
1269
                       virDomainObjPtr vm,
1270
                       qemuMonitorMigrationCaps capability,
1271
                       bool state,
1272 1273 1274 1275 1276
                       qemuDomainAsyncJob job)
{
    qemuDomainObjPrivatePtr priv = vm->privateData;
    int ret;

1277 1278 1279 1280 1281
    if (!qemuMigrationCapsGet(vm, capability)) {
        if (!state) {
            /* Unsupported but we want it off anyway */
            return 0;
        }
1282 1283

        if (job == QEMU_ASYNC_JOB_MIGRATION_IN) {
1284 1285 1286 1287
            virReportError(VIR_ERR_ARGUMENT_UNSUPPORTED,
                           _("Migration option '%s' is not supported by "
                             "target QEMU binary"),
                           qemuMonitorMigrationCapsTypeToString(capability));
1288
        } else {
1289 1290 1291 1292
            virReportError(VIR_ERR_ARGUMENT_UNSUPPORTED,
                           _("Migration option '%s' is not supported by "
                             "source QEMU binary"),
                           qemuMonitorMigrationCapsTypeToString(capability));
1293
        }
1294
        return -1;
1295 1296
    }

1297 1298 1299
    if (qemuDomainObjEnterMonitorAsync(driver, vm, job) < 0)
        return -1;

1300
    ret = qemuMonitorSetMigrationCapability(priv->mon, capability, state);
1301

1302 1303
    if (qemuDomainObjExitMonitor(driver, vm) < 0)
        ret = -1;
1304

1305 1306 1307
    return ret;
}

1308 1309 1310 1311 1312 1313 1314

/**
 * qemuMigrationSetPostCopy:
 * @driver: qemu driver
 * @vm: domain object
 * @state: whether post-copy should be enabled
 * @job: async job under which the monitor is entered
 *
 * Sets the post-copy migration capability and, when that succeeds, records
 * the new state in the job data of @vm.
 *
 * Returns 0 on success, -1 on failure.
 */
static int
qemuMigrationSetPostCopy(virQEMUDriverPtr driver,
                         virDomainObjPtr vm,
                         bool state,
                         qemuDomainAsyncJob job)
{
    qemuDomainObjPrivatePtr priv = vm->privateData;
    int rc;

    rc = qemuMigrationSetOption(driver, vm,
                                QEMU_MONITOR_MIGRATION_CAPS_POSTCOPY,
                                state, job);
    if (rc < 0)
        return -1;

    priv->job.postcopyEnabled = state;
    return 0;
}


1327
static int
1328
qemuMigrationWaitForSpice(virDomainObjPtr vm)
1329 1330 1331
{
    qemuDomainObjPrivatePtr priv = vm->privateData;

1332 1333
    if (!virQEMUCapsGet(priv->qemuCaps, QEMU_CAPS_SEAMLESS_MIGRATION) ||
        !priv->job.spiceMigration)
1334 1335
        return 0;

1336
    VIR_DEBUG("Waiting for SPICE to finish migration");
1337 1338
    while (!priv->job.spiceMigrated && !priv->job.abortJob) {
        if (virDomainObjWait(vm) < 0)
1339 1340 1341 1342
            return -1;
    }
    return 0;
}
1343

1344 1345 1346 1347

/**
 * qemuMigrationUpdateJobType:
 * @jobInfo: job info to update
 *
 * Derives @jobInfo->status from the QEMU migration status stored in
 * @jobInfo->stats.status. The setup, active and cancelling statuses (and
 * the LAST sentinel) leave the job status as it is.
 */
static void
qemuMigrationUpdateJobType(qemuDomainJobInfoPtr jobInfo)
{
    switch ((qemuMonitorMigrationStatus) jobInfo->stats.status) {
    /* statuses that do not change the job status */
    case QEMU_MONITOR_MIGRATION_STATUS_SETUP:
    case QEMU_MONITOR_MIGRATION_STATUS_ACTIVE:
    case QEMU_MONITOR_MIGRATION_STATUS_CANCELLING:
    case QEMU_MONITOR_MIGRATION_STATUS_LAST:
        break;

    case QEMU_MONITOR_MIGRATION_STATUS_INACTIVE:
        jobInfo->status = QEMU_DOMAIN_JOB_STATUS_NONE;
        break;

    case QEMU_MONITOR_MIGRATION_STATUS_DEVICE:
        jobInfo->status = QEMU_DOMAIN_JOB_STATUS_MIGRATING;
        break;

    case QEMU_MONITOR_MIGRATION_STATUS_PRE_SWITCHOVER:
        jobInfo->status = QEMU_DOMAIN_JOB_STATUS_PAUSED;
        break;

    case QEMU_MONITOR_MIGRATION_STATUS_POSTCOPY:
        jobInfo->status = QEMU_DOMAIN_JOB_STATUS_POSTCOPY;
        break;

    case QEMU_MONITOR_MIGRATION_STATUS_COMPLETED:
        jobInfo->status = QEMU_DOMAIN_JOB_STATUS_QEMU_COMPLETED;
        break;

    case QEMU_MONITOR_MIGRATION_STATUS_ERROR:
        jobInfo->status = QEMU_DOMAIN_JOB_STATUS_FAILED;
        break;

    case QEMU_MONITOR_MIGRATION_STATUS_CANCELLED:
        jobInfo->status = QEMU_DOMAIN_JOB_STATUS_CANCELED;
        break;
    }
}


int
1387 1388 1389
qemuMigrationFetchStats(virQEMUDriverPtr driver,
                        virDomainObjPtr vm,
                        qemuDomainAsyncJob asyncJob,
1390 1391
                        qemuDomainJobInfoPtr jobInfo,
                        char **error)
1392 1393
{
    qemuDomainObjPrivatePtr priv = vm->privateData;
1394
    qemuMonitorMigrationStats stats;
1395 1396 1397 1398 1399
    int rv;

    if (qemuDomainObjEnterMonitorAsync(driver, vm, asyncJob) < 0)
        return -1;

1400
    rv = qemuMonitorGetMigrationStats(priv->mon, &stats, error);
1401 1402 1403 1404

    if (qemuDomainObjExitMonitor(driver, vm) < 0 || rv < 0)
        return -1;

1405 1406 1407
    jobInfo->stats = stats;

    return 0;
1408 1409 1410
}


1411 1412 1413 1414 1415 1416 1417 1418 1419 1420 1421 1422 1423 1424 1425 1426 1427 1428
/**
 * qemuMigrationJobName:
 * @vm: domain object
 *
 * Returns a translated, human readable name for the async job currently
 * recorded in the private data of @vm, for use in error messages.
 */
static const char *
qemuMigrationJobName(virDomainObjPtr vm)
{
    qemuDomainObjPrivatePtr priv = vm->privateData;
    const char *label;

    switch (priv->job.asyncJob) {
    case QEMU_ASYNC_JOB_MIGRATION_OUT:
        label = _("migration job");
        break;
    case QEMU_ASYNC_JOB_SAVE:
        label = _("domain save job");
        break;
    case QEMU_ASYNC_JOB_DUMP:
        label = _("domain core dump job");
        break;
    default:
        label = _("job");
        break;
    }

    return label;
}


1429 1430 1431
static int
qemuMigrationCheckJobStatus(virQEMUDriverPtr driver,
                            virDomainObjPtr vm,
1432
                            qemuDomainAsyncJob asyncJob)
1433 1434 1435
{
    qemuDomainObjPrivatePtr priv = vm->privateData;
    qemuDomainJobInfoPtr jobInfo = priv->job.current;
1436
    char *error = NULL;
1437
    bool events = virQEMUCapsGet(priv->qemuCaps, QEMU_CAPS_MIGRATION_EVENT);
1438
    int ret = -1;
1439

1440 1441 1442 1443 1444
    if (!events ||
        jobInfo->stats.status == QEMU_MONITOR_MIGRATION_STATUS_ERROR) {
        if (qemuMigrationFetchStats(driver, vm, asyncJob, jobInfo, &error) < 0)
            return -1;
    }
1445

1446 1447
    qemuMigrationUpdateJobType(jobInfo);

1448 1449
    switch (jobInfo->status) {
    case QEMU_DOMAIN_JOB_STATUS_NONE:
1450 1451
        virReportError(VIR_ERR_OPERATION_FAILED, _("%s: %s"),
                       qemuMigrationJobName(vm), _("is not active"));
1452
        goto cleanup;
1453

1454
    case QEMU_DOMAIN_JOB_STATUS_FAILED:
1455
        virReportError(VIR_ERR_OPERATION_FAILED, _("%s: %s"),
1456 1457 1458
                       qemuMigrationJobName(vm),
                       error ? error : _("unexpectedly failed"));
        goto cleanup;
1459

1460
    case QEMU_DOMAIN_JOB_STATUS_CANCELED:
1461 1462
        virReportError(VIR_ERR_OPERATION_ABORTED, _("%s: %s"),
                       qemuMigrationJobName(vm), _("canceled by client"));
1463
        goto cleanup;
1464

1465 1466
    case QEMU_DOMAIN_JOB_STATUS_COMPLETED:
    case QEMU_DOMAIN_JOB_STATUS_ACTIVE:
1467
    case QEMU_DOMAIN_JOB_STATUS_MIGRATING:
1468
    case QEMU_DOMAIN_JOB_STATUS_QEMU_COMPLETED:
1469
    case QEMU_DOMAIN_JOB_STATUS_POSTCOPY:
1470
    case QEMU_DOMAIN_JOB_STATUS_PAUSED:
1471 1472
        break;
    }
1473 1474 1475 1476 1477 1478

    ret = 0;

 cleanup:
    VIR_FREE(error);
    return ret;
1479 1480 1481
}


1482 1483 1484
/* Flags accepted by qemuMigrationCompleted and the helpers built on it. */
enum qemuMigrationCompletedFlags {
    /* fail when the domain is paused because of an I/O error */
    QEMU_MIGRATION_COMPLETED_ABORT_ON_ERROR = 1 << 0,
    /* also check drive mirrors via qemuMigrationDriveMirrorReady */
    QEMU_MIGRATION_COMPLETED_CHECK_STORAGE = 1 << 1,
    /* treat the switch to post-copy as completion */
    QEMU_MIGRATION_COMPLETED_POSTCOPY = 1 << 2,
    /* treat the pause before switchover as completion */
    QEMU_MIGRATION_COMPLETED_PRE_SWITCHOVER = 1 << 3,
};

1489

1490 1491 1492 1493 1494 1495 1496 1497 1498 1499 1500
/**
 * qemuMigrationCompleted:
 * @driver: qemu driver
 * @vm: domain object
 * @asyncJob: async job under which the monitor is entered
 * @dconn: connection to the destination, or NULL to skip the liveness check
 * @flags: bitwise-OR of qemuMigrationCompletedFlags
 *
 * Performs a single check of the migration progress.
 *
 * Returns 1 if migration completed successfully,
 *         0 if the domain is still being migrated,
 *         -1 migration failed,
 *         -2 something else failed, we need to cancel migration.
 */
static int
qemuMigrationCompleted(virQEMUDriverPtr driver,
                       virDomainObjPtr vm,
                       qemuDomainAsyncJob asyncJob,
                       virConnectPtr dconn,
                       unsigned int flags)
{
    qemuDomainObjPrivatePtr priv = vm->privateData;
    qemuDomainJobInfoPtr jobInfo = priv->job.current;
    int reason;
    int failure;

    if (qemuMigrationCheckJobStatus(driver, vm, asyncJob) < 0)
        goto error;

    if ((flags & QEMU_MIGRATION_COMPLETED_CHECK_STORAGE) &&
        qemuMigrationDriveMirrorReady(driver, vm, asyncJob) < 0)
        goto error;

    if ((flags & QEMU_MIGRATION_COMPLETED_ABORT_ON_ERROR) &&
        virDomainObjGetState(vm, &reason) == VIR_DOMAIN_PAUSED &&
        reason == VIR_DOMAIN_PAUSED_IOERROR) {
        virReportError(VIR_ERR_OPERATION_FAILED, _("%s: %s"),
                       qemuMigrationJobName(vm), _("failed due to I/O error"));
        goto error;
    }

    if (dconn && virConnectIsAlive(dconn) <= 0) {
        virReportError(VIR_ERR_OPERATION_FAILED, "%s",
                       _("Lost connection to destination host"));
        goto error;
    }

    /* Migration was paused before serializing device state, let's return to
     * the caller so that it can finish all block jobs, resume migration, and
     * wait again for the real end of the migration.
     */
    if ((flags & QEMU_MIGRATION_COMPLETED_PRE_SWITCHOVER) &&
        jobInfo->status == QEMU_DOMAIN_JOB_STATUS_PAUSED) {
        VIR_DEBUG("Migration paused before switchover");
        return 1;
    }

    /* In case of postcopy the source considers migration completed at the
     * moment it switched from active to postcopy-active state. The destination
     * will continue waiting until the migrate state changes to completed.
     */
    if ((flags & QEMU_MIGRATION_COMPLETED_POSTCOPY) &&
        jobInfo->status == QEMU_DOMAIN_JOB_STATUS_POSTCOPY) {
        VIR_DEBUG("Migration switched to post-copy");
        return 1;
    }

    return jobInfo->status == QEMU_DOMAIN_JOB_STATUS_QEMU_COMPLETED ? 1 : 0;

 error:
    failure = -1;

    switch (jobInfo->status) {
    case QEMU_DOMAIN_JOB_STATUS_MIGRATING:
    case QEMU_DOMAIN_JOB_STATUS_POSTCOPY:
    case QEMU_DOMAIN_JOB_STATUS_PAUSED:
        /* The migration was aborted by us rather than QEMU itself. */
        jobInfo->status = QEMU_DOMAIN_JOB_STATUS_FAILED;
        failure = -2;
        break;

    case QEMU_DOMAIN_JOB_STATUS_QEMU_COMPLETED:
        /* Something failed after QEMU already finished the migration. */
        jobInfo->status = QEMU_DOMAIN_JOB_STATUS_FAILED;
        break;

    case QEMU_DOMAIN_JOB_STATUS_FAILED:
    case QEMU_DOMAIN_JOB_STATUS_CANCELED:
        /* QEMU aborted the migration. */
        break;

    case QEMU_DOMAIN_JOB_STATUS_ACTIVE:
    case QEMU_DOMAIN_JOB_STATUS_COMPLETED:
    case QEMU_DOMAIN_JOB_STATUS_NONE:
        /* Impossible. */
        break;
    }

    return failure;
}


1583 1584 1585
/* Returns 0 on success, -2 when migration needs to be cancelled, or -1 when
 * QEMU reports failed migration.
 */
1586
static int
J
Jiri Denemark 已提交
1587 1588
qemuMigrationWaitForCompletion(virQEMUDriverPtr driver,
                               virDomainObjPtr vm,
1589
                               qemuDomainAsyncJob asyncJob,
J
Jiri Denemark 已提交
1590
                               virConnectPtr dconn,
1591
                               unsigned int flags)
1592
{
1593
    qemuDomainObjPrivatePtr priv = vm->privateData;
J
Jiri Denemark 已提交
1594
    qemuDomainJobInfoPtr jobInfo = priv->job.current;
1595
    bool events = virQEMUCapsGet(priv->qemuCaps, QEMU_CAPS_MIGRATION_EVENT);
1596
    int rv;
1597

1598 1599
    jobInfo->status = QEMU_DOMAIN_JOB_STATUS_MIGRATING;

1600 1601
    while ((rv = qemuMigrationCompleted(driver, vm, asyncJob,
                                        dconn, flags)) != 1) {
1602 1603
        if (rv < 0)
            return rv;
1604

1605 1606
        if (events) {
            if (virDomainObjWait(vm) < 0) {
1607
                jobInfo->status = QEMU_DOMAIN_JOB_STATUS_FAILED;
1608 1609 1610 1611 1612 1613 1614 1615 1616 1617
                return -2;
            }
        } else {
            /* Poll every 50ms for progress & to allow cancellation */
            struct timespec ts = { .tv_sec = 0, .tv_nsec = 50 * 1000 * 1000ull };

            virObjectUnlock(vm);
            nanosleep(&ts, NULL);
            virObjectLock(vm);
        }
1618 1619
    }

1620
    if (events)
1621
        ignore_value(qemuMigrationFetchStats(driver, vm, asyncJob, jobInfo, NULL));
1622

1623
    qemuDomainJobInfoUpdateTime(jobInfo);
1624 1625 1626 1627 1628
    qemuDomainJobInfoUpdateDowntime(jobInfo);
    VIR_FREE(priv->job.completed);
    if (VIR_ALLOC(priv->job.completed) == 0)
        *priv->job.completed = *jobInfo;

1629 1630 1631 1632
    if (asyncJob != QEMU_ASYNC_JOB_MIGRATION_OUT &&
        jobInfo->status == QEMU_DOMAIN_JOB_STATUS_QEMU_COMPLETED)
        jobInfo->status = QEMU_DOMAIN_JOB_STATUS_COMPLETED;

1633
    return 0;
1634 1635 1636
}


1637 1638 1639
static int
qemuMigrationWaitForDestCompletion(virQEMUDriverPtr driver,
                                   virDomainObjPtr vm,
1640 1641
                                   qemuDomainAsyncJob asyncJob,
                                   bool postcopy)
1642 1643
{
    qemuDomainObjPrivatePtr priv = vm->privateData;
1644
    unsigned int flags = 0;
1645 1646 1647 1648 1649 1650 1651
    int rv;

    if (!virQEMUCapsGet(priv->qemuCaps, QEMU_CAPS_MIGRATION_EVENT))
        return 0;

    VIR_DEBUG("Waiting for incoming migration to complete");

1652 1653 1654 1655 1656
    if (postcopy)
        flags = QEMU_MIGRATION_COMPLETED_POSTCOPY;

    while ((rv = qemuMigrationCompleted(driver, vm, asyncJob,
                                        NULL, flags)) != 1) {
1657 1658 1659 1660 1661 1662 1663 1664
        if (rv < 0 || virDomainObjWait(vm) < 0)
            return -1;
    }

    return 0;
}


1665
static int
1666
qemuDomainMigrateGraphicsRelocate(virQEMUDriverPtr driver,
1667
                                  virDomainObjPtr vm,
1668 1669
                                  qemuMigrationCookiePtr cookie,
                                  const char *graphicsuri)
1670 1671
{
    qemuDomainObjPrivatePtr priv = vm->privateData;
1672 1673
    int ret = -1;
    const char *listenAddress = NULL;
1674
    virSocketAddr addr;
1675 1676 1677 1678 1679
    virURIPtr uri = NULL;
    int type = -1;
    int port = -1;
    int tlsPort = -1;
    const char *tlsSubject = NULL;
1680

1681
    if (!cookie || (!cookie->graphics && !graphicsuri))
1682 1683
        return 0;

1684 1685 1686 1687 1688 1689 1690 1691 1692 1693 1694 1695 1696 1697 1698 1699 1700 1701 1702
    if (graphicsuri && !(uri = virURIParse(graphicsuri)))
        goto cleanup;

    if (cookie->graphics) {
        type = cookie->graphics->type;

        listenAddress = cookie->graphics->listen;

        if (!listenAddress ||
            (virSocketAddrParse(&addr, listenAddress, AF_UNSPEC) > 0 &&
             virSocketAddrIsWildcard(&addr)))
            listenAddress = cookie->remoteHostname;

        port = cookie->graphics->port;
        tlsPort = cookie->graphics->tlsPort;
        tlsSubject = cookie->graphics->tlsSubject;
    }

    if (uri) {
1703
        size_t i;
1704 1705 1706 1707 1708 1709 1710 1711 1712 1713 1714 1715 1716 1717 1718 1719 1720 1721 1722 1723 1724 1725 1726 1727 1728 1729 1730

        if ((type = virDomainGraphicsTypeFromString(uri->scheme)) < 0) {
            virReportError(VIR_ERR_INVALID_ARG,
                           _("unknown graphics type %s"), uri->scheme);
            goto cleanup;
        }

        if (uri->server)
            listenAddress = uri->server;
        if (uri->port > 0)
            port = uri->port;

        for (i = 0; i < uri->paramsCount; i++) {
            virURIParamPtr param = uri->params + i;

            if (STRCASEEQ(param->name, "tlsPort")) {
                if (virStrToLong_i(param->value, NULL, 10, &tlsPort) < 0) {
                    virReportError(VIR_ERR_INVALID_ARG,
                                   _("invalid tlsPort number: %s"),
                                   param->value);
                    goto cleanup;
                }
            } else if (STRCASEEQ(param->name, "tlsSubject")) {
                tlsSubject = param->value;
            }
        }
    }
1731 1732 1733 1734

    /* QEMU doesn't support VNC relocation yet, so
     * skip it to avoid generating an error
     */
1735 1736 1737 1738
    if (type != VIR_DOMAIN_GRAPHICS_TYPE_SPICE) {
        ret = 0;
        goto cleanup;
    }
1739

1740 1741 1742 1743 1744 1745 1746 1747 1748
    /* Older libvirt sends port == 0 for listen type='none' graphics. It's
     * safe to ignore such requests since relocation to unknown port does
     * not make sense in general.
     */
    if (port <= 0 && tlsPort <= 0) {
        ret = 0;
        goto cleanup;
    }

1749 1750 1751 1752
    if (qemuDomainObjEnterMonitorAsync(driver, vm,
                                       QEMU_ASYNC_JOB_MIGRATION_OUT) == 0) {
        ret = qemuMonitorGraphicsRelocate(priv->mon, type, listenAddress,
                                          port, tlsPort, tlsSubject);
1753
        priv->job.spiceMigration = !ret;
1754 1755
        if (qemuDomainObjExitMonitor(driver, vm) < 0)
            ret = -1;
1756
    }
1757

1758
 cleanup:
1759
    virURIFree(uri);
1760 1761 1762 1763
    return ret;
}


1764
static int
1765
qemuDomainMigrateOPDRelocate(virQEMUDriverPtr driver ATTRIBUTE_UNUSED,
1766 1767 1768
                             virDomainObjPtr vm,
                             qemuMigrationCookiePtr cookie)
{
1769 1770
    virDomainNetDefPtr netptr;
    int ret = -1;
1771
    size_t i;
1772 1773 1774 1775 1776 1777 1778 1779

    for (i = 0; i < cookie->network->nnets; i++) {
        netptr = vm->def->nets[i];

        switch (cookie->network->net[i].vporttype) {
        case VIR_NETDEV_VPORT_PROFILE_NONE:
        case VIR_NETDEV_VPORT_PROFILE_8021QBG:
        case VIR_NETDEV_VPORT_PROFILE_8021QBH:
1780
           break;
1781
        case VIR_NETDEV_VPORT_PROFILE_OPENVSWITCH:
1782 1783
            if (virNetDevOpenvswitchSetMigrateData(cookie->network->net[i].portdata,
                                                   netptr->ifname) != 0) {
J
Jiri Denemark 已提交
1784 1785 1786
                virReportError(VIR_ERR_INTERNAL_ERROR,
                               _("Unable to run command to set OVS port data for "
                                 "interface %s"), netptr->ifname);
1787 1788 1789
                goto cleanup;
            }
            break;
1790 1791 1792 1793 1794
        default:
            break;
        }
    }

1795
    ret = 0;
1796
 cleanup:
1797 1798 1799 1800
    return ret;
}


1801 1802 1803 1804 1805 1806 1807 1808 1809 1810 1811 1812 1813 1814 1815 1816 1817 1818 1819 1820 1821 1822 1823 1824 1825 1826 1827 1828 1829 1830 1831 1832 1833 1834 1835 1836 1837 1838 1839 1840
/* qemuMigrationCheckIncoming
 * @qemuCaps: capabilities of the QEMU binary
 * @migrateFrom: incoming migration source string
 *
 * Verify that @migrateFrom starts with a protocol we know about.  "rdma"
 * additionally requires QEMU_CAPS_MIGRATE_RDMA in @qemuCaps; "tcp", "exec",
 * "fd" and "unix" prefixes and the exact string "stdio" are always accepted.
 *
 * Returns 0 if the source is acceptable, -1 with an error reported otherwise.
 */
int
qemuMigrationCheckIncoming(virQEMUCapsPtr qemuCaps,
                           const char *migrateFrom)
{
    if (STRPREFIX(migrateFrom, "rdma")) {
        if (virQEMUCapsGet(qemuCaps, QEMU_CAPS_MIGRATE_RDMA))
            return 0;

        virReportError(VIR_ERR_OPERATION_UNSUPPORTED, "%s",
                       _("incoming RDMA migration is not supported "
                         "with this QEMU binary"));
        return -1;
    }

    if (STRPREFIX(migrateFrom, "tcp") ||
        STRPREFIX(migrateFrom, "exec") ||
        STRPREFIX(migrateFrom, "fd") ||
        STRPREFIX(migrateFrom, "unix") ||
        STREQ(migrateFrom, "stdio"))
        return 0;

    virReportError(VIR_ERR_OPERATION_UNSUPPORTED, "%s",
                   _("unknown migration protocol"));
    return -1;
}


/* qemuMigrationIncomingURI
 * @migrateFrom: incoming migration source string
 * @migrateFd: file descriptor used when @migrateFrom is "stdio"
 *
 * Build the URI for the incoming migration: "fd:<migrateFd>" when
 * @migrateFrom is exactly "stdio", otherwise a copy of @migrateFrom.
 *
 * Returns the newly allocated URI, or NULL if the allocation failed (the
 * helpers' return values are deliberately ignored here).
 */
char *
qemuMigrationIncomingURI(const char *migrateFrom,
                         int migrateFd)
{
    char *result = NULL;

    if (STRNEQ(migrateFrom, "stdio")) {
        ignore_value(VIR_STRDUP(result, migrateFrom));
        return result;
    }

    ignore_value(virAsprintf(&result, "fd:%d", migrateFd));
    return result;
}


1841 1842 1843 1844 1845 1846 1847 1848 1849 1850 1851 1852 1853 1854 1855 1856 1857 1858 1859 1860 1861 1862 1863 1864 1865 1866
/* qemuMigrationRunIncoming
 * @driver: qemu driver
 * @vm: domain object
 * @uri: URI QEMU should accept the incoming migration on
 * @asyncJob: async job the monitor access belongs to
 *
 * Issue the migrate-incoming monitor command.  For any job other than
 * QEMU_ASYNC_JOB_MIGRATION_IN, also wait for the destination to complete.
 *
 * Returns 0 on success, -1 on failure.
 */
int
qemuMigrationRunIncoming(virQEMUDriverPtr driver,
                         virDomainObjPtr vm,
                         const char *uri,
                         qemuDomainAsyncJob asyncJob)
{
    qemuDomainObjPrivatePtr priv = vm->privateData;
    int monRc;

    VIR_DEBUG("Setting up incoming migration with URI %s", uri);

    if (qemuDomainObjEnterMonitorAsync(driver, vm, asyncJob) < 0)
        return -1;

    monRc = qemuMonitorMigrateIncoming(priv->mon, uri);

    /* The monitor is always exited, even when the command itself failed. */
    if (qemuDomainObjExitMonitor(driver, vm) < 0)
        return -1;
    if (monRc < 0)
        return -1;

    /* qemuMigrationWaitForDestCompletion is called from the Finish phase */
    if (asyncJob == QEMU_ASYNC_JOB_MIGRATION_IN)
        return 0;

    if (qemuMigrationWaitForDestCompletion(driver, vm, asyncJob, false) < 0)
        return -1;

    return 0;
}


1877 1878 1879 1880 1881 1882
/* This is called for outgoing non-p2p migrations when a connection to the
 * client which initiated the migration was closed but we were waiting for it
 * to follow up with the next phase, that is, in between
 * qemuDomainMigrateBegin3 and qemuDomainMigratePerform3 or
 * qemuDomainMigratePerform3 and qemuDomainMigrateConfirm3.
 */
1883 1884 1885 1886
static virDomainObjPtr
qemuMigrationCleanup(virDomainObjPtr vm,
                     virConnectPtr conn,
                     void *opaque)
1887
{
1888
    virQEMUDriverPtr driver = opaque;
1889 1890 1891 1892 1893 1894 1895 1896 1897 1898 1899 1900 1901 1902 1903
    qemuDomainObjPrivatePtr priv = vm->privateData;

    VIR_DEBUG("vm=%s, conn=%p, asyncJob=%s, phase=%s",
              vm->def->name, conn,
              qemuDomainAsyncJobTypeToString(priv->job.asyncJob),
              qemuDomainAsyncJobPhaseToString(priv->job.asyncJob,
                                              priv->job.phase));

    if (!qemuMigrationJobIsActive(vm, QEMU_ASYNC_JOB_MIGRATION_OUT))
        goto cleanup;

    VIR_DEBUG("The connection which started outgoing migration of domain %s"
              " was closed; canceling the migration",
              vm->def->name);

1904
    switch ((qemuMigrationJobPhase) priv->job.phase) {
1905 1906 1907 1908 1909 1910 1911 1912 1913 1914 1915 1916 1917 1918 1919 1920 1921 1922 1923 1924 1925 1926 1927 1928 1929 1930 1931 1932 1933 1934
    case QEMU_MIGRATION_PHASE_BEGIN3:
        /* just forget we were about to migrate */
        qemuDomainObjDiscardAsyncJob(driver, vm);
        break;

    case QEMU_MIGRATION_PHASE_PERFORM3_DONE:
        VIR_WARN("Migration of domain %s finished but we don't know if the"
                 " domain was successfully started on destination or not",
                 vm->def->name);
        /* clear the job and let higher levels decide what to do */
        qemuDomainObjDiscardAsyncJob(driver, vm);
        break;

    case QEMU_MIGRATION_PHASE_PERFORM3:
        /* cannot be seen without an active migration API; unreachable */
    case QEMU_MIGRATION_PHASE_CONFIRM3:
    case QEMU_MIGRATION_PHASE_CONFIRM3_CANCELLED:
        /* all done; unreachable */
    case QEMU_MIGRATION_PHASE_PREPARE:
    case QEMU_MIGRATION_PHASE_FINISH2:
    case QEMU_MIGRATION_PHASE_FINISH3:
        /* incoming migration; unreachable */
    case QEMU_MIGRATION_PHASE_PERFORM2:
        /* single phase outgoing migration; unreachable */
    case QEMU_MIGRATION_PHASE_NONE:
    case QEMU_MIGRATION_PHASE_LAST:
        /* unreachable */
        ;
    }

1935
 cleanup:
1936 1937 1938
    return vm;
}

1939

1940
/* The caller is supposed to lock the vm and start a migration job. */
1941 1942 1943 1944 1945 1946 1947
static char *
qemuMigrationBeginPhase(virQEMUDriverPtr driver,
                        virDomainObjPtr vm,
                        const char *xmlin,
                        const char *dname,
                        char **cookieout,
                        int *cookieoutlen,
1948 1949
                        size_t nmigrate_disks,
                        const char **migrate_disks,
1950
                        unsigned long flags)
1951 1952 1953
{
    char *rv = NULL;
    qemuMigrationCookiePtr mig = NULL;
1954
    virDomainDefPtr def = NULL;
1955
    qemuDomainObjPrivatePtr priv = vm->privateData;
1956
    virCapsPtr caps = NULL;
1957
    unsigned int cookieFlags = QEMU_MIGRATION_COOKIE_LOCKSTATE;
1958

1959
    VIR_DEBUG("driver=%p, vm=%p, xmlin=%s, dname=%s,"
1960
              " cookieout=%p, cookieoutlen=%p,"
1961
              " nmigrate_disks=%zu, migrate_disks=%p, flags=0x%lx",
1962
              driver, vm, NULLSTR(xmlin), NULLSTR(dname),
1963 1964
              cookieout, cookieoutlen, nmigrate_disks,
              migrate_disks, flags);
1965

1966 1967 1968
    if (!(caps = virQEMUDriverGetCapabilities(driver, false)))
        goto cleanup;

1969 1970 1971 1972 1973 1974
    /* Only set the phase if we are inside QEMU_ASYNC_JOB_MIGRATION_OUT.
     * Otherwise we will start the async job later in the perform phase losing
     * change protection.
     */
    if (priv->job.asyncJob == QEMU_ASYNC_JOB_MIGRATION_OUT)
        qemuMigrationJobSetPhase(driver, vm, QEMU_MIGRATION_PHASE_BEGIN3);
1975

1976
    if (!qemuMigrationIsAllowed(driver, vm, true, flags))
1977 1978
        goto cleanup;

1979
    if (!(flags & (VIR_MIGRATE_UNSAFE | VIR_MIGRATE_OFFLINE)) &&
1980
        !qemuMigrationIsSafe(vm->def, nmigrate_disks, migrate_disks, flags))
1981 1982
        goto cleanup;

1983 1984 1985 1986 1987 1988 1989 1990 1991
    if (flags & VIR_MIGRATE_POSTCOPY &&
        (!(flags & VIR_MIGRATE_LIVE) ||
         flags & VIR_MIGRATE_PAUSED)) {
        virReportError(VIR_ERR_ARGUMENT_UNSUPPORTED, "%s",
                       _("post-copy migration is not supported with non-live "
                         "or paused migration"));
        goto cleanup;
    }

1992 1993 1994 1995 1996 1997
    if (flags & VIR_MIGRATE_POSTCOPY && flags & VIR_MIGRATE_TUNNELLED) {
        virReportError(VIR_ERR_ARGUMENT_UNSUPPORTED, "%s",
                       _("post-copy is not supported with tunnelled migration"));
        goto cleanup;
    }

1998 1999 2000 2001 2002 2003 2004 2005 2006 2007 2008 2009 2010 2011 2012 2013 2014 2015 2016 2017 2018 2019 2020 2021 2022 2023 2024 2025 2026 2027 2028 2029 2030 2031 2032 2033 2034 2035 2036 2037 2038 2039 2040
    if (flags & (VIR_MIGRATE_NON_SHARED_DISK | VIR_MIGRATE_NON_SHARED_INC)) {
        bool has_drive_mirror =  virQEMUCapsGet(priv->qemuCaps,
                                                QEMU_CAPS_DRIVE_MIRROR);

        if (nmigrate_disks) {
            if (has_drive_mirror) {
                size_t i, j;
                /* Check user requested only known disk targets. */
                for (i = 0; i < nmigrate_disks; i++) {
                    for (j = 0; j < vm->def->ndisks; j++) {
                        if (STREQ(vm->def->disks[j]->dst, migrate_disks[i]))
                            break;
                    }

                    if (j == vm->def->ndisks) {
                        virReportError(VIR_ERR_INVALID_ARG,
                                       _("disk target %s not found"),
                                       migrate_disks[i]);
                        goto cleanup;
                    }
                }

                if (flags & VIR_MIGRATE_TUNNELLED) {
                    virReportError(VIR_ERR_OPERATION_UNSUPPORTED, "%s",
                                   _("Selecting disks to migrate is not "
                                     "implemented for tunnelled migration"));
                    goto cleanup;
                }
            } else {
                virReportError(VIR_ERR_OPERATION_UNSUPPORTED, "%s",
                               _("qemu does not support drive-mirror command"));
                goto cleanup;
            }
        }

        if (has_drive_mirror) {
            /* TODO support NBD for TUNNELLED migration */
            if (flags & VIR_MIGRATE_TUNNELLED) {
                VIR_WARN("NBD in tunnelled migration is currently not supported");
            } else {
                cookieFlags |= QEMU_MIGRATION_COOKIE_NBD;
                priv->nbdPort = 0;
            }
2041 2042 2043
        }
    }

2044
    if (virDomainDefHasMemoryHotplug(vm->def) ||
2045
        ((flags & VIR_MIGRATE_PERSIST_DEST) &&
2046
         vm->newDef && virDomainDefHasMemoryHotplug(vm->newDef)))
2047 2048
        cookieFlags |= QEMU_MIGRATION_COOKIE_MEMORY_HOTPLUG;

2049 2050 2051 2052 2053
    if (!qemuDomainVcpuHotplugIsInOrder(vm->def) ||
        ((flags & VIR_MIGRATE_PERSIST_DEST) &&
         vm->newDef && !qemuDomainVcpuHotplugIsInOrder(vm->newDef)))
        cookieFlags |= QEMU_MIGRATION_COOKIE_CPU_HOTPLUG;

2054 2055 2056
    if (priv->origCPU)
        cookieFlags |= QEMU_MIGRATION_COOKIE_CPU;

2057 2058
    cookieFlags |= QEMU_MIGRATION_COOKIE_ALLOW_REBOOT;

2059
    if (!(mig = qemuMigrationEatCookie(driver, vm, NULL, 0, 0)))
2060 2061 2062 2063
        goto cleanup;

    if (qemuMigrationBakeCookie(mig, driver, vm,
                                cookieout, cookieoutlen,
2064
                                cookieFlags) < 0)
2065 2066
        goto cleanup;

L
liguang 已提交
2067 2068 2069 2070 2071 2072 2073 2074 2075 2076 2077 2078 2079 2080 2081 2082 2083 2084 2085 2086 2087 2088
    if (flags & VIR_MIGRATE_OFFLINE) {
        if (flags & (VIR_MIGRATE_NON_SHARED_DISK |
                     VIR_MIGRATE_NON_SHARED_INC)) {
            virReportError(VIR_ERR_OPERATION_INVALID, "%s",
                           _("offline migration cannot handle "
                             "non-shared storage"));
            goto cleanup;
        }
        if (!(flags & VIR_MIGRATE_PERSIST_DEST)) {
            virReportError(VIR_ERR_OPERATION_INVALID, "%s",
                           _("offline migration must be specified with "
                             "the persistent flag set"));
            goto cleanup;
        }
        if (flags & VIR_MIGRATE_TUNNELLED) {
            virReportError(VIR_ERR_OPERATION_INVALID, "%s",
                           _("tunnelled offline migration does not "
                             "make sense"));
            goto cleanup;
        }
    }

2089
    if (xmlin) {
2090
        if (!(def = virDomainDefParseString(xmlin, caps, driver->xmlopt, priv->qemuCaps,
2091 2092
                                            VIR_DOMAIN_DEF_PARSE_INACTIVE |
                                            VIR_DOMAIN_DEF_PARSE_SKIP_VALIDATE)))
2093 2094
            goto cleanup;

2095
        if (!qemuDomainCheckABIStability(driver, vm, def))
2096 2097
            goto cleanup;

2098
        rv = qemuDomainDefFormatLive(driver, def, NULL, false, true);
2099
    } else {
2100 2101
        rv = qemuDomainDefFormatLive(driver, vm->def, priv->origCPU,
                                     false, true);
2102
    }
2103

2104
 cleanup:
2105
    qemuMigrationCookieFree(mig);
2106
    virObjectUnref(caps);
2107
    virDomainDefFree(def);
2108 2109 2110
    return rv;
}

2111 2112 2113 2114 2115 2116 2117
/* qemuMigrationBegin
 * @conn: connection the migration was requested on
 * @vm: domain object; released with virDomainObjEndAPI() on every path
 * @xmlin: optional replacement domain XML
 * @dname: destination domain name
 * @cookieout: filled with the migration cookie
 * @cookieoutlen: length of @cookieout
 * @nmigrate_disks: number of entries in @migrate_disks
 * @migrate_disks: disk targets selected for storage migration
 * @flags: VIR_MIGRATE_* flags
 *
 * Entry point of the Begin phase.  With VIR_MIGRATE_CHANGE_PROTECTION an
 * outgoing migration async job is started and, on success, left active with
 * a close callback registered on @conn; otherwise a plain modify job wraps
 * the call and is always ended before returning.
 *
 * Returns the domain XML to send to the destination, or NULL on failure.
 * NULL is returned on every failure path, including failures that happen
 * after the XML was already generated.
 */
char *
qemuMigrationBegin(virConnectPtr conn,
                   virDomainObjPtr vm,
                   const char *xmlin,
                   const char *dname,
                   char **cookieout,
                   int *cookieoutlen,
                   size_t nmigrate_disks,
                   const char **migrate_disks,
                   unsigned long flags)
{
    virQEMUDriverPtr driver = conn->privateData;
    virQEMUDriverConfigPtr cfg = NULL;
    char *xml = NULL;
    qemuDomainAsyncJob asyncJob;

    if ((flags & VIR_MIGRATE_CHANGE_PROTECTION)) {
        if (qemuMigrationJobStart(driver, vm, QEMU_ASYNC_JOB_MIGRATION_OUT) < 0)
            goto cleanup;
        asyncJob = QEMU_ASYNC_JOB_MIGRATION_OUT;
    } else {
        if (qemuDomainObjBeginJob(driver, vm, QEMU_JOB_MODIFY) < 0)
            goto cleanup;
        asyncJob = QEMU_ASYNC_JOB_NONE;
    }

    qemuMigrationStoreDomainState(vm);

    if (!virDomainObjIsActive(vm) && !(flags & VIR_MIGRATE_OFFLINE)) {
        virReportError(VIR_ERR_OPERATION_INVALID,
                       "%s", _("domain is not running"));
        goto endjob;
    }

    /* Check if there is any ejected media.
     * We don't want to require them on the destination.
     */
    if (!(flags & VIR_MIGRATE_OFFLINE) &&
        qemuProcessRefreshDisks(driver, vm, asyncJob) < 0)
        goto endjob;

    if (!(xml = qemuMigrationBeginPhase(driver, vm, xmlin, dname,
                                        cookieout, cookieoutlen,
                                        nmigrate_disks, migrate_disks, flags)))
        goto endjob;

    if (flags & VIR_MIGRATE_TLS) {
        cfg = virQEMUDriverGetConfig(driver);
        if (qemuMigrationCheckSetupTLS(conn, driver, cfg, vm, asyncJob) < 0) {
            /* The XML already exists at this point; drop it so the caller
             * sees NULL instead of mistaking this failure for success. */
            VIR_FREE(xml);
            goto endjob;
        }
    }

    if ((flags & VIR_MIGRATE_CHANGE_PROTECTION)) {
        /* We keep the job active across API calls until the confirm() call.
         * This prevents any other APIs being invoked while migration is taking
         * place.
         */
        if (virCloseCallbacksSet(driver->closeCallbacks, vm, conn,
                                 qemuMigrationCleanup) < 0) {
            VIR_FREE(xml);
            goto endjob;
        }
        qemuMigrationJobContinue(vm);
    } else {
        /* Without change protection the job only covers this call. */
        goto endjob;
    }

 cleanup:
    virObjectUnref(cfg);
    virDomainObjEndAPI(&vm);
    return xml;

 endjob:
    if (flags & VIR_MIGRATE_CHANGE_PROTECTION)
        qemuMigrationJobFinish(driver, vm);
    else
        qemuDomainObjEndJob(driver, vm);
    goto cleanup;
}

2191

2192 2193
/* Prepare is the first step, and it runs on the destination host.
 */
2194

2195
static void
2196
qemuMigrationPrepareCleanup(virQEMUDriverPtr driver,
2197 2198 2199 2200 2201 2202 2203 2204 2205 2206
                            virDomainObjPtr vm)
{
    qemuDomainObjPrivatePtr priv = vm->privateData;

    VIR_DEBUG("driver=%p, vm=%s, job=%s, asyncJob=%s",
              driver,
              vm->def->name,
              qemuDomainJobTypeToString(priv->job.active),
              qemuDomainAsyncJobTypeToString(priv->job.asyncJob));

2207 2208 2209
    virPortAllocatorRelease(driver->migrationPorts, priv->migrationPort);
    priv->migrationPort = 0;

2210 2211 2212 2213 2214
    if (!qemuMigrationJobIsActive(vm, QEMU_ASYNC_JOB_MIGRATION_IN))
        return;
    qemuDomainObjDiscardAsyncJob(driver, vm);
}

2215
static qemuProcessIncomingDefPtr
2216 2217 2218 2219
qemuMigrationPrepareIncoming(virDomainObjPtr vm,
                             bool tunnel,
                             const char *protocol,
                             const char *listenAddress,
2220 2221
                             unsigned short port,
                             int fd)
2222 2223
{
    qemuDomainObjPrivatePtr priv = vm->privateData;
2224
    qemuProcessIncomingDefPtr inc = NULL;
2225 2226 2227 2228 2229 2230 2231 2232 2233 2234 2235 2236 2237 2238 2239 2240 2241 2242 2243 2244 2245 2246 2247 2248 2249 2250 2251 2252 2253 2254 2255 2256 2257 2258 2259 2260 2261 2262 2263 2264 2265 2266 2267 2268 2269 2270 2271 2272 2273 2274 2275 2276 2277 2278 2279 2280 2281 2282 2283 2284 2285 2286
    char *migrateFrom = NULL;

    if (tunnel) {
        if (VIR_STRDUP(migrateFrom, "stdio") < 0)
            goto cleanup;
    } else {
        bool encloseAddress = false;
        bool hostIPv6Capable = false;
        bool qemuIPv6Capable = false;
        struct addrinfo *info = NULL;
        struct addrinfo hints = { .ai_flags = AI_ADDRCONFIG,
                                  .ai_socktype = SOCK_STREAM };
        const char *incFormat;

        if (getaddrinfo("::", NULL, &hints, &info) == 0) {
            freeaddrinfo(info);
            hostIPv6Capable = true;
        }
        qemuIPv6Capable = virQEMUCapsGet(priv->qemuCaps,
                                         QEMU_CAPS_IPV6_MIGRATION);

        if (listenAddress) {
            if (virSocketAddrNumericFamily(listenAddress) == AF_INET6) {
                if (!qemuIPv6Capable) {
                    virReportError(VIR_ERR_ARGUMENT_UNSUPPORTED, "%s",
                                   _("qemu isn't capable of IPv6"));
                    goto cleanup;
                }
                if (!hostIPv6Capable) {
                    virReportError(VIR_ERR_ARGUMENT_UNSUPPORTED, "%s",
                                   _("host isn't capable of IPv6"));
                    goto cleanup;
                }
                /* IPv6 address must be escaped in brackets on the cmd line */
                encloseAddress = true;
            } else {
                /* listenAddress is a hostname or IPv4 */
            }
        } else if (qemuIPv6Capable && hostIPv6Capable) {
            /* Listen on :: instead of 0.0.0.0 if QEMU understands it
             * and there is at least one IPv6 address configured
             */
            listenAddress = "::";
            encloseAddress = true;
        } else {
            listenAddress = "0.0.0.0";
        }

        /* QEMU will be started with
         *   -incoming protocol:[<IPv6 addr>]:port,
         *   -incoming protocol:<IPv4 addr>:port, or
         *   -incoming protocol:<hostname>:port
         */
        if (encloseAddress)
            incFormat = "%s:[%s]:%d";
        else
            incFormat = "%s:%s:%d";
        if (virAsprintf(&migrateFrom, incFormat,
                        protocol, listenAddress, port) < 0)
            goto cleanup;
    }

2287 2288
    inc = qemuProcessIncomingDefNew(priv->qemuCaps, listenAddress,
                                    migrateFrom, fd, NULL);
2289

2290
 cleanup:
2291 2292
    VIR_FREE(migrateFrom);
    return inc;
2293 2294
}

2295 2296 2297 2298
static int
qemuMigrationSetCompression(virQEMUDriverPtr driver,
                            virDomainObjPtr vm,
                            qemuDomainAsyncJob job,
2299 2300
                            qemuMigrationCompressionPtr compression,
                            qemuMonitorMigrationParamsPtr migParams)
2301
{
2302 2303 2304
    int ret = -1;
    qemuDomainObjPrivatePtr priv = vm->privateData;

2305 2306 2307 2308 2309 2310 2311 2312 2313 2314 2315 2316 2317 2318
    if (qemuMigrationSetOption(driver, vm,
                               QEMU_MONITOR_MIGRATION_CAPS_XBZRLE,
                               compression->methods &
                                   (1ULL << QEMU_MIGRATION_COMPRESS_XBZRLE),
                               job) < 0)
        return -1;

    if (qemuMigrationSetOption(driver, vm,
                               QEMU_MONITOR_MIGRATION_CAPS_COMPRESS,
                               compression->methods &
                                   (1ULL << QEMU_MIGRATION_COMPRESS_MT),
                               job) < 0)
        return -1;

2319 2320 2321
    if (qemuDomainObjEnterMonitorAsync(driver, vm, job) < 0)
        return -1;

2322 2323
    migParams->compressLevel_set = compression->level_set;
    migParams->compressLevel = compression->level;
2324

2325 2326
    migParams->compressThreads_set = compression->threads_set;
    migParams->compressThreads = compression->threads;
2327

2328 2329
    migParams->decompressThreads_set = compression->dthreads_set;
    migParams->decompressThreads = compression->dthreads;
2330 2331 2332 2333 2334 2335 2336 2337 2338 2339 2340 2341 2342

    if (compression->xbzrle_cache_set &&
        qemuMonitorSetMigrationCacheSize(priv->mon,
                                         compression->xbzrle_cache) < 0)
        goto cleanup;

    ret = 0;

 cleanup:
    if (qemuDomainObjExitMonitor(driver, vm) < 0)
        ret = -1;

    return ret;
2343 2344
}

2345

2346 2347 2348 2349 2350 2351 2352 2353 2354 2355 2356 2357 2358 2359 2360 2361 2362 2363 2364 2365 2366 2367
/* qemuMigrationParamsClear
 * @migParams: migration parameters block, may be NULL
 *
 * Free the TLS alias and TLS hostname strings held by @migParams.  The
 * block itself is not freed.
 */
void
qemuMigrationParamsClear(qemuMonitorMigrationParamsPtr migParams)
{
    if (migParams) {
        VIR_FREE(migParams->migrateTLSAlias);
        VIR_FREE(migParams->migrateTLSHostname);
    }
}


/* qemuMigrationParamsFree
 * @migParams: address of a migration parameters pointer; the address
 *             itself and the pointer it holds may both be NULL
 *
 * Clear the strings owned by *@migParams and free the block itself via
 * VIR_FREE().  A NULL @migParams or a NULL *@migParams is a no-op,
 * matching the NULL tolerance of qemuMigrationParamsClear().
 */
void
qemuMigrationParamsFree(qemuMonitorMigrationParamsPtr *migParams)
{
    if (!migParams || !*migParams)
        return;

    qemuMigrationParamsClear(*migParams);
    VIR_FREE(*migParams);
}


2368 2369 2370 2371 2372 2373 2374 2375 2376 2377 2378 2379 2380 2381 2382 2383 2384 2385 2386 2387 2388 2389 2390 2391 2392 2393 2394 2395 2396 2397 2398 2399 2400 2401
/* qemuMigrationSetEmptyTLSParams
 * @driver: pointer to qemu driver
 * @vm: domain object
 * @asyncJob: migration job to join
 * @migParams: Pointer to a migration parameters block
 *
 * After checking for TLS credential support, and only when the domain has
 * a migration TLS alias recorded, set both the TLS alias and the TLS
 * hostname in @migParams to the empty string (""), which indicates to not
 * use TLS on this migration.  Without a recorded alias @migParams is left
 * untouched.
 *
 * Returns 0 on success, -1 on failure
 */
static int
qemuMigrationSetEmptyTLSParams(virQEMUDriverPtr driver,
                               virDomainObjPtr vm,
                               qemuDomainAsyncJob asyncJob,
                               qemuMonitorMigrationParamsPtr migParams)
{
    qemuDomainObjPrivatePtr priv = vm->privateData;

    if (qemuMigrationCheckTLSCreds(driver, vm, asyncJob) < 0)
        return -1;

    if (priv->migTLSAlias) {
        if (VIR_STRDUP(migParams->migrateTLSAlias, "") < 0)
            return -1;
        if (VIR_STRDUP(migParams->migrateTLSHostname, "") < 0)
            return -1;
    }

    return 0;
}


2402 2403 2404 2405 2406 2407 2408 2409 2410 2411 2412 2413 2414 2415 2416 2417 2418 2419 2420 2421 2422 2423 2424 2425 2426 2427 2428 2429 2430 2431 2432 2433 2434 2435 2436 2437 2438 2439 2440 2441 2442
/* qemuMigrationParams
 * @params: typed parameters passed to the migration API, may be NULL
 * @nparams: number of entries in @params
 * @flags: VIR_MIGRATE_* flags
 *
 * Allocate a migration parameters block and fill in the auto-converge
 * throttling values found in @params.  Supplying either of them without
 * VIR_MIGRATE_AUTO_CONVERGE in @flags is an error.
 *
 * Returns the new block (freed with qemuMigrationParamsFree() on the error
 * path here), or NULL on failure.
 */
qemuMonitorMigrationParamsPtr
qemuMigrationParams(virTypedParameterPtr params,
                    int nparams,
                    unsigned long flags)
{
    qemuMonitorMigrationParamsPtr migParams;
    int rc;

    if (VIR_ALLOC(migParams) < 0)
        return NULL;

    /* No typed parameters: hand back the freshly allocated block as is. */
    if (!params)
        return migParams;

    /* For each lookup, a return value of 1 marks the parameter as set and
     * a negative value is an error. */
    rc = virTypedParamsGetInt(params, nparams,
                              VIR_MIGRATE_PARAM_AUTO_CONVERGE_INITIAL,
                              &migParams->cpuThrottleInitial);
    if (rc < 0)
        goto error;
    if (rc == 1)
        migParams->cpuThrottleInitial_set = true;

    rc = virTypedParamsGetInt(params, nparams,
                              VIR_MIGRATE_PARAM_AUTO_CONVERGE_INCREMENT,
                              &migParams->cpuThrottleIncrement);
    if (rc < 0)
        goto error;
    if (rc == 1)
        migParams->cpuThrottleIncrement_set = true;

    if (!(flags & VIR_MIGRATE_AUTO_CONVERGE) &&
        (migParams->cpuThrottleInitial_set ||
         migParams->cpuThrottleIncrement_set)) {
        virReportError(VIR_ERR_INVALID_ARG, "%s",
                       _("Turn auto convergence on to tune it"));
        goto error;
    }

    return migParams;

 error:
    qemuMigrationParamsFree(&migParams);
    return NULL;
}


2448 2449 2450 2451 2452 2453 2454 2455 2456 2457 2458 2459 2460 2461 2462 2463 2464 2465 2466 2467 2468 2469 2470 2471 2472
/* qemuMigrationSetParams
 * @driver: qemu driver
 * @vm: domain object
 * @job: async job the monitor access belongs to
 * @migParams: migration parameters to apply
 *
 * Enter the monitor, apply @migParams and leave the monitor again.
 *
 * Returns 0 on success, -1 if entering the monitor, setting the parameters
 * or exiting the monitor failed.
 */
static int
qemuMigrationSetParams(virQEMUDriverPtr driver,
                       virDomainObjPtr vm,
                       qemuDomainAsyncJob job,
                       qemuMonitorMigrationParamsPtr migParams)
{
    qemuDomainObjPrivatePtr priv = vm->privateData;
    int rc = 0;

    if (qemuDomainObjEnterMonitorAsync(driver, vm, job) < 0)
        return -1;

    if (qemuMonitorSetMigrationParams(priv->mon, migParams) < 0)
        rc = -1;

    /* The monitor is exited regardless of the command's outcome. */
    if (qemuDomainObjExitMonitor(driver, vm) < 0)
        rc = -1;

    return rc;
}


2473 2474 2475 2476 2477 2478
/* qemuMigrationResetTLS
 * @driver: pointer to qemu driver
 * @vm: domain object
 * @asyncJob: migration job to join
 *
 * Deconstruct all the setup possibly done for TLS - delete the TLS and
2479
 * security objects, free the secinfo, and reset the migration params to "".
2480 2481 2482
 *
 * Returns 0 on success, -1 on failure
 */
2483
static int
2484 2485
qemuMigrationResetTLS(virQEMUDriverPtr driver,
                      virDomainObjPtr vm,
2486
                      qemuDomainAsyncJob asyncJob)
2487 2488
{
    qemuDomainObjPrivatePtr priv = vm->privateData;
2489 2490
    char *tlsAlias = NULL;
    char *secAlias = NULL;
2491
    qemuMonitorMigrationParams migParams = { 0 };
R
Roman Bogorodskiy 已提交
2492
    int ret = -1;
2493

2494
    if (qemuMigrationCheckTLSCreds(driver, vm, asyncJob) < 0)
2495 2496
        return -1;

2497 2498
    /* If the tls-creds doesn't exist or if they're set to "" then there's
     * nothing to do since we never set anything up */
2499 2500 2501 2502 2503 2504
    if (!priv->migTLSAlias || !*priv->migTLSAlias)
        return 0;

    /* NB: If either or both fail to allocate memory we can still proceed
     *     since the next time we migrate another deletion attempt will be
     *     made after successfully generating the aliases. */
2505 2506
    tlsAlias = qemuAliasTLSObjFromSrcAlias(QEMU_MIGRATION_TLS_ALIAS_BASE);
    secAlias = qemuDomainGetSecretAESAlias(QEMU_MIGRATION_TLS_ALIAS_BASE, false);
2507 2508 2509 2510 2511 2512 2513 2514 2515 2516 2517 2518

    qemuDomainDelTLSObjects(driver, vm, asyncJob, secAlias, tlsAlias);
    qemuDomainSecretInfoFree(&priv->migSecinfo);

    if (VIR_STRDUP(migParams.migrateTLSAlias, "") < 0 ||
        VIR_STRDUP(migParams.migrateTLSHostname, "") < 0 ||
        qemuMigrationSetParams(driver, vm, asyncJob, &migParams) < 0)
        goto cleanup;

    ret = 0;

 cleanup:
2519 2520
    VIR_FREE(tlsAlias);
    VIR_FREE(secAlias);
2521 2522 2523 2524 2525 2526
    qemuMigrationParamsClear(&migParams);

    return ret;
}


2527
static int
2528
qemuMigrationPrepareAny(virQEMUDriverPtr driver,
2529 2530 2531 2532 2533
                        virConnectPtr dconn,
                        const char *cookiein,
                        int cookieinlen,
                        char **cookieout,
                        int *cookieoutlen,
2534
                        virDomainDefPtr *def,
2535
                        const char *origname,
L
liguang 已提交
2536
                        virStreamPtr st,
2537
                        const char *protocol,
2538 2539
                        unsigned short port,
                        bool autoPort,
2540
                        const char *listenAddress,
2541 2542
                        size_t nmigrate_disks,
                        const char **migrate_disks,
2543
                        int nbdPort,
2544
                        qemuMigrationCompressionPtr compression,
L
liguang 已提交
2545
                        unsigned long flags)
2546 2547
{
    virDomainObjPtr vm = NULL;
2548
    virObjectEventPtr event = NULL;
2549
    virQEMUDriverConfigPtr cfg = NULL;
2550
    int ret = -1;
2551
    int dataFD[2] = { -1, -1 };
2552
    qemuDomainObjPrivatePtr priv = NULL;
2553
    qemuMigrationCookiePtr mig = NULL;
2554
    bool tunnel = !!st;
J
Jiri Denemark 已提交
2555
    char *xmlout = NULL;
L
liguang 已提交
2556
    unsigned int cookieFlags;
2557
    unsigned int startFlags;
2558
    virCapsPtr caps = NULL;
2559
    qemuProcessIncomingDefPtr incoming = NULL;
2560
    bool taint_hook = false;
2561 2562 2563
    bool stopProcess = false;
    bool relabel = false;
    int rv;
2564 2565
    char *tlsAlias = NULL;
    char *secAlias = NULL;
2566
    qemuMonitorMigrationParams migParams = { 0 };
2567

2568 2569
    virNWFilterReadLockFilterUpdates();

L
liguang 已提交
2570 2571 2572 2573 2574 2575 2576 2577 2578 2579 2580 2581 2582 2583 2584 2585 2586 2587 2588 2589
    if (flags & VIR_MIGRATE_OFFLINE) {
        if (flags & (VIR_MIGRATE_NON_SHARED_DISK |
                     VIR_MIGRATE_NON_SHARED_INC)) {
            virReportError(VIR_ERR_OPERATION_INVALID, "%s",
                           _("offline migration cannot handle "
                             "non-shared storage"));
            goto cleanup;
        }
        if (!(flags & VIR_MIGRATE_PERSIST_DEST)) {
            virReportError(VIR_ERR_OPERATION_INVALID, "%s",
                           _("offline migration must be specified with "
                             "the persistent flag set"));
            goto cleanup;
        }
        if (tunnel) {
            virReportError(VIR_ERR_OPERATION_INVALID, "%s",
                           _("tunnelled offline migration does not "
                             "make sense"));
            goto cleanup;
        }
2590 2591 2592
        cookieFlags = 0;
    } else {
        cookieFlags = QEMU_MIGRATION_COOKIE_GRAPHICS;
L
liguang 已提交
2593 2594
    }

2595 2596 2597 2598 2599 2600 2601 2602 2603
    if (flags & VIR_MIGRATE_POSTCOPY &&
        (!(flags & VIR_MIGRATE_LIVE) ||
         flags & VIR_MIGRATE_PAUSED)) {
        virReportError(VIR_ERR_ARGUMENT_UNSUPPORTED, "%s",
                       _("post-copy migration is not supported with non-live "
                         "or paused migration"));
        goto cleanup;
    }

2604 2605 2606 2607 2608 2609
    if (flags & VIR_MIGRATE_POSTCOPY && flags & VIR_MIGRATE_TUNNELLED) {
        virReportError(VIR_ERR_ARGUMENT_UNSUPPORTED, "%s",
                       _("post-copy is not supported with tunnelled migration"));
        goto cleanup;
    }

2610 2611 2612
    if (!(caps = virQEMUDriverGetCapabilities(driver, false)))
        goto cleanup;

2613
    if (!qemuMigrationIsAllowedHostdev(*def))
2614 2615
        goto cleanup;

J
Jiri Denemark 已提交
2616 2617 2618 2619 2620
    /* Let migration hook filter domain XML */
    if (virHookPresent(VIR_HOOK_DRIVER_QEMU)) {
        char *xml;
        int hookret;

2621
        if (!(xml = qemuDomainDefFormatXML(driver, *def,
2622 2623
                                           VIR_DOMAIN_XML_SECURE |
                                           VIR_DOMAIN_XML_MIGRATABLE)))
J
Jiri Denemark 已提交
2624 2625
            goto cleanup;

2626
        hookret = virHookCall(VIR_HOOK_DRIVER_QEMU, (*def)->name,
J
Jiri Denemark 已提交
2627 2628 2629 2630 2631 2632 2633
                              VIR_HOOK_QEMU_OP_MIGRATE, VIR_HOOK_SUBOP_BEGIN,
                              NULL, xml, &xmlout);
        VIR_FREE(xml);

        if (hookret < 0) {
            goto cleanup;
        } else if (hookret == 0) {
2634
            if (virStringIsEmpty(xmlout)) {
J
Jiri Denemark 已提交
2635 2636 2637 2638 2639 2640
                VIR_DEBUG("Migrate hook filter returned nothing; using the"
                          " original XML");
            } else {
                virDomainDefPtr newdef;

                VIR_DEBUG("Using hook-filtered domain XML: %s", xmlout);
2641
                newdef = virDomainDefParseString(xmlout, caps, driver->xmlopt, NULL,
2642 2643
                                                 VIR_DOMAIN_DEF_PARSE_INACTIVE |
                                                 VIR_DOMAIN_DEF_PARSE_SKIP_VALIDATE);
J
Jiri Denemark 已提交
2644 2645 2646
                if (!newdef)
                    goto cleanup;

2647
                if (!qemuDomainDefCheckABIStability(driver, *def, newdef)) {
J
Jiri Denemark 已提交
2648 2649 2650 2651
                    virDomainDefFree(newdef);
                    goto cleanup;
                }

2652 2653
                virDomainDefFree(*def);
                *def = newdef;
2654 2655 2656 2657
                /* We should taint the domain here. However, @vm and therefore
                 * privateData too are still NULL, so just notice the fact and
                 * taint it later. */
                taint_hook = true;
J
Jiri Denemark 已提交
2658 2659 2660 2661
            }
        }
    }

2662
    if (!(vm = virDomainObjListAdd(driver->domains, *def,
2663
                                   driver->xmlopt,
2664 2665 2666
                                   VIR_DOMAIN_OBJ_LIST_ADD_LIVE |
                                   VIR_DOMAIN_OBJ_LIST_ADD_CHECK_LIVE,
                                   NULL)))
2667
        goto cleanup;
2668

2669
    virObjectRef(vm);
2670
    *def = NULL;
2671
    priv = vm->privateData;
2672 2673
    if (VIR_STRDUP(priv->origname, origname) < 0)
        goto cleanup;
2674

2675 2676 2677 2678 2679
    if (taint_hook) {
        /* Domain XML has been altered by a hook script. */
        priv->hookRun = true;
    }

2680
    if (!(mig = qemuMigrationEatCookie(driver, vm, cookiein, cookieinlen,
2681
                                       QEMU_MIGRATION_COOKIE_LOCKSTATE |
2682
                                       QEMU_MIGRATION_COOKIE_NBD |
2683
                                       QEMU_MIGRATION_COOKIE_MEMORY_HOTPLUG |
2684
                                       QEMU_MIGRATION_COOKIE_CPU_HOTPLUG |
2685 2686
                                       QEMU_MIGRATION_COOKIE_CPU |
                                       QEMU_MIGRATION_COOKIE_ALLOW_REBOOT)))
2687 2688
        goto cleanup;

2689 2690
    if (STREQ_NULLABLE(protocol, "rdma") &&
        !virMemoryLimitIsSet(vm->def->mem.hard_limit)) {
M
Michael R. Hines 已提交
2691 2692 2693 2694 2695 2696
        virReportError(VIR_ERR_OPERATION_INVALID, "%s",
                       _("cannot start RDMA migration with no memory hard "
                         "limit set"));
        goto cleanup;
    }

2697
    if (qemuMigrationPrecreateStorage(dconn, driver, vm, mig->nbd,
2698 2699
                                      nmigrate_disks, migrate_disks,
                                      !!(flags & VIR_MIGRATE_NON_SHARED_INC)) < 0)
2700 2701
        goto cleanup;

2702
    if (qemuMigrationJobStart(driver, vm, QEMU_ASYNC_JOB_MIGRATION_IN) < 0)
2703
        goto cleanup;
2704
    qemuMigrationJobSetPhase(driver, vm, QEMU_MIGRATION_PHASE_PREPARE);
2705 2706 2707 2708

    /* Domain starts inactive, even if the domain XML had an id field. */
    vm->def->id = -1;

L
liguang 已提交
2709 2710 2711
    if (flags & VIR_MIGRATE_OFFLINE)
        goto done;

2712 2713
    if (tunnel &&
        (pipe(dataFD) < 0 || virSetCloseExec(dataFD[1]) < 0)) {
2714 2715
        virReportSystemError(errno, "%s",
                             _("cannot create pipe for tunnelled migration"));
2716
        goto stopjob;
2717 2718
    }

2719 2720
    startFlags = VIR_QEMU_PROCESS_START_AUTODESTROY;

2721
    if (qemuProcessInit(driver, vm, mig->cpu, QEMU_ASYNC_JOB_MIGRATION_IN,
2722
                        true, startFlags) < 0)
2723
        goto stopjob;
2724
    stopProcess = true;
2725

2726 2727
    priv->allowReboot = mig->allowReboot;

2728 2729 2730
    if (!(incoming = qemuMigrationPrepareIncoming(vm, tunnel, protocol,
                                                  listenAddress, port,
                                                  dataFD[0])))
2731
        goto stopjob;
2732

2733
    if (qemuProcessPrepareDomain(dconn, driver, vm, startFlags) < 0)
2734 2735
        goto stopjob;

2736
    if (qemuProcessPrepareHost(driver, vm, startFlags) < 0)
2737 2738
        goto stopjob;

2739 2740 2741
    rv = qemuProcessLaunch(dconn, driver, vm, QEMU_ASYNC_JOB_MIGRATION_IN,
                           incoming, NULL,
                           VIR_NETDEV_VPORT_PROFILE_OP_MIGRATE_IN_START,
2742
                           startFlags);
2743 2744 2745
    if (rv < 0) {
        if (rv == -2)
            relabel = true;
2746
        goto stopjob;
2747
    }
2748
    relabel = true;
2749

2750 2751 2752 2753
    if (tunnel) {
        if (virFDStreamOpen(st, dataFD[1]) < 0) {
            virReportSystemError(errno, "%s",
                                 _("cannot pass pipe for tunnelled migration"));
2754
            goto stopjob;
2755
        }
2756
        dataFD[1] = -1; /* 'st' owns the FD now & will close it */
2757 2758
    }

2759
    if (qemuMigrationSetCompression(driver, vm, QEMU_ASYNC_JOB_MIGRATION_IN,
2760
                                    compression, &migParams) < 0)
2761
        goto stopjob;
2762

2763 2764 2765 2766 2767 2768 2769 2770 2771 2772 2773 2774 2775 2776 2777 2778 2779 2780 2781 2782 2783 2784 2785 2786
    /* Migrations using TLS need to add the "tls-creds-x509" object and
     * set the migration TLS parameters */
    if (flags & VIR_MIGRATE_TLS) {
        cfg = virQEMUDriverGetConfig(driver);
        if (qemuMigrationCheckSetupTLS(dconn, driver, cfg, vm,
                                       QEMU_ASYNC_JOB_MIGRATION_IN) < 0)
            goto stopjob;

        if (qemuMigrationAddTLSObjects(driver, vm, cfg, true,
                                       QEMU_ASYNC_JOB_MIGRATION_IN,
                                       &tlsAlias, &secAlias, &migParams) < 0)
            goto stopjob;

        /* Force reset of 'tls-hostname', it's a source only parameter */
        if (VIR_STRDUP(migParams.migrateTLSHostname, "") < 0)
            goto stopjob;

    } else {
        if (qemuMigrationSetEmptyTLSParams(driver, vm,
                                           QEMU_ASYNC_JOB_MIGRATION_IN,
                                           &migParams) < 0)
            goto stopjob;
    }

2787
    if (STREQ_NULLABLE(protocol, "rdma") &&
M
Michael R. Hines 已提交
2788
        virProcessSetMaxMemLock(vm->pid, vm->def->mem.hard_limit << 10) < 0) {
2789
        goto stopjob;
M
Michael R. Hines 已提交
2790 2791
    }

2792 2793
    if (qemuMigrationSetOption(driver, vm,
                               QEMU_MONITOR_MIGRATION_CAPS_RDMA_PIN_ALL,
2794 2795
                               flags & VIR_MIGRATE_RDMA_PIN_ALL,
                               QEMU_ASYNC_JOB_MIGRATION_IN) < 0)
2796
        goto stopjob;
2797

2798 2799 2800 2801 2802
    if (qemuMigrationSetPostCopy(driver, vm,
                                 flags & VIR_MIGRATE_POSTCOPY,
                                 QEMU_ASYNC_JOB_MIGRATION_IN) < 0)
        goto stopjob;

2803 2804 2805 2806
    if (qemuMigrationSetParams(driver, vm, QEMU_ASYNC_JOB_MIGRATION_IN,
                               &migParams) < 0)
        goto stopjob;

2807 2808 2809
    if (mig->nbd &&
        flags & (VIR_MIGRATE_NON_SHARED_DISK | VIR_MIGRATE_NON_SHARED_INC) &&
        virQEMUCapsGet(priv->qemuCaps, QEMU_CAPS_NBD_SERVER)) {
2810
        if (qemuMigrationStartNBDServer(driver, vm, incoming->address,
2811 2812
                                        nmigrate_disks, migrate_disks,
                                        nbdPort) < 0) {
2813
            goto stopjob;
2814
        }
2815
        cookieFlags |= QEMU_MIGRATION_COOKIE_NBD;
2816 2817
    }

2818 2819 2820 2821 2822 2823 2824 2825 2826
    if (mig->lockState) {
        VIR_DEBUG("Received lockstate %s", mig->lockState);
        VIR_FREE(priv->lockState);
        priv->lockState = mig->lockState;
        mig->lockState = NULL;
    } else {
        VIR_DEBUG("Received no lockstate");
    }

2827 2828 2829 2830 2831 2832 2833 2834 2835
    if (incoming->deferredURI &&
        qemuMigrationRunIncoming(driver, vm, incoming->deferredURI,
                                 QEMU_ASYNC_JOB_MIGRATION_IN) < 0)
        goto stopjob;

    if (qemuProcessFinishStartup(dconn, driver, vm, QEMU_ASYNC_JOB_MIGRATION_IN,
                                 false, VIR_DOMAIN_PAUSED_MIGRATION) < 0)
        goto stopjob;

2836
 done:
2837 2838
    if (qemuMigrationBakeCookie(mig, driver, vm, cookieout,
                                cookieoutlen, cookieFlags) < 0) {
2839 2840 2841 2842 2843 2844 2845
        /* We could tear down the whole guest here, but
         * cookie data is (so far) non-critical, so that
         * seems a little harsh. We'll just warn for now.
         */
        VIR_WARN("Unable to encode migration cookie");
    }

2846
    if (qemuDomainCleanupAdd(vm, qemuMigrationPrepareCleanup) < 0)
2847
        goto stopjob;
2848

L
liguang 已提交
2849 2850
    if (!(flags & VIR_MIGRATE_OFFLINE)) {
        virDomainAuditStart(vm, "migrated", true);
2851
        event = virDomainEventLifecycleNewFromObj(vm,
L
liguang 已提交
2852 2853 2854
                                         VIR_DOMAIN_EVENT_STARTED,
                                         VIR_DOMAIN_EVENT_STARTED_MIGRATED);
    }
2855

2856 2857 2858 2859
    /* We keep the job active across API calls until the finish() call.
     * This prevents any other APIs being invoked while incoming
     * migration is taking place.
     */
2860
    qemuMigrationJobContinue(vm);
2861

2862 2863
    if (autoPort)
        priv->migrationPort = port;
2864 2865 2866 2867 2868
    /* in this case port is not auto selected and we don't need to manage it
     * anymore after cookie is baked
     */
    if (nbdPort != 0)
        priv->nbdPort = 0;
2869
    ret = 0;
2870

2871
 cleanup:
2872 2873 2874
    VIR_FREE(tlsAlias);
    VIR_FREE(secAlias);
    virObjectUnref(cfg);
2875
    qemuProcessIncomingDefFree(incoming);
J
Jiri Denemark 已提交
2876
    VIR_FREE(xmlout);
2877 2878
    VIR_FORCE_CLOSE(dataFD[0]);
    VIR_FORCE_CLOSE(dataFD[1]);
2879 2880 2881
    if (ret < 0 && priv) {
        /* priv is set right after vm is added to the list of domains
         * and there is no 'goto cleanup;' in the middle of those */
2882
        VIR_FREE(priv->origname);
2883 2884 2885 2886 2887
        /* release if port is auto selected which is not the case if
         * it is given in parameters
         */
        if (nbdPort == 0)
            virPortAllocatorRelease(driver->migrationPorts, priv->nbdPort);
2888
        priv->nbdPort = 0;
2889
        virDomainObjRemoveTransientDef(vm);
2890
        qemuDomainRemoveInactiveJob(driver, vm);
2891
    }
2892
    qemuMigrationParamsClear(&migParams);
M
Michal Privoznik 已提交
2893
    virDomainObjEndAPI(&vm);
2894
    qemuDomainEventQueue(driver, event);
2895
    qemuMigrationCookieFree(mig);
2896
    virObjectUnref(caps);
2897
    virNWFilterUnlockFilterUpdates();
2898
    return ret;
2899

2900
 stopjob:
2901
    qemuMigrationReset(driver, vm, QEMU_ASYNC_JOB_MIGRATION_IN);
2902

2903 2904 2905 2906
    if (stopProcess) {
        unsigned int stopFlags = VIR_QEMU_PROCESS_STOP_MIGRATED;
        if (!relabel)
            stopFlags |= VIR_QEMU_PROCESS_STOP_NO_RELABEL;
2907
        virDomainAuditStart(vm, "migrated", false);
2908 2909
        qemuProcessStop(driver, vm, VIR_DOMAIN_SHUTOFF_FAILED,
                        QEMU_ASYNC_JOB_MIGRATION_IN, stopFlags);
2910
    }
2911

2912
    qemuMigrationJobFinish(driver, vm);
2913
    goto cleanup;
2914 2915 2916
}


2917 2918 2919 2920 2921
/*
 * This version starts an empty VM listening on a localhost TCP port, and
 * sets up the corresponding virStream to handle the incoming data.
 */
int
2922
qemuMigrationPrepareTunnel(virQEMUDriverPtr driver,
2923 2924 2925 2926 2927 2928
                           virConnectPtr dconn,
                           const char *cookiein,
                           int cookieinlen,
                           char **cookieout,
                           int *cookieoutlen,
                           virStreamPtr st,
2929
                           virDomainDefPtr *def,
2930
                           const char *origname,
L
liguang 已提交
2931
                           unsigned long flags)
2932
{
2933
    qemuMigrationCompressionPtr compression = NULL;
2934 2935 2936
    int ret;

    VIR_DEBUG("driver=%p, dconn=%p, cookiein=%s, cookieinlen=%d, "
2937
              "cookieout=%p, cookieoutlen=%p, st=%p, def=%p, "
2938
              "origname=%s, flags=0x%lx",
2939
              driver, dconn, NULLSTR(cookiein), cookieinlen,
2940
              cookieout, cookieoutlen, st, *def, origname, flags);
2941

2942 2943 2944 2945 2946 2947
    if (st == NULL) {
        virReportError(VIR_ERR_INTERNAL_ERROR, "%s",
                       _("tunnelled migration requested but NULL stream passed"));
        return -1;
    }

2948 2949 2950
    if (!(compression = qemuMigrationCompressionParse(NULL, 0, flags)))
        return -1;

2951
    ret = qemuMigrationPrepareAny(driver, dconn, cookiein, cookieinlen,
2952
                                  cookieout, cookieoutlen, def, origname,
2953 2954 2955
                                  st, NULL, 0, false, NULL, 0, NULL, 0,
                                  compression, flags);
    VIR_FREE(compression);
2956 2957 2958 2959
    return ret;
}


2960 2961 2962 2963 2964 2965 2966 2967 2968 2969 2970 2971 2972 2973 2974 2975 2976 2977 2978 2979 2980 2981 2982
/*
 * qemuMigrationParseURI:
 * @uri: migration URI, either "tcp://host..." or the legacy "tcp:host..."
 * @wellFormed: if non-NULL and parsing succeeds, set to true when @uri
 *              could be parsed as given and to false when the legacy
 *              form had to be rewritten first
 *
 * Returns the parsed URI, or NULL if formatting the rewritten URI or
 * parsing fails (in which case @wellFormed is left untouched).
 */
static virURIPtr
qemuMigrationParseURI(const char *uri, bool *wellFormed)
{
    char *rewritten = NULL;
    virURIPtr result;

    /* For compatibility reasons tcp://... URIs are sent as tcp:...
     * Turn the legacy spelling into a well-formed URI before parsing. */
    if (STRPREFIX(uri, "tcp:") && !STRPREFIX(uri + 4, "//") &&
        virAsprintf(&rewritten, "tcp://%s", uri + 4) < 0)
        return NULL;

    result = virURIParse(rewritten ? rewritten : uri);
    if (result && wellFormed)
        *wellFormed = (rewritten == NULL);

    VIR_FREE(rewritten);
    return result;
}


2983
int
2984
qemuMigrationPrepareDirect(virQEMUDriverPtr driver,
2985
                           virConnectPtr dconn,
2986 2987 2988 2989
                           const char *cookiein,
                           int cookieinlen,
                           char **cookieout,
                           int *cookieoutlen,
2990 2991
                           const char *uri_in,
                           char **uri_out,
2992
                           virDomainDefPtr *def,
2993
                           const char *origname,
2994
                           const char *listenAddress,
2995 2996
                           size_t nmigrate_disks,
                           const char **migrate_disks,
2997
                           int nbdPort,
2998
                           qemuMigrationCompressionPtr compression,
L
liguang 已提交
2999
                           unsigned long flags)
3000
{
3001 3002
    unsigned short port = 0;
    bool autoPort = true;
3003 3004
    char *hostname = NULL;
    int ret = -1;
3005
    virURIPtr uri = NULL;
3006 3007
    virQEMUDriverConfigPtr cfg = virQEMUDriverGetConfig(driver);
    const char *migrateHost = cfg->migrateHost;
J
Jiri Denemark 已提交
3008

3009 3010
    VIR_DEBUG("driver=%p, dconn=%p, cookiein=%s, cookieinlen=%d, "
              "cookieout=%p, cookieoutlen=%p, uri_in=%s, uri_out=%p, "
3011
              "def=%p, origname=%s, listenAddress=%s, "
3012
              "nmigrate_disks=%zu, migrate_disks=%p, nbdPort=%d, flags=0x%lx",
3013 3014
              driver, dconn, NULLSTR(cookiein), cookieinlen,
              cookieout, cookieoutlen, NULLSTR(uri_in), uri_out,
3015
              *def, origname, NULLSTR(listenAddress),
3016
              nmigrate_disks, migrate_disks, nbdPort, flags);
3017

3018 3019
    *uri_out = NULL;

3020 3021 3022
    /* The URI passed in may be NULL or a string "tcp://somehostname:port".
     *
     * If the URI passed in is NULL then we allocate a port number
3023 3024 3025
     * from our pool of port numbers, and if the migrateHost is configured,
     * we return a URI of "tcp://migrateHost:port", otherwise return a URI
     * of "tcp://ourhostname:port".
3026 3027 3028 3029 3030 3031
     *
     * If the URI passed in is not NULL then we try to parse out the
     * port number and use that (note that the hostname is assumed
     * to be a correct hostname which refers to the target machine).
     */
    if (uri_in == NULL) {
3032 3033 3034
        bool encloseAddress = false;
        const char *incFormat;

3035
        if (virPortAllocatorAcquire(driver->migrationPorts, &port) < 0)
3036
            goto cleanup;
3037

3038
        if (migrateHost != NULL) {
3039 3040
            if (virSocketAddrNumericFamily(migrateHost) == AF_INET6)
                encloseAddress = true;
3041

3042
            if (VIR_STRDUP(hostname, migrateHost) < 0)
3043 3044 3045 3046 3047
                goto cleanup;
        } else {
            if ((hostname = virGetHostname()) == NULL)
                goto cleanup;
        }
3048 3049

        if (STRPREFIX(hostname, "localhost")) {
3050 3051 3052
            virReportError(VIR_ERR_INTERNAL_ERROR, "%s",
                           _("hostname on destination resolved to localhost,"
                             " but migration requires an FQDN"));
3053 3054 3055 3056 3057
            goto cleanup;
        }

        /* XXX this really should have been a properly well-formed
         * URI, but we can't add in tcp:// now without breaking
3058
         * compatibility with old targets. We at least make the
3059 3060
         * new targets accept both syntaxes though.
         */
3061 3062 3063 3064 3065 3066
        if (encloseAddress)
            incFormat = "%s:[%s]:%d";
        else
            incFormat = "%s:%s:%d";

        if (virAsprintf(uri_out, incFormat, "tcp", hostname, port) < 0)
3067 3068
            goto cleanup;
    } else {
3069
        bool well_formed_uri;
J
Ján Tomko 已提交
3070

3071 3072
        if (!(uri = qemuMigrationParseURI(uri_in, &well_formed_uri)))
            goto cleanup;
J
Ján Tomko 已提交
3073

3074 3075 3076 3077 3078 3079 3080
        if (uri->scheme == NULL) {
            virReportError(VIR_ERR_INVALID_ARG,
                           _("missing scheme in migration URI: %s"),
                           uri_in);
            goto cleanup;
        }

M
Michael R. Hines 已提交
3081 3082
        if (STRNEQ(uri->scheme, "tcp") &&
            STRNEQ(uri->scheme, "rdma")) {
3083 3084 3085
            virReportError(VIR_ERR_ARGUMENT_UNSUPPORTED,
                           _("unsupported scheme %s in migration URI %s"),
                           uri->scheme, uri_in);
J
Ján Tomko 已提交
3086 3087 3088 3089 3090 3091 3092 3093 3094 3095
            goto cleanup;
        }

        if (uri->server == NULL) {
            virReportError(VIR_ERR_INVALID_ARG, _("missing host in migration"
                                                  " URI: %s"), uri_in);
            goto cleanup;
        }

        if (uri->port == 0) {
3096
            if (virPortAllocatorAcquire(driver->migrationPorts, &port) < 0)
3097
                goto cleanup;
3098

3099
            /* Send well-formed URI only if uri_in was well-formed */
3100 3101 3102 3103 3104 3105 3106 3107
            if (well_formed_uri) {
                uri->port = port;
                if (!(*uri_out = virURIFormat(uri)))
                    goto cleanup;
            } else {
                if (virAsprintf(uri_out, "%s:%d", uri_in, port) < 0)
                    goto cleanup;
            }
3108
        } else {
3109 3110
            port = uri->port;
            autoPort = false;
3111 3112 3113 3114 3115 3116
        }
    }

    if (*uri_out)
        VIR_DEBUG("Generated uri_out=%s", *uri_out);

3117
    ret = qemuMigrationPrepareAny(driver, dconn, cookiein, cookieinlen,
3118
                                  cookieout, cookieoutlen, def, origname,
3119
                                  NULL, uri ? uri->scheme : "tcp",
3120
                                  port, autoPort, listenAddress,
3121 3122
                                  nmigrate_disks, migrate_disks, nbdPort,
                                  compression, flags);
3123
 cleanup:
3124
    virURIFree(uri);
3125
    VIR_FREE(hostname);
3126
    virObjectUnref(cfg);
3127
    if (ret != 0) {
3128
        VIR_FREE(*uri_out);
3129 3130 3131
        if (autoPort)
            virPortAllocatorRelease(driver->migrationPorts, port);
    }
3132 3133 3134 3135
    return ret;
}


3136 3137 3138
/*
 * qemuMigrationPrepareDef:
 * @driver: pointer to qemu driver
 * @dom_xml: domain XML received for the migration
 * @dname: new name for the domain, or NULL to keep the name from the XML
 * @origname: if non-NULL, receives the name found in the XML when the
 *            domain was renamed to @dname (NULL when no rename happened);
 *            the caller owns the returned string
 *
 * Parses @dom_xml into an inactive domain definition and optionally
 * renames it.
 *
 * Returns the definition, or NULL on failure. On failure after the XML was
 * parsed the definition is freed; @origname is written only on success.
 */
virDomainDefPtr
qemuMigrationPrepareDef(virQEMUDriverPtr driver,
                        const char *dom_xml,
                        const char *dname,
                        char **origname)
{
    virCapsPtr caps = NULL;
    virDomainDefPtr def;
    char *name = NULL;

    if (!dom_xml) {
        virReportError(VIR_ERR_INTERNAL_ERROR, "%s",
                       _("no domain XML passed"));
        return NULL;
    }

    if (!(caps = virQEMUDriverGetCapabilities(driver, false)))
        return NULL;

    if (!(def = virDomainDefParseString(dom_xml, caps, driver->xmlopt, NULL,
                                        VIR_DOMAIN_DEF_PARSE_INACTIVE |
                                        VIR_DOMAIN_DEF_PARSE_SKIP_VALIDATE)))
        goto cleanup;

    if (dname) {
        /* Keep hold of the original name: it is either handed to the
         * caller through @origname or freed below. */
        name = def->name;
        if (VIR_STRDUP(def->name, dname) < 0) {
            virDomainDefFree(def);
            def = NULL;
        }
    }

 cleanup:
    virObjectUnref(caps);
    if (def && origname)
        *origname = name;
    else
        VIR_FREE(name);
    return def;
}


3178 3179 3180 3181 3182 3183 3184 3185 3186 3187
/*
 * qemuMigrationConfirmPhase:
 * @driver: pointer to qemu driver
 * @conn: connection, used when restoring the domain state after a failure
 * @vm: domain object being migrated away
 * @cookiein: cookie sent back by the destination
 * @cookieinlen: length of @cookiein
 * @flags: bitwise-OR of VIR_MIGRATE_* flags
 * @retcode: 0 if the migration succeeded, non-zero if it was cancelled
 *           or failed
 *
 * Source side handling of the Confirm phase. On success the local QEMU
 * process is stopped and a "stopped/migrated" event is queued. On failure
 * outstanding drive mirrors are cancelled and the domain is either marked
 * as failed post-copy or has its previous state restored.
 *
 * Returns 0 on success, -1 if the flags are unsupported or the incoming
 * cookie cannot be parsed.
 */
static int
qemuMigrationConfirmPhase(virQEMUDriverPtr driver,
                          virConnectPtr conn,
                          virDomainObjPtr vm,
                          const char *cookiein,
                          int cookieinlen,
                          unsigned int flags,
                          int retcode)
{
    qemuMigrationCookiePtr mig;
    virObjectEventPtr event;
    int rv = -1;
    virQEMUDriverConfigPtr cfg = NULL;
    qemuDomainObjPrivatePtr priv = vm->privateData;
    qemuDomainJobInfoPtr jobInfo = NULL;

    VIR_DEBUG("driver=%p, conn=%p, vm=%p, cookiein=%s, cookieinlen=%d, "
              "flags=0x%x, retcode=%d",
              driver, conn, vm, NULLSTR(cookiein), cookieinlen,
              flags, retcode);

    /* virCheckFlags() returns straight from this function when unsupported
     * flags are set, bypassing the cleanup label. Nothing that needs to be
     * released may therefore be acquired before this point. */
    virCheckFlags(QEMU_MIGRATION_FLAGS, -1);

    cfg = virQEMUDriverGetConfig(driver);

    qemuMigrationJobSetPhase(driver, vm,
                             retcode == 0
                             ? QEMU_MIGRATION_PHASE_CONFIRM3
                             : QEMU_MIGRATION_PHASE_CONFIRM3_CANCELLED);

    if (!(mig = qemuMigrationEatCookie(driver, vm, cookiein, cookieinlen,
                                       QEMU_MIGRATION_COOKIE_STATS)))
        goto cleanup;

    /* Statistics of a completed job are only kept for a successful
     * migration. */
    if (retcode == 0)
        jobInfo = priv->job.completed;
    else
        VIR_FREE(priv->job.completed);

    /* Update times with the values sent by the destination daemon */
    if (mig->jobInfo && jobInfo) {
        int reason;

        /* We need to refresh migration statistics after a completed post-copy
         * migration since priv->job.completed contains obsolete data from the
         * time we switched to post-copy mode.
         */
        if (virDomainObjGetState(vm, &reason) == VIR_DOMAIN_PAUSED &&
            reason == VIR_DOMAIN_PAUSED_POSTCOPY &&
            qemuMigrationFetchStats(driver, vm, QEMU_ASYNC_JOB_MIGRATION_OUT,
                                    jobInfo, NULL) < 0)
            VIR_WARN("Could not refresh migration statistics");

        qemuDomainJobInfoUpdateTime(jobInfo);
        jobInfo->timeDeltaSet = mig->jobInfo->timeDeltaSet;
        jobInfo->timeDelta = mig->jobInfo->timeDelta;
        jobInfo->stats.downtime_set = mig->jobInfo->stats.downtime_set;
        jobInfo->stats.downtime = mig->jobInfo->stats.downtime;
    }

    if (flags & VIR_MIGRATE_OFFLINE)
        goto done;

    /* Did the migration go as planned?  If yes, kill off the domain object.
     * If something failed, resume CPUs, but only if we didn't use post-copy.
     */
    if (retcode == 0) {
        /* If guest uses SPICE and supports seamless migration we have to hold
         * up domain shutdown until SPICE server transfers its data */
        qemuMigrationWaitForSpice(vm);

        qemuProcessStop(driver, vm, VIR_DOMAIN_SHUTOFF_MIGRATED,
                        QEMU_ASYNC_JOB_MIGRATION_OUT,
                        VIR_QEMU_PROCESS_STOP_MIGRATED);
        virDomainAuditStop(vm, "migrated");

        event = virDomainEventLifecycleNewFromObj(vm,
                                         VIR_DOMAIN_EVENT_STOPPED,
                                         VIR_DOMAIN_EVENT_STOPPED_MIGRATED);
        qemuDomainEventQueue(driver, event);
        qemuDomainEventEmitJobCompleted(driver, vm);
    } else {
        /* Preserve the error that made the migration fail; the drive
         * mirror cancellation below may overwrite it. */
        virErrorPtr orig_err = virSaveLastError();
        int reason;

        /* cancel any outstanding NBD jobs */
        qemuMigrationCancelDriveMirror(driver, vm, false,
                                       QEMU_ASYNC_JOB_MIGRATION_OUT, NULL);

        virSetError(orig_err);
        virFreeError(orig_err);

        if (virDomainObjGetState(vm, &reason) == VIR_DOMAIN_PAUSED &&
            reason == VIR_DOMAIN_PAUSED_POSTCOPY) {
            qemuMigrationPostcopyFailed(driver, vm);
        } else if (qemuMigrationRestoreDomainState(conn, vm)) {
            event = virDomainEventLifecycleNewFromObj(vm,
                                                      VIR_DOMAIN_EVENT_RESUMED,
                                                      VIR_DOMAIN_EVENT_RESUMED_MIGRATED);
            qemuDomainEventQueue(driver, event);
        }

        qemuMigrationReset(driver, vm, QEMU_ASYNC_JOB_MIGRATION_OUT);

        if (virDomainSaveStatus(driver->xmlopt, cfg->stateDir, vm, driver->caps) < 0)
            VIR_WARN("Failed to save status on vm %s", vm->def->name);
    }

 done:
    qemuMigrationCookieFree(mig);
    rv = 0;

 cleanup:
    virObjectUnref(cfg);
    return rv;
}

/*
 * qemuMigrationConfirm:
 * @conn: connection whose privateData is the qemu driver
 * @vm: domain object; the API reference on it is ended before returning
 * @cookiein: cookie sent back by the destination
 * @cookieinlen: length of @cookiein
 * @flags: bitwise-OR of VIR_MIGRATE_* flags
 * @cancelled: non-zero if the migration did not complete successfully
 *
 * Entry point of the Confirm phase on the source host. Requires an active
 * outgoing migration job, runs qemuMigrationConfirmPhase() and finishes
 * the job. If the domain is no longer active afterwards it is removed,
 * deleting its persistent configuration first when
 * VIR_MIGRATE_UNDEFINE_SOURCE is set.
 *
 * Returns the result of qemuMigrationConfirmPhase(), or -1 if no outgoing
 * migration job is active.
 */
int
qemuMigrationConfirm(virConnectPtr conn,
                     virDomainObjPtr vm,
                     const char *cookiein,
                     int cookieinlen,
                     unsigned int flags,
                     int cancelled)
{
    virQEMUDriverPtr driver = conn->privateData;
    qemuMigrationJobPhase phase;
    virQEMUDriverConfigPtr cfg = NULL;
    int ret = -1;

    cfg = virQEMUDriverGetConfig(driver);

    if (!qemuMigrationJobIsActive(vm, QEMU_ASYNC_JOB_MIGRATION_OUT))
        goto cleanup;

    if (cancelled)
        phase = QEMU_MIGRATION_PHASE_CONFIRM3_CANCELLED;
    else
        phase = QEMU_MIGRATION_PHASE_CONFIRM3;

    qemuMigrationJobStartPhase(driver, vm, phase);
    /* Confirm has been reached, so the connection close callback is
     * unregistered before the phase is processed. */
    virCloseCallbacksUnset(driver->closeCallbacks, vm,
                           qemuMigrationCleanup);

    ret = qemuMigrationConfirmPhase(driver, conn, vm,
                                    cookiein, cookieinlen,
                                    flags, cancelled);

    qemuMigrationJobFinish(driver, vm);
    if (!virDomainObjIsActive(vm)) {
        if (flags & VIR_MIGRATE_UNDEFINE_SOURCE) {
            virDomainDeleteConfig(cfg->configDir, cfg->autostartDir, vm);
            vm->persistent = 0;
        }
        qemuDomainRemoveInactiveJob(driver, vm);
    }

 cleanup:
    virDomainObjEndAPI(&vm);
    virObjectUnref(cfg);
    return ret;
}


3340 3341
/* How the source QEMU reaches the migration destination. */
enum qemuMigrationDestinationType {
    /* QEMU is told protocol/host/port via qemuMonitorMigrateToHost() */
    MIGRATION_DEST_HOST,
    /* libvirt opens the TCP connection itself (qemuMigrationConnect),
     * which turns the spec into MIGRATION_DEST_FD */
    MIGRATION_DEST_CONNECT_HOST,
    /* QEMU is handed a file descriptor via qemuMonitorMigrateToFd() */
    MIGRATION_DEST_FD,
};
3345

3346 3347 3348 3349
/* Whether migration data goes straight to the destination or is
 * forwarded by a tunnel thread into a virStream. */
enum qemuMigrationForwardType {
    MIGRATION_FWD_DIRECT,   /* no tunnel thread is started */
    MIGRATION_FWD_STREAM,   /* data is forwarded to fwd.stream */
};
3350

3351 3352 3353 3354 3355 3356
/* Describes where and how migration data is sent. The active member
 * of @dest is selected by @destType, the one of @fwd by @fwdType. */
typedef struct _qemuMigrationSpec qemuMigrationSpec;
typedef qemuMigrationSpec *qemuMigrationSpecPtr;
struct _qemuMigrationSpec {
    enum qemuMigrationDestinationType destType;
    union {
        /* MIGRATION_DEST_HOST and MIGRATION_DEST_CONNECT_HOST */
        struct {
            const char *protocol;
            const char *name;
            int port;
        } host;

        /* MIGRATION_DEST_FD */
        struct {
            int qemu;   /* fd passed to QEMU via the monitor */
            int local;  /* fd the tunnel thread reads from when forwarding */
        } fd;
    } dest;

    enum qemuMigrationForwardType fwdType;
    union {
        virStreamPtr stream;    /* used when fwdType is not DIRECT */
    } fwd;
};
3373 3374 3375

/* Size in bytes of the buffer the tunnel thread reads into before
 * sending the data to the stream. */
#define TUNNEL_SEND_BUF_SIZE 65536

3376 3377 3378 3379 3380 3381 3382
typedef struct _qemuMigrationIOThread qemuMigrationIOThread;
typedef qemuMigrationIOThread *qemuMigrationIOThreadPtr;
struct _qemuMigrationIOThread {
    virThread thread;
    virStreamPtr st;
    int sock;
    virError err;
3383 3384
    int wakeupRecvFD;
    int wakeupSendFD;
3385 3386 3387
};

static void qemuMigrationIOFunc(void *arg)
3388
{
3389
    qemuMigrationIOThreadPtr data = arg;
3390 3391 3392 3393 3394 3395 3396
    char *buffer = NULL;
    struct pollfd fds[2];
    int timeout = -1;
    virErrorPtr err = NULL;

    VIR_DEBUG("Running migration tunnel; stream=%p, sock=%d",
              data->st, data->sock);
3397

3398
    if (VIR_ALLOC_N(buffer, TUNNEL_SEND_BUF_SIZE) < 0)
3399
        goto abrt;
3400

3401 3402 3403
    fds[0].fd = data->sock;
    fds[1].fd = data->wakeupRecvFD;

3404
    for (;;) {
3405 3406 3407 3408 3409 3410 3411 3412 3413 3414
        int ret;

        fds[0].events = fds[1].events = POLLIN;
        fds[0].revents = fds[1].revents = 0;

        ret = poll(fds, ARRAY_CARDINALITY(fds), timeout);

        if (ret < 0) {
            if (errno == EAGAIN || errno == EINTR)
                continue;
3415
            virReportSystemError(errno, "%s",
3416 3417
                                 _("poll failed in migration tunnel"));
            goto abrt;
3418
        }
3419 3420 3421 3422 3423 3424 3425

        if (ret == 0) {
            /* We were asked to gracefully stop but reading would block. This
             * can only happen if qemu told us migration finished but didn't
             * close the migration fd. We handle this in the same way as EOF.
             */
            VIR_DEBUG("QEMU forgot to close migration fd");
3426
            break;
3427
        }
3428

3429 3430 3431 3432 3433 3434 3435 3436 3437 3438 3439 3440 3441 3442 3443 3444
        if (fds[1].revents & (POLLIN | POLLERR | POLLHUP)) {
            char stop = 0;

            if (saferead(data->wakeupRecvFD, &stop, 1) != 1) {
                virReportSystemError(errno, "%s",
                                     _("failed to read from wakeup fd"));
                goto abrt;
            }

            VIR_DEBUG("Migration tunnel was asked to %s",
                      stop ? "abort" : "finish");
            if (stop) {
                goto abrt;
            } else {
                timeout = 0;
            }
3445 3446
        }

3447 3448 3449 3450 3451 3452 3453 3454 3455 3456 3457 3458 3459 3460 3461 3462 3463
        if (fds[0].revents & (POLLIN | POLLERR | POLLHUP)) {
            int nbytes;

            nbytes = saferead(data->sock, buffer, TUNNEL_SEND_BUF_SIZE);
            if (nbytes > 0) {
                if (virStreamSend(data->st, buffer, nbytes) < 0)
                    goto error;
            } else if (nbytes < 0) {
                virReportSystemError(errno, "%s",
                        _("tunnelled migration failed to read from qemu"));
                goto abrt;
            } else {
                /* EOF; get out of here */
                break;
            }
        }
    }
3464

3465 3466
    if (virStreamFinish(data->st) < 0)
        goto error;
3467

3468
    VIR_FORCE_CLOSE(data->sock);
3469 3470
    VIR_FREE(buffer);

3471 3472
    return;

3473
 abrt:
3474 3475 3476 3477 3478 3479 3480 3481 3482 3483 3484
    err = virSaveLastError();
    if (err && err->code == VIR_ERR_OK) {
        virFreeError(err);
        err = NULL;
    }
    virStreamAbort(data->st);
    if (err) {
        virSetError(err);
        virFreeError(err);
    }

3485
 error:
3486 3487 3488 3489 3490
    /* Let the source qemu know that the transfer cant continue anymore.
     * Don't copy the error for EPIPE as destination has the actual error. */
    VIR_FORCE_CLOSE(data->sock);
    if (!virLastErrorIsSystemErrno(EPIPE))
        virCopyLastError(&data->err);
3491
    virResetLastError();
3492
    VIR_FREE(buffer);
3493 3494 3495 3496 3497 3498 3499
}


/*
 * Creates the wakeup pipe, allocates the tunnel thread state and starts
 * a thread running qemuMigrationIOFunc() which forwards data read from
 * @sock to @st.
 *
 * Returns the thread state on success; NULL on failure, in which case
 * an error is reported and both pipe ends are closed. @sock is not
 * closed by this function.
 */
static qemuMigrationIOThreadPtr
qemuMigrationStartTunnel(virStreamPtr st,
                         int sock)
{
    qemuMigrationIOThreadPtr io = NULL;
    int wakeupFD[2] = { -1, -1 };

    if (pipe2(wakeupFD, O_CLOEXEC) < 0) {
        virReportSystemError(errno, "%s",
                             _("Unable to make pipe"));
        goto error;
    }

    if (VIR_ALLOC(io) < 0)
        goto error;

    io->st = st;
    io->sock = sock;
    io->wakeupRecvFD = wakeupFD[0];
    io->wakeupSendFD = wakeupFD[1];

    if (virThreadCreate(&io->thread, true,
                        qemuMigrationIOFunc,
                        io) < 0) {
        virReportSystemError(errno, "%s",
                             _("Unable to create migration thread"));
        goto error;
    }

    return io;

 error:
    VIR_FORCE_CLOSE(wakeupFD[0]);
    VIR_FORCE_CLOSE(wakeupFD[1]);
    VIR_FREE(io);
    return NULL;
}

static int
3535
qemuMigrationStopTunnel(qemuMigrationIOThreadPtr io, bool error)
3536 3537
{
    int rv = -1;
3538 3539 3540 3541 3542 3543 3544 3545 3546
    char stop = error ? 1 : 0;

    /* make sure the thread finishes its job and is joinable */
    if (safewrite(io->wakeupSendFD, &stop, 1) != 1) {
        virReportSystemError(errno, "%s",
                             _("failed to wakeup migration tunnel"));
        goto cleanup;
    }

3547 3548 3549 3550
    virThreadJoin(&io->thread);

    /* Forward error from the IO thread, to this thread */
    if (io->err.code != VIR_ERR_OK) {
3551 3552 3553 3554
        if (error)
            rv = 0;
        else
            virSetError(&io->err);
3555 3556 3557 3558 3559 3560
        virResetError(&io->err);
        goto cleanup;
    }

    rv = 0;

3561
 cleanup:
3562 3563
    VIR_FORCE_CLOSE(io->wakeupSendFD);
    VIR_FORCE_CLOSE(io->wakeupRecvFD);
3564 3565
    VIR_FREE(io);
    return rv;
3566 3567
}

3568
static int
3569
qemuMigrationConnect(virQEMUDriverPtr driver,
3570 3571 3572 3573 3574 3575 3576 3577 3578
                     virDomainObjPtr vm,
                     qemuMigrationSpecPtr spec)
{
    virNetSocketPtr sock;
    const char *host;
    char *port = NULL;
    int ret = -1;

    host = spec->dest.host.name;
3579
    if (virAsprintf(&port, "%d", spec->dest.host.port) < 0)
3580 3581 3582 3583 3584
        return -1;

    spec->destType = MIGRATION_DEST_FD;
    spec->dest.fd.qemu = -1;

3585
    if (qemuSecuritySetSocketLabel(driver->securityManager, vm->def) < 0)
3586
        goto cleanup;
3587 3588 3589
    if (virNetSocketNewConnectTCP(host, port,
                                  AF_UNSPEC,
                                  &sock) == 0) {
3590
        spec->dest.fd.qemu = virNetSocketDupFD(sock, true);
3591
        virObjectUnref(sock);
3592
    }
3593
    if (qemuSecurityClearSocketLabel(driver->securityManager, vm->def) < 0 ||
3594 3595 3596
        spec->dest.fd.qemu == -1)
        goto cleanup;

3597 3598 3599 3600 3601 3602 3603
    /* Migration expects a blocking FD */
    if (virSetBlocking(spec->dest.fd.qemu, true) < 0) {
        virReportSystemError(errno, _("Unable to set FD %d blocking"),
                             spec->dest.fd.qemu);
        goto cleanup;
    }

3604 3605
    ret = 0;

3606
 cleanup:
3607 3608 3609 3610 3611 3612
    VIR_FREE(port);
    if (ret < 0)
        VIR_FORCE_CLOSE(spec->dest.fd.qemu);
    return ret;
}

3613 3614 3615 3616 3617 3618 3619 3620 3621 3622 3623 3624 3625 3626 3627 3628 3629 3630 3631 3632 3633 3634

/*
 * Enters the monitor for @asyncJob and calls
 * qemuMonitorMigrateContinue() with @status.
 *
 * Returns the monitor call's result, or -1 if entering or leaving the
 * monitor fails.
 */
static int
qemuMigrationContinue(virQEMUDriverPtr driver,
                      virDomainObjPtr vm,
                      qemuMonitorMigrationStatus status,
                      qemuDomainAsyncJob asyncJob)
{
    qemuDomainObjPrivatePtr priv = vm->privateData;
    int rc = -1;

    if (qemuDomainObjEnterMonitorAsync(driver, vm, asyncJob) >= 0) {
        rc = qemuMonitorMigrateContinue(priv->mon, status);

        /* A failure to leave the monitor overrides the call's result. */
        if (qemuDomainObjExitMonitor(driver, vm) < 0)
            rc = -1;
    }

    return rc;
}


3635
static int
3636
qemuMigrationRun(virQEMUDriverPtr driver,
3637
                 virDomainObjPtr vm,
3638
                 const char *persist_xml,
3639 3640 3641 3642 3643 3644
                 const char *cookiein,
                 int cookieinlen,
                 char **cookieout,
                 int *cookieoutlen,
                 unsigned long flags,
                 unsigned long resource,
3645
                 qemuMigrationSpecPtr spec,
3646
                 virConnectPtr dconn,
3647 3648
                 const char *graphicsuri,
                 size_t nmigrate_disks,
3649
                 const char **migrate_disks,
3650 3651
                 qemuMigrationCompressionPtr compression,
                 qemuMonitorMigrationParamsPtr migParams)
3652
{
3653
    int ret = -1;
3654
    unsigned int migrate_flags = QEMU_MONITOR_MIGRATE_BACKGROUND;
3655
    virQEMUDriverConfigPtr cfg = NULL;
3656
    qemuDomainObjPrivatePtr priv = vm->privateData;
3657
    qemuMigrationCookiePtr mig = NULL;
3658 3659
    char *tlsAlias = NULL;
    char *secAlias = NULL;
3660
    qemuMigrationIOThreadPtr iothread = NULL;
3661
    int fd = -1;
3662
    unsigned long migrate_speed = resource ? resource : priv->migMaxBandwidth;
3663
    virErrorPtr orig_err = NULL;
3664
    unsigned int cookieFlags = 0;
3665
    bool abort_on_error = !!(flags & VIR_MIGRATE_ABORT_ON_ERROR);
3666
    bool events = virQEMUCapsGet(priv->qemuCaps, QEMU_CAPS_MIGRATION_EVENT);
3667
    bool cancel = false;
3668
    unsigned int waitFlags;
3669
    virDomainDefPtr persistDef = NULL;
3670
    char *timestamp;
3671
    int rc;
3672 3673

    VIR_DEBUG("driver=%p, vm=%p, cookiein=%s, cookieinlen=%d, "
3674
              "cookieout=%p, cookieoutlen=%p, flags=0x%lx, resource=%lu, "
3675 3676
              "spec=%p (dest=%d, fwd=%d), dconn=%p, graphicsuri=%s, "
              "nmigrate_disks=%zu, migrate_disks=%p",
3677 3678
              driver, vm, NULLSTR(cookiein), cookieinlen,
              cookieout, cookieoutlen, flags, resource,
3679
              spec, spec->destType, spec->fwdType, dconn,
3680
              NULLSTR(graphicsuri), nmigrate_disks, migrate_disks);
3681

3682 3683 3684 3685 3686 3687 3688 3689 3690 3691
    if (flags & VIR_MIGRATE_NON_SHARED_DISK) {
        migrate_flags |= QEMU_MONITOR_MIGRATE_NON_SHARED_DISK;
        cookieFlags |= QEMU_MIGRATION_COOKIE_NBD;
    }

    if (flags & VIR_MIGRATE_NON_SHARED_INC) {
        migrate_flags |= QEMU_MONITOR_MIGRATE_NON_SHARED_INC;
        cookieFlags |= QEMU_MIGRATION_COOKIE_NBD;
    }

3692 3693
    if (virLockManagerPluginUsesState(driver->lockManager) &&
        !cookieout) {
3694 3695 3696 3697
        virReportError(VIR_ERR_INTERNAL_ERROR,
                       _("Migration with lock driver %s requires"
                         " cookie support"),
                       virLockManagerPluginGetName(driver->lockManager));
3698 3699 3700
        return -1;
    }

3701 3702 3703
    if (events)
        priv->signalIOError = abort_on_error;

3704 3705
    if (flags & VIR_MIGRATE_PERSIST_DEST) {
        if (persist_xml) {
3706 3707
            if (!(persistDef = qemuMigrationPrepareDef(driver, persist_xml,
                                                       NULL, NULL)))
3708
                goto error;
3709 3710 3711
        } else {
            virDomainDefPtr def = vm->newDef ? vm->newDef : vm->def;
            if (!(persistDef = qemuDomainDefCopy(driver, def,
3712 3713
                                                 VIR_DOMAIN_XML_SECURE |
                                                 VIR_DOMAIN_XML_MIGRATABLE)))
3714
                goto error;
3715 3716 3717
        }
    }

3718 3719 3720
    mig = qemuMigrationEatCookie(driver, vm, cookiein, cookieinlen,
                                 cookieFlags | QEMU_MIGRATION_COOKIE_GRAPHICS);
    if (!mig)
3721
        goto error;
3722

3723
    if (qemuDomainMigrateGraphicsRelocate(driver, vm, mig, graphicsuri) < 0)
3724 3725
        VIR_WARN("unable to provide data for graphics client relocation");

3726 3727 3728 3729 3730 3731 3732 3733
    if (flags & VIR_MIGRATE_TLS) {
        cfg = virQEMUDriverGetConfig(driver);

        /* Begin/CheckSetupTLS already set up migTLSAlias, the following
         * assumes that and adds the TLS objects to the domain. */
        if (qemuMigrationAddTLSObjects(driver, vm, cfg, false,
                                       QEMU_ASYNC_JOB_MIGRATION_OUT,
                                       &tlsAlias, &secAlias, migParams) < 0)
3734
            goto error;
3735 3736 3737 3738 3739 3740 3741

        /* We need to add tls-hostname whenever QEMU itself does not
         * connect directly to the destination. */
        if (spec->destType == MIGRATION_DEST_CONNECT_HOST ||
            spec->destType == MIGRATION_DEST_FD) {
            if (VIR_STRDUP(migParams->migrateTLSHostname,
                           spec->dest.host.name) < 0)
3742
                goto error;
3743 3744 3745
        } else {
            /* Be sure there's nothing from a previous migration */
            if (VIR_STRDUP(migParams->migrateTLSHostname, "") < 0)
3746
                goto error;
3747 3748 3749 3750 3751
        }
    } else {
        if (qemuMigrationSetEmptyTLSParams(driver, vm,
                                           QEMU_ASYNC_JOB_MIGRATION_OUT,
                                           migParams) < 0)
3752
            goto error;
3753 3754
    }

3755 3756 3757 3758 3759 3760 3761
    if (migrate_flags & (QEMU_MONITOR_MIGRATE_NON_SHARED_DISK |
                         QEMU_MONITOR_MIGRATE_NON_SHARED_INC)) {
        if (mig->nbd) {
            /* This will update migrate_flags on success */
            if (qemuMigrationDriveMirror(driver, vm, mig,
                                         spec->dest.host.name,
                                         migrate_speed,
3762 3763
                                         &migrate_flags,
                                         nmigrate_disks,
3764 3765
                                         migrate_disks,
                                         dconn) < 0) {
3766
                goto error;
3767 3768 3769 3770 3771 3772 3773
            }
        } else {
            /* Destination doesn't support NBD server.
             * Fall back to previous implementation. */
            VIR_DEBUG("Destination doesn't support NBD server "
                      "Falling back to previous implementation.");
        }
3774 3775
    }

3776
    /* Before EnterMonitor, since qemuMigrationSetOffline already does that */
3777 3778 3779
    if (!(flags & VIR_MIGRATE_LIVE) &&
        virDomainObjGetState(vm, NULL) == VIR_DOMAIN_RUNNING) {
        if (qemuMigrationSetOffline(driver, vm) < 0)
3780
            goto error;
3781 3782
    }

3783
    if (qemuMigrationSetCompression(driver, vm, QEMU_ASYNC_JOB_MIGRATION_OUT,
3784
                                    compression, migParams) < 0)
3785
        goto error;
3786

3787 3788 3789 3790
    if (qemuMigrationSetOption(driver, vm,
                               QEMU_MONITOR_MIGRATION_CAPS_AUTO_CONVERGE,
                               flags & VIR_MIGRATE_AUTO_CONVERGE,
                               QEMU_ASYNC_JOB_MIGRATION_OUT) < 0)
3791
        goto error;
3792

3793 3794
    if (qemuMigrationSetOption(driver, vm,
                               QEMU_MONITOR_MIGRATION_CAPS_RDMA_PIN_ALL,
3795
                               flags & VIR_MIGRATE_RDMA_PIN_ALL,
3796
                               QEMU_ASYNC_JOB_MIGRATION_OUT) < 0)
3797
        goto error;
3798

3799 3800 3801
    if (qemuMigrationSetPostCopy(driver, vm,
                                 flags & VIR_MIGRATE_POSTCOPY,
                                 QEMU_ASYNC_JOB_MIGRATION_OUT) < 0)
3802
        goto error;
3803

3804 3805 3806 3807 3808 3809
    if (qemuMigrationCapsGet(vm, QEMU_MONITOR_MIGRATION_CAPS_PAUSE_BEFORE_SWITCHOVER) &&
        qemuMigrationSetOption(driver, vm,
                               QEMU_MONITOR_MIGRATION_CAPS_PAUSE_BEFORE_SWITCHOVER,
                               true, QEMU_ASYNC_JOB_MIGRATION_OUT) < 0)
        goto error;

3810
    if (qemuMigrationSetParams(driver, vm, QEMU_ASYNC_JOB_MIGRATION_OUT,
3811
                               migParams) < 0)
3812
        goto error;
3813

3814 3815
    if (qemuDomainObjEnterMonitorAsync(driver, vm,
                                       QEMU_ASYNC_JOB_MIGRATION_OUT) < 0)
3816
        goto error;
3817

3818
    if (priv->job.abortJob) {
3819 3820
        /* explicitly do this *after* we entered the monitor,
         * as this is a critical section so we are guaranteed
3821
         * priv->job.abortJob will not change */
3822
        priv->job.current->status = QEMU_DOMAIN_JOB_STATUS_CANCELED;
3823 3824 3825
        virReportError(VIR_ERR_OPERATION_ABORTED, _("%s: %s"),
                       qemuDomainAsyncJobTypeToString(priv->job.asyncJob),
                       _("canceled by client"));
3826
        goto exit_monitor;
3827 3828
    }

3829 3830
    if (qemuMonitorSetMigrationSpeed(priv->mon, migrate_speed) < 0)
        goto exit_monitor;
3831

3832 3833
    /* connect to the destination qemu if needed */
    if (spec->destType == MIGRATION_DEST_CONNECT_HOST &&
3834
        qemuMigrationConnect(driver, vm, spec) < 0) {
3835
        goto exit_monitor;
3836
    }
3837

3838 3839 3840 3841 3842 3843
    /* log start of migration */
    if ((timestamp = virTimeStringNow()) != NULL) {
        qemuDomainLogAppendMessage(driver, vm, "%s: initiating migration\n", timestamp);
        VIR_FREE(timestamp);
    }

3844
    rc = -1;
3845 3846
    switch (spec->destType) {
    case MIGRATION_DEST_HOST:
M
Michael R. Hines 已提交
3847 3848
        if (STREQ(spec->dest.host.protocol, "rdma") &&
            virProcessSetMaxMemLock(vm->pid, vm->def->mem.hard_limit << 10) < 0) {
3849
            goto exit_monitor;
M
Michael R. Hines 已提交
3850
        }
3851 3852 3853 3854
        rc = qemuMonitorMigrateToHost(priv->mon, migrate_flags,
                                      spec->dest.host.protocol,
                                      spec->dest.host.name,
                                      spec->dest.host.port);
3855 3856
        break;

3857 3858 3859 3860
    case MIGRATION_DEST_CONNECT_HOST:
        /* handled above and transformed into MIGRATION_DEST_FD */
        break;

3861
    case MIGRATION_DEST_FD:
3862
        if (spec->fwdType != MIGRATION_FWD_DIRECT) {
3863
            fd = spec->dest.fd.local;
3864 3865
            spec->dest.fd.local = -1;
        }
3866 3867
        rc = qemuMonitorMigrateToFd(priv->mon, migrate_flags,
                                    spec->dest.fd.qemu);
3868 3869
        VIR_FORCE_CLOSE(spec->dest.fd.qemu);
        break;
3870
    }
3871 3872

    if (qemuDomainObjExitMonitor(driver, vm) < 0 || rc < 0)
3873
        goto error;
3874 3875 3876

    /* From this point onwards we *must* call cancel to abort the
     * migration on source if anything goes wrong */
3877
    cancel = true;
3878

3879 3880
    if (spec->fwdType != MIGRATION_FWD_DIRECT) {
        if (!(iothread = qemuMigrationStartTunnel(spec->fwd.stream, fd)))
3881
            goto error;
3882 3883 3884 3885 3886
        /* If we've created a tunnel, then the 'fd' will be closed in the
         * qemuMigrationIOFunc as data->sock.
         */
        fd = -1;
    }
3887

3888
    waitFlags = QEMU_MIGRATION_COMPLETED_PRE_SWITCHOVER;
3889 3890 3891 3892 3893 3894 3895
    if (abort_on_error)
        waitFlags |= QEMU_MIGRATION_COMPLETED_ABORT_ON_ERROR;
    if (mig->nbd)
        waitFlags |= QEMU_MIGRATION_COMPLETED_CHECK_STORAGE;
    if (flags & VIR_MIGRATE_POSTCOPY)
        waitFlags |= QEMU_MIGRATION_COMPLETED_POSTCOPY;

3896 3897
    rc = qemuMigrationWaitForCompletion(driver, vm,
                                        QEMU_ASYNC_JOB_MIGRATION_OUT,
3898
                                        dconn, waitFlags);
3899
    if (rc == -2) {
3900
        goto error;
3901 3902 3903 3904 3905
    } else if (rc == -1) {
        /* QEMU reported failed migration, nothing to cancel anymore */
        cancel = false;
        goto error;
    }
3906

3907 3908 3909
    /* When migration completed, QEMU will have paused the CPUs for us.
     * Wait for the STOP event to be processed or explicitly stop CPUs
     * (for old QEMU which does not send events) to release the lock state.
3910
     */
3911 3912 3913 3914 3915
    if (priv->monJSON) {
        while (virDomainObjGetState(vm, NULL) == VIR_DOMAIN_RUNNING) {
            priv->signalStop = true;
            rc = virDomainObjWait(vm);
            priv->signalStop = false;
3916
            if (rc < 0)
3917
                goto error;
3918
        }
3919 3920
    } else if (virDomainObjGetState(vm, NULL) == VIR_DOMAIN_RUNNING &&
               qemuMigrationSetOffline(driver, vm) < 0) {
3921
        goto error;
3922
    }
3923 3924 3925 3926 3927

    if (mig && mig->nbd &&
        qemuMigrationCancelDriveMirror(driver, vm, true,
                                       QEMU_ASYNC_JOB_MIGRATION_OUT,
                                       dconn) < 0)
3928
        goto error;
3929

3930 3931 3932 3933 3934 3935 3936 3937 3938 3939 3940 3941 3942 3943 3944 3945 3946 3947 3948 3949 3950 3951 3952 3953
    /* When migration was paused before serializing device state we need to
     * resume it now once we finished all block jobs and wait for the real
     * end of the migration.
     */
    if (priv->job.current->status == QEMU_DOMAIN_JOB_STATUS_PAUSED) {
        if (qemuMigrationContinue(driver, vm,
                                  QEMU_MONITOR_MIGRATION_STATUS_PRE_SWITCHOVER,
                                  QEMU_ASYNC_JOB_MIGRATION_OUT) < 0)
            goto error;

        waitFlags ^= QEMU_MIGRATION_COMPLETED_PRE_SWITCHOVER;

        rc = qemuMigrationWaitForCompletion(driver, vm,
                                            QEMU_ASYNC_JOB_MIGRATION_OUT,
                                            dconn, waitFlags);
        if (rc == -2) {
            goto error;
        } else if (rc == -1) {
            /* QEMU reported failed migration, nothing to cancel anymore */
            cancel = false;
            goto error;
        }
    }

3954 3955 3956 3957 3958
    if (iothread) {
        qemuMigrationIOThreadPtr io;

        VIR_STEAL_PTR(io, iothread);
        if (qemuMigrationStopTunnel(io, false) < 0)
3959
            goto error;
3960 3961 3962
    }

    if (priv->job.completed) {
3963
        priv->job.completed->stopped = priv->job.current->stopped;
3964 3965 3966 3967 3968 3969 3970 3971 3972 3973 3974 3975 3976
        qemuDomainJobInfoUpdateTime(priv->job.completed);
        qemuDomainJobInfoUpdateDowntime(priv->job.completed);
        ignore_value(virTimeMillisNow(&priv->job.completed->sent));
    }

    cookieFlags |= QEMU_MIGRATION_COOKIE_NETWORK |
                   QEMU_MIGRATION_COOKIE_STATS;

    if (qemuMigrationCookieAddPersistent(mig, &persistDef) < 0 ||
        qemuMigrationBakeCookie(mig, driver, vm, cookieout,
                                cookieoutlen, cookieFlags) < 0) {
        VIR_WARN("Unable to encode migration cookie");
    }
3977

3978
    ret = 0;
3979

3980
 cleanup:
3981 3982 3983
    VIR_FREE(tlsAlias);
    VIR_FREE(secAlias);
    virObjectUnref(cfg);
3984
    VIR_FORCE_CLOSE(fd);
3985
    virDomainDefFree(persistDef);
3986 3987
    qemuMigrationCookieFree(mig);

3988 3989 3990
    if (events)
        priv->signalIOError = false;

3991 3992 3993 3994 3995
    if (orig_err) {
        virSetError(orig_err);
        virFreeError(orig_err);
    }

3996 3997
    return ret;

3998
 error:
3999 4000 4001 4002 4003 4004 4005 4006 4007 4008
    orig_err = virSaveLastError();

    if (cancel &&
        priv->job.current->status != QEMU_DOMAIN_JOB_STATUS_QEMU_COMPLETED &&
        virDomainObjIsActive(vm) &&
        qemuDomainObjEnterMonitorAsync(driver, vm,
                                       QEMU_ASYNC_JOB_MIGRATION_OUT) == 0) {
        qemuMonitorMigrateCancel(priv->mon);
        ignore_value(qemuDomainObjExitMonitor(driver, vm));
    }
4009 4010 4011 4012 4013 4014 4015 4016 4017 4018

    /* cancel any outstanding NBD jobs */
    if (mig && mig->nbd)
        qemuMigrationCancelDriveMirror(driver, vm, false,
                                       QEMU_ASYNC_JOB_MIGRATION_OUT,
                                       dconn);

    if (iothread)
        qemuMigrationStopTunnel(iothread, true);

4019
    if (priv->job.current->status != QEMU_DOMAIN_JOB_STATUS_CANCELED)
4020 4021 4022 4023
        priv->job.current->status = QEMU_DOMAIN_JOB_STATUS_FAILED;

    goto cleanup;

4024 4025
 exit_monitor:
    ignore_value(qemuDomainObjExitMonitor(driver, vm));
4026
    goto error;
4027 4028
}

4029
/* Perform migration using QEMU's native migrate support,
4030 4031
 * not encrypted obviously
 */
4032
static int doNativeMigrate(virQEMUDriverPtr driver,
4033
                           virDomainObjPtr vm,
4034
                           const char *persist_xml,
4035 4036 4037 4038 4039 4040
                           const char *uri,
                           const char *cookiein,
                           int cookieinlen,
                           char **cookieout,
                           int *cookieoutlen,
                           unsigned long flags,
4041
                           unsigned long resource,
4042
                           virConnectPtr dconn,
4043 4044
                           const char *graphicsuri,
                           size_t nmigrate_disks,
4045
                           const char **migrate_disks,
4046 4047
                           qemuMigrationCompressionPtr compression,
                           qemuMonitorMigrationParamsPtr migParams)
4048
{
4049
    qemuDomainObjPrivatePtr priv = vm->privateData;
M
Martin Kletzander 已提交
4050
    virURIPtr uribits = NULL;
4051
    int ret = -1;
4052 4053 4054
    qemuMigrationSpec spec;

    VIR_DEBUG("driver=%p, vm=%p, uri=%s, cookiein=%s, cookieinlen=%d, "
4055
              "cookieout=%p, cookieoutlen=%p, flags=0x%lx, resource=%lu, "
4056
              "graphicsuri=%s, nmigrate_disks=%zu migrate_disks=%p",
4057
              driver, vm, uri, NULLSTR(cookiein), cookieinlen,
4058
              cookieout, cookieoutlen, flags, resource,
4059
              NULLSTR(graphicsuri), nmigrate_disks, migrate_disks);
4060

4061
    if (!(uribits = qemuMigrationParseURI(uri, NULL)))
4062 4063
        return -1;

4064 4065 4066 4067 4068 4069 4070
    if (uribits->scheme == NULL) {
        virReportError(VIR_ERR_INTERNAL_ERROR,
                       _("missing scheme in migration URI: %s"),
                       uri);
        goto cleanup;
    }

M
Michael R. Hines 已提交
4071 4072 4073 4074 4075
    if (STREQ(uribits->scheme, "rdma")) {
        if (!virQEMUCapsGet(priv->qemuCaps, QEMU_CAPS_MIGRATE_RDMA)) {
            virReportError(VIR_ERR_OPERATION_UNSUPPORTED, "%s",
                           _("outgoing RDMA migration is not supported "
                             "with this QEMU binary"));
4076
            goto cleanup;
M
Michael R. Hines 已提交
4077
        }
4078
        if (!virMemoryLimitIsSet(vm->def->mem.hard_limit)) {
M
Michael R. Hines 已提交
4079 4080 4081
            virReportError(VIR_ERR_OPERATION_INVALID, "%s",
                           _("cannot start RDMA migration with no memory hard "
                             "limit set"));
4082
            goto cleanup;
M
Michael R. Hines 已提交
4083 4084 4085
        }
    }

4086
    if (STRNEQ(uribits->scheme, "rdma"))
4087 4088
        spec.destType = MIGRATION_DEST_CONNECT_HOST;
    else
4089
        spec.destType = MIGRATION_DEST_HOST;
4090
    spec.dest.host.protocol = uribits->scheme;
4091 4092 4093
    spec.dest.host.name = uribits->server;
    spec.dest.host.port = uribits->port;
    spec.fwdType = MIGRATION_FWD_DIRECT;
4094

4095
    ret = qemuMigrationRun(driver, vm, persist_xml, cookiein, cookieinlen, cookieout,
4096
                           cookieoutlen, flags, resource, &spec, dconn,
4097
                           graphicsuri, nmigrate_disks, migrate_disks,
4098
                           compression, migParams);
4099 4100 4101 4102

    if (spec.destType == MIGRATION_DEST_FD)
        VIR_FORCE_CLOSE(spec.dest.fd.qemu);

4103
 cleanup:
4104
    virURIFree(uribits);
4105 4106 4107 4108 4109

    return ret;
}


4110
static int doTunnelMigrate(virQEMUDriverPtr driver,
4111 4112
                           virDomainObjPtr vm,
                           virStreamPtr st,
4113
                           const char *persist_xml,
4114 4115 4116 4117 4118
                           const char *cookiein,
                           int cookieinlen,
                           char **cookieout,
                           int *cookieoutlen,
                           unsigned long flags,
4119
                           unsigned long resource,
4120
                           virConnectPtr dconn,
4121 4122
                           const char *graphicsuri,
                           size_t nmigrate_disks,
4123
                           const char **migrate_disks,
4124 4125
                           qemuMigrationCompressionPtr compression,
                           qemuMonitorMigrationParamsPtr migParams)
4126 4127 4128
{
    int ret = -1;
    qemuMigrationSpec spec;
4129
    virQEMUDriverConfigPtr cfg = virQEMUDriverGetConfig(driver);
4130
    int fds[2] = { -1, -1 };
4131 4132

    VIR_DEBUG("driver=%p, vm=%p, st=%p, cookiein=%s, cookieinlen=%d, "
4133
              "cookieout=%p, cookieoutlen=%p, flags=0x%lx, resource=%lu, "
4134
              "graphicsuri=%s, nmigrate_disks=%zu, migrate_disks=%p",
4135
              driver, vm, st, NULLSTR(cookiein), cookieinlen,
4136
              cookieout, cookieoutlen, flags, resource,
4137
              NULLSTR(graphicsuri), nmigrate_disks, migrate_disks);
4138 4139 4140 4141

    spec.fwdType = MIGRATION_FWD_STREAM;
    spec.fwd.stream = st;

4142

4143 4144 4145
    spec.destType = MIGRATION_DEST_FD;
    spec.dest.fd.qemu = -1;
    spec.dest.fd.local = -1;
4146

4147 4148 4149 4150 4151
    if (pipe2(fds, O_CLOEXEC) == 0) {
        spec.dest.fd.qemu = fds[1];
        spec.dest.fd.local = fds[0];
    }
    if (spec.dest.fd.qemu == -1 ||
4152 4153
        qemuSecuritySetImageFDLabel(driver->securityManager, vm->def,
                                    spec.dest.fd.qemu) < 0) {
4154 4155 4156
        virReportSystemError(errno, "%s",
                             _("cannot create pipe for tunnelled migration"));
        goto cleanup;
4157 4158
    }

4159 4160 4161
    ret = qemuMigrationRun(driver, vm, persist_xml, cookiein, cookieinlen,
                           cookieout, cookieoutlen, flags, resource, &spec,
                           dconn, graphicsuri, nmigrate_disks, migrate_disks,
4162
                           compression, migParams);
4163

4164
 cleanup:
4165 4166
    VIR_FORCE_CLOSE(spec.dest.fd.qemu);
    VIR_FORCE_CLOSE(spec.dest.fd.local);
4167

4168
    virObjectUnref(cfg);
4169 4170 4171 4172
    return ret;
}


4173 4174 4175 4176
/* This is essentially a re-impl of virDomainMigrateVersion2
 * from libvirt.c, but running in source libvirtd context,
 * instead of client app context & also adding in tunnel
 * handling */
4177
static int doPeer2PeerMigrate2(virQEMUDriverPtr driver,
4178
                               virConnectPtr sconn ATTRIBUTE_UNUSED,
4179 4180
                               virConnectPtr dconn,
                               virDomainObjPtr vm,
4181
                               const char *dconnuri,
4182 4183 4184
                               unsigned long flags,
                               const char *dname,
                               unsigned long resource)
4185 4186 4187
{
    virDomainPtr ddomain = NULL;
    char *uri_out = NULL;
4188
    char *cookie = NULL;
4189 4190 4191
    char *dom_xml = NULL;
    int cookielen = 0, ret;
    virErrorPtr orig_err = NULL;
4192
    bool cancelled;
4193
    virStreamPtr st = NULL;
4194
    unsigned long destflags;
4195
    qemuMigrationCompressionPtr compression = NULL;
4196
    qemuMonitorMigrationParams migParams = { 0 };
4197

4198
    VIR_DEBUG("driver=%p, sconn=%p, dconn=%p, vm=%p, dconnuri=%s, "
4199
              "flags=0x%lx, dname=%s, resource=%lu",
4200 4201
              driver, sconn, dconn, vm, NULLSTR(dconnuri),
              flags, NULLSTR(dname), resource);
4202

4203 4204 4205 4206 4207
    /* In version 2 of the protocol, the prepare step is slightly
     * different.  We fetch the domain XML of the source domain
     * and pass it to Prepare2.
     */
    if (!(dom_xml = qemuDomainFormatXML(driver, vm,
4208 4209
                                        QEMU_DOMAIN_FORMAT_LIVE_FLAGS |
                                        VIR_DOMAIN_XML_MIGRATABLE)))
4210 4211 4212 4213 4214
        return -1;

    if (virDomainObjGetState(vm, NULL) == VIR_DOMAIN_PAUSED)
        flags |= VIR_MIGRATE_PAUSED;

4215 4216
    destflags = flags & ~(VIR_MIGRATE_ABORT_ON_ERROR |
                          VIR_MIGRATE_AUTO_CONVERGE);
4217

4218 4219 4220
    if (!(compression = qemuMigrationCompressionParse(NULL, 0, flags)))
        goto cleanup;

4221 4222 4223 4224 4225 4226 4227 4228 4229 4230
    VIR_DEBUG("Prepare2 %p", dconn);
    if (flags & VIR_MIGRATE_TUNNELLED) {
        /*
         * Tunnelled Migrate Version 2 does not support cookies
         * due to missing parameters in the prepareTunnel() API.
         */

        if (!(st = virStreamNew(dconn, 0)))
            goto cleanup;

4231
        qemuDomainObjEnterRemote(vm);
4232
        ret = dconn->driver->domainMigratePrepareTunnel
4233
            (dconn, st, destflags, dname, resource, dom_xml);
4234
        qemuDomainObjExitRemote(vm);
4235
    } else {
4236
        qemuDomainObjEnterRemote(vm);
4237 4238
        ret = dconn->driver->domainMigratePrepare2
            (dconn, &cookie, &cookielen, NULL, &uri_out,
4239
             destflags, dname, resource, dom_xml);
4240
        qemuDomainObjExitRemote(vm);
4241 4242 4243
    }
    VIR_FREE(dom_xml);
    if (ret == -1)
4244 4245 4246
        goto cleanup;

    /* the domain may have shutdown or crashed while we had the locks dropped
4247
     * in qemuDomainObjEnterRemote, so check again
4248 4249
     */
    if (!virDomainObjIsActive(vm)) {
4250 4251
        virReportError(VIR_ERR_INTERNAL_ERROR, "%s",
                       _("guest unexpectedly quit"));
4252 4253 4254
        goto cleanup;
    }

4255 4256
    if (!(flags & VIR_MIGRATE_TUNNELLED) &&
        (uri_out == NULL)) {
4257 4258
        virReportError(VIR_ERR_INTERNAL_ERROR, "%s",
                       _("domainMigratePrepare2 did not set uri"));
4259
        cancelled = true;
4260
        orig_err = virSaveLastError();
4261
        goto finish;
4262 4263
    }

4264 4265 4266 4267
    /* Perform the migration.  The driver isn't supposed to return
     * until the migration is complete.
     */
    VIR_DEBUG("Perform %p", sconn);
4268
    qemuMigrationJobSetPhase(driver, vm, QEMU_MIGRATION_PHASE_PERFORM2);
4269
    if (flags & VIR_MIGRATE_TUNNELLED)
4270
        ret = doTunnelMigrate(driver, vm, st, NULL,
4271
                              NULL, 0, NULL, NULL,
4272
                              flags, resource, dconn,
4273
                              NULL, 0, NULL, compression, &migParams);
4274
    else
4275
        ret = doNativeMigrate(driver, vm, NULL, uri_out,
4276 4277
                              cookie, cookielen,
                              NULL, NULL, /* No out cookie with v2 migration */
4278 4279
                              flags, resource, dconn, NULL, 0, NULL,
                              compression, &migParams);
4280 4281 4282 4283

    /* Perform failed. Make sure Finish doesn't overwrite the error */
    if (ret < 0)
        orig_err = virSaveLastError();
4284

4285 4286 4287
    /* If Perform returns < 0, then we need to cancel the VM
     * startup on the destination
     */
4288
    cancelled = ret < 0;
4289

4290
 finish:
4291 4292 4293 4294
    /* In version 2 of the migration protocol, we pass the
     * status code from the sender to the destination host,
     * so it can do any cleanup if the migration failed.
     */
4295
    dname = dname ? dname : vm->def->name;
4296
    VIR_DEBUG("Finish2 %p ret=%d", dconn, ret);
4297
    qemuDomainObjEnterRemote(vm);
4298
    ddomain = dconn->driver->domainMigrateFinish2
4299
        (dconn, dname, cookie, cookielen,
4300
         uri_out ? uri_out : dconnuri, destflags, cancelled);
4301
    qemuDomainObjExitRemote(vm);
4302 4303
    if (cancelled && ddomain)
        VIR_ERROR(_("finish step ignored that migration was cancelled"));
4304

4305
 cleanup:
4306
    if (ddomain) {
4307
        virObjectUnref(ddomain);
4308 4309 4310 4311
        ret = 0;
    } else {
        ret = -1;
    }
4312

4313
    virObjectUnref(st);
4314 4315 4316 4317 4318

    if (orig_err) {
        virSetError(orig_err);
        virFreeError(orig_err);
    }
4319
    qemuMigrationParamsClear(&migParams);
4320
    VIR_FREE(uri_out);
4321
    VIR_FREE(cookie);
4322
    VIR_FREE(compression);
4323 4324

    return ret;
4325 4326 4327
}


4328 4329 4330 4331
/* This is essentially a re-impl of virDomainMigrateVersion3
 * from libvirt.c, but running in source libvirtd context,
 * instead of client app context & also adding in tunnel
 * handling */
4332 4333 4334 4335 4336 4337 4338
static int
doPeer2PeerMigrate3(virQEMUDriverPtr driver,
                    virConnectPtr sconn,
                    virConnectPtr dconn,
                    const char *dconnuri,
                    virDomainObjPtr vm,
                    const char *xmlin,
4339
                    const char *persist_xml,
4340 4341
                    const char *dname,
                    const char *uri,
4342
                    const char *graphicsuri,
4343
                    const char *listenAddress,
4344 4345
                    size_t nmigrate_disks,
                    const char **migrate_disks,
4346
                    int nbdPort,
4347
                    qemuMigrationCompressionPtr compression,
4348
                    qemuMonitorMigrationParamsPtr migParams,
4349 4350 4351
                    unsigned long long bandwidth,
                    bool useParams,
                    unsigned long flags)
4352 4353 4354 4355 4356 4357 4358 4359 4360 4361
{
    virDomainPtr ddomain = NULL;
    char *uri_out = NULL;
    char *cookiein = NULL;
    char *cookieout = NULL;
    char *dom_xml = NULL;
    int cookieinlen = 0;
    int cookieoutlen = 0;
    int ret = -1;
    virErrorPtr orig_err = NULL;
4362
    bool cancelled = true;
4363
    virStreamPtr st = NULL;
4364
    unsigned long destflags;
4365 4366 4367
    virTypedParameterPtr params = NULL;
    int nparams = 0;
    int maxparams = 0;
4368
    size_t i;
4369 4370

    VIR_DEBUG("driver=%p, sconn=%p, dconn=%p, dconnuri=%s, vm=%p, xmlin=%s, "
4371
              "dname=%s, uri=%s, graphicsuri=%s, listenAddress=%s, "
4372
              "nmigrate_disks=%zu, migrate_disks=%p, nbdPort=%d, "
4373
              "bandwidth=%llu, useParams=%d, flags=0x%lx",
4374
              driver, sconn, dconn, NULLSTR(dconnuri), vm, NULLSTR(xmlin),
4375
              NULLSTR(dname), NULLSTR(uri), NULLSTR(graphicsuri),
4376
              NULLSTR(listenAddress), nmigrate_disks, migrate_disks, nbdPort,
4377
              bandwidth, useParams, flags);
4378

4379 4380 4381 4382 4383
    /* Unlike the virDomainMigrateVersion3 counterpart, we don't need
     * to worry about auto-setting the VIR_MIGRATE_CHANGE_PROTECTION
     * bit here, because we are already running inside the context of
     * a single job.  */

4384
    dom_xml = qemuMigrationBeginPhase(driver, vm, xmlin, dname,
4385 4386
                                      &cookieout, &cookieoutlen,
                                      nmigrate_disks, migrate_disks, flags);
4387 4388 4389
    if (!dom_xml)
        goto cleanup;

4390 4391 4392 4393 4394 4395 4396 4397 4398 4399 4400 4401 4402 4403 4404 4405 4406 4407 4408 4409
    if (useParams) {
        if (virTypedParamsAddString(&params, &nparams, &maxparams,
                                    VIR_MIGRATE_PARAM_DEST_XML, dom_xml) < 0)
            goto cleanup;

        if (dname &&
            virTypedParamsAddString(&params, &nparams, &maxparams,
                                    VIR_MIGRATE_PARAM_DEST_NAME, dname) < 0)
            goto cleanup;

        if (uri &&
            virTypedParamsAddString(&params, &nparams, &maxparams,
                                    VIR_MIGRATE_PARAM_URI, uri) < 0)
            goto cleanup;

        if (bandwidth &&
            virTypedParamsAddULLong(&params, &nparams, &maxparams,
                                    VIR_MIGRATE_PARAM_BANDWIDTH,
                                    bandwidth) < 0)
            goto cleanup;
4410 4411 4412 4413 4414 4415

        if (graphicsuri &&
            virTypedParamsAddString(&params, &nparams, &maxparams,
                                    VIR_MIGRATE_PARAM_GRAPHICS_URI,
                                    graphicsuri) < 0)
            goto cleanup;
4416 4417 4418 4419 4420
        if (listenAddress &&
            virTypedParamsAddString(&params, &nparams, &maxparams,
                                    VIR_MIGRATE_PARAM_LISTEN_ADDRESS,
                                    listenAddress) < 0)
            goto cleanup;
4421 4422 4423 4424 4425
        for (i = 0; i < nmigrate_disks; i++)
            if (virTypedParamsAddString(&params, &nparams, &maxparams,
                                        VIR_MIGRATE_PARAM_MIGRATE_DISKS,
                                        migrate_disks[i]) < 0)
                goto cleanup;
4426 4427 4428 4429 4430
        if (nbdPort &&
            virTypedParamsAddInt(&params, &nparams, &maxparams,
                                 VIR_MIGRATE_PARAM_DISKS_PORT,
                                 nbdPort) < 0)
            goto cleanup;
4431 4432 4433 4434

        if (qemuMigrationCompressionDump(compression, &params, &nparams,
                                         &maxparams, &flags) < 0)
            goto cleanup;
4435 4436
    }

4437 4438 4439
    if (virDomainObjGetState(vm, NULL) == VIR_DOMAIN_PAUSED)
        flags |= VIR_MIGRATE_PAUSED;

4440 4441
    destflags = flags & ~(VIR_MIGRATE_ABORT_ON_ERROR |
                          VIR_MIGRATE_AUTO_CONVERGE);
4442

4443 4444 4445 4446 4447 4448 4449 4450 4451
    VIR_DEBUG("Prepare3 %p", dconn);
    cookiein = cookieout;
    cookieinlen = cookieoutlen;
    cookieout = NULL;
    cookieoutlen = 0;
    if (flags & VIR_MIGRATE_TUNNELLED) {
        if (!(st = virStreamNew(dconn, 0)))
            goto cleanup;

4452
        qemuDomainObjEnterRemote(vm);
4453 4454 4455 4456 4457 4458 4459 4460 4461
        if (useParams) {
            ret = dconn->driver->domainMigratePrepareTunnel3Params
                (dconn, st, params, nparams, cookiein, cookieinlen,
                 &cookieout, &cookieoutlen, destflags);
        } else {
            ret = dconn->driver->domainMigratePrepareTunnel3
                (dconn, st, cookiein, cookieinlen, &cookieout, &cookieoutlen,
                 destflags, dname, bandwidth, dom_xml);
        }
4462
        qemuDomainObjExitRemote(vm);
4463
    } else {
4464
        qemuDomainObjEnterRemote(vm);
4465 4466 4467 4468 4469 4470 4471 4472 4473
        if (useParams) {
            ret = dconn->driver->domainMigratePrepare3Params
                (dconn, params, nparams, cookiein, cookieinlen,
                 &cookieout, &cookieoutlen, &uri_out, destflags);
        } else {
            ret = dconn->driver->domainMigratePrepare3
                (dconn, cookiein, cookieinlen, &cookieout, &cookieoutlen,
                 uri, &uri_out, destflags, dname, bandwidth, dom_xml);
        }
4474
        qemuDomainObjExitRemote(vm);
4475 4476 4477 4478 4479
    }
    VIR_FREE(dom_xml);
    if (ret == -1)
        goto cleanup;

L
liguang 已提交
4480 4481 4482 4483
    if (flags & VIR_MIGRATE_OFFLINE) {
        VIR_DEBUG("Offline migration, skipping Perform phase");
        VIR_FREE(cookieout);
        cookieoutlen = 0;
4484
        cancelled = false;
L
liguang 已提交
4485 4486 4487
        goto finish;
    }

4488 4489 4490 4491
    if (uri_out) {
        uri = uri_out;
        if (useParams &&
            virTypedParamsReplaceString(&params, &nparams,
4492 4493
                                        VIR_MIGRATE_PARAM_URI, uri_out) < 0) {
            orig_err = virSaveLastError();
4494
            goto finish;
4495
        }
4496
    } else if (!uri && !(flags & VIR_MIGRATE_TUNNELLED)) {
4497 4498
        virReportError(VIR_ERR_INTERNAL_ERROR, "%s",
                       _("domainMigratePrepare3 did not set uri"));
4499
        orig_err = virSaveLastError();
4500 4501 4502 4503 4504 4505 4506 4507
        goto finish;
    }

    /* Perform the migration.  The driver isn't supposed to return
     * until the migration is complete. The src VM should remain
     * running, but in paused state until the destination can
     * confirm migration completion.
     */
4508
    VIR_DEBUG("Perform3 %p uri=%s", sconn, NULLSTR(uri));
4509
    qemuMigrationJobSetPhase(driver, vm, QEMU_MIGRATION_PHASE_PERFORM3);
4510 4511 4512 4513 4514
    VIR_FREE(cookiein);
    cookiein = cookieout;
    cookieinlen = cookieoutlen;
    cookieout = NULL;
    cookieoutlen = 0;
4515
    if (flags & VIR_MIGRATE_TUNNELLED) {
4516
        ret = doTunnelMigrate(driver, vm, st, persist_xml,
4517 4518
                              cookiein, cookieinlen,
                              &cookieout, &cookieoutlen,
4519
                              flags, bandwidth, dconn, graphicsuri,
4520 4521
                              nmigrate_disks, migrate_disks, compression,
                              migParams);
4522
    } else {
4523
        ret = doNativeMigrate(driver, vm, persist_xml, uri,
4524 4525
                              cookiein, cookieinlen,
                              &cookieout, &cookieoutlen,
4526
                              flags, bandwidth, dconn, graphicsuri,
4527 4528
                              nmigrate_disks, migrate_disks, compression,
                              migParams);
4529
    }
4530 4531

    /* Perform failed. Make sure Finish doesn't overwrite the error */
4532
    if (ret < 0) {
4533
        orig_err = virSaveLastError();
4534 4535 4536 4537
    } else {
        qemuMigrationJobSetPhase(driver, vm,
                                 QEMU_MIGRATION_PHASE_PERFORM3_DONE);
    }
4538 4539 4540 4541

    /* If Perform returns < 0, then we need to cancel the VM
     * startup on the destination
     */
4542
    cancelled = ret < 0;
4543

4544
 finish:
4545 4546 4547 4548 4549 4550 4551 4552 4553 4554 4555 4556
    /*
     * The status code from the source is passed to the destination.
     * The dest can cleanup in the source indicated it failed to
     * send all migration data. Returns NULL for ddomain if
     * the dest was unable to complete migration.
     */
    VIR_DEBUG("Finish3 %p ret=%d", dconn, ret);
    VIR_FREE(cookiein);
    cookiein = cookieout;
    cookieinlen = cookieoutlen;
    cookieout = NULL;
    cookieoutlen = 0;
4557 4558 4559 4560 4561 4562 4563 4564 4565 4566 4567 4568 4569 4570 4571 4572 4573 4574 4575 4576 4577 4578 4579

    if (useParams) {
        if (virTypedParamsGetString(params, nparams,
                                    VIR_MIGRATE_PARAM_DEST_NAME, NULL) <= 0 &&
            virTypedParamsReplaceString(&params, &nparams,
                                        VIR_MIGRATE_PARAM_DEST_NAME,
                                        vm->def->name) < 0) {
            ddomain = NULL;
        } else {
            qemuDomainObjEnterRemote(vm);
            ddomain = dconn->driver->domainMigrateFinish3Params
                (dconn, params, nparams, cookiein, cookieinlen,
                 &cookieout, &cookieoutlen, destflags, cancelled);
            qemuDomainObjExitRemote(vm);
        }
    } else {
        dname = dname ? dname : vm->def->name;
        qemuDomainObjEnterRemote(vm);
        ddomain = dconn->driver->domainMigrateFinish3
            (dconn, dname, cookiein, cookieinlen, &cookieout, &cookieoutlen,
             dconnuri, uri, destflags, cancelled);
        qemuDomainObjExitRemote(vm);
    }
4580 4581 4582 4583 4584 4585 4586 4587 4588 4589 4590 4591 4592 4593 4594 4595 4596 4597 4598 4599

    if (cancelled) {
        if (ddomain) {
            VIR_ERROR(_("finish step ignored that migration was cancelled"));
        } else {
            /* If Finish reported a useful error, use it instead of the
             * original "migration unexpectedly failed" error.
             *
             * This is ugly but we can't do better with the APIs we have. We
             * only replace the error if Finish was called with cancelled == 1
             * and reported a real error (old libvirt would report an error
             * from RPC instead of MIGRATE_FINISH_OK), which only happens when
             * the domain died on destination. To further reduce a possibility
             * of false positives we also check that Perform returned
             * VIR_ERR_OPERATION_FAILED.
             */
            if (orig_err &&
                orig_err->domain == VIR_FROM_QEMU &&
                orig_err->code == VIR_ERR_OPERATION_FAILED) {
                virErrorPtr err = virGetLastError();
4600 4601
                if (err &&
                    err->domain == VIR_FROM_QEMU &&
4602 4603 4604 4605 4606 4607 4608
                    err->code != VIR_ERR_MIGRATE_FINISH_OK) {
                    virFreeError(orig_err);
                    orig_err = NULL;
                }
            }
        }
    }
4609

4610 4611 4612 4613 4614 4615 4616
    /* If ddomain is NULL, then we were unable to start
     * the guest on the target, and must restart on the
     * source. There is a small chance that the ddomain
     * is NULL due to an RPC failure, in which case
     * ddomain could in fact be running on the dest.
     * The lock manager plugins should take care of
     * safety in this scenario.
4617
     */
4618
    cancelled = ddomain == NULL;
4619

4620 4621 4622 4623 4624 4625
    /* If finish3 set an error, and we don't have an earlier
     * one we need to preserve it in case confirm3 overwrites
     */
    if (!orig_err)
        orig_err = virSaveLastError();

4626 4627 4628 4629
    /*
     * If cancelled, then src VM will be restarted, else
     * it will be killed
     */
4630
    VIR_DEBUG("Confirm3 %p cancelled=%d vm=%p", sconn, cancelled, vm);
4631 4632 4633 4634 4635
    VIR_FREE(cookiein);
    cookiein = cookieout;
    cookieinlen = cookieoutlen;
    cookieout = NULL;
    cookieoutlen = 0;
4636 4637 4638
    ret = qemuMigrationConfirmPhase(driver, sconn, vm,
                                    cookiein, cookieinlen,
                                    flags, cancelled);
4639 4640 4641 4642
    /* If Confirm3 returns -1, there's nothing more we can
     * do, but fortunately worst case is that there is a
     * domain left in 'paused' state on source.
     */
4643 4644 4645
    if (ret < 0)
        VIR_WARN("Guest %s probably left in 'paused' state on source",
                 vm->def->name);
4646 4647 4648

 cleanup:
    if (ddomain) {
4649
        virObjectUnref(ddomain);
4650 4651 4652 4653 4654
        ret = 0;
    } else {
        ret = -1;
    }

4655
    virObjectUnref(st);
4656 4657 4658 4659 4660 4661 4662 4663

    if (orig_err) {
        virSetError(orig_err);
        virFreeError(orig_err);
    }
    VIR_FREE(uri_out);
    VIR_FREE(cookiein);
    VIR_FREE(cookieout);
4664
    virTypedParamsFree(params, nparams);
4665 4666 4667 4668
    return ret;
}


4669 4670 4671 4672 4673 4674 4675 4676 4677 4678 4679 4680
/* Close callback for the destination connection (see its registration
 * in doPeer2PeerMigrate): logs the event and broadcasts on the domain
 * object passed as @opaque. */
static void
qemuMigrationConnectionClosed(virConnectPtr conn,
                              int reason,
                              void *opaque)
{
    virDomainObjPtr dom = opaque;

    VIR_DEBUG("conn=%p, reason=%d, vm=%s", conn, reason, dom->def->name);

    virDomainObjBroadcast(dom);
}


4681 4682 4683 4684 4685 4686 4687 4688 4689 4690 4691 4692
static int virConnectCredType[] = {
    VIR_CRED_AUTHNAME,
    VIR_CRED_PASSPHRASE,
};


static virConnectAuth virConnectAuthConfig = {
    .credtype = virConnectCredType,
    .ncredtype = ARRAY_CARDINALITY(virConnectCredType),
};


4693
static int doPeer2PeerMigrate(virQEMUDriverPtr driver,
4694
                              virConnectPtr sconn,
4695
                              virDomainObjPtr vm,
4696
                              const char *xmlin,
4697
                              const char *persist_xml,
4698
                              const char *dconnuri,
4699
                              const char *uri,
4700
                              const char *graphicsuri,
4701
                              const char *listenAddress,
4702 4703
                              size_t nmigrate_disks,
                              const char **migrate_disks,
4704
                              int nbdPort,
4705
                              qemuMigrationCompressionPtr compression,
4706
                              qemuMonitorMigrationParamsPtr migParams,
4707 4708
                              unsigned long flags,
                              const char *dname,
4709 4710
                              unsigned long resource,
                              bool *v3proto)
4711 4712 4713 4714
{
    int ret = -1;
    virConnectPtr dconn = NULL;
    bool p2p;
4715
    virErrorPtr orig_err = NULL;
4716
    bool offline = false;
4717
    virQEMUDriverConfigPtr cfg = virQEMUDriverGetConfig(driver);
4718
    bool useParams;
4719

4720 4721
    VIR_DEBUG("driver=%p, sconn=%p, vm=%p, xmlin=%s, dconnuri=%s, uri=%s, "
              "graphicsuri=%s, listenAddress=%s, nmigrate_disks=%zu, "
4722
              "migrate_disks=%p, nbdPort=%d, flags=0x%lx, dname=%s, "
4723
              "resource=%lu",
4724
              driver, sconn, vm, NULLSTR(xmlin), NULLSTR(dconnuri),
4725
              NULLSTR(uri), NULLSTR(graphicsuri), NULLSTR(listenAddress),
4726 4727
              nmigrate_disks, migrate_disks, nbdPort, flags, NULLSTR(dname),
              resource);
4728

4729 4730 4731 4732 4733 4734 4735 4736 4737 4738 4739 4740 4741 4742
    if (flags & VIR_MIGRATE_TUNNELLED && uri) {
        virReportError(VIR_ERR_ARGUMENT_UNSUPPORTED, "%s",
                       _("migration URI is not supported by tunnelled "
                         "migration"));
        goto cleanup;
    }

    if (flags & VIR_MIGRATE_TUNNELLED && listenAddress) {
        virReportError(VIR_ERR_ARGUMENT_UNSUPPORTED, "%s",
                       _("listen address is not supported by tunnelled "
                         "migration"));
        goto cleanup;
    }

4743 4744 4745 4746 4747 4748 4749
    if (flags & VIR_MIGRATE_TUNNELLED && nbdPort) {
        virReportError(VIR_ERR_ARGUMENT_UNSUPPORTED, "%s",
                       _("disk port address is not supported by tunnelled "
                         "migration"));
        goto cleanup;
    }

4750 4751 4752 4753
    /* the order of operations is important here; we make sure the
     * destination side is completely setup before we touch the source
     */

4754
    qemuDomainObjEnterRemote(vm);
4755
    dconn = virConnectOpenAuth(dconnuri, &virConnectAuthConfig, 0);
4756
    qemuDomainObjExitRemote(vm);
4757
    if (dconn == NULL) {
4758
        virReportError(VIR_ERR_OPERATION_FAILED,
4759 4760
                       _("Failed to connect to remote libvirt URI %s: %s"),
                       dconnuri, virGetLastErrorMessage());
4761
        virObjectUnref(cfg);
4762 4763 4764
        return -1;
    }

4765 4766
    if (virConnectSetKeepAlive(dconn, cfg->keepAliveInterval,
                               cfg->keepAliveCount) < 0)
4767 4768
        goto cleanup;

4769 4770 4771 4772 4773
    if (virConnectRegisterCloseCallback(dconn, qemuMigrationConnectionClosed,
                                        vm, NULL) < 0) {
        goto cleanup;
    }

4774
    qemuDomainObjEnterRemote(vm);
4775 4776
    p2p = VIR_DRV_SUPPORTS_FEATURE(dconn->driver, dconn,
                                   VIR_DRV_FEATURE_MIGRATION_P2P);
4777
        /* v3proto reflects whether the caller used Perform3, but with
4778
         * p2p migrate, regardless of whether Perform2 or Perform3
4779 4780 4781 4782
         * were used, we decide protocol based on what target supports
         */
    *v3proto = VIR_DRV_SUPPORTS_FEATURE(dconn->driver, dconn,
                                        VIR_DRV_FEATURE_MIGRATION_V3);
4783 4784
    useParams = VIR_DRV_SUPPORTS_FEATURE(dconn->driver, dconn,
                                         VIR_DRV_FEATURE_MIGRATION_PARAMS);
L
liguang 已提交
4785 4786 4787
    if (flags & VIR_MIGRATE_OFFLINE)
        offline = VIR_DRV_SUPPORTS_FEATURE(dconn->driver, dconn,
                                           VIR_DRV_FEATURE_MIGRATION_OFFLINE);
4788
    qemuDomainObjExitRemote(vm);
4789

4790
    if (!p2p) {
4791 4792
        virReportError(VIR_ERR_OPERATION_FAILED, "%s",
                       _("Destination libvirt does not support peer-to-peer migration protocol"));
4793 4794 4795
        goto cleanup;
    }

4796 4797
    /* Only xmlin, dname, uri, and bandwidth parameters can be used with
     * old-style APIs. */
4798
    if (!useParams && (graphicsuri || listenAddress || nmigrate_disks)) {
4799 4800 4801 4802 4803 4804
        virReportError(VIR_ERR_ARGUMENT_UNSUPPORTED, "%s",
                       _("Migration APIs with extensible parameters are not "
                         "supported but extended parameters were passed"));
        goto cleanup;
    }

L
liguang 已提交
4805 4806 4807 4808 4809 4810 4811
    if (flags & VIR_MIGRATE_OFFLINE && !offline) {
        virReportError(VIR_ERR_ARGUMENT_UNSUPPORTED, "%s",
                       _("offline migration is not supported by "
                         "the destination host"));
        goto cleanup;
    }

4812
    /* domain may have been stopped while we were talking to remote daemon */
L
liguang 已提交
4813
    if (!virDomainObjIsActive(vm) && !(flags & VIR_MIGRATE_OFFLINE)) {
4814 4815
        virReportError(VIR_ERR_INTERNAL_ERROR, "%s",
                       _("guest unexpectedly quit"));
4816 4817 4818
        goto cleanup;
    }

4819 4820 4821 4822 4823 4824 4825
    /* Change protection is only required on the source side (us), and
     * only for v3 migration when begin and perform are separate jobs.
     * But peer-2-peer is already a single job, and we still want to
     * talk to older destinations that would reject the flag.
     * Therefore it is safe to clear the bit here.  */
    flags &= ~VIR_MIGRATE_CHANGE_PROTECTION;

4826 4827
    if (*v3proto) {
        ret = doPeer2PeerMigrate3(driver, sconn, dconn, dconnuri, vm, xmlin,
4828 4829
                                  persist_xml, dname, uri, graphicsuri,
                                  listenAddress, nmigrate_disks, migrate_disks,
4830 4831
                                  nbdPort, compression, migParams, resource,
                                  useParams, flags);
4832
    } else {
4833
        ret = doPeer2PeerMigrate2(driver, sconn, dconn, vm,
4834
                                  dconnuri, flags, dname, resource);
4835
    }
4836

4837
 cleanup:
4838
    orig_err = virSaveLastError();
4839
    qemuDomainObjEnterRemote(vm);
4840
    virConnectUnregisterCloseCallback(dconn, qemuMigrationConnectionClosed);
4841
    virObjectUnref(dconn);
4842
    qemuDomainObjExitRemote(vm);
4843 4844 4845 4846
    if (orig_err) {
        virSetError(orig_err);
        virFreeError(orig_err);
    }
4847
    virObjectUnref(cfg);
4848 4849 4850 4851
    return ret;
}


4852 4853 4854 4855 4856 4857
/*
 * This implements perform part of the migration protocol when migration job
 * does not need to be active across several APIs, i.e., peer2peer migration or
 * perform phase of v2 non-peer2peer migration.
 */
static int
4858
qemuMigrationPerformJob(virQEMUDriverPtr driver,
4859 4860 4861
                        virConnectPtr conn,
                        virDomainObjPtr vm,
                        const char *xmlin,
4862
                        const char *persist_xml,
4863 4864
                        const char *dconnuri,
                        const char *uri,
4865
                        const char *graphicsuri,
4866
                        const char *listenAddress,
4867 4868
                        size_t nmigrate_disks,
                        const char **migrate_disks,
4869
                        int nbdPort,
4870
                        qemuMigrationCompressionPtr compression,
4871
                        qemuMonitorMigrationParamsPtr migParams,
4872
                        const char *cookiein,
4873 4874 4875 4876 4877 4878 4879
                        int cookieinlen,
                        char **cookieout,
                        int *cookieoutlen,
                        unsigned long flags,
                        const char *dname,
                        unsigned long resource,
                        bool v3proto)
4880
{
4881
    virObjectEventPtr event = NULL;
4882
    int ret = -1;
4883
    virErrorPtr orig_err = NULL;
4884
    virQEMUDriverConfigPtr cfg = virQEMUDriverGetConfig(driver);
4885

4886
    if (qemuMigrationJobStart(driver, vm, QEMU_ASYNC_JOB_MIGRATION_OUT) < 0)
4887 4888
        goto cleanup;

L
liguang 已提交
4889
    if (!virDomainObjIsActive(vm) && !(flags & VIR_MIGRATE_OFFLINE)) {
4890 4891
        virReportError(VIR_ERR_OPERATION_INVALID,
                       "%s", _("domain is not running"));
4892 4893 4894
        goto endjob;
    }

4895
    if (!qemuMigrationIsAllowed(driver, vm, true, flags))
4896
        goto endjob;
4897

4898
    if (!(flags & (VIR_MIGRATE_UNSAFE | VIR_MIGRATE_OFFLINE)) &&
4899
        !qemuMigrationIsSafe(vm->def, nmigrate_disks, migrate_disks, flags))
4900
        goto endjob;
4901

4902
    qemuMigrationStoreDomainState(vm);
4903 4904

    if ((flags & (VIR_MIGRATE_TUNNELLED | VIR_MIGRATE_PEER2PEER))) {
4905
        ret = doPeer2PeerMigrate(driver, conn, vm, xmlin, persist_xml,
4906
                                 dconnuri, uri, graphicsuri, listenAddress,
4907
                                 nmigrate_disks, migrate_disks, nbdPort,
4908 4909
                                 compression, migParams, flags, dname, resource,
                                 &v3proto);
4910
    } else {
4911
        qemuMigrationJobSetPhase(driver, vm, QEMU_MIGRATION_PHASE_PERFORM2);
4912
        ret = doNativeMigrate(driver, vm, persist_xml, uri, cookiein, cookieinlen,
4913
                              cookieout, cookieoutlen,
4914
                              flags, resource, NULL, NULL, 0, NULL,
4915
                              compression, migParams);
4916
    }
4917 4918
    if (ret < 0)
        goto endjob;
4919

4920 4921 4922 4923
    /*
     * In v3 protocol, the source VM is not killed off until the
     * confirm step.
     */
4924
    if (!v3proto) {
4925
        qemuProcessStop(driver, vm, VIR_DOMAIN_SHUTOFF_MIGRATED,
4926
                        QEMU_ASYNC_JOB_MIGRATION_OUT,
4927
                        VIR_QEMU_PROCESS_STOP_MIGRATED);
4928
        virDomainAuditStop(vm, "migrated");
4929
        event = virDomainEventLifecycleNewFromObj(vm,
4930 4931
                                         VIR_DOMAIN_EVENT_STOPPED,
                                         VIR_DOMAIN_EVENT_STOPPED_MIGRATED);
4932 4933
    }

4934
 endjob:
4935 4936 4937
    if (ret < 0)
        orig_err = virSaveLastError();

4938 4939 4940 4941
    /* v2 proto has no confirm phase so we need to reset migration parameters
     * here
     */
    if (!v3proto && ret < 0)
4942
        qemuMigrationReset(driver, vm, QEMU_ASYNC_JOB_MIGRATION_OUT);
4943

4944
    if (qemuMigrationRestoreDomainState(conn, vm)) {
4945
        event = virDomainEventLifecycleNewFromObj(vm,
4946 4947 4948
                                         VIR_DOMAIN_EVENT_RESUMED,
                                         VIR_DOMAIN_EVENT_RESUMED_MIGRATED);
    }
4949

4950
    qemuMigrationJobFinish(driver, vm);
4951
    if (!virDomainObjIsActive(vm) && ret == 0) {
4952
        if (flags & VIR_MIGRATE_UNDEFINE_SOURCE) {
4953
            virDomainDeleteConfig(cfg->configDir, cfg->autostartDir, vm);
4954 4955
            vm->persistent = 0;
        }
4956
        qemuDomainRemoveInactiveJob(driver, vm);
4957 4958
    }

4959 4960 4961 4962 4963
    if (orig_err) {
        virSetError(orig_err);
        virFreeError(orig_err);
    }

4964
 cleanup:
M
Michal Privoznik 已提交
4965
    virDomainObjEndAPI(&vm);
4966
    qemuDomainEventQueue(driver, event);
4967
    virObjectUnref(cfg);
4968 4969 4970 4971 4972 4973 4974
    return ret;
}

/*
 * This implements perform phase of v3 migration protocol.
 */
static int
4975
qemuMigrationPerformPhase(virQEMUDriverPtr driver,
4976 4977
                          virConnectPtr conn,
                          virDomainObjPtr vm,
4978
                          const char *persist_xml,
4979
                          const char *uri,
4980
                          const char *graphicsuri,
4981 4982
                          size_t nmigrate_disks,
                          const char **migrate_disks,
4983
                          qemuMigrationCompressionPtr compression,
4984
                          qemuMonitorMigrationParamsPtr migParams,
4985 4986 4987 4988 4989 4990 4991
                          const char *cookiein,
                          int cookieinlen,
                          char **cookieout,
                          int *cookieoutlen,
                          unsigned long flags,
                          unsigned long resource)
{
4992
    virObjectEventPtr event = NULL;
4993 4994 4995 4996 4997 4998 4999 5000 5001 5002 5003
    int ret = -1;

    /* If we didn't start the job in the begin phase, start it now. */
    if (!(flags & VIR_MIGRATE_CHANGE_PROTECTION)) {
        if (qemuMigrationJobStart(driver, vm, QEMU_ASYNC_JOB_MIGRATION_OUT) < 0)
            goto cleanup;
    } else if (!qemuMigrationJobIsActive(vm, QEMU_ASYNC_JOB_MIGRATION_OUT)) {
        goto cleanup;
    }

    qemuMigrationJobStartPhase(driver, vm, QEMU_MIGRATION_PHASE_PERFORM3);
5004 5005
    virCloseCallbacksUnset(driver->closeCallbacks, vm,
                           qemuMigrationCleanup);
5006

5007
    ret = doNativeMigrate(driver, vm, persist_xml, uri, cookiein, cookieinlen,
5008
                          cookieout, cookieoutlen,
5009
                          flags, resource, NULL, graphicsuri,
5010
                          nmigrate_disks, migrate_disks, compression, migParams);
5011

5012 5013 5014 5015 5016
    if (ret < 0) {
        if (qemuMigrationRestoreDomainState(conn, vm)) {
            event = virDomainEventLifecycleNewFromObj(vm,
                                                      VIR_DOMAIN_EVENT_RESUMED,
                                                      VIR_DOMAIN_EVENT_RESUMED_MIGRATED);
5017
        }
5018
        goto endjob;
5019
    }
5020 5021 5022

    qemuMigrationJobSetPhase(driver, vm, QEMU_MIGRATION_PHASE_PERFORM3_DONE);

5023 5024
    if (virCloseCallbacksSet(driver->closeCallbacks, vm, conn,
                             qemuMigrationCleanup) < 0)
5025 5026
        goto endjob;

5027
 endjob:
5028 5029
    if (ret < 0) {
        qemuMigrationReset(driver, vm, QEMU_ASYNC_JOB_MIGRATION_OUT);
5030
        qemuMigrationJobFinish(driver, vm);
5031
    } else {
5032
        qemuMigrationJobContinue(vm);
5033 5034
    }

5035
    if (!virDomainObjIsActive(vm))
5036
        qemuDomainRemoveInactiveJob(driver, vm);
5037

5038
 cleanup:
M
Michal Privoznik 已提交
5039
    virDomainObjEndAPI(&vm);
5040
    qemuDomainEventQueue(driver, event);
5041 5042 5043
    return ret;
}

5044
int
5045
qemuMigrationPerform(virQEMUDriverPtr driver,
5046 5047 5048
                     virConnectPtr conn,
                     virDomainObjPtr vm,
                     const char *xmlin,
5049
                     const char *persist_xml,
5050 5051
                     const char *dconnuri,
                     const char *uri,
5052
                     const char *graphicsuri,
5053
                     const char *listenAddress,
5054 5055
                     size_t nmigrate_disks,
                     const char **migrate_disks,
5056
                     int nbdPort,
5057
                     qemuMigrationCompressionPtr compression,
5058
                     qemuMonitorMigrationParamsPtr migParams,
5059 5060 5061 5062 5063 5064 5065 5066 5067 5068
                     const char *cookiein,
                     int cookieinlen,
                     char **cookieout,
                     int *cookieoutlen,
                     unsigned long flags,
                     const char *dname,
                     unsigned long resource,
                     bool v3proto)
{
    VIR_DEBUG("driver=%p, conn=%p, vm=%p, xmlin=%s, dconnuri=%s, "
5069
              "uri=%s, graphicsuri=%s, listenAddress=%s, "
5070
              "nmigrate_disks=%zu, migrate_disks=%p, nbdPort=%d, "
5071
              "cookiein=%s, cookieinlen=%d, cookieout=%p, cookieoutlen=%p, "
5072
              "flags=0x%lx, dname=%s, resource=%lu, v3proto=%d",
5073
              driver, conn, vm, NULLSTR(xmlin), NULLSTR(dconnuri),
5074
              NULLSTR(uri), NULLSTR(graphicsuri), NULLSTR(listenAddress),
5075 5076 5077
              nmigrate_disks, migrate_disks, nbdPort,
              NULLSTR(cookiein), cookieinlen, cookieout, cookieoutlen,
              flags, NULLSTR(dname), resource, v3proto);
5078 5079 5080

    if ((flags & (VIR_MIGRATE_TUNNELLED | VIR_MIGRATE_PEER2PEER))) {
        if (cookieinlen) {
5081 5082
            virReportError(VIR_ERR_OPERATION_INVALID,
                           "%s", _("received unexpected cookie with P2P migration"));
5083 5084 5085
            return -1;
        }

5086
        return qemuMigrationPerformJob(driver, conn, vm, xmlin, persist_xml, dconnuri, uri,
5087
                                       graphicsuri, listenAddress,
5088
                                       nmigrate_disks, migrate_disks, nbdPort,
5089 5090
                                       compression, migParams,
                                       cookiein, cookieinlen,
5091 5092
                                       cookieout, cookieoutlen,
                                       flags, dname, resource, v3proto);
5093 5094
    } else {
        if (dconnuri) {
5095 5096
            virReportError(VIR_ERR_INTERNAL_ERROR,
                           "%s", _("Unexpected dconnuri parameter with non-peer2peer migration"));
5097 5098 5099 5100
            return -1;
        }

        if (v3proto) {
5101
            return qemuMigrationPerformPhase(driver, conn, vm, persist_xml, uri,
5102
                                             graphicsuri,
5103
                                             nmigrate_disks, migrate_disks,
5104 5105
                                             compression, migParams,
                                             cookiein, cookieinlen,
5106
                                             cookieout, cookieoutlen,
5107
                                             flags, resource);
5108
        } else {
5109
            return qemuMigrationPerformJob(driver, conn, vm, xmlin, persist_xml, NULL,
5110
                                           uri, graphicsuri, listenAddress,
5111
                                           nmigrate_disks, migrate_disks, nbdPort,
5112 5113
                                           compression, migParams,
                                           cookiein, cookieinlen,
5114 5115 5116 5117 5118
                                           cookieout, cookieoutlen, flags,
                                           dname, resource, v3proto);
        }
    }
}
5119

5120
static int
5121 5122
qemuMigrationVPAssociatePortProfiles(virDomainDefPtr def)
{
5123
    size_t i;
5124 5125 5126 5127 5128
    int last_good_net = -1;
    virDomainNetDefPtr net;

    for (i = 0; i < def->nnets; i++) {
        net = def->nets[i];
5129
        if (virDomainNetGetActualType(net) == VIR_DOMAIN_NET_TYPE_DIRECT) {
5130
            if (virNetDevVPortProfileAssociate(net->ifname,
5131
                                               virDomainNetGetActualVirtPortProfile(net),
5132
                                               &net->mac,
5133
                                               virDomainNetGetActualDirectDev(net),
5134
                                               -1,
5135
                                               def->uuid,
5136 5137
                                               VIR_NETDEV_VPORT_PROFILE_OP_MIGRATE_IN_FINISH,
                                               false) < 0) {
5138 5139 5140
                virReportError(VIR_ERR_OPERATION_FAILED,
                               _("Port profile Associate failed for %s"),
                               net->ifname);
5141
                goto err_exit;
5142
            }
5143
            last_good_net = i;
5144
            VIR_DEBUG("Port profile Associate succeeded for %s", net->ifname);
5145

5146
            if (virNetDevMacVLanVPortProfileRegisterCallback(net->ifname, &net->mac,
5147 5148 5149 5150
                                                             virDomainNetGetActualDirectDev(net), def->uuid,
                                                             virDomainNetGetActualVirtPortProfile(net),
                                                             VIR_NETDEV_VPORT_PROFILE_OP_CREATE))
                goto err_exit;
5151 5152 5153
        }
    }

5154
    return 0;
5155

5156
 err_exit:
5157
    for (i = 0; last_good_net != -1 && i <= last_good_net; i++) {
5158
        net = def->nets[i];
5159
        if (virDomainNetGetActualType(net) == VIR_DOMAIN_NET_TYPE_DIRECT) {
5160
            ignore_value(virNetDevVPortProfileDisassociate(net->ifname,
5161
                                                           virDomainNetGetActualVirtPortProfile(net),
5162
                                                           &net->mac,
5163
                                                           virDomainNetGetActualDirectDev(net),
5164
                                                           -1,
5165
                                                           VIR_NETDEV_VPORT_PROFILE_OP_MIGRATE_IN_FINISH));
5166 5167
        }
    }
5168
    return -1;
5169 5170 5171
}


J
Jiri Denemark 已提交
5172 5173 5174
static int
qemuMigrationPersist(virQEMUDriverPtr driver,
                     virDomainObjPtr vm,
5175 5176
                     qemuMigrationCookiePtr mig,
                     bool ignoreSaveError)
J
Jiri Denemark 已提交
5177 5178 5179 5180
{
    virQEMUDriverConfigPtr cfg = virQEMUDriverGetConfig(driver);
    virCapsPtr caps = NULL;
    virDomainDefPtr vmdef;
5181 5182
    virDomainDefPtr oldDef = NULL;
    unsigned int oldPersist = vm->persistent;
J
Jiri Denemark 已提交
5183 5184 5185 5186 5187 5188 5189
    virObjectEventPtr event;
    int ret = -1;

    if (!(caps = virQEMUDriverGetCapabilities(driver, false)))
        goto cleanup;

    vm->persistent = 1;
5190 5191
    oldDef = vm->newDef;
    vm->newDef = qemuMigrationCookieGetPersistent(mig);
J
Jiri Denemark 已提交
5192

5193 5194
    if (!(vmdef = virDomainObjGetPersistentDef(caps, driver->xmlopt, vm)))
        goto error;
J
Jiri Denemark 已提交
5195

5196 5197
    if (virDomainSaveConfig(cfg->configDir, driver->caps, vmdef) < 0 &&
        !ignoreSaveError)
5198
        goto error;
J
Jiri Denemark 已提交
5199 5200 5201

    event = virDomainEventLifecycleNewFromObj(vm,
                                              VIR_DOMAIN_EVENT_DEFINED,
5202 5203 5204
                                              oldPersist ?
                                              VIR_DOMAIN_EVENT_DEFINED_UPDATED :
                                              VIR_DOMAIN_EVENT_DEFINED_ADDED);
5205
    qemuDomainEventQueue(driver, event);
J
Jiri Denemark 已提交
5206 5207 5208 5209

    ret = 0;

 cleanup:
5210
    virDomainDefFree(oldDef);
J
Jiri Denemark 已提交
5211 5212 5213
    virObjectUnref(caps);
    virObjectUnref(cfg);
    return ret;
5214 5215 5216 5217 5218 5219 5220

 error:
    virDomainDefFree(vm->newDef);
    vm->persistent = oldPersist;
    vm->newDef = oldDef;
    oldDef = NULL;
    goto cleanup;
J
Jiri Denemark 已提交
5221 5222 5223
}


5224
virDomainPtr
5225
qemuMigrationFinish(virQEMUDriverPtr driver,
5226 5227
                    virConnectPtr dconn,
                    virDomainObjPtr vm,
5228 5229 5230 5231
                    const char *cookiein,
                    int cookieinlen,
                    char **cookieout,
                    int *cookieoutlen,
5232
                    unsigned long flags,
5233 5234
                    int retcode,
                    bool v3proto)
5235 5236
{
    virDomainPtr dom = NULL;
5237
    qemuMigrationCookiePtr mig = NULL;
5238
    virErrorPtr orig_err = NULL;
5239
    int cookie_flags = 0;
J
Jiri Denemark 已提交
5240
    qemuDomainObjPrivatePtr priv = vm->privateData;
5241
    virQEMUDriverConfigPtr cfg = virQEMUDriverGetConfig(driver);
5242
    unsigned short port;
5243 5244
    unsigned long long timeReceived = 0;
    virObjectEventPtr event;
5245
    qemuDomainJobInfoPtr jobInfo = NULL;
5246
    bool inPostCopy = false;
5247
    bool doKill = true;
5248

5249
    VIR_DEBUG("driver=%p, dconn=%p, vm=%p, cookiein=%s, cookieinlen=%d, "
5250
              "cookieout=%p, cookieoutlen=%p, flags=0x%lx, retcode=%d",
5251 5252
              driver, dconn, vm, NULLSTR(cookiein), cookieinlen,
              cookieout, cookieoutlen, flags, retcode);
5253

5254 5255 5256
    port = priv->migrationPort;
    priv->migrationPort = 0;

5257 5258
    if (!qemuMigrationJobIsActive(vm, QEMU_ASYNC_JOB_MIGRATION_IN)) {
        qemuMigrationErrorReport(driver, vm->def->name);
5259
        goto cleanup;
5260
    }
5261

5262 5263
    ignore_value(virTimeMillisNow(&timeReceived));

5264 5265 5266
    qemuMigrationJobStartPhase(driver, vm,
                               v3proto ? QEMU_MIGRATION_PHASE_FINISH3
                                       : QEMU_MIGRATION_PHASE_FINISH2);
5267

5268
    qemuDomainCleanupRemove(vm, qemuMigrationPrepareCleanup);
5269
    VIR_FREE(priv->job.completed);
5270

5271
    cookie_flags = QEMU_MIGRATION_COOKIE_NETWORK |
5272 5273
                   QEMU_MIGRATION_COOKIE_STATS |
                   QEMU_MIGRATION_COOKIE_NBD;
5274 5275 5276
    /* Some older versions of libvirt always send persistent XML in the cookie
     * even though VIR_MIGRATE_PERSIST_DEST was not used. */
    cookie_flags |= QEMU_MIGRATION_COOKIE_PERSISTENT;
5277 5278 5279

    if (!(mig = qemuMigrationEatCookie(driver, vm, cookiein,
                                       cookieinlen, cookie_flags)))
5280
        goto endjob;
5281

5282
    if (flags & VIR_MIGRATE_OFFLINE) {
5283 5284
        if (retcode == 0 &&
            qemuMigrationPersist(driver, vm, mig, false) == 0)
5285
            dom = virGetDomain(dconn, vm->def->name, vm->def->uuid, -1);
5286 5287
        goto endjob;
    }
5288

5289 5290 5291 5292
    if (retcode != 0) {
        /* Check for a possible error on the monitor in case Finish was called
         * earlier than monitor EOF handler got a chance to process the error
         */
5293
        qemuDomainCheckMonitor(driver, vm, QEMU_ASYNC_JOB_MIGRATION_IN);
5294 5295
        goto endjob;
    }
5296

5297 5298 5299 5300 5301 5302
    if (!virDomainObjIsActive(vm)) {
        virReportError(VIR_ERR_INTERNAL_ERROR, "%s",
                       _("guest unexpectedly quit"));
        qemuMigrationErrorReport(driver, vm->def->name);
        goto endjob;
    }
5303

5304 5305
    if (qemuMigrationVPAssociatePortProfiles(vm->def) < 0)
        goto endjob;
5306

5307 5308
    if (mig->network && qemuDomainMigrateOPDRelocate(driver, vm, mig) < 0)
        VIR_WARN("unable to provide network data for relocation");
5309

5310 5311
    if (qemuMigrationStopNBDServer(driver, vm, mig) < 0)
        goto endjob;
5312

5313 5314
    if (qemuRefreshVirtioChannelState(driver, vm,
                                      QEMU_ASYNC_JOB_MIGRATION_IN) < 0)
5315 5316
        goto endjob;

5317 5318
    if (qemuConnectAgent(driver, vm) < 0)
        goto endjob;
5319

5320 5321 5322 5323 5324 5325 5326 5327 5328 5329 5330 5331 5332
    if (flags & VIR_MIGRATE_PERSIST_DEST) {
        if (qemuMigrationPersist(driver, vm, mig, !v3proto) < 0) {
            /* Hmpf.  Migration was successful, but making it persistent
             * was not.  If we report successful, then when this domain
             * shuts down, management tools are in for a surprise.  On the
             * other hand, if we report failure, then the management tools
             * might try to restart the domain on the source side, even
             * though the domain is actually running on the destination.
             * Pretend success and hope that this is a rare situation and
             * management tools are smart.
             *
             * However, in v3 protocol, the source VM is still available
             * to restart during confirm() step, so we kill it off now.
5333 5334 5335
             */
            if (v3proto)
                goto endjob;
5336
        }
5337
    }
5338

5339 5340 5341 5342
    /* We need to wait for QEMU to process all data sent by the source
     * before starting guest CPUs.
     */
    if (qemuMigrationWaitForDestCompletion(driver, vm,
5343 5344
                                           QEMU_ASYNC_JOB_MIGRATION_IN,
                                           !!(flags & VIR_MIGRATE_POSTCOPY)) < 0) {
5345 5346 5347 5348 5349 5350
        /* There's not much we can do for v2 protocol since the
         * original domain on the source host is already gone.
         */
        if (v3proto)
            goto endjob;
    }
5351

5352
    if (priv->job.current->status == QEMU_DOMAIN_JOB_STATUS_POSTCOPY)
5353 5354
        inPostCopy = true;

5355 5356 5357 5358 5359 5360
    if (!(flags & VIR_MIGRATE_PAUSED)) {
        /* run 'cont' on the destination, which allows migration on qemu
         * >= 0.10.6 to work properly.  This isn't strictly necessary on
         * older qemu's, but it also doesn't hurt anything there
         */
        if (qemuProcessStartCPUs(driver, vm, dconn,
5361 5362
                                 inPostCopy ? VIR_DOMAIN_RUNNING_POSTCOPY
                                            : VIR_DOMAIN_RUNNING_MIGRATED,
5363 5364 5365 5366 5367 5368 5369 5370
                                 QEMU_ASYNC_JOB_MIGRATION_IN) < 0) {
            if (virGetLastError() == NULL)
                virReportError(VIR_ERR_INTERNAL_ERROR,
                               "%s", _("resume operation failed"));
            /* Need to save the current error, in case shutting
             * down the process overwrites it
             */
            orig_err = virSaveLastError();
5371

5372 5373 5374 5375 5376 5377 5378 5379 5380 5381
            /*
             * In v3 protocol, the source VM is still available to
             * restart during confirm() step, so we kill it off
             * now.
             * In v2 protocol, the source is dead, so we leave
             * target in paused state, in case admin can fix
             * things up.
             */
            if (v3proto)
                goto endjob;
5382
        }
5383 5384

        if (inPostCopy) {
5385
            doKill = false;
5386 5387 5388 5389 5390
            event = virDomainEventLifecycleNewFromObj(vm,
                                        VIR_DOMAIN_EVENT_RESUMED,
                                        VIR_DOMAIN_EVENT_RESUMED_POSTCOPY);
            qemuDomainEventQueue(driver, event);
        }
5391
    }
5392

5393
    if (mig->jobInfo) {
5394
        jobInfo = mig->jobInfo;
5395 5396 5397 5398 5399 5400
        mig->jobInfo = NULL;

        if (jobInfo->sent && timeReceived) {
            jobInfo->timeDelta = timeReceived - jobInfo->sent;
            jobInfo->received = timeReceived;
            jobInfo->timeDeltaSet = true;
5401
        }
5402 5403
        qemuDomainJobInfoUpdateTime(jobInfo);
        qemuDomainJobInfoUpdateDowntime(jobInfo);
5404
    }
L
liguang 已提交
5405

5406 5407 5408 5409 5410 5411 5412 5413 5414 5415 5416 5417 5418
    if (inPostCopy) {
        if (qemuMigrationWaitForDestCompletion(driver, vm,
                                               QEMU_ASYNC_JOB_MIGRATION_IN,
                                               false) < 0) {
            goto endjob;
        }
        if (virDomainObjGetState(vm, NULL) == VIR_DOMAIN_RUNNING) {
            virDomainObjSetState(vm,
                                 VIR_DOMAIN_RUNNING,
                                 VIR_DOMAIN_RUNNING_MIGRATED);
        }
    }

5419
    dom = virGetDomain(dconn, vm->def->name, vm->def->uuid, vm->def->id);
5420

5421 5422 5423 5424
    event = virDomainEventLifecycleNewFromObj(vm,
                                              VIR_DOMAIN_EVENT_RESUMED,
                                              VIR_DOMAIN_EVENT_RESUMED_MIGRATED);
    qemuDomainEventQueue(driver, event);
5425

5426 5427 5428 5429 5430 5431
    if (virDomainObjGetState(vm, NULL) == VIR_DOMAIN_PAUSED) {
        virDomainObjSetState(vm, VIR_DOMAIN_PAUSED, VIR_DOMAIN_PAUSED_USER);
        event = virDomainEventLifecycleNewFromObj(vm,
                                                  VIR_DOMAIN_EVENT_SUSPENDED,
                                                  VIR_DOMAIN_EVENT_SUSPENDED_PAUSED);
        qemuDomainEventQueue(driver, event);
5432
    }
5433

5434
    if (virDomainObjIsActive(vm) &&
5435
        virDomainSaveStatus(driver->xmlopt, cfg->stateDir, vm, driver->caps) < 0)
5436 5437 5438 5439 5440
        VIR_WARN("Failed to save status on vm %s", vm->def->name);

    /* Guest is successfully running, so cancel previous auto destroy */
    qemuProcessAutoDestroyRemove(driver, vm);

5441
 endjob:
5442
    if (!dom &&
5443 5444
        !(flags & VIR_MIGRATE_OFFLINE) &&
        virDomainObjIsActive(vm)) {
5445
        if (doKill) {
5446 5447 5448 5449 5450 5451 5452 5453 5454 5455 5456
            qemuProcessStop(driver, vm, VIR_DOMAIN_SHUTOFF_FAILED,
                            QEMU_ASYNC_JOB_MIGRATION_IN,
                            VIR_QEMU_PROCESS_STOP_MIGRATED);
            virDomainAuditStop(vm, "failed");
            event = virDomainEventLifecycleNewFromObj(vm,
                                VIR_DOMAIN_EVENT_STOPPED,
                                VIR_DOMAIN_EVENT_STOPPED_FAILED);
            qemuDomainEventQueue(driver, event);
        } else {
            qemuMigrationPostcopyFailed(driver, vm);
        }
5457 5458
    }

5459 5460 5461 5462 5463 5464
    if (dom) {
        priv->job.completed = jobInfo;
        jobInfo = NULL;
        if (qemuMigrationBakeCookie(mig, driver, vm, cookieout, cookieoutlen,
                                    QEMU_MIGRATION_COOKIE_STATS) < 0)
            VIR_WARN("Unable to encode migration cookie");
5465 5466 5467 5468 5469 5470

        /* Remove completed stats for post-copy, everything but timing fields
         * is obsolete anyway.
         */
        if (inPostCopy)
            VIR_FREE(priv->job.completed);
5471
    }
5472

5473
    qemuMigrationReset(driver, vm, QEMU_ASYNC_JOB_MIGRATION_IN);
5474

5475
    qemuMigrationJobFinish(driver, vm);
5476
    if (!virDomainObjIsActive(vm))
5477
        qemuDomainRemoveInactiveJob(driver, vm);
5478

5479
 cleanup:
5480
    VIR_FREE(jobInfo);
5481
    virPortAllocatorRelease(driver->migrationPorts, port);
5482
    if (priv->mon)
5483
        qemuMonitorSetDomainLog(priv->mon, NULL, NULL, NULL);
5484
    VIR_FREE(priv->origname);
M
Michal Privoznik 已提交
5485
    virDomainObjEndAPI(&vm);
5486
    qemuMigrationCookieFree(mig);
5487 5488 5489 5490
    if (orig_err) {
        virSetError(orig_err);
        virFreeError(orig_err);
    }
5491
    virObjectUnref(cfg);
5492 5493 5494 5495 5496 5497

    /* Set a special error if Finish is expected to return NULL as a result of
     * successful call with retcode != 0
     */
    if (retcode != 0 && !dom && !virGetLastError())
        virReportError(VIR_ERR_MIGRATE_FINISH_OK, NULL);
5498 5499
    return dom;
}
5500

5501

5502
/* Helper function called while vm is active.  */
5503
int
5504
qemuMigrationToFile(virQEMUDriverPtr driver, virDomainObjPtr vm,
5505
                    int fd,
5506
                    const char *compressor,
5507
                    qemuDomainAsyncJob asyncJob)
5508 5509 5510
{
    qemuDomainObjPrivatePtr priv = vm->privateData;
    int rc;
5511
    int ret = -1;
5512 5513
    virCommandPtr cmd = NULL;
    int pipeFD[2] = { -1, -1 };
5514
    unsigned long saveMigBandwidth = priv->migMaxBandwidth;
5515
    char *errbuf = NULL;
5516
    virErrorPtr orig_err = NULL;
5517 5518 5519 5520 5521

    /* Increase migration bandwidth to unlimited since target is a file.
     * Failure to change migration speed is not fatal. */
    if (qemuDomainObjEnterMonitorAsync(driver, vm, asyncJob) == 0) {
        qemuMonitorSetMigrationSpeed(priv->mon,
5522 5523
                                     QEMU_DOMAIN_MIG_BANDWIDTH_MAX);
        priv->migMaxBandwidth = QEMU_DOMAIN_MIG_BANDWIDTH_MAX;
5524 5525
        if (qemuDomainObjExitMonitor(driver, vm) < 0)
            return -1;
5526
    }
5527

5528 5529 5530 5531 5532 5533 5534
    if (!virDomainObjIsActive(vm)) {
        virReportError(VIR_ERR_INTERNAL_ERROR, "%s",
                       _("guest unexpectedly quit"));
        /* nothing to tear down */
        return -1;
    }

5535 5536 5537 5538
    if (compressor && pipe(pipeFD) < 0) {
        virReportSystemError(errno, "%s",
                             _("Failed to create pipe for migration"));
        return -1;
5539 5540
    }

5541 5542 5543 5544
    /* All right! We can use fd migration, which means that qemu
     * doesn't have to open() the file, so while we still have to
     * grant SELinux access, we can do it on fd and avoid cleanup
     * later, as well as skip futzing with cgroup.  */
5545 5546
    if (qemuSecuritySetImageFDLabel(driver->securityManager, vm->def,
                                    compressor ? pipeFD[1] : fd) < 0)
5547 5548
        goto cleanup;

5549
    if (qemuDomainObjEnterMonitorAsync(driver, vm, asyncJob) < 0)
5550 5551
        goto cleanup;

5552
    if (!compressor) {
5553 5554 5555
        rc = qemuMonitorMigrateToFd(priv->mon,
                                    QEMU_MONITOR_MIGRATE_BACKGROUND,
                                    fd);
5556 5557 5558 5559 5560 5561 5562
    } else {
        const char *prog = compressor;
        const char *args[] = {
            prog,
            "-c",
            NULL
        };
5563 5564 5565 5566 5567 5568 5569 5570 5571 5572 5573

        cmd = virCommandNewArgs(args);
        virCommandSetInputFD(cmd, pipeFD[0]);
        virCommandSetOutputFD(cmd, &fd);
        virCommandSetErrorBuffer(cmd, &errbuf);
        virCommandDoAsyncIO(cmd);
        if (virSetCloseExec(pipeFD[1]) < 0) {
            virReportSystemError(errno, "%s",
                                 _("Unable to set cloexec flag"));
            ignore_value(qemuDomainObjExitMonitor(driver, vm));
            goto cleanup;
5574
        }
5575 5576 5577 5578 5579 5580 5581 5582 5583 5584
        if (virCommandRunAsync(cmd, NULL) < 0) {
            ignore_value(qemuDomainObjExitMonitor(driver, vm));
            goto cleanup;
        }
        rc = qemuMonitorMigrateToFd(priv->mon,
                                    QEMU_MONITOR_MIGRATE_BACKGROUND,
                                    pipeFD[1]);
        if (VIR_CLOSE(pipeFD[0]) < 0 ||
            VIR_CLOSE(pipeFD[1]) < 0)
            VIR_WARN("failed to close intermediate pipe");
5585
    }
5586
    if (qemuDomainObjExitMonitor(driver, vm) < 0)
5587
        goto cleanup;
5588 5589 5590
    if (rc < 0)
        goto cleanup;

5591
    rc = qemuMigrationWaitForCompletion(driver, vm, asyncJob, NULL, 0);
5592

5593 5594 5595 5596
    if (rc < 0) {
        if (rc == -2) {
            orig_err = virSaveLastError();
            virCommandAbort(cmd);
5597 5598
            if (virDomainObjIsActive(vm) &&
                qemuDomainObjEnterMonitorAsync(driver, vm, asyncJob) == 0) {
5599
                qemuMonitorMigrateCancel(priv->mon);
5600
                ignore_value(qemuDomainObjExitMonitor(driver, vm));
5601 5602
            }
        }
5603
        goto cleanup;
5604
    }
5605

5606 5607 5608
    if (cmd && virCommandWait(cmd, NULL) < 0)
        goto cleanup;

5609
    qemuDomainEventEmitJobCompleted(driver, vm);
5610 5611
    ret = 0;

5612
 cleanup:
5613 5614 5615
    if (ret < 0 && !orig_err)
        orig_err = virSaveLastError();

5616
    /* Restore max migration bandwidth */
5617 5618
    if (virDomainObjIsActive(vm) &&
        qemuDomainObjEnterMonitorAsync(driver, vm, asyncJob) == 0) {
5619 5620
        qemuMonitorSetMigrationSpeed(priv->mon, saveMigBandwidth);
        priv->migMaxBandwidth = saveMigBandwidth;
5621
        ignore_value(qemuDomainObjExitMonitor(driver, vm));
5622 5623
    }

5624 5625
    VIR_FORCE_CLOSE(pipeFD[0]);
    VIR_FORCE_CLOSE(pipeFD[1]);
5626 5627 5628 5629 5630
    if (cmd) {
        VIR_DEBUG("Compression binary stderr: %s", NULLSTR(errbuf));
        VIR_FREE(errbuf);
        virCommandFree(cmd);
    }
5631 5632 5633 5634 5635 5636

    if (orig_err) {
        virSetError(orig_err);
        virFreeError(orig_err);
    }

5637 5638
    return ret;
}
5639

5640 5641 5642 5643 5644 5645 5646 5647 5648 5649 5650 5651 5652 5653 5654 5655 5656 5657 5658 5659 5660 5661 5662 5663 5664 5665 5666 5667 5668 5669 5670 5671 5672 5673 5674 5675 5676 5677 5678 5679 5680 5681 5682 5683 5684 5685 5686

/*
 * Cancel an unfinished outgoing migration of @vm.
 *
 * Asks QEMU to cancel the migration and, if any disk is marked as
 * migrating, checks which of their block jobs still exist and cancels
 * the remaining drive mirrors.
 *
 * Returns 0 on success, -1 on failure; on failure block job
 * synchronization is ended for every disk still marked as migrating.
 */
int
qemuMigrationCancel(virQEMUDriverPtr driver,
                    virDomainObjPtr vm)
{
    qemuDomainObjPrivatePtr priv = vm->privateData;
    virHashTablePtr jobs = NULL;
    bool haveStorage = false;
    int ret = -1;
    size_t n;

    VIR_DEBUG("Canceling unfinished outgoing migration of domain %s",
              vm->def->name);

    /* Start synchronous block job handling for every migrating disk. */
    for (n = 0; n < vm->def->ndisks; n++) {
        virDomainDiskDefPtr disk = vm->def->disks[n];

        if (!QEMU_DOMAIN_DISK_PRIVATE(disk)->migrating)
            continue;

        qemuBlockJobSyncBegin(disk);
        haveStorage = true;
    }

    qemuDomainObjEnterMonitor(driver, vm);

    ignore_value(qemuMonitorMigrateCancel(priv->mon));
    if (haveStorage)
        jobs = qemuMonitorGetAllBlockJobInfo(priv->mon);

    if (qemuDomainObjExitMonitor(driver, vm) < 0)
        goto endsyncjob;
    if (haveStorage && !jobs)
        goto endsyncjob;

    if (!haveStorage) {
        /* No storage migration in progress, nothing more to cancel. */
        ret = 0;
        goto cleanup;
    }

    for (n = 0; n < vm->def->ndisks; n++) {
        virDomainDiskDefPtr disk = vm->def->disks[n];
        qemuDomainDiskPrivatePtr diskPriv = QEMU_DOMAIN_DISK_PRIVATE(disk);

        if (!diskPriv->migrating)
            continue;

        if (!virHashLookup(jobs, disk->info.alias)) {
            /* QEMU no longer reports a job for this disk. */
            VIR_DEBUG("Drive mirror on disk %s is gone", disk->dst);
            qemuBlockJobSyncEnd(driver, vm, QEMU_ASYNC_JOB_NONE, disk);
            diskPriv->migrating = false;
        } else {
            VIR_DEBUG("Drive mirror on disk %s is still running", disk->dst);
        }
    }

    if (qemuMigrationCancelDriveMirror(driver, vm, false,
                                       QEMU_ASYNC_JOB_NONE, NULL) < 0)
        goto endsyncjob;

    ret = 0;

 cleanup:
    virHashFree(jobs);
    return ret;

 endsyncjob:
    if (haveStorage) {
        for (n = 0; n < vm->def->ndisks; n++) {
            virDomainDiskDefPtr disk = vm->def->disks[n];
            qemuDomainDiskPrivatePtr diskPriv = QEMU_DOMAIN_DISK_PRIVATE(disk);

            if (!diskPriv->migrating)
                continue;

            qemuBlockJobSyncEnd(driver, vm, QEMU_ASYNC_JOB_NONE, disk);
            diskPriv->migrating = false;
        }
    }
    goto cleanup;
}


5718
int
5719
qemuMigrationJobStart(virQEMUDriverPtr driver,
5720
                      virDomainObjPtr vm,
5721
                      qemuDomainAsyncJob job)
5722
{
5723 5724
    virDomainJobOperation op;
    unsigned long long mask;
5725

5726
    if (job == QEMU_ASYNC_JOB_MIGRATION_IN) {
5727 5728
        op = VIR_DOMAIN_JOB_OPERATION_MIGRATION_IN;
        mask = QEMU_JOB_NONE;
5729
    } else {
5730 5731 5732 5733
        op = VIR_DOMAIN_JOB_OPERATION_MIGRATION_OUT;
        mask = QEMU_JOB_DEFAULT_MASK |
               JOB_MASK(QEMU_JOB_SUSPEND) |
               JOB_MASK(QEMU_JOB_MIGRATION_OP);
5734
    }
5735

5736 5737 5738 5739
    if (qemuDomainObjBeginAsyncJob(driver, vm, job, op) < 0)
        return -1;

    qemuDomainObjSetAsyncJobMask(vm, mask);
5740 5741 5742 5743
    return 0;
}

void
5744
qemuMigrationJobSetPhase(virQEMUDriverPtr driver,
5745
                         virDomainObjPtr vm,
5746
                         qemuMigrationJobPhase phase)
5747 5748 5749 5750 5751 5752 5753 5754 5755 5756 5757 5758 5759 5760
{
    qemuDomainObjPrivatePtr priv = vm->privateData;

    if (phase < priv->job.phase) {
        VIR_ERROR(_("migration protocol going backwards %s => %s"),
                  qemuMigrationJobPhaseTypeToString(priv->job.phase),
                  qemuMigrationJobPhaseTypeToString(phase));
        return;
    }

    qemuDomainObjSetJobPhase(driver, vm, phase);
}

void
5761
qemuMigrationJobStartPhase(virQEMUDriverPtr driver,
5762
                           virDomainObjPtr vm,
5763
                           qemuMigrationJobPhase phase)
5764 5765 5766 5767
{
    qemuMigrationJobSetPhase(driver, vm, phase);
}

5768
void
5769 5770
qemuMigrationJobContinue(virDomainObjPtr vm)
{
5771
    qemuDomainObjReleaseAsyncJob(vm);
5772 5773 5774 5775
}

bool
qemuMigrationJobIsActive(virDomainObjPtr vm,
5776
                         qemuDomainAsyncJob job)
5777 5778 5779 5780 5781 5782 5783 5784 5785 5786 5787
{
    qemuDomainObjPrivatePtr priv = vm->privateData;

    if (priv->job.asyncJob != job) {
        const char *msg;

        if (job == QEMU_ASYNC_JOB_MIGRATION_IN)
            msg = _("domain '%s' is not processing incoming migration");
        else
            msg = _("domain '%s' is not being migrated");

5788
        virReportError(VIR_ERR_OPERATION_INVALID, msg, vm->def->name);
5789 5790 5791 5792 5793
        return false;
    }
    return true;
}

5794
void
5795
qemuMigrationJobFinish(virQEMUDriverPtr driver, virDomainObjPtr vm)
5796
{
5797
    qemuDomainObjEndAsyncJob(driver, vm);
5798
}
5799 5800 5801 5802 5803 5804 5805 5806 5807 5808 5809 5810 5811 5812 5813 5814 5815 5816 5817 5818 5819 5820 5821 5822 5823 5824 5825 5826 5827 5828 5829 5830 5831 5832 5833 5834 5835 5836 5837 5838 5839 5840 5841 5842 5843 5844 5845 5846 5847 5848 5849 5850 5851 5852


/*
 * Value deallocator handed to virHashAtomicNew() for the table of saved
 * migration errors: @data is the stored virError, @name is unused.
 */
static void
qemuMigrationErrorFree(void *data,
                       const void *name ATTRIBUTE_UNUSED)
{
    virFreeError(data);
}

/**
 * qemuMigrationErrorInit:
 * @driver: qemu driver
 *
 * Creates the driver->migrationErrors table, with qemuMigrationErrorFree()
 * registered as the deallocator for its values.
 *
 * Returns 0 when the table was created, -1 otherwise.
 */
int
qemuMigrationErrorInit(virQEMUDriverPtr driver)
{
    driver->migrationErrors = virHashAtomicNew(64, qemuMigrationErrorFree);

    return driver->migrationErrors ? 0 : -1;
}

/**
 * qemuMigrationErrorSave:
 * @driver: qemu driver
 * @name: domain name the error is stored under
 * @err: error to store; NULL makes the call a no-op
 *
 * Stores @err in driver->migrationErrors under @name.
 *
 * This function consumes @err; the caller should consider the @err pointer
 * invalid after calling this function.
 */
void
qemuMigrationErrorSave(virQEMUDriverPtr driver,
                       const char *name,
                       virErrorPtr err)
{
    if (!err)
        return;

    VIR_DEBUG("Saving incoming migration error for domain %s: %s",
              name, err->message);

    if (virHashAtomicUpdate(driver->migrationErrors, name, err) >= 0)
        return;

    /* The table did not take the error, so free it here. */
    VIR_WARN("Failed to save migration error for domain '%s'", name);
    virFreeError(err);
}

/**
 * qemuMigrationErrorReport:
 * @driver: qemu driver
 * @name: domain name to look up
 *
 * Removes the error stored under @name from driver->migrationErrors, if
 * any, passes it to virSetError() and frees it. Does nothing when no error
 * is stored for @name.
 */
void
qemuMigrationErrorReport(virQEMUDriverPtr driver,
                         const char *name)
{
    virErrorPtr saved = virHashAtomicSteal(driver->migrationErrors, name);

    if (saved) {
        VIR_DEBUG("Restoring saved incoming migration error for domain %s: %s",
                  name, saved->message);
        virSetError(saved);
        virFreeError(saved);
    }
}
5853 5854 5855 5856 5857 5858 5859 5860 5861 5862 5863 5864 5865 5866 5867 5868 5869 5870 5871 5872 5873 5874 5875 5876 5877 5878 5879 5880 5881 5882 5883 5884 5885 5886 5887 5888 5889 5890


/**
 * qemuMigrationCompressionParse:
 * @params: typed parameters supplied by the caller
 * @nparams: number of entries in @params
 * @flags: migration flags
 *
 * Builds a compression description from @params and @flags:
 *  - each VIR_MIGRATE_PARAM_COMPRESSION entry selects one method; an unknown
 *    or repeated method is rejected;
 *  - the MT_LEVEL, MT_THREADS, MT_DTHREADS and XBZRLE_CACHE tunables are
 *    read when @params is non-NULL, and are rejected unless the method they
 *    belong to was selected;
 *  - when no method was selected and VIR_MIGRATE_COMPRESSED is set in
 *    @flags, XBZRLE is selected.
 *
 * Don't ever pass NULL @params with non zero @nparams.
 *
 * Returns the newly allocated description, or NULL on failure.
 */
qemuMigrationCompressionPtr
qemuMigrationCompressionParse(virTypedParameterPtr params,
                              int nparams,
                              unsigned long flags)
{
    const unsigned long long mtBit = 1ULL << QEMU_MIGRATION_COMPRESS_MT;
    const unsigned long long xbzrleBit = 1ULL << QEMU_MIGRATION_COMPRESS_XBZRLE;
    qemuMigrationCompressionPtr compression = NULL;
    bool mtTuned;
    size_t i;

    if (VIR_ALLOC(compression) < 0)
        return NULL;

    for (i = 0; i < nparams; i++) {
        const char *methodName;
        int method;

        if (STRNEQ(params[i].field, VIR_MIGRATE_PARAM_COMPRESSION))
            continue;

        methodName = params[i].value.s;
        method = qemuMigrationCompressMethodTypeFromString(methodName);
        if (method < 0) {
            virReportError(VIR_ERR_INVALID_ARG,
                           _("Unsupported compression method '%s'"),
                           methodName);
            goto error;
        }

        if (compression->methods & (1ULL << method)) {
            virReportError(VIR_ERR_INVALID_ARG,
                           _("Compression method '%s' is specified twice"),
                           methodName);
            goto error;
        }

        compression->methods |= 1ULL << method;
    }

/* Fetch one tunable into compression->VALUE; a return of 1 from the getter
 * is treated as "parameter present" and recorded in compression->VALUE_set. */
#define GET_PARAM(PARAM, TYPE, VALUE)                                       \
    do {                                                                    \
        const char *par = VIR_MIGRATE_PARAM_COMPRESSION_ ## PARAM;          \
        int rc = virTypedParamsGet ## TYPE(params, nparams, par,            \
                                           &compression->VALUE);            \
                                                                            \
        if (rc < 0)                                                         \
            goto error;                                                     \
                                                                            \
        if (rc == 1)                                                        \
            compression->VALUE ## _set = true;                              \
    } while (0)

    if (params) {
        GET_PARAM(MT_LEVEL, Int, level);
        GET_PARAM(MT_THREADS, Int, threads);
        GET_PARAM(MT_DTHREADS, Int, dthreads);
        GET_PARAM(XBZRLE_CACHE, ULLong, xbzrle_cache);
    }

#undef GET_PARAM

    mtTuned = compression->level_set ||
              compression->threads_set ||
              compression->dthreads_set;

    if (mtTuned && !(compression->methods & mtBit)) {
        virReportError(VIR_ERR_INVALID_ARG, "%s",
                       _("Turn multithread compression on to tune it"));
        goto error;
    }

    if (compression->xbzrle_cache_set &&
        !(compression->methods & xbzrleBit)) {
        virReportError(VIR_ERR_INVALID_ARG, "%s",
                       _("Turn xbzrle compression on to tune it"));
        goto error;
    }

    /* A bare VIR_MIGRATE_COMPRESSED flag with no explicit method selects
     * XBZRLE. */
    if (!compression->methods && (flags & VIR_MIGRATE_COMPRESSED))
        compression->methods = xbzrleBit;

    return compression;

 error:
    VIR_FREE(compression);
    return NULL;
}

/**
 * qemuMigrationCompressionDump:
 * @compression: compression description to serialize
 * @params: typed parameter array to append to
 * @nparams: number of used entries in @params
 * @maxparams: allocated size of @params
 * @flags: migration flags to update
 *
 * Converts @compression back into migration flags and typed parameters.
 * When XBZRLE is the only selected method and its cache size was not set,
 * only VIR_MIGRATE_COMPRESSED is added to @flags and no parameter is
 * emitted. Otherwise one VIR_MIGRATE_PARAM_COMPRESSION string is added per
 * selected method, followed by every tunable that was explicitly set.
 *
 * Returns 0 on success, -1 when adding a parameter fails.
 */
int
qemuMigrationCompressionDump(qemuMigrationCompressionPtr compression,
                             virTypedParameterPtr *params,
                             int *nparams,
                             int *maxparams,
                             unsigned long *flags)
{
    size_t method;

    if (!compression->xbzrle_cache_set &&
        compression->methods == 1ULL << QEMU_MIGRATION_COMPRESS_XBZRLE) {
        *flags |= VIR_MIGRATE_COMPRESSED;
        return 0;
    }

    for (method = 0; method < QEMU_MIGRATION_COMPRESS_LAST; method++) {
        if (!(compression->methods & (1ULL << method)))
            continue;

        if (virTypedParamsAddString(params, nparams, maxparams,
                                    VIR_MIGRATE_PARAM_COMPRESSION,
                                    qemuMigrationCompressMethodTypeToString(method)) < 0)
            return -1;
    }

    if (compression->level_set) {
        if (virTypedParamsAddInt(params, nparams, maxparams,
                                 VIR_MIGRATE_PARAM_COMPRESSION_MT_LEVEL,
                                 compression->level) < 0)
            return -1;
    }

    if (compression->threads_set) {
        if (virTypedParamsAddInt(params, nparams, maxparams,
                                 VIR_MIGRATE_PARAM_COMPRESSION_MT_THREADS,
                                 compression->threads) < 0)
            return -1;
    }

    if (compression->dthreads_set) {
        if (virTypedParamsAddInt(params, nparams, maxparams,
                                 VIR_MIGRATE_PARAM_COMPRESSION_MT_DTHREADS,
                                 compression->dthreads) < 0)
            return -1;
    }

    if (compression->xbzrle_cache_set) {
        if (virTypedParamsAddULLong(params, nparams, maxparams,
                                    VIR_MIGRATE_PARAM_COMPRESSION_XBZRLE_CACHE,
                                    compression->xbzrle_cache) < 0)
            return -1;
    }

    return 0;
}
5988 5989 5990 5991 5992 5993 5994 5995 5996 5997 5998 5999 6000


/**
 * qemuMigrationReset:
 * @driver: qemu driver
 * @vm: domain object
 * @job: async job the monitor commands are issued under
 *
 * Reset all migration parameters so that the next job which internally uses
 * migration (save, managedsave, snapshots, dump) will not try to use them.
 *
 * Nothing is done for an inactive domain. The sequence stops at the first
 * step that fails. If an error was already set on entry, it is put back
 * before returning.
 */
void
qemuMigrationReset(virQEMUDriverPtr driver,
                   virDomainObjPtr vm,
                   qemuDomainAsyncJob job)
{
    virErrorPtr origErr = virSaveLastError();
    qemuMonitorMigrationCaps cap;

    if (virDomainObjIsActive(vm) &&
        qemuMigrationResetTLS(driver, vm, job) >= 0) {
        for (cap = 0; cap < QEMU_MONITOR_MIGRATION_CAPS_LAST; cap++) {
            /* Only capabilities currently recorded as enabled are turned off. */
            if (!qemuMigrationCapsGet(vm, cap))
                continue;

            if (qemuMigrationSetOption(driver, vm, cap, false, job) < 0)
                break;
        }
    }

    if (origErr) {
        virSetError(origErr);
        virFreeError(origErr);
    }
}
6022 6023 6024 6025 6026 6027 6028 6029 6030 6031 6032 6033 6034 6035 6036 6037 6038 6039 6040 6041 6042 6043 6044 6045 6046 6047 6048 6049 6050 6051 6052 6053 6054 6055 6056 6057 6058 6059 6060 6061 6062 6063 6064 6065 6066 6067 6068 6069 6070 6071 6072


/**
 * qemuMigrationFetchMirrorStats:
 * @driver: qemu driver
 * @vm: domain object
 * @asyncJob: async job the monitor is entered under
 * @jobInfo: job info whose mirrorStats member is filled in
 *
 * Sums the progress of the block jobs of all disks flagged as migrating.
 * When no disk is flagged, @jobInfo is left untouched and the monitor is
 * not queried. Otherwise mirrorStats is zeroed, and the "cur" and "end"
 * values of each migrating disk's block job (looked up by disk alias) are
 * added to "transferred" and "total" respectively.
 *
 * Returns 0 on success, -1 if the monitor could not be entered or exited
 * cleanly or the block job info could not be fetched.
 */
int
qemuMigrationFetchMirrorStats(virQEMUDriverPtr driver,
                              virDomainObjPtr vm,
                              qemuDomainAsyncJob asyncJob,
                              qemuDomainJobInfoPtr jobInfo)
{
    size_t i;
    qemuDomainObjPrivatePtr priv = vm->privateData;
    bool nbd = false;
    virHashTablePtr blockinfo = NULL;
    qemuDomainMirrorStatsPtr stats = &jobInfo->mirrorStats;
    int ret = -1;

    for (i = 0; i < vm->def->ndisks; i++) {
        virDomainDiskDefPtr disk = vm->def->disks[i];
        if (QEMU_DOMAIN_DISK_PRIVATE(disk)->migrating) {
            nbd = true;
            break;
        }
    }

    if (!nbd)
        return 0;

    if (qemuDomainObjEnterMonitorAsync(driver, vm, asyncJob) < 0)
        return -1;

    blockinfo = qemuMonitorGetAllBlockJobInfo(priv->mon);

    /* ExitMonitor may fail even though the query succeeded; go through
     * cleanup so the table is not leaked in that case. */
    if (qemuDomainObjExitMonitor(driver, vm) < 0 || !blockinfo)
        goto cleanup;

    memset(stats, 0, sizeof(*stats));

    for (i = 0; i < vm->def->ndisks; i++) {
        virDomainDiskDefPtr disk = vm->def->disks[i];
        qemuDomainDiskPrivatePtr diskPriv = QEMU_DOMAIN_DISK_PRIVATE(disk);
        qemuMonitorBlockJobInfoPtr data;

        if (!diskPriv->migrating ||
            !(data = virHashLookup(blockinfo, disk->info.alias)))
            continue;

        stats->transferred += data->cur;
        stats->total += data->end;
    }

    ret = 0;

 cleanup:
    /* virHashFree() is expected to accept NULL (see references). */
    virHashFree(blockinfo);
    return ret;
}
6073 6074 6075 6076 6077 6078 6079 6080 6081 6082 6083 6084 6085 6086


/**
 * qemuMigrationCapsGet:
 * @vm: domain object
 * @cap: migration capability to query
 *
 * Looks up bit @cap in the migrationCaps bitmap kept in the domain's
 * private data.
 *
 * Returns the value of that bit, or false when there is no bitmap or the
 * lookup does not set a value.
 */
bool
qemuMigrationCapsGet(virDomainObjPtr vm,
                     qemuMonitorMigrationCaps cap)
{
    qemuDomainObjPrivatePtr priv = vm->privateData;
    bool enabled = false;

    if (!priv->migrationCaps)
        return false;

    ignore_value(virBitmapGetBit(priv->migrationCaps, cap, &enabled));
    return enabled;
}