qemu_driver.c 319.6 KB
Newer Older
D
Daniel P. Berrange 已提交
1 2 3
/*
 * driver.c: core driver methods for managing qemu guests
 *
4
 * Copyright (C) 2006-2011 Red Hat, Inc.
D
Daniel P. Berrange 已提交
5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23
 * Copyright (C) 2006 Daniel P. Berrange
 *
 * This library is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * This library is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with this library; if not, write to the Free Software
 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307  USA
 *
 * Author: Daniel P. Berrange <berrange@redhat.com>
 */

24
#include <config.h>
25

D
Daniel P. Berrange 已提交
26 27
#include <sys/types.h>
#include <sys/poll.h>
28
#include <sys/time.h>
D
Daniel P. Berrange 已提交
29 30 31
#include <dirent.h>
#include <limits.h>
#include <string.h>
32
#include <stdbool.h>
D
Daniel P. Berrange 已提交
33 34 35 36 37
#include <stdio.h>
#include <stdarg.h>
#include <stdlib.h>
#include <unistd.h>
#include <errno.h>
38
#include <sys/utsname.h>
39 40 41 42
#include <sys/stat.h>
#include <fcntl.h>
#include <signal.h>
#include <paths.h>
43
#include <stdio.h>
44
#include <sys/wait.h>
45
#include <sys/ioctl.h>
46
#include <sys/un.h>
D
Daniel P. Berrange 已提交
47

48

49
#include "virterror_internal.h"
50
#include "logging.h"
51
#include "datatypes.h"
52 53
#include "qemu_driver.h"
#include "qemu_conf.h"
54
#include "qemu_capabilities.h"
55
#include "qemu_command.h"
56
#include "qemu_cgroup.h"
57
#include "qemu_hostdev.h"
58
#include "qemu_hotplug.h"
59
#include "qemu_monitor.h"
60
#include "qemu_bridge_filter.h"
61
#include "qemu_audit.h"
J
Jim Meyering 已提交
62
#include "c-ctype.h"
63
#include "event.h"
64
#include "buf.h"
65
#include "util.h"
66
#include "nodeinfo.h"
67
#include "stats_linux.h"
68
#include "capabilities.h"
69
#include "memory.h"
70
#include "uuid.h"
71
#include "domain_conf.h"
72 73
#include "node_device_conf.h"
#include "pci.h"
74
#include "hostusb.h"
75
#include "processinfo.h"
C
Chris Lalancette 已提交
76
#include "libvirt_internal.h"
77
#include "xml.h"
78
#include "cpu/cpu.h"
79
#include "macvtap.h"
80
#include "sysinfo.h"
81
#include "domain_nwfilter.h"
82
#include "hooks.h"
83
#include "storage_file.h"
84
#include "files.h"
85
#include "fdstream.h"
86
#include "configmake.h"
H
Hu Tao 已提交
87
#include "threadpool.h"
88

89 90
#define VIR_FROM_THIS VIR_FROM_QEMU

91 92 93
#define QEMU_VNC_PORT_MIN  5900
#define QEMU_VNC_PORT_MAX  65535

94 95
#define QEMU_NB_MEM_PARAM  3

96

97 98
#define timeval_to_ms(tv)       (((tv).tv_sec * 1000ull) + ((tv).tv_usec / 1000))

H
Hu Tao 已提交
99 100 101 102 103 104 105 106
struct watchdogEvent
{
    virDomainObjPtr vm;
    int action;
};

static void processWatchdogEvent(void *data, void *opaque);

107 108
static int qemudShutdown(void);

109 110 111
static void qemuDomainEventFlush(int timer, void *opaque);
static void qemuDomainEventQueue(struct qemud_driver *driver,
                                 virDomainEventPtr event);
112

J
Jiri Denemark 已提交
113 114
static int qemudDomainObjStart(virConnectPtr conn,
                               struct qemud_driver *driver,
115 116
                               virDomainObjPtr vm,
                               bool start_paused);
J
Jiri Denemark 已提交
117

118 119
static int qemudStartVMDaemon(virConnectPtr conn,
                              struct qemud_driver *driver,
120
                              virDomainObjPtr vm,
121
                              const char *migrateFrom,
122
                              bool start_paused,
123
                              int stdin_fd,
124 125
                              const char *stdin_path,
                              enum virVMOperationType vmop);
126

127
static void qemudShutdownVMDaemon(struct qemud_driver *driver,
128 129
                                  virDomainObjPtr vm,
                                  int migrated);
130

131
static int qemudDomainGetMaxVcpus(virDomainPtr dom);
132

133
static int qemuDetectVcpuPIDs(struct qemud_driver *driver,
134
                              virDomainObjPtr vm);
135

136 137 138
static int qemudVMFiltersInstantiate(virConnectPtr conn,
                                     virDomainDefPtr def);

J
Jim Meyering 已提交
139
static struct qemud_driver *qemu_driver = NULL;
140

141

H
Hu Tao 已提交
142 143 144 145 146 147 148 149 150 151 152 153 154 155 156
static int doStartCPUs(struct qemud_driver *driver, virDomainObjPtr vm, virConnectPtr conn)
{
    int ret;
    qemuDomainObjPrivatePtr priv = vm->privateData;

    qemuDomainObjEnterMonitorWithDriver(driver, vm);
    ret = qemuMonitorStartCPUs(priv->mon, conn);
    if (ret == 0) {
        vm->state = VIR_DOMAIN_RUNNING;
    }
    qemuDomainObjExitMonitorWithDriver(driver, vm);

    return ret;
}

H
Hu Tao 已提交
157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172
static int doStopCPUs(struct qemud_driver *driver, virDomainObjPtr vm)
{
    int ret;
    int oldState = vm->state;
    qemuDomainObjPrivatePtr priv = vm->privateData;

    vm->state = VIR_DOMAIN_PAUSED;
    qemuDomainObjEnterMonitorWithDriver(driver, vm);
    ret = qemuMonitorStopCPUs(priv->mon);
    qemuDomainObjExitMonitorWithDriver(driver, vm);
    if (ret < 0) {
        vm->state = oldState;
    }
    return ret;
}

173

174
static int
175
qemudLogFD(struct qemud_driver *driver, const char* name, bool append)
176
{
177
    char *logfile;
178
    mode_t logmode;
179
    int fd = -1;
180

181
    if (virAsprintf(&logfile, "%s/%s.log", driver->logDir, name) < 0) {
182
        virReportOOMError();
183 184 185 186
        return -1;
    }

    logmode = O_CREAT | O_WRONLY;
187
    /* Only logrotate files in /var/log, so only append if running privileged */
188
    if (driver->privileged || append)
189
        logmode |= O_APPEND;
190 191 192
    else
        logmode |= O_TRUNC;

193
    if ((fd = open(logfile, logmode, S_IRUSR | S_IWUSR)) < 0) {
194
        virReportSystemError(errno,
195 196
                             _("failed to create logfile %s"),
                             logfile);
197
        VIR_FREE(logfile);
198 199
        return -1;
    }
200
    VIR_FREE(logfile);
201
    if (virSetCloseExec(fd) < 0) {
202
        virReportSystemError(errno, "%s",
203
                             _("Unable to set VM logfile close-on-exec flag"));
204
        VIR_FORCE_CLOSE(fd);
205 206 207 208 209 210
        return -1;
    }
    return fd;
}


211
static int
212
qemudLogReadFD(const char* logDir, const char* name, off_t pos)
213
{
214
    char *logfile;
215
    mode_t logmode = O_RDONLY;
216
    int fd = -1;
217

218
    if (virAsprintf(&logfile, "%s/%s.log", logDir, name) < 0) {
219 220 221
        qemuReportError(VIR_ERR_INTERNAL_ERROR,
                        _("failed to build logfile name %s/%s.log"),
                        logDir, name);
222 223 224 225
        return -1;
    }

    if ((fd = open(logfile, logmode)) < 0) {
226
        virReportSystemError(errno,
227 228
                             _("failed to create logfile %s"),
                             logfile);
229
        VIR_FREE(logfile);
230 231
        return -1;
    }
232
    if (virSetCloseExec(fd) < 0) {
233
        virReportSystemError(errno, "%s",
234
                             _("Unable to set VM logfile close-on-exec flag"));
235
        VIR_FORCE_CLOSE(fd);
236
        VIR_FREE(logfile);
237 238
        return -1;
    }
239
    if (pos < 0 || lseek(fd, pos, SEEK_SET) < 0) {
240
        virReportSystemError(pos < 0 ? 0 : errno,
241 242
                             _("Unable to seek to %lld in %s"),
                             (long long) pos, logfile);
243
        VIR_FORCE_CLOSE(fd);
244
    }
245
    VIR_FREE(logfile);
246 247 248 249
    return fd;
}


250 251 252 253 254 255 256 257 258
struct qemuAutostartData {
    struct qemud_driver *driver;
    virConnectPtr conn;
};
static void
qemuAutostartDomain(void *payload, const char *name ATTRIBUTE_UNUSED, void *opaque)
{
    virDomainObjPtr vm = payload;
    struct qemuAutostartData *data = opaque;
259
    virErrorPtr err;
260 261

    virDomainObjLock(vm);
262 263 264 265 266 267 268 269 270
    virResetLastError();
    if (qemuDomainObjBeginJobWithDriver(data->driver, vm) < 0) {
        err = virGetLastError();
        VIR_ERROR(_("Failed to start job on VM '%s': %s"),
                  vm->def->name,
                  err ? err->message : _("unknown error"));
    } else {
        if (vm->autostart &&
            !virDomainObjIsActive(vm) &&
271
            qemudDomainObjStart(data->conn, data->driver, vm, false) < 0) {
272
            err = virGetLastError();
273
            VIR_ERROR(_("Failed to autostart VM '%s': %s"),
274
                      vm->def->name,
275
                      err ? err->message : _("unknown error"));
276
        }
277 278 279

        if (qemuDomainObjEndJob(vm) == 0)
            vm = NULL;
280
    }
281 282 283

    if (vm)
        virDomainObjUnlock(vm);
284 285
}

286 287
static void
qemudAutostartConfigs(struct qemud_driver *driver) {
288 289 290 291 292
    /* XXX: Figure out a better way todo this. The domain
     * startup code needs a connection handle in order
     * to lookup the bridge associated with a virtual
     * network
     */
293 294 295
    virConnectPtr conn = virConnectOpen(driver->privileged ?
                                        "qemu:///system" :
                                        "qemu:///session");
296
    /* Ignoring NULL conn which is mostly harmless here */
297
    struct qemuAutostartData data = { driver, conn };
298

299
    qemuDriverLock(driver);
300
    virHashForEach(driver->domains.objs, qemuAutostartDomain, &data);
301
    qemuDriverUnlock(driver);
302

303 304
    if (conn)
        virConnectClose(conn);
305 306
}

307 308 309 310 311 312 313 314 315

/**
 * qemudRemoveDomainStatus
 *
 * remove all state files of a domain from statedir
 *
 * Returns 0 on success
 */
static int
316
qemudRemoveDomainStatus(struct qemud_driver *driver,
317 318
                        virDomainObjPtr vm)
{
319
    char ebuf[1024];
320 321 322
    char *file = NULL;

    if (virAsprintf(&file, "%s/%s.xml", driver->stateDir, vm->def->name) < 0) {
323
        virReportOOMError();
D
Daniel Veillard 已提交
324
        return(-1);
325 326
    }

327
    if (unlink(file) < 0 && errno != ENOENT && errno != ENOTDIR)
328
        VIR_WARN("Failed to remove domain XML for %s: %s",
D
Daniel Veillard 已提交
329 330 331
                 vm->def->name, virStrerror(errno, ebuf, sizeof(ebuf)));
    VIR_FREE(file);

332
    if (virFileDeletePid(driver->stateDir, vm->def->name) != 0)
333
        VIR_WARN("Failed to remove PID file for %s: %s",
334
                 vm->def->name, virStrerror(errno, ebuf, sizeof(ebuf)));
335

D
Daniel Veillard 已提交
336

337
    return 0;
338 339
}

340 341 342 343 344 345 346 347 348 349 350 351 352

/*
 * This is a callback registered with a qemuMonitorPtr  instance,
 * and to be invoked when the monitor console hits an end of file
 * condition, or error, thus indicating VM shutdown should be
 * performed
 */
static void
qemuHandleMonitorEOF(qemuMonitorPtr mon ATTRIBUTE_UNUSED,
                     virDomainObjPtr vm,
                     int hasError) {
    struct qemud_driver *driver = qemu_driver;
    virDomainEventPtr event = NULL;
353
    qemuDomainObjPrivatePtr priv;
354

355
    VIR_DEBUG("Received EOF on %p '%s'", vm, vm->def->name);
356

357 358
    virDomainObjLock(vm);

359 360 361 362 363 364 365
    priv = vm->privateData;
    if (!hasError && priv->monJSON && !priv->gotShutdown) {
        VIR_DEBUG("Monitor connection to '%s' closed without SHUTDOWN event; "
                  "assuming the domain crashed", vm->def->name);
        hasError = 1;
    }

366 367 368 369 370 371
    event = virDomainEventNewFromObj(vm,
                                     VIR_DOMAIN_EVENT_STOPPED,
                                     hasError ?
                                     VIR_DOMAIN_EVENT_STOPPED_FAILED :
                                     VIR_DOMAIN_EVENT_STOPPED_SHUTDOWN);

372
    qemudShutdownVMDaemon(driver, vm, 0);
373 374
    qemuDomainStopAudit(vm, hasError ? "failed" : "shutdown");

375 376 377 378 379 380 381 382 383 384 385 386 387
    if (!vm->persistent)
        virDomainRemoveInactive(&driver->domains, vm);
    else
        virDomainObjUnlock(vm);

    if (event) {
        qemuDriverLock(driver);
        qemuDomainEventQueue(driver, event);
        qemuDriverUnlock(driver);
    }
}


388 389 390
static virDomainDiskDefPtr
findDomainDiskByPath(virDomainObjPtr vm,
                     const char *path)
391 392 393 394 395 396 397
{
    int i;

    for (i = 0; i < vm->def->ndisks; i++) {
        virDomainDiskDefPtr disk;

        disk = vm->def->disks[i];
398 399
        if (disk->src != NULL && STREQ(disk->src, path))
            return disk;
400
    }
401 402 403 404

    qemuReportError(VIR_ERR_INTERNAL_ERROR,
                    _("no disk found with path %s"),
                    path);
405 406 407
    return NULL;
}

408 409 410 411 412 413
static virDomainDiskDefPtr
findDomainDiskByAlias(virDomainObjPtr vm,
                      const char *alias)
{
    int i;

414 415 416
    if (STRPREFIX(alias, QEMU_DRIVE_HOST_PREFIX))
        alias += strlen(QEMU_DRIVE_HOST_PREFIX);

417 418 419 420 421 422 423 424 425 426 427 428 429 430
    for (i = 0; i < vm->def->ndisks; i++) {
        virDomainDiskDefPtr disk;

        disk = vm->def->disks[i];
        if (disk->info.alias != NULL && STREQ(disk->info.alias, alias))
            return disk;
    }

    qemuReportError(VIR_ERR_INTERNAL_ERROR,
                    _("no disk found with alias %s"),
                    alias);
    return NULL;
}

431
static int
432 433 434 435
getVolumeQcowPassphrase(virConnectPtr conn,
                        virDomainDiskDefPtr disk,
                        char **secretRet,
                        size_t *secretLen)
436 437 438 439 440
{
    virSecretPtr secret;
    char *passphrase;
    unsigned char *data;
    size_t size;
441
    int ret = -1;
442
    virStorageEncryptionPtr enc;
443

444 445 446 447 448 449 450
    if (!disk->encryption) {
        qemuReportError(VIR_ERR_INTERNAL_ERROR,
                        _("disk %s does not have any encryption information"),
                        disk->src);
        return -1;
    }
    enc = disk->encryption;
451 452

    if (!conn) {
453
        qemuReportError(VIR_ERR_INTERNAL_ERROR,
454
                        "%s", _("cannot find secrets without a connection"));
455
        goto cleanup;
456 457 458 459 460
    }

    if (conn->secretDriver == NULL ||
        conn->secretDriver->lookupByUUID == NULL ||
        conn->secretDriver->getValue == NULL) {
461 462
        qemuReportError(VIR_ERR_NO_SUPPORT, "%s",
                        _("secret storage not supported"));
463
        goto cleanup;
464 465 466 467 468 469
    }

    if (enc->format != VIR_STORAGE_ENCRYPTION_FORMAT_QCOW ||
        enc->nsecrets != 1 ||
        enc->secrets[0]->type !=
        VIR_STORAGE_ENCRYPTION_SECRET_TYPE_PASSPHRASE) {
470
        qemuReportError(VIR_ERR_INVALID_DOMAIN,
471
                        _("invalid <encryption> for volume %s"), disk->src);
472
        goto cleanup;
473 474 475 476 477
    }

    secret = conn->secretDriver->lookupByUUID(conn,
                                              enc->secrets[0]->uuid);
    if (secret == NULL)
478
        goto cleanup;
479 480 481 482
    data = conn->secretDriver->getValue(secret, &size,
                                        VIR_SECRET_GET_VALUE_INTERNAL_CALL);
    virUnrefSecret(secret);
    if (data == NULL)
483
        goto cleanup;
484 485 486 487

    if (memchr(data, '\0', size) != NULL) {
        memset(data, 0, size);
        VIR_FREE(data);
488 489
        qemuReportError(VIR_ERR_INVALID_SECRET,
                        _("format='qcow' passphrase for %s must not contain a "
490
                          "'\\0'"), disk->src);
491
        goto cleanup;
492 493 494 495 496
    }

    if (VIR_ALLOC_N(passphrase, size + 1) < 0) {
        memset(data, 0, size);
        VIR_FREE(data);
497
        virReportOOMError();
498
        goto cleanup;
499 500 501 502 503 504 505 506 507 508
    }
    memcpy(passphrase, data, size);
    passphrase[size] = '\0';

    memset(data, 0, size);
    VIR_FREE(data);

    *secretRet = passphrase;
    *secretLen = size;

509 510 511
    ret = 0;

cleanup:
512 513
    return ret;
}
514

515 516 517 518 519 520 521 522 523 524 525 526 527 528 529 530 531 532 533 534 535
static int
findVolumeQcowPassphrase(qemuMonitorPtr mon ATTRIBUTE_UNUSED,
                         virConnectPtr conn,
                         virDomainObjPtr vm,
                         const char *path,
                         char **secretRet,
                         size_t *secretLen)
{
    virDomainDiskDefPtr disk;
    int ret = -1;

    virDomainObjLock(vm);
    disk = findDomainDiskByPath(vm, path);

    if (!disk)
        goto cleanup;

    ret = getVolumeQcowPassphrase(conn, disk, secretRet, secretLen);

cleanup:
    virDomainObjUnlock(vm);
536
    return ret;
537 538
}

539 540 541 542 543 544 545 546 547 548 549 550 551 552 553 554 555 556 557 558 559 560

static int
qemuHandleDomainReset(qemuMonitorPtr mon ATTRIBUTE_UNUSED,
                      virDomainObjPtr vm)
{
    struct qemud_driver *driver = qemu_driver;
    virDomainEventPtr event;

    virDomainObjLock(vm);
    event = virDomainEventRebootNewFromObj(vm);
    virDomainObjUnlock(vm);

    if (event) {
        qemuDriverLock(driver);
        qemuDomainEventQueue(driver, event);
        qemuDriverUnlock(driver);
    }

    return 0;
}


561 562 563 564 565 566 567 568 569 570 571 572
static int
qemuHandleDomainShutdown(qemuMonitorPtr mon ATTRIBUTE_UNUSED,
                         virDomainObjPtr vm)
{
    virDomainObjLock(vm);
    ((qemuDomainObjPrivatePtr) vm->privateData)->gotShutdown = true;
    virDomainObjUnlock(vm);

    return 0;
}


573 574 575 576 577 578 579 580 581 582 583 584 585 586 587 588 589 590 591 592 593 594 595 596 597 598 599 600 601 602 603 604
static int
qemuHandleDomainStop(qemuMonitorPtr mon ATTRIBUTE_UNUSED,
                     virDomainObjPtr vm)
{
    struct qemud_driver *driver = qemu_driver;
    virDomainEventPtr event = NULL;

    virDomainObjLock(vm);
    if (vm->state == VIR_DOMAIN_RUNNING) {
        VIR_DEBUG("Transitioned guest %s to paused state due to unknown event", vm->def->name);

        vm->state = VIR_DOMAIN_PAUSED;
        event = virDomainEventNewFromObj(vm,
                                         VIR_DOMAIN_EVENT_SUSPENDED,
                                         VIR_DOMAIN_EVENT_SUSPENDED_PAUSED);

        if (virDomainSaveStatus(driver->caps, driver->stateDir, vm) < 0)
            VIR_WARN("Unable to save status on vm %s after IO error", vm->def->name);
    }
    virDomainObjUnlock(vm);

    if (event) {
        qemuDriverLock(driver);
        if (event)
            qemuDomainEventQueue(driver, event);
        qemuDriverUnlock(driver);
    }

    return 0;
}


605 606 607 608 609 610 611 612 613 614 615 616 617 618 619 620 621 622 623 624 625 626 627 628 629 630 631 632 633
static int
qemuHandleDomainRTCChange(qemuMonitorPtr mon ATTRIBUTE_UNUSED,
                          virDomainObjPtr vm,
                          long long offset)
{
    struct qemud_driver *driver = qemu_driver;
    virDomainEventPtr event;

    virDomainObjLock(vm);
    event = virDomainEventRTCChangeNewFromObj(vm, offset);

    if (vm->def->clock.offset == VIR_DOMAIN_CLOCK_OFFSET_VARIABLE)
        vm->def->clock.data.adjustment = offset;

    if (virDomainSaveStatus(driver->caps, driver->stateDir, vm) < 0)
        VIR_WARN0("unable to save domain status with RTC change");

    virDomainObjUnlock(vm);

    if (event) {
        qemuDriverLock(driver);
        qemuDomainEventQueue(driver, event);
        qemuDriverUnlock(driver);
    }

    return 0;
}


634 635 636 637 638 639
static int
qemuHandleDomainWatchdog(qemuMonitorPtr mon ATTRIBUTE_UNUSED,
                         virDomainObjPtr vm,
                         int action)
{
    struct qemud_driver *driver = qemu_driver;
640 641
    virDomainEventPtr watchdogEvent = NULL;
    virDomainEventPtr lifecycleEvent = NULL;
642 643

    virDomainObjLock(vm);
644 645 646 647 648 649 650 651 652 653 654 655 656 657
    watchdogEvent = virDomainEventWatchdogNewFromObj(vm, action);

    if (action == VIR_DOMAIN_EVENT_WATCHDOG_PAUSE &&
        vm->state == VIR_DOMAIN_RUNNING) {
        VIR_DEBUG("Transitioned guest %s to paused state due to watchdog", vm->def->name);

        vm->state = VIR_DOMAIN_PAUSED;
        lifecycleEvent = virDomainEventNewFromObj(vm,
                                                  VIR_DOMAIN_EVENT_SUSPENDED,
                                                  VIR_DOMAIN_EVENT_SUSPENDED_WATCHDOG);

        if (virDomainSaveStatus(driver->caps, driver->stateDir, vm) < 0)
            VIR_WARN("Unable to save status on vm %s after IO error", vm->def->name);
    }
H
Hu Tao 已提交
658 659 660 661 662 663 664 665 666 667 668

    if (vm->def->watchdog->action == VIR_DOMAIN_WATCHDOG_ACTION_DUMP) {
        struct watchdogEvent *wdEvent;
        if (VIR_ALLOC(wdEvent) == 0) {
            wdEvent->action = VIR_DOMAIN_WATCHDOG_ACTION_DUMP;
            wdEvent->vm = vm;
            ignore_value(virThreadPoolSendJob(driver->workerPool, wdEvent));
        } else
            virReportOOMError();
    }

669 670
    virDomainObjUnlock(vm);

671
    if (watchdogEvent || lifecycleEvent) {
672
        qemuDriverLock(driver);
673 674 675 676
        if (watchdogEvent)
            qemuDomainEventQueue(driver, watchdogEvent);
        if (lifecycleEvent)
            qemuDomainEventQueue(driver, lifecycleEvent);
677 678 679 680 681 682 683
        qemuDriverUnlock(driver);
    }

    return 0;
}


684 685 686 687
static int
qemuHandleDomainIOError(qemuMonitorPtr mon ATTRIBUTE_UNUSED,
                        virDomainObjPtr vm,
                        const char *diskAlias,
688 689
                        int action,
                        const char *reason)
690 691
{
    struct qemud_driver *driver = qemu_driver;
692
    virDomainEventPtr ioErrorEvent = NULL;
693
    virDomainEventPtr ioErrorEvent2 = NULL;
694
    virDomainEventPtr lifecycleEvent = NULL;
695 696 697 698 699 700 701 702 703 704 705 706 707 708 709
    const char *srcPath;
    const char *devAlias;
    virDomainDiskDefPtr disk;

    virDomainObjLock(vm);
    disk = findDomainDiskByAlias(vm, diskAlias);

    if (disk) {
        srcPath = disk->src;
        devAlias = disk->info.alias;
    } else {
        srcPath = "";
        devAlias = "";
    }

710
    ioErrorEvent = virDomainEventIOErrorNewFromObj(vm, srcPath, devAlias, action);
711
    ioErrorEvent2 = virDomainEventIOErrorReasonNewFromObj(vm, srcPath, devAlias, action, reason);
712 713 714 715 716 717 718 719 720 721 722 723 724

    if (action == VIR_DOMAIN_EVENT_IO_ERROR_PAUSE &&
        vm->state == VIR_DOMAIN_RUNNING) {
        VIR_DEBUG("Transitioned guest %s to paused state due to IO error", vm->def->name);

        vm->state = VIR_DOMAIN_PAUSED;
        lifecycleEvent = virDomainEventNewFromObj(vm,
                                                  VIR_DOMAIN_EVENT_SUSPENDED,
                                                  VIR_DOMAIN_EVENT_SUSPENDED_IOERROR);

        if (virDomainSaveStatus(driver->caps, driver->stateDir, vm) < 0)
            VIR_WARN("Unable to save status on vm %s after IO error", vm->def->name);
    }
725 726
    virDomainObjUnlock(vm);

727
    if (ioErrorEvent || ioErrorEvent2 || lifecycleEvent) {
728
        qemuDriverLock(driver);
729 730
        if (ioErrorEvent)
            qemuDomainEventQueue(driver, ioErrorEvent);
731 732
        if (ioErrorEvent2)
            qemuDomainEventQueue(driver, ioErrorEvent2);
733 734
        if (lifecycleEvent)
            qemuDomainEventQueue(driver, lifecycleEvent);
735 736 737 738 739 740 741
        qemuDriverUnlock(driver);
    }

    return 0;
}


742 743 744 745 746 747 748 749 750 751 752 753 754 755 756 757 758 759 760 761 762 763 764 765 766 767 768 769 770 771 772 773 774 775 776 777 778 779 780 781 782 783 784 785 786 787 788 789 790 791 792 793 794 795 796 797 798 799 800 801 802 803 804 805 806 807 808 809 810 811 812 813 814 815 816 817 818 819 820 821 822 823 824 825 826 827 828 829 830 831 832 833
static int
qemuHandleDomainGraphics(qemuMonitorPtr mon ATTRIBUTE_UNUSED,
                         virDomainObjPtr vm,
                         int phase,
                         int localFamily,
                         const char *localNode,
                         const char *localService,
                         int remoteFamily,
                         const char *remoteNode,
                         const char *remoteService,
                         const char *authScheme,
                         const char *x509dname,
                         const char *saslUsername)
{
    struct qemud_driver *driver = qemu_driver;
    virDomainEventPtr event;
    virDomainEventGraphicsAddressPtr localAddr = NULL;
    virDomainEventGraphicsAddressPtr remoteAddr = NULL;
    virDomainEventGraphicsSubjectPtr subject = NULL;
    int i;

    virDomainObjLock(vm);

    if (VIR_ALLOC(localAddr) < 0)
        goto no_memory;
    localAddr->family = localFamily;
    if (!(localAddr->service = strdup(localService)) ||
        !(localAddr->node = strdup(localNode)))
        goto no_memory;

    if (VIR_ALLOC(remoteAddr) < 0)
        goto no_memory;
    remoteAddr->family = remoteFamily;
    if (!(remoteAddr->service = strdup(remoteService)) ||
        !(remoteAddr->node = strdup(remoteNode)))
        goto no_memory;

    if (VIR_ALLOC(subject) < 0)
        goto no_memory;
    if (x509dname) {
        if (VIR_REALLOC_N(subject->identities, subject->nidentity+1) < 0)
            goto no_memory;
        if (!(subject->identities[subject->nidentity].type = strdup("x509dname")) ||
            !(subject->identities[subject->nidentity].name = strdup(x509dname)))
            goto no_memory;
        subject->nidentity++;
    }
    if (saslUsername) {
        if (VIR_REALLOC_N(subject->identities, subject->nidentity+1) < 0)
            goto no_memory;
        if (!(subject->identities[subject->nidentity].type = strdup("saslUsername")) ||
            !(subject->identities[subject->nidentity].name = strdup(saslUsername)))
            goto no_memory;
        subject->nidentity++;
    }

    event = virDomainEventGraphicsNewFromObj(vm, phase, localAddr, remoteAddr, authScheme, subject);
    virDomainObjUnlock(vm);

    if (event) {
        qemuDriverLock(driver);
        qemuDomainEventQueue(driver, event);
        qemuDriverUnlock(driver);
    }

    return 0;

no_memory:
    virReportOOMError();
    if (localAddr) {
        VIR_FREE(localAddr->service);
        VIR_FREE(localAddr->node);
        VIR_FREE(localAddr);
    }
    if (remoteAddr) {
        VIR_FREE(remoteAddr->service);
        VIR_FREE(remoteAddr->node);
        VIR_FREE(remoteAddr);
    }
    if (subject) {
        for (i = 0 ; i < subject->nidentity ; i++) {
            VIR_FREE(subject->identities[i].type);
            VIR_FREE(subject->identities[i].name);
        }
        VIR_FREE(subject->identities);
        VIR_FREE(subject);
    }

    return -1;
}


834 835 836 837 838 839 840 841 842
static void qemuHandleMonitorDestroy(qemuMonitorPtr mon,
                                     virDomainObjPtr vm)
{
    qemuDomainObjPrivatePtr priv = vm->privateData;
    if (priv->mon == mon)
        priv->mon = NULL;
    virDomainObjUnref(vm);
}

843
static qemuMonitorCallbacks monitorCallbacks = {
844
    .destroy = qemuHandleMonitorDestroy,
845 846
    .eofNotify = qemuHandleMonitorEOF,
    .diskSecretLookup = findVolumeQcowPassphrase,
847
    .domainShutdown = qemuHandleDomainShutdown,
848
    .domainStop = qemuHandleDomainStop,
849
    .domainReset = qemuHandleDomainReset,
850
    .domainRTCChange = qemuHandleDomainRTCChange,
851
    .domainWatchdog = qemuHandleDomainWatchdog,
852
    .domainIOError = qemuHandleDomainIOError,
853
    .domainGraphics = qemuHandleDomainGraphics,
854 855
};

856
static int
857
qemuConnectMonitor(struct qemud_driver *driver, virDomainObjPtr vm)
858
{
859
    qemuDomainObjPrivatePtr priv = vm->privateData;
860
    int ret = -1;
861

862
    if (virSecurityManagerSetSocketLabel(driver->securityManager, vm) < 0) {
863 864
        VIR_ERROR(_("Failed to set security context for monitor for %s"),
                  vm->def->name);
865 866 867
        goto error;
    }

868 869 870 871 872 873 874 875 876 877 878
    /* Hold an extra reference because we can't allow 'vm' to be
     * deleted while the monitor is active */
    virDomainObjRef(vm);

    priv->mon = qemuMonitorOpen(vm,
                                priv->monConfig,
                                priv->monJSON,
                                &monitorCallbacks);

    if (priv->mon == NULL)
        virDomainObjUnref(vm);
879

880
    if (virSecurityManagerClearSocketLabel(driver->securityManager, vm) < 0) {
881 882
        VIR_ERROR(_("Failed to clear security context for monitor for %s"),
                  vm->def->name);
883
        goto error;
884
    }
885

886 887 888 889 890 891
    if (priv->mon == NULL) {
        VIR_INFO("Failed to connect monitor for %s", vm->def->name);
        goto error;
    }


892 893 894 895
    qemuDomainObjEnterMonitorWithDriver(driver, vm);
    ret = qemuMonitorSetCapabilities(priv->mon);
    qemuDomainObjExitMonitorWithDriver(driver, vm);

896
error:
897
    if (ret < 0)
898 899 900
        qemuMonitorClose(priv->mon);

    return ret;
901
}
902

903 904 905 906
struct virReconnectDomainData {
    virConnectPtr conn;
    struct qemud_driver *driver;
};
907 908 909
/*
 * Open an existing VM's monitor, re-detect VCPU threads
 * and re-reserve the security labels in use
910
 */
911 912
static void
qemuReconnectDomain(void *payload, const char *name ATTRIBUTE_UNUSED, void *opaque)
913
{
914
    virDomainObjPtr obj = payload;
915 916
    struct virReconnectDomainData *data = opaque;
    struct qemud_driver *driver = data->driver;
917
    qemuDomainObjPrivatePtr priv;
918
    unsigned long long qemuCmdFlags;
919
    virConnectPtr conn = data->conn;
920 921

    virDomainObjLock(obj);
922

923 924
    VIR_DEBUG("Reconnect monitor to %p '%s'", obj, obj->def->name);

925 926
    priv = obj->privateData;

927
    /* XXX check PID liveliness & EXE path */
928
    if (qemuConnectMonitor(driver, obj) < 0)
929
        goto error;
930

931 932 933 934
    if (qemuUpdateActivePciHostdevs(driver, obj->def) < 0) {
        goto error;
    }

935 936 937
    /* XXX we should be persisting the original flags in the XML
     * not re-detecting them, since the binary may have changed
     * since launch time */
938 939 940
    if (qemuCapsExtractVersionInfo(obj->def->emulator,
                                   NULL,
                                   &qemuCmdFlags) >= 0 &&
941
        (qemuCmdFlags & QEMUD_CMD_FLAG_DEVICE)) {
942 943
        priv->persistentAddrs = 1;

944 945 946 947
        if (!(priv->pciaddrs = qemuDomainPCIAddressSetCreate(obj->def)) ||
            qemuAssignDevicePCISlots(obj->def, priv->pciaddrs) < 0)
            goto error;
    }
948

949
    if (virSecurityManagerReserveLabel(driver->securityManager, obj) < 0)
950
        goto error;
951

952 953 954
    if (qemudVMFiltersInstantiate(conn, obj->def))
        goto error;

955 956
    if (obj->def->id >= driver->nextvmid)
        driver->nextvmid = obj->def->id + 1;
957

958 959
    virDomainObjUnlock(obj);
    return;
960

961
error:
962 963 964
    /* We can't get the monitor back, so must kill the VM
     * to remove danger of it ending up running twice if
     * user tries to start it again later */
965
    qemudShutdownVMDaemon(driver, obj, 0);
966 967 968 969
    if (!obj->persistent)
        virDomainRemoveInactive(&driver->domains, obj);
    else
        virDomainObjUnlock(obj);
970
}
971

972
/**
973
 * qemudReconnectDomains
974 975 976 977 978
 *
 * Try to re-open the resources for live VMs that we care
 * about.
 */
static void
979
qemuReconnectDomains(virConnectPtr conn, struct qemud_driver *driver)
980
{
981 982
    struct virReconnectDomainData data = {conn, driver};
    virHashForEach(driver->domains.objs, qemuReconnectDomain, &data);
983 984
}

985

986
static int
987
qemuSecurityInit(struct qemud_driver *driver)
988
{
989 990 991 992
    virSecurityManagerPtr mgr = virSecurityManagerNew(driver->securityDriverName,
                                                      driver->allowDiskFormatProbing);
    if (!mgr)
        goto error;
993

994 995 996 997 998 999 1000
    if (driver->privileged) {
        virSecurityManagerPtr dac = virSecurityManagerNewDAC(driver->user,
                                                             driver->group,
                                                             driver->allowDiskFormatProbing,
                                                             driver->dynamicOwnership);
        if (!dac)
            goto error;
1001

1002 1003 1004
        if (!(driver->securityManager = virSecurityManagerNewStack(mgr,
                                                                   dac)))
            goto error;
1005
    } else {
1006
        driver->securityManager = mgr;
1007 1008
    }

1009
    return 0;
1010 1011 1012 1013 1014

error:
    VIR_ERROR0(_("Failed to initialize security drivers"));
    virSecurityManagerFree(mgr);
    return -1;
1015
}
1016 1017


1018 1019
static virCapsPtr
qemuCreateCapabilities(virCapsPtr oldcaps,
1020
                       struct qemud_driver *driver)
1021 1022 1023 1024
{
    virCapsPtr caps;

    /* Basic host arch / guest machine capabilities */
1025
    if (!(caps = qemuCapsInit(oldcaps))) {
1026
        virReportOOMError();
1027 1028 1029
        return NULL;
    }

1030 1031 1032 1033 1034 1035 1036 1037
    if (driver->allowDiskFormatProbing) {
        caps->defaultDiskDriverName = NULL;
        caps->defaultDiskDriverType = NULL;
    } else {
        caps->defaultDiskDriverName = "qemu";
        caps->defaultDiskDriverType = "raw";
    }

1038 1039
    qemuDomainSetPrivateDataHooks(caps);
    qemuDomainSetNamespaceHooks(caps);
1040

1041 1042 1043 1044 1045
    if (virGetHostUUID(caps->host.host_uuid)) {
        qemuReportError(VIR_ERR_INTERNAL_ERROR,
                         "%s", _("cannot get the host uuid"));
        goto err_exit;
    }
1046 1047

    /* Security driver data */
1048
    const char *doi, *model;
1049

1050 1051 1052
    doi = virSecurityManagerGetDOI(driver->securityManager);
    model = virSecurityManagerGetModel(driver->securityManager);
    if (STRNEQ(model, "none")) {
1053 1054 1055 1056 1057 1058
        if (!(caps->host.secModel.model = strdup(model)))
            goto no_memory;
        if (!(caps->host.secModel.doi = strdup(doi)))
            goto no_memory;
    }

1059 1060 1061
    VIR_DEBUG("Initialized caps for security driver \"%s\" with "
              "DOI \"%s\"", model, doi);

1062 1063 1064
    return caps;

no_memory:
1065
    virReportOOMError();
1066
err_exit:
1067 1068 1069
    virCapabilitiesFree(caps);
    return NULL;
}
1070

C
Chris Lalancette 已提交
1071 1072 1073 1074 1075 1076 1077 1078 1079 1080 1081 1082 1083 1084 1085 1086 1087
static void qemuDomainSnapshotLoad(void *payload,
                                   const char *name ATTRIBUTE_UNUSED,
                                   void *data)
{
    virDomainObjPtr vm = (virDomainObjPtr)payload;
    char *baseDir = (char *)data;
    char *snapDir = NULL;
    DIR *dir = NULL;
    struct dirent *entry;
    char *xmlStr;
    int ret;
    char *fullpath;
    virDomainSnapshotDefPtr def = NULL;
    char ebuf[1024];

    virDomainObjLock(vm);
    if (virAsprintf(&snapDir, "%s/%s", baseDir, vm->def->name) < 0) {
1088
        VIR_ERROR(_("Failed to allocate memory for snapshot directory for domain %s"),
C
Chris Lalancette 已提交
1089 1090 1091 1092 1093 1094 1095 1096 1097
                   vm->def->name);
        goto cleanup;
    }

    VIR_INFO("Scanning for snapshots for domain %s in %s", vm->def->name,
             snapDir);

    if (!(dir = opendir(snapDir))) {
        if (errno != ENOENT)
1098
            VIR_ERROR(_("Failed to open snapshot directory %s for domain %s: %s"),
C
Chris Lalancette 已提交
1099 1100 1101 1102 1103 1104 1105 1106 1107 1108 1109 1110 1111 1112
                      snapDir, vm->def->name,
                      virStrerror(errno, ebuf, sizeof(ebuf)));
        goto cleanup;
    }

    while ((entry = readdir(dir))) {
        if (entry->d_name[0] == '.')
            continue;

        /* NB: ignoring errors, so one malformed config doesn't
           kill the whole process */
        VIR_INFO("Loading snapshot file '%s'", entry->d_name);

        if (virAsprintf(&fullpath, "%s/%s", snapDir, entry->d_name) < 0) {
1113
            VIR_ERROR0(_("Failed to allocate memory for path"));
C
Chris Lalancette 已提交
1114 1115 1116 1117 1118 1119
            continue;
        }

        ret = virFileReadAll(fullpath, 1024*1024*1, &xmlStr);
        if (ret < 0) {
            /* Nothing we can do here, skip this one */
1120
            VIR_ERROR(_("Failed to read snapshot file %s: %s"), fullpath,
C
Chris Lalancette 已提交
1121
                      virStrerror(errno, ebuf, sizeof(ebuf)));
1122
            VIR_FREE(fullpath);
C
Chris Lalancette 已提交
1123 1124 1125 1126 1127 1128
            continue;
        }

        def = virDomainSnapshotDefParseString(xmlStr, 0);
        if (def == NULL) {
            /* Nothing we can do here, skip this one */
1129
            VIR_ERROR(_("Failed to parse snapshot XML from file '%s'"), fullpath);
1130
            VIR_FREE(fullpath);
C
Chris Lalancette 已提交
1131 1132 1133 1134
            VIR_FREE(xmlStr);
            continue;
        }

1135
        virDomainSnapshotAssignDef(&vm->snapshots, def);
C
Chris Lalancette 已提交
1136

1137
        VIR_FREE(fullpath);
C
Chris Lalancette 已提交
1138 1139 1140 1141 1142 1143 1144 1145 1146 1147 1148 1149 1150 1151 1152 1153 1154 1155 1156 1157 1158
        VIR_FREE(xmlStr);
    }

    /* FIXME: qemu keeps internal track of snapshots.  We can get access
     * to this info via the "info snapshots" monitor command for running
     * domains, or via "qemu-img snapshot -l" for shutoff domains.  It would
     * be nice to update our internal state based on that, but there is a
     * a problem.  qemu doesn't track all of the same metadata that we do.
     * In particular we wouldn't be able to fill in the <parent>, which is
     * pretty important in our metadata.
     */

    virResetLastError();

cleanup:
    if (dir)
        closedir(dir);
    VIR_FREE(snapDir);
    virDomainObjUnlock(vm);
}

1159 1160 1161 1162 1163 1164
/**
 * qemudStartup:
 *
 * Initialization function for the QEmu daemon
 */
static int
1165
qemudStartup(int privileged) {
1166
    char *base = NULL;
1167
    char *driverConf = NULL;
1168
    int rc;
1169
    virConnectPtr conn = NULL;
1170

1171
    if (VIR_ALLOC(qemu_driver) < 0)
1172 1173
        return -1;

1174
    if (virMutexInit(&qemu_driver->lock) < 0) {
1175
        VIR_ERROR0(_("cannot initialize mutex"));
1176 1177 1178
        VIR_FREE(qemu_driver);
        return -1;
    }
1179
    qemuDriverLock(qemu_driver);
1180
    qemu_driver->privileged = privileged;
1181

1182 1183 1184
    /* Don't have a dom0 so start from 1 */
    qemu_driver->nextvmid = 1;

1185 1186 1187
    if (virDomainObjListInit(&qemu_driver->domains) < 0)
        goto out_of_memory;

1188
    /* Init callback list */
1189
    if (VIR_ALLOC(qemu_driver->domainEventCallbacks) < 0)
1190
        goto out_of_memory;
1191 1192 1193 1194 1195 1196
    if (!(qemu_driver->domainEventQueue = virDomainEventQueueNew()))
        goto out_of_memory;

    if ((qemu_driver->domainEventTimer =
         virEventAddTimeout(-1, qemuDomainEventFlush, qemu_driver, NULL)) < 0)
        goto error;
1197

1198 1199 1200 1201 1202
    /* Allocate bitmap for vnc port reservation */
    if ((qemu_driver->reservedVNCPorts =
         virBitmapAlloc(QEMU_VNC_PORT_MAX - QEMU_VNC_PORT_MIN)) == NULL)
        goto out_of_memory;

1203 1204 1205 1206
    /* read the host sysinfo */
    if (privileged)
        qemu_driver->hostsysinfo = virSysinfoRead();

1207
    if (privileged) {
1208
        if (virAsprintf(&qemu_driver->logDir,
1209
                        "%s/log/libvirt/qemu", LOCALSTATEDIR) == -1)
1210
            goto out_of_memory;
1211

1212
        if ((base = strdup (SYSCONFDIR "/libvirt")) == NULL)
1213
            goto out_of_memory;
1214 1215

        if (virAsprintf(&qemu_driver->stateDir,
1216
                      "%s/run/libvirt/qemu", LOCALSTATEDIR) == -1)
1217
            goto out_of_memory;
1218 1219

        if (virAsprintf(&qemu_driver->libDir,
1220
                      "%s/lib/libvirt/qemu", LOCALSTATEDIR) == -1)
1221 1222 1223
            goto out_of_memory;

        if (virAsprintf(&qemu_driver->cacheDir,
1224
                      "%s/cache/libvirt/qemu", LOCALSTATEDIR) == -1)
1225
            goto out_of_memory;
1226
        if (virAsprintf(&qemu_driver->saveDir,
1227
                      "%s/lib/libvirt/qemu/save", LOCALSTATEDIR) == -1)
1228
            goto out_of_memory;
C
Chris Lalancette 已提交
1229
        if (virAsprintf(&qemu_driver->snapshotDir,
1230
                        "%s/lib/libvirt/qemu/snapshot", LOCALSTATEDIR) == -1)
C
Chris Lalancette 已提交
1231
            goto out_of_memory;
H
Hu Tao 已提交
1232 1233 1234
        if (virAsprintf(&qemu_driver->autoDumpPath,
                        "%s/lib/libvirt/qemu/dump", LOCALSTATEDIR) == -1)
            goto out_of_memory;
1235
    } else {
1236
        uid_t uid = geteuid();
1237
        char *userdir = virGetUserDirectory(uid);
1238
        if (!userdir)
1239
            goto error;
1240

1241
        if (virAsprintf(&qemu_driver->logDir,
1242 1243
                        "%s/.libvirt/qemu/log", userdir) == -1) {
            VIR_FREE(userdir);
1244
            goto out_of_memory;
1245
        }
1246

1247 1248
        if (virAsprintf(&base, "%s/.libvirt", userdir) == -1) {
            VIR_FREE(userdir);
1249
            goto out_of_memory;
1250 1251
        }
        VIR_FREE(userdir);
1252 1253 1254

        if (virAsprintf(&qemu_driver->stateDir, "%s/qemu/run", base) == -1)
            goto out_of_memory;
1255 1256 1257 1258
        if (virAsprintf(&qemu_driver->libDir, "%s/qemu/lib", base) == -1)
            goto out_of_memory;
        if (virAsprintf(&qemu_driver->cacheDir, "%s/qemu/cache", base) == -1)
            goto out_of_memory;
1259 1260
        if (virAsprintf(&qemu_driver->saveDir, "%s/qemu/save", base) == -1)
            goto out_of_memory;
C
Chris Lalancette 已提交
1261 1262
        if (virAsprintf(&qemu_driver->snapshotDir, "%s/qemu/snapshot", base) == -1)
            goto out_of_memory;
H
Hu Tao 已提交
1263 1264
        if (virAsprintf(&qemu_driver->autoDumpPath, "%s/qemu/dump", base) == -1)
            goto out_of_memory;
1265 1266
    }

L
Laine Stump 已提交
1267
    if (virFileMakePath(qemu_driver->stateDir) != 0) {
1268
        char ebuf[1024];
1269
        VIR_ERROR(_("Failed to create state dir '%s': %s"),
1270
                  qemu_driver->stateDir, virStrerror(errno, ebuf, sizeof ebuf));
1271
        goto error;
1272
    }
L
Laine Stump 已提交
1273
    if (virFileMakePath(qemu_driver->libDir) != 0) {
1274
        char ebuf[1024];
1275
        VIR_ERROR(_("Failed to create lib dir '%s': %s"),
1276 1277 1278
                  qemu_driver->libDir, virStrerror(errno, ebuf, sizeof ebuf));
        goto error;
    }
L
Laine Stump 已提交
1279
    if (virFileMakePath(qemu_driver->cacheDir) != 0) {
1280
        char ebuf[1024];
1281
        VIR_ERROR(_("Failed to create cache dir '%s': %s"),
1282 1283 1284
                  qemu_driver->cacheDir, virStrerror(errno, ebuf, sizeof ebuf));
        goto error;
    }
1285 1286 1287 1288 1289 1290
    if (virFileMakePath(qemu_driver->saveDir) != 0) {
        char ebuf[1024];
        VIR_ERROR(_("Failed to create save dir '%s': %s"),
                  qemu_driver->saveDir, virStrerror(errno, ebuf, sizeof ebuf));
        goto error;
    }
C
Chris Lalancette 已提交
1291 1292 1293 1294 1295 1296
    if (virFileMakePath(qemu_driver->snapshotDir) != 0) {
        char ebuf[1024];
        VIR_ERROR(_("Failed to create save dir '%s': %s"),
                  qemu_driver->snapshotDir, virStrerror(errno, ebuf, sizeof ebuf));
        goto error;
    }
H
Hu Tao 已提交
1297 1298 1299 1300 1301 1302
    if (virFileMakePath(qemu_driver->autoDumpPath) != 0) {
        char ebuf[1024];
        VIR_ERROR(_("Failed to create dump dir '%s': %s"),
                  qemu_driver->autoDumpPath, virStrerror(errno, ebuf, sizeof ebuf));
        goto error;
    }
1303 1304 1305 1306

    /* Configuration paths are either ~/.libvirt/qemu/... (session) or
     * /etc/libvirt/qemu/... (system).
     */
1307 1308 1309
    if (virAsprintf(&driverConf, "%s/qemu.conf", base) < 0 ||
        virAsprintf(&qemu_driver->configDir, "%s/qemu", base) < 0 ||
        virAsprintf(&qemu_driver->autostartDir, "%s/qemu/autostart", base) < 0)
1310 1311
        goto out_of_memory;

1312
    VIR_FREE(base);
1313

1314 1315 1316 1317 1318 1319 1320
    rc = virCgroupForDriver("qemu", &qemu_driver->cgroup, privileged, 1);
    if (rc < 0) {
        char buf[1024];
        VIR_WARN("Unable to create cgroup for driver: %s",
                 virStrerror(-rc, buf, sizeof(buf)));
    }

1321 1322 1323
    if (qemudLoadDriverConfig(qemu_driver, driverConf) < 0) {
        goto error;
    }
1324
    VIR_FREE(driverConf);
1325

1326
    if (qemuSecurityInit(qemu_driver) < 0)
1327
        goto error;
D
Daniel P. Berrange 已提交
1328

1329
    if ((qemu_driver->caps = qemuCreateCapabilities(NULL,
1330
                                                    qemu_driver)) == NULL)
1331
        goto error;
1332

1333
    if ((qemu_driver->activePciHostdevs = pciDeviceListNew()) == NULL)
1334 1335
        goto error;

1336 1337
    if (privileged) {
        if (chown(qemu_driver->libDir, qemu_driver->user, qemu_driver->group) < 0) {
1338
            virReportSystemError(errno,
1339 1340 1341 1342 1343
                                 _("unable to set ownership of '%s' to user %d:%d"),
                                 qemu_driver->libDir, qemu_driver->user, qemu_driver->group);
            goto error;
        }
        if (chown(qemu_driver->cacheDir, qemu_driver->user, qemu_driver->group) < 0) {
1344
            virReportSystemError(errno,
1345 1346 1347 1348
                                 _("unable to set ownership of '%s' to %d:%d"),
                                 qemu_driver->cacheDir, qemu_driver->user, qemu_driver->group);
            goto error;
        }
1349 1350 1351 1352 1353 1354
        if (chown(qemu_driver->saveDir, qemu_driver->user, qemu_driver->group) < 0) {
            virReportSystemError(errno,
                                 _("unable to set ownership of '%s' to %d:%d"),
                                 qemu_driver->saveDir, qemu_driver->user, qemu_driver->group);
            goto error;
        }
C
Chris Lalancette 已提交
1355 1356 1357 1358 1359 1360
        if (chown(qemu_driver->snapshotDir, qemu_driver->user, qemu_driver->group) < 0) {
            virReportSystemError(errno,
                                 _("unable to set ownership of '%s' to %d:%d"),
                                 qemu_driver->snapshotDir, qemu_driver->user, qemu_driver->group);
            goto error;
        }
1361 1362
    }

1363 1364 1365 1366 1367 1368 1369 1370 1371 1372 1373 1374 1375 1376
    /* If hugetlbfs is present, then we need to create a sub-directory within
     * it, since we can't assume the root mount point has permissions that
     * will let our spawned QEMU instances use it.
     *
     * NB the check for '/', since user may config "" to disable hugepages
     * even when mounted
     */
    if (qemu_driver->hugetlbfs_mount &&
        qemu_driver->hugetlbfs_mount[0] == '/') {
        char *mempath = NULL;
        if (virAsprintf(&mempath, "%s/libvirt/qemu", qemu_driver->hugetlbfs_mount) < 0)
            goto out_of_memory;

        if ((rc = virFileMakePath(mempath)) != 0) {
1377
            virReportSystemError(rc,
1378 1379 1380 1381 1382 1383
                                 _("unable to create hugepage path %s"), mempath);
            VIR_FREE(mempath);
            goto error;
        }
        if (qemu_driver->privileged &&
            chown(mempath, qemu_driver->user, qemu_driver->group) < 0) {
1384
            virReportSystemError(errno,
1385 1386 1387 1388 1389 1390 1391 1392 1393
                                 _("unable to set ownership on %s to %d:%d"),
                                 mempath, qemu_driver->user, qemu_driver->group);
            VIR_FREE(mempath);
            goto error;
        }

        qemu_driver->hugepage_path = mempath;
    }

1394
    /* Get all the running persistent or transient configs first */
1395
    if (virDomainLoadAllConfigs(qemu_driver->caps,
1396 1397 1398 1399 1400 1401
                                &qemu_driver->domains,
                                qemu_driver->stateDir,
                                NULL,
                                1, NULL, NULL) < 0)
        goto error;

1402 1403 1404 1405 1406
    conn = virConnectOpen(qemu_driver->privileged ?
                          "qemu:///system" :
                          "qemu:///session");

    qemuReconnectDomains(conn, qemu_driver);
1407 1408

    /* Then inactive persistent configs */
1409
    if (virDomainLoadAllConfigs(qemu_driver->caps,
1410 1411
                                &qemu_driver->domains,
                                qemu_driver->configDir,
1412
                                qemu_driver->autostartDir,
1413
                                0, NULL, NULL) < 0)
1414
        goto error;
C
Chris Lalancette 已提交
1415 1416 1417 1418 1419


    virHashForEach(qemu_driver->domains.objs, qemuDomainSnapshotLoad,
                   qemu_driver->snapshotDir);

1420 1421
    qemuDriverUnlock(qemu_driver);

1422 1423
    qemudAutostartConfigs(qemu_driver);

H
Hu Tao 已提交
1424 1425 1426 1427
    qemu_driver->workerPool = virThreadPoolNew(0, 1, processWatchdogEvent, qemu_driver);
    if (!qemu_driver->workerPool)
        goto error;

1428 1429
    if (conn)
        virConnectClose(conn);
1430

1431 1432
    return 0;

1433
out_of_memory:
1434
    virReportOOMError();
1435 1436 1437
error:
    if (qemu_driver)
        qemuDriverUnlock(qemu_driver);
1438 1439
    if (conn)
        virConnectClose(conn);
1440
    VIR_FREE(base);
1441
    VIR_FREE(driverConf);
1442
    qemudShutdown();
1443 1444 1445
    return -1;
}

1446 1447 1448 1449
static void qemudNotifyLoadDomain(virDomainObjPtr vm, int newVM, void *opaque)
{
    struct qemud_driver *driver = opaque;

1450 1451 1452 1453 1454 1455 1456 1457
    if (newVM) {
        virDomainEventPtr event =
            virDomainEventNewFromObj(vm,
                                     VIR_DOMAIN_EVENT_DEFINED,
                                     VIR_DOMAIN_EVENT_DEFINED_ADDED);
        if (event)
            qemuDomainEventQueue(driver, event);
    }
1458 1459
}

1460 1461 1462 1463 1464 1465 1466 1467
/**
 * qemudReload:
 *
 * Function to restart the QEmu daemon, it will recheck the configuration
 * files and update its state and the networking
 */
static int
qemudReload(void) {
1468 1469 1470
    if (!qemu_driver)
        return 0;

1471
    qemuDriverLock(qemu_driver);
1472
    virDomainLoadAllConfigs(qemu_driver->caps,
1473 1474
                            &qemu_driver->domains,
                            qemu_driver->configDir,
1475
                            qemu_driver->autostartDir,
1476
                            0, qemudNotifyLoadDomain, qemu_driver);
1477
    qemuDriverUnlock(qemu_driver);
1478

1479
    qemudAutostartConfigs(qemu_driver);
1480 1481

    return 0;
1482 1483
}

1484 1485 1486 1487 1488 1489 1490 1491 1492 1493
/**
 * qemudActive:
 *
 * Checks if the QEmu daemon is active, i.e. has an active domain or
 * an active network
 *
 * Returns 1 if active, 0 otherwise
 */
static int
qemudActive(void) {
1494
    int active = 0;
1495

1496 1497 1498
    if (!qemu_driver)
        return 0;

1499
    /* XXX having to iterate here is not great because it requires many locks */
1500
    qemuDriverLock(qemu_driver);
1501
    active = virDomainObjListNumOfDomains(&qemu_driver->domains, 1);
1502 1503
    qemuDriverUnlock(qemu_driver);
    return active;
1504 1505
}

1506 1507 1508 1509 1510 1511 1512
/**
 * qemudShutdown:
 *
 * Shutdown the QEmu daemon, it will stop all active domains and networks
 */
static int
qemudShutdown(void) {
1513
    int i;
1514

1515
    if (!qemu_driver)
1516
        return -1;
1517

1518
    qemuDriverLock(qemu_driver);
1519
    pciDeviceListFree(qemu_driver->activePciHostdevs);
1520 1521
    virCapabilitiesFree(qemu_driver->caps);

1522
    virDomainObjListDeinit(&qemu_driver->domains);
1523
    virBitmapFree(qemu_driver->reservedVNCPorts);
1524

1525 1526
    virSysinfoDefFree(qemu_driver->hostsysinfo);

1527 1528
    VIR_FREE(qemu_driver->configDir);
    VIR_FREE(qemu_driver->autostartDir);
E
Eric Blake 已提交
1529
    VIR_FREE(qemu_driver->logDir);
1530
    VIR_FREE(qemu_driver->stateDir);
1531 1532
    VIR_FREE(qemu_driver->libDir);
    VIR_FREE(qemu_driver->cacheDir);
1533
    VIR_FREE(qemu_driver->saveDir);
C
Chris Lalancette 已提交
1534
    VIR_FREE(qemu_driver->snapshotDir);
H
Hu Tao 已提交
1535
    VIR_FREE(qemu_driver->autoDumpPath);
1536
    VIR_FREE(qemu_driver->vncTLSx509certdir);
J
Jim Meyering 已提交
1537
    VIR_FREE(qemu_driver->vncListen);
1538
    VIR_FREE(qemu_driver->vncPassword);
1539
    VIR_FREE(qemu_driver->vncSASLdir);
E
Eric Blake 已提交
1540 1541 1542
    VIR_FREE(qemu_driver->spiceTLSx509certdir);
    VIR_FREE(qemu_driver->spiceListen);
    VIR_FREE(qemu_driver->spicePassword);
1543 1544
    VIR_FREE(qemu_driver->hugetlbfs_mount);
    VIR_FREE(qemu_driver->hugepage_path);
E
Eric Blake 已提交
1545 1546 1547
    VIR_FREE(qemu_driver->saveImageFormat);
    VIR_FREE(qemu_driver->dumpImageFormat);

1548 1549
    virSecurityManagerFree(qemu_driver->securityManager);

E
Eric Blake 已提交
1550
    ebtablesContextFree(qemu_driver->ebtables);
D
Daniel P. Berrange 已提交
1551

1552 1553 1554 1555 1556 1557
    if (qemu_driver->cgroupDeviceACL) {
        for (i = 0 ; qemu_driver->cgroupDeviceACL[i] != NULL ; i++)
            VIR_FREE(qemu_driver->cgroupDeviceACL[i]);
        VIR_FREE(qemu_driver->cgroupDeviceACL);
    }

1558 1559
    /* Free domain callback list */
    virDomainEventCallbackListFree(qemu_driver->domainEventCallbacks);
1560 1561 1562 1563
    virDomainEventQueueFree(qemu_driver->domainEventQueue);

    if (qemu_driver->domainEventTimer != -1)
        virEventRemoveTimeout(qemu_driver->domainEventTimer);
1564

1565 1566 1567
    if (qemu_driver->brctl)
        brShutdown(qemu_driver->brctl);

1568 1569
    virCgroupFree(&qemu_driver->cgroup);

1570
    qemuDriverUnlock(qemu_driver);
1571
    virMutexDestroy(&qemu_driver->lock);
H
Hu Tao 已提交
1572
    virThreadPoolFree(qemu_driver->workerPool);
1573
    VIR_FREE(qemu_driver);
1574 1575

    return 0;
1576 1577
}

1578
typedef int qemuLogHandleOutput(virDomainObjPtr vm,
1579 1580
                                const char *output,
                                int fd);
1581 1582 1583 1584 1585

/*
 * Returns -1 for error, 0 on success
 */
static int
1586
qemudReadLogOutput(virDomainObjPtr vm,
1587 1588
                   int fd,
                   char *buf,
G
Guido Günther 已提交
1589
                   size_t buflen,
1590
                   qemuLogHandleOutput func,
1591 1592 1593
                   const char *what,
                   int timeout)
{
1594
    int retries = (timeout*10);
1595
    int got = 0;
1596 1597 1598
    buf[0] = '\0';

    while (retries) {
1599
        ssize_t func_ret, ret;
1600
        int isdead = 0;
G
Guido Günther 已提交
1601

1602
        func_ret = func(vm, buf, fd);
1603

1604 1605
        if (kill(vm->pid, 0) == -1 && errno == ESRCH)
            isdead = 1;
1606

1607 1608
        /* Any failures should be detected before we read the log, so we
         * always have something useful to report on failure. */
1609 1610
        ret = saferead(fd, buf+got, buflen-got-1);
        if (ret < 0) {
1611
            virReportSystemError(errno,
1612 1613 1614 1615 1616
                                 _("Failure while reading %s log output"),
                                 what);
            return -1;
        }

1617 1618 1619
        got += ret;
        buf[got] = '\0';
        if (got == buflen-1) {
1620
            qemuReportError(VIR_ERR_INTERNAL_ERROR,
1621 1622
                            _("Out of space while reading %s log output: %s"),
                            what, buf);
1623 1624 1625 1626
            return -1;
        }

        if (isdead) {
1627
            qemuReportError(VIR_ERR_INTERNAL_ERROR,
1628 1629
                            _("Process exited while reading %s log output: %s"),
                            what, buf);
1630 1631 1632
            return -1;
        }

1633 1634
        if (func_ret <= 0)
            return func_ret;
1635 1636 1637 1638

        usleep(100*1000);
        retries--;
    }
1639

1640
    qemuReportError(VIR_ERR_INTERNAL_ERROR,
1641 1642
                    _("Timed out while reading %s log output: %s"),
                    what, buf);
1643 1644 1645
    return -1;
}

1646

1647 1648 1649 1650 1651 1652 1653 1654
/*
 * Look at a chunk of data from the QEMU stdout logs and try to
 * find a TTY device, as indicated by a line like
 *
 * char device redirected to /dev/pts/3
 *
 * Returns -1 for error, 0 success, 1 continue reading
 */
1655
static int
1656
qemudExtractTTYPath(const char *haystack,
1657 1658
                    size_t *offset,
                    char **path)
1659
{
1660
    static const char needle[] = "char device redirected to";
1661
    char *tmp, *dev;
1662

1663
    VIR_FREE(*path);
1664
    /* First look for our magic string */
1665 1666 1667 1668 1669
    if (!(tmp = strstr(haystack + *offset, needle))) {
        return 1;
    }
    tmp += sizeof(needle);
    dev = tmp;
1670

1671 1672 1673 1674 1675
    /*
     * And look for first whitespace character and nul terminate
     * to mark end of the pty path
     */
    while (*tmp) {
1676
        if (c_isspace(*tmp)) {
1677 1678
            *path = strndup(dev, tmp-dev);
            if (*path == NULL) {
1679
                virReportOOMError();
1680 1681
                return -1;
            }
1682

1683
            /* ... now further update offset till we get EOL */
1684
            *offset = tmp - haystack;
1685 1686
            return 0;
        }
1687
        tmp++;
1688 1689 1690 1691 1692
    }

    /*
     * We found a path, but didn't find any whitespace,
     * so it must be still incomplete - we should at
1693 1694
     * least see a \n - indicate that we want to carry
     * on trying again
1695
     */
1696
    return 1;
1697 1698
}

1699
static int
1700
qemudFindCharDevicePTYsMonitor(virDomainObjPtr vm,
1701 1702 1703 1704 1705 1706 1707
                               virHashTablePtr paths)
{
    int i;

#define LOOKUP_PTYS(array, arraylen, idprefix)                            \
    for (i = 0 ; i < (arraylen) ; i++) {                                  \
        virDomainChrDefPtr chr = (array)[i];                              \
1708
        if (chr->source.type == VIR_DOMAIN_CHR_TYPE_PTY) {                \
1709 1710 1711 1712 1713 1714 1715
            char id[16];                                                  \
                                                                          \
            if (snprintf(id, sizeof(id), idprefix "%i", i) >= sizeof(id)) \
                return -1;                                                \
                                                                          \
            const char *path = (const char *) virHashLookup(paths, id);   \
            if (path == NULL) {                                           \
1716
                if (chr->source.data.file.path == NULL) {                 \
1717 1718
                    /* neither the log output nor 'info chardev' had a */ \
                    /* pty path for this chardev, report an error */      \
1719 1720 1721
                    qemuReportError(VIR_ERR_INTERNAL_ERROR,               \
                                    _("no assigned pty for device %s"), id); \
                    return -1;                                            \
1722 1723 1724 1725 1726
                } else {                                                  \
                    /* 'info chardev' had no pty path for this chardev, */\
                    /* but the log output had, so we're fine */           \
                    continue;                                             \
                }                                                         \
1727 1728
            }                                                             \
                                                                          \
1729 1730
            VIR_FREE(chr->source.data.file.path);                         \
            chr->source.data.file.path = strdup(path);                    \
1731
                                                                          \
1732
            if (chr->source.data.file.path == NULL) {                     \
1733
                virReportOOMError();                                      \
1734 1735
                return -1;                                                \
            }                                                             \
1736 1737 1738 1739 1740 1741
        }                                                                 \
    }

    LOOKUP_PTYS(vm->def->serials,   vm->def->nserials,   "serial");
    LOOKUP_PTYS(vm->def->parallels, vm->def->nparallels, "parallel");
    LOOKUP_PTYS(vm->def->channels,  vm->def->nchannels,  "channel");
C
Cole Robinson 已提交
1742 1743
    if (vm->def->console)
        LOOKUP_PTYS(&vm->def->console, 1,  "console");
1744
#undef LOOKUP_PTYS
1745 1746 1747 1748

    return 0;
}

1749
static int
1750
qemudFindCharDevicePTYs(virDomainObjPtr vm,
1751 1752
                        const char *output,
                        int fd ATTRIBUTE_UNUSED)
1753
{
1754
    size_t offset = 0;
1755
    int ret, i;
1756 1757

    /* The order in which QEMU prints out the PTY paths is
1758 1759
       the order in which it procsses its serial and parallel
       device args. This code must match that ordering.... */
1760

1761
    /* first comes the serial devices */
1762 1763
    for (i = 0 ; i < vm->def->nserials ; i++) {
        virDomainChrDefPtr chr = vm->def->serials[i];
1764
        if (chr->source.type == VIR_DOMAIN_CHR_TYPE_PTY) {
1765
            if ((ret = qemudExtractTTYPath(output, &offset,
1766
                                           &chr->source.data.file.path)) != 0)
1767
                return ret;
1768 1769 1770
        }
    }

1771
    /* then the parallel devices */
1772 1773
    for (i = 0 ; i < vm->def->nparallels ; i++) {
        virDomainChrDefPtr chr = vm->def->parallels[i];
1774
        if (chr->source.type == VIR_DOMAIN_CHR_TYPE_PTY) {
1775
            if ((ret = qemudExtractTTYPath(output, &offset,
1776
                                           &chr->source.data.file.path)) != 0)
1777
                return ret;
1778 1779 1780
        }
    }

1781 1782 1783
    /* then the channel devices */
    for (i = 0 ; i < vm->def->nchannels ; i++) {
        virDomainChrDefPtr chr = vm->def->channels[i];
1784
        if (chr->source.type == VIR_DOMAIN_CHR_TYPE_PTY) {
1785
            if ((ret = qemudExtractTTYPath(output, &offset,
1786
                                           &chr->source.data.file.path)) != 0)
1787 1788 1789 1790
                return ret;
        }
    }

1791
    return 0;
1792 1793
}

1794 1795 1796 1797 1798
static void qemudFreePtyPath(void *payload, const char *name ATTRIBUTE_UNUSED)
{
    VIR_FREE(payload);
}

1799 1800 1801 1802 1803 1804 1805 1806 1807 1808 1809 1810 1811 1812
static void
qemuReadLogFD(int logfd, char *buf, int maxlen, int off)
{
    int ret;
    char *tmpbuf = buf + off;

    ret = saferead(logfd, tmpbuf, maxlen - off - 1);
    if (ret < 0) {
        ret = 0;
    }

    tmpbuf[ret] = '\0';
}

1813
static int
1814
qemudWaitForMonitor(struct qemud_driver* driver,
1815
                    virDomainObjPtr vm, off_t pos)
1816
{
1817
    char buf[4096] = ""; /* Plenty of space to get startup greeting */
1818
    int logfd;
1819
    int ret = -1;
1820
    virHashTablePtr paths = NULL;
1821

1822
    if ((logfd = qemudLogReadFD(driver->logDir, vm->def->name, pos)) < 0)
1823
        return -1;
1824

1825 1826 1827 1828
    if (qemudReadLogOutput(vm, logfd, buf, sizeof(buf),
                           qemudFindCharDevicePTYs,
                           "console", 30) < 0)
        goto closelog;
1829

1830
    VIR_DEBUG("Connect monitor to %p '%s'", vm, vm->def->name);
1831 1832 1833
    if (qemuConnectMonitor(driver, vm) < 0) {
        goto cleanup;
    }
1834

1835 1836 1837 1838
    /* Try to get the pty path mappings again via the monitor. This is much more
     * reliable if it's available.
     * Note that the monitor itself can be on a pty, so we still need to try the
     * log output method. */
1839
    paths = virHashCreate(0);
1840
    if (paths == NULL) {
1841
        virReportOOMError();
1842 1843 1844
        goto cleanup;
    }

1845
    qemuDomainObjEnterMonitorWithDriver(driver, vm);
1846 1847
    qemuDomainObjPrivatePtr priv = vm->privateData;
    ret = qemuMonitorGetPtyPaths(priv->mon, paths);
1848
    qemuDomainObjExitMonitorWithDriver(driver, vm);
1849 1850 1851

    VIR_DEBUG("qemuMonitorGetPtyPaths returned %i", ret);
    if (ret == 0) {
1852
        ret = qemudFindCharDevicePTYsMonitor(vm, paths);
1853 1854 1855 1856 1857 1858 1859
    }

cleanup:
    if (paths) {
        virHashFree(paths, qemudFreePtyPath);
    }

1860 1861 1862 1863 1864 1865 1866 1867 1868 1869 1870
    if (kill(vm->pid, 0) == -1 && errno == ESRCH) {
        /* VM is dead, any other error raised in the interim is probably
         * not as important as the qemu cmdline output */
        qemuReadLogFD(logfd, buf, sizeof(buf), strlen(buf));
        qemuReportError(VIR_ERR_INTERNAL_ERROR,
                        _("process exited while connecting to monitor: %s"),
                        buf);
        ret = -1;
    }

closelog:
1871
    if (VIR_CLOSE(logfd) < 0) {
1872
        char ebuf[4096];
1873
        VIR_WARN("Unable to close logfile: %s",
1874 1875 1876
                 virStrerror(errno, ebuf, sizeof ebuf));
    }

1877
    return ret;
1878 1879
}

1880
static int
1881
qemuDetectVcpuPIDs(struct qemud_driver *driver,
1882 1883 1884
                   virDomainObjPtr vm) {
    pid_t *cpupids = NULL;
    int ncpupids;
1885
    qemuDomainObjPrivatePtr priv = vm->privateData;
1886

1887
    if (vm->def->virtType != VIR_DOMAIN_VIRT_KVM) {
1888 1889
        priv->nvcpupids = 1;
        if (VIR_ALLOC_N(priv->vcpupids, priv->nvcpupids) < 0) {
1890
            virReportOOMError();
1891 1892
            return -1;
        }
1893
        priv->vcpupids[0] = vm->pid;
1894 1895 1896
        return 0;
    }

1897
    /* What follows is now all KVM specific */
1898

1899
    qemuDomainObjEnterMonitorWithDriver(driver, vm);
1900
    if ((ncpupids = qemuMonitorGetCPUInfo(priv->mon, &cpupids)) < 0) {
1901
        qemuDomainObjExitMonitorWithDriver(driver, vm);
1902
        return -1;
1903
    }
1904
    qemuDomainObjExitMonitorWithDriver(driver, vm);
1905

1906 1907 1908
    /* Treat failure to get VCPU<->PID mapping as non-fatal */
    if (ncpupids == 0)
        return 0;
1909

1910
    if (ncpupids != vm->def->vcpus) {
1911
        qemuReportError(VIR_ERR_INTERNAL_ERROR,
E
Eric Blake 已提交
1912 1913 1914
                        _("got wrong number of vCPU pids from QEMU monitor. "
                          "got %d, wanted %d"),
                        ncpupids, vm->def->vcpus);
1915 1916 1917
        VIR_FREE(cpupids);
        return -1;
    }
1918

1919 1920
    priv->nvcpupids = ncpupids;
    priv->vcpupids = cpupids;
1921 1922 1923
    return 0;
}

1924 1925 1926
/*
 * To be run between fork/exec of QEMU only
 */
1927
static int
1928 1929
qemudInitCpuAffinity(virDomainObjPtr vm)
{
1930
    int i, hostcpus, maxcpu = QEMUD_CPUMASK_LEN;
1931
    virNodeInfo nodeinfo;
1932 1933
    unsigned char *cpumap;
    int cpumaplen;
1934 1935

    DEBUG0("Setting CPU affinity");
1936

1937
    if (nodeGetInfo(NULL, &nodeinfo) < 0)
1938 1939 1940 1941
        return -1;

    /* setaffinity fails if you set bits for CPUs which
     * aren't present, so we have to limit ourselves */
1942 1943 1944
    hostcpus = VIR_NODEINFO_MAXCPUS(nodeinfo);
    if (maxcpu > hostcpus)
        maxcpu = hostcpus;
1945

1946 1947
    cpumaplen = VIR_CPU_MAPLEN(maxcpu);
    if (VIR_ALLOC_N(cpumap, cpumaplen) < 0) {
1948
        virReportOOMError();
1949 1950 1951
        return -1;
    }

D
Daniel P. Berrange 已提交
1952
    if (vm->def->cpumask) {
1953 1954 1955
        /* XXX why don't we keep 'cpumask' in the libvirt cpumap
         * format to start with ?!?! */
        for (i = 0 ; i < maxcpu && i < vm->def->cpumasklen ; i++)
D
Daniel P. Berrange 已提交
1956
            if (vm->def->cpumask[i])
1957
                VIR_USE_CPU(cpumap, i);
D
Daniel P. Berrange 已提交
1958
    } else {
1959 1960 1961 1962
        /* You may think this is redundant, but we can't assume libvirtd
         * itself is running on all pCPUs, so we need to explicitly set
         * the spawned QEMU instance to all pCPUs if no map is given in
         * its config file */
D
Daniel P. Berrange 已提交
1963
        for (i = 0 ; i < maxcpu ; i++)
1964
            VIR_USE_CPU(cpumap, i);
D
Daniel P. Berrange 已提交
1965
    }
1966

1967 1968 1969 1970 1971 1972 1973 1974
    /* We are pressuming we are running between fork/exec of QEMU
     * so use '0' to indicate our own process ID. No threads are
     * running at this point
     */
    if (virProcessInfoSetAffinity(0, /* Self */
                                  cpumap, cpumaplen, maxcpu) < 0) {
        VIR_FREE(cpumap);
        return -1;
1975
    }
1976
    VIR_FREE(cpumap);
1977 1978 1979 1980 1981

    return 0;
}


1982
static int
1983 1984 1985 1986
qemuInitPasswords(virConnectPtr conn,
                  struct qemud_driver *driver,
                  virDomainObjPtr vm,
                  unsigned long long qemuCmdFlags) {
1987
    int ret = 0;
1988
    qemuDomainObjPrivatePtr priv = vm->privateData;
1989

1990 1991 1992 1993 1994 1995 1996 1997 1998 1999 2000 2001
    if (vm->def->ngraphics == 1) {
        if (vm->def->graphics[0]->type == VIR_DOMAIN_GRAPHICS_TYPE_VNC) {
            ret = qemuDomainChangeGraphicsPasswords(driver, vm,
                                                    VIR_DOMAIN_GRAPHICS_TYPE_VNC,
                                                    &vm->def->graphics[0]->data.vnc.auth,
                                                    driver->vncPassword);
        } else if (vm->def->graphics[0]->type == VIR_DOMAIN_GRAPHICS_TYPE_SPICE) {
            ret = qemuDomainChangeGraphicsPasswords(driver, vm,
                                                    VIR_DOMAIN_GRAPHICS_TYPE_SPICE,
                                                    &vm->def->graphics[0]->data.spice.auth,
                                                    driver->spicePassword);
        }
2002 2003
    }

2004 2005 2006 2007 2008 2009 2010 2011 2012 2013 2014 2015 2016 2017 2018 2019 2020 2021 2022 2023 2024 2025 2026
    if (ret < 0)
        goto cleanup;

    if (qemuCmdFlags & QEMUD_CMD_FLAG_DEVICE) {
        int i;

        for (i = 0 ; i < vm->def->ndisks ; i++) {
            char *secret;
            size_t secretLen;

            if (!vm->def->disks[i]->encryption ||
                !vm->def->disks[i]->src)
                continue;

            if (getVolumeQcowPassphrase(conn,
                                        vm->def->disks[i],
                                        &secret, &secretLen) < 0)
                goto cleanup;

            qemuDomainObjEnterMonitorWithDriver(driver, vm);
            ret = qemuMonitorSetDrivePassphrase(priv->mon,
                                                vm->def->disks[i]->info.alias,
                                                secret);
2027
            VIR_FREE(secret);
2028 2029 2030 2031 2032 2033 2034
            qemuDomainObjExitMonitorWithDriver(driver, vm);
            if (ret < 0)
                goto cleanup;
        }
    }

cleanup:
2035
    return ret;
2036 2037 2038
}


2039 2040 2041 2042 2043 2044 2045 2046 2047 2048 2049 2050
#define QEMU_PCI_VENDOR_INTEL     0x8086
#define QEMU_PCI_VENDOR_LSI_LOGIC 0x1000
#define QEMU_PCI_VENDOR_REDHAT    0x1af4
#define QEMU_PCI_VENDOR_CIRRUS    0x1013
#define QEMU_PCI_VENDOR_REALTEK   0x10ec
#define QEMU_PCI_VENDOR_AMD       0x1022
#define QEMU_PCI_VENDOR_ENSONIQ   0x1274
#define QEMU_PCI_VENDOR_VMWARE    0x15ad
#define QEMU_PCI_VENDOR_QEMU      0x1234

#define QEMU_PCI_PRODUCT_DISK_VIRTIO 0x1001

2051 2052
#define QEMU_PCI_PRODUCT_BALLOON_VIRTIO 0x1002

2053 2054 2055 2056 2057 2058 2059 2060 2061 2062 2063 2064 2065 2066 2067 2068 2069 2070 2071 2072 2073 2074 2075 2076 2077 2078 2079 2080 2081 2082 2083 2084 2085 2086 2087 2088 2089 2090 2091 2092 2093 2094 2095 2096 2097 2098 2099 2100 2101 2102 2103 2104 2105 2106 2107 2108 2109 2110 2111 2112 2113 2114 2115 2116 2117 2118 2119 2120 2121 2122 2123 2124 2125 2126 2127 2128 2129 2130 2131 2132 2133 2134 2135 2136 2137 2138 2139 2140 2141 2142 2143 2144 2145 2146 2147 2148 2149 2150 2151 2152 2153 2154 2155 2156 2157 2158 2159 2160 2161 2162 2163 2164 2165 2166 2167 2168 2169 2170 2171 2172 2173 2174 2175 2176 2177 2178 2179 2180 2181 2182 2183 2184 2185 2186 2187 2188 2189 2190 2191 2192 2193 2194 2195 2196 2197 2198 2199 2200 2201 2202 2203 2204 2205 2206 2207 2208 2209 2210 2211 2212 2213 2214 2215 2216 2217 2218 2219 2220 2221 2222 2223 2224 2225 2226 2227 2228 2229 2230 2231 2232 2233 2234 2235 2236 2237 2238 2239 2240 2241 2242 2243 2244 2245 2246 2247 2248 2249 2250 2251 2252 2253 2254 2255 2256 2257 2258 2259 2260
#define QEMU_PCI_PRODUCT_NIC_NE2K     0x8029
#define QEMU_PCI_PRODUCT_NIC_PCNET    0x2000
#define QEMU_PCI_PRODUCT_NIC_RTL8139  0x8139
#define QEMU_PCI_PRODUCT_NIC_E1000    0x100E
#define QEMU_PCI_PRODUCT_NIC_VIRTIO   0x1000

#define QEMU_PCI_PRODUCT_VGA_CIRRUS 0x00b8
#define QEMU_PCI_PRODUCT_VGA_VMWARE 0x0405
#define QEMU_PCI_PRODUCT_VGA_STDVGA 0x1111

#define QEMU_PCI_PRODUCT_AUDIO_AC97    0x2415
#define QEMU_PCI_PRODUCT_AUDIO_ES1370  0x5000

#define QEMU_PCI_PRODUCT_CONTROLLER_PIIX 0x7010
#define QEMU_PCI_PRODUCT_CONTROLLER_LSI  0x0012

#define QEMU_PCI_PRODUCT_WATCHDOG_I63000ESB 0x25ab

static int
qemuAssignNextPCIAddress(virDomainDeviceInfo *info,
                         int vendor,
                         int product,
                         qemuMonitorPCIAddress *addrs,
                         int naddrs)
{
    int found = 0;
    int i;

    VIR_DEBUG("Look for %x:%x out of %d", vendor, product, naddrs);

    for (i = 0 ; (i < naddrs) && !found; i++) {
        VIR_DEBUG("Maybe %x:%x", addrs[i].vendor, addrs[i].product);
        if (addrs[i].vendor == vendor &&
            addrs[i].product == product) {
            VIR_DEBUG("Match %d", i);
            found = 1;
            break;
        }
    }
    if (!found) {
        return -1;
    }

    /* Blank it out so this device isn't matched again */
    addrs[i].vendor = 0;
    addrs[i].product = 0;

    if (info->type == VIR_DOMAIN_DEVICE_ADDRESS_TYPE_NONE)
        info->type = VIR_DOMAIN_DEVICE_ADDRESS_TYPE_PCI;

    if (info->type == VIR_DOMAIN_DEVICE_ADDRESS_TYPE_PCI) {
        info->addr.pci.domain = addrs[i].addr.domain;
        info->addr.pci.bus = addrs[i].addr.bus;
        info->addr.pci.slot = addrs[i].addr.slot;
        info->addr.pci.function = addrs[i].addr.function;
    }

    return 0;
}

static int
qemuGetPCIDiskVendorProduct(virDomainDiskDefPtr def,
                            unsigned *vendor,
                            unsigned *product)
{
    switch (def->bus) {
    case VIR_DOMAIN_DISK_BUS_VIRTIO:
        *vendor = QEMU_PCI_VENDOR_REDHAT;
        *product = QEMU_PCI_PRODUCT_DISK_VIRTIO;
        break;

    default:
        return -1;
    }

    return 0;
}

static int
qemuGetPCINetVendorProduct(virDomainNetDefPtr def,
                            unsigned *vendor,
                            unsigned *product)
{
    if (!def->model)
        return -1;

    if (STREQ(def->model, "ne2k_pci")) {
        *vendor = QEMU_PCI_VENDOR_REALTEK;
        *product = QEMU_PCI_PRODUCT_NIC_NE2K;
    } else if (STREQ(def->model, "pcnet")) {
        *vendor = QEMU_PCI_VENDOR_AMD;
        *product = QEMU_PCI_PRODUCT_NIC_PCNET;
    } else if (STREQ(def->model, "rtl8139")) {
        *vendor = QEMU_PCI_VENDOR_REALTEK;
        *product = QEMU_PCI_PRODUCT_NIC_RTL8139;
    } else if (STREQ(def->model, "e1000")) {
        *vendor = QEMU_PCI_VENDOR_INTEL;
        *product = QEMU_PCI_PRODUCT_NIC_E1000;
    } else if (STREQ(def->model, "virtio")) {
        *vendor = QEMU_PCI_VENDOR_REDHAT;
        *product = QEMU_PCI_PRODUCT_NIC_VIRTIO;
    } else {
        VIR_INFO("Unexpected NIC model %s, cannot get PCI address",
                 def->model);
        return -1;
    }
    return 0;
}

static int
qemuGetPCIControllerVendorProduct(virDomainControllerDefPtr def,
                                  unsigned *vendor,
                                  unsigned *product)
{
    switch (def->type) {
    case VIR_DOMAIN_CONTROLLER_TYPE_SCSI:
        *vendor = QEMU_PCI_VENDOR_LSI_LOGIC;
        *product = QEMU_PCI_PRODUCT_CONTROLLER_LSI;
        break;

    case VIR_DOMAIN_CONTROLLER_TYPE_FDC:
        /* XXX we could put in the ISA bridge address, but
           that's not technically the FDC's address */
        return -1;

    case VIR_DOMAIN_CONTROLLER_TYPE_IDE:
        *vendor = QEMU_PCI_VENDOR_INTEL;
        *product = QEMU_PCI_PRODUCT_CONTROLLER_PIIX;
        break;

    default:
        VIR_INFO("Unexpected controller type %s, cannot get PCI address",
                 virDomainControllerTypeToString(def->type));
        return -1;
    }

    return 0;
}

static int
qemuGetPCIVideoVendorProduct(virDomainVideoDefPtr def,
                             unsigned *vendor,
                             unsigned *product)
{
    switch (def->type) {
    case VIR_DOMAIN_VIDEO_TYPE_CIRRUS:
        *vendor = QEMU_PCI_VENDOR_CIRRUS;
        *product = QEMU_PCI_PRODUCT_VGA_CIRRUS;
        break;

    case VIR_DOMAIN_VIDEO_TYPE_VGA:
        *vendor = QEMU_PCI_VENDOR_QEMU;
        *product = QEMU_PCI_PRODUCT_VGA_STDVGA;
        break;

    case VIR_DOMAIN_VIDEO_TYPE_VMVGA:
        *vendor = QEMU_PCI_VENDOR_VMWARE;
        *product = QEMU_PCI_PRODUCT_VGA_VMWARE;
        break;

    default:
        return -1;
    }
    return 0;
}

static int
qemuGetPCISoundVendorProduct(virDomainSoundDefPtr def,
                             unsigned *vendor,
                             unsigned *product)
{
    switch (def->model) {
    case VIR_DOMAIN_SOUND_MODEL_ES1370:
        *vendor = QEMU_PCI_VENDOR_ENSONIQ;
        *product = QEMU_PCI_PRODUCT_AUDIO_ES1370;
        break;

    case VIR_DOMAIN_SOUND_MODEL_AC97:
        *vendor = QEMU_PCI_VENDOR_INTEL;
        *product = QEMU_PCI_PRODUCT_AUDIO_AC97;
        break;

    default:
        return -1;
    }

    return 0;
}

static int
qemuGetPCIWatchdogVendorProduct(virDomainWatchdogDefPtr def,
                                unsigned *vendor,
                                unsigned *product)
{
    switch (def->model) {
    case VIR_DOMAIN_WATCHDOG_MODEL_I6300ESB:
        *vendor = QEMU_PCI_VENDOR_INTEL;
        *product = QEMU_PCI_PRODUCT_WATCHDOG_I63000ESB;
        break;

    default:
        return -1;
    }

    return 0;
}


2261 2262 2263 2264 2265 2266 2267 2268 2269 2270 2271 2272 2273 2274 2275 2276 2277 2278 2279
static int
qemuGetPCIMemballoonVendorProduct(virDomainMemballoonDefPtr def,
                                  unsigned *vendor,
                                  unsigned *product)
{
    switch (def->model) {
    case VIR_DOMAIN_MEMBALLOON_MODEL_VIRTIO:
        *vendor = QEMU_PCI_VENDOR_REDHAT;
        *product = QEMU_PCI_PRODUCT_BALLOON_VIRTIO;
        break;

    default:
        return -1;
    }

    return 0;
}


2280 2281 2282 2283 2284 2285 2286 2287 2288
/*
 * This entire method assumes that PCI devices in 'info pci'
 * match ordering of devices specified on the command line
 * wrt to devices of matching vendor+product
 *
 * XXXX this might not be a valid assumption if we assign
 * some static addrs on CLI. Have to check that...
 */
static int
2289
qemuDetectPCIAddresses(virDomainObjPtr vm,
2290 2291 2292 2293 2294 2295 2296 2297 2298 2299 2300 2301 2302 2303 2304 2305 2306
                       qemuMonitorPCIAddress *addrs,
                       int naddrs)
{
    unsigned int vendor = 0, product = 0;
    int i;

    /* XXX should all these vendor/product IDs be kept in the
     * actual device data structure instead ?
     */

    for (i = 0 ; i < vm->def->ndisks ; i++) {
        if (qemuGetPCIDiskVendorProduct(vm->def->disks[i], &vendor, &product) < 0)
            continue;

        if (qemuAssignNextPCIAddress(&(vm->def->disks[i]->info),
                                     vendor, product,
                                     addrs, naddrs) < 0) {
2307 2308 2309
            qemuReportError(VIR_ERR_INTERNAL_ERROR,
                            _("cannot find PCI address for VirtIO disk %s"),
                            vm->def->disks[i]->dst);
2310 2311 2312 2313 2314 2315 2316 2317 2318 2319 2320
            return -1;
        }
    }

    for (i = 0 ; i < vm->def->nnets ; i++) {
        if (qemuGetPCINetVendorProduct(vm->def->nets[i], &vendor, &product) < 0)
            continue;

        if (qemuAssignNextPCIAddress(&(vm->def->nets[i]->info),
                                     vendor, product,
                                     addrs,  naddrs) < 0) {
2321 2322 2323
            qemuReportError(VIR_ERR_INTERNAL_ERROR,
                            _("cannot find PCI address for %s NIC"),
                            vm->def->nets[i]->model);
2324 2325 2326 2327 2328 2329 2330 2331 2332 2333 2334
            return -1;
        }
    }

    for (i = 0 ; i < vm->def->ncontrollers ; i++) {
        if (qemuGetPCIControllerVendorProduct(vm->def->controllers[i], &vendor, &product) < 0)
            continue;

        if (qemuAssignNextPCIAddress(&(vm->def->controllers[i]->info),
                                     vendor, product,
                                     addrs,  naddrs) < 0) {
2335 2336 2337
            qemuReportError(VIR_ERR_INTERNAL_ERROR,
                            _("cannot find PCI address for controller %s"),
                            virDomainControllerTypeToString(vm->def->controllers[i]->type));
2338 2339 2340 2341 2342 2343 2344 2345 2346 2347 2348
            return -1;
        }
    }

    for (i = 0 ; i < vm->def->nvideos ; i++) {
        if (qemuGetPCIVideoVendorProduct(vm->def->videos[i], &vendor, &product) < 0)
            continue;

        if (qemuAssignNextPCIAddress(&(vm->def->videos[i]->info),
                                     vendor, product,
                                     addrs,  naddrs) < 0) {
2349 2350 2351
            qemuReportError(VIR_ERR_INTERNAL_ERROR,
                            _("cannot find PCI address for video adapter %s"),
                            virDomainVideoTypeToString(vm->def->videos[i]->type));
2352 2353 2354 2355 2356 2357 2358 2359 2360
            return -1;
        }
    }

    for (i = 0 ; i < vm->def->nsounds ; i++) {
        if (qemuGetPCISoundVendorProduct(vm->def->sounds[i], &vendor, &product) < 0)
            continue;

        if (qemuAssignNextPCIAddress(&(vm->def->sounds[i]->info),
2361
                                    vendor, product,
2362
                                     addrs,  naddrs) < 0) {
2363 2364 2365
            qemuReportError(VIR_ERR_INTERNAL_ERROR,
                            _("cannot find PCI address for sound adapter %s"),
                            virDomainSoundModelTypeToString(vm->def->sounds[i]->model));
2366 2367 2368 2369 2370 2371 2372 2373 2374 2375
            return -1;
        }
    }


    if (vm->def->watchdog &&
        qemuGetPCIWatchdogVendorProduct(vm->def->watchdog, &vendor, &product) == 0) {
        if (qemuAssignNextPCIAddress(&(vm->def->watchdog->info),
                                     vendor, product,
                                     addrs,  naddrs) < 0) {
2376 2377 2378
            qemuReportError(VIR_ERR_INTERNAL_ERROR,
                            _("cannot find PCI address for watchdog %s"),
                            virDomainWatchdogModelTypeToString(vm->def->watchdog->model));
2379 2380 2381 2382
            return -1;
        }
    }

2383 2384 2385 2386 2387 2388 2389 2390 2391 2392 2393 2394
    if (vm->def->memballoon &&
        qemuGetPCIMemballoonVendorProduct(vm->def->memballoon, &vendor, &product) == 0) {
        if (qemuAssignNextPCIAddress(&(vm->def->memballoon->info),
                                     vendor, product,
                                     addrs, naddrs) < 0) {
            qemuReportError(VIR_ERR_INTERNAL_ERROR,
                            _("cannot find PCI address for balloon %s"),
                            virDomainMemballoonModelTypeToString(vm->def->memballoon->model));
            return -1;
        }
    }

2395 2396 2397 2398 2399 2400 2401 2402 2403 2404 2405 2406 2407 2408 2409 2410 2411 2412 2413 2414 2415 2416 2417 2418 2419 2420
    /* XXX console (virtio) */


    /* ... and now things we don't have in our xml */

    /* XXX USB controller ? */

    /* XXX what about other PCI devices (ie bridges) */

    return 0;
}

static int
qemuInitPCIAddresses(struct qemud_driver *driver,
                     virDomainObjPtr vm)
{
    qemuDomainObjPrivatePtr priv = vm->privateData;
    int naddrs;
    int ret;
    qemuMonitorPCIAddress *addrs = NULL;

    qemuDomainObjEnterMonitorWithDriver(driver, vm);
    naddrs = qemuMonitorGetAllPCIAddresses(priv->mon,
                                           &addrs);
    qemuDomainObjExitMonitorWithDriver(driver, vm);

2421
    ret = qemuDetectPCIAddresses(vm, addrs, naddrs);
2422 2423 2424 2425 2426 2427

    VIR_FREE(addrs);

    return ret;
}

2428 2429 2430

static int qemudNextFreePort(struct qemud_driver *driver,
                             int startPort) {
2431 2432
    int i;

2433
    for (i = startPort ; i < QEMU_VNC_PORT_MAX; i++) {
2434 2435 2436
        int fd;
        int reuse = 1;
        struct sockaddr_in addr;
2437 2438 2439 2440 2441 2442 2443 2444 2445
        bool used = false;

        if (virBitmapGetBit(driver->reservedVNCPorts,
                            i - QEMU_VNC_PORT_MIN, &used) < 0)
            VIR_DEBUG("virBitmapGetBit failed on bit %d", i - QEMU_VNC_PORT_MIN);

        if (used)
            continue;

2446 2447 2448 2449 2450 2451 2452 2453
        addr.sin_family = AF_INET;
        addr.sin_port = htons(i);
        addr.sin_addr.s_addr = htonl(INADDR_ANY);
        fd = socket(PF_INET, SOCK_STREAM, 0);
        if (fd < 0)
            return -1;

        if (setsockopt(fd, SOL_SOCKET, SO_REUSEADDR, (void*)&reuse, sizeof(reuse)) < 0) {
2454
            VIR_FORCE_CLOSE(fd);
2455 2456 2457 2458 2459
            break;
        }

        if (bind(fd, (struct sockaddr*)&addr, sizeof(addr)) == 0) {
            /* Not in use, lets grab it */
2460
            VIR_FORCE_CLOSE(fd);
2461 2462 2463 2464 2465 2466
            /* Add port to bitmap of reserved ports */
            if (virBitmapSetBit(driver->reservedVNCPorts,
                                i - QEMU_VNC_PORT_MIN) < 0) {
                VIR_DEBUG("virBitmapSetBit failed on bit %d",
                          i - QEMU_VNC_PORT_MIN);
            }
2467 2468
            return i;
        }
2469
        VIR_FORCE_CLOSE(fd);
2470 2471 2472 2473 2474 2475 2476 2477 2478 2479 2480

        if (errno == EADDRINUSE) {
            /* In use, try next */
            continue;
        }
        /* Some other bad failure, get out.. */
        break;
    }
    return -1;
}

2481

2482 2483 2484 2485 2486 2487 2488 2489 2490 2491 2492 2493 2494
static void
qemuReturnPort(struct qemud_driver *driver,
                int port)
{
    if (port < QEMU_VNC_PORT_MIN)
        return;

    if (virBitmapClearBit(driver->reservedVNCPorts,
                          port - QEMU_VNC_PORT_MIN) < 0)
        VIR_DEBUG("Could not mark port %d as unused", port);
}


2495 2496 2497 2498 2499 2500 2501
static int
qemuAssignPCIAddresses(virDomainDefPtr def)
{
    int ret = -1;
    unsigned long long qemuCmdFlags = 0;
    qemuDomainPCIAddressSetPtr addrs = NULL;

2502 2503 2504
    if (qemuCapsExtractVersionInfo(def->emulator,
                                   NULL,
                                   &qemuCmdFlags) < 0)
2505 2506 2507 2508 2509 2510 2511 2512 2513 2514 2515 2516 2517 2518 2519 2520 2521 2522 2523
        goto cleanup;

    if (qemuCmdFlags & QEMUD_CMD_FLAG_DEVICE) {
        if (!(addrs = qemuDomainPCIAddressSetCreate(def)))
            goto cleanup;

        if (qemuAssignDevicePCISlots(def, addrs) < 0)
            goto cleanup;
    }

    ret = 0;

cleanup:
    qemuDomainPCIAddressSetFree(addrs);

    return ret;
}


2524 2525 2526 2527 2528 2529
static int
qemuPrepareChardevDevice(virDomainDefPtr def ATTRIBUTE_UNUSED,
                         virDomainChrDefPtr dev,
                         void *opaque ATTRIBUTE_UNUSED)
{
    int fd;
2530
    if (dev->source.type != VIR_DOMAIN_CHR_TYPE_FILE)
2531 2532
        return 0;

2533 2534
    if ((fd = open(dev->source.data.file.path,
                   O_CREAT | O_APPEND, S_IRUSR|S_IWUSR)) < 0) {
2535 2536
        virReportSystemError(errno,
                             _("Unable to pre-create chardev file '%s'"),
2537
                             dev->source.data.file.path);
2538 2539 2540
        return -1;
    }

2541
    VIR_FORCE_CLOSE(fd);
2542 2543 2544 2545 2546

    return 0;
}


2547 2548 2549 2550
struct qemudHookData {
    virConnectPtr conn;
    virDomainObjPtr vm;
    struct qemud_driver *driver;
2551 2552 2553
};

static int qemudSecurityHook(void *data) {
2554 2555
    struct qemudHookData *h = data;

2556 2557 2558
    /* This must take place before exec(), so that all QEMU
     * memory allocation is on the correct NUMA node
     */
2559
    if (qemuAddToCgroup(h->driver, h->vm->def) < 0)
2560 2561
        return -1;

2562 2563 2564
    /* This must be done after cgroup placement to avoid resetting CPU
     * affinity */
    if (qemudInitCpuAffinity(h->vm) < 0)
2565
        return -1;
2566

2567
    if (virSecurityManagerSetProcessLabel(h->driver->securityManager, h->vm) < 0)
2568 2569 2570
        return -1;

    return 0;
2571 2572
}

2573
static int
2574
qemuPrepareMonitorChr(struct qemud_driver *driver,
2575
                      virDomainChrSourceDefPtr monConfig,
2576 2577
                      const char *vm)
{
2578 2579
    monConfig->type = VIR_DOMAIN_CHR_TYPE_UNIX;
    monConfig->data.nix.listen = true;
2580

2581
    if (virAsprintf(&monConfig->data.nix.path, "%s/%s.monitor",
2582
                    driver->libDir, vm) < 0) {
2583
        virReportOOMError();
2584 2585 2586 2587 2588 2589
        return -1;
    }

    return 0;
}

2590 2591 2592 2593
static int qemuDomainSnapshotSetCurrentActive(virDomainObjPtr vm,
                                              char *snapshotDir);
static int qemuDomainSnapshotSetCurrentInactive(virDomainObjPtr vm,
                                                char *snapshotDir);
C
Chris Lalancette 已提交
2594

2595

2596 2597
#define START_POSTFIX ": starting up\n"
#define SHUTDOWN_POSTFIX ": shutting down\n"
2598

2599 2600
static int qemudStartVMDaemon(virConnectPtr conn,
                              struct qemud_driver *driver,
2601
                              virDomainObjPtr vm,
2602
                              const char *migrateFrom,
2603
                              bool start_paused,
2604
                              int stdin_fd,
2605 2606
                              const char *stdin_path,
                              enum virVMOperationType vmop) {
E
Eric Blake 已提交
2607
    int ret;
2608
    unsigned long long qemuCmdFlags;
2609
    off_t pos = -1;
2610
    char ebuf[1024];
2611
    char *pidfile = NULL;
2612
    int logfile = -1;
2613
    char *timestamp;
2614
    qemuDomainObjPrivatePtr priv = vm->privateData;
E
Eric Blake 已提交
2615
    virCommandPtr cmd = NULL;
2616

2617
    struct qemudHookData hookData;
2618 2619 2620 2621
    hookData.conn = conn;
    hookData.vm = vm;
    hookData.driver = driver;

2622 2623
    DEBUG0("Beginning VM startup process");

D
Daniel P. Berrange 已提交
2624
    if (virDomainObjIsActive(vm)) {
2625 2626
        qemuReportError(VIR_ERR_OPERATION_INVALID,
                        "%s", _("VM is already active"));
2627 2628 2629
        return -1;
    }

2630 2631 2632 2633 2634
    /* Must be run before security labelling */
    DEBUG0("Preparing host devices");
    if (qemuPrepareHostDevices(driver, vm->def) < 0)
        goto cleanup;

2635 2636 2637 2638 2639 2640 2641
    DEBUG0("Preparing chr devices");
    if (virDomainChrDefForeach(vm->def,
                               true,
                               qemuPrepareChardevDevice,
                               NULL) < 0)
        goto cleanup;

2642 2643
    /* If you are using a SecurityDriver with dynamic labelling,
       then generate a security label for isolation */
2644
    DEBUG0("Generating domain security label (if required)");
2645 2646 2647
    if (virSecurityManagerGenLabel(driver->securityManager, vm) < 0) {
        qemuDomainSecurityLabelAudit(vm, false);
        goto cleanup;
2648
    }
2649
    qemuDomainSecurityLabelAudit(vm, true);
2650

2651
    DEBUG0("Generating setting domain security labels (if required)");
2652 2653
    if (virSecurityManagerSetAllLabel(driver->securityManager,
                                      vm, stdin_path) < 0)
2654
        goto cleanup;
2655

2656 2657 2658
    /* Ensure no historical cgroup for this VM is lying around bogus
     * settings */
    DEBUG0("Ensuring no historical cgroup is lying around");
2659
    qemuRemoveCgroup(driver, vm, 1);
2660

2661 2662 2663
    if (vm->def->ngraphics == 1) {
        if (vm->def->graphics[0]->type == VIR_DOMAIN_GRAPHICS_TYPE_VNC &&
            vm->def->graphics[0]->data.vnc.autoport) {
2664
            int port = qemudNextFreePort(driver, QEMU_VNC_PORT_MIN);
2665 2666 2667 2668 2669 2670 2671 2672
            if (port < 0) {
                qemuReportError(VIR_ERR_INTERNAL_ERROR,
                                "%s", _("Unable to find an unused VNC port"));
                goto cleanup;
            }
            vm->def->graphics[0]->data.vnc.port = port;
        } else if (vm->def->graphics[0]->type == VIR_DOMAIN_GRAPHICS_TYPE_SPICE &&
                   vm->def->graphics[0]->data.spice.autoport) {
2673
            int port = qemudNextFreePort(driver, QEMU_VNC_PORT_MIN);
2674 2675
            int tlsPort = -1;
            if (port < 0) {
2676
                qemuReportError(VIR_ERR_INTERNAL_ERROR,
2677
                                "%s", _("Unable to find an unused SPICE port"));
2678 2679 2680
                goto cleanup;
            }

2681 2682 2683 2684 2685
            if (driver->spiceTLS) {
                tlsPort = qemudNextFreePort(driver, port + 1);
                if (tlsPort < 0) {
                    qemuReportError(VIR_ERR_INTERNAL_ERROR,
                                    "%s", _("Unable to find an unused SPICE TLS port"));
2686
                    qemuReturnPort(driver, port);
2687 2688 2689 2690
                    goto cleanup;
                }
            }

2691 2692
            vm->def->graphics[0]->data.spice.port = port;
            vm->def->graphics[0]->data.spice.tlsPort = tlsPort;
2693
        }
2694
    }
2695

L
Laine Stump 已提交
2696
    if (virFileMakePath(driver->logDir) != 0) {
2697
        virReportSystemError(errno,
2698 2699
                             _("cannot create log directory %s"),
                             driver->logDir);
2700
        goto cleanup;
2701 2702
    }

2703
    DEBUG0("Creating domain log file");
2704
    if ((logfile = qemudLogFD(driver, vm->def->name, false)) < 0)
2705
        goto cleanup;
2706

E
Eric Blake 已提交
2707
    DEBUG0("Determining emulator version");
2708 2709 2710
    if (qemuCapsExtractVersionInfo(vm->def->emulator,
                                   NULL,
                                   &qemuCmdFlags) < 0)
2711
        goto cleanup;
2712

2713
    DEBUG0("Setting up domain cgroup (if required)");
2714
    if (qemuSetupCgroup(driver, vm) < 0)
2715 2716
        goto cleanup;

2717
    if (VIR_ALLOC(priv->monConfig) < 0) {
2718
        virReportOOMError();
2719 2720 2721
        goto cleanup;
    }

2722
    DEBUG0("Preparing monitor state");
2723
    if (qemuPrepareMonitorChr(driver, priv->monConfig, vm->def->name) < 0)
2724
        goto cleanup;
2725

D
Daniel P. Berrange 已提交
2726 2727 2728
#if HAVE_YAJL
    if (qemuCmdFlags & QEMUD_CMD_FLAG_MONITOR_JSON)
        priv->monJSON = 1;
2729
    else
D
Daniel P. Berrange 已提交
2730
#endif
2731
        priv->monJSON = 0;
D
Daniel P. Berrange 已提交
2732

2733
    priv->monitor_warned = 0;
2734
    priv->gotShutdown = false;
2735

D
Daniel P. Berrange 已提交
2736
    if ((ret = virFileDeletePid(driver->stateDir, vm->def->name)) != 0) {
2737
        virReportSystemError(ret,
D
Daniel P. Berrange 已提交
2738 2739 2740 2741 2742
                             _("Cannot remove stale PID file for %s"),
                             vm->def->name);
        goto cleanup;
    }

2743
    if (!(pidfile = virFilePid(driver->stateDir, vm->def->name))) {
2744
        virReportSystemError(errno,
2745 2746 2747
                             "%s", _("Failed to build pidfile path."));
        goto cleanup;
    }
D
Daniel P. Berrange 已提交
2748

2749
    /*
M
Matthew Booth 已提交
2750
     * Normally PCI addresses are assigned in the virDomainCreate
2751 2752 2753 2754 2755
     * or virDomainDefine methods. We might still need to assign
     * some here to cope with the question of upgrades. Regardless
     * we also need to populate the PCi address set cache for later
     * use in hotplug
     */
2756
    if (qemuCmdFlags & QEMUD_CMD_FLAG_DEVICE) {
2757
        DEBUG0("Assigning domain PCI addresses");
2758
        /* Populate cache with current addresses */
2759 2760 2761 2762 2763 2764 2765
        if (priv->pciaddrs) {
            qemuDomainPCIAddressSetFree(priv->pciaddrs);
            priv->pciaddrs = NULL;
        }
        if (!(priv->pciaddrs = qemuDomainPCIAddressSetCreate(vm->def)))
            goto cleanup;

2766 2767

        /* Assign any remaining addresses */
2768 2769
        if (qemuAssignDevicePCISlots(vm->def, priv->pciaddrs) < 0)
            goto cleanup;
2770 2771 2772 2773

        priv->persistentAddrs = 1;
    } else {
        priv->persistentAddrs = 0;
2774 2775
    }

2776
    DEBUG0("Building emulator command line");
2777
    vm->def->id = driver->nextvmid++;
2778 2779
    if (!(cmd = qemuBuildCommandLine(conn, driver, vm->def, priv->monConfig,
                                     priv->monJSON != 0, qemuCmdFlags,
2780
                                     migrateFrom, stdin_fd,
2781
                                     vm->current_snapshot, vmop)))
C
Chris Lalancette 已提交
2782 2783
        goto cleanup;

2784
    if (qemuDomainSnapshotSetCurrentInactive(vm, driver->snapshotDir) < 0)
2785
        goto cleanup;
2786

2787 2788 2789 2790 2791 2792 2793 2794 2795 2796 2797 2798 2799 2800 2801 2802
    /* now that we know it is about to start call the hook if present */
    if (virHookPresent(VIR_HOOK_DRIVER_QEMU)) {
        char *xml = virDomainDefFormat(vm->def, 0);
        int hookret;

        hookret = virHookCall(VIR_HOOK_DRIVER_QEMU, vm->def->name,
                    VIR_HOOK_QEMU_OP_START, VIR_HOOK_SUBOP_BEGIN, NULL, xml);
        VIR_FREE(xml);

        /*
         * If the script raised an error abort the launch
         */
        if (hookret < 0)
            goto cleanup;
    }

2803 2804 2805 2806 2807 2808 2809 2810 2811 2812 2813 2814 2815
    if ((timestamp = virTimestamp()) == NULL) {
        virReportOOMError();
        goto cleanup;
    } else {
        if (safewrite(logfile, timestamp, strlen(timestamp)) < 0 ||
            safewrite(logfile, START_POSTFIX, strlen(START_POSTFIX)) < 0) {
            VIR_WARN("Unable to write timestamp to logfile: %s",
                     virStrerror(errno, ebuf, sizeof ebuf));
        }

        VIR_FREE(timestamp);
    }

E
Eric Blake 已提交
2816
    virCommandWriteArgLog(cmd, logfile);
2817

2818
    if ((pos = lseek(logfile, 0, SEEK_END)) < 0)
2819
        VIR_WARN("Unable to seek to end of logfile: %s",
2820
                 virStrerror(errno, ebuf, sizeof ebuf));
2821

2822 2823
    VIR_DEBUG("Clear emulator capabilities: %d",
              driver->clearEmulatorCapabilities);
E
Eric Blake 已提交
2824 2825 2826 2827 2828
    if (driver->clearEmulatorCapabilities)
        virCommandClearCaps(cmd);

    VIR_WARN("Executing %s", vm->def->emulator);
    virCommandSetPreExecHook(cmd, qemudSecurityHook, &hookData);
2829

E
Eric Blake 已提交
2830 2831 2832 2833 2834 2835 2836 2837
    virCommandSetOutputFD(cmd, &logfile);
    virCommandSetErrorFD(cmd, &logfile);
    virCommandNonblockingFDs(cmd);
    virCommandSetPidFile(cmd, pidfile);
    virCommandDaemonize(cmd);

    ret = virCommandRun(cmd, NULL);
    VIR_WARN("Executing done %s", vm->def->emulator);
2838
    VIR_FREE(pidfile);
G
Guido Günther 已提交
2839 2840 2841

    /* wait for qemu process to to show up */
    if (ret == 0) {
2842
        if (virFileReadPid(driver->stateDir, vm->def->name, &vm->pid)) {
2843 2844
            qemuReportError(VIR_ERR_INTERNAL_ERROR,
                            _("Domain %s didn't show up\n"), vm->def->name);
2845
            ret = -1;
G
Guido Günther 已提交
2846
        }
E
Eric Blake 已提交
2847
#if 0
2848
    } else if (ret == -2) {
E
Eric Blake 已提交
2849 2850 2851 2852 2853
        /*
         * XXX this is bogus. It isn't safe to set vm->pid = child
         * because the child no longer exists.
         */

2854 2855 2856 2857 2858 2859 2860 2861 2862
        /* The virExec process that launches the daemon failed. Pending on
         * when it failed (we can't determine for sure), there may be
         * extra info in the domain log (if the hook failed for example).
         *
         * Pretend like things succeeded, and let 'WaitForMonitor' report
         * the log contents for us.
         */
        vm->pid = child;
        ret = 0;
E
Eric Blake 已提交
2863
#endif
2864
    }
2865

2866 2867 2868
    if (migrateFrom)
        start_paused = true;
    vm->state = start_paused ? VIR_DOMAIN_PAUSED : VIR_DOMAIN_RUNNING;
2869

2870
    if (ret == -1) /* The VM failed to start; tear filters before taps */
2871
        virDomainConfVMNWFilterTeardown(vm);
2872

2873
    if (ret == -1) /* The VM failed to start */
2874 2875
        goto cleanup;

2876
    DEBUG0("Waiting for monitor to show up");
2877
    if (qemudWaitForMonitor(driver, vm, pos) < 0)
2878
        goto cleanup;
2879

2880
    DEBUG0("Detecting VCPU PIDs");
2881
    if (qemuDetectVcpuPIDs(driver, vm) < 0)
2882
        goto cleanup;
2883

2884
    DEBUG0("Setting any required VM passwords");
2885
    if (qemuInitPasswords(conn, driver, vm, qemuCmdFlags) < 0)
2886
        goto cleanup;
2887

D
Daniel P. Berrange 已提交
2888 2889 2890
    /* If we have -device, then addresses are assigned explicitly.
     * If not, then we have to detect dynamic ones here */
    if (!(qemuCmdFlags & QEMUD_CMD_FLAG_DEVICE)) {
2891
        DEBUG0("Determining domain device PCI addresses");
D
Daniel P. Berrange 已提交
2892
        if (qemuInitPCIAddresses(driver, vm) < 0)
2893
            goto cleanup;
D
Daniel P. Berrange 已提交
2894
    }
2895

2896
    DEBUG0("Setting initial memory amount");
2897
    qemuDomainObjEnterMonitorWithDriver(driver, vm);
2898
    if (qemuMonitorSetBalloon(priv->mon, vm->def->mem.cur_balloon) < 0) {
2899
        qemuDomainObjExitMonitorWithDriver(driver, vm);
2900
        goto cleanup;
2901
    }
H
Hu Tao 已提交
2902
    qemuDomainObjExitMonitorWithDriver(driver, vm);
2903

2904
    if (!start_paused) {
2905
        DEBUG0("Starting domain CPUs");
2906
        /* Allow the CPUS to start executing */
H
Hu Tao 已提交
2907
        if (doStartCPUs(driver, vm, conn) < 0) {
2908
            if (virGetLastError() == NULL)
2909 2910
                qemuReportError(VIR_ERR_INTERNAL_ERROR,
                                "%s", _("resume operation failed"));
2911
            goto cleanup;
2912 2913
        }
    }
2914

2915

2916
    DEBUG0("Writing domain status to disk");
2917
    if (virDomainSaveStatus(driver->caps, driver->stateDir, vm) < 0)
2918
        goto cleanup;
2919

2920 2921 2922 2923 2924
    /* Do this last, since it depends on domain being active */
    DEBUG0("Setting running domain def as transient");
    if (virDomainObjSetDefTransient(driver->caps, vm) < 0)
        goto cleanup;

E
Eric Blake 已提交
2925
    virCommandFree(cmd);
2926
    VIR_FORCE_CLOSE(logfile);
2927

2928
    return 0;
2929 2930

cleanup:
2931 2932 2933
    /* We jump here if we failed to start the VM for any reason, or
     * if we failed to initialize the now running VM. kill it off and
     * pretend we never started it */
E
Eric Blake 已提交
2934
    virCommandFree(cmd);
2935
    VIR_FORCE_CLOSE(logfile);
E
Eric Blake 已提交
2936
    qemudShutdownVMDaemon(driver, vm, 0);
2937 2938

    return -1;
2939 2940
}

2941
static void qemudShutdownVMDaemon(struct qemud_driver *driver,
2942 2943
                                  virDomainObjPtr vm,
                                  int migrated) {
D
Daniel P. Berrange 已提交
2944
    int ret;
2945
    int retries = 0;
2946
    qemuDomainObjPrivatePtr priv = vm->privateData;
2947
    virErrorPtr orig_err;
2948 2949
    virDomainDefPtr def;
    int i;
2950 2951 2952
    int logfile = -1;
    char *timestamp;
    char ebuf[1024];
D
Daniel P. Berrange 已提交
2953

2954 2955
    VIR_DEBUG("Shutting down VM '%s' pid=%d migrated=%d",
              vm->def->name, vm->pid, migrated);
2956

2957
    if ((logfile = qemudLogFD(driver, vm->def->name, true)) < 0) {
2958 2959 2960 2961 2962 2963 2964 2965 2966 2967 2968 2969 2970 2971 2972 2973 2974 2975 2976 2977 2978 2979 2980
        /* To not break the normal domain shutdown process, skip the
         * timestamp log writing if failed on opening log file. */
        VIR_WARN("Unable to open logfile: %s",
                  virStrerror(errno, ebuf, sizeof ebuf));
    } else {
        if ((timestamp = virTimestamp()) == NULL) {
            virReportOOMError();
        } else {
            if (safewrite(logfile, timestamp, strlen(timestamp)) < 0 ||
                safewrite(logfile, SHUTDOWN_POSTFIX,
                          strlen(SHUTDOWN_POSTFIX)) < 0) {
                VIR_WARN("Unable to write timestamp to logfile: %s",
                         virStrerror(errno, ebuf, sizeof ebuf));
            }

            VIR_FREE(timestamp);
        }

        if (VIR_CLOSE(logfile) < 0)
             VIR_WARN("Unable to close logfile: %s",
                      virStrerror(errno, ebuf, sizeof ebuf));
    }

2981 2982 2983 2984
    /* This method is routinely used in clean up paths. Disable error
     * reporting so we don't squash a legit error. */
    orig_err = virSaveLastError();

2985
    virDomainConfVMNWFilterTeardown(vm);
S
Stefan Berger 已提交
2986

2987
    if (driver->macFilter) {
2988
        def = vm->def;
2989 2990 2991 2992
        for (i = 0 ; i < def->nnets ; i++) {
            virDomainNetDefPtr net = def->nets[i];
            if (net->ifname == NULL)
                continue;
2993
            if ((errno = networkDisallowMacOnPort(driver, net->ifname,
2994
                                                  net->mac))) {
2995
                virReportSystemError(errno,
2996 2997 2998 2999 3000 3001
             _("failed to remove ebtables rule to allow MAC address on  '%s'"),
                                     net->ifname);
            }
        }
    }

3002
    /* This will safely handle a non-running guest with pid=0 or pid=-1*/
G
Guido Günther 已提交
3003 3004
    if (virKillProcess(vm->pid, 0) == 0 &&
        virKillProcess(vm->pid, SIGTERM) < 0)
3005
        virReportSystemError(errno,
3006 3007
                             _("Failed to send SIGTERM to %s (%d)"),
                             vm->def->name, vm->pid);
3008

3009 3010
    if (priv->mon)
        qemuMonitorClose(priv->mon);
3011

3012
    if (priv->monConfig) {
3013 3014 3015
        if (priv->monConfig->type == VIR_DOMAIN_CHR_TYPE_UNIX)
            unlink(priv->monConfig->data.nix.path);
        virDomainChrSourceDefFree(priv->monConfig);
3016
        priv->monConfig = NULL;
3017 3018
    }

G
Guido Günther 已提交
3019 3020
    /* shut it off for sure */
    virKillProcess(vm->pid, SIGKILL);
3021

3022 3023 3024 3025 3026 3027 3028 3029 3030 3031
    /* now that we know it's stopped call the hook if present */
    if (virHookPresent(VIR_HOOK_DRIVER_QEMU)) {
        char *xml = virDomainDefFormat(vm->def, 0);

        /* we can't stop the operation even if the script raised an error */
        virHookCall(VIR_HOOK_DRIVER_QEMU, vm->def->name,
                    VIR_HOOK_QEMU_OP_STOPPED, VIR_HOOK_SUBOP_END, NULL, xml);
        VIR_FREE(xml);
    }

3032
    /* Reset Security Labels */
3033 3034 3035
    virSecurityManagerRestoreAllLabel(driver->securityManager,
                                      vm, migrated);
    virSecurityManagerReleaseLabel(driver->securityManager, vm);
3036

3037 3038 3039 3040 3041 3042 3043
    /* Clear out dynamically assigned labels */
    if (vm->def->seclabel.type == VIR_DOMAIN_SECLABEL_DYNAMIC) {
        VIR_FREE(vm->def->seclabel.model);
        VIR_FREE(vm->def->seclabel.label);
        VIR_FREE(vm->def->seclabel.imagelabel);
    }

D
Daniel P. Berrange 已提交
3044
    virDomainDefClearDeviceAliases(vm->def);
3045 3046 3047 3048 3049
    if (!priv->persistentAddrs) {
        virDomainDefClearPCIAddresses(vm->def);
        qemuDomainPCIAddressSetFree(priv->pciaddrs);
        priv->pciaddrs = NULL;
    }
3050

3051
    qemuDomainReAttachHostDevices(driver, vm->def);
3052

S
Stefan Berger 已提交
3053 3054 3055 3056
#if WITH_MACVTAP
    def = vm->def;
    for (i = 0; i < def->nnets; i++) {
        virDomainNetDefPtr net = def->nets[i];
3057
        if (net->type == VIR_DOMAIN_NET_TYPE_DIRECT) {
3058
            delMacvtap(net->ifname, net->mac, net->data.direct.linkdev,
3059
                       &net->data.direct.virtPortProfile);
3060 3061
            VIR_FREE(net->ifname);
        }
S
Stefan Berger 已提交
3062 3063 3064
    }
#endif

3065
retry:
3066
    if ((ret = qemuRemoveCgroup(driver, vm, 0)) < 0) {
3067 3068 3069 3070 3071 3072 3073 3074
        if (ret == -EBUSY && (retries++ < 5)) {
            usleep(200*1000);
            goto retry;
        }
        VIR_WARN("Failed to remove cgroup for %s",
                 vm->def->name);
    }

3075
    qemudRemoveDomainStatus(driver, vm);
D
Daniel P. Berrange 已提交
3076

3077 3078 3079 3080 3081
    /* Remove VNC port from port reservation bitmap, but only if it was
       reserved by the driver (autoport=yes)
    */
    if ((vm->def->ngraphics == 1) &&
        vm->def->graphics[0]->type == VIR_DOMAIN_GRAPHICS_TYPE_VNC &&
3082 3083 3084 3085 3086 3087 3088 3089
        vm->def->graphics[0]->data.vnc.autoport) {
        qemuReturnPort(driver, vm->def->graphics[0]->data.vnc.port);
    }
    if ((vm->def->ngraphics == 1) &&
        vm->def->graphics[0]->type == VIR_DOMAIN_GRAPHICS_TYPE_SPICE &&
        vm->def->graphics[0]->data.spice.autoport) {
        qemuReturnPort(driver, vm->def->graphics[0]->data.spice.port);
        qemuReturnPort(driver, vm->def->graphics[0]->data.spice.tlsPort);
3090 3091
    }

3092
    vm->pid = -1;
3093
    vm->def->id = -1;
3094
    vm->state = VIR_DOMAIN_SHUTOFF;
3095 3096
    VIR_FREE(priv->vcpupids);
    priv->nvcpupids = 0;
3097 3098

    if (vm->newDef) {
3099
        virDomainDefFree(vm->def);
3100
        vm->def = vm->newDef;
3101
        vm->def->id = -1;
3102 3103
        vm->newDef = NULL;
    }
3104 3105 3106 3107 3108

    if (orig_err) {
        virSetError(orig_err);
        virFreeError(orig_err);
    }
3109 3110
}

3111
static virDrvOpenStatus qemudOpen(virConnectPtr conn,
3112
                                  virConnectAuthPtr auth ATTRIBUTE_UNUSED,
3113
                                  int flags ATTRIBUTE_UNUSED) {
3114
    if (conn->uri == NULL) {
3115 3116 3117
        if (qemu_driver == NULL)
            return VIR_DRV_OPEN_DECLINED;

3118
        conn->uri = xmlParseURI(qemu_driver->privileged ?
3119 3120
                                "qemu:///system" :
                                "qemu:///session");
3121
        if (!conn->uri) {
3122
            virReportOOMError();
3123 3124
            return VIR_DRV_OPEN_ERROR;
        }
3125 3126 3127 3128 3129 3130 3131 3132 3133 3134
    } else {
        /* If URI isn't 'qemu' its definitely not for us */
        if (conn->uri->scheme == NULL ||
            STRNEQ(conn->uri->scheme, "qemu"))
            return VIR_DRV_OPEN_DECLINED;

        /* Allow remote driver to deal with URIs with hostname server */
        if (conn->uri->server != NULL)
            return VIR_DRV_OPEN_DECLINED;

3135
        if (qemu_driver == NULL) {
3136 3137
            qemuReportError(VIR_ERR_INTERNAL_ERROR, "%s",
                            _("qemu state driver is not active"));
3138 3139 3140
            return VIR_DRV_OPEN_ERROR;
        }

3141
        if (conn->uri->path == NULL) {
3142 3143 3144 3145 3146
            qemuReportError(VIR_ERR_INTERNAL_ERROR,
                            _("no QEMU URI path given, try %s"),
                            qemu_driver->privileged
                            ? "qemu:///system"
                            : "qemu:///session");
3147 3148 3149
                return VIR_DRV_OPEN_ERROR;
        }

3150
        if (qemu_driver->privileged) {
3151 3152
            if (STRNEQ (conn->uri->path, "/system") &&
                STRNEQ (conn->uri->path, "/session")) {
3153 3154 3155
                qemuReportError(VIR_ERR_INTERNAL_ERROR,
                                _("unexpected QEMU URI path '%s', try qemu:///system"),
                                conn->uri->path);
3156 3157 3158 3159
                return VIR_DRV_OPEN_ERROR;
            }
        } else {
            if (STRNEQ (conn->uri->path, "/session")) {
3160 3161 3162
                qemuReportError(VIR_ERR_INTERNAL_ERROR,
                                _("unexpected QEMU URI path '%s', try qemu:///session"),
                                conn->uri->path);
3163 3164 3165
                return VIR_DRV_OPEN_ERROR;
            }
        }
3166 3167 3168 3169 3170 3171 3172
    }
    conn->privateData = qemu_driver;

    return VIR_DRV_OPEN_SUCCESS;
}

static int qemudClose(virConnectPtr conn) {
3173
    struct qemud_driver *driver = conn->privateData;
3174 3175

    /* Get rid of callbacks registered for this conn */
3176
    qemuDriverLock(driver);
3177
    virDomainEventCallbackListRemoveConn(conn, driver->domainEventCallbacks);
3178
    qemuDriverUnlock(driver);
3179 3180 3181 3182 3183 3184

    conn->privateData = NULL;

    return 0;
}

D
Daniel Veillard 已提交
3185 3186 3187 3188 3189
/* Which features are supported by this driver? */
static int
qemudSupportsFeature (virConnectPtr conn ATTRIBUTE_UNUSED, int feature)
{
    switch (feature) {
3190 3191 3192 3193 3194
    case VIR_DRV_FEATURE_MIGRATION_V2:
    case VIR_DRV_FEATURE_MIGRATION_P2P:
        return 1;
    default:
        return 0;
D
Daniel Veillard 已提交
3195 3196 3197
    }
}

3198
static const char *qemudGetType(virConnectPtr conn ATTRIBUTE_UNUSED) {
3199
    return "QEMU";
3200 3201
}

3202

3203 3204 3205 3206 3207 3208 3209 3210 3211 3212 3213 3214 3215
static int qemuIsSecure(virConnectPtr conn ATTRIBUTE_UNUSED)
{
    /* Trivially secure, since always inside the daemon */
    return 1;
}

static int qemuIsEncrypted(virConnectPtr conn ATTRIBUTE_UNUSED)
{
    /* Not encrypted, but remote driver takes care of that */
    return 0;
}


3216 3217 3218 3219
static int kvmGetMaxVCPUs(void) {
    int maxvcpus = 1;

    int r, fd;
3220

3221 3222
    fd = open(KVM_DEVICE, O_RDONLY);
    if (fd < 0) {
3223
        virReportSystemError(errno, _("Unable to open %s"), KVM_DEVICE);
3224
        return -1;
3225 3226 3227 3228 3229 3230
    }

    r = ioctl(fd, KVM_CHECK_EXTENSION, KVM_CAP_NR_VCPUS);
    if (r > 0)
        maxvcpus = r;

3231
    VIR_FORCE_CLOSE(fd);
3232 3233 3234 3235
    return maxvcpus;
}


3236
static int qemudGetMaxVCPUs(virConnectPtr conn ATTRIBUTE_UNUSED, const char *type) {
3237 3238 3239
    if (!type)
        return 16;

3240
    if (STRCASEEQ(type, "qemu"))
3241 3242
        return 16;

3243
    if (STRCASEEQ(type, "kvm"))
3244
        return kvmGetMaxVCPUs();
3245

3246
    if (STRCASEEQ(type, "kqemu"))
3247
        return 1;
3248

3249 3250
    qemuReportError(VIR_ERR_INVALID_ARG,
                    _("unknown type '%s'"), type);
3251 3252 3253
    return -1;
}

3254

3255
static char *qemudGetCapabilities(virConnectPtr conn) {
3256
    struct qemud_driver *driver = conn->privateData;
3257
    virCapsPtr caps = NULL;
3258
    char *xml = NULL;
3259

3260
    qemuDriverLock(driver);
3261

3262
    if ((caps = qemuCreateCapabilities(qemu_driver->caps,
3263
                                       qemu_driver)) == NULL) {
3264 3265 3266
        virCapabilitiesFree(caps);
        goto cleanup;
    }
3267

3268
    virCapabilitiesFree(qemu_driver->caps);
3269 3270 3271
    qemu_driver->caps = caps;

    if ((xml = virCapabilitiesFormatXML(driver->caps)) == NULL)
3272
        virReportOOMError();
3273 3274

cleanup:
3275
    qemuDriverUnlock(driver);
3276

3277
    return xml;
3278 3279 3280
}


3281 3282 3283 3284 3285
static int
qemudGetProcessInfo(unsigned long long *cpuTime, int *lastCpu, int pid,
                    int tid)
{
    char *proc;
D
Daniel P. Berrange 已提交
3286
    FILE *pidinfo;
3287
    unsigned long long usertime, systime;
3288 3289
    int cpu;
    int ret;
D
Daniel P. Berrange 已提交
3290

3291
    if (tid)
3292
        ret = virAsprintf(&proc, "/proc/%d/task/%d/stat", pid, tid);
3293
    else
3294 3295
        ret = virAsprintf(&proc, "/proc/%d/stat", pid);
    if (ret < 0)
D
Daniel P. Berrange 已提交
3296 3297 3298 3299
        return -1;

    if (!(pidinfo = fopen(proc, "r"))) {
        /* VM probably shut down, so fake 0 */
3300 3301 3302 3303
        if (cpuTime)
            *cpuTime = 0;
        if (lastCpu)
            *lastCpu = 0;
3304
        VIR_FREE(proc);
D
Daniel P. Berrange 已提交
3305 3306
        return 0;
    }
3307
    VIR_FREE(proc);
D
Daniel P. Berrange 已提交
3308

3309 3310 3311 3312 3313 3314 3315 3316 3317 3318
    /* See 'man proc' for information about what all these fields are. We're
     * only interested in a very few of them */
    if (fscanf(pidinfo,
               /* pid -> stime */
               "%*d %*s %*c %*d %*d %*d %*d %*d %*u %*u %*u %*u %*u %llu %llu"
               /* cutime -> endcode */
               "%*d %*d %*d %*d %*d %*u %*u %*d %*u %*u %*u %*u"
               /* startstack -> processor */
               "%*u %*u %*u %*u %*u %*u %*u %*u %*u %*u %*d %d",
               &usertime, &systime, &cpu) != 3) {
3319
        VIR_FORCE_FCLOSE(pidinfo);
3320 3321
        VIR_WARN0("cannot parse process status data");
        errno = -EINVAL;
D
Daniel P. Berrange 已提交
3322 3323 3324 3325 3326 3327 3328 3329
        return -1;
    }

    /* We got jiffies
     * We want nanoseconds
     * _SC_CLK_TCK is jiffies per second
     * So calulate thus....
     */
3330 3331 3332 3333 3334
    if (cpuTime)
        *cpuTime = 1000ull * 1000ull * 1000ull * (usertime + systime) / (unsigned long long)sysconf(_SC_CLK_TCK);
    if (lastCpu)
        *lastCpu = cpu;

D
Daniel P. Berrange 已提交
3335

3336 3337
    VIR_DEBUG("Got status for %d/%d user=%llu sys=%llu cpu=%d",
              pid, tid, usertime, systime, cpu);
D
Daniel P. Berrange 已提交
3338

3339
    VIR_FORCE_FCLOSE(pidinfo);
D
Daniel P. Berrange 已提交
3340 3341 3342 3343 3344

    return 0;
}


3345
static virDomainPtr qemudDomainLookupByID(virConnectPtr conn,
3346
                                          int id) {
3347 3348 3349 3350
    struct qemud_driver *driver = conn->privateData;
    virDomainObjPtr vm;
    virDomainPtr dom = NULL;

3351
    qemuDriverLock(driver);
3352
    vm  = virDomainFindByID(&driver->domains, id);
3353
    qemuDriverUnlock(driver);
3354 3355

    if (!vm) {
3356 3357
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching id %d"), id);
3358
        goto cleanup;
3359 3360
    }

3361
    dom = virGetDomain(conn, vm->def->name, vm->def->uuid);
3362
    if (dom) dom->id = vm->def->id;
3363 3364

cleanup:
3365 3366
    if (vm)
        virDomainObjUnlock(vm);
3367 3368
    return dom;
}
3369

3370
static virDomainPtr qemudDomainLookupByUUID(virConnectPtr conn,
3371
                                            const unsigned char *uuid) {
3372 3373 3374
    struct qemud_driver *driver = conn->privateData;
    virDomainObjPtr vm;
    virDomainPtr dom = NULL;
3375

3376
    qemuDriverLock(driver);
3377
    vm = virDomainFindByUUID(&driver->domains, uuid);
3378 3379
    qemuDriverUnlock(driver);

3380
    if (!vm) {
3381 3382
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(uuid, uuidstr);
3383 3384
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
3385
        goto cleanup;
3386 3387
    }

3388
    dom = virGetDomain(conn, vm->def->name, vm->def->uuid);
3389
    if (dom) dom->id = vm->def->id;
3390 3391

cleanup:
3392 3393
    if (vm)
        virDomainObjUnlock(vm);
3394 3395
    return dom;
}
3396

3397
static virDomainPtr qemudDomainLookupByName(virConnectPtr conn,
3398
                                            const char *name) {
3399 3400 3401
    struct qemud_driver *driver = conn->privateData;
    virDomainObjPtr vm;
    virDomainPtr dom = NULL;
3402

3403
    qemuDriverLock(driver);
3404
    vm = virDomainFindByName(&driver->domains, name);
3405 3406
    qemuDriverUnlock(driver);

3407
    if (!vm) {
3408 3409
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching name '%s'"), name);
3410
        goto cleanup;
3411 3412
    }

3413
    dom = virGetDomain(conn, vm->def->name, vm->def->uuid);
3414
    if (dom) dom->id = vm->def->id;
3415 3416

cleanup:
3417 3418
    if (vm)
        virDomainObjUnlock(vm);
3419 3420 3421
    return dom;
}

3422 3423 3424 3425 3426 3427 3428 3429 3430 3431 3432

static int qemuDomainIsActive(virDomainPtr dom)
{
    struct qemud_driver *driver = dom->conn->privateData;
    virDomainObjPtr obj;
    int ret = -1;

    qemuDriverLock(driver);
    obj = virDomainFindByUUID(&driver->domains, dom->uuid);
    qemuDriverUnlock(driver);
    if (!obj) {
3433
        qemuReportError(VIR_ERR_NO_DOMAIN, NULL);
3434 3435 3436 3437 3438 3439 3440 3441 3442 3443 3444 3445 3446 3447 3448 3449 3450 3451 3452 3453
        goto cleanup;
    }
    ret = virDomainObjIsActive(obj);

cleanup:
    if (obj)
        virDomainObjUnlock(obj);
    return ret;
}

static int qemuDomainIsPersistent(virDomainPtr dom)
{
    struct qemud_driver *driver = dom->conn->privateData;
    virDomainObjPtr obj;
    int ret = -1;

    qemuDriverLock(driver);
    obj = virDomainFindByUUID(&driver->domains, dom->uuid);
    qemuDriverUnlock(driver);
    if (!obj) {
3454
        qemuReportError(VIR_ERR_NO_DOMAIN, NULL);
3455 3456 3457 3458 3459 3460 3461 3462 3463 3464
        goto cleanup;
    }
    ret = obj->persistent;

cleanup:
    if (obj)
        virDomainObjUnlock(obj);
    return ret;
}

3465 3466 3467 3468 3469 3470 3471 3472 3473 3474 3475 3476 3477 3478 3479 3480 3481 3482 3483 3484
static int qemuDomainIsUpdated(virDomainPtr dom)
{
    struct qemud_driver *driver = dom->conn->privateData;
    virDomainObjPtr obj;
    int ret = -1;

    qemuDriverLock(driver);
    obj = virDomainFindByUUID(&driver->domains, dom->uuid);
    qemuDriverUnlock(driver);
    if (!obj) {
        qemuReportError(VIR_ERR_NO_DOMAIN, NULL);
        goto cleanup;
    }
    ret = obj->updated;

cleanup:
    if (obj)
        virDomainObjUnlock(obj);
    return ret;
}
3485

3486
static int qemudGetVersion(virConnectPtr conn, unsigned long *version) {
3487 3488 3489
    struct qemud_driver *driver = conn->privateData;
    int ret = -1;

3490
    qemuDriverLock(driver);
3491
    if (qemuCapsExtractVersion(driver->caps, &driver->qemuVersion) < 0)
3492
        goto cleanup;
3493

3494
    *version = driver->qemuVersion;
3495 3496 3497
    ret = 0;

cleanup:
3498
    qemuDriverUnlock(driver);
3499
    return ret;
D
Daniel P. Berrange 已提交
3500 3501
}

3502
static int qemudListDomains(virConnectPtr conn, int *ids, int nids) {
3503
    struct qemud_driver *driver = conn->privateData;
3504
    int n;
3505

3506
    qemuDriverLock(driver);
3507
    n = virDomainObjListGetActiveIDs(&driver->domains, ids, nids);
3508
    qemuDriverUnlock(driver);
3509

3510
    return n;
D
Daniel P. Berrange 已提交
3511
}
3512

3513
static int qemudNumDomains(virConnectPtr conn) {
3514
    struct qemud_driver *driver = conn->privateData;
3515
    int n;
3516

3517
    qemuDriverLock(driver);
3518
    n = virDomainObjListNumOfDomains(&driver->domains, 1);
3519
    qemuDriverUnlock(driver);
3520

3521
    return n;
D
Daniel P. Berrange 已提交
3522
}
3523

3524
static virDomainPtr qemudDomainCreate(virConnectPtr conn, const char *xml,
3525
                                      unsigned int flags) {
3526
    struct qemud_driver *driver = conn->privateData;
3527
    virDomainDefPtr def;
3528
    virDomainObjPtr vm = NULL;
3529
    virDomainPtr dom = NULL;
3530
    virDomainEventPtr event = NULL;
D
Daniel P. Berrange 已提交
3531

3532
    virCheckFlags(VIR_DOMAIN_START_PAUSED, NULL);
3533

3534
    qemuDriverLock(driver);
3535
    if (!(def = virDomainDefParseString(driver->caps, xml,
3536
                                        VIR_DOMAIN_XML_INACTIVE)))
3537
        goto cleanup;
3538

3539
    if (virSecurityManagerVerify(driver->securityManager, def) < 0)
3540 3541
        goto cleanup;

3542 3543
    if (virDomainObjIsDuplicate(&driver->domains, def, 1) < 0)
        goto cleanup;
3544

3545 3546 3547 3548 3549 3550
    if (qemudCanonicalizeMachine(driver, def) < 0)
        goto cleanup;

    if (qemuAssignPCIAddresses(def) < 0)
        goto cleanup;

3551
    if (!(vm = virDomainAssignDef(driver->caps,
3552
                                  &driver->domains,
3553
                                  def, false)))
3554 3555 3556
        goto cleanup;

    def = NULL;
D
Daniel P. Berrange 已提交
3557

3558 3559 3560
    if (qemuDomainObjBeginJobWithDriver(driver, vm) < 0)
        goto cleanup; /* XXXX free the 'vm' we created ? */

3561 3562
    if (qemudStartVMDaemon(conn, driver, vm, NULL,
                           (flags & VIR_DOMAIN_START_PAUSED) != 0,
3563
                           -1, NULL, VIR_VM_OP_CREATE) < 0) {
3564
        qemuDomainStartAudit(vm, "booted", false);
3565 3566 3567
        if (qemuDomainObjEndJob(vm) > 0)
            virDomainRemoveInactive(&driver->domains,
                                    vm);
3568
        vm = NULL;
3569
        goto cleanup;
D
Daniel P. Berrange 已提交
3570
    }
3571 3572 3573 3574

    event = virDomainEventNewFromObj(vm,
                                     VIR_DOMAIN_EVENT_STARTED,
                                     VIR_DOMAIN_EVENT_STARTED_BOOTED);
3575
    qemuDomainStartAudit(vm, "booted", true);
D
Daniel P. Berrange 已提交
3576

3577
    dom = virGetDomain(conn, vm->def->name, vm->def->uuid);
3578
    if (dom) dom->id = vm->def->id;
3579

3580 3581 3582
    if (vm &&
        qemuDomainObjEndJob(vm) == 0)
        vm = NULL;
3583

3584 3585
cleanup:
    virDomainDefFree(def);
3586 3587
    if (vm)
        virDomainObjUnlock(vm);
3588 3589
    if (event)
        qemuDomainEventQueue(driver, event);
3590
    qemuDriverUnlock(driver);
3591
    return dom;
D
Daniel P. Berrange 已提交
3592 3593 3594
}


3595
static int qemudDomainSuspend(virDomainPtr dom) {
3596 3597 3598
    struct qemud_driver *driver = dom->conn->privateData;
    virDomainObjPtr vm;
    int ret = -1;
3599
    virDomainEventPtr event = NULL;
3600
    qemuDomainObjPrivatePtr priv;
3601

3602
    qemuDriverLock(driver);
3603
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
3604

D
Daniel P. Berrange 已提交
3605
    if (!vm) {
3606 3607
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
3608 3609
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
3610
        goto cleanup;
D
Daniel P. Berrange 已提交
3611
    }
D
Daniel P. Berrange 已提交
3612
    if (!virDomainObjIsActive(vm)) {
3613 3614
        qemuReportError(VIR_ERR_OPERATION_INVALID,
                        "%s", _("domain is not running"));
3615
        goto cleanup;
D
Daniel P. Berrange 已提交
3616
    }
3617 3618 3619

    priv = vm->privateData;

3620
    if (priv->jobActive == QEMU_JOB_MIGRATION_OUT) {
3621 3622 3623 3624 3625 3626 3627 3628 3629 3630 3631 3632 3633 3634
        if (vm->state != VIR_DOMAIN_PAUSED) {
            VIR_DEBUG("Requesting domain pause on %s",
                      vm->def->name);
            priv->jobSignals |= QEMU_JOB_SIGNAL_SUSPEND;
        }
        ret = 0;
        goto cleanup;
    } else {
        if (qemuDomainObjBeginJobWithDriver(driver, vm) < 0)
            goto cleanup;

        if (!virDomainObjIsActive(vm)) {
            qemuReportError(VIR_ERR_OPERATION_INVALID,
                            "%s", _("domain is not running"));
3635
            goto endjob;
3636
        }
3637
        if (vm->state != VIR_DOMAIN_PAUSED) {
H
Hu Tao 已提交
3638
            if (doStopCPUs(driver, vm) < 0) {
3639
                goto endjob;
3640
            }
3641 3642 3643 3644 3645 3646 3647
            event = virDomainEventNewFromObj(vm,
                                             VIR_DOMAIN_EVENT_SUSPENDED,
                                             VIR_DOMAIN_EVENT_SUSPENDED_PAUSED);
        }
        if (virDomainSaveStatus(driver->caps, driver->stateDir, vm) < 0)
            goto endjob;
        ret = 0;
D
Daniel P. Berrange 已提交
3648
    }
3649

3650
endjob:
3651 3652
    if (qemuDomainObjEndJob(vm) == 0)
        vm = NULL;
3653

3654
cleanup:
3655 3656
    if (vm)
        virDomainObjUnlock(vm);
3657

3658
    if (event)
3659
        qemuDomainEventQueue(driver, event);
3660
    qemuDriverUnlock(driver);
3661
    return ret;
D
Daniel P. Berrange 已提交
3662 3663 3664
}


3665
static int qemudDomainResume(virDomainPtr dom) {
3666 3667 3668
    struct qemud_driver *driver = dom->conn->privateData;
    virDomainObjPtr vm;
    int ret = -1;
3669
    virDomainEventPtr event = NULL;
3670

3671
    qemuDriverLock(driver);
3672
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
3673

D
Daniel P. Berrange 已提交
3674
    if (!vm) {
3675 3676
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
3677 3678
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
3679
        goto cleanup;
D
Daniel P. Berrange 已提交
3680
    }
3681 3682 3683 3684

    if (qemuDomainObjBeginJobWithDriver(driver, vm) < 0)
        goto cleanup;

D
Daniel P. Berrange 已提交
3685
    if (!virDomainObjIsActive(vm)) {
3686 3687
        qemuReportError(VIR_ERR_OPERATION_INVALID,
                        "%s", _("domain is not running"));
3688
        goto endjob;
D
Daniel P. Berrange 已提交
3689
    }
3690
    if (vm->state == VIR_DOMAIN_PAUSED) {
H
Hu Tao 已提交
3691
        if (doStartCPUs(driver, vm, dom->conn) < 0) {
3692
            if (virGetLastError() == NULL)
3693 3694
                qemuReportError(VIR_ERR_OPERATION_FAILED,
                                "%s", _("resume operation failed"));
3695
            goto endjob;
3696
        }
3697 3698 3699
        event = virDomainEventNewFromObj(vm,
                                         VIR_DOMAIN_EVENT_RESUMED,
                                         VIR_DOMAIN_EVENT_RESUMED_UNPAUSED);
D
Daniel P. Berrange 已提交
3700
    }
3701
    if (virDomainSaveStatus(driver->caps, driver->stateDir, vm) < 0)
3702
        goto endjob;
3703 3704
    ret = 0;

3705
endjob:
3706 3707
    if (qemuDomainObjEndJob(vm) == 0)
        vm = NULL;
3708

3709
cleanup:
3710 3711
    if (vm)
        virDomainObjUnlock(vm);
3712
    if (event)
3713
        qemuDomainEventQueue(driver, event);
3714
    qemuDriverUnlock(driver);
3715
    return ret;
D
Daniel P. Berrange 已提交
3716 3717 3718
}


3719
static int qemudDomainShutdown(virDomainPtr dom) {
3720 3721 3722
    struct qemud_driver *driver = dom->conn->privateData;
    virDomainObjPtr vm;
    int ret = -1;
3723

3724
    qemuDriverLock(driver);
3725
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
3726 3727
    qemuDriverUnlock(driver);

3728
    if (!vm) {
3729 3730
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
3731 3732
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
3733
        goto cleanup;
3734 3735
    }

3736 3737 3738
    if (qemuDomainObjBeginJob(vm) < 0)
        goto cleanup;

D
Daniel P. Berrange 已提交
3739
    if (!virDomainObjIsActive(vm)) {
3740 3741
        qemuReportError(VIR_ERR_OPERATION_INVALID,
                        "%s", _("domain is not running"));
3742
        goto endjob;
3743 3744
    }

3745
    qemuDomainObjPrivatePtr priv = vm->privateData;
3746 3747 3748
    qemuDomainObjEnterMonitor(vm);
    ret = qemuMonitorSystemPowerdown(priv->mon);
    qemuDomainObjExitMonitor(vm);
3749

3750
endjob:
3751 3752
    if (qemuDomainObjEndJob(vm) == 0)
        vm = NULL;
3753

3754
cleanup:
3755 3756
    if (vm)
        virDomainObjUnlock(vm);
3757
    return ret;
3758 3759 3760
}


3761
static int qemudDomainDestroy(virDomainPtr dom) {
3762 3763 3764
    struct qemud_driver *driver = dom->conn->privateData;
    virDomainObjPtr vm;
    int ret = -1;
3765
    virDomainEventPtr event = NULL;
3766

3767
    qemuDriverLock(driver);
3768
    vm  = virDomainFindByUUID(&driver->domains, dom->uuid);
D
Daniel P. Berrange 已提交
3769
    if (!vm) {
3770 3771
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
3772 3773
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
3774
        goto cleanup;
D
Daniel P. Berrange 已提交
3775
    }
3776 3777 3778 3779

    if (qemuDomainObjBeginJobWithDriver(driver, vm) < 0)
        goto cleanup;

D
Daniel P. Berrange 已提交
3780
    if (!virDomainObjIsActive(vm)) {
3781 3782
        qemuReportError(VIR_ERR_OPERATION_INVALID,
                        "%s", _("domain is not running"));
3783
        goto endjob;
3784
    }
3785

3786
    qemudShutdownVMDaemon(driver, vm, 0);
3787 3788 3789
    event = virDomainEventNewFromObj(vm,
                                     VIR_DOMAIN_EVENT_STOPPED,
                                     VIR_DOMAIN_EVENT_STOPPED_DESTROYED);
3790 3791
    qemuDomainStopAudit(vm, "destroyed");

3792
    if (!vm->persistent) {
3793 3794 3795
        if (qemuDomainObjEndJob(vm) > 0)
            virDomainRemoveInactive(&driver->domains,
                                    vm);
3796 3797
        vm = NULL;
    }
3798 3799
    ret = 0;

3800
endjob:
3801 3802 3803
    if (vm &&
        qemuDomainObjEndJob(vm) == 0)
        vm = NULL;
3804

3805
cleanup:
3806 3807
    if (vm)
        virDomainObjUnlock(vm);
3808 3809
    if (event)
        qemuDomainEventQueue(driver, event);
3810
    qemuDriverUnlock(driver);
3811
    return ret;
D
Daniel P. Berrange 已提交
3812 3813 3814
}


3815
static char *qemudDomainGetOSType(virDomainPtr dom) {
3816 3817 3818
    struct qemud_driver *driver = dom->conn->privateData;
    virDomainObjPtr vm;
    char *type = NULL;
3819

3820
    qemuDriverLock(driver);
3821
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
3822
    qemuDriverUnlock(driver);
3823
    if (!vm) {
3824 3825
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
3826 3827
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
3828
        goto cleanup;
3829 3830
    }

3831
    if (!(type = strdup(vm->def->os.type)))
3832
        virReportOOMError();
3833 3834

cleanup:
3835 3836
    if (vm)
        virDomainObjUnlock(vm);
3837 3838 3839
    return type;
}

3840 3841
/* Returns max memory in kb, 0 if error */
static unsigned long qemudDomainGetMaxMemory(virDomainPtr dom) {
3842 3843 3844
    struct qemud_driver *driver = dom->conn->privateData;
    virDomainObjPtr vm;
    unsigned long ret = 0;
3845

3846
    qemuDriverLock(driver);
3847
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
3848 3849
    qemuDriverUnlock(driver);

3850
    if (!vm) {
3851 3852
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
3853 3854
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
3855
        goto cleanup;
3856 3857
    }

3858
    ret = vm->def->mem.max_balloon;
3859 3860

cleanup:
3861 3862
    if (vm)
        virDomainObjUnlock(vm);
3863
    return ret;
3864 3865 3866
}

static int qemudDomainSetMemory(virDomainPtr dom, unsigned long newmem) {
3867
    struct qemud_driver *driver = dom->conn->privateData;
3868
    qemuDomainObjPrivatePtr priv;
3869
    virDomainObjPtr vm;
3870
    int ret = -1, r;
3871

3872
    qemuDriverLock(driver);
3873
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
3874
    qemuDriverUnlock(driver);
3875
    if (!vm) {
3876 3877
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
3878 3879
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
3880
        goto cleanup;
3881 3882
    }

3883
    if (newmem > vm->def->mem.max_balloon) {
3884 3885
        qemuReportError(VIR_ERR_INVALID_ARG,
                        "%s", _("cannot set memory higher than max memory"));
3886
        goto cleanup;
3887 3888
    }

3889 3890 3891
    if (qemuDomainObjBeginJob(vm) < 0)
        goto cleanup;

3892 3893 3894 3895 3896 3897
    if (!virDomainObjIsActive(vm)) {
        qemuReportError(VIR_ERR_OPERATION_INVALID,
                        "%s", _("domain is not running"));
        goto endjob;
    }

3898 3899 3900 3901 3902 3903
    priv = vm->privateData;
    qemuDomainObjEnterMonitor(vm);
    r = qemuMonitorSetBalloon(priv->mon, newmem);
    qemuDomainObjExitMonitor(vm);
    if (r < 0)
        goto endjob;
3904

3905 3906 3907 3908 3909
    /* Lack of balloon support is a fatal error */
    if (r == 0) {
        qemuReportError(VIR_ERR_NO_SUPPORT,
                        "%s", _("cannot set memory of an active domain"));
        goto endjob;
3910
    }
3911

3912
    ret = 0;
3913
endjob:
3914 3915
    if (qemuDomainObjEndJob(vm) == 0)
        vm = NULL;
3916

3917
cleanup:
3918 3919
    if (vm)
        virDomainObjUnlock(vm);
3920
    return ret;
3921 3922
}

3923
static int qemudDomainGetInfo(virDomainPtr dom,
3924
                              virDomainInfoPtr info) {
3925 3926 3927
    struct qemud_driver *driver = dom->conn->privateData;
    virDomainObjPtr vm;
    int ret = -1;
3928 3929
    int err;
    unsigned long balloon;
3930

3931
    qemuDriverLock(driver);
3932
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
3933
    qemuDriverUnlock(driver);
D
Daniel P. Berrange 已提交
3934
    if (!vm) {
3935 3936
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
3937 3938
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
3939
        goto cleanup;
D
Daniel P. Berrange 已提交
3940 3941
    }

3942
    info->state = vm->state;
D
Daniel P. Berrange 已提交
3943

D
Daniel P. Berrange 已提交
3944
    if (!virDomainObjIsActive(vm)) {
3945
        info->cpuTime = 0;
D
Daniel P. Berrange 已提交
3946
    } else {
3947
        if (qemudGetProcessInfo(&(info->cpuTime), NULL, vm->pid, 0) < 0) {
3948
            qemuReportError(VIR_ERR_OPERATION_FAILED, ("cannot read cputime for domain"));
3949
            goto cleanup;
D
Daniel P. Berrange 已提交
3950 3951 3952
        }
    }

3953
    info->maxMem = vm->def->mem.max_balloon;
3954

D
Daniel P. Berrange 已提交
3955
    if (virDomainObjIsActive(vm)) {
3956
        qemuDomainObjPrivatePtr priv = vm->privateData;
3957 3958 3959

        if ((vm->def->memballoon != NULL) &&
            (vm->def->memballoon->model == VIR_DOMAIN_MEMBALLOON_MODEL_NONE)) {
3960
            info->memory = vm->def->mem.max_balloon;
3961
        } else if (!priv->jobActive) {
3962 3963
            if (qemuDomainObjBeginJob(vm) < 0)
                goto cleanup;
3964 3965 3966 3967 3968 3969 3970 3971 3972
            if (!virDomainObjIsActive(vm))
                err = 0;
            else {
                qemuDomainObjEnterMonitor(vm);
                err = qemuMonitorGetBalloonInfo(priv->mon, &balloon);
                qemuDomainObjExitMonitor(vm);
            }
            if (qemuDomainObjEndJob(vm) == 0) {
                vm = NULL;
3973 3974 3975
                goto cleanup;
            }

3976 3977
            if (err < 0)
                goto cleanup;
3978 3979
            if (err == 0)
                /* Balloon not supported, so maxmem is always the allocation */
3980
                info->memory = vm->def->mem.max_balloon;
3981 3982 3983
            else
                info->memory = balloon;
        } else {
3984
            info->memory = vm->def->mem.cur_balloon;
3985
        }
3986
    } else {
3987
        info->memory = vm->def->mem.cur_balloon;
3988 3989
    }

3990
    info->nrVirtCpu = vm->def->vcpus;
3991 3992 3993
    ret = 0;

cleanup:
3994 3995
    if (vm)
        virDomainObjUnlock(vm);
3996
    return ret;
D
Daniel P. Berrange 已提交
3997 3998 3999
}


4000 4001 4002 4003 4004 4005 4006 4007 4008
/** qemuDomainMigrateOffline:
 * Pause domain for non-live migration.
 */
static int
qemuDomainMigrateOffline(struct qemud_driver *driver,
                         virDomainObjPtr vm)
{
    int ret;

H
Hu Tao 已提交
4009
    ret = doStopCPUs(driver, vm);
4010 4011 4012 4013 4014 4015 4016 4017
    if (ret == 0) {
        virDomainEventPtr event;

        event = virDomainEventNewFromObj(vm,
                                         VIR_DOMAIN_EVENT_SUSPENDED,
                                         VIR_DOMAIN_EVENT_SUSPENDED_MIGRATED);
        if (event)
            qemuDomainEventQueue(driver, event);
H
Hu Tao 已提交
4018
    }
4019 4020 4021 4022 4023

    return ret;
}


4024 4025 4026 4027 4028 4029 4030 4031 4032 4033 4034 4035 4036 4037
static int
qemuDomainWaitForMigrationComplete(struct qemud_driver *driver, virDomainObjPtr vm)
{
    int ret = -1;
    int status;
    unsigned long long memProcessed;
    unsigned long long memRemaining;
    unsigned long long memTotal;
    qemuDomainObjPrivatePtr priv = vm->privateData;

    priv->jobInfo.type = VIR_DOMAIN_JOB_UNBOUNDED;

    while (priv->jobInfo.type == VIR_DOMAIN_JOB_UNBOUNDED) {
        /* Poll every 50ms for progress & to allow cancellation */
4038
        struct timespec ts = { .tv_sec = 0, .tv_nsec = 50 * 1000 * 1000ull };
4039 4040
        struct timeval now;
        int rc;
O
Osier Yang 已提交
4041 4042 4043 4044 4045 4046 4047 4048 4049 4050 4051 4052 4053 4054 4055 4056
        const char *job;

        switch (priv->jobActive) {
            case QEMU_JOB_MIGRATION_OUT:
                job = _("migration job");
                break;
            case QEMU_JOB_SAVE:
                job = _("domain save job");
                break;
            case QEMU_JOB_DUMP:
                job = _("domain core dump job");
                break;
            default:
                job = _("job");
        }

4057

4058
        if (!virDomainObjIsActive(vm)) {
O
Osier Yang 已提交
4059 4060
            qemuReportError(VIR_ERR_INTERNAL_ERROR, "%s: %s",
                            job, _("guest unexpectedly quit"));
4061 4062 4063
            goto cleanup;
        }

4064 4065
        if (priv->jobSignals & QEMU_JOB_SIGNAL_CANCEL) {
            priv->jobSignals ^= QEMU_JOB_SIGNAL_CANCEL;
O
Osier Yang 已提交
4066
            VIR_DEBUG0("Cancelling job at client request");
4067 4068 4069 4070
            qemuDomainObjEnterMonitorWithDriver(driver, vm);
            rc = qemuMonitorMigrateCancel(priv->mon);
            qemuDomainObjExitMonitorWithDriver(driver, vm);
            if (rc < 0) {
O
Osier Yang 已提交
4071
                VIR_WARN0("Unable to cancel job");
4072
            }
4073 4074 4075 4076 4077
        } else if (priv->jobSignals & QEMU_JOB_SIGNAL_SUSPEND) {
            priv->jobSignals ^= QEMU_JOB_SIGNAL_SUSPEND;
            VIR_DEBUG0("Pausing domain for non-live migration");
            if (qemuDomainMigrateOffline(driver, vm) < 0)
                VIR_WARN0("Unable to pause domain");
4078 4079 4080 4081 4082 4083 4084 4085 4086 4087 4088
        } else if (priv->jobSignals & QEMU_JOB_SIGNAL_MIGRATE_DOWNTIME) {
            unsigned long long ms = priv->jobSignalsData.migrateDowntime;

            priv->jobSignals ^= QEMU_JOB_SIGNAL_MIGRATE_DOWNTIME;
            priv->jobSignalsData.migrateDowntime = 0;
            VIR_DEBUG("Setting migration downtime to %llums", ms);
            qemuDomainObjEnterMonitorWithDriver(driver, vm);
            rc = qemuMonitorSetMigrationDowntime(priv->mon, ms);
            qemuDomainObjExitMonitorWithDriver(driver, vm);
            if (rc < 0)
                VIR_WARN0("Unable to set migration downtime");
4089 4090
        }

4091 4092 4093 4094
        /* Repeat check because the job signals might have caused
         * guest to die
         */
        if (!virDomainObjIsActive(vm)) {
O
Osier Yang 已提交
4095 4096
            qemuReportError(VIR_ERR_INTERNAL_ERROR, "%s: %s",
                            job, _("guest unexpectedly quit"));
4097 4098 4099
            goto cleanup;
        }

4100 4101 4102 4103 4104 4105 4106 4107 4108 4109 4110 4111 4112 4113 4114 4115 4116 4117 4118
        qemuDomainObjEnterMonitorWithDriver(driver, vm);
        rc = qemuMonitorGetMigrationStatus(priv->mon,
                                           &status,
                                           &memProcessed,
                                           &memRemaining,
                                           &memTotal);
        qemuDomainObjExitMonitorWithDriver(driver, vm);

        if (rc < 0) {
            priv->jobInfo.type = VIR_DOMAIN_JOB_FAILED;
            goto cleanup;
        }

        if (gettimeofday(&now, NULL) < 0) {
            priv->jobInfo.type = VIR_DOMAIN_JOB_FAILED;
            virReportSystemError(errno, "%s",
                                 _("cannot get time of day"));
            goto cleanup;
        }
4119
        priv->jobInfo.timeElapsed = timeval_to_ms(now) - priv->jobStart;
4120 4121 4122 4123 4124

        switch (status) {
        case QEMU_MONITOR_MIGRATION_STATUS_INACTIVE:
            priv->jobInfo.type = VIR_DOMAIN_JOB_NONE;
            qemuReportError(VIR_ERR_OPERATION_FAILED,
O
Osier Yang 已提交
4125
                            "%s: %s", job, _("is not active"));
4126 4127 4128 4129 4130 4131 4132 4133 4134 4135 4136 4137 4138 4139 4140 4141 4142 4143 4144 4145
            break;

        case QEMU_MONITOR_MIGRATION_STATUS_ACTIVE:
            priv->jobInfo.dataTotal = memTotal;
            priv->jobInfo.dataRemaining = memRemaining;
            priv->jobInfo.dataProcessed = memProcessed;

            priv->jobInfo.memTotal = memTotal;
            priv->jobInfo.memRemaining = memRemaining;
            priv->jobInfo.memProcessed = memProcessed;
            break;

        case QEMU_MONITOR_MIGRATION_STATUS_COMPLETED:
            priv->jobInfo.type = VIR_DOMAIN_JOB_COMPLETED;
            ret = 0;
            break;

        case QEMU_MONITOR_MIGRATION_STATUS_ERROR:
            priv->jobInfo.type = VIR_DOMAIN_JOB_FAILED;
            qemuReportError(VIR_ERR_OPERATION_FAILED,
O
Osier Yang 已提交
4146
                            "%s: %s", job, _("unexpectedly failed"));
4147 4148 4149 4150 4151
            break;

        case QEMU_MONITOR_MIGRATION_STATUS_CANCELLED:
            priv->jobInfo.type = VIR_DOMAIN_JOB_CANCELLED;
            qemuReportError(VIR_ERR_OPERATION_FAILED,
O
Osier Yang 已提交
4152
                            "%s: %s", job, _("canceled by client"));
4153 4154 4155 4156 4157 4158 4159 4160 4161 4162 4163 4164 4165 4166 4167 4168 4169
            break;
        }

        virDomainObjUnlock(vm);
        qemuDriverUnlock(driver);

        nanosleep(&ts, NULL);

        qemuDriverLock(driver);
        virDomainObjLock(vm);
    }

cleanup:
    return ret;
}


4170
#define QEMUD_SAVE_MAGIC "LibvirtQemudSave"
4171 4172 4173
#define QEMUD_SAVE_VERSION 2

enum qemud_save_formats {
4174 4175 4176
    QEMUD_SAVE_FORMAT_RAW = 0,
    QEMUD_SAVE_FORMAT_GZIP = 1,
    QEMUD_SAVE_FORMAT_BZIP2 = 2,
4177 4178
    /*
     * Deprecated by xz and never used as part of a release
4179
     * QEMUD_SAVE_FORMAT_LZMA
4180 4181
     */
    QEMUD_SAVE_FORMAT_XZ = 3,
4182
    QEMUD_SAVE_FORMAT_LZOP = 4,
4183 4184 4185
    /* Note: add new members only at the end.
       These values are used in the on-disk format.
       Do not change or re-use numbers. */
4186 4187

    QEMUD_SAVE_FORMAT_LAST
4188
};
4189

4190 4191 4192 4193 4194
VIR_ENUM_DECL(qemudSaveCompression)
VIR_ENUM_IMPL(qemudSaveCompression, QEMUD_SAVE_FORMAT_LAST,
              "raw",
              "gzip",
              "bzip2",
4195 4196
              "xz",
              "lzop")
4197

4198 4199 4200 4201 4202
struct qemud_save_header {
    char magic[sizeof(QEMUD_SAVE_MAGIC)-1];
    int version;
    int xml_len;
    int was_running;
4203 4204
    int compressed;
    int unused[15];
4205 4206
};

4207 4208 4209 4210 4211 4212 4213
struct fileOpHookData {
    virDomainPtr dom;
    const char *path;
    char *xml;
    struct qemud_save_header *header;
};

4214
/* return -errno on failure, or 0 on success */
4215 4216 4217 4218 4219
static int qemudDomainSaveFileOpHook(int fd, void *data) {
    struct fileOpHookData *hdata = data;
    int ret = 0;

    if (safewrite(fd, hdata->header, sizeof(*hdata->header)) != sizeof(*hdata->header)) {
4220
        ret = -errno;
4221
        qemuReportError(VIR_ERR_OPERATION_FAILED,
4222 4223
                        _("failed to write header to domain save file '%s'"),
                        hdata->path);
4224 4225 4226 4227
        goto endjob;
    }

    if (safewrite(fd, hdata->xml, hdata->header->xml_len) != hdata->header->xml_len) {
4228
        ret = -errno;
4229 4230 4231 4232 4233 4234 4235 4236
        qemuReportError(VIR_ERR_OPERATION_FAILED,
                         _("failed to write xml to '%s'"), hdata->path);
        goto endjob;
    }
endjob:
    return ret;
}

4237 4238 4239
/* this internal function expects the driver lock to already be held on entry */
static int qemudDomainSaveFlag(struct qemud_driver *driver, virDomainPtr dom,
                               virDomainObjPtr vm, const char *path,
4240
                               int compressed)
4241
{
4242
    char *xml = NULL;
4243
    struct qemud_save_header header;
4244 4245
    struct fileOpHookData hdata;
    int bypassSecurityDriver = 0;
4246
    int ret = -1;
4247
    int rc;
4248
    virDomainEventPtr event = NULL;
4249
    qemuDomainObjPrivatePtr priv;
4250 4251
    struct stat sb;
    int is_reg = 0;
4252
    unsigned long long offset;
4253
    virCgroupPtr cgroup = NULL;
4254 4255 4256 4257 4258

    memset(&header, 0, sizeof(header));
    memcpy(header.magic, QEMUD_SAVE_MAGIC, sizeof(header.magic));
    header.version = QEMUD_SAVE_VERSION;

4259
    header.compressed = compressed;
4260

4261
    priv = vm->privateData;
4262

4263 4264 4265
    if (qemuDomainObjBeginJobWithDriver(driver, vm) < 0)
        goto cleanup;

D
Daniel P. Berrange 已提交
4266
    if (!virDomainObjIsActive(vm)) {
4267 4268
        qemuReportError(VIR_ERR_OPERATION_INVALID,
                        "%s", _("domain is not running"));
4269
        goto endjob;
D
Daniel P. Berrange 已提交
4270
    }
4271

O
Osier Yang 已提交
4272 4273
    priv->jobActive = QEMU_JOB_SAVE;

4274 4275 4276
    memset(&priv->jobInfo, 0, sizeof(priv->jobInfo));
    priv->jobInfo.type = VIR_DOMAIN_JOB_UNBOUNDED;

4277 4278 4279
    /* Pause */
    if (vm->state == VIR_DOMAIN_RUNNING) {
        header.was_running = 1;
H
Hu Tao 已提交
4280
        if (doStopCPUs(driver, vm) < 0)
4281
            goto endjob;
4282 4283 4284 4285 4286 4287

        if (!virDomainObjIsActive(vm)) {
            qemuReportError(VIR_ERR_INTERNAL_ERROR, "%s",
                            _("guest unexpectedly quit"));
            goto endjob;
        }
4288 4289 4290
    }

    /* Get XML for the domain */
4291
    xml = virDomainDefFormat(vm->def, VIR_DOMAIN_XML_SECURE);
4292
    if (!xml) {
4293 4294
        qemuReportError(VIR_ERR_OPERATION_FAILED,
                        "%s", _("failed to get domain xml"));
4295
        goto endjob;
4296 4297 4298
    }
    header.xml_len = strlen(xml) + 1;

4299 4300 4301 4302 4303 4304 4305 4306 4307 4308 4309 4310 4311
    /* path might be a pre-existing block dev, in which case
     * we need to skip the create step, and also avoid unlink
     * in the failure case */
    if (stat(path, &sb) < 0) {
        /* Avoid throwing an error here, since it is possible
         * that with NFS we can't actually stat() the file.
         * The subsequent codepaths will still raise an error
         * if a truely fatal problem is hit */
        is_reg = 1;
    } else {
        is_reg = S_ISREG(sb.st_mode);
    }

4312 4313 4314 4315 4316
    offset = sizeof(header) + header.xml_len;

    /* Due to way we append QEMU state on our header with dd,
     * we need to ensure there's a 512 byte boundary. Unfortunately
     * we don't have an explicit offset in the header, so we fake
4317 4318
     * it by padding the XML string with NULLs.
     */
4319 4320 4321 4322 4323 4324 4325 4326 4327 4328 4329 4330 4331
    if (offset % QEMU_MONITOR_MIGRATE_TO_FILE_BS) {
        unsigned long long pad =
            QEMU_MONITOR_MIGRATE_TO_FILE_BS -
            (offset % QEMU_MONITOR_MIGRATE_TO_FILE_BS);

        if (VIR_REALLOC_N(xml, header.xml_len + pad) < 0) {
            virReportOOMError();
            goto endjob;
        }
        memset(xml + header.xml_len, 0, pad);
        offset += pad;
        header.xml_len += pad;
    }
4332

4333 4334 4335 4336 4337 4338
    /* Setup hook data needed by virFileOperation hook function */
    hdata.dom = dom;
    hdata.path = path;
    hdata.xml = xml;
    hdata.header = &header;

4339 4340
    /* Write header to file, followed by XML */

4341
    /* First try creating the file as root */
4342 4343 4344 4345
    if (!is_reg) {
        int fd = open(path, O_WRONLY | O_TRUNC);
        if (fd < 0) {
            virReportSystemError(errno, _("unable to open %s"), path);
4346 4347
            goto endjob;
        }
4348
        if (qemudDomainSaveFileOpHook(fd, &hdata) < 0) {
4349
            VIR_FORCE_CLOSE(fd);
4350 4351
            goto endjob;
        }
4352
        if (VIR_CLOSE(fd) < 0) {
4353
            virReportSystemError(errno, _("unable to close %s"), path);
4354 4355
            goto endjob;
        }
4356 4357 4358 4359 4360
    } else {
        if ((rc = virFileOperation(path, O_CREAT|O_TRUNC|O_WRONLY,
                                  S_IRUSR|S_IWUSR,
                                  getuid(), getgid(),
                                  qemudDomainSaveFileOpHook, &hdata,
4361
                                  0)) < 0) {
4362
            /* If we failed as root, and the error was permission-denied
4363 4364
               (EACCES or EPERM), assume it's on a network-connected share
               where root access is restricted (eg, root-squashed NFS). If the
4365 4366 4367 4368
               qemu user (driver->user) is non-root, just set a flag to
               bypass security driver shenanigans, and retry the operation
               after doing setuid to qemu user */

4369
            if (((rc != -EACCES) && (rc != -EPERM)) ||
4370
                driver->user == getuid()) {
4371
                virReportSystemError(-rc, _("Failed to create domain save file '%s'"),
4372 4373 4374
                                     path);
                goto endjob;
            }
4375

4376
            /* On Linux we can also verify the FS-type of the directory. */
4377 4378 4379 4380 4381 4382 4383 4384 4385 4386 4387 4388 4389 4390 4391 4392 4393 4394
            switch (virStorageFileIsSharedFS(path)) {
                case 1:
                   /* it was on a network share, so we'll continue
                    * as outlined above
                    */
                   break;

                case -1:
                   virReportSystemError(errno,
                                        _("Failed to create domain save file "
                                          "'%s': couldn't determine fs type"),
                                        path);
                   goto endjob;
                   break;

                case 0:
                default:
                   /* local file - log the error returned by virFileOperation */
4395
                   virReportSystemError(-rc,
4396 4397 4398 4399
                                        _("Failed to create domain save file '%s'"),
                                        path);
                   goto endjob;
                   break;
4400 4401 4402

            }

4403
            /* Retry creating the file as driver->user */
4404

4405 4406 4407 4408
            if ((rc = virFileOperation(path, O_CREAT|O_TRUNC|O_WRONLY,
                                       S_IRUSR|S_IWUSR|S_IRGRP|S_IWGRP,
                                       driver->user, driver->group,
                                       qemudDomainSaveFileOpHook, &hdata,
4409 4410
                                       VIR_FILE_OP_AS_UID)) < 0) {
                virReportSystemError(-rc, _("Error from child process creating '%s'"),
4411
                                 path);
4412 4413
                goto endjob;
            }
4414

4415 4416 4417
            /* Since we had to setuid to create the file, and the fstype
               is NFS, we assume it's a root-squashing NFS share, and that
               the security driver stuff would have failed anyway */
4418

4419 4420
            bypassSecurityDriver = 1;
        }
4421
    }
4422

4423

4424 4425 4426 4427 4428 4429 4430 4431 4432 4433 4434 4435 4436 4437 4438 4439 4440
    if (!is_reg &&
        qemuCgroupControllerActive(driver, VIR_CGROUP_CONTROLLER_DEVICES)) {
        if (virCgroupForDomain(driver->cgroup, vm->def->name, &cgroup, 0) != 0) {
            qemuReportError(VIR_ERR_INTERNAL_ERROR,
                            _("Unable to find cgroup for %s\n"),
                            vm->def->name);
            goto endjob;
        }
        rc = virCgroupAllowDevicePath(cgroup, path);
        if (rc != 0) {
            virReportSystemError(-rc,
                                 _("Unable to allow device %s for %s"),
                                 path, vm->def->name);
            goto endjob;
        }
    }

4441
    if ((!bypassSecurityDriver) &&
4442 4443
        virSecurityManagerSetSavedStateLabel(driver->securityManager,
                                             vm, path) < 0)
4444 4445
        goto endjob;

4446 4447
    if (header.compressed == QEMUD_SAVE_FORMAT_RAW) {
        const char *args[] = { "cat", NULL };
M
Matthias Bolte 已提交
4448
        qemuDomainObjEnterMonitorWithDriver(driver, vm);
4449 4450 4451
        rc = qemuMonitorMigrateToFile(priv->mon,
                                      QEMU_MONITOR_MIGRATE_BACKGROUND,
                                      args, path, offset);
M
Matthias Bolte 已提交
4452
        qemuDomainObjExitMonitorWithDriver(driver, vm);
4453
    } else {
4454
        const char *prog = qemudSaveCompressionTypeToString(header.compressed);
4455 4456 4457 4458 4459
        const char *args[] = {
            prog,
            "-c",
            NULL
        };
M
Matthias Bolte 已提交
4460
        qemuDomainObjEnterMonitorWithDriver(driver, vm);
4461 4462 4463
        rc = qemuMonitorMigrateToFile(priv->mon,
                                      QEMU_MONITOR_MIGRATE_BACKGROUND,
                                      args, path, offset);
M
Matthias Bolte 已提交
4464
        qemuDomainObjExitMonitorWithDriver(driver, vm);
4465 4466
    }

4467 4468 4469 4470 4471
    if (rc < 0)
        goto endjob;

    rc = qemuDomainWaitForMigrationComplete(driver, vm);

4472
    if (rc < 0)
4473
        goto endjob;
4474

4475
    if ((!bypassSecurityDriver) &&
4476 4477
        virSecurityManagerRestoreSavedStateLabel(driver->securityManager,
                                                 vm, path) < 0)
4478
        VIR_WARN("failed to restore save state label on %s", path);
4479

4480 4481
    if (cgroup != NULL) {
        rc = virCgroupDenyDevicePath(cgroup, path);
4482 4483 4484
        if (rc != 0)
            VIR_WARN("Unable to deny device %s for %s %d",
                     path, vm->def->name, rc);
4485 4486
    }

4487 4488
    ret = 0;

4489
    /* Shut it down */
4490
    qemudShutdownVMDaemon(driver, vm, 0);
4491
    qemuDomainStopAudit(vm, "saved");
4492 4493 4494
    event = virDomainEventNewFromObj(vm,
                                     VIR_DOMAIN_EVENT_STOPPED,
                                     VIR_DOMAIN_EVENT_STOPPED_SAVED);
4495
    if (!vm->persistent) {
4496 4497 4498
        if (qemuDomainObjEndJob(vm) > 0)
            virDomainRemoveInactive(&driver->domains,
                                    vm);
4499 4500
        vm = NULL;
    }
4501

4502
endjob:
4503
    if (vm) {
4504
        if (ret != 0) {
4505
            if (header.was_running && virDomainObjIsActive(vm)) {
H
Hu Tao 已提交
4506
                rc = doStartCPUs(driver, vm, dom->conn);
4507 4508 4509
                if (rc < 0)
                    VIR_WARN0("Unable to resume guest CPUs after save failure");
            }
4510

4511 4512 4513 4514 4515
            if (cgroup != NULL) {
                rc = virCgroupDenyDevicePath(cgroup, path);
                if (rc != 0)
                    VIR_WARN("Unable to deny device %s for %s: %d",
                             path, vm->def->name, rc);
4516
            }
4517 4518

            if ((!bypassSecurityDriver) &&
4519 4520
                virSecurityManagerRestoreSavedStateLabel(driver->securityManager,
                                                         vm, path) < 0)
4521
                VIR_WARN("failed to restore save state label on %s", path);
4522 4523
        }

4524
        if (qemuDomainObjEndJob(vm) == 0)
4525
            vm = NULL;
4526
    }
4527

4528 4529
cleanup:
    VIR_FREE(xml);
4530
    if (ret != 0 && is_reg)
4531
        unlink(path);
4532 4533
    if (event)
        qemuDomainEventQueue(driver, event);
4534
    virCgroupFree(&cgroup);
4535
    return ret;
D
Daniel P. Berrange 已提交
4536 4537
}

4538 4539 4540 4541 4542 4543 4544 4545 4546 4547 4548 4549 4550 4551 4552 4553
/* Returns true if a compression program is available in PATH */
static bool qemudCompressProgramAvailable(enum qemud_save_formats compress)
{
    const char *prog;
    char *c;

    if (compress == QEMUD_SAVE_FORMAT_RAW)
        return true;
    prog = qemudSaveCompressionTypeToString(compress);
    c = virFindFileInPath(prog);
    if (!c)
        return false;
    VIR_FREE(c);
    return true;
}

4554 4555 4556 4557
static int qemudDomainSave(virDomainPtr dom, const char *path)
{
    struct qemud_driver *driver = dom->conn->privateData;
    int compressed;
4558 4559 4560 4561
    int ret = -1;
    virDomainObjPtr vm = NULL;

    qemuDriverLock(driver);
4562 4563 4564 4565 4566 4567 4568 4569 4570 4571 4572

    if (driver->saveImageFormat == NULL)
        compressed = QEMUD_SAVE_FORMAT_RAW;
    else {
        compressed = qemudSaveCompressionTypeFromString(driver->saveImageFormat);
        if (compressed < 0) {
            qemuReportError(VIR_ERR_OPERATION_FAILED,
                            "%s", _("Invalid save image format specified "
                                    "in configuration file"));
            return -1;
        }
4573 4574 4575 4576 4577 4578
        if (!qemudCompressProgramAvailable(compressed)) {
            qemuReportError(VIR_ERR_OPERATION_FAILED,
                            "%s", _("Compression program for image format "
                                    "in configuration file isn't available"));
            return -1;
        }
4579 4580
    }

4581 4582 4583 4584 4585 4586 4587 4588 4589 4590 4591 4592 4593 4594 4595 4596 4597
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
    if (!vm) {
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
        goto cleanup;
    }

    ret = qemudDomainSaveFlag(driver, dom, vm, path, compressed);

cleanup:
    if (vm)
        virDomainObjUnlock(vm);
    qemuDriverUnlock(driver);

    return ret;
4598 4599 4600 4601 4602 4603 4604 4605 4606 4607 4608 4609 4610 4611 4612 4613 4614 4615 4616 4617 4618 4619 4620
}

static char *
qemuDomainManagedSavePath(struct qemud_driver *driver, virDomainObjPtr vm) {
    char *ret;

    if (virAsprintf(&ret, "%s/%s.save", driver->saveDir, vm->def->name) < 0) {
        virReportOOMError();
        return(NULL);
    }

    return(ret);
}

static int
qemuDomainManagedSave(virDomainPtr dom, unsigned int flags)
{
    struct qemud_driver *driver = dom->conn->privateData;
    virDomainObjPtr vm = NULL;
    char *name = NULL;
    int ret = -1;
    int compressed;

4621
    virCheckFlags(0, -1);
4622 4623 4624 4625 4626 4627 4628 4629

    qemuDriverLock(driver);
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
    if (!vm) {
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
4630
        goto cleanup;
4631 4632 4633 4634
    }

    name = qemuDomainManagedSavePath(driver, vm);
    if (name == NULL)
4635
        goto cleanup;
4636 4637 4638 4639

    VIR_DEBUG("Saving state to %s", name);

    compressed = QEMUD_SAVE_FORMAT_RAW;
4640
    ret = qemudDomainSaveFlag(driver, dom, vm, name, compressed);
4641 4642 4643 4644 4645

cleanup:
    if (vm)
        virDomainObjUnlock(vm);
    qemuDriverUnlock(driver);
4646 4647 4648
    VIR_FREE(name);

    return ret;
4649 4650 4651 4652 4653 4654 4655 4656 4657 4658
}

static int
qemuDomainHasManagedSaveImage(virDomainPtr dom, unsigned int flags)
{
    struct qemud_driver *driver = dom->conn->privateData;
    virDomainObjPtr vm = NULL;
    int ret = -1;
    char *name = NULL;

4659
    virCheckFlags(0, -1);
4660 4661 4662 4663 4664 4665 4666 4667 4668 4669 4670 4671 4672 4673 4674 4675 4676 4677 4678 4679 4680 4681 4682 4683 4684 4685 4686 4687 4688 4689 4690 4691 4692

    qemuDriverLock(driver);
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
    if (!vm) {
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
        goto cleanup;
    }

    name = qemuDomainManagedSavePath(driver, vm);
    if (name == NULL)
        goto cleanup;

    ret = virFileExists(name);

cleanup:
    VIR_FREE(name);
    if (vm)
        virDomainObjUnlock(vm);
    qemuDriverUnlock(driver);
    return ret;
}

static int
qemuDomainManagedSaveRemove(virDomainPtr dom, unsigned int flags)
{
    struct qemud_driver *driver = dom->conn->privateData;
    virDomainObjPtr vm = NULL;
    int ret = -1;
    char *name = NULL;

4693
    virCheckFlags(0, -1);
4694 4695 4696 4697 4698 4699 4700 4701 4702 4703 4704 4705 4706 4707 4708 4709 4710 4711 4712 4713 4714 4715 4716 4717

    qemuDriverLock(driver);
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
    if (!vm) {
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
        goto cleanup;
    }

    name = qemuDomainManagedSavePath(driver, vm);
    if (name == NULL)
        goto cleanup;

    ret = unlink(name);

cleanup:
    VIR_FREE(name);
    if (vm)
        virDomainObjUnlock(vm);
    qemuDriverUnlock(driver);
    return ret;
}
D
Daniel P. Berrange 已提交
4718

H
Hu Tao 已提交
4719 4720 4721 4722 4723 4724 4725 4726 4727 4728 4729 4730 4731 4732 4733 4734 4735 4736 4737 4738 4739 4740 4741 4742 4743
static int doCoreDump(struct qemud_driver *driver,
                      virDomainObjPtr vm,
                      const char *path,
                      enum qemud_save_formats compress)
{
    int fd = -1;
    int ret = -1;
    qemuDomainObjPrivatePtr priv;

    priv = vm->privateData;

    /* Create an empty file with appropriate ownership.  */
    if ((fd = open(path, O_CREAT|O_TRUNC|O_WRONLY, S_IRUSR|S_IWUSR)) < 0) {
        qemuReportError(VIR_ERR_OPERATION_FAILED,
                        _("failed to create '%s'"), path);
        goto cleanup;
    }

    if (VIR_CLOSE(fd) < 0) {
        virReportSystemError(errno,
                             _("unable to save file %s"),
                             path);
        goto cleanup;
    }

4744 4745
    if (virSecurityManagerSetSavedStateLabel(driver->securityManager,
                                             vm, path) < 0)
H
Hu Tao 已提交
4746 4747 4748 4749 4750 4751 4752 4753 4754 4755 4756 4757 4758 4759 4760 4761 4762 4763 4764 4765 4766 4767 4768 4769 4770 4771 4772 4773 4774 4775 4776
        goto cleanup;

    qemuDomainObjEnterMonitorWithDriver(driver, vm);
    if (compress == QEMUD_SAVE_FORMAT_RAW) {
        const char *args[] = {
            "cat",
            NULL,
        };
        ret = qemuMonitorMigrateToFile(priv->mon,
                                       QEMU_MONITOR_MIGRATE_BACKGROUND,
                                       args, path, 0);
    } else {
        const char *prog = qemudSaveCompressionTypeToString(compress);
        const char *args[] = {
            prog,
            "-c",
            NULL,
        };
        ret = qemuMonitorMigrateToFile(priv->mon,
                                       QEMU_MONITOR_MIGRATE_BACKGROUND,
                                       args, path, 0);
    }
    qemuDomainObjExitMonitorWithDriver(driver, vm);
    if (ret < 0)
        goto cleanup;

    ret = qemuDomainWaitForMigrationComplete(driver, vm);

    if (ret < 0)
        goto cleanup;

4777 4778
    if (virSecurityManagerRestoreSavedStateLabel(driver->securityManager,
                                                 vm, path) < 0)
H
Hu Tao 已提交
4779 4780 4781 4782 4783 4784 4785 4786
        goto cleanup;

cleanup:
    if (ret != 0)
        unlink(path);
    return ret;
}

4787 4788 4789 4790 4791
static enum qemud_save_formats
getCompressionType(struct qemud_driver *driver)
{
    int compress = QEMUD_SAVE_FORMAT_RAW;

4792 4793 4794 4795 4796 4797 4798
    /*
     * We reuse "save" flag for "dump" here. Then, we can support the same
     * format in "save" and "dump".
     */
    if (driver->dumpImageFormat) {
        compress = qemudSaveCompressionTypeFromString(driver->dumpImageFormat);
        if (compress < 0) {
4799 4800 4801 4802
            qemuReportError(VIR_ERR_OPERATION_FAILED, "%s",
                            _("Invalid dump image format specified in "
                              "configuration file, using raw"));
            return QEMUD_SAVE_FORMAT_RAW;
4803
        }
4804 4805 4806
        if (!qemudCompressProgramAvailable(compress)) {
            qemuReportError(VIR_ERR_OPERATION_FAILED,
                            "%s", _("Compression program for dump image format "
4807 4808 4809
                                    "in configuration file isn't available, "
                                    "using raw"));
            return QEMUD_SAVE_FORMAT_RAW;
4810
        }
4811
    }
4812 4813 4814 4815 4816 4817 4818 4819 4820
    return compress;
}

static int qemudDomainCoreDump(virDomainPtr dom,
                               const char *path,
                               int flags ATTRIBUTE_UNUSED) {
    struct qemud_driver *driver = dom->conn->privateData;
    virDomainObjPtr vm;
    int resume = 0, paused = 0;
H
Hu Tao 已提交
4821
    int ret = -1;
4822 4823 4824
    virDomainEventPtr event = NULL;
    qemuDomainObjPrivatePtr priv;

P
Paolo Bonzini 已提交
4825 4826 4827 4828 4829 4830
    qemuDriverLock(driver);
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);

    if (!vm) {
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
4831 4832
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
P
Paolo Bonzini 已提交
4833 4834
        goto cleanup;
    }
4835
    priv = vm->privateData;
P
Paolo Bonzini 已提交
4836

4837
    if (qemuDomainObjBeginJobWithDriver(driver, vm) < 0)
4838 4839
        goto cleanup;

D
Daniel P. Berrange 已提交
4840
    if (!virDomainObjIsActive(vm)) {
4841 4842
        qemuReportError(VIR_ERR_OPERATION_INVALID,
                        "%s", _("domain is not running"));
4843
        goto endjob;
P
Paolo Bonzini 已提交
4844 4845
    }

O
Osier Yang 已提交
4846 4847
    priv->jobActive = QEMU_JOB_DUMP;

P
Paolo Bonzini 已提交
4848 4849
    /* Migrate will always stop the VM, so the resume condition is
       independent of whether the stop command is issued.  */
P
Paolo Bonzini 已提交
4850 4851 4852
    resume = (vm->state == VIR_DOMAIN_RUNNING);

    /* Pause domain for non-live dump */
P
Paolo Bonzini 已提交
4853
    if (!(flags & VIR_DUMP_LIVE) && vm->state == VIR_DOMAIN_RUNNING) {
H
Hu Tao 已提交
4854
        if (doStopCPUs(driver, vm) < 0)
4855
            goto endjob;
P
Paolo Bonzini 已提交
4856
        paused = 1;
4857 4858 4859 4860 4861 4862

        if (!virDomainObjIsActive(vm)) {
            qemuReportError(VIR_ERR_INTERNAL_ERROR, "%s",
                            _("guest unexpectedly quit"));
            goto endjob;
        }
P
Paolo Bonzini 已提交
4863 4864
    }

H
Hu Tao 已提交
4865
    ret = doCoreDump(driver, vm, path, getCompressionType(driver));
4866 4867 4868 4869
    if (ret < 0)
        goto endjob;

    paused = 1;
4870 4871

endjob:
4872
    if ((ret == 0) && (flags & VIR_DUMP_CRASH)) {
4873
        qemudShutdownVMDaemon(driver, vm, 0);
4874
        qemuDomainStopAudit(vm, "crashed");
4875 4876 4877 4878 4879
        event = virDomainEventNewFromObj(vm,
                                         VIR_DOMAIN_EVENT_STOPPED,
                                         VIR_DOMAIN_EVENT_STOPPED_CRASHED);
    }

P
Paolo Bonzini 已提交
4880 4881 4882
    /* Since the monitor is always attached to a pty for libvirt, it
       will support synchronous operations so we always get here after
       the migration is complete.  */
4883
    else if (resume && paused && virDomainObjIsActive(vm)) {
H
Hu Tao 已提交
4884
        if (doStartCPUs(driver, vm, dom->conn) < 0) {
4885
            if (virGetLastError() == NULL)
4886 4887
                qemuReportError(VIR_ERR_OPERATION_FAILED,
                                "%s", _("resuming after dump failed"));
P
Paolo Bonzini 已提交
4888 4889
        }
    }
4890

4891 4892
    if (qemuDomainObjEndJob(vm) == 0)
        vm = NULL;
4893
    else if ((ret == 0) && (flags & VIR_DUMP_CRASH) && !vm->persistent) {
4894 4895 4896 4897
        virDomainRemoveInactive(&driver->domains,
                                vm);
        vm = NULL;
    }
4898 4899

cleanup:
P
Paolo Bonzini 已提交
4900 4901
    if (vm)
        virDomainObjUnlock(vm);
4902 4903
    if (event)
        qemuDomainEventQueue(driver, event);
4904
    qemuDriverUnlock(driver);
P
Paolo Bonzini 已提交
4905 4906 4907
    return ret;
}

H
Hu Tao 已提交
4908 4909 4910 4911 4912 4913 4914 4915 4916 4917 4918 4919 4920 4921 4922 4923 4924 4925 4926 4927 4928 4929 4930 4931 4932 4933 4934 4935 4936 4937 4938 4939 4940 4941 4942 4943 4944
static void processWatchdogEvent(void *data, void *opaque)
{
    int ret;
    struct watchdogEvent *wdEvent = data;
    struct qemud_driver *driver = opaque;

    switch (wdEvent->action) {
    case VIR_DOMAIN_WATCHDOG_ACTION_DUMP:
        {
            char *dumpfile;
            int i;

            i = virAsprintf(&dumpfile, "%s/%s-%u",
                            driver->autoDumpPath,
                            wdEvent->vm->def->name,
                            (unsigned int)time(NULL));

            qemuDriverLock(driver);
            virDomainObjLock(wdEvent->vm);

            if (qemuDomainObjBeginJobWithDriver(driver, wdEvent->vm) < 0)
                break;

            if (!virDomainObjIsActive(wdEvent->vm)) {
                qemuReportError(VIR_ERR_OPERATION_INVALID,
                                "%s", _("domain is not running"));
                break;
            }

            ret = doCoreDump(driver,
                             wdEvent->vm,
                             dumpfile,
                             getCompressionType(driver));
            if (ret < 0)
                qemuReportError(VIR_ERR_OPERATION_FAILED,
                                "%s", _("Dump failed"));

H
Hu Tao 已提交
4945
            ret = doStartCPUs(driver, wdEvent->vm, NULL);
H
Hu Tao 已提交
4946 4947 4948 4949 4950 4951 4952 4953 4954 4955 4956 4957 4958 4959 4960 4961 4962

            if (ret < 0)
                qemuReportError(VIR_ERR_OPERATION_FAILED,
                                "%s", _("Resuming after dump failed"));

            if (qemuDomainObjEndJob(wdEvent->vm) > 0)
                virDomainObjUnlock(wdEvent->vm);

            qemuDriverUnlock(driver);

            VIR_FREE(dumpfile);
        }
        break;
    }

    VIR_FREE(wdEvent);
}
P
Paolo Bonzini 已提交
4963

4964 4965 4966 4967 4968 4969
static int qemudDomainHotplugVcpus(virDomainObjPtr vm, unsigned int nvcpus)
{
    qemuDomainObjPrivatePtr priv = vm->privateData;
    int i, rc;
    int ret = -1;

4970 4971
    qemuDomainObjEnterMonitor(vm);

4972 4973 4974 4975 4976 4977 4978 4979 4980 4981 4982 4983 4984 4985 4986 4987 4988 4989 4990 4991 4992 4993 4994 4995 4996 4997 4998 4999 5000 5001
    /* We need different branches here, because we want to offline
     * in reverse order to onlining, so any partial fail leaves us in a
     * reasonably sensible state */
    if (nvcpus > vm->def->vcpus) {
        for (i = vm->def->vcpus ; i < nvcpus ; i++) {
            /* Online new CPU */
            rc = qemuMonitorSetCPU(priv->mon, i, 1);
            if (rc == 0)
                goto unsupported;
            if (rc < 0)
                goto cleanup;

            vm->def->vcpus++;
        }
    } else {
        for (i = vm->def->vcpus - 1 ; i >= nvcpus ; i--) {
            /* Offline old CPU */
            rc = qemuMonitorSetCPU(priv->mon, i, 0);
            if (rc == 0)
                goto unsupported;
            if (rc < 0)
                goto cleanup;

            vm->def->vcpus--;
        }
    }

    ret = 0;

cleanup:
5002
    qemuDomainObjExitMonitor(vm);
5003 5004 5005 5006 5007 5008 5009 5010 5011
    return ret;

unsupported:
    qemuReportError(VIR_ERR_INTERNAL_ERROR, "%s",
                    _("cannot change vcpu count of this domain"));
    goto cleanup;
}


5012 5013 5014 5015
static int
qemudDomainSetVcpusFlags(virDomainPtr dom, unsigned int nvcpus,
                         unsigned int flags)
{
5016 5017
    struct qemud_driver *driver = dom->conn->privateData;
    virDomainObjPtr vm;
5018
    virDomainDefPtr persistentDef;
5019 5020
    const char * type;
    int max;
5021
    int ret = -1;
5022

5023 5024 5025 5026 5027 5028 5029 5030 5031 5032 5033 5034 5035 5036 5037 5038
    virCheckFlags(VIR_DOMAIN_VCPU_LIVE |
                  VIR_DOMAIN_VCPU_CONFIG |
                  VIR_DOMAIN_VCPU_MAXIMUM, -1);

    /* At least one of LIVE or CONFIG must be set.  MAXIMUM cannot be
     * mixed with LIVE.  */
    if ((flags & (VIR_DOMAIN_VCPU_LIVE | VIR_DOMAIN_VCPU_CONFIG)) == 0 ||
        (flags & (VIR_DOMAIN_VCPU_MAXIMUM | VIR_DOMAIN_VCPU_LIVE)) ==
         (VIR_DOMAIN_VCPU_MAXIMUM | VIR_DOMAIN_VCPU_LIVE)) {
        qemuReportError(VIR_ERR_INVALID_ARG,
                        _("invalid flag combination: (0x%x)"), flags);
        return -1;
    }
    if (!nvcpus || (unsigned short) nvcpus != nvcpus) {
        qemuReportError(VIR_ERR_INVALID_ARG,
                        _("argument out of range: %d"), nvcpus);
5039 5040 5041
        return -1;
    }

5042
    qemuDriverLock(driver);
5043
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
5044 5045
    qemuDriverUnlock(driver);

5046
    if (!vm) {
5047 5048
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
5049 5050
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
5051
        goto cleanup;
5052 5053
    }

5054 5055 5056
    if (qemuDomainObjBeginJob(vm) < 0)
        goto cleanup;

5057
    if (!virDomainObjIsActive(vm) && (flags & VIR_DOMAIN_VCPU_LIVE)) {
5058 5059
        qemuReportError(VIR_ERR_OPERATION_INVALID,
                         "%s", _("domain is not running"));
5060
        goto endjob;
5061 5062
    }

5063 5064 5065 5066 5067 5068
    if (!vm->persistent && (flags & VIR_DOMAIN_VCPU_CONFIG)) {
        qemuReportError(VIR_ERR_OPERATION_INVALID, "%s",
                        _("cannot change persistent config of a transient domain"));
        goto endjob;
    }

5069 5070 5071 5072 5073 5074 5075 5076 5077 5078 5079 5080 5081
    if (!(type = virDomainVirtTypeToString(vm->def->virtType))) {
        qemuReportError(VIR_ERR_INTERNAL_ERROR,
                        _("unknown virt type in domain definition '%d'"),
                        vm->def->virtType);
        goto endjob;
    }

    if ((max = qemudGetMaxVCPUs(NULL, type)) < 0) {
        qemuReportError(VIR_ERR_INTERNAL_ERROR, "%s",
                        _("could not determine max vcpus for the domain"));
        goto endjob;
    }

C
Cole Robinson 已提交
5082
    if (!(flags & VIR_DOMAIN_VCPU_MAXIMUM) && vm->def->maxvcpus < max) {
5083 5084 5085
        max = vm->def->maxvcpus;
    }

5086 5087 5088 5089 5090 5091 5092
    if (nvcpus > max) {
        qemuReportError(VIR_ERR_INVALID_ARG,
                        _("requested vcpus is greater than max allowable"
                          " vcpus for the domain: %d > %d"), nvcpus, max);
        goto endjob;
    }

5093 5094 5095
    if (!(persistentDef = virDomainObjGetPersistentDef(driver->caps, vm)))
        goto endjob;

5096 5097
    switch (flags) {
    case VIR_DOMAIN_VCPU_MAXIMUM | VIR_DOMAIN_VCPU_CONFIG:
5098 5099 5100
        persistentDef->maxvcpus = nvcpus;
        if (nvcpus < persistentDef->vcpus)
            persistentDef->vcpus = nvcpus;
5101 5102 5103 5104
        ret = 0;
        break;

    case VIR_DOMAIN_VCPU_CONFIG:
5105
        persistentDef->vcpus = nvcpus;
5106 5107 5108 5109 5110 5111 5112 5113 5114
        ret = 0;
        break;

    case VIR_DOMAIN_VCPU_LIVE:
        ret = qemudDomainHotplugVcpus(vm, nvcpus);
        break;

    case VIR_DOMAIN_VCPU_LIVE | VIR_DOMAIN_VCPU_CONFIG:
        ret = qemudDomainHotplugVcpus(vm, nvcpus);
5115 5116 5117
        if (ret == 0) {
            persistentDef->vcpus = nvcpus;
        }
5118 5119
        break;
    }
5120

5121 5122 5123 5124
    /* Save the persistent config to disk */
    if (flags & VIR_DOMAIN_VCPU_CONFIG)
        ret = virDomainSaveConfig(driver->configDir, persistentDef);

5125 5126 5127
endjob:
    if (qemuDomainObjEndJob(vm) == 0)
        vm = NULL;
5128

5129
cleanup:
5130 5131
    if (vm)
        virDomainObjUnlock(vm);
5132
    return ret;
5133 5134
}

5135 5136 5137 5138 5139 5140
static int
qemudDomainSetVcpus(virDomainPtr dom, unsigned int nvcpus)
{
    return qemudDomainSetVcpusFlags(dom, nvcpus, VIR_DOMAIN_VCPU_LIVE);
}

5141 5142 5143 5144 5145 5146

static int
qemudDomainPinVcpu(virDomainPtr dom,
                   unsigned int vcpu,
                   unsigned char *cpumap,
                   int maplen) {
5147 5148
    struct qemud_driver *driver = dom->conn->privateData;
    virDomainObjPtr vm;
5149
    int maxcpu, hostcpus;
5150
    virNodeInfo nodeinfo;
5151
    int ret = -1;
5152
    qemuDomainObjPrivatePtr priv;
5153

5154
    qemuDriverLock(driver);
5155
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
5156 5157
    qemuDriverUnlock(driver);

5158 5159 5160
    if (!vm) {
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
5161 5162
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
5163 5164 5165
        goto cleanup;
    }

D
Daniel P. Berrange 已提交
5166
    if (!virDomainObjIsActive(vm)) {
5167 5168
        qemuReportError(VIR_ERR_OPERATION_INVALID,
                        "%s",_("cannot pin vcpus on an inactive domain"));
5169
        goto cleanup;
5170 5171
    }

5172 5173 5174
    priv = vm->privateData;

    if (vcpu > (priv->nvcpupids-1)) {
5175 5176 5177
        qemuReportError(VIR_ERR_INVALID_ARG,
                        _("vcpu number out of range %d > %d"),
                        vcpu, priv->nvcpupids);
5178
        goto cleanup;
5179 5180
    }

5181
    if (nodeGetInfo(dom->conn, &nodeinfo) < 0)
5182
        goto cleanup;
5183

5184
    hostcpus = VIR_NODEINFO_MAXCPUS(nodeinfo);
5185
    maxcpu = maplen * 8;
5186 5187
    if (maxcpu > hostcpus)
        maxcpu = hostcpus;
5188

5189 5190
    if (priv->vcpupids != NULL) {
        if (virProcessInfoSetAffinity(priv->vcpupids[vcpu],
5191
                                      cpumap, maplen, maxcpu) < 0)
5192
            goto cleanup;
5193
    } else {
5194 5195
        qemuReportError(VIR_ERR_NO_SUPPORT,
                        "%s", _("cpu affinity is not supported"));
5196
        goto cleanup;
5197
    }
5198
    ret = 0;
5199

5200
cleanup:
5201 5202
    if (vm)
        virDomainObjUnlock(vm);
5203
    return ret;
5204 5205 5206 5207 5208 5209 5210 5211
}

static int
qemudDomainGetVcpus(virDomainPtr dom,
                    virVcpuInfoPtr info,
                    int maxinfo,
                    unsigned char *cpumaps,
                    int maplen) {
5212 5213
    struct qemud_driver *driver = dom->conn->privateData;
    virDomainObjPtr vm;
5214
    virNodeInfo nodeinfo;
5215
    int i, v, maxcpu, hostcpus;
5216
    int ret = -1;
5217
    qemuDomainObjPrivatePtr priv;
5218

5219
    qemuDriverLock(driver);
5220
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
5221 5222
    qemuDriverUnlock(driver);

5223 5224 5225
    if (!vm) {
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
5226 5227
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
5228 5229 5230
        goto cleanup;
    }

D
Daniel P. Berrange 已提交
5231
    if (!virDomainObjIsActive(vm)) {
5232 5233 5234
        qemuReportError(VIR_ERR_OPERATION_INVALID,
                        "%s",
                        _("cannot list vcpu pinning for an inactive domain"));
5235
        goto cleanup;
5236 5237
    }

5238 5239
    priv = vm->privateData;

5240
    if (nodeGetInfo(dom->conn, &nodeinfo) < 0)
5241
        goto cleanup;
5242

5243
    hostcpus = VIR_NODEINFO_MAXCPUS(nodeinfo);
5244
    maxcpu = maplen * 8;
5245 5246
    if (maxcpu > hostcpus)
        maxcpu = hostcpus;
5247 5248

    /* Clamp to actual number of vcpus */
5249 5250
    if (maxinfo > priv->nvcpupids)
        maxinfo = priv->nvcpupids;
5251

5252 5253 5254 5255 5256 5257
    if (maxinfo >= 1) {
        if (info != NULL) {
            memset(info, 0, sizeof(*info) * maxinfo);
            for (i = 0 ; i < maxinfo ; i++) {
                info[i].number = i;
                info[i].state = VIR_VCPU_RUNNING;
5258

5259
                if (priv->vcpupids != NULL &&
5260 5261 5262
                    qemudGetProcessInfo(&(info[i].cpuTime),
                                        &(info[i].cpu),
                                        vm->pid,
5263
                                        priv->vcpupids[i]) < 0) {
5264
                    virReportSystemError(errno, "%s",
5265 5266 5267
                                         _("cannot get vCPU placement & pCPU time"));
                    goto cleanup;
                }
5268
            }
5269 5270
        }

5271 5272
        if (cpumaps != NULL) {
            memset(cpumaps, 0, maplen * maxinfo);
5273
            if (priv->vcpupids != NULL) {
5274 5275 5276
                for (v = 0 ; v < maxinfo ; v++) {
                    unsigned char *cpumap = VIR_GET_CPUMAP(cpumaps, maplen, v);

5277
                    if (virProcessInfoGetAffinity(priv->vcpupids[v],
5278
                                                  cpumap, maplen, maxcpu) < 0)
5279
                        goto cleanup;
5280
                }
5281
            } else {
5282 5283
                qemuReportError(VIR_ERR_NO_SUPPORT,
                                "%s", _("cpu affinity is not available"));
5284
                goto cleanup;
5285 5286 5287
            }
        }
    }
5288
    ret = maxinfo;
5289

5290
cleanup:
5291 5292
    if (vm)
        virDomainObjUnlock(vm);
5293
    return ret;
5294 5295 5296
}


5297 5298 5299
static int
qemudDomainGetVcpusFlags(virDomainPtr dom, unsigned int flags)
{
5300 5301
    struct qemud_driver *driver = dom->conn->privateData;
    virDomainObjPtr vm;
5302
    virDomainDefPtr def;
5303
    int ret = -1;
5304

5305 5306 5307 5308 5309 5310 5311 5312
    virCheckFlags(VIR_DOMAIN_VCPU_LIVE |
                  VIR_DOMAIN_VCPU_CONFIG |
                  VIR_DOMAIN_VCPU_MAXIMUM, -1);

    /* Exactly one of LIVE or CONFIG must be set.  */
    if (!(flags & VIR_DOMAIN_VCPU_LIVE) == !(flags & VIR_DOMAIN_VCPU_CONFIG)) {
        qemuReportError(VIR_ERR_INVALID_ARG,
                        _("invalid flag combination: (0x%x)"), flags);
5313 5314 5315
        return -1;
    }

5316
    qemuDriverLock(driver);
5317
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
5318 5319
    qemuDriverUnlock(driver);

5320
    if (!vm) {
5321 5322
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
5323 5324
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
5325
        goto cleanup;
5326 5327
    }

5328 5329 5330 5331 5332 5333 5334 5335 5336
    if (flags & VIR_DOMAIN_VCPU_LIVE) {
        if (!virDomainObjIsActive(vm)) {
            qemuReportError(VIR_ERR_OPERATION_INVALID, "%s",
                            _("domain not active"));
            goto cleanup;
        }
        def = vm->def;
    } else {
        def = vm->newDef ? vm->newDef : vm->def;
5337 5338
    }

5339
    ret = (flags & VIR_DOMAIN_VCPU_MAXIMUM) ? def->maxvcpus : def->vcpus;
5340

5341
cleanup:
5342 5343
    if (vm)
        virDomainObjUnlock(vm);
5344 5345 5346
    return ret;
}

5347 5348 5349 5350 5351 5352 5353
static int
qemudDomainGetMaxVcpus(virDomainPtr dom)
{
    return qemudDomainGetVcpusFlags(dom, (VIR_DOMAIN_VCPU_LIVE |
                                          VIR_DOMAIN_VCPU_MAXIMUM));
}

5354 5355 5356 5357 5358 5359 5360 5361 5362
static int qemudDomainGetSecurityLabel(virDomainPtr dom, virSecurityLabelPtr seclabel)
{
    struct qemud_driver *driver = (struct qemud_driver *)dom->conn->privateData;
    virDomainObjPtr vm;
    int ret = -1;

    qemuDriverLock(driver);
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);

5363 5364
    memset(seclabel, 0, sizeof(*seclabel));

5365 5366 5367
    if (!vm) {
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
5368 5369
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
5370 5371 5372
        goto cleanup;
    }

5373
    if (!virDomainVirtTypeToString(vm->def->virtType)) {
5374 5375 5376
        qemuReportError(VIR_ERR_INTERNAL_ERROR,
                        _("unknown virt type in domain definition '%d'"),
                        vm->def->virtType);
5377 5378 5379 5380 5381 5382 5383 5384 5385 5386 5387 5388 5389 5390 5391 5392 5393
        goto cleanup;
    }

    /*
     * Theoretically, the pid can be replaced during this operation and
     * return the label of a different process.  If atomicity is needed,
     * further validation will be required.
     *
     * Comment from Dan Berrange:
     *
     *   Well the PID as stored in the virDomainObjPtr can't be changed
     *   because you've got a locked object.  The OS level PID could have
     *   exited, though and in extreme circumstances have cycled through all
     *   PIDs back to ours. We could sanity check that our PID still exists
     *   after reading the label, by checking that our FD connecting to the
     *   QEMU monitor hasn't seen SIGHUP/ERR on poll().
     */
D
Daniel P. Berrange 已提交
5394
    if (virDomainObjIsActive(vm)) {
5395 5396
        if (virSecurityManagerGetProcessLabel(driver->securityManager,
                                              vm, seclabel) < 0) {
5397 5398 5399
            qemuReportError(VIR_ERR_INTERNAL_ERROR,
                            "%s", _("Failed to get security label"));
            goto cleanup;
5400 5401 5402 5403 5404 5405 5406 5407
        }
    }

    ret = 0;

cleanup:
    if (vm)
        virDomainObjUnlock(vm);
5408
    qemuDriverUnlock(driver);
5409 5410 5411
    return ret;
}

5412 5413
static int qemudNodeGetSecurityModel(virConnectPtr conn,
                                     virSecurityModelPtr secmodel)
5414 5415 5416
{
    struct qemud_driver *driver = (struct qemud_driver *)conn->privateData;
    char *p;
5417
    int ret = 0;
5418

5419
    qemuDriverLock(driver);
5420 5421 5422 5423 5424
    memset(secmodel, 0, sizeof(*secmodel));

    /* NULL indicates no driver, which we treat as
     * success, but simply return no data in *secmodel */
    if (driver->caps->host.secModel.model == NULL)
5425
        goto cleanup;
5426

5427 5428
    p = driver->caps->host.secModel.model;
    if (strlen(p) >= VIR_SECURITY_MODEL_BUFLEN-1) {
5429 5430 5431
        qemuReportError(VIR_ERR_INTERNAL_ERROR,
                        _("security model string exceeds max %d bytes"),
                        VIR_SECURITY_MODEL_BUFLEN-1);
5432 5433
        ret = -1;
        goto cleanup;
5434 5435 5436 5437 5438
    }
    strcpy(secmodel->model, p);

    p = driver->caps->host.secModel.doi;
    if (strlen(p) >= VIR_SECURITY_DOI_BUFLEN-1) {
5439 5440 5441
        qemuReportError(VIR_ERR_INTERNAL_ERROR,
                        _("security DOI string exceeds max %d bytes"),
                        VIR_SECURITY_DOI_BUFLEN-1);
5442 5443
        ret = -1;
        goto cleanup;
5444 5445
    }
    strcpy(secmodel->doi, p);
5446 5447 5448 5449

cleanup:
    qemuDriverUnlock(driver);
    return ret;
5450 5451
}

5452 5453 5454 5455 5456 5457
/* qemudOpenAsUID() - pipe/fork/setuid/open a file, and return the
   pipe fd to caller, so that it can read from the file. Also return
   the pid of the child process, so the caller can wait for it to exit
   after it's finished reading (to avoid a zombie, if nothing
   else). */

5458 5459 5460
static int
qemudOpenAsUID(const char *path, uid_t uid, gid_t gid, pid_t *child_pid)
{
5461 5462 5463 5464 5465 5466 5467 5468 5469 5470 5471 5472 5473 5474 5475 5476 5477 5478 5479 5480 5481 5482 5483 5484 5485 5486 5487
    int pipefd[2];
    int fd = -1;

    *child_pid = -1;

    if (pipe(pipefd) < 0) {
        virReportSystemError(errno,
                             _("failed to create pipe to read '%s'"),
                             path);
        pipefd[0] = pipefd[1] = -1;
        goto parent_cleanup;
    }

    int forkRet = virFork(child_pid);

    if (*child_pid < 0) {
        virReportSystemError(errno,
                             _("failed to fork child to read '%s'"),
                             path);
        goto parent_cleanup;
    }

    if (*child_pid > 0) {

        /* parent */

        /* parent doesn't need the write side of the pipe */
5488
        VIR_FORCE_CLOSE(pipefd[1]);
5489 5490 5491 5492 5493 5494 5495 5496 5497 5498 5499

        if (forkRet < 0) {
            virReportSystemError(errno,
                                 _("failed in parent after forking child to read '%s'"),
                                 path);
            goto parent_cleanup;
        }
        /* caller gets the read side of the pipe */
        fd = pipefd[0];
        pipefd[0] = -1;
parent_cleanup:
5500 5501
        VIR_FORCE_CLOSE(pipefd[0]);
        VIR_FORCE_CLOSE(pipefd[1]);
5502 5503 5504 5505 5506 5507 5508 5509 5510 5511 5512 5513 5514 5515 5516 5517 5518 5519 5520 5521 5522 5523 5524 5525
        if ((fd < 0) && (*child_pid > 0)) {
            /* a child process was started and subsequently an error
               occurred in the parent, so we need to wait for it to
               exit, but its status is inconsequential. */
            while ((waitpid(*child_pid, NULL, 0) == -1)
                   && (errno == EINTR)) {
                /* empty */
            }
            *child_pid = -1;
        }
        return fd;
    }

    /* child */

    /* setuid to the qemu user, then open the file, read it,
       and stuff it into the pipe for the parent process to
       read */
    int exit_code;
    char *buf = NULL;
    size_t bufsize = 1024 * 1024;
    int bytesread;

    /* child doesn't need the read side of the pipe */
5526
    VIR_FORCE_CLOSE(pipefd[0]);
5527 5528 5529 5530 5531 5532 5533 5534 5535

    if (forkRet < 0) {
        exit_code = errno;
        virReportSystemError(errno,
                             _("failed in child after forking to read '%s'"),
                             path);
        goto child_cleanup;
    }

5536 5537 5538
    if (virSetUIDGID(uid, gid) < 0) {
       exit_code = errno;
       goto child_cleanup;
5539 5540
    }

5541 5542 5543 5544 5545 5546 5547 5548
    if ((fd = open(path, O_RDONLY)) < 0) {
        exit_code = errno;
        virReportSystemError(errno,
                             _("cannot open '%s' as uid %d"),
                             path, uid);
        goto child_cleanup;
    }

5549 5550 5551 5552 5553 5554
    if (VIR_ALLOC_N(buf, bufsize) < 0) {
        exit_code = ENOMEM;
        virReportOOMError();
        goto child_cleanup;
    }

5555 5556 5557 5558 5559 5560 5561 5562 5563 5564 5565 5566 5567 5568 5569 5570 5571 5572 5573 5574
    /* read from fd and write to pipefd[1] until EOF */
    do {
        if ((bytesread = saferead(fd, buf, bufsize)) < 0) {
            exit_code = errno;
            virReportSystemError(errno,
                                 _("child failed reading from '%s'"),
                                 path);
            goto child_cleanup;
        }
        if (safewrite(pipefd[1], buf, bytesread) != bytesread) {
            exit_code = errno;
            virReportSystemError(errno, "%s",
                                 _("child failed writing to pipe"));
            goto child_cleanup;
        }
    } while (bytesread > 0);
    exit_code = 0;

child_cleanup:
    VIR_FREE(buf);
5575 5576
    VIR_FORCE_CLOSE(fd);
    VIR_FORCE_CLOSE(pipefd[1]);
5577 5578 5579
    _exit(exit_code);
}

J
Jiri Denemark 已提交
5580 5581 5582 5583
static int qemudDomainSaveImageClose(int fd, pid_t read_pid, int *status)
{
    int ret = 0;

5584 5585 5586 5587
    if (VIR_CLOSE(fd) < 0) {
        virReportSystemError(errno, "%s",
                             _("cannot close file"));
    }
J
Jiri Denemark 已提交
5588 5589 5590 5591 5592 5593 5594 5595 5596 5597 5598 5599 5600 5601 5602 5603

    if (read_pid != -1) {
        /* reap the process that read the file */
        while ((ret = waitpid(read_pid, status, 0)) == -1
               && errno == EINTR) {
            /* empty */
        }
    } else if (status) {
        *status = 0;
    }

    return ret;
}

static int ATTRIBUTE_NONNULL(3) ATTRIBUTE_NONNULL(4) ATTRIBUTE_NONNULL(5)
qemudDomainSaveImageOpen(struct qemud_driver *driver,
5604 5605 5606 5607
                         const char *path,
                         virDomainDefPtr *ret_def,
                         struct qemud_save_header *ret_header,
                         pid_t *ret_read_pid)
J
Jiri Denemark 已提交
5608 5609
{
    int fd;
5610
    pid_t read_pid = -1;
5611
    struct qemud_save_header header;
J
Jiri Denemark 已提交
5612 5613
    char *xml = NULL;
    virDomainDefPtr def = NULL;
5614 5615

    if ((fd = open(path, O_RDONLY)) < 0) {
5616 5617 5618
        if ((driver->user == 0) || (getuid() != 0)) {
            qemuReportError(VIR_ERR_OPERATION_FAILED,
                            "%s", _("cannot read domain image"));
J
Jiri Denemark 已提交
5619
            goto error;
5620 5621 5622 5623 5624 5625
        }

        /* Opening as root failed, but qemu runs as a different user
           that might have better luck. Create a pipe, then fork a
           child process to run as the qemu user, which will hopefully
           have the necessary authority to read the file. */
5626 5627
        if ((fd = qemudOpenAsUID(path,
                                 driver->user, driver->group, &read_pid)) < 0) {
5628
            /* error already reported */
J
Jiri Denemark 已提交
5629
            goto error;
5630
        }
5631 5632 5633
    }

    if (saferead(fd, &header, sizeof(header)) != sizeof(header)) {
5634 5635
        qemuReportError(VIR_ERR_OPERATION_FAILED,
                        "%s", _("failed to read qemu header"));
J
Jiri Denemark 已提交
5636
        goto error;
5637 5638 5639
    }

    if (memcmp(header.magic, QEMUD_SAVE_MAGIC, sizeof(header.magic)) != 0) {
5640 5641
        qemuReportError(VIR_ERR_OPERATION_FAILED,
                        "%s", _("image magic is incorrect"));
J
Jiri Denemark 已提交
5642
        goto error;
5643 5644 5645
    }

    if (header.version > QEMUD_SAVE_VERSION) {
5646 5647 5648
        qemuReportError(VIR_ERR_OPERATION_FAILED,
                        _("image version is not supported (%d > %d)"),
                        header.version, QEMUD_SAVE_VERSION);
J
Jiri Denemark 已提交
5649
        goto error;
5650 5651
    }

5652 5653 5654
    if (header.xml_len <= 0) {
        qemuReportError(VIR_ERR_OPERATION_FAILED,
                        _("invalid XML length: %d"), header.xml_len);
J
Jiri Denemark 已提交
5655
        goto error;
5656 5657
    }

5658 5659
    if (VIR_ALLOC_N(xml, header.xml_len) < 0) {
        virReportOOMError();
J
Jiri Denemark 已提交
5660
        goto error;
5661 5662 5663
    }

    if (saferead(fd, xml, header.xml_len) != header.xml_len) {
5664 5665
        qemuReportError(VIR_ERR_OPERATION_FAILED,
                        "%s", _("failed to read XML"));
J
Jiri Denemark 已提交
5666
        goto error;
5667 5668 5669
    }

    /* Create a domain from this XML */
5670
    if (!(def = virDomainDefParseString(driver->caps, xml,
5671
                                        VIR_DOMAIN_XML_INACTIVE))) {
5672 5673
        qemuReportError(VIR_ERR_OPERATION_FAILED,
                        "%s", _("failed to parse XML"));
J
Jiri Denemark 已提交
5674
        goto error;
5675 5676
    }

J
Jiri Denemark 已提交
5677
    VIR_FREE(xml);
5678

J
Jiri Denemark 已提交
5679 5680 5681
    *ret_def = def;
    *ret_header = header;
    *ret_read_pid = read_pid;
5682

J
Jiri Denemark 已提交
5683
    return fd;
5684

J
Jiri Denemark 已提交
5685 5686 5687 5688 5689 5690 5691 5692 5693 5694 5695 5696 5697 5698 5699 5700 5701 5702 5703 5704 5705 5706 5707 5708 5709 5710
error:
    virDomainDefFree(def);
    VIR_FREE(xml);
    qemudDomainSaveImageClose(fd, read_pid, NULL);

    return -1;
}

static int ATTRIBUTE_NONNULL(6)
qemudDomainSaveImageStartVM(virConnectPtr conn,
                            struct qemud_driver *driver,
                            virDomainObjPtr vm,
                            int fd,
                            pid_t read_pid,
                            const struct qemud_save_header *header,
                            const char *path)
{
    int ret = -1;
    virDomainEventPtr event;
    int intermediatefd = -1;
    pid_t intermediate_pid = -1;
    int childstat;
    int wait_ret;
    int status;

    if (header->version == 2) {
5711
        const char *intermediate_argv[3] = { NULL, "-dc", NULL };
J
Jiri Denemark 已提交
5712
        const char *prog = qemudSaveCompressionTypeToString(header->compressed);
5713
        if (prog == NULL) {
5714 5715
            qemuReportError(VIR_ERR_OPERATION_FAILED,
                            _("Invalid compressed save format %d"),
J
Jiri Denemark 已提交
5716 5717
                            header->compressed);
            goto out;
5718
        }
5719

J
Jiri Denemark 已提交
5720
        if (header->compressed != QEMUD_SAVE_FORMAT_RAW) {
5721
            intermediate_argv[0] = prog;
5722 5723
            intermediatefd = fd;
            fd = -1;
5724
            if (virExec(intermediate_argv, NULL, NULL,
5725
                        &intermediate_pid, intermediatefd, &fd, NULL, 0) < 0) {
5726 5727 5728
                qemuReportError(VIR_ERR_INTERNAL_ERROR,
                                _("Failed to start decompression binary %s"),
                                intermediate_argv[0]);
J
Jiri Denemark 已提交
5729
                goto out;
5730 5731 5732
            }
        }
    }
J
Jiri Denemark 已提交
5733

5734
    /* Set the migration source and start it up. */
5735 5736
    ret = qemudStartVMDaemon(conn, driver, vm, "stdio", true, fd, path,
                             VIR_VM_OP_RESTORE);
J
Jiri Denemark 已提交
5737

5738 5739 5740
    if (intermediate_pid != -1) {
        /* Wait for intermediate process to exit */
        while (waitpid(intermediate_pid, &childstat, 0) == -1 &&
J
Jiri Denemark 已提交
5741 5742 5743
               errno == EINTR) {
            /* empty */
        }
5744
    }
5745
    VIR_FORCE_CLOSE(intermediatefd);
J
Jiri Denemark 已提交
5746 5747

    wait_ret = qemudDomainSaveImageClose(fd, read_pid, &status);
5748
    fd = -1;
5749 5750 5751 5752 5753 5754 5755 5756 5757 5758 5759 5760 5761 5762 5763 5764 5765 5766 5767 5768 5769
    if (read_pid != -1) {
        if (wait_ret == -1) {
            virReportSystemError(errno,
                                 _("failed to wait for process reading '%s'"),
                                 path);
            ret = -1;
        } else if (!WIFEXITED(status)) {
            qemuReportError(VIR_ERR_OPERATION_FAILED,
                            _("child process exited abnormally reading '%s'"),
                            path);
            ret = -1;
        } else {
            int exit_status = WEXITSTATUS(status);
            if (exit_status != 0) {
                virReportSystemError(exit_status,
                                     _("child process returned error reading '%s'"),
                                     path);
                ret = -1;
            }
        }
    }
J
Jiri Denemark 已提交
5770

5771 5772
    if (ret < 0) {
        qemuDomainStartAudit(vm, "restored", false);
J
Jiri Denemark 已提交
5773
        goto out;
5774
    }
5775

5776 5777 5778
    event = virDomainEventNewFromObj(vm,
                                     VIR_DOMAIN_EVENT_STARTED,
                                     VIR_DOMAIN_EVENT_STARTED_RESTORED);
5779
    qemuDomainStartAudit(vm, "restored", true);
J
Jiri Denemark 已提交
5780 5781 5782
    if (event)
        qemuDomainEventQueue(driver, event);

5783

5784
    /* If it was running before, resume it now. */
J
Jiri Denemark 已提交
5785
    if (header->was_running) {
H
Hu Tao 已提交
5786
        if (doStartCPUs(driver, vm, conn) < 0) {
5787
            if (virGetLastError() == NULL)
5788 5789
                qemuReportError(VIR_ERR_OPERATION_FAILED,
                                "%s", _("failed to resume domain"));
J
Jiri Denemark 已提交
5790
            goto out;
5791
        }
5792 5793
        if (virDomainSaveStatus(driver->caps, driver->stateDir, vm) < 0) {
            VIR_WARN("Failed to save status on vm %s", vm->def->name);
J
Jiri Denemark 已提交
5794
            goto out;
5795
        }
5796
    }
J
Jiri Denemark 已提交
5797

5798
    ret = 0;
5799

J
Jiri Denemark 已提交
5800
out:
5801 5802
    if (virSecurityManagerRestoreSavedStateLabel(driver->securityManager,
                                                 vm, path) < 0)
5803 5804
        VIR_WARN("failed to restore save state label on %s", path);

J
Jiri Denemark 已提交
5805 5806 5807 5808 5809 5810 5811 5812 5813 5814 5815 5816 5817 5818 5819 5820 5821 5822 5823 5824 5825 5826 5827 5828 5829
    return ret;
}

static int qemudDomainRestore(virConnectPtr conn,
                              const char *path) {
    struct qemud_driver *driver = conn->privateData;
    virDomainDefPtr def = NULL;
    virDomainObjPtr vm = NULL;
    int fd = -1;
    pid_t read_pid = -1;
    int ret = -1;
    struct qemud_save_header header;

    qemuDriverLock(driver);

    fd = qemudDomainSaveImageOpen(driver, path, &def, &header, &read_pid);
    if (fd < 0)
        goto cleanup;

    if (virDomainObjIsDuplicate(&driver->domains, def, 1) < 0)
        goto cleanup;

    if (!(vm = virDomainAssignDef(driver->caps,
                                  &driver->domains,
                                  def, true))) {
5830
        /* virDomainAssignDef already set the error */
J
Jiri Denemark 已提交
5831 5832 5833 5834 5835 5836 5837 5838 5839 5840 5841
        goto cleanup;
    }
    def = NULL;

    if (qemuDomainObjBeginJobWithDriver(driver, vm) < 0)
        goto cleanup;

    ret = qemudDomainSaveImageStartVM(conn, driver, vm, fd,
                                      read_pid, &header, path);

    if (qemuDomainObjEndJob(vm) == 0)
5842
        vm = NULL;
J
Jiri Denemark 已提交
5843 5844 5845 5846
    else if (ret < 0 && !vm->persistent) {
        virDomainRemoveInactive(&driver->domains, vm);
        vm = NULL;
    }
5847

5848 5849
cleanup:
    virDomainDefFree(def);
J
Jiri Denemark 已提交
5850
    qemudDomainSaveImageClose(fd, read_pid, NULL);
5851 5852 5853
    if (vm)
        virDomainObjUnlock(vm);
    qemuDriverUnlock(driver);
5854
    return ret;
D
Daniel P. Berrange 已提交
5855 5856
}

J
Jiri Denemark 已提交
5857 5858 5859 5860 5861 5862 5863 5864 5865 5866 5867 5868 5869 5870 5871 5872 5873 5874 5875 5876 5877 5878 5879 5880 5881 5882 5883 5884 5885 5886 5887 5888 5889 5890 5891 5892 5893 5894 5895 5896 5897
static int qemudDomainObjRestore(virConnectPtr conn,
                                 struct qemud_driver *driver,
                                 virDomainObjPtr vm,
                                 const char *path)
{
    virDomainDefPtr def = NULL;
    int fd = -1;
    pid_t read_pid = -1;
    int ret = -1;
    struct qemud_save_header header;

    fd = qemudDomainSaveImageOpen(driver, path, &def, &header, &read_pid);
    if (fd < 0)
        goto cleanup;

    if (STRNEQ(vm->def->name, def->name) ||
        memcmp(vm->def->uuid, def->uuid, VIR_UUID_BUFLEN)) {
        char vm_uuidstr[VIR_UUID_STRING_BUFLEN];
        char def_uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(vm->def->uuid, vm_uuidstr);
        virUUIDFormat(def->uuid, def_uuidstr);
        qemuReportError(VIR_ERR_OPERATION_FAILED,
                        _("cannot restore domain '%s' uuid %s from a file"
                          " which belongs to domain '%s' uuid %s"),
                        vm->def->name, vm_uuidstr,
                        def->name, def_uuidstr);
        goto cleanup;
    }

    virDomainObjAssignDef(vm, def, true);
    def = NULL;

    ret = qemudDomainSaveImageStartVM(conn, driver, vm, fd,
                                      read_pid, &header, path);

cleanup:
    virDomainDefFree(def);
    qemudDomainSaveImageClose(fd, read_pid, NULL);
    return ret;
}

D
Daniel P. Berrange 已提交
5898

5899 5900 5901 5902 5903 5904 5905 5906 5907 5908 5909 5910 5911 5912 5913 5914 5915 5916 5917 5918 5919 5920 5921 5922 5923 5924 5925 5926 5927 5928 5929 5930 5931 5932 5933 5934 5935 5936
static char *qemudVMDumpXML(struct qemud_driver *driver,
                            virDomainObjPtr vm,
                            int flags)
{
    char *ret = NULL;
    virCPUDefPtr cpu = NULL;
    virDomainDefPtr def;
    virCPUDefPtr def_cpu;

    if ((flags & VIR_DOMAIN_XML_INACTIVE) && vm->newDef)
        def = vm->newDef;
    else
        def = vm->def;
    def_cpu = def->cpu;

    /* Update guest CPU requirements according to host CPU */
    if ((flags & VIR_DOMAIN_XML_UPDATE_CPU) && def_cpu && def_cpu->model) {
        if (!driver->caps || !driver->caps->host.cpu) {
            qemuReportError(VIR_ERR_OPERATION_FAILED,
                            "%s", _("cannot get host CPU capabilities"));
            goto cleanup;
        }

        if (!(cpu = virCPUDefCopy(def_cpu))
            || cpuUpdate(cpu, driver->caps->host.cpu))
            goto cleanup;
        def->cpu = cpu;
    }

    ret = virDomainDefFormat(def, flags);

cleanup:
    def->cpu = def_cpu;
    virCPUDefFree(cpu);
    return ret;
}


5937
static char *qemudDomainDumpXML(virDomainPtr dom,
5938
                                int flags) {
5939 5940 5941
    struct qemud_driver *driver = dom->conn->privateData;
    virDomainObjPtr vm;
    char *ret = NULL;
5942 5943
    unsigned long balloon;
    int err;
5944

5945
    qemuDriverLock(driver);
5946
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
5947

D
Daniel P. Berrange 已提交
5948
    if (!vm) {
5949 5950
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
5951 5952
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
5953
        goto cleanup;
D
Daniel P. Berrange 已提交
5954 5955
    }

5956 5957 5958 5959
    /* Refresh current memory based on balloon info if supported */
    if ((vm->def->memballoon != NULL) &&
        (vm->def->memballoon->model != VIR_DOMAIN_MEMBALLOON_MODEL_NONE) &&
        (virDomainObjIsActive(vm))) {
5960
        qemuDomainObjPrivatePtr priv = vm->privateData;
5961 5962 5963
        /* Don't delay if someone's using the monitor, just use
         * existing most recent data instead */
        if (!priv->jobActive) {
5964
            if (qemuDomainObjBeginJobWithDriver(driver, vm) < 0)
5965 5966
                goto cleanup;

5967
            qemuDomainObjEnterMonitorWithDriver(driver, vm);
5968
            err = qemuMonitorGetBalloonInfo(priv->mon, &balloon);
5969
            qemuDomainObjExitMonitorWithDriver(driver, vm);
5970 5971 5972 5973
            if (qemuDomainObjEndJob(vm) == 0) {
                vm = NULL;
                goto cleanup;
            }
5974 5975 5976
            if (err < 0)
                goto cleanup;
            if (err > 0)
5977
                vm->def->mem.cur_balloon = balloon;
5978 5979
            /* err == 0 indicates no balloon support, so ignore it */
        }
5980
    }
5981

5982
    ret = qemudVMDumpXML(driver, vm, flags);
5983 5984

cleanup:
5985 5986
    if (vm)
        virDomainObjUnlock(vm);
5987
    qemuDriverUnlock(driver);
5988
    return ret;
D
Daniel P. Berrange 已提交
5989 5990 5991
}


5992 5993 5994 5995
static char *qemuDomainXMLFromNative(virConnectPtr conn,
                                     const char *format,
                                     const char *config,
                                     unsigned int flags ATTRIBUTE_UNUSED) {
5996
    struct qemud_driver *driver = conn->privateData;
5997 5998 5999 6000
    virDomainDefPtr def = NULL;
    char *xml = NULL;

    if (STRNEQ(format, QEMU_CONFIG_FORMAT_ARGV)) {
6001 6002
        qemuReportError(VIR_ERR_INVALID_ARG,
                        _("unsupported config type %s"), format);
6003 6004 6005
        goto cleanup;
    }

6006
    qemuDriverLock(driver);
6007
    def = qemuParseCommandLineString(driver->caps, config);
6008
    qemuDriverUnlock(driver);
6009 6010 6011
    if (!def)
        goto cleanup;

6012
    xml = virDomainDefFormat(def, VIR_DOMAIN_XML_INACTIVE);
6013 6014 6015 6016 6017 6018

cleanup:
    virDomainDefFree(def);
    return xml;
}

6019 6020 6021 6022 6023 6024
static char *qemuDomainXMLToNative(virConnectPtr conn,
                                   const char *format,
                                   const char *xmlData,
                                   unsigned int flags ATTRIBUTE_UNUSED) {
    struct qemud_driver *driver = conn->privateData;
    virDomainDefPtr def = NULL;
6025
    virDomainChrSourceDef monConfig;
6026
    unsigned long long qemuCmdFlags;
E
Eric Blake 已提交
6027
    virCommandPtr cmd = NULL;
6028 6029 6030
    char *ret = NULL;
    int i;

6031 6032
    qemuDriverLock(driver);

6033
    if (STRNEQ(format, QEMU_CONFIG_FORMAT_ARGV)) {
6034 6035
        qemuReportError(VIR_ERR_INVALID_ARG,
                        _("unsupported config type %s"), format);
6036 6037 6038
        goto cleanup;
    }

6039
    def = virDomainDefParseString(driver->caps, xmlData, 0);
6040 6041 6042
    if (!def)
        goto cleanup;

6043 6044
    /* Since we're just exporting args, we can't do bridge/network/direct
     * setups, since libvirt will normally create TAP/macvtap devices
6045 6046 6047 6048 6049
     * directly. We convert those configs into generic 'ethernet'
     * config and assume the user has suitable 'ifup-qemu' scripts
     */
    for (i = 0 ; i < def->nnets ; i++) {
        virDomainNetDefPtr net = def->nets[i];
6050
        int bootIndex = net->bootIndex;
6051 6052
        if (net->type == VIR_DOMAIN_NET_TYPE_NETWORK ||
            net->type == VIR_DOMAIN_NET_TYPE_DIRECT) {
6053 6054 6055 6056 6057 6058 6059 6060 6061 6062 6063 6064 6065 6066 6067 6068 6069 6070 6071 6072
            VIR_FREE(net->data.network.name);

            memset(net, 0, sizeof *net);

            net->type = VIR_DOMAIN_NET_TYPE_ETHERNET;
            net->data.ethernet.dev = NULL;
            net->data.ethernet.script = NULL;
            net->data.ethernet.ipaddr = NULL;
        } else if (net->type == VIR_DOMAIN_NET_TYPE_BRIDGE) {
            char *brname = net->data.bridge.brname;
            char *script = net->data.bridge.script;
            char *ipaddr = net->data.bridge.ipaddr;

            memset(net, 0, sizeof *net);

            net->type = VIR_DOMAIN_NET_TYPE_ETHERNET;
            net->data.ethernet.dev = brname;
            net->data.ethernet.script = script;
            net->data.ethernet.ipaddr = ipaddr;
        }
6073
        net->bootIndex = bootIndex;
6074 6075 6076 6077
    }
    for (i = 0 ; i < def->ngraphics ; i++) {
        if (def->graphics[i]->type == VIR_DOMAIN_GRAPHICS_TYPE_VNC &&
            def->graphics[i]->data.vnc.autoport)
6078
            def->graphics[i]->data.vnc.port = QEMU_VNC_PORT_MIN;
6079 6080
    }

6081 6082 6083
    if (qemuCapsExtractVersionInfo(def->emulator,
                                   NULL,
                                   &qemuCmdFlags) < 0)
6084 6085
        goto cleanup;

6086
    if (qemuPrepareMonitorChr(driver, &monConfig, def->name) < 0)
6087
        goto cleanup;
6088

6089 6090
    if (!(cmd = qemuBuildCommandLine(conn, driver, def,
                                     &monConfig, false, qemuCmdFlags,
6091
                                     NULL, -1, NULL, VIR_VM_OP_NO_OP)))
6092 6093
        goto cleanup;

E
Eric Blake 已提交
6094
    ret = virCommandToString(cmd);
6095 6096

cleanup:
6097
    qemuDriverUnlock(driver);
6098

E
Eric Blake 已提交
6099
    virCommandFree(cmd);
6100 6101 6102 6103 6104
    virDomainDefFree(def);
    return ret;
}


6105
static int qemudListDefinedDomains(virConnectPtr conn,
6106
                            char **const names, int nnames) {
6107
    struct qemud_driver *driver = conn->privateData;
6108
    int n;
6109

6110
    qemuDriverLock(driver);
6111
    n = virDomainObjListGetInactiveNames(&driver->domains, names, nnames);
6112
    qemuDriverUnlock(driver);
6113
    return n;
D
Daniel P. Berrange 已提交
6114 6115
}

6116
static int qemudNumDefinedDomains(virConnectPtr conn) {
6117
    struct qemud_driver *driver = conn->privateData;
6118
    int n;
6119

6120
    qemuDriverLock(driver);
6121
    n = virDomainObjListNumOfDomains(&driver->domains, 0);
6122
    qemuDriverUnlock(driver);
6123

6124
    return n;
D
Daniel P. Berrange 已提交
6125 6126 6127
}


J
Jiri Denemark 已提交
6128 6129
static int qemudDomainObjStart(virConnectPtr conn,
                               struct qemud_driver *driver,
6130 6131
                               virDomainObjPtr vm,
                               bool start_paused)
J
Jiri Denemark 已提交
6132 6133 6134 6135 6136 6137 6138 6139 6140 6141 6142 6143 6144 6145 6146 6147 6148 6149 6150 6151
{
    int ret = -1;
    char *managed_save;

    /*
     * If there is a managed saved state restore it instead of starting
     * from scratch. In any case the old state is removed.
     */
    managed_save = qemuDomainManagedSavePath(driver, vm);
    if ((managed_save) && (virFileExists(managed_save))) {
        ret = qemudDomainObjRestore(conn, driver, vm, managed_save);

        if (unlink(managed_save) < 0) {
            VIR_WARN("Failed to remove the managed state %s", managed_save);
        }

        if (ret == 0)
            goto cleanup;
    }

6152 6153
    ret = qemudStartVMDaemon(conn, driver, vm, NULL, start_paused, -1, NULL,
                             VIR_VM_OP_CREATE);
6154 6155
    qemuDomainStartAudit(vm, "booted", ret >= 0);
    if (ret >= 0) {
J
Jiri Denemark 已提交
6156 6157 6158 6159 6160 6161 6162 6163 6164 6165 6166 6167 6168
        virDomainEventPtr event =
            virDomainEventNewFromObj(vm,
                                     VIR_DOMAIN_EVENT_STARTED,
                                     VIR_DOMAIN_EVENT_STARTED_BOOTED);
        if (event)
            qemuDomainEventQueue(driver, event);
    }

cleanup:
    VIR_FREE(managed_save);
    return ret;
}

6169 6170 6171
static int
qemudDomainStartWithFlags(virDomainPtr dom, unsigned int flags)
{
6172 6173 6174
    struct qemud_driver *driver = dom->conn->privateData;
    virDomainObjPtr vm;
    int ret = -1;
6175

6176
    virCheckFlags(VIR_DOMAIN_START_PAUSED, -1);
6177

6178
    qemuDriverLock(driver);
6179
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
6180

6181
    if (!vm) {
6182 6183
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
6184 6185
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
6186
        goto cleanup;
6187 6188
    }

6189 6190 6191 6192
    if (qemuDomainObjBeginJobWithDriver(driver, vm) < 0)
        goto cleanup;

    if (virDomainObjIsActive(vm)) {
6193 6194
        qemuReportError(VIR_ERR_OPERATION_INVALID,
                        "%s", _("domain is already running"));
6195 6196 6197
        goto endjob;
    }

6198 6199
    ret = qemudDomainObjStart(dom->conn, driver, vm,
                              (flags & VIR_DOMAIN_START_PAUSED) != 0);
6200

6201
endjob:
6202 6203
    if (qemuDomainObjEndJob(vm) == 0)
        vm = NULL;
6204

6205
cleanup:
6206 6207
    if (vm)
        virDomainObjUnlock(vm);
6208
    qemuDriverUnlock(driver);
6209
    return ret;
D
Daniel P. Berrange 已提交
6210 6211
}

6212 6213 6214 6215 6216 6217
static int
qemudDomainStart(virDomainPtr dom)
{
    return qemudDomainStartWithFlags(dom, 0);
}

6218 6219 6220 6221 6222 6223 6224 6225 6226 6227 6228 6229 6230 6231 6232
static int
qemudCanonicalizeMachineFromInfo(virDomainDefPtr def,
                                 virCapsGuestDomainInfoPtr info,
                                 char **canonical)
{
    int i;

    *canonical = NULL;

    for (i = 0; i < info->nmachines; i++) {
        virCapsGuestMachinePtr machine = info->machines[i];

        if (!machine->canonical)
            continue;

6233
        if (STRNEQ(def->os.machine, machine->name))
6234 6235 6236
            continue;

        if (!(*canonical = strdup(machine->canonical))) {
6237
            virReportOOMError();
6238 6239 6240 6241 6242 6243 6244 6245 6246
            return -1;
        }

        break;
    }

    return 0;
}

6247 6248 6249 6250 6251 6252
static int
qemudCanonicalizeMachineDirect(virDomainDefPtr def, char **canonical)
{
    virCapsGuestMachinePtr *machines = NULL;
    int i, nmachines = 0;

6253
    if (qemuCapsProbeMachineTypes(def->emulator, &machines, &nmachines) < 0) {
6254
        virReportOOMError();
6255 6256 6257 6258 6259 6260 6261
        return -1;
    }

    for (i = 0; i < nmachines; i++) {
        if (!machines[i]->canonical)
            continue;

6262
        if (STRNEQ(def->os.machine, machines[i]->name))
6263 6264 6265 6266 6267 6268 6269 6270 6271 6272 6273 6274
            continue;

        *canonical = machines[i]->canonical;
        machines[i]->canonical = NULL;
        break;
    }

    virCapabilitiesFreeMachines(machines, nmachines);

    return 0;
}

6275 6276
int
qemudCanonicalizeMachine(struct qemud_driver *driver, virDomainDefPtr def)
6277 6278 6279 6280 6281 6282
{
    char *canonical = NULL;
    int i;

    for (i = 0; i < driver->caps->nguests; i++) {
        virCapsGuestPtr guest = driver->caps->guests[i];
6283
        virCapsGuestDomainInfoPtr info;
6284 6285 6286
        int j;

        for (j = 0; j < guest->arch.ndomains; j++) {
6287
            info = &guest->arch.domains[j]->info;
6288

6289 6290 6291 6292 6293 6294 6295 6296 6297
            if (!info->emulator || !STREQ(info->emulator, def->emulator))
                continue;

            if (!info->nmachines)
                info = &guest->arch.defaultInfo;

            if (qemudCanonicalizeMachineFromInfo(def, info, &canonical) < 0)
                return -1;
            goto out;
6298 6299
        }

6300 6301 6302 6303
        info = &guest->arch.defaultInfo;

        if (info->emulator && STREQ(info->emulator, def->emulator)) {
            if (qemudCanonicalizeMachineFromInfo(def, info, &canonical) < 0)
6304 6305 6306 6307
                return -1;
            goto out;
        }
    }
6308 6309 6310 6311

    if (qemudCanonicalizeMachineDirect(def, &canonical) < 0)
        return -1;

6312 6313 6314 6315 6316 6317 6318
out:
    if (canonical) {
        VIR_FREE(def->os.machine);
        def->os.machine = canonical;
    }
    return 0;
}
D
Daniel P. Berrange 已提交
6319

6320
static virDomainPtr qemudDomainDefine(virConnectPtr conn, const char *xml) {
6321
    struct qemud_driver *driver = conn->privateData;
6322
    virDomainDefPtr def;
6323
    virDomainObjPtr vm = NULL;
6324
    virDomainPtr dom = NULL;
6325
    virDomainEventPtr event = NULL;
6326
    int dupVM;
6327

6328
    qemuDriverLock(driver);
6329
    if (!(def = virDomainDefParseString(driver->caps, xml,
6330
                                        VIR_DOMAIN_XML_INACTIVE)))
6331
        goto cleanup;
6332

6333
    if (virSecurityManagerVerify(driver->securityManager, def) < 0)
6334 6335
        goto cleanup;

6336 6337
    if ((dupVM = virDomainObjIsDuplicate(&driver->domains, def, 0)) < 0)
        goto cleanup;
6338

6339
    if (qemudCanonicalizeMachine(driver, def) < 0)
6340 6341
        goto cleanup;

6342 6343 6344
    if (qemuAssignPCIAddresses(def) < 0)
        goto cleanup;

6345
    if (!(vm = virDomainAssignDef(driver->caps,
6346
                                  &driver->domains,
6347
                                  def, false))) {
6348
        goto cleanup;
6349
    }
6350
    def = NULL;
6351
    vm->persistent = 1;
6352

6353
    if (virDomainSaveConfig(driver->configDir,
6354
                            vm->newDef ? vm->newDef : vm->def) < 0) {
6355 6356
        virDomainRemoveInactive(&driver->domains,
                                vm);
6357
        vm = NULL;
6358
        goto cleanup;
6359 6360
    }

6361 6362
    event = virDomainEventNewFromObj(vm,
                                     VIR_DOMAIN_EVENT_DEFINED,
6363
                                     !dupVM ?
6364 6365
                                     VIR_DOMAIN_EVENT_DEFINED_ADDED :
                                     VIR_DOMAIN_EVENT_DEFINED_UPDATED);
6366

6367
    dom = virGetDomain(conn, vm->def->name, vm->def->uuid);
6368
    if (dom) dom->id = vm->def->id;
6369 6370

cleanup:
6371
    virDomainDefFree(def);
6372 6373
    if (vm)
        virDomainObjUnlock(vm);
6374 6375
    if (event)
        qemuDomainEventQueue(driver, event);
6376
    qemuDriverUnlock(driver);
6377
    return dom;
D
Daniel P. Berrange 已提交
6378 6379
}

6380
static int qemudDomainUndefine(virDomainPtr dom) {
6381 6382
    struct qemud_driver *driver = dom->conn->privateData;
    virDomainObjPtr vm;
6383
    virDomainEventPtr event = NULL;
6384
    int ret = -1;
D
Daniel P. Berrange 已提交
6385

6386
    qemuDriverLock(driver);
6387
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
6388

D
Daniel P. Berrange 已提交
6389
    if (!vm) {
6390 6391
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
6392 6393
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
6394
        goto cleanup;
D
Daniel P. Berrange 已提交
6395 6396
    }

D
Daniel P. Berrange 已提交
6397
    if (virDomainObjIsActive(vm)) {
6398 6399
        qemuReportError(VIR_ERR_OPERATION_INVALID,
                        "%s", _("cannot delete active domain"));
6400
        goto cleanup;
D
Daniel P. Berrange 已提交
6401 6402
    }

6403
    if (!vm->persistent) {
6404 6405
        qemuReportError(VIR_ERR_INTERNAL_ERROR,
                        "%s", _("cannot undefine transient domain"));
6406
        goto cleanup;
6407 6408
    }

6409
    if (virDomainDeleteConfig(driver->configDir, driver->autostartDir, vm) < 0)
6410
        goto cleanup;
D
Daniel P. Berrange 已提交
6411

6412 6413 6414
    event = virDomainEventNewFromObj(vm,
                                     VIR_DOMAIN_EVENT_UNDEFINED,
                                     VIR_DOMAIN_EVENT_UNDEFINED_REMOVED);
6415

6416 6417
    virDomainRemoveInactive(&driver->domains,
                            vm);
6418
    vm = NULL;
6419
    ret = 0;
D
Daniel P. Berrange 已提交
6420

6421
cleanup:
6422 6423
    if (vm)
        virDomainObjUnlock(vm);
6424 6425
    if (event)
        qemuDomainEventQueue(driver, event);
6426
    qemuDriverUnlock(driver);
6427
    return ret;
D
Daniel P. Berrange 已提交
6428 6429
}

6430

6431 6432
static int qemudDomainAttachDevice(virDomainPtr dom,
                                   const char *xml)
6433
{
6434 6435 6436 6437
    struct qemud_driver *driver = dom->conn->privateData;
    virDomainObjPtr vm;
    virDomainDeviceDefPtr dev = NULL;
    unsigned long long qemuCmdFlags;
6438
    virCgroupPtr cgroup = NULL;
6439
    int ret = -1;
6440

6441 6442 6443 6444 6445 6446 6447
    qemuDriverLock(driver);
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
    if (!vm) {
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
6448 6449 6450
        goto cleanup;
    }

6451 6452
    if (qemuDomainObjBeginJobWithDriver(driver, vm) < 0)
        goto cleanup;
6453

6454 6455 6456 6457 6458
    if (!virDomainObjIsActive(vm)) {
        qemuReportError(VIR_ERR_OPERATION_INVALID,
                        "%s", _("cannot attach device on inactive domain"));
        goto endjob;
    }
6459

6460 6461 6462 6463
    dev = virDomainDeviceDefParse(driver->caps, vm->def, xml,
                                  VIR_DOMAIN_XML_INACTIVE);
    if (dev == NULL)
        goto endjob;
6464

6465 6466 6467 6468
    if (qemuCapsExtractVersionInfo(vm->def->emulator,
                                   NULL,
                                   &qemuCmdFlags) < 0)
        goto endjob;
6469

6470 6471 6472 6473 6474 6475 6476 6477 6478 6479
    if (dev->type == VIR_DOMAIN_DEVICE_DISK) {
        if (qemuCgroupControllerActive(driver, VIR_CGROUP_CONTROLLER_DEVICES)) {
            if (virCgroupForDomain(driver->cgroup, vm->def->name, &cgroup, 0) !=0 ) {
                qemuReportError(VIR_ERR_INTERNAL_ERROR,
                                _("Unable to find cgroup for %s\n"),
                                vm->def->name);
                goto endjob;
            }
            if (qemuSetupDiskCgroup(driver, cgroup, dev->data.disk) < 0)
                goto endjob;
6480 6481
        }

6482 6483 6484 6485 6486 6487 6488 6489 6490 6491
        switch (dev->data.disk->device) {
        case VIR_DOMAIN_DISK_DEVICE_CDROM:
        case VIR_DOMAIN_DISK_DEVICE_FLOPPY:
            ret = qemuDomainChangeEjectableMedia(driver, vm,
                                                 dev->data.disk,
                                                 qemuCmdFlags,
                                                 false);
            if (ret == 0)
                dev->data.disk = NULL;
            break;
6492

6493 6494 6495 6496 6497 6498 6499 6500 6501 6502 6503 6504 6505 6506 6507 6508 6509 6510 6511 6512 6513 6514 6515
        case VIR_DOMAIN_DISK_DEVICE_DISK:
            if (dev->data.disk->bus == VIR_DOMAIN_DISK_BUS_USB) {
                ret = qemuDomainAttachUsbMassstorageDevice(driver, vm,
                                                           dev->data.disk, qemuCmdFlags);
                if (ret == 0)
                    dev->data.disk = NULL;
            } else if (dev->data.disk->bus == VIR_DOMAIN_DISK_BUS_VIRTIO) {
                ret = qemuDomainAttachPciDiskDevice(driver, vm,
                                                    dev->data.disk, qemuCmdFlags);
                if (ret == 0)
                    dev->data.disk = NULL;
            } else if (dev->data.disk->bus == VIR_DOMAIN_DISK_BUS_SCSI) {
                ret = qemuDomainAttachSCSIDisk(driver, vm,
                                               dev->data.disk, qemuCmdFlags);
                if (ret == 0)
                    dev->data.disk = NULL;
            } else {
                qemuReportError(VIR_ERR_CONFIG_UNSUPPORTED,
                                _("disk bus '%s' cannot be hotplugged."),
                                virDomainDiskBusTypeToString(dev->data.disk->bus));
                /* fallthrough */
            }
            break;
6516

6517 6518 6519 6520 6521
        default:
            qemuReportError(VIR_ERR_CONFIG_UNSUPPORTED,
                            _("disk device type '%s' cannot be hotplugged"),
                            virDomainDiskDeviceTypeToString(dev->data.disk->device));
            /* Fallthrough */
6522
        }
6523 6524 6525 6526
        if (ret != 0 && cgroup) {
            if (qemuTeardownDiskCgroup(driver, cgroup, dev->data.disk) < 0)
                VIR_WARN("Failed to teardown cgroup for disk path %s",
                         NULLSTR(dev->data.disk->src));
6527
        }
6528 6529 6530 6531 6532 6533 6534 6535 6536 6537 6538
    } else if (dev->type == VIR_DOMAIN_DEVICE_CONTROLLER) {
        if (dev->data.controller->type == VIR_DOMAIN_CONTROLLER_TYPE_SCSI) {
            ret = qemuDomainAttachPciControllerDevice(driver, vm,
                                                      dev->data.controller, qemuCmdFlags);
            if (ret == 0)
                dev->data.controller = NULL;
        } else {
            qemuReportError(VIR_ERR_CONFIG_UNSUPPORTED,
                            _("disk controller bus '%s' cannot be hotplugged."),
                            virDomainControllerTypeToString(dev->data.controller->type));
            /* fallthrough */
6539
        }
6540 6541 6542 6543 6544 6545 6546 6547 6548 6549
    } else if (dev->type == VIR_DOMAIN_DEVICE_NET) {
        ret = qemuDomainAttachNetDevice(dom->conn, driver, vm,
                                        dev->data.net, qemuCmdFlags);
        if (ret == 0)
            dev->data.net = NULL;
    } else if (dev->type == VIR_DOMAIN_DEVICE_HOSTDEV) {
        ret = qemuDomainAttachHostDevice(driver, vm,
                                         dev->data.hostdev, qemuCmdFlags);
        if (ret == 0)
            dev->data.hostdev = NULL;
6550
    } else {
6551 6552 6553 6554
        qemuReportError(VIR_ERR_CONFIG_UNSUPPORTED,
                        _("device type '%s' cannot be attached"),
                        virDomainDeviceTypeToString(dev->type));
        goto endjob;
6555 6556
    }

6557 6558 6559 6560 6561 6562 6563 6564 6565 6566 6567 6568 6569 6570 6571
    if (!ret && virDomainSaveStatus(driver->caps, driver->stateDir, vm) < 0)
        ret = -1;

endjob:
    if (qemuDomainObjEndJob(vm) == 0)
        vm = NULL;

cleanup:
    if (cgroup)
        virCgroupFree(&cgroup);

    virDomainDeviceDefFree(dev);
    if (vm)
        virDomainObjUnlock(vm);
    qemuDriverUnlock(driver);
6572 6573 6574
    return ret;
}

6575 6576 6577 6578 6579 6580 6581 6582
static int qemudDomainAttachDeviceFlags(virDomainPtr dom,
                                        const char *xml,
                                        unsigned int flags) {
    if (flags & VIR_DOMAIN_DEVICE_MODIFY_CONFIG) {
        qemuReportError(VIR_ERR_OPERATION_INVALID,
                        "%s", _("cannot modify the persistent configuration of a domain"));
        return -1;
    }
6583

6584 6585
    return qemudDomainAttachDevice(dom, xml);
}
6586

6587

6588 6589 6590 6591 6592 6593 6594 6595 6596 6597 6598
static int qemuDomainUpdateDeviceFlags(virDomainPtr dom,
                                       const char *xml,
                                       unsigned int flags)
{
    struct qemud_driver *driver = dom->conn->privateData;
    virDomainObjPtr vm;
    virDomainDeviceDefPtr dev = NULL;
    unsigned long long qemuCmdFlags;
    virCgroupPtr cgroup = NULL;
    int ret = -1;
    bool force = (flags & VIR_DOMAIN_DEVICE_MODIFY_FORCE) != 0;
6599

6600 6601 6602 6603
    virCheckFlags(VIR_DOMAIN_DEVICE_MODIFY_CURRENT |
                  VIR_DOMAIN_DEVICE_MODIFY_LIVE |
                  VIR_DOMAIN_DEVICE_MODIFY_CONFIG |
                  VIR_DOMAIN_DEVICE_MODIFY_FORCE, -1);
6604

6605 6606 6607
    if (flags & VIR_DOMAIN_DEVICE_MODIFY_CONFIG) {
        qemuReportError(VIR_ERR_OPERATION_INVALID,
                        "%s", _("cannot modify the persistent configuration of a domain"));
6608 6609 6610
        return -1;
    }

6611 6612 6613 6614 6615 6616 6617 6618
    qemuDriverLock(driver);
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
    if (!vm) {
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
        goto cleanup;
6619 6620
    }

6621 6622 6623 6624 6625 6626 6627
    if (qemuDomainObjBeginJobWithDriver(driver, vm) < 0)
        goto cleanup;

    if (!virDomainObjIsActive(vm)) {
        qemuReportError(VIR_ERR_OPERATION_INVALID,
                        "%s", _("cannot attach device on inactive domain"));
        goto endjob;
6628 6629
    }

6630 6631 6632 6633 6634 6635 6636 6637 6638
    dev = virDomainDeviceDefParse(driver->caps, vm->def, xml,
                                  VIR_DOMAIN_XML_INACTIVE);
    if (dev == NULL)
        goto endjob;

    if (qemuCapsExtractVersionInfo(vm->def->emulator,
                                   NULL,
                                   &qemuCmdFlags) < 0)
        goto endjob;
6639

6640 6641 6642 6643 6644 6645 6646 6647 6648 6649 6650
    switch (dev->type) {
    case VIR_DOMAIN_DEVICE_DISK:
        if (qemuCgroupControllerActive(driver, VIR_CGROUP_CONTROLLER_DEVICES)) {
            if (virCgroupForDomain(driver->cgroup, vm->def->name, &cgroup, 0) !=0 ) {
                qemuReportError(VIR_ERR_INTERNAL_ERROR,
                                _("Unable to find cgroup for %s\n"),
                                vm->def->name);
                goto endjob;
            }
            if (qemuSetupDiskCgroup(driver, cgroup, dev->data.disk) < 0)
                goto endjob;
6651 6652
        }

6653 6654 6655 6656 6657 6658 6659 6660 6661 6662
        switch (dev->data.disk->device) {
        case VIR_DOMAIN_DISK_DEVICE_CDROM:
        case VIR_DOMAIN_DISK_DEVICE_FLOPPY:
            ret = qemuDomainChangeEjectableMedia(driver, vm,
                                                 dev->data.disk,
                                                 qemuCmdFlags,
                                                 force);
            if (ret == 0)
                dev->data.disk = NULL;
            break;
6663

6664

6665 6666 6667 6668 6669 6670
        default:
            qemuReportError(VIR_ERR_CONFIG_UNSUPPORTED,
                            _("disk bus '%s' cannot be updated."),
                            virDomainDiskBusTypeToString(dev->data.disk->bus));
            break;
        }
6671

6672 6673 6674 6675 6676
        if (ret != 0 && cgroup) {
            if (qemuTeardownDiskCgroup(driver, cgroup, dev->data.disk) < 0)
                VIR_WARN("Failed to teardown cgroup for disk path %s",
                         NULLSTR(dev->data.disk->src));
        }
6677
        break;
6678 6679 6680

    case VIR_DOMAIN_DEVICE_GRAPHICS:
        ret = qemuDomainChangeGraphics(driver, vm, dev->data.graphics);
6681
        break;
6682

6683
    default:
6684
        qemuReportError(VIR_ERR_CONFIG_UNSUPPORTED,
6685 6686 6687
                        _("disk device type '%s' cannot be updated"),
                        virDomainDiskDeviceTypeToString(dev->data.disk->device));
        break;
6688 6689
    }

6690 6691 6692 6693 6694 6695 6696 6697 6698 6699
    if (!ret && virDomainSaveStatus(driver->caps, driver->stateDir, vm) < 0)
        ret = -1;

endjob:
    if (qemuDomainObjEndJob(vm) == 0)
        vm = NULL;

cleanup:
    if (cgroup)
        virCgroupFree(&cgroup);
6700

6701 6702 6703 6704
    virDomainDeviceDefFree(dev);
    if (vm)
        virDomainObjUnlock(vm);
    qemuDriverUnlock(driver);
6705 6706 6707
    return ret;
}

6708

6709 6710
static int qemudDomainDetachDevice(virDomainPtr dom,
                                   const char *xml) {
6711 6712
    struct qemud_driver *driver = dom->conn->privateData;
    virDomainObjPtr vm;
6713
    unsigned long long qemuCmdFlags;
6714 6715
    virDomainDeviceDefPtr dev = NULL;
    int ret = -1;
6716

6717
    qemuDriverLock(driver);
6718
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
6719
    if (!vm) {
6720 6721
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
6722 6723
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
6724
        goto cleanup;
6725 6726
    }

6727 6728 6729
    if (qemuDomainObjBeginJobWithDriver(driver, vm) < 0)
        goto cleanup;

D
Daniel P. Berrange 已提交
6730
    if (!virDomainObjIsActive(vm)) {
6731 6732
        qemuReportError(VIR_ERR_OPERATION_INVALID,
                        "%s", _("cannot detach device on inactive domain"));
6733
        goto endjob;
6734 6735
    }

6736
    dev = virDomainDeviceDefParse(driver->caps, vm->def, xml,
6737
                                  VIR_DOMAIN_XML_INACTIVE);
6738
    if (dev == NULL)
6739
        goto endjob;
6740

6741 6742 6743
    if (qemuCapsExtractVersionInfo(vm->def->emulator,
                                   NULL,
                                   &qemuCmdFlags) < 0)
6744
        goto endjob;
6745 6746

    if (dev->type == VIR_DOMAIN_DEVICE_DISK &&
6747 6748
        dev->data.disk->device == VIR_DOMAIN_DISK_DEVICE_DISK) {
        if (dev->data.disk->bus == VIR_DOMAIN_DISK_BUS_VIRTIO) {
6749
            ret = qemuDomainDetachPciDiskDevice(driver, vm, dev, qemuCmdFlags);
6750 6751
        }
        else if (dev->data.disk->bus == VIR_DOMAIN_DISK_BUS_SCSI) {
6752 6753
            ret = qemuDomainDetachSCSIDiskDevice(driver, vm, dev,
                                                 qemuCmdFlags);
6754 6755
        }
        else {
6756
            qemuReportError(VIR_ERR_CONFIG_UNSUPPORTED, "%s",
6757 6758
                            _("This type of disk cannot be hot unplugged"));
        }
6759
    } else if (dev->type == VIR_DOMAIN_DEVICE_NET) {
6760
        ret = qemuDomainDetachNetDevice(driver, vm, dev, qemuCmdFlags);
6761 6762
    } else if (dev->type == VIR_DOMAIN_DEVICE_CONTROLLER) {
        if (dev->data.controller->type == VIR_DOMAIN_CONTROLLER_TYPE_SCSI) {
6763 6764
            ret = qemuDomainDetachPciControllerDevice(driver, vm, dev,
                                                      qemuCmdFlags);
6765
        } else {
6766
            qemuReportError(VIR_ERR_CONFIG_UNSUPPORTED,
6767 6768
                            _("disk controller bus '%s' cannot be hotunplugged."),
                            virDomainControllerTypeToString(dev->data.controller->type));
6769 6770
            /* fallthrough */
        }
6771
    } else if (dev->type == VIR_DOMAIN_DEVICE_HOSTDEV) {
6772
        ret = qemuDomainDetachHostDevice(driver, vm, dev, qemuCmdFlags);
6773
    } else {
6774
        qemuReportError(VIR_ERR_CONFIG_UNSUPPORTED,
6775
                        "%s", _("This type of device cannot be hot unplugged"));
6776
    }
6777

6778
    if (!ret && virDomainSaveStatus(driver->caps, driver->stateDir, vm) < 0)
6779 6780
        ret = -1;

6781
endjob:
6782 6783
    if (qemuDomainObjEndJob(vm) == 0)
        vm = NULL;
6784

6785 6786
cleanup:
    virDomainDeviceDefFree(dev);
6787 6788
    if (vm)
        virDomainObjUnlock(vm);
6789
    qemuDriverUnlock(driver);
6790 6791 6792
    return ret;
}

6793 6794 6795 6796
static int qemudDomainDetachDeviceFlags(virDomainPtr dom,
                                        const char *xml,
                                        unsigned int flags) {
    if (flags & VIR_DOMAIN_DEVICE_MODIFY_CONFIG) {
6797 6798
        qemuReportError(VIR_ERR_OPERATION_INVALID,
                        "%s", _("cannot modify the persistent configuration of a domain"));
6799 6800 6801 6802 6803 6804
        return -1;
    }

    return qemudDomainDetachDevice(dom, xml);
}

6805
static int qemudDomainGetAutostart(virDomainPtr dom,
6806
                                   int *autostart) {
6807 6808 6809
    struct qemud_driver *driver = dom->conn->privateData;
    virDomainObjPtr vm;
    int ret = -1;
6810

6811
    qemuDriverLock(driver);
6812
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
6813 6814
    qemuDriverUnlock(driver);

6815
    if (!vm) {
6816 6817
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
6818 6819
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
6820
        goto cleanup;
6821 6822 6823
    }

    *autostart = vm->autostart;
6824
    ret = 0;
6825

6826
cleanup:
6827 6828
    if (vm)
        virDomainObjUnlock(vm);
6829
    return ret;
6830 6831
}

6832
static int qemudDomainSetAutostart(virDomainPtr dom,
6833
                                   int autostart) {
6834 6835
    struct qemud_driver *driver = dom->conn->privateData;
    virDomainObjPtr vm;
6836 6837
    char *configFile = NULL, *autostartLink = NULL;
    int ret = -1;
6838

6839
    qemuDriverLock(driver);
6840
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
6841

6842
    if (!vm) {
6843 6844
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
6845 6846
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
6847
        goto cleanup;
6848 6849
    }

6850
    if (!vm->persistent) {
6851 6852
        qemuReportError(VIR_ERR_INTERNAL_ERROR,
                        "%s", _("cannot set autostart for transient domain"));
6853
        goto cleanup;
6854 6855
    }

6856 6857
    autostart = (autostart != 0);

6858
    if (vm->autostart != autostart) {
6859
        if ((configFile = virDomainConfigFile(driver->configDir, vm->def->name)) == NULL)
6860
            goto cleanup;
6861
        if ((autostartLink = virDomainConfigFile(driver->autostartDir, vm->def->name)) == NULL)
6862
            goto cleanup;
6863

6864 6865
        if (autostart) {
            int err;
6866

6867
            if ((err = virFileMakePath(driver->autostartDir))) {
6868
                virReportSystemError(err,
6869 6870
                                     _("cannot create autostart directory %s"),
                                     driver->autostartDir);
6871 6872
                goto cleanup;
            }
6873

6874
            if (symlink(configFile, autostartLink) < 0) {
6875
                virReportSystemError(errno,
6876 6877
                                     _("Failed to create symlink '%s to '%s'"),
                                     autostartLink, configFile);
6878 6879 6880 6881
                goto cleanup;
            }
        } else {
            if (unlink(autostartLink) < 0 && errno != ENOENT && errno != ENOTDIR) {
6882
                virReportSystemError(errno,
6883 6884
                                     _("Failed to delete symlink '%s'"),
                                     autostartLink);
6885 6886
                goto cleanup;
            }
6887 6888
        }

6889
        vm->autostart = autostart;
6890
    }
6891
    ret = 0;
6892

6893 6894 6895
cleanup:
    VIR_FREE(configFile);
    VIR_FREE(autostartLink);
6896 6897
    if (vm)
        virDomainObjUnlock(vm);
6898
    qemuDriverUnlock(driver);
6899
    return ret;
6900 6901
}

6902 6903 6904 6905 6906

static char *qemuGetSchedulerType(virDomainPtr dom,
                                  int *nparams)
{
    struct qemud_driver *driver = dom->conn->privateData;
6907
    char *ret = NULL;
6908

6909
    qemuDriverLock(driver);
6910
    if (!qemuCgroupControllerActive(driver, VIR_CGROUP_CONTROLLER_CPU)) {
6911 6912
        qemuReportError(VIR_ERR_NO_SUPPORT,
                        __FUNCTION__);
6913
        goto cleanup;
6914 6915 6916 6917 6918 6919 6920
    }

    if (nparams)
        *nparams = 1;

    ret = strdup("posix");
    if (!ret)
6921
        virReportOOMError();
6922 6923 6924

cleanup:
    qemuDriverUnlock(driver);
6925 6926 6927
    return ret;
}

6928 6929 6930 6931 6932 6933 6934 6935 6936 6937 6938 6939 6940 6941 6942 6943 6944 6945 6946 6947 6948 6949 6950 6951 6952 6953 6954 6955 6956 6957 6958 6959 6960 6961 6962 6963 6964 6965 6966 6967 6968 6969 6970 6971 6972 6973 6974 6975 6976 6977 6978 6979 6980 6981 6982 6983 6984 6985 6986 6987 6988 6989 6990 6991 6992 6993 6994

static int qemuDomainSetMemoryParameters(virDomainPtr dom,
                                         virMemoryParameterPtr params,
                                         int nparams,
                                         unsigned int flags ATTRIBUTE_UNUSED)
{
    struct qemud_driver *driver = dom->conn->privateData;
    int i;
    virCgroupPtr group = NULL;
    virDomainObjPtr vm = NULL;
    int ret = -1;

    qemuDriverLock(driver);
    if (!qemuCgroupControllerActive(driver, VIR_CGROUP_CONTROLLER_MEMORY)) {
        qemuReportError(VIR_ERR_NO_SUPPORT,
                        __FUNCTION__);
        goto cleanup;
    }

    vm = virDomainFindByUUID(&driver->domains, dom->uuid);

    if (vm == NULL) {
        qemuReportError(VIR_ERR_INTERNAL_ERROR,
                        _("No such domain %s"), dom->uuid);
        goto cleanup;
    }

    if (virCgroupForDomain(driver->cgroup, vm->def->name, &group, 0) != 0) {
        qemuReportError(VIR_ERR_INTERNAL_ERROR,
                        _("cannot find cgroup for domain %s"), vm->def->name);
        goto cleanup;
    }

    ret = 0;
    for (i = 0; i < nparams; i++) {
        virMemoryParameterPtr param = &params[i];

        if (STREQ(param->field, VIR_DOMAIN_MEMORY_HARD_LIMIT)) {
            int rc;
            if (param->type != VIR_DOMAIN_MEMORY_PARAM_ULLONG) {
                qemuReportError(VIR_ERR_INVALID_ARG, "%s",
                                _("invalid type for memory hard_limit tunable, expected a 'ullong'"));
                ret = -1;
                continue;
            }

            rc = virCgroupSetMemoryHardLimit(group, params[i].value.ul);
            if (rc != 0) {
                virReportSystemError(-rc, "%s",
                                     _("unable to set memory hard_limit tunable"));
                ret = -1;
            }
        } else if (STREQ(param->field, VIR_DOMAIN_MEMORY_SOFT_LIMIT)) {
            int rc;
            if (param->type != VIR_DOMAIN_MEMORY_PARAM_ULLONG) {
                qemuReportError(VIR_ERR_INVALID_ARG, "%s",
                                _("invalid type for memory soft_limit tunable, expected a 'ullong'"));
                ret = -1;
                continue;
            }

            rc = virCgroupSetMemorySoftLimit(group, params[i].value.ul);
            if (rc != 0) {
                virReportSystemError(-rc, "%s",
                                     _("unable to set memory soft_limit tunable"));
                ret = -1;
            }
6995
        } else if (STREQ(param->field, VIR_DOMAIN_MEMORY_SWAP_HARD_LIMIT)) {
6996 6997 6998 6999 7000 7001 7002 7003 7004 7005 7006 7007 7008 7009 7010 7011 7012 7013 7014 7015 7016 7017 7018 7019 7020 7021 7022 7023 7024 7025 7026 7027 7028
            int rc;
            if (param->type != VIR_DOMAIN_MEMORY_PARAM_ULLONG) {
                qemuReportError(VIR_ERR_INVALID_ARG, "%s",
                                _("invalid type for swap_hard_limit tunable, expected a 'ullong'"));
                ret = -1;
                continue;
            }

            rc = virCgroupSetSwapHardLimit(group, params[i].value.ul);
            if (rc != 0) {
                virReportSystemError(-rc, "%s",
                                     _("unable to set swap_hard_limit tunable"));
                ret = -1;
            }
        } else if (STREQ(param->field, VIR_DOMAIN_MEMORY_MIN_GUARANTEE)) {
            qemuReportError(VIR_ERR_INVALID_ARG,
                            _("Memory tunable `%s' not implemented"), param->field);
            ret = -1;
        } else {
            qemuReportError(VIR_ERR_INVALID_ARG,
                            _("Parameter `%s' not supported"), param->field);
            ret = -1;
        }
    }

cleanup:
    virCgroupFree(&group);
    if (vm)
        virDomainObjUnlock(vm);
    qemuDriverUnlock(driver);
    return ret;
}

7029 7030 7031 7032 7033 7034 7035 7036 7037
static int qemuDomainGetMemoryParameters(virDomainPtr dom,
                                         virMemoryParameterPtr params,
                                         int *nparams,
                                         unsigned int flags ATTRIBUTE_UNUSED)
{
    struct qemud_driver *driver = dom->conn->privateData;
    int i;
    virCgroupPtr group = NULL;
    virDomainObjPtr vm = NULL;
7038
    unsigned long long val;
7039 7040 7041 7042 7043 7044 7045 7046 7047 7048 7049 7050 7051 7052 7053 7054 7055 7056 7057 7058 7059 7060 7061 7062 7063 7064 7065 7066 7067 7068 7069 7070 7071 7072 7073 7074 7075 7076 7077 7078 7079 7080 7081 7082 7083 7084 7085 7086 7087 7088
    int ret = -1;
    int rc;

    qemuDriverLock(driver);

    if (!qemuCgroupControllerActive(driver, VIR_CGROUP_CONTROLLER_MEMORY)) {
        qemuReportError(VIR_ERR_NO_SUPPORT,
                        __FUNCTION__);
        goto cleanup;
    }

    vm = virDomainFindByUUID(&driver->domains, dom->uuid);

    if (vm == NULL) {
        qemuReportError(VIR_ERR_INTERNAL_ERROR,
                        _("No such domain %s"), dom->uuid);
        goto cleanup;
    }

    if ((*nparams) == 0) {
        /* Current number of memory parameters supported by cgroups */
        *nparams = QEMU_NB_MEM_PARAM;
        ret = 0;
        goto cleanup;
    }

    if ((*nparams) != QEMU_NB_MEM_PARAM) {
        qemuReportError(VIR_ERR_INVALID_ARG,
                        "%s", _("Invalid parameter count"));
        goto cleanup;
    }

    if (virCgroupForDomain(driver->cgroup, vm->def->name, &group, 0) != 0) {
        qemuReportError(VIR_ERR_INTERNAL_ERROR,
                        _("cannot find cgroup for domain %s"), vm->def->name);
        goto cleanup;
    }

    for (i = 0; i < *nparams; i++) {
        virMemoryParameterPtr param = &params[i];
        val = 0;
        param->value.ul = 0;
        param->type = VIR_DOMAIN_MEMORY_PARAM_ULLONG;

        switch(i) {
        case 0: /* fill memory hard limit here */
            rc = virCgroupGetMemoryHardLimit(group, &val);
            if (rc != 0) {
                virReportSystemError(-rc, "%s",
                                     _("unable to get memory hard limit"));
7089
                goto cleanup;
7090 7091 7092 7093
            }
            if (virStrcpyStatic(param->field, VIR_DOMAIN_MEMORY_HARD_LIMIT) == NULL) {
                qemuReportError(VIR_ERR_INTERNAL_ERROR,
                                "%s", _("Field memory hard limit too long for destination"));
7094
                goto cleanup;
7095 7096 7097 7098 7099 7100 7101 7102 7103
            }
            param->value.ul = val;
            break;

        case 1: /* fill memory soft limit here */
            rc = virCgroupGetMemorySoftLimit(group, &val);
            if (rc != 0) {
                virReportSystemError(-rc, "%s",
                                     _("unable to get memory soft limit"));
7104
                goto cleanup;
7105 7106 7107 7108
            }
            if (virStrcpyStatic(param->field, VIR_DOMAIN_MEMORY_SOFT_LIMIT) == NULL) {
                qemuReportError(VIR_ERR_INTERNAL_ERROR,
                                "%s", _("Field memory soft limit too long for destination"));
7109
                goto cleanup;
7110 7111 7112 7113 7114 7115 7116 7117 7118
            }
            param->value.ul = val;
            break;

        case 2: /* fill swap hard limit here */
            rc = virCgroupGetSwapHardLimit(group, &val);
            if (rc != 0) {
                virReportSystemError(-rc, "%s",
                                     _("unable to get swap hard limit"));
7119
                goto cleanup;
7120
            }
7121
            if (virStrcpyStatic(param->field, VIR_DOMAIN_MEMORY_SWAP_HARD_LIMIT) == NULL) {
7122 7123
                qemuReportError(VIR_ERR_INTERNAL_ERROR,
                                "%s", _("Field swap hard limit too long for destination"));
7124
                goto cleanup;
7125 7126 7127 7128 7129 7130 7131 7132 7133 7134
            }
            param->value.ul = val;
            break;

        default:
            break;
            /* should not hit here */
        }
    }

7135 7136
    ret = 0;

7137 7138 7139 7140 7141 7142 7143 7144 7145
cleanup:
    if (group)
        virCgroupFree(&group);
    if (vm)
        virDomainObjUnlock(vm);
    qemuDriverUnlock(driver);
    return ret;
}

7146 7147 7148 7149 7150 7151 7152 7153 7154 7155
static int qemuSetSchedulerParameters(virDomainPtr dom,
                                      virSchedParameterPtr params,
                                      int nparams)
{
    struct qemud_driver *driver = dom->conn->privateData;
    int i;
    virCgroupPtr group = NULL;
    virDomainObjPtr vm = NULL;
    int ret = -1;

7156
    qemuDriverLock(driver);
7157
    if (!qemuCgroupControllerActive(driver, VIR_CGROUP_CONTROLLER_CPU)) {
7158 7159
        qemuReportError(VIR_ERR_NO_SUPPORT,
                        __FUNCTION__);
7160
        goto cleanup;
7161 7162 7163 7164 7165
    }

    vm = virDomainFindByUUID(&driver->domains, dom->uuid);

    if (vm == NULL) {
7166 7167
        qemuReportError(VIR_ERR_INTERNAL_ERROR,
                        _("No such domain %s"), dom->uuid);
7168 7169 7170 7171
        goto cleanup;
    }

    if (virCgroupForDomain(driver->cgroup, vm->def->name, &group, 0) != 0) {
7172 7173
        qemuReportError(VIR_ERR_INTERNAL_ERROR,
                        _("cannot find cgroup for domain %s"), vm->def->name);
7174 7175 7176 7177 7178 7179 7180 7181 7182
        goto cleanup;
    }

    for (i = 0; i < nparams; i++) {
        virSchedParameterPtr param = &params[i];

        if (STREQ(param->field, "cpu_shares")) {
            int rc;
            if (param->type != VIR_DOMAIN_SCHED_FIELD_ULLONG) {
7183 7184
                qemuReportError(VIR_ERR_INVALID_ARG, "%s",
                                _("invalid type for cpu_shares tunable, expected a 'ullong'"));
7185 7186 7187 7188 7189
                goto cleanup;
            }

            rc = virCgroupSetCpuShares(group, params[i].value.ul);
            if (rc != 0) {
7190
                virReportSystemError(-rc, "%s",
7191 7192 7193 7194
                                     _("unable to set cpu shares tunable"));
                goto cleanup;
            }
        } else {
7195 7196
            qemuReportError(VIR_ERR_INVALID_ARG,
                            _("Invalid parameter `%s'"), param->field);
7197 7198 7199 7200 7201 7202 7203 7204 7205
            goto cleanup;
        }
    }
    ret = 0;

cleanup:
    virCgroupFree(&group);
    if (vm)
        virDomainObjUnlock(vm);
7206
    qemuDriverUnlock(driver);
7207 7208 7209 7210 7211 7212 7213 7214 7215 7216 7217 7218 7219 7220
    return ret;
}

static int qemuGetSchedulerParameters(virDomainPtr dom,
                                      virSchedParameterPtr params,
                                      int *nparams)
{
    struct qemud_driver *driver = dom->conn->privateData;
    virCgroupPtr group = NULL;
    virDomainObjPtr vm = NULL;
    unsigned long long val;
    int ret = -1;
    int rc;

7221
    qemuDriverLock(driver);
7222
    if (!qemuCgroupControllerActive(driver, VIR_CGROUP_CONTROLLER_CPU)) {
7223 7224
        qemuReportError(VIR_ERR_NO_SUPPORT,
                        __FUNCTION__);
7225
        goto cleanup;
7226 7227 7228
    }

    if ((*nparams) != 1) {
7229 7230
        qemuReportError(VIR_ERR_INVALID_ARG,
                        "%s", _("Invalid parameter count"));
7231
        goto cleanup;
7232 7233 7234 7235 7236
    }

    vm = virDomainFindByUUID(&driver->domains, dom->uuid);

    if (vm == NULL) {
7237 7238
        qemuReportError(VIR_ERR_INTERNAL_ERROR,
                        _("No such domain %s"), dom->uuid);
7239 7240 7241 7242
        goto cleanup;
    }

    if (virCgroupForDomain(driver->cgroup, vm->def->name, &group, 0) != 0) {
7243 7244
        qemuReportError(VIR_ERR_INTERNAL_ERROR,
                        _("cannot find cgroup for domain %s"), vm->def->name);
7245 7246 7247 7248 7249
        goto cleanup;
    }

    rc = virCgroupGetCpuShares(group, &val);
    if (rc != 0) {
7250
        virReportSystemError(-rc, "%s",
7251 7252 7253 7254 7255
                             _("unable to get cpu shares tunable"));
        goto cleanup;
    }
    params[0].value.ul = val;
    params[0].type = VIR_DOMAIN_SCHED_FIELD_ULLONG;
C
Chris Lalancette 已提交
7256
    if (virStrcpyStatic(params[0].field, "cpu_shares") == NULL) {
7257 7258
        qemuReportError(VIR_ERR_INTERNAL_ERROR,
                        "%s", _("Field cpu_shares too long for destination"));
C
Chris Lalancette 已提交
7259 7260
        goto cleanup;
    }
7261 7262 7263 7264 7265 7266 7267

    ret = 0;

cleanup:
    virCgroupFree(&group);
    if (vm)
        virDomainObjUnlock(vm);
7268
    qemuDriverUnlock(driver);
7269 7270 7271 7272
    return ret;
}


7273 7274 7275 7276 7277 7278 7279 7280 7281
/* This uses the 'info blockstats' monitor command which was
 * integrated into both qemu & kvm in late 2007.  If the command is
 * not supported we detect this and return the appropriate error.
 */
static int
qemudDomainBlockStats (virDomainPtr dom,
                       const char *path,
                       struct _virDomainBlockStats *stats)
{
7282
    struct qemud_driver *driver = dom->conn->privateData;
7283
    int i, ret = -1;
7284
    virDomainObjPtr vm;
7285
    virDomainDiskDefPtr disk = NULL;
7286

7287
    qemuDriverLock(driver);
7288
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
7289
    qemuDriverUnlock(driver);
7290
    if (!vm) {
7291 7292
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
7293 7294
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
7295
        goto cleanup;
7296
    }
7297 7298 7299 7300

    if (qemuDomainObjBeginJob(vm) < 0)
        goto cleanup;

D
Daniel P. Berrange 已提交
7301
    if (!virDomainObjIsActive (vm)) {
7302 7303
        qemuReportError(VIR_ERR_OPERATION_INVALID,
                        "%s", _("domain is not running"));
7304
        goto endjob;
7305 7306
    }

7307 7308 7309 7310 7311 7312 7313 7314
    for (i = 0 ; i < vm->def->ndisks ; i++) {
        if (STREQ(path, vm->def->disks[i]->dst)) {
            disk = vm->def->disks[i];
            break;
        }
    }

    if (!disk) {
7315 7316
        qemuReportError(VIR_ERR_INVALID_ARG,
                        _("invalid path: %s"), path);
7317
        goto endjob;
7318 7319
    }

7320
    if (!disk->info.alias) {
7321 7322
        qemuReportError(VIR_ERR_INTERNAL_ERROR,
                        _("missing disk device alias name for %s"), disk->dst);
7323
        goto endjob;
7324
    }
7325

7326
    qemuDomainObjPrivatePtr priv = vm->privateData;
7327 7328
    qemuDomainObjEnterMonitor(vm);
    ret = qemuMonitorGetBlockStatsInfo(priv->mon,
7329
                                       disk->info.alias,
7330 7331 7332 7333 7334 7335
                                       &stats->rd_req,
                                       &stats->rd_bytes,
                                       &stats->wr_req,
                                       &stats->wr_bytes,
                                       &stats->errs);
    qemuDomainObjExitMonitor(vm);
7336

7337
endjob:
7338 7339
    if (qemuDomainObjEndJob(vm) == 0)
        vm = NULL;
7340

7341
cleanup:
7342 7343
    if (vm)
        virDomainObjUnlock(vm);
7344
    return ret;
7345 7346
}

7347
#ifdef __linux__
7348 7349 7350 7351 7352
static int
qemudDomainInterfaceStats (virDomainPtr dom,
                           const char *path,
                           struct _virDomainInterfaceStats *stats)
{
7353 7354
    struct qemud_driver *driver = dom->conn->privateData;
    virDomainObjPtr vm;
7355
    int i;
7356
    int ret = -1;
7357

7358
    qemuDriverLock(driver);
7359
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
7360 7361
    qemuDriverUnlock(driver);

7362
    if (!vm) {
7363 7364
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
7365 7366
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
7367
        goto cleanup;
7368 7369
    }

D
Daniel P. Berrange 已提交
7370
    if (!virDomainObjIsActive(vm)) {
7371 7372
        qemuReportError(VIR_ERR_OPERATION_INVALID,
                        "%s", _("domain is not running"));
7373
        goto cleanup;
7374 7375 7376
    }

    /* Check the path is one of the domain's network interfaces. */
7377 7378
    for (i = 0 ; i < vm->def->nnets ; i++) {
        if (vm->def->nets[i]->ifname &&
7379 7380 7381 7382
            STREQ (vm->def->nets[i]->ifname, path)) {
            ret = 0;
            break;
        }
7383 7384
    }

7385
    if (ret == 0)
7386
        ret = linuxDomainInterfaceStats(path, stats);
7387
    else
7388 7389
        qemuReportError(VIR_ERR_INVALID_ARG,
                        _("invalid path, '%s' is not a known interface"), path);
7390

7391
cleanup:
7392 7393
    if (vm)
        virDomainObjUnlock(vm);
7394 7395
    return ret;
}
7396
#else
7397 7398 7399 7400
static int
qemudDomainInterfaceStats (virDomainPtr dom,
                           const char *path ATTRIBUTE_UNUSED,
                           struct _virDomainInterfaceStats *stats ATTRIBUTE_UNUSED)
7401 7402
    qemuReportError(VIR_ERR_NO_SUPPORT,
                    "%s", __FUNCTION__);
7403 7404
    return -1;
}
7405
#endif
7406

7407 7408 7409 7410 7411 7412 7413 7414 7415 7416 7417 7418 7419 7420 7421 7422
static int
qemudDomainMemoryStats (virDomainPtr dom,
                        struct _virDomainMemoryStat *stats,
                        unsigned int nr_stats)
{
    struct qemud_driver *driver = dom->conn->privateData;
    virDomainObjPtr vm;
    unsigned int ret = -1;

    qemuDriverLock(driver);
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
    qemuDriverUnlock(driver);

    if (!vm) {
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
7423 7424
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
7425 7426 7427
        goto cleanup;
    }

7428 7429 7430
    if (qemuDomainObjBeginJob(vm) < 0)
        goto cleanup;

7431 7432 7433
    if (virDomainObjIsActive(vm)) {
        qemuDomainObjPrivatePtr priv = vm->privateData;
        qemuDomainObjEnterMonitor(vm);
7434
        ret = qemuMonitorGetMemoryStats(priv->mon, stats, nr_stats);
7435 7436
        qemuDomainObjExitMonitor(vm);
    } else {
7437 7438
        qemuReportError(VIR_ERR_OPERATION_INVALID,
                        "%s", _("domain is not running"));
7439 7440
    }

7441 7442 7443
    if (qemuDomainObjEndJob(vm) == 0)
        vm = NULL;

7444 7445 7446 7447 7448 7449
cleanup:
    if (vm)
        virDomainObjUnlock(vm);
    return ret;
}

7450 7451 7452 7453 7454 7455 7456
static int
qemudDomainBlockPeek (virDomainPtr dom,
                      const char *path,
                      unsigned long long offset, size_t size,
                      void *buffer,
                      unsigned int flags ATTRIBUTE_UNUSED)
{
7457 7458 7459
    struct qemud_driver *driver = dom->conn->privateData;
    virDomainObjPtr vm;
    int fd = -1, ret = -1, i;
7460

7461
    qemuDriverLock(driver);
7462
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
7463 7464
    qemuDriverUnlock(driver);

7465
    if (!vm) {
7466 7467
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
7468 7469
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
7470
        goto cleanup;
7471 7472 7473
    }

    if (!path || path[0] == '\0') {
7474 7475
        qemuReportError(VIR_ERR_INVALID_ARG,
                        "%s", _("NULL or empty path"));
7476
        goto cleanup;
7477 7478 7479
    }

    /* Check the path belongs to this domain. */
7480 7481
    for (i = 0 ; i < vm->def->ndisks ; i++) {
        if (vm->def->disks[i]->src != NULL &&
7482 7483 7484 7485
            STREQ (vm->def->disks[i]->src, path)) {
            ret = 0;
            break;
        }
7486 7487
    }

7488 7489 7490 7491 7492
    if (ret == 0) {
        ret = -1;
        /* The path is correct, now try to open it and get its size. */
        fd = open (path, O_RDONLY);
        if (fd == -1) {
7493 7494
            virReportSystemError(errno,
                                 _("%s: failed to open"), path);
7495 7496
            goto cleanup;
        }
7497

7498 7499 7500 7501 7502 7503
        /* Seek and read. */
        /* NB. Because we configure with AC_SYS_LARGEFILE, off_t should
         * be 64 bits on all platforms.
         */
        if (lseek (fd, offset, SEEK_SET) == (off_t) -1 ||
            saferead (fd, buffer, size) == (ssize_t) -1) {
7504 7505
            virReportSystemError(errno,
                                 _("%s: failed to seek or read"), path);
7506 7507 7508 7509 7510
            goto cleanup;
        }

        ret = 0;
    } else {
7511 7512
        qemuReportError(VIR_ERR_INVALID_ARG,
                        "%s", _("invalid path"));
7513 7514
    }

7515
cleanup:
7516
    VIR_FORCE_CLOSE(fd);
7517 7518
    if (vm)
        virDomainObjUnlock(vm);
7519 7520 7521
    return ret;
}

R
Richard W.M. Jones 已提交
7522 7523 7524 7525 7526 7527
static int
qemudDomainMemoryPeek (virDomainPtr dom,
                       unsigned long long offset, size_t size,
                       void *buffer,
                       unsigned int flags)
{
7528 7529
    struct qemud_driver *driver = dom->conn->privateData;
    virDomainObjPtr vm;
7530
    char *tmp = NULL;
R
Richard W.M. Jones 已提交
7531 7532
    int fd = -1, ret = -1;

7533
    qemuDriverLock(driver);
7534
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
7535
    qemuDriverUnlock(driver);
R
Richard W.M. Jones 已提交
7536 7537

    if (!vm) {
7538 7539
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
7540 7541
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
7542 7543 7544
        goto cleanup;
    }

7545
    if (flags != VIR_MEMORY_VIRTUAL && flags != VIR_MEMORY_PHYSICAL) {
7546 7547
        qemuReportError(VIR_ERR_INVALID_ARG,
                        "%s", _("flags parameter must be VIR_MEMORY_VIRTUAL or VIR_MEMORY_PHYSICAL"));
7548
        goto cleanup;
R
Richard W.M. Jones 已提交
7549 7550
    }

7551 7552 7553
    if (qemuDomainObjBeginJob(vm) < 0)
        goto cleanup;

D
Daniel P. Berrange 已提交
7554
    if (!virDomainObjIsActive(vm)) {
7555 7556
        qemuReportError(VIR_ERR_OPERATION_INVALID,
                        "%s", _("domain is not running"));
7557
        goto endjob;
R
Richard W.M. Jones 已提交
7558 7559
    }

7560
    if (virAsprintf(&tmp, "%s/qemu.mem.XXXXXX", driver->cacheDir) < 0) {
7561
        virReportOOMError();
7562
        goto endjob;
7563 7564
    }

R
Richard W.M. Jones 已提交
7565 7566
    /* Create a temporary filename. */
    if ((fd = mkstemp (tmp)) == -1) {
7567 7568
        virReportSystemError(errno,
                             _("mkstemp(\"%s\") failed"), tmp);
7569
        goto endjob;
R
Richard W.M. Jones 已提交
7570 7571
    }

7572
    qemuDomainObjPrivatePtr priv = vm->privateData;
7573
    qemuDomainObjEnterMonitor(vm);
7574
    if (flags == VIR_MEMORY_VIRTUAL) {
7575 7576
        if (qemuMonitorSaveVirtualMemory(priv->mon, offset, size, tmp) < 0) {
            qemuDomainObjExitMonitor(vm);
7577
            goto endjob;
7578
        }
7579
    } else {
7580 7581
        if (qemuMonitorSavePhysicalMemory(priv->mon, offset, size, tmp) < 0) {
            qemuDomainObjExitMonitor(vm);
7582
            goto endjob;
7583
        }
R
Richard W.M. Jones 已提交
7584
    }
7585
    qemuDomainObjExitMonitor(vm);
R
Richard W.M. Jones 已提交
7586 7587 7588

    /* Read the memory file into buffer. */
    if (saferead (fd, buffer, size) == (ssize_t) -1) {
7589 7590 7591
        virReportSystemError(errno,
                             _("failed to read temporary file "
                               "created with template %s"), tmp);
7592
        goto endjob;
R
Richard W.M. Jones 已提交
7593 7594 7595
    }

    ret = 0;
7596

7597
endjob:
7598 7599
    if (qemuDomainObjEndJob(vm) == 0)
        vm = NULL;
7600

7601
cleanup:
7602
    VIR_FREE(tmp);
7603
    VIR_FORCE_CLOSE(fd);
R
Richard W.M. Jones 已提交
7604
    unlink (tmp);
7605 7606
    if (vm)
        virDomainObjUnlock(vm);
R
Richard W.M. Jones 已提交
7607 7608 7609
    return ret;
}

7610

7611 7612 7613 7614 7615 7616 7617 7618 7619 7620
static int qemuDomainGetBlockInfo(virDomainPtr dom,
                                  const char *path,
                                  virDomainBlockInfoPtr info,
                                  unsigned int flags) {
    struct qemud_driver *driver = dom->conn->privateData;
    virDomainObjPtr vm;
    int ret = -1;
    int fd = -1;
    off_t end;
    virStorageFileMetadata meta;
7621
    virDomainDiskDefPtr disk = NULL;
7622 7623
    struct stat sb;
    int i;
7624
    int format;
7625 7626 7627 7628 7629 7630 7631 7632 7633 7634 7635 7636 7637 7638 7639 7640 7641 7642 7643 7644 7645 7646 7647 7648

    virCheckFlags(0, -1);

    qemuDriverLock(driver);
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
    qemuDriverUnlock(driver);
    if (!vm) {
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
        goto cleanup;
    }

    if (!path || path[0] == '\0') {
        qemuReportError(VIR_ERR_INVALID_ARG,
                        "%s", _("NULL or empty path"));
        goto cleanup;
    }

    /* Check the path belongs to this domain. */
    for (i = 0 ; i < vm->def->ndisks ; i++) {
        if (vm->def->disks[i]->src != NULL &&
            STREQ (vm->def->disks[i]->src, path)) {
7649
            disk = vm->def->disks[i];
7650 7651 7652 7653
            break;
        }
    }

7654
    if (!disk) {
7655 7656 7657 7658 7659 7660 7661 7662 7663 7664 7665 7666 7667 7668
        qemuReportError(VIR_ERR_INVALID_ARG,
                        _("invalid path %s not assigned to domain"), path);
        goto cleanup;
    }

    /* The path is correct, now try to open it and get its size. */
    fd = open (path, O_RDONLY);
    if (fd == -1) {
        virReportSystemError(errno,
                             _("failed to open path '%s'"), path);
        goto cleanup;
    }

    /* Probe for magic formats */
7669 7670 7671 7672 7673 7674 7675 7676
    if (disk->driverType) {
        if ((format = virStorageFileFormatTypeFromString(disk->driverType)) < 0) {
            qemuReportError(VIR_ERR_INTERNAL_ERROR,
                            _("unknown disk format %s for %s"),
                            disk->driverType, disk->src);
            goto cleanup;
        }
    } else {
7677 7678 7679 7680 7681 7682 7683
        if (driver->allowDiskFormatProbing) {
            if ((format = virStorageFileProbeFormat(disk->src)) < 0)
                goto cleanup;
        } else {
            qemuReportError(VIR_ERR_INTERNAL_ERROR,
                            _("no disk format for %s and probing is disabled"),
                            disk->src);
7684
            goto cleanup;
7685
        }
7686 7687 7688 7689 7690
    }

    if (virStorageFileGetMetadataFromFD(path, fd,
                                        format,
                                        &meta) < 0)
7691 7692 7693 7694 7695 7696 7697 7698 7699 7700
        goto cleanup;

    /* Get info for normal formats */
    if (fstat(fd, &sb) < 0) {
        virReportSystemError(errno,
                             _("cannot stat file '%s'"), path);
        goto cleanup;
    }

    if (S_ISREG(sb.st_mode)) {
7701
#ifndef WIN32
7702 7703 7704 7705 7706 7707 7708 7709 7710 7711 7712 7713 7714 7715 7716 7717 7718 7719 7720 7721 7722 7723 7724 7725 7726 7727 7728 7729
        info->physical = (unsigned long long)sb.st_blocks *
            (unsigned long long)DEV_BSIZE;
#else
        info->physical = sb.st_size;
#endif
        /* Regular files may be sparse, so logical size (capacity) is not same
         * as actual physical above
         */
        info->capacity = sb.st_size;
    } else {
        /* NB. Because we configure with AC_SYS_LARGEFILE, off_t should
         * be 64 bits on all platforms.
         */
        end = lseek (fd, 0, SEEK_END);
        if (end == (off_t)-1) {
            virReportSystemError(errno,
                                 _("failed to seek to end of %s"), path);
            goto cleanup;
        }
        info->physical = end;
        info->capacity = end;
    }

    /* If the file we probed has a capacity set, then override
     * what we calculated from file/block extents */
    if (meta.capacity)
        info->capacity = meta.capacity;

7730
    /* Set default value .. */
7731 7732
    info->allocation = info->physical;

7733 7734 7735
    /* ..but if guest is running & not using raw
       disk format and on a block device, then query
       highest allocated extent from QEMU */
7736
    if (disk->type == VIR_DOMAIN_DISK_TYPE_BLOCK &&
7737
        format != VIR_STORAGE_FILE_RAW &&
7738 7739 7740 7741
        S_ISBLK(sb.st_mode)) {
        qemuDomainObjPrivatePtr priv = vm->privateData;
        if (qemuDomainObjBeginJob(vm) < 0)
            goto cleanup;
7742 7743 7744 7745 7746 7747 7748 7749 7750
        if (!virDomainObjIsActive(vm))
            ret = 0;
        else {
            qemuDomainObjEnterMonitor(vm);
            ret = qemuMonitorGetBlockExtent(priv->mon,
                                            disk->info.alias,
                                            &info->allocation);
            qemuDomainObjExitMonitor(vm);
        }
7751 7752 7753 7754 7755 7756

        if (qemuDomainObjEndJob(vm) == 0)
            vm = NULL;
    } else {
        ret = 0;
    }
7757 7758

cleanup:
7759
    VIR_FORCE_CLOSE(fd);
7760 7761 7762 7763 7764 7765
    if (vm)
        virDomainObjUnlock(vm);
    return ret;
}


7766
static int
7767 7768 7769 7770
qemuDomainEventRegister(virConnectPtr conn,
                        virConnectDomainEventCallback callback,
                        void *opaque,
                        virFreeCallback freecb)
7771
{
7772 7773 7774
    struct qemud_driver *driver = conn->privateData;
    int ret;

7775
    qemuDriverLock(driver);
7776 7777
    ret = virDomainEventCallbackListAdd(conn, driver->domainEventCallbacks,
                                        callback, opaque, freecb);
7778
    qemuDriverUnlock(driver);
7779

7780
    return ret;
7781 7782
}

7783

7784
static int
7785 7786
qemuDomainEventDeregister(virConnectPtr conn,
                          virConnectDomainEventCallback callback)
7787
{
7788 7789 7790
    struct qemud_driver *driver = conn->privateData;
    int ret;

7791
    qemuDriverLock(driver);
7792 7793 7794 7795 7796 7797
    if (driver->domainEventDispatching)
        ret = virDomainEventCallbackListMarkDelete(conn, driver->domainEventCallbacks,
                                                   callback);
    else
        ret = virDomainEventCallbackListRemove(conn, driver->domainEventCallbacks,
                                               callback);
7798
    qemuDriverUnlock(driver);
7799

7800
    return ret;
7801 7802
}

7803 7804 7805 7806 7807 7808 7809 7810 7811 7812 7813 7814 7815 7816 7817 7818 7819 7820 7821 7822 7823 7824 7825 7826 7827 7828 7829 7830 7831 7832 7833 7834 7835 7836 7837 7838 7839 7840 7841 7842 7843 7844 7845

static int
qemuDomainEventRegisterAny(virConnectPtr conn,
                           virDomainPtr dom,
                           int eventID,
                           virConnectDomainEventGenericCallback callback,
                           void *opaque,
                           virFreeCallback freecb)
{
    struct qemud_driver *driver = conn->privateData;
    int ret;

    qemuDriverLock(driver);
    ret = virDomainEventCallbackListAddID(conn,
                                          driver->domainEventCallbacks,
                                          dom, eventID,
                                          callback, opaque, freecb);
    qemuDriverUnlock(driver);

    return ret;
}


static int
qemuDomainEventDeregisterAny(virConnectPtr conn,
                             int callbackID)
{
    struct qemud_driver *driver = conn->privateData;
    int ret;

    qemuDriverLock(driver);
    if (driver->domainEventDispatching)
        ret = virDomainEventCallbackListMarkDeleteID(conn, driver->domainEventCallbacks,
                                                     callbackID);
    else
        ret = virDomainEventCallbackListRemoveID(conn, driver->domainEventCallbacks,
                                                 callbackID);
    qemuDriverUnlock(driver);

    return ret;
}


7846 7847
static void qemuDomainEventDispatchFunc(virConnectPtr conn,
                                        virDomainEventPtr event,
7848
                                        virConnectDomainEventGenericCallback cb,
7849 7850
                                        void *cbopaque,
                                        void *opaque)
7851
{
7852
    struct qemud_driver *driver = opaque;
7853

7854 7855 7856 7857 7858 7859 7860 7861 7862 7863 7864 7865 7866 7867 7868 7869 7870 7871 7872 7873 7874 7875 7876 7877 7878 7879 7880 7881 7882 7883 7884 7885 7886 7887 7888 7889 7890 7891 7892 7893 7894 7895 7896 7897
    /* Drop the lock whle dispatching, for sake of re-entrancy */
    qemuDriverUnlock(driver);
    virDomainEventDispatchDefaultFunc(conn, event, cb, cbopaque, NULL);
    qemuDriverLock(driver);
}

static void qemuDomainEventFlush(int timer ATTRIBUTE_UNUSED, void *opaque)
{
    struct qemud_driver *driver = opaque;
    virDomainEventQueue tempQueue;

    qemuDriverLock(driver);

    driver->domainEventDispatching = 1;

    /* Copy the queue, so we're reentrant safe */
    tempQueue.count = driver->domainEventQueue->count;
    tempQueue.events = driver->domainEventQueue->events;
    driver->domainEventQueue->count = 0;
    driver->domainEventQueue->events = NULL;

    virEventUpdateTimeout(driver->domainEventTimer, -1);
    virDomainEventQueueDispatch(&tempQueue,
                                driver->domainEventCallbacks,
                                qemuDomainEventDispatchFunc,
                                driver);

    /* Purge any deleted callbacks */
    virDomainEventCallbackListPurgeMarked(driver->domainEventCallbacks);

    driver->domainEventDispatching = 0;
    qemuDriverUnlock(driver);
}


/* driver must be locked before calling */
static void qemuDomainEventQueue(struct qemud_driver *driver,
                                 virDomainEventPtr event)
{
    if (virDomainEventQueuePush(driver->domainEventQueue,
                                event) < 0)
        virDomainEventFree(event);
    if (qemu_driver->domainEventQueue->count == 1)
        virEventUpdateTimeout(driver->domainEventTimer, 0);
7898 7899
}

D
Daniel Veillard 已提交
7900 7901
/* Migration support. */

7902 7903 7904 7905 7906
static bool ATTRIBUTE_NONNULL(1)
qemuDomainIsMigratable(virDomainDefPtr def)
{
    if (def->nhostdevs > 0) {
        qemuReportError(VIR_ERR_OPERATION_INVALID,
7907
            "%s", _("Domain with assigned host devices cannot be migrated"));
7908 7909 7910 7911 7912 7913
        return false;
    }

    return true;
}

C
Chris Lalancette 已提交
7914 7915 7916 7917 7918 7919 7920 7921 7922 7923 7924 7925 7926 7927 7928 7929 7930 7931 7932 7933 7934
/* Prepare is the first step, and it runs on the destination host.
 *
 * This version starts an empty VM listening on a localhost TCP port, and
 * sets up the corresponding virStream to handle the incoming data.
 */
static int
qemudDomainMigratePrepareTunnel(virConnectPtr dconn,
                                virStreamPtr st,
                                unsigned long flags,
                                const char *dname,
                                unsigned long resource ATTRIBUTE_UNUSED,
                                const char *dom_xml)
{
    struct qemud_driver *driver = dconn->privateData;
    virDomainDefPtr def = NULL;
    virDomainObjPtr vm = NULL;
    char *migrateFrom;
    virDomainEventPtr event = NULL;
    int ret = -1;
    int internalret;
    char *unixfile = NULL;
7935
    unsigned long long qemuCmdFlags;
7936 7937 7938 7939 7940 7941 7942 7943
    qemuDomainObjPrivatePtr priv = NULL;
    struct timeval now;

    if (gettimeofday(&now, NULL) < 0) {
        virReportSystemError(errno, "%s",
                             _("cannot get time of day"));
        return -1;
    }
C
Chris Lalancette 已提交
7944 7945 7946

    qemuDriverLock(driver);
    if (!dom_xml) {
7947 7948
        qemuReportError(VIR_ERR_INTERNAL_ERROR,
                        "%s", _("no domain XML passed"));
C
Chris Lalancette 已提交
7949 7950 7951
        goto cleanup;
    }
    if (!(flags & VIR_MIGRATE_TUNNELLED)) {
7952
        qemuReportError(VIR_ERR_INTERNAL_ERROR,
C
Chris Lalancette 已提交
7953 7954 7955 7956
                         "%s", _("PrepareTunnel called but no TUNNELLED flag set"));
        goto cleanup;
    }
    if (st == NULL) {
7957 7958
        qemuReportError(VIR_ERR_INTERNAL_ERROR,
                        "%s", _("tunnelled migration requested but NULL stream passed"));
C
Chris Lalancette 已提交
7959 7960 7961 7962
        goto cleanup;
    }

    /* Parse the domain XML. */
7963
    if (!(def = virDomainDefParseString(driver->caps, dom_xml,
C
Chris Lalancette 已提交
7964
                                        VIR_DOMAIN_XML_INACTIVE))) {
7965 7966
        qemuReportError(VIR_ERR_OPERATION_FAILED,
                        "%s", _("failed to parse XML"));
C
Chris Lalancette 已提交
7967 7968 7969
        goto cleanup;
    }

7970 7971 7972
    if (!qemuDomainIsMigratable(def))
        goto cleanup;

C
Chris Lalancette 已提交
7973
    /* Target domain name, maybe renamed. */
7974 7975 7976 7977 7978 7979
    if (dname) {
        VIR_FREE(def->name);
        def->name = strdup(dname);
        if (def->name == NULL)
            goto cleanup;
    }
C
Chris Lalancette 已提交
7980

7981 7982
    if (virDomainObjIsDuplicate(&driver->domains, def, 1) < 0)
        goto cleanup;
C
Chris Lalancette 已提交
7983

7984
    if (!(vm = virDomainAssignDef(driver->caps,
C
Chris Lalancette 已提交
7985
                                  &driver->domains,
7986
                                  def, true))) {
7987
        /* virDomainAssignDef already set the error */
C
Chris Lalancette 已提交
7988 7989 7990
        goto cleanup;
    }
    def = NULL;
7991
    priv = vm->privateData;
C
Chris Lalancette 已提交
7992

7993 7994
    if (qemuDomainObjBeginJobWithDriver(driver, vm) < 0)
        goto cleanup;
7995
    priv->jobActive = QEMU_JOB_MIGRATION_OUT;
7996

C
Chris Lalancette 已提交
7997 7998 7999 8000
    /* Domain starts inactive, even if the domain XML had an id field. */
    vm->def->id = -1;

    if (virAsprintf(&unixfile, "%s/qemu.tunnelmigrate.dest.%s",
8001
                    driver->libDir, vm->def->name) < 0) {
8002
        virReportOOMError();
8003
        goto endjob;
C
Chris Lalancette 已提交
8004 8005 8006 8007
    }
    unlink(unixfile);

    /* check that this qemu version supports the interactive exec */
8008
    if (qemuCapsExtractVersionInfo(vm->def->emulator, NULL, &qemuCmdFlags) < 0) {
8009 8010 8011
        qemuReportError(VIR_ERR_INTERNAL_ERROR,
                        _("Cannot determine QEMU argv syntax %s"),
                        vm->def->emulator);
8012
        goto endjob;
C
Chris Lalancette 已提交
8013 8014 8015 8016 8017 8018
    }
    if (qemuCmdFlags & QEMUD_CMD_FLAG_MIGRATE_QEMU_UNIX)
        internalret = virAsprintf(&migrateFrom, "unix:%s", unixfile);
    else if (qemuCmdFlags & QEMUD_CMD_FLAG_MIGRATE_QEMU_EXEC)
        internalret = virAsprintf(&migrateFrom, "exec:nc -U -l %s", unixfile);
    else {
8019 8020
        qemuReportError(VIR_ERR_OPERATION_FAILED,
                        "%s", _("Destination qemu is too old to support tunnelled migration"));
8021
        goto endjob;
C
Chris Lalancette 已提交
8022 8023
    }
    if (internalret < 0) {
8024
        virReportOOMError();
8025
        goto endjob;
C
Chris Lalancette 已提交
8026 8027 8028 8029
    }
    /* Start the QEMU daemon, with the same command-line arguments plus
     * -incoming unix:/path/to/file or exec:nc -U /path/to/file
     */
8030
    internalret = qemudStartVMDaemon(dconn, driver, vm, migrateFrom, true,
8031
                                     -1, NULL, VIR_VM_OP_MIGRATE_IN_START);
C
Chris Lalancette 已提交
8032 8033
    VIR_FREE(migrateFrom);
    if (internalret < 0) {
8034
        qemuDomainStartAudit(vm, "migrated", false);
C
Chris Lalancette 已提交
8035 8036 8037 8038 8039 8040 8041
        /* Note that we don't set an error here because qemudStartVMDaemon
         * should have already done that.
         */
        if (!vm->persistent) {
            virDomainRemoveInactive(&driver->domains, vm);
            vm = NULL;
        }
8042
        goto endjob;
C
Chris Lalancette 已提交
8043 8044
    }

8045 8046 8047
    if (virFDStreamConnectUNIX(st,
                               unixfile,
                               false) < 0) {
8048
        qemuDomainStartAudit(vm, "migrated", false);
8049
        qemudShutdownVMDaemon(driver, vm, 0);
8050
        if (!vm->persistent) {
8051 8052
            if (qemuDomainObjEndJob(vm) > 0)
                virDomainRemoveInactive(&driver->domains, vm);
8053 8054
            vm = NULL;
        }
8055
        virReportSystemError(errno,
C
Chris Lalancette 已提交
8056 8057
                             _("cannot open unix socket '%s' for tunnelled migration"),
                             unixfile);
8058
        goto endjob;
C
Chris Lalancette 已提交
8059 8060
    }

8061
    qemuDomainStartAudit(vm, "migrated", true);
8062

C
Chris Lalancette 已提交
8063 8064 8065 8066 8067
    event = virDomainEventNewFromObj(vm,
                                     VIR_DOMAIN_EVENT_STARTED,
                                     VIR_DOMAIN_EVENT_STARTED_MIGRATED);
    ret = 0;

8068
endjob:
8069 8070 8071
    if (vm &&
        qemuDomainObjEndJob(vm) == 0)
        vm = NULL;
8072

8073 8074 8075 8076 8077 8078 8079 8080 8081
    /* We set a fake job active which is held across
     * API calls until the finish() call. This prevents
     * any other APIs being invoked while incoming
     * migration is taking place
     */
    if (vm &&
        virDomainObjIsActive(vm)) {
        priv->jobActive = QEMU_JOB_MIGRATION_IN;
        priv->jobInfo.type = VIR_DOMAIN_JOB_UNBOUNDED;
8082
        priv->jobStart = timeval_to_ms(now);
8083 8084
    }

C
Chris Lalancette 已提交
8085 8086
cleanup:
    virDomainDefFree(def);
8087 8088
    if (unixfile)
        unlink(unixfile);
C
Chris Lalancette 已提交
8089 8090 8091 8092 8093 8094 8095 8096 8097
    VIR_FREE(unixfile);
    if (vm)
        virDomainObjUnlock(vm);
    if (event)
        qemuDomainEventQueue(driver, event);
    qemuDriverUnlock(driver);
    return ret;
}

D
Daniel Veillard 已提交
8098 8099 8100 8101
/* Prepare is the first step, and it runs on the destination host.
 *
 * This starts an empty VM listening on a TCP port.
 */
8102
static int ATTRIBUTE_NONNULL (5)
D
Daniel Veillard 已提交
8103 8104 8105 8106 8107
qemudDomainMigratePrepare2 (virConnectPtr dconn,
                            char **cookie ATTRIBUTE_UNUSED,
                            int *cookielen ATTRIBUTE_UNUSED,
                            const char *uri_in,
                            char **uri_out,
C
Chris Lalancette 已提交
8108
                            unsigned long flags,
D
Daniel Veillard 已提交
8109 8110 8111 8112 8113
                            const char *dname,
                            unsigned long resource ATTRIBUTE_UNUSED,
                            const char *dom_xml)
{
    static int port = 0;
8114 8115
    struct qemud_driver *driver = dconn->privateData;
    virDomainDefPtr def = NULL;
D
Daniel Veillard 已提交
8116 8117
    virDomainObjPtr vm = NULL;
    int this_port;
C
Chris Lalancette 已提交
8118
    char *hostname = NULL;
D
Daniel Veillard 已提交
8119 8120
    char migrateFrom [64];
    const char *p;
8121
    virDomainEventPtr event = NULL;
8122
    int ret = -1;
8123
    int internalret;
8124 8125 8126 8127 8128 8129 8130 8131
    qemuDomainObjPrivatePtr priv = NULL;
    struct timeval now;

    if (gettimeofday(&now, NULL) < 0) {
        virReportSystemError(errno, "%s",
                             _("cannot get time of day"));
        return -1;
    }
8132

C
Chris Lalancette 已提交
8133 8134 8135 8136 8137 8138 8139 8140 8141
    virCheckFlags(VIR_MIGRATE_LIVE |
                  VIR_MIGRATE_PEER2PEER |
                  VIR_MIGRATE_TUNNELLED |
                  VIR_MIGRATE_PERSIST_DEST |
                  VIR_MIGRATE_UNDEFINE_SOURCE |
                  VIR_MIGRATE_PAUSED |
                  VIR_MIGRATE_NON_SHARED_DISK |
                  VIR_MIGRATE_NON_SHARED_INC, -1);

8142
    *uri_out = NULL;
D
Daniel Veillard 已提交
8143

8144
    qemuDriverLock(driver);
C
Chris Lalancette 已提交
8145 8146 8147 8148
    if (flags & VIR_MIGRATE_TUNNELLED) {
        /* this is a logical error; we never should have gotten here with
         * VIR_MIGRATE_TUNNELLED set
         */
8149 8150
        qemuReportError(VIR_ERR_INTERNAL_ERROR,
                        "%s", _("Tunnelled migration requested but invalid RPC method called"));
C
Chris Lalancette 已提交
8151 8152 8153
        goto cleanup;
    }

D
Daniel Veillard 已提交
8154
    if (!dom_xml) {
8155 8156
        qemuReportError(VIR_ERR_INTERNAL_ERROR,
                        "%s", _("no domain XML passed"));
8157
        goto cleanup;
D
Daniel Veillard 已提交
8158 8159 8160 8161 8162 8163 8164 8165 8166 8167 8168 8169 8170 8171 8172 8173 8174
    }

    /* The URI passed in may be NULL or a string "tcp://somehostname:port".
     *
     * If the URI passed in is NULL then we allocate a port number
     * from our pool of port numbers and return a URI of
     * "tcp://ourhostname:port".
     *
     * If the URI passed in is not NULL then we try to parse out the
     * port number and use that (note that the hostname is assumed
     * to be a correct hostname which refers to the target machine).
     */
    if (uri_in == NULL) {
        this_port = QEMUD_MIGRATION_FIRST_PORT + port++;
        if (port == QEMUD_MIGRATION_NUM_PORTS) port = 0;

        /* Get hostname */
C
Chris Lalancette 已提交
8175
        if ((hostname = virGetHostname(NULL)) == NULL)
8176
            goto cleanup;
D
Daniel Veillard 已提交
8177

C
Chris Lalancette 已提交
8178 8179 8180 8181 8182 8183
        if (STRPREFIX(hostname, "localhost")) {
            qemuReportError(VIR_ERR_INTERNAL_ERROR, "%s",
                            _("hostname on destination resolved to localhost, but migration requires an FQDN"));
            goto cleanup;
        }

8184 8185 8186 8187 8188
        /* XXX this really should have been a properly well-formed
         * URI, but we can't add in tcp:// now without breaking
         * compatability with old targets. We at least make the
         * new targets accept both syntaxes though.
         */
D
Daniel Veillard 已提交
8189
        /* Caller frees */
8190 8191
        internalret = virAsprintf(uri_out, "tcp:%s:%d", hostname, this_port);
        if (internalret < 0) {
8192
            virReportOOMError();
8193
            goto cleanup;
D
Daniel Veillard 已提交
8194 8195 8196 8197 8198 8199
        }
    } else {
        /* Check the URI starts with "tcp:".  We will escape the
         * URI when passing it to the qemu monitor, so bad
         * characters in hostname part don't matter.
         */
8200
        if (!STRPREFIX (uri_in, "tcp:")) {
8201 8202
            qemuReportError (VIR_ERR_INVALID_ARG,
                             "%s", _("only tcp URIs are supported for KVM/QEMU migrations"));
8203
            goto cleanup;
D
Daniel Veillard 已提交
8204 8205 8206 8207
        }

        /* Get the port number. */
        p = strrchr (uri_in, ':');
8208 8209 8210 8211 8212 8213 8214 8215
        if (p == strchr(uri_in, ':')) {
            /* Generate a port */
            this_port = QEMUD_MIGRATION_FIRST_PORT + port++;
            if (port == QEMUD_MIGRATION_NUM_PORTS)
                port = 0;

            /* Caller frees */
            if (virAsprintf(uri_out, "%s:%d", uri_in, this_port) < 0) {
8216
                virReportOOMError();
8217 8218 8219 8220 8221 8222 8223
                goto cleanup;
            }

        } else {
            p++; /* definitely has a ':' in it, see above */
            this_port = virParseNumber (&p);
            if (this_port == -1 || p-uri_in != strlen (uri_in)) {
8224 8225
                qemuReportError(VIR_ERR_INVALID_ARG,
                                "%s", _("URI ended with incorrect ':port'"));
8226 8227
                goto cleanup;
            }
D
Daniel Veillard 已提交
8228 8229 8230
        }
    }

8231
    if (*uri_out)
8232 8233
        VIR_DEBUG("Generated uri_out=%s", *uri_out);

D
Daniel Veillard 已提交
8234
    /* Parse the domain XML. */
8235
    if (!(def = virDomainDefParseString(driver->caps, dom_xml,
8236
                                        VIR_DOMAIN_XML_INACTIVE))) {
8237 8238
        qemuReportError(VIR_ERR_OPERATION_FAILED,
                        "%s", _("failed to parse XML"));
8239
        goto cleanup;
D
Daniel Veillard 已提交
8240 8241
    }

8242 8243 8244
    if (!qemuDomainIsMigratable(def))
        goto cleanup;

D
Daniel Veillard 已提交
8245
    /* Target domain name, maybe renamed. */
8246 8247 8248 8249 8250 8251
    if (dname) {
        VIR_FREE(def->name);
        def->name = strdup(dname);
        if (def->name == NULL)
            goto cleanup;
    }
D
Daniel Veillard 已提交
8252

8253 8254
    if (virDomainObjIsDuplicate(&driver->domains, def, 1) < 0)
        goto cleanup;
D
Daniel Veillard 已提交
8255

8256
    if (!(vm = virDomainAssignDef(driver->caps,
D
Daniel Veillard 已提交
8257
                                  &driver->domains,
8258
                                  def, true))) {
8259
        /* virDomainAssignDef already set the error */
8260
        goto cleanup;
D
Daniel Veillard 已提交
8261
    }
8262
    def = NULL;
8263
    priv = vm->privateData;
D
Daniel Veillard 已提交
8264

8265 8266
    if (qemuDomainObjBeginJobWithDriver(driver, vm) < 0)
        goto cleanup;
8267
    priv->jobActive = QEMU_JOB_MIGRATION_OUT;
8268

D
Daniel Veillard 已提交
8269 8270 8271 8272 8273 8274 8275
    /* Domain starts inactive, even if the domain XML had an id field. */
    vm->def->id = -1;

    /* Start the QEMU daemon, with the same command-line arguments plus
     * -incoming tcp:0.0.0.0:port
     */
    snprintf (migrateFrom, sizeof (migrateFrom), "tcp:0.0.0.0:%d", this_port);
8276
    if (qemudStartVMDaemon (dconn, driver, vm, migrateFrom, true,
8277
                            -1, NULL, VIR_VM_OP_MIGRATE_IN_START) < 0) {
8278
        qemuDomainStartAudit(vm, "migrated", false);
8279 8280 8281
        /* Note that we don't set an error here because qemudStartVMDaemon
         * should have already done that.
         */
8282
        if (!vm->persistent) {
8283 8284
            if (qemuDomainObjEndJob(vm) > 0)
                virDomainRemoveInactive(&driver->domains, vm);
8285 8286
            vm = NULL;
        }
8287
        goto endjob;
D
Daniel Veillard 已提交
8288
    }
8289

8290
    qemuDomainStartAudit(vm, "migrated", true);
8291 8292 8293
    event = virDomainEventNewFromObj(vm,
                                     VIR_DOMAIN_EVENT_STARTED,
                                     VIR_DOMAIN_EVENT_STARTED_MIGRATED);
8294
    ret = 0;
D
Daniel Veillard 已提交
8295

8296
endjob:
8297 8298 8299
    if (vm &&
        qemuDomainObjEndJob(vm) == 0)
        vm = NULL;
8300

8301 8302 8303 8304 8305 8306 8307 8308 8309
    /* We set a fake job active which is held across
     * API calls until the finish() call. This prevents
     * any other APIs being invoked while incoming
     * migration is taking place
     */
    if (vm &&
        virDomainObjIsActive(vm)) {
        priv->jobActive = QEMU_JOB_MIGRATION_IN;
        priv->jobInfo.type = VIR_DOMAIN_JOB_UNBOUNDED;
8310
        priv->jobStart = timeval_to_ms(now);
8311 8312
    }

8313
cleanup:
C
Chris Lalancette 已提交
8314
    VIR_FREE(hostname);
8315
    virDomainDefFree(def);
C
Chris Lalancette 已提交
8316
    if (ret != 0)
8317
        VIR_FREE(*uri_out);
8318 8319
    if (vm)
        virDomainObjUnlock(vm);
8320 8321
    if (event)
        qemuDomainEventQueue(driver, event);
8322
    qemuDriverUnlock(driver);
8323
    return ret;
C
Chris Lalancette 已提交
8324 8325 8326

}

8327 8328 8329 8330

/* Perform migration using QEMU's native TCP migrate support,
 * not encrypted obviously
 */
8331
static int doNativeMigrate(struct qemud_driver *driver,
8332 8333
                           virDomainObjPtr vm,
                           const char *uri,
8334
                           unsigned int flags,
8335 8336 8337 8338
                           const char *dname ATTRIBUTE_UNUSED,
                           unsigned long resource)
{
    int ret = -1;
8339
    xmlURIPtr uribits = NULL;
8340
    qemuDomainObjPrivatePtr priv = vm->privateData;
8341
    unsigned int background_flags = QEMU_MONITOR_MIGRATE_BACKGROUND;
8342

8343 8344 8345 8346 8347
    /* Issue the migrate command. */
    if (STRPREFIX(uri, "tcp:") && !STRPREFIX(uri, "tcp://")) {
        /* HACK: source host generates bogus URIs, so fix them up */
        char *tmpuri;
        if (virAsprintf(&tmpuri, "tcp://%s", uri + strlen("tcp:")) < 0) {
8348
            virReportOOMError();
8349 8350 8351 8352 8353 8354 8355 8356
            goto cleanup;
        }
        uribits = xmlParseURI(tmpuri);
        VIR_FREE(tmpuri);
    } else {
        uribits = xmlParseURI(uri);
    }
    if (!uribits) {
8357 8358
        qemuReportError(VIR_ERR_INTERNAL_ERROR,
                        _("cannot parse URI %s"), uri);
8359 8360 8361
        goto cleanup;
    }

8362
    qemuDomainObjEnterMonitorWithDriver(driver, vm);
8363
    if (resource > 0 &&
8364
        qemuMonitorSetMigrationSpeed(priv->mon, resource) < 0) {
8365
        qemuDomainObjExitMonitorWithDriver(driver, vm);
8366
        goto cleanup;
8367
    }
8368

8369 8370 8371 8372 8373 8374 8375 8376
    if (flags & VIR_MIGRATE_NON_SHARED_DISK)
        background_flags |= QEMU_MONITOR_MIGRATE_NON_SHARED_DISK;

    if (flags & VIR_MIGRATE_NON_SHARED_INC)
        background_flags |= QEMU_MONITOR_MIGRATE_NON_SHARED_INC;

    if (qemuMonitorMigrateToHost(priv->mon, background_flags, uribits->server,
                                 uribits->port) < 0) {
8377
        qemuDomainObjExitMonitorWithDriver(driver, vm);
8378 8379
        goto cleanup;
    }
8380
    qemuDomainObjExitMonitorWithDriver(driver, vm);
8381

8382
    if (qemuDomainWaitForMigrationComplete(driver, vm) < 0)
8383 8384 8385 8386 8387 8388 8389 8390 8391 8392
        goto cleanup;

    ret = 0;

cleanup:
    xmlFreeURI(uribits);
    return ret;
}


8393 8394
#define TUNNEL_SEND_BUF_SIZE 65536

8395
static int doTunnelSendAll(virStreamPtr st,
8396 8397
                           int sock)
{
8398 8399 8400 8401 8402 8403 8404 8405
    char *buffer;
    int nbytes = TUNNEL_SEND_BUF_SIZE;

    if (VIR_ALLOC_N(buffer, TUNNEL_SEND_BUF_SIZE) < 0) {
        virReportOOMError();
        virStreamAbort(st);
        return -1;
    }
8406 8407 8408 8409 8410

    /* XXX should honour the 'resource' parameter here */
    for (;;) {
        nbytes = saferead(sock, buffer, nbytes);
        if (nbytes < 0) {
8411
            virReportSystemError(errno, "%s",
8412
                                 _("tunnelled migration failed to read from qemu"));
8413 8414
            virStreamAbort(st);
            VIR_FREE(buffer);
8415 8416 8417 8418 8419 8420 8421
            return -1;
        }
        else if (nbytes == 0)
            /* EOF; get out of here */
            break;

        if (virStreamSend(st, buffer, nbytes) < 0) {
8422 8423
            qemuReportError(VIR_ERR_OPERATION_FAILED, "%s",
                            _("Failed to write migration data to remote libvirtd"));
8424
            VIR_FREE(buffer);
8425 8426 8427 8428
            return -1;
        }
    }

8429 8430
    VIR_FREE(buffer);

8431 8432 8433 8434 8435 8436 8437
    if (virStreamFinish(st) < 0)
        /* virStreamFinish set the error for us */
        return -1;

    return 0;
}

C
Chris Lalancette 已提交
8438
static int doTunnelMigrate(virDomainPtr dom,
8439
                           struct qemud_driver *driver,
8440
                           virConnectPtr dconn,
C
Chris Lalancette 已提交
8441
                           virDomainObjPtr vm,
8442
                           const char *dom_xml,
C
Chris Lalancette 已提交
8443 8444 8445 8446 8447
                           const char *uri,
                           unsigned long flags,
                           const char *dname,
                           unsigned long resource)
{
8448
    qemuDomainObjPrivatePtr priv = vm->privateData;
8449 8450
    int client_sock = -1;
    int qemu_sock = -1;
C
Chris Lalancette 已提交
8451 8452
    struct sockaddr_un sa_qemu, sa_client;
    socklen_t addrlen;
8453
    virDomainPtr ddomain = NULL;
C
Chris Lalancette 已提交
8454
    int retval = -1;
8455
    virStreamPtr st = NULL;
C
Chris Lalancette 已提交
8456 8457
    char *unixfile = NULL;
    int internalret;
8458
    unsigned long long qemuCmdFlags;
C
Chris Lalancette 已提交
8459 8460
    int status;
    unsigned long long transferred, remaining, total;
8461
    unsigned int background_flags = QEMU_MONITOR_MIGRATE_BACKGROUND;
C
Chris Lalancette 已提交
8462

8463 8464 8465 8466 8467 8468 8469 8470
    /*
     * The order of operations is important here to avoid touching
     * the source VM until we are very sure we can successfully
     * start the migration operation.
     *
     *   1. setup local support infrastructure (eg sockets)
     *   2. setup destination fully
     *   3. start migration on source
C
Chris Lalancette 已提交
8471 8472
     */

8473

8474
    /* Stage 1. setup local support infrastructure */
C
Chris Lalancette 已提交
8475 8476

    if (virAsprintf(&unixfile, "%s/qemu.tunnelmigrate.src.%s",
8477
                    driver->libDir, vm->def->name) < 0) {
8478
        virReportOOMError();
8479
        goto cleanup;
C
Chris Lalancette 已提交
8480 8481 8482 8483
    }

    qemu_sock = socket(AF_UNIX, SOCK_STREAM, 0);
    if (qemu_sock < 0) {
8484
        virReportSystemError(errno, "%s",
C
Chris Lalancette 已提交
8485
                             _("cannot open tunnelled migration socket"));
8486
        goto cleanup;
C
Chris Lalancette 已提交
8487 8488 8489 8490 8491
    }
    memset(&sa_qemu, 0, sizeof(sa_qemu));
    sa_qemu.sun_family = AF_UNIX;
    if (virStrcpy(sa_qemu.sun_path, unixfile,
                  sizeof(sa_qemu.sun_path)) == NULL) {
8492 8493 8494
        qemuReportError(VIR_ERR_INTERNAL_ERROR,
                        _("Unix socket '%s' too big for destination"),
                        unixfile);
8495
        goto cleanup;
C
Chris Lalancette 已提交
8496 8497 8498
    }
    unlink(unixfile);
    if (bind(qemu_sock, (struct sockaddr *)&sa_qemu, sizeof(sa_qemu)) < 0) {
8499
        virReportSystemError(errno,
C
Chris Lalancette 已提交
8500 8501
                             _("Cannot bind to unix socket '%s' for tunnelled migration"),
                             unixfile);
8502
        goto cleanup;
C
Chris Lalancette 已提交
8503 8504
    }
    if (listen(qemu_sock, 1) < 0) {
8505
        virReportSystemError(errno,
C
Chris Lalancette 已提交
8506 8507
                             _("Cannot listen on unix socket '%s' for tunnelled migration"),
                             unixfile);
8508
        goto cleanup;
C
Chris Lalancette 已提交
8509 8510
    }

8511 8512 8513 8514 8515 8516 8517
    if (chown(unixfile, qemu_driver->user, qemu_driver->group) < 0) {
        virReportSystemError(errno,
                             _("Cannot change unix socket '%s' owner"),
                             unixfile);
        goto cleanup;
    }

C
Chris Lalancette 已提交
8518
    /* check that this qemu version supports the unix migration */
8519
    if (qemuCapsExtractVersionInfo(vm->def->emulator, NULL, &qemuCmdFlags) < 0) {
8520 8521 8522
        qemuReportError(VIR_ERR_INTERNAL_ERROR,
                        _("Cannot extract Qemu version from '%s'"),
                        vm->def->emulator);
8523 8524 8525 8526 8527
        goto cleanup;
    }

    if (!(qemuCmdFlags & QEMUD_CMD_FLAG_MIGRATE_QEMU_UNIX) &&
        !(qemuCmdFlags & QEMUD_CMD_FLAG_MIGRATE_QEMU_EXEC)) {
8528 8529
        qemuReportError(VIR_ERR_OPERATION_FAILED,
                        "%s", _("Source qemu is too old to support tunnelled migration"));
8530
        goto cleanup;
C
Chris Lalancette 已提交
8531
    }
8532 8533 8534 8535 8536 8537 8538 8539 8540 8541 8542 8543


    /* Stage 2. setup destination fully
     *
     * Once stage 2 has completed successfully, we *must* call finish
     * to cleanup the target whether we succeed or fail
     */
    st = virStreamNew(dconn, 0);
    if (st == NULL)
        /* virStreamNew only fails on OOM, and it reports the error itself */
        goto cleanup;

8544
    qemuDomainObjEnterRemoteWithDriver(driver, vm);
8545 8546 8547
    internalret = dconn->driver->domainMigratePrepareTunnel(dconn, st,
                                                            flags, dname,
                                                            resource, dom_xml);
8548
    qemuDomainObjExitRemoteWithDriver(driver, vm);
8549 8550 8551 8552 8553

    if (internalret < 0)
        /* domainMigratePrepareTunnel sets the error for us */
        goto cleanup;

8554 8555 8556 8557 8558 8559 8560 8561 8562
    /* the domain may have shutdown or crashed while we had the locks dropped
     * in qemuDomainObjEnterRemoteWithDriver, so check again
     */
    if (!virDomainObjIsActive(vm)) {
        qemuReportError(VIR_ERR_INTERNAL_ERROR, "%s",
                        _("guest unexpectedly quit"));
        goto cleanup;
    }

8563
    /*   3. start migration on source */
8564
    qemuDomainObjEnterMonitorWithDriver(driver, vm);
8565 8566 8567 8568 8569 8570 8571 8572
    if (flags & VIR_MIGRATE_NON_SHARED_DISK)
        background_flags |= QEMU_MONITOR_MIGRATE_NON_SHARED_DISK;
    if (flags & VIR_MIGRATE_NON_SHARED_INC)
        background_flags |= QEMU_MONITOR_MIGRATE_NON_SHARED_INC;
    if (qemuCmdFlags & QEMUD_CMD_FLAG_MIGRATE_QEMU_UNIX){
        internalret = qemuMonitorMigrateToUnix(priv->mon, background_flags,
                                               unixfile);
    }
C
Chris Lalancette 已提交
8573 8574
    else if (qemuCmdFlags & QEMUD_CMD_FLAG_MIGRATE_QEMU_EXEC) {
        const char *args[] = { "nc", "-U", unixfile, NULL };
8575
        internalret = qemuMonitorMigrateToCommand(priv->mon, QEMU_MONITOR_MIGRATE_BACKGROUND, args);
8576 8577
    } else {
        internalret = -1;
C
Chris Lalancette 已提交
8578
    }
8579
    qemuDomainObjExitMonitorWithDriver(driver, vm);
C
Chris Lalancette 已提交
8580
    if (internalret < 0) {
8581 8582
        qemuReportError(VIR_ERR_OPERATION_FAILED,
                        "%s", _("tunnelled migration monitor command failed"));
8583
        goto finish;
C
Chris Lalancette 已提交
8584 8585
    }

8586 8587 8588 8589 8590 8591
    if (!virDomainObjIsActive(vm)) {
        qemuReportError(VIR_ERR_INTERNAL_ERROR, "%s",
                        _("guest unexpectedly quit"));
        goto cleanup;
    }

8592 8593 8594
    /* From this point onwards we *must* call cancel to abort the
     * migration on source if anything goes wrong */

C
Chris Lalancette 已提交
8595 8596 8597
    /* it is also possible that the migrate didn't fail initially, but
     * rather failed later on.  Check the output of "info migrate"
     */
8598
    qemuDomainObjEnterMonitorWithDriver(driver, vm);
8599 8600
    if (qemuMonitorGetMigrationStatus(priv->mon,
                                      &status,
C
Chris Lalancette 已提交
8601 8602 8603
                                      &transferred,
                                      &remaining,
                                      &total) < 0) {
8604
        qemuDomainObjExitMonitorWithDriver(driver, vm);
8605
        goto cancel;
C
Chris Lalancette 已提交
8606
    }
8607
    qemuDomainObjExitMonitorWithDriver(driver, vm);
C
Chris Lalancette 已提交
8608 8609

    if (status == QEMU_MONITOR_MIGRATION_STATUS_ERROR) {
8610 8611
        qemuReportError(VIR_ERR_OPERATION_FAILED,
                        "%s",_("migrate failed"));
8612
        goto cancel;
C
Chris Lalancette 已提交
8613 8614 8615 8616 8617 8618
    }

    addrlen = sizeof(sa_client);
    while ((client_sock = accept(qemu_sock, (struct sockaddr *)&sa_client, &addrlen)) < 0) {
        if (errno == EAGAIN || errno == EINTR)
            continue;
8619
        virReportSystemError(errno, "%s",
C
Chris Lalancette 已提交
8620
                             _("tunnelled migration failed to accept from qemu"));
8621
        goto cancel;
C
Chris Lalancette 已提交
8622 8623
    }

8624
    retval = doTunnelSendAll(st, client_sock);
8625

8626
cancel:
8627
    if (retval != 0 && virDomainObjIsActive(vm)) {
8628
        qemuDomainObjEnterMonitorWithDriver(driver, vm);
8629
        qemuMonitorMigrateCancel(priv->mon);
8630
        qemuDomainObjExitMonitorWithDriver(driver, vm);
8631
    }
C
Chris Lalancette 已提交
8632

8633
finish:
C
Chris Lalancette 已提交
8634
    dname = dname ? dname : dom->name;
8635
    qemuDomainObjEnterRemoteWithDriver(driver, vm);
C
Chris Lalancette 已提交
8636 8637
    ddomain = dconn->driver->domainMigrateFinish2
        (dconn, dname, NULL, 0, uri, flags, retval);
8638
    qemuDomainObjExitRemoteWithDriver(driver, vm);
8639 8640

cleanup:
8641 8642
    VIR_FORCE_CLOSE(client_sock);
    VIR_FORCE_CLOSE(qemu_sock);
8643

C
Chris Lalancette 已提交
8644 8645 8646
    if (ddomain)
        virUnrefDomain(ddomain);

8647 8648 8649 8650
    if (unixfile) {
        unlink(unixfile);
        VIR_FREE(unixfile);
    }
C
Chris Lalancette 已提交
8651

8652 8653 8654
    if (st)
        /* don't call virStreamFree(), because that resets any pending errors */
        virUnrefStream(st);
8655 8656 8657 8658
    return retval;
}


8659 8660 8661 8662
/* This is essentially a simplified re-impl of
 * virDomainMigrateVersion2 from libvirt.c, but running in source
 * libvirtd context, instead of client app context */
static int doNonTunnelMigrate(virDomainPtr dom,
8663
                              struct qemud_driver *driver,
8664 8665 8666 8667 8668 8669 8670 8671 8672 8673 8674
                              virConnectPtr dconn,
                              virDomainObjPtr vm,
                              const char *dom_xml,
                              const char *uri ATTRIBUTE_UNUSED,
                              unsigned long flags,
                              const char *dname,
                              unsigned long resource)
{
    virDomainPtr ddomain = NULL;
    int retval = -1;
    char *uri_out = NULL;
8675
    int rc;
8676

8677
    qemuDomainObjEnterRemoteWithDriver(driver, vm);
8678 8679
    /* NB we don't pass 'uri' into this, since that's the libvirtd
     * URI in this context - so we let dest pick it */
8680 8681 8682 8683 8684 8685 8686 8687 8688
    rc = dconn->driver->domainMigratePrepare2(dconn,
                                              NULL, /* cookie */
                                              0, /* cookielen */
                                              NULL, /* uri */
                                              &uri_out,
                                              flags, dname,
                                              resource, dom_xml);
    qemuDomainObjExitRemoteWithDriver(driver, vm);
    if (rc < 0)
8689 8690 8691
        /* domainMigratePrepare2 sets the error for us */
        goto cleanup;

8692 8693 8694 8695 8696 8697 8698 8699 8700
    /* the domain may have shutdown or crashed while we had the locks dropped
     * in qemuDomainObjEnterRemoteWithDriver, so check again
     */
    if (!virDomainObjIsActive(vm)) {
        qemuReportError(VIR_ERR_INTERNAL_ERROR, "%s",
                        _("guest unexpectedly quit"));
        goto cleanup;
    }

8701
    if (uri_out == NULL) {
8702 8703
        qemuReportError(VIR_ERR_INTERNAL_ERROR, "%s",
                        _("domainMigratePrepare2 did not set uri"));
8704
        goto cleanup;
8705 8706
    }

8707
    if (doNativeMigrate(driver, vm, uri_out, flags, dname, resource) < 0)
8708 8709 8710 8711 8712 8713
        goto finish;

    retval = 0;

finish:
    dname = dname ? dname : dom->name;
8714
    qemuDomainObjEnterRemoteWithDriver(driver, vm);
8715 8716
    ddomain = dconn->driver->domainMigrateFinish2
        (dconn, dname, NULL, 0, uri_out, flags, retval);
8717
    qemuDomainObjExitRemoteWithDriver(driver, vm);
8718 8719 8720 8721 8722 8723 8724 8725 8726

    if (ddomain)
        virUnrefDomain(ddomain);

cleanup:
    return retval;
}


8727
static int doPeer2PeerMigrate(virDomainPtr dom,
8728
                              struct qemud_driver *driver,
8729 8730 8731 8732 8733 8734 8735 8736 8737
                              virDomainObjPtr vm,
                              const char *uri,
                              unsigned long flags,
                              const char *dname,
                              unsigned long resource)
{
    int ret = -1;
    virConnectPtr dconn = NULL;
    char *dom_xml;
8738
    bool p2p;
8739 8740 8741 8742 8743

    /* the order of operations is important here; we make sure the
     * destination side is completely setup before we touch the source
     */

8744
    qemuDomainObjEnterRemoteWithDriver(driver, vm);
8745
    dconn = virConnectOpen(uri);
8746
    qemuDomainObjExitRemoteWithDriver(driver, vm);
8747
    if (dconn == NULL) {
8748 8749
        qemuReportError(VIR_ERR_OPERATION_FAILED,
                        _("Failed to connect to remote libvirt URI %s"), uri);
8750 8751
        return -1;
    }
8752 8753 8754 8755 8756 8757

    qemuDomainObjEnterRemoteWithDriver(driver, vm);
    p2p = VIR_DRV_SUPPORTS_FEATURE(dconn->driver, dconn,
                                   VIR_DRV_FEATURE_MIGRATION_P2P);
    qemuDomainObjExitRemoteWithDriver(driver, vm);
    if (!p2p) {
8758 8759
        qemuReportError(VIR_ERR_OPERATION_FAILED, "%s",
                        _("Destination libvirt does not support peer-to-peer migration protocol"));
8760 8761 8762
        goto cleanup;
    }

8763 8764 8765 8766 8767 8768 8769
    /* domain may have been stopped while we were talking to remote daemon */
    if (!virDomainObjIsActive(vm)) {
        qemuReportError(VIR_ERR_INTERNAL_ERROR, "%s",
                        _("guest unexpectedly quit"));
        goto cleanup;
    }

8770 8771 8772
    dom_xml = qemudVMDumpXML(driver, vm,
                             VIR_DOMAIN_XML_SECURE |
                             VIR_DOMAIN_XML_UPDATE_CPU);
8773
    if (!dom_xml) {
8774 8775
        qemuReportError(VIR_ERR_OPERATION_FAILED,
                        "%s", _("failed to get domain xml"));
8776 8777 8778
        goto cleanup;
    }

8779
    if (flags & VIR_MIGRATE_TUNNELLED)
8780
        ret = doTunnelMigrate(dom, driver, dconn, vm, dom_xml, uri, flags, dname, resource);
8781
    else
8782
        ret = doNonTunnelMigrate(dom, driver, dconn, vm, dom_xml, uri, flags, dname, resource);
8783 8784 8785

cleanup:
    VIR_FREE(dom_xml);
C
Chris Lalancette 已提交
8786 8787 8788
    /* don't call virConnectClose(), because that resets any pending errors */
    virUnrefConnect(dconn);

8789
    return ret;
D
Daniel Veillard 已提交
8790 8791
}

8792

D
Daniel Veillard 已提交
8793 8794 8795 8796 8797 8798
/* Perform is the second step, and it runs on the source host. */
static int
qemudDomainMigratePerform (virDomainPtr dom,
                           const char *cookie ATTRIBUTE_UNUSED,
                           int cookielen ATTRIBUTE_UNUSED,
                           const char *uri,
8799
                           unsigned long flags,
8800
                           const char *dname,
D
Daniel Veillard 已提交
8801 8802
                           unsigned long resource)
{
8803 8804
    struct qemud_driver *driver = dom->conn->privateData;
    virDomainObjPtr vm;
8805
    virDomainEventPtr event = NULL;
8806
    int ret = -1;
8807
    int resume = 0;
8808
    qemuDomainObjPrivatePtr priv;
D
Daniel Veillard 已提交
8809

C
Chris Lalancette 已提交
8810 8811 8812 8813 8814 8815 8816 8817 8818
    virCheckFlags(VIR_MIGRATE_LIVE |
                  VIR_MIGRATE_PEER2PEER |
                  VIR_MIGRATE_TUNNELLED |
                  VIR_MIGRATE_PERSIST_DEST |
                  VIR_MIGRATE_UNDEFINE_SOURCE |
                  VIR_MIGRATE_PAUSED |
                  VIR_MIGRATE_NON_SHARED_DISK |
                  VIR_MIGRATE_NON_SHARED_INC, -1);

8819
    qemuDriverLock(driver);
8820
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
D
Daniel Veillard 已提交
8821
    if (!vm) {
8822 8823
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
8824 8825
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
8826
        goto cleanup;
D
Daniel Veillard 已提交
8827
    }
8828
    priv = vm->privateData;
D
Daniel Veillard 已提交
8829

8830 8831
    if (qemuDomainObjBeginJobWithDriver(driver, vm) < 0)
        goto cleanup;
8832
    priv->jobActive = QEMU_JOB_MIGRATION_OUT;
8833

D
Daniel P. Berrange 已提交
8834
    if (!virDomainObjIsActive(vm)) {
8835 8836
        qemuReportError(VIR_ERR_OPERATION_INVALID,
                        "%s", _("domain is not running"));
8837
        goto endjob;
D
Daniel Veillard 已提交
8838 8839
    }

8840 8841 8842
    memset(&priv->jobInfo, 0, sizeof(priv->jobInfo));
    priv->jobInfo.type = VIR_DOMAIN_JOB_UNBOUNDED;

8843
    resume = vm->state == VIR_DOMAIN_RUNNING;
8844
    if (!(flags & VIR_MIGRATE_LIVE) && vm->state == VIR_DOMAIN_RUNNING) {
8845
        if (qemuDomainMigrateOffline(driver, vm) < 0)
8846
            goto endjob;
8847 8848
    }

8849
    if ((flags & (VIR_MIGRATE_TUNNELLED | VIR_MIGRATE_PEER2PEER))) {
8850
        if (doPeer2PeerMigrate(dom, driver, vm, uri, flags, dname, resource) < 0)
8851
            /* doPeer2PeerMigrate already set the error, so just get out */
8852
            goto endjob;
8853
    } else {
8854
        if (doNativeMigrate(driver, vm, uri, flags, dname, resource) < 0)
8855
            goto endjob;
8856 8857
    }

D
Daniel Veillard 已提交
8858
    /* Clean up the source domain. */
8859
    qemudShutdownVMDaemon(driver, vm, 1);
8860
    qemuDomainStopAudit(vm, "migrated");
8861
    resume = 0;
8862 8863 8864 8865

    event = virDomainEventNewFromObj(vm,
                                     VIR_DOMAIN_EVENT_STOPPED,
                                     VIR_DOMAIN_EVENT_STOPPED_MIGRATED);
C
Chris Lalancette 已提交
8866
    if (!vm->persistent || (flags & VIR_MIGRATE_UNDEFINE_SOURCE)) {
8867
        virDomainDeleteConfig(driver->configDir, driver->autostartDir, vm);
8868 8869
        if (qemuDomainObjEndJob(vm) > 0)
            virDomainRemoveInactive(&driver->domains, vm);
8870 8871
        vm = NULL;
    }
8872
    ret = 0;
D
Daniel Veillard 已提交
8873

8874
endjob:
8875
    if (resume && vm->state == VIR_DOMAIN_PAUSED) {
8876
        /* we got here through some sort of failure; start the domain again */
H
Hu Tao 已提交
8877
        if (doStartCPUs(driver, vm, dom->conn) < 0) {
8878 8879 8880 8881
            /* Hm, we already know we are in error here.  We don't want to
             * overwrite the previous error, though, so we just throw something
             * to the logs and hope for the best
             */
8882
            VIR_ERROR(_("Failed to resume guest %s after failure"),
8883
                      vm->def->name);
8884 8885 8886 8887 8888 8889
        }

        event = virDomainEventNewFromObj(vm,
                                         VIR_DOMAIN_EVENT_RESUMED,
                                         VIR_DOMAIN_EVENT_RESUMED_MIGRATED);
    }
8890 8891 8892
    if (vm &&
        qemuDomainObjEndJob(vm) == 0)
        vm = NULL;
8893

8894
cleanup:
8895 8896
    if (vm)
        virDomainObjUnlock(vm);
8897 8898
    if (event)
        qemuDomainEventQueue(driver, event);
8899
    qemuDriverUnlock(driver);
8900
    return ret;
D
Daniel Veillard 已提交
8901 8902
}

8903
#if WITH_MACVTAP
8904 8905 8906 8907 8908 8909 8910 8911 8912 8913 8914 8915 8916 8917 8918 8919 8920 8921 8922 8923 8924 8925 8926 8927 8928 8929 8930 8931 8932 8933 8934 8935 8936 8937
static void
qemudVPAssociatePortProfiles(virDomainDefPtr def) {
    int i;
    int last_good_net = -1;
    virDomainNetDefPtr net;

    for (i = 0; i < def->nnets; i++) {
        net = def->nets[i];
        if (net->type == VIR_DOMAIN_NET_TYPE_DIRECT) {
            if (vpAssociatePortProfileId(net->ifname,
                                         net->mac,
                                         net->data.direct.linkdev,
                                         &net->data.direct.virtPortProfile,
                                         def->uuid,
                                         VIR_VM_OP_MIGRATE_IN_FINISH) != 0)
                goto err_exit;
        }
        last_good_net = i;
    }

    return;

err_exit:
    for (i = 0; i < last_good_net; i++) {
        net = def->nets[i];
        if (net->type == VIR_DOMAIN_NET_TYPE_DIRECT) {
            vpDisassociatePortProfileId(net->ifname,
                                        net->mac,
                                        net->data.direct.linkdev,
                                        &net->data.direct.virtPortProfile,
                                        VIR_VM_OP_MIGRATE_IN_FINISH);
        }
    }
}
8938 8939 8940 8941
#else /* !WITH_MACVTAP */
static void
qemudVPAssociatePortProfiles(virDomainDefPtr def ATTRIBUTE_UNUSED) { }
#endif /* WITH_MACVTAP */
8942

D
Daniel Veillard 已提交
8943 8944 8945 8946 8947 8948 8949
/* Finish is the third and final step, and it runs on the destination host. */
static virDomainPtr
qemudDomainMigrateFinish2 (virConnectPtr dconn,
                           const char *dname,
                           const char *cookie ATTRIBUTE_UNUSED,
                           int cookielen ATTRIBUTE_UNUSED,
                           const char *uri ATTRIBUTE_UNUSED,
C
Chris Lalancette 已提交
8950
                           unsigned long flags,
D
Daniel Veillard 已提交
8951 8952
                           int retcode)
{
8953 8954 8955
    struct qemud_driver *driver = dconn->privateData;
    virDomainObjPtr vm;
    virDomainPtr dom = NULL;
8956
    virDomainEventPtr event = NULL;
8957
    virErrorPtr orig_err;
C
Chris Lalancette 已提交
8958
    int newVM = 1;
8959
    qemuDomainObjPrivatePtr priv = NULL;
D
Daniel Veillard 已提交
8960

C
Chris Lalancette 已提交
8961 8962 8963 8964 8965 8966 8967 8968 8969
    virCheckFlags(VIR_MIGRATE_LIVE |
                  VIR_MIGRATE_PEER2PEER |
                  VIR_MIGRATE_TUNNELLED |
                  VIR_MIGRATE_PERSIST_DEST |
                  VIR_MIGRATE_UNDEFINE_SOURCE |
                  VIR_MIGRATE_PAUSED |
                  VIR_MIGRATE_NON_SHARED_DISK |
                  VIR_MIGRATE_NON_SHARED_INC, NULL);

8970 8971 8972
    /* Migration failed. Save the current error so nothing squashes it */
    orig_err = virSaveLastError();

8973
    qemuDriverLock(driver);
8974
    vm = virDomainFindByName(&driver->domains, dname);
D
Daniel Veillard 已提交
8975
    if (!vm) {
8976 8977
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching name '%s'"), dname);
8978
        goto cleanup;
D
Daniel Veillard 已提交
8979 8980
    }

8981 8982 8983 8984 8985 8986 8987 8988 8989
    priv = vm->privateData;
    if (priv->jobActive != QEMU_JOB_MIGRATION_IN) {
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("domain '%s' is not processing incoming migration"), dname);
        goto cleanup;
    }
    priv->jobActive = QEMU_JOB_NONE;
    memset(&priv->jobInfo, 0, sizeof(priv->jobInfo));

8990 8991 8992
    if (qemuDomainObjBeginJobWithDriver(driver, vm) < 0)
        goto cleanup;

D
Daniel Veillard 已提交
8993 8994 8995 8996
    /* Did the migration go as planned?  If yes, return the domain
     * object, but if no, clean up the empty qemu process.
     */
    if (retcode == 0) {
8997 8998 8999 9000 9001 9002
        if (!virDomainObjIsActive(vm)) {
            qemuReportError(VIR_ERR_INTERNAL_ERROR, "%s",
                            _("guest unexpectedly quit"));
            goto cleanup;
        }

9003 9004
        qemudVPAssociatePortProfiles(vm->def);

C
Chris Lalancette 已提交
9005 9006 9007 9008 9009
        if (flags & VIR_MIGRATE_PERSIST_DEST) {
            if (vm->persistent)
                newVM = 0;
            vm->persistent = 1;

9010
            if (virDomainSaveConfig(driver->configDir, vm->def) < 0) {
C
Chris Lalancette 已提交
9011 9012 9013 9014 9015 9016 9017 9018 9019 9020
                /* Hmpf.  Migration was successful, but making it persistent
                 * was not.  If we report successful, then when this domain
                 * shuts down, management tools are in for a surprise.  On the
                 * other hand, if we report failure, then the management tools
                 * might try to restart the domain on the source side, even
                 * though the domain is actually running on the destination.
                 * Return a NULL dom pointer, and hope that this is a rare
                 * situation and management tools are smart.
                 */
                vm = NULL;
9021
                goto endjob;
C
Chris Lalancette 已提交
9022 9023 9024 9025 9026 9027 9028 9029 9030
            }

            event = virDomainEventNewFromObj(vm,
                                             VIR_DOMAIN_EVENT_DEFINED,
                                             newVM ?
                                             VIR_DOMAIN_EVENT_DEFINED_ADDED :
                                             VIR_DOMAIN_EVENT_DEFINED_UPDATED);
            if (event)
                qemuDomainEventQueue(driver, event);
9031
            event = NULL;
C
Chris Lalancette 已提交
9032 9033

        }
D
Daniel Veillard 已提交
9034
        dom = virGetDomain (dconn, vm->def->name, vm->def->uuid);
9035

9036 9037 9038 9039 9040
        if (!(flags & VIR_MIGRATE_PAUSED)) {
            /* run 'cont' on the destination, which allows migration on qemu
             * >= 0.10.6 to work properly.  This isn't strictly necessary on
             * older qemu's, but it also doesn't hurt anything there
             */
H
Hu Tao 已提交
9041
            if (doStartCPUs(driver, vm, dconn) < 0) {
9042
                if (virGetLastError() == NULL)
9043 9044
                    qemuReportError(VIR_ERR_INTERNAL_ERROR,
                                    "%s", _("resume operation failed"));
9045 9046
                goto endjob;
            }
9047 9048
        }

9049 9050 9051
        event = virDomainEventNewFromObj(vm,
                                         VIR_DOMAIN_EVENT_RESUMED,
                                         VIR_DOMAIN_EVENT_RESUMED_MIGRATED);
9052 9053 9054 9055 9056 9057
        if (vm->state == VIR_DOMAIN_PAUSED) {
            qemuDomainEventQueue(driver, event);
            event = virDomainEventNewFromObj(vm,
                                             VIR_DOMAIN_EVENT_SUSPENDED,
                                             VIR_DOMAIN_EVENT_SUSPENDED_PAUSED);
        }
9058 9059 9060 9061
        if (virDomainSaveStatus(driver->caps, driver->stateDir, vm) < 0) {
            VIR_WARN("Failed to save status on vm %s", vm->def->name);
            goto endjob;
        }
D
Daniel Veillard 已提交
9062
    } else {
9063
        qemudShutdownVMDaemon(driver, vm, 1);
9064
        qemuDomainStopAudit(vm, "failed");
9065 9066 9067
        event = virDomainEventNewFromObj(vm,
                                         VIR_DOMAIN_EVENT_STOPPED,
                                         VIR_DOMAIN_EVENT_STOPPED_FAILED);
9068
        if (!vm->persistent) {
9069 9070
            if (qemuDomainObjEndJob(vm) > 0)
                virDomainRemoveInactive(&driver->domains, vm);
9071 9072
            vm = NULL;
        }
D
Daniel Veillard 已提交
9073
    }
9074

9075
endjob:
9076 9077 9078
    if (vm &&
        qemuDomainObjEndJob(vm) == 0)
        vm = NULL;
9079

9080
cleanup:
9081 9082 9083 9084
    if (orig_err) {
        virSetError(orig_err);
        virFreeError(orig_err);
    }
9085 9086
    if (vm)
        virDomainObjUnlock(vm);
9087 9088
    if (event)
        qemuDomainEventQueue(driver, event);
9089
    qemuDriverUnlock(driver);
9090
    return dom;
D
Daniel Veillard 已提交
9091 9092
}

9093 9094 9095 9096 9097 9098 9099 9100 9101 9102 9103 9104 9105 9106 9107 9108
static int
qemudNodeDeviceGetPciInfo (virNodeDevicePtr dev,
                           unsigned *domain,
                           unsigned *bus,
                           unsigned *slot,
                           unsigned *function)
{
    virNodeDeviceDefPtr def = NULL;
    virNodeDevCapsDefPtr cap;
    char *xml = NULL;
    int ret = -1;

    xml = virNodeDeviceGetXMLDesc(dev, 0);
    if (!xml)
        goto out;

9109
    def = virNodeDeviceDefParseString(xml, EXISTING_DEVICE);
9110 9111 9112 9113 9114 9115 9116 9117 9118 9119 9120 9121 9122 9123 9124 9125 9126
    if (!def)
        goto out;

    cap = def->caps;
    while (cap) {
        if (cap->type == VIR_NODE_DEV_CAP_PCI_DEV) {
            *domain   = cap->data.pci_dev.domain;
            *bus      = cap->data.pci_dev.bus;
            *slot     = cap->data.pci_dev.slot;
            *function = cap->data.pci_dev.function;
            break;
        }

        cap = cap->next;
    }

    if (!cap) {
9127 9128
        qemuReportError(VIR_ERR_INVALID_ARG,
                        _("device %s is not a PCI device"), dev->name);
9129 9130 9131 9132 9133 9134 9135 9136 9137 9138 9139 9140 9141
        goto out;
    }

    ret = 0;
out:
    virNodeDeviceDefFree(def);
    VIR_FREE(xml);
    return ret;
}

static int
qemudNodeDeviceDettach (virNodeDevicePtr dev)
{
9142
    struct qemud_driver *driver = dev->conn->privateData;
9143 9144 9145 9146 9147 9148 9149
    pciDevice *pci;
    unsigned domain, bus, slot, function;
    int ret = -1;

    if (qemudNodeDeviceGetPciInfo(dev, &domain, &bus, &slot, &function) < 0)
        return -1;

9150
    pci = pciGetDevice(domain, bus, slot, function);
9151 9152 9153
    if (!pci)
        return -1;

9154 9155
    qemuDriverLock(driver);
    if (pciDettachDevice(pci, driver->activePciHostdevs) < 0)
9156 9157 9158 9159
        goto out;

    ret = 0;
out:
9160
    qemuDriverUnlock(driver);
9161
    pciFreeDevice(pci);
9162 9163 9164 9165 9166 9167
    return ret;
}

static int
qemudNodeDeviceReAttach (virNodeDevicePtr dev)
{
9168
    struct qemud_driver *driver = dev->conn->privateData;
9169 9170 9171 9172 9173 9174 9175
    pciDevice *pci;
    unsigned domain, bus, slot, function;
    int ret = -1;

    if (qemudNodeDeviceGetPciInfo(dev, &domain, &bus, &slot, &function) < 0)
        return -1;

9176
    pci = pciGetDevice(domain, bus, slot, function);
9177 9178 9179
    if (!pci)
        return -1;

9180 9181
    qemuDriverLock(driver);
    if (pciReAttachDevice(pci, driver->activePciHostdevs) < 0)
9182 9183 9184 9185
        goto out;

    ret = 0;
out:
9186
    qemuDriverUnlock(driver);
9187
    pciFreeDevice(pci);
9188 9189 9190 9191 9192 9193
    return ret;
}

static int
qemudNodeDeviceReset (virNodeDevicePtr dev)
{
9194
    struct qemud_driver *driver = dev->conn->privateData;
9195 9196 9197 9198 9199 9200 9201
    pciDevice *pci;
    unsigned domain, bus, slot, function;
    int ret = -1;

    if (qemudNodeDeviceGetPciInfo(dev, &domain, &bus, &slot, &function) < 0)
        return -1;

9202
    pci = pciGetDevice(domain, bus, slot, function);
9203 9204 9205
    if (!pci)
        return -1;

9206 9207
    qemuDriverLock(driver);

9208
    if (pciResetDevice(pci, driver->activePciHostdevs, NULL) < 0)
9209 9210 9211 9212
        goto out;

    ret = 0;
out:
9213
    qemuDriverUnlock(driver);
9214
    pciFreeDevice(pci);
9215 9216 9217
    return ret;
}

9218 9219 9220 9221 9222 9223 9224 9225 9226 9227 9228
static int
qemuCPUCompare(virConnectPtr conn,
               const char *xmlDesc,
               unsigned int flags ATTRIBUTE_UNUSED)
{
    struct qemud_driver *driver = conn->privateData;
    int ret = VIR_CPU_COMPARE_ERROR;

    qemuDriverLock(driver);

    if (!driver->caps || !driver->caps->host.cpu) {
9229 9230
        qemuReportError(VIR_ERR_NO_SUPPORT,
                        "%s", _("cannot get host CPU capabilities"));
9231 9232
    }
    else
9233
        ret = cpuCompareXML(driver->caps->host.cpu, xmlDesc);
9234 9235 9236 9237 9238 9239

    qemuDriverUnlock(driver);

    return ret;
}

9240

9241 9242 9243 9244 9245 9246 9247 9248 9249 9250 9251 9252 9253
static char *
qemuCPUBaseline(virConnectPtr conn ATTRIBUTE_UNUSED,
                const char **xmlCPUs,
                unsigned int ncpus,
                unsigned int flags ATTRIBUTE_UNUSED)
{
    char *cpu;

    cpu = cpuBaselineXML(xmlCPUs, ncpus, NULL, 0);

    return cpu;
}

9254 9255 9256 9257 9258 9259 9260 9261 9262 9263 9264 9265 9266 9267 9268 9269 9270 9271 9272 9273 9274 9275 9276

static int qemuDomainGetJobInfo(virDomainPtr dom,
                                virDomainJobInfoPtr info) {
    struct qemud_driver *driver = dom->conn->privateData;
    virDomainObjPtr vm;
    int ret = -1;
    qemuDomainObjPrivatePtr priv;

    qemuDriverLock(driver);
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
    qemuDriverUnlock(driver);
    if (!vm) {
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
        goto cleanup;
    }

    priv = vm->privateData;

    if (virDomainObjIsActive(vm)) {
        if (priv->jobActive) {
9277 9278
            struct timeval now;

9279
            memcpy(info, &priv->jobInfo, sizeof(*info));
9280 9281 9282 9283 9284 9285 9286 9287 9288 9289 9290

            /* Refresh elapsed time again just to ensure it
             * is fully updated. This is primarily for benefit
             * of incoming migration which we don't currently
             * monitor actively in the background thread
             */
            if (gettimeofday(&now, NULL) < 0) {
                virReportSystemError(errno, "%s",
                                     _("cannot get time of day"));
                goto cleanup;
            }
9291
            info->timeElapsed = timeval_to_ms(now) - priv->jobStart;
9292 9293 9294 9295 9296 9297 9298 9299 9300 9301 9302 9303 9304 9305 9306 9307 9308 9309 9310
        } else {
            memset(info, 0, sizeof(*info));
            info->type = VIR_DOMAIN_JOB_NONE;
        }
    } else {
        qemuReportError(VIR_ERR_OPERATION_INVALID,
                        "%s", _("domain is not running"));
        goto cleanup;
    }

    ret = 0;

cleanup:
    if (vm)
        virDomainObjUnlock(vm);
    return ret;
}


9311 9312 9313 9314 9315 9316 9317 9318 9319 9320 9321 9322 9323 9324 9325 9326 9327 9328 9329 9330 9331 9332
static int qemuDomainAbortJob(virDomainPtr dom) {
    struct qemud_driver *driver = dom->conn->privateData;
    virDomainObjPtr vm;
    int ret = -1;
    qemuDomainObjPrivatePtr priv;

    qemuDriverLock(driver);
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
    qemuDriverUnlock(driver);
    if (!vm) {
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
        goto cleanup;
    }

    priv = vm->privateData;

    if (virDomainObjIsActive(vm)) {
        if (priv->jobActive) {
            VIR_DEBUG("Requesting cancellation of job on vm %s", vm->def->name);
9333
            priv->jobSignals |= QEMU_JOB_SIGNAL_CANCEL;
9334 9335 9336 9337 9338 9339 9340 9341 9342 9343 9344 9345 9346 9347 9348 9349 9350 9351 9352 9353
        } else {
            qemuReportError(VIR_ERR_OPERATION_INVALID,
                            "%s", _("no job is active on the domain"));
            goto cleanup;
        }
    } else {
        qemuReportError(VIR_ERR_OPERATION_INVALID,
                        "%s", _("domain is not running"));
        goto cleanup;
    }

    ret = 0;

cleanup:
    if (vm)
        virDomainObjUnlock(vm);
    return ret;
}


9354 9355 9356 9357 9358 9359 9360 9361 9362 9363
static int
qemuDomainMigrateSetMaxDowntime(virDomainPtr dom,
                                unsigned long long downtime,
                                unsigned int flags)
{
    struct qemud_driver *driver = dom->conn->privateData;
    virDomainObjPtr vm;
    qemuDomainObjPrivatePtr priv;
    int ret = -1;

9364
    virCheckFlags(0, -1);
9365 9366 9367 9368 9369 9370 9371 9372 9373 9374 9375 9376 9377 9378 9379 9380 9381 9382 9383 9384

    qemuDriverLock(driver);
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);

    if (!vm) {
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
        goto cleanup;
    }

    if (!virDomainObjIsActive(vm)) {
        qemuReportError(VIR_ERR_OPERATION_INVALID,
                        "%s", _("domain is not running"));
        goto cleanup;
    }

    priv = vm->privateData;

9385
    if (priv->jobActive != QEMU_JOB_MIGRATION_OUT) {
9386 9387 9388 9389 9390 9391 9392 9393 9394 9395 9396 9397 9398 9399 9400 9401 9402
        qemuReportError(VIR_ERR_OPERATION_INVALID,
                        "%s", _("domain is not being migrated"));
        goto cleanup;
    }

    VIR_DEBUG("Requesting migration downtime change to %llums", downtime);
    priv->jobSignals |= QEMU_JOB_SIGNAL_MIGRATE_DOWNTIME;
    priv->jobSignalsData.migrateDowntime = downtime;
    ret = 0;

cleanup:
    if (vm)
        virDomainObjUnlock(vm);
    qemuDriverUnlock(driver);
    return ret;
}

C
Chris Lalancette 已提交
9403 9404 9405 9406 9407 9408 9409 9410 9411 9412 9413 9414 9415 9416
static char *qemuFindQemuImgBinary(void)
{
    char *ret;

    ret = virFindFileInPath("kvm-img");
    if (ret == NULL)
        ret = virFindFileInPath("qemu-img");
    if (ret == NULL)
        qemuReportError(VIR_ERR_INTERNAL_ERROR,
                        "%s", _("unable to find kvm-img or qemu-img"));

    return ret;
}

9417 9418 9419
static int qemuDomainSnapshotWriteMetadata(virDomainObjPtr vm,
                                           virDomainSnapshotObjPtr snapshot,
                                           char *snapshotDir)
C
Chris Lalancette 已提交
9420 9421 9422 9423 9424 9425 9426 9427 9428 9429
{
    int fd = -1;
    char *newxml = NULL;
    int ret = -1;
    char *snapDir = NULL;
    char *snapFile = NULL;
    int err;
    char uuidstr[VIR_UUID_STRING_BUFLEN];

    virUUIDFormat(vm->def->uuid, uuidstr);
9430
    newxml = virDomainSnapshotDefFormat(uuidstr, snapshot->def, 1);
C
Chris Lalancette 已提交
9431 9432 9433 9434 9435 9436 9437 9438 9439 9440 9441 9442 9443 9444 9445 9446
    if (newxml == NULL) {
        virReportOOMError();
        return -1;
    }

    if (virAsprintf(&snapDir, "%s/%s", snapshotDir, vm->def->name) < 0) {
        virReportOOMError();
        goto cleanup;
    }
    err = virFileMakePath(snapDir);
    if (err < 0) {
        virReportSystemError(err, _("cannot create snapshot directory '%s'"),
                             snapDir);
        goto cleanup;
    }

9447
    if (virAsprintf(&snapFile, "%s/%s.xml", snapDir, snapshot->def->name) < 0) {
C
Chris Lalancette 已提交
9448 9449 9450 9451 9452 9453 9454 9455 9456 9457 9458 9459 9460 9461 9462 9463 9464 9465 9466 9467 9468
        virReportOOMError();
        goto cleanup;
    }
    fd = open(snapFile, O_CREAT|O_TRUNC|O_WRONLY, S_IRUSR|S_IWUSR);
    if (fd < 0) {
        qemuReportError(VIR_ERR_OPERATION_FAILED,
                        _("failed to create snapshot file '%s'"), snapFile);
        goto cleanup;
    }
    if (safewrite(fd, newxml, strlen(newxml)) != strlen(newxml)) {
        virReportSystemError(errno, _("Failed to write snapshot data to %s"),
                             snapFile);
        goto cleanup;
    }

    ret = 0;

cleanup:
    VIR_FREE(snapFile);
    VIR_FREE(snapDir);
    VIR_FREE(newxml);
9469
    VIR_FORCE_CLOSE(fd);
C
Chris Lalancette 已提交
9470 9471 9472
    return ret;
}

9473 9474
static int qemuDomainSnapshotSetCurrentActive(virDomainObjPtr vm,
                                              char *snapshotDir)
C
Chris Lalancette 已提交
9475 9476 9477 9478
{
    if (vm->current_snapshot) {
        vm->current_snapshot->def->active = 1;

9479 9480
        return qemuDomainSnapshotWriteMetadata(vm, vm->current_snapshot,
                                               snapshotDir);
C
Chris Lalancette 已提交
9481 9482 9483 9484 9485
    }

    return 0;
}

9486 9487
static int qemuDomainSnapshotSetCurrentInactive(virDomainObjPtr vm,
                                                char *snapshotDir)
C
Chris Lalancette 已提交
9488 9489 9490 9491
{
    if (vm->current_snapshot) {
        vm->current_snapshot->def->active = 0;

9492 9493
        return qemuDomainSnapshotWriteMetadata(vm, vm->current_snapshot,
                                               snapshotDir);
C
Chris Lalancette 已提交
9494 9495 9496 9497 9498 9499 9500 9501 9502 9503 9504 9505 9506 9507 9508 9509 9510 9511 9512
    }

    return 0;
}


static int qemuDomainSnapshotIsAllowed(virDomainObjPtr vm)
{
    int i;

    /* FIXME: we need to figure out what else here might succeed; in
     * particular, if it's a raw device but on LVM, we could probably make
     * that succeed as well
     */
    for (i = 0; i < vm->def->ndisks; i++) {
        if (vm->def->disks[i]->device == VIR_DOMAIN_DISK_DEVICE_DISK &&
            (!vm->def->disks[i]->driverType ||
             STRNEQ(vm->def->disks[i]->driverType, "qcow2"))) {
            qemuReportError(VIR_ERR_OPERATION_INVALID,
9513 9514
                            _("Disk '%s' does not support snapshotting"),
                            vm->def->disks[i]->src);
C
Chris Lalancette 已提交
9515 9516 9517 9518 9519 9520 9521 9522 9523
            return 0;
        }
    }

    return 1;
}

static virDomainSnapshotPtr qemuDomainSnapshotCreateXML(virDomainPtr domain,
                                                        const char *xmlDesc,
9524
                                                        unsigned int flags)
C
Chris Lalancette 已提交
9525 9526 9527 9528 9529 9530 9531 9532 9533 9534
{
    struct qemud_driver *driver = domain->conn->privateData;
    virDomainObjPtr vm = NULL;
    virDomainSnapshotObjPtr snap = NULL;
    virDomainSnapshotPtr snapshot = NULL;
    char uuidstr[VIR_UUID_STRING_BUFLEN];
    virDomainSnapshotDefPtr def;
    const char *qemuimgarg[] = { NULL, "snapshot", "-c", NULL, NULL, NULL };
    int i;

9535 9536
    virCheckFlags(0, NULL);

C
Chris Lalancette 已提交
9537 9538 9539 9540 9541 9542 9543 9544 9545 9546 9547 9548 9549 9550 9551 9552 9553 9554 9555 9556 9557 9558 9559 9560 9561 9562 9563 9564 9565 9566 9567 9568 9569 9570 9571 9572 9573 9574 9575 9576 9577 9578 9579 9580 9581 9582 9583 9584 9585 9586 9587 9588 9589 9590 9591 9592 9593 9594 9595 9596 9597
    qemuDriverLock(driver);
    virUUIDFormat(domain->uuid, uuidstr);
    vm = virDomainFindByUUID(&driver->domains, domain->uuid);
    if (!vm) {
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
        goto cleanup;
    }

    /* in a perfect world, we would allow qemu to tell us this.  The problem
     * is that qemu only does this check device-by-device; so if you had a
     * domain that booted from a large qcow2 device, but had a secondary raw
     * device attached, you wouldn't find out that you can't snapshot your
     * guest until *after* it had spent the time to snapshot the boot device.
     * This is probably a bug in qemu, but we'll work around it here for now.
     */
    if (!qemuDomainSnapshotIsAllowed(vm))
        goto cleanup;

    if (!(def = virDomainSnapshotDefParseString(xmlDesc, 1)))
        goto cleanup;

    if (!(snap = virDomainSnapshotAssignDef(&vm->snapshots, def)))
        goto cleanup;

    /* actually do the snapshot */
    if (!virDomainObjIsActive(vm)) {
        qemuimgarg[0] = qemuFindQemuImgBinary();
        if (qemuimgarg[0] == NULL)
            /* qemuFindQemuImgBinary set the error */
            goto cleanup;

        qemuimgarg[3] = snap->def->name;

        for (i = 0; i < vm->def->ndisks; i++) {
            /* FIXME: we also need to handle LVM here */
            /* FIXME: if we fail halfway through this loop, we are in an
             * inconsistent state.  I'm not quite sure what to do about that
             */
            if (vm->def->disks[i]->device == VIR_DOMAIN_DISK_DEVICE_DISK) {
                if (!vm->def->disks[i]->driverType ||
                    STRNEQ(vm->def->disks[i]->driverType, "qcow2")) {
                    qemuReportError(VIR_ERR_OPERATION_INVALID,
                                    _("Disk device '%s' does not support snapshotting"),
                                    vm->def->disks[i]->info.alias);
                    goto cleanup;
                }

                qemuimgarg[4] = vm->def->disks[i]->src;

                if (virRun(qemuimgarg, NULL) < 0) {
                    virReportSystemError(errno,
                                         _("Failed to run '%s' to create snapshot '%s' from disk '%s'"),
                                         qemuimgarg[0], snap->def->name,
                                         vm->def->disks[i]->src);
                    goto cleanup;
                }
            }
        }
    }
    else {
9598 9599 9600 9601 9602
        qemuDomainObjPrivatePtr priv;
        int ret;

        if (qemuDomainObjBeginJobWithDriver(driver, vm) < 0)
            goto cleanup;
C
Chris Lalancette 已提交
9603 9604
        priv = vm->privateData;
        qemuDomainObjEnterMonitorWithDriver(driver, vm);
9605
        ret = qemuMonitorCreateSnapshot(priv->mon, def->name);
C
Chris Lalancette 已提交
9606
        qemuDomainObjExitMonitorWithDriver(driver, vm);
9607
        if (qemuDomainObjEndJob(vm) == 0) {
9608
            vm = NULL;
9609 9610
            goto cleanup;
        }
9611 9612
        if (ret < 0)
            goto cleanup;
C
Chris Lalancette 已提交
9613 9614 9615 9616 9617 9618 9619 9620 9621 9622 9623 9624 9625 9626 9627 9628 9629 9630 9631 9632
    }

    snap->def->state = vm->state;

    /* FIXME: if we fail after this point, there's not a whole lot we can
     * do; we've successfully taken the snapshot, and we are now running
     * on it, so we have to go forward the best we can
     */

    if (vm->current_snapshot) {
        def->parent = strdup(vm->current_snapshot->def->name);
        if (def->parent == NULL) {
            virReportOOMError();
            goto cleanup;
        }
    }

    /* Now we set the new current_snapshot for the domain */
    vm->current_snapshot = snap;

9633 9634 9635
    if (qemuDomainSnapshotWriteMetadata(vm, vm->current_snapshot,
                                        driver->snapshotDir) < 0)
        /* qemuDomainSnapshotWriteMetadata set the error */
C
Chris Lalancette 已提交
9636 9637 9638 9639 9640 9641 9642 9643 9644 9645 9646 9647 9648 9649
        goto cleanup;

    snapshot = virGetDomainSnapshot(domain, snap->def->name);

cleanup:
    VIR_FREE(qemuimgarg[0]);
    if (vm)
        virDomainObjUnlock(vm);
    qemuDriverUnlock(driver);
    return snapshot;
}

static int qemuDomainSnapshotListNames(virDomainPtr domain, char **names,
                                       int nameslen,
9650
                                       unsigned int flags)
C
Chris Lalancette 已提交
9651 9652 9653 9654 9655
{
    struct qemud_driver *driver = domain->conn->privateData;
    virDomainObjPtr vm = NULL;
    int n = -1;

9656 9657
    virCheckFlags(0, -1);

C
Chris Lalancette 已提交
9658 9659 9660 9661 9662 9663 9664 9665 9666 9667 9668 9669 9670 9671 9672 9673 9674 9675 9676 9677
    qemuDriverLock(driver);
    vm = virDomainFindByUUID(&driver->domains, domain->uuid);
    if (!vm) {
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(domain->uuid, uuidstr);
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
        goto cleanup;
    }

    n = virDomainSnapshotObjListGetNames(&vm->snapshots, names, nameslen);

cleanup:
    if (vm)
        virDomainObjUnlock(vm);
    qemuDriverUnlock(driver);
    return n;
}

static int qemuDomainSnapshotNum(virDomainPtr domain,
9678
                                 unsigned int flags)
C
Chris Lalancette 已提交
9679 9680 9681 9682 9683
{
    struct qemud_driver *driver = domain->conn->privateData;
    virDomainObjPtr vm = NULL;
    int n = -1;

9684 9685
    virCheckFlags(0, -1);

C
Chris Lalancette 已提交
9686 9687 9688 9689 9690 9691 9692 9693 9694 9695 9696 9697 9698 9699 9700 9701 9702 9703 9704 9705 9706
    qemuDriverLock(driver);
    vm = virDomainFindByUUID(&driver->domains, domain->uuid);
    if (!vm) {
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(domain->uuid, uuidstr);
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
        goto cleanup;
    }

    n = virDomainSnapshotObjListNum(&vm->snapshots);

cleanup:
    if (vm)
        virDomainObjUnlock(vm);
    qemuDriverUnlock(driver);
    return n;
}

static virDomainSnapshotPtr qemuDomainSnapshotLookupByName(virDomainPtr domain,
                                                           const char *name,
9707
                                                           unsigned int flags)
C
Chris Lalancette 已提交
9708 9709 9710 9711 9712 9713
{
    struct qemud_driver *driver = domain->conn->privateData;
    virDomainObjPtr vm;
    virDomainSnapshotObjPtr snap = NULL;
    virDomainSnapshotPtr snapshot = NULL;

9714 9715
    virCheckFlags(0, NULL);

C
Chris Lalancette 已提交
9716 9717 9718 9719 9720 9721 9722 9723 9724 9725 9726 9727 9728 9729 9730 9731 9732 9733 9734 9735 9736 9737 9738 9739 9740 9741 9742
    qemuDriverLock(driver);
    vm = virDomainFindByUUID(&driver->domains, domain->uuid);
    if (!vm) {
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(domain->uuid, uuidstr);
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
        goto cleanup;
    }

    snap = virDomainSnapshotFindByName(&vm->snapshots, name);
    if (!snap) {
        qemuReportError(VIR_ERR_NO_DOMAIN_SNAPSHOT,
                        _("no snapshot with matching name '%s'"), name);
        goto cleanup;
    }

    snapshot = virGetDomainSnapshot(domain, snap->def->name);

cleanup:
    if (vm)
        virDomainObjUnlock(vm);
    qemuDriverUnlock(driver);
    return snapshot;
}

static int qemuDomainHasCurrentSnapshot(virDomainPtr domain,
9743
                                        unsigned int flags)
C
Chris Lalancette 已提交
9744 9745 9746 9747 9748
{
    struct qemud_driver *driver = domain->conn->privateData;
    virDomainObjPtr vm;
    int ret = -1;

9749 9750
    virCheckFlags(0, -1);

C
Chris Lalancette 已提交
9751 9752 9753 9754 9755 9756 9757 9758 9759 9760 9761 9762 9763 9764 9765 9766 9767 9768 9769 9770
    qemuDriverLock(driver);
    vm = virDomainFindByUUID(&driver->domains, domain->uuid);
    if (!vm) {
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(domain->uuid, uuidstr);
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
        goto cleanup;
    }

    ret = (vm->current_snapshot != NULL);

cleanup:
    if (vm)
        virDomainObjUnlock(vm);
    qemuDriverUnlock(driver);
    return ret;
}

static virDomainSnapshotPtr qemuDomainSnapshotCurrent(virDomainPtr domain,
9771
                                                      unsigned int flags)
C
Chris Lalancette 已提交
9772 9773 9774 9775 9776
{
    struct qemud_driver *driver = domain->conn->privateData;
    virDomainObjPtr vm;
    virDomainSnapshotPtr snapshot = NULL;

9777 9778
    virCheckFlags(0, NULL);

C
Chris Lalancette 已提交
9779 9780 9781 9782 9783 9784 9785 9786 9787 9788 9789 9790 9791 9792 9793 9794 9795 9796 9797 9798 9799 9800 9801 9802 9803 9804
    qemuDriverLock(driver);
    vm = virDomainFindByUUID(&driver->domains, domain->uuid);
    if (!vm) {
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(domain->uuid, uuidstr);
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
        goto cleanup;
    }

    if (!vm->current_snapshot) {
        qemuReportError(VIR_ERR_NO_DOMAIN_SNAPSHOT, "%s",
                        _("the domain does not have a current snapshot"));
        goto cleanup;
    }

    snapshot = virGetDomainSnapshot(domain, vm->current_snapshot->def->name);

cleanup:
    if (vm)
        virDomainObjUnlock(vm);
    qemuDriverUnlock(driver);
    return snapshot;
}

static char *qemuDomainSnapshotDumpXML(virDomainSnapshotPtr snapshot,
9805
                                       unsigned int flags)
C
Chris Lalancette 已提交
9806 9807 9808 9809 9810 9811 9812
{
    struct qemud_driver *driver = snapshot->domain->conn->privateData;
    virDomainObjPtr vm = NULL;
    char *xml = NULL;
    virDomainSnapshotObjPtr snap = NULL;
    char uuidstr[VIR_UUID_STRING_BUFLEN];

9813 9814
    virCheckFlags(0, NULL);

C
Chris Lalancette 已提交
9815 9816 9817 9818 9819 9820 9821 9822 9823 9824 9825 9826 9827 9828 9829 9830 9831 9832 9833 9834 9835 9836 9837 9838 9839 9840 9841
    qemuDriverLock(driver);
    virUUIDFormat(snapshot->domain->uuid, uuidstr);
    vm = virDomainFindByUUID(&driver->domains, snapshot->domain->uuid);
    if (!vm) {
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
        goto cleanup;
    }

    snap = virDomainSnapshotFindByName(&vm->snapshots, snapshot->name);
    if (!snap) {
        qemuReportError(VIR_ERR_NO_DOMAIN_SNAPSHOT,
                        _("no domain snapshot with matching name '%s'"),
                        snapshot->name);
        goto cleanup;
    }

    xml = virDomainSnapshotDefFormat(uuidstr, snap->def, 0);

cleanup:
    if (vm)
        virDomainObjUnlock(vm);
    qemuDriverUnlock(driver);
    return xml;
}

static int qemuDomainRevertToSnapshot(virDomainSnapshotPtr snapshot,
9842
                                      unsigned int flags)
C
Chris Lalancette 已提交
9843 9844 9845 9846 9847 9848 9849 9850 9851 9852
{
    struct qemud_driver *driver = snapshot->domain->conn->privateData;
    virDomainObjPtr vm = NULL;
    int ret = -1;
    virDomainSnapshotObjPtr snap = NULL;
    char uuidstr[VIR_UUID_STRING_BUFLEN];
    virDomainEventPtr event = NULL;
    qemuDomainObjPrivatePtr priv;
    int rc;

9853 9854
    virCheckFlags(0, -1);

C
Chris Lalancette 已提交
9855 9856 9857 9858 9859 9860 9861 9862 9863 9864 9865 9866 9867 9868 9869 9870 9871 9872 9873 9874 9875 9876 9877 9878 9879 9880 9881 9882 9883 9884 9885
    qemuDriverLock(driver);
    virUUIDFormat(snapshot->domain->uuid, uuidstr);
    vm = virDomainFindByUUID(&driver->domains, snapshot->domain->uuid);
    if (!vm) {
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
        goto cleanup;
    }

    snap = virDomainSnapshotFindByName(&vm->snapshots, snapshot->name);
    if (!snap) {
        qemuReportError(VIR_ERR_NO_DOMAIN_SNAPSHOT,
                        _("no domain snapshot with matching name '%s'"),
                        snapshot->name);
        goto cleanup;
    }

    vm->current_snapshot = snap;

    if (qemuDomainObjBeginJobWithDriver(driver, vm) < 0)
        goto cleanup;

    if (snap->def->state == VIR_DOMAIN_RUNNING
        || snap->def->state == VIR_DOMAIN_PAUSED) {

        if (virDomainObjIsActive(vm)) {
            priv = vm->privateData;
            qemuDomainObjEnterMonitorWithDriver(driver, vm);
            rc = qemuMonitorLoadSnapshot(priv->mon, snap->def->name);
            qemuDomainObjExitMonitorWithDriver(driver, vm);
            if (rc < 0)
9886
                goto endjob;
C
Chris Lalancette 已提交
9887 9888
        }
        else {
9889
            if (qemuDomainSnapshotSetCurrentActive(vm, driver->snapshotDir) < 0)
9890
                goto endjob;
C
Chris Lalancette 已提交
9891 9892

            rc = qemudStartVMDaemon(snapshot->domain->conn, driver, vm, NULL,
9893
                                    false, -1, NULL, VIR_VM_OP_CREATE);
9894
            qemuDomainStartAudit(vm, "from-snapshot", rc >= 0);
9895
            if (qemuDomainSnapshotSetCurrentInactive(vm, driver->snapshotDir) < 0)
9896
                goto endjob;
C
Chris Lalancette 已提交
9897
            if (rc < 0)
9898
                goto endjob;
C
Chris Lalancette 已提交
9899 9900 9901 9902 9903 9904
        }

        if (snap->def->state == VIR_DOMAIN_PAUSED) {
            /* qemu unconditionally starts the domain running again after
             * loadvm, so let's pause it to keep consistency
             */
H
Hu Tao 已提交
9905 9906
            rc = doStopCPUs(driver, vm);
            if (rc < 0)
9907
                goto endjob;
C
Chris Lalancette 已提交
9908 9909 9910 9911 9912 9913 9914 9915 9916 9917 9918 9919 9920 9921 9922 9923 9924 9925
        }

        event = virDomainEventNewFromObj(vm,
                                         VIR_DOMAIN_EVENT_STARTED,
                                         VIR_DOMAIN_EVENT_STARTED_FROM_SNAPSHOT);
    }
    else {
        /* qemu is a little funny with running guests and the restoration
         * of snapshots.  If the snapshot was taken online,
         * then after a "loadvm" monitor command, the VM is set running
         * again.  If the snapshot was taken offline, then after a "loadvm"
         * monitor command the VM is left paused.  Unpausing it leads to
         * the memory state *before* the loadvm with the disk *after* the
         * loadvm, which obviously is bound to corrupt something.
         * Therefore we destroy the domain and set it to "off" in this case.
         */

        if (virDomainObjIsActive(vm)) {
9926
            qemudShutdownVMDaemon(driver, vm, 0);
9927
            qemuDomainStopAudit(vm, "from-snapshot");
C
Chris Lalancette 已提交
9928 9929 9930
            event = virDomainEventNewFromObj(vm,
                                             VIR_DOMAIN_EVENT_STOPPED,
                                             VIR_DOMAIN_EVENT_STOPPED_FROM_SNAPSHOT);
9931 9932 9933 9934
            if (!vm->persistent) {
                if (qemuDomainObjEndJob(vm) > 0)
                    virDomainRemoveInactive(&driver->domains, vm);
                vm = NULL;
9935
                goto cleanup;
9936
            }
C
Chris Lalancette 已提交
9937 9938
        }

9939
        if (qemuDomainSnapshotSetCurrentActive(vm, driver->snapshotDir) < 0)
9940
            goto endjob;
C
Chris Lalancette 已提交
9941 9942 9943 9944 9945 9946
    }

    vm->state = snap->def->state;

    ret = 0;

9947
endjob:
C
Chris Lalancette 已提交
9948 9949 9950
    if (vm && qemuDomainObjEndJob(vm) == 0)
        vm = NULL;

9951
cleanup:
C
Chris Lalancette 已提交
9952 9953 9954 9955 9956 9957 9958 9959 9960 9961 9962 9963 9964 9965 9966 9967 9968 9969 9970 9971 9972 9973 9974 9975 9976 9977 9978 9979 9980 9981 9982 9983 9984 9985 9986 9987 9988 9989 9990 9991 9992 9993 9994 9995 9996 9997 9998 9999 10000 10001 10002 10003 10004 10005 10006 10007 10008 10009 10010 10011 10012 10013 10014 10015 10016 10017 10018 10019 10020 10021 10022 10023 10024 10025 10026 10027 10028 10029 10030 10031 10032 10033 10034 10035 10036 10037 10038 10039 10040 10041 10042 10043 10044 10045 10046 10047 10048 10049 10050 10051 10052 10053 10054 10055 10056 10057 10058 10059 10060 10061 10062 10063 10064 10065 10066 10067 10068 10069 10070 10071 10072 10073 10074 10075
    if (event)
        qemuDomainEventQueue(driver, event);
    if (vm)
        virDomainObjUnlock(vm);
    qemuDriverUnlock(driver);

    return ret;
}

static int qemuDomainSnapshotDiscard(struct qemud_driver *driver,
                                     virDomainObjPtr vm,
                                     virDomainSnapshotObjPtr snap)
{
    const char *qemuimgarg[] = { NULL, "snapshot", "-d", NULL, NULL, NULL };
    char *snapFile = NULL;
    int ret = -1;
    int i;
    qemuDomainObjPrivatePtr priv;
    virDomainSnapshotObjPtr parentsnap;

    if (!virDomainObjIsActive(vm)) {
        qemuimgarg[0] = qemuFindQemuImgBinary();
        if (qemuimgarg[0] == NULL)
            /* qemuFindQemuImgBinary set the error */
            goto cleanup;

        qemuimgarg[3] = snap->def->name;

        for (i = 0; i < vm->def->ndisks; i++) {
            /* FIXME: we also need to handle LVM here */
            if (vm->def->disks[i]->device == VIR_DOMAIN_DISK_DEVICE_DISK) {
                if (!vm->def->disks[i]->driverType ||
                    STRNEQ(vm->def->disks[i]->driverType, "qcow2")) {
                    /* we continue on even in the face of error, since other
                     * disks in this VM may have this snapshot in place
                     */
                    continue;
                }

                qemuimgarg[4] = vm->def->disks[i]->src;

                if (virRun(qemuimgarg, NULL) < 0) {
                    /* we continue on even in the face of error, since other
                     * disks in this VM may have this snapshot in place
                     */
                    continue;
                }
            }
        }
    }
    else {
        priv = vm->privateData;
        qemuDomainObjEnterMonitorWithDriver(driver, vm);
        /* we continue on even in the face of error */
        qemuMonitorDeleteSnapshot(priv->mon, snap->def->name);
        qemuDomainObjExitMonitorWithDriver(driver, vm);
    }

    if (snap == vm->current_snapshot) {
        if (snap->def->parent) {
            parentsnap = virDomainSnapshotFindByName(&vm->snapshots,
                                                     snap->def->parent);
            if (!parentsnap) {
                qemuReportError(VIR_ERR_NO_DOMAIN_SNAPSHOT,
                                _("no domain snapshot parent with matching name '%s'"),
                                snap->def->parent);
                goto cleanup;
            }

            /* Now we set the new current_snapshot for the domain */
            vm->current_snapshot = parentsnap;
        }
        else
            vm->current_snapshot = NULL;
    }

    if (virAsprintf(&snapFile, "%s/%s/%s.xml", driver->snapshotDir,
                    vm->def->name, snap->def->name) < 0) {
        virReportOOMError();
        goto cleanup;
    }
    unlink(snapFile);

    virDomainSnapshotObjListRemove(&vm->snapshots, snap);

    ret = 0;

cleanup:
    VIR_FREE(snapFile);
    VIR_FREE(qemuimgarg[0]);

    return ret;
}

struct snap_remove {
    struct qemud_driver *driver;
    virDomainObjPtr vm;
    char *parent;
    int err;
};

static void qemuDomainSnapshotDiscardChildren(void *payload,
                                              const char *name ATTRIBUTE_UNUSED,
                                              void *data)
{
    virDomainSnapshotObjPtr snap = payload;
    struct snap_remove *curr = data;
    struct snap_remove this;

    if (snap->def->parent && STREQ(snap->def->parent, curr->parent)) {
        this.driver = curr->driver;
        this.vm = curr->vm;
        this.parent = snap->def->name;
        this.err = 0;
        virHashForEach(curr->vm->snapshots.objs,
                       qemuDomainSnapshotDiscardChildren, &this);

        if (this.err)
            curr->err = this.err;
        else
            this.err = qemuDomainSnapshotDiscard(curr->driver, curr->vm, snap);
    }
}

10076 10077 10078 10079 10080 10081 10082 10083 10084 10085 10086 10087 10088 10089 10090 10091 10092 10093 10094 10095 10096 10097 10098 10099 10100 10101 10102 10103 10104 10105 10106 10107 10108 10109 10110 10111 10112
struct snap_reparent {
    struct qemud_driver *driver;
    virDomainSnapshotObjPtr snap;
    virDomainObjPtr vm;
    int err;
};

static void
qemuDomainSnapshotReparentChildren(void *payload,
                                   const char *name ATTRIBUTE_UNUSED,
                                   void *data)
{
    virDomainSnapshotObjPtr snap = payload;
    struct snap_reparent *rep = data;

    if (rep->err < 0) {
        return;
    }

    if (snap->def->parent && STREQ(snap->def->parent, rep->snap->def->name)) {
        VIR_FREE(snap->def->parent);

        if (rep->snap->def->parent != NULL) {
            snap->def->parent = strdup(rep->snap->def->parent);

            if (snap->def->parent == NULL) {
                virReportOOMError();
                rep->err = -1;
                return;
            }
        }

        rep->err = qemuDomainSnapshotWriteMetadata(rep->vm, snap,
                                                   rep->driver->snapshotDir);
    }
}

C
Chris Lalancette 已提交
10113 10114 10115 10116 10117 10118 10119 10120 10121
static int qemuDomainSnapshotDelete(virDomainSnapshotPtr snapshot,
                                    unsigned int flags)
{
    struct qemud_driver *driver = snapshot->domain->conn->privateData;
    virDomainObjPtr vm = NULL;
    int ret = -1;
    virDomainSnapshotObjPtr snap = NULL;
    char uuidstr[VIR_UUID_STRING_BUFLEN];
    struct snap_remove rem;
10122
    struct snap_reparent rep;
C
Chris Lalancette 已提交
10123

10124 10125
    virCheckFlags(VIR_DOMAIN_SNAPSHOT_DELETE_CHILDREN, -1);

C
Chris Lalancette 已提交
10126 10127 10128 10129 10130 10131 10132 10133 10134 10135 10136 10137 10138 10139 10140 10141 10142
    qemuDriverLock(driver);
    virUUIDFormat(snapshot->domain->uuid, uuidstr);
    vm = virDomainFindByUUID(&driver->domains, snapshot->domain->uuid);
    if (!vm) {
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
        goto cleanup;
    }

    snap = virDomainSnapshotFindByName(&vm->snapshots, snapshot->name);
    if (!snap) {
        qemuReportError(VIR_ERR_NO_DOMAIN_SNAPSHOT,
                        _("no domain snapshot with matching name '%s'"),
                        snapshot->name);
        goto cleanup;
    }

10143 10144 10145
    if (qemuDomainObjBeginJobWithDriver(driver, vm) < 0)
        goto cleanup;

C
Chris Lalancette 已提交
10146 10147 10148 10149 10150 10151 10152 10153
    if (flags & VIR_DOMAIN_SNAPSHOT_DELETE_CHILDREN) {
        rem.driver = driver;
        rem.vm = vm;
        rem.parent = snap->def->name;
        rem.err = 0;
        virHashForEach(vm->snapshots.objs, qemuDomainSnapshotDiscardChildren,
                       &rem);
        if (rem.err < 0)
10154
            goto endjob;
10155 10156 10157 10158 10159 10160 10161 10162 10163
    } else {
        rep.driver = driver;
        rep.snap = snap;
        rep.vm = vm;
        rep.err = 0;
        virHashForEach(vm->snapshots.objs, qemuDomainSnapshotReparentChildren,
                       &rep);
        if (rep.err < 0)
            goto endjob;
C
Chris Lalancette 已提交
10164 10165 10166 10167
    }

    ret = qemuDomainSnapshotDiscard(driver, vm, snap);

10168 10169 10170 10171
endjob:
    if (qemuDomainObjEndJob(vm) == 0)
        vm = NULL;

C
Chris Lalancette 已提交
10172 10173 10174 10175 10176 10177
cleanup:
    if (vm)
        virDomainObjUnlock(vm);
    qemuDriverUnlock(driver);
    return ret;
}
10178

10179 10180 10181 10182 10183 10184 10185 10186 10187 10188 10189 10190 10191 10192 10193 10194 10195 10196 10197 10198 10199 10200 10201 10202 10203 10204 10205 10206 10207 10208 10209 10210 10211 10212 10213 10214 10215 10216 10217 10218 10219 10220 10221 10222 10223 10224 10225 10226 10227 10228 10229
static int qemuDomainMonitorCommand(virDomainPtr domain, const char *cmd,
                                    char **result, unsigned int flags)
{
    struct qemud_driver *driver = domain->conn->privateData;
    virDomainObjPtr vm = NULL;
    int ret = -1;
    qemuDomainObjPrivatePtr priv;

    virCheckFlags(0, -1);

    qemuDriverLock(driver);
    vm = virDomainFindByUUID(&driver->domains, domain->uuid);
    if (!vm) {
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(domain->uuid, uuidstr);
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
        goto cleanup;
    }

    if (!virDomainObjIsActive(vm)) {
        qemuReportError(VIR_ERR_OPERATION_INVALID,
                        "%s", _("domain is not running"));
        goto cleanup;
   }

    priv = vm->privateData;

    if (!priv->monitor_warned) {
        VIR_INFO("Qemu monitor command '%s' executed; libvirt results may be unpredictable!",
                 cmd);
        priv->monitor_warned = 1;
    }

    if (qemuDomainObjBeginJobWithDriver(driver, vm) < 0)
        goto cleanup;
    qemuDomainObjEnterMonitorWithDriver(driver, vm);
    ret = qemuMonitorArbitraryCommand(priv->mon, cmd, result);
    qemuDomainObjExitMonitorWithDriver(driver, vm);
    if (qemuDomainObjEndJob(vm) == 0) {
        vm = NULL;
        goto cleanup;
    }

cleanup:
    if (vm)
        virDomainObjUnlock(vm);
    qemuDriverUnlock(driver);
    return ret;
}

10230 10231 10232 10233 10234 10235 10236 10237 10238 10239 10240 10241 10242 10243 10244 10245 10246 10247 10248 10249 10250 10251 10252 10253 10254 10255 10256 10257 10258 10259 10260 10261 10262 10263 10264 10265 10266 10267 10268 10269 10270 10271 10272 10273 10274 10275 10276 10277 10278 10279 10280 10281 10282 10283 10284 10285 10286

static int
qemuDomainOpenConsole(virDomainPtr dom,
                      const char *devname,
                      virStreamPtr st,
                      unsigned int flags)
{
    struct qemud_driver *driver = dom->conn->privateData;
    virDomainObjPtr vm = NULL;
    char uuidstr[VIR_UUID_STRING_BUFLEN];
    int ret = -1;
    int i;
    virDomainChrDefPtr chr = NULL;

    virCheckFlags(0, -1);

    qemuDriverLock(driver);
    virUUIDFormat(dom->uuid, uuidstr);
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
    if (!vm) {
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
        goto cleanup;
    }

    if (!virDomainObjIsActive(vm)) {
        qemuReportError(VIR_ERR_OPERATION_INVALID,
                        "%s", _("domain is not running"));
        goto cleanup;
    }

    if (devname) {
        if (vm->def->console &&
            STREQ(devname, vm->def->console->info.alias))
            chr = vm->def->console;
        for (i = 0 ; !chr && i < vm->def->nserials ; i++) {
            if (STREQ(devname, vm->def->serials[i]->info.alias))
                chr = vm->def->serials[i];
        }
        for (i = 0 ; !chr && i < vm->def->nparallels ; i++) {
            if (STREQ(devname, vm->def->parallels[i]->info.alias))
                chr = vm->def->parallels[i];
        }
    } else {
        if (vm->def->console)
            chr = vm->def->console;
        else if (vm->def->nserials)
            chr = vm->def->serials[0];
    }

    if (!chr) {
        qemuReportError(VIR_ERR_INTERNAL_ERROR,
                        _("cannot find character device %s"),
                        NULLSTR(devname));
        goto cleanup;
    }

10287
    if (chr->source.type != VIR_DOMAIN_CHR_TYPE_PTY) {
10288 10289 10290 10291 10292 10293
        qemuReportError(VIR_ERR_INTERNAL_ERROR,
                        _("character device %s is not using a PTY"),
                        NULLSTR(devname));
        goto cleanup;
    }

10294
    if (virFDStreamOpenFile(st, chr->source.data.file.path, O_RDWR) < 0)
10295 10296 10297 10298 10299 10300 10301 10302 10303 10304 10305
        goto cleanup;

    ret = 0;
cleanup:
    if (vm)
        virDomainObjUnlock(vm);
    qemuDriverUnlock(driver);
    return ret;
}


10306 10307 10308 10309 10310
static virDriver qemuDriver = {
    VIR_DRV_QEMU,
    "QEMU",
    qemudOpen, /* open */
    qemudClose, /* close */
D
Daniel Veillard 已提交
10311
    qemudSupportsFeature, /* supports_feature */
10312 10313
    qemudGetType, /* type */
    qemudGetVersion, /* version */
10314
    NULL, /* libvirtVersion (impl. in libvirt.c) */
10315
    virGetHostname, /* getHostname */
10316
    qemudGetMaxVCPUs, /* getMaxVcpus */
10317
    nodeGetInfo, /* nodeGetInfo */
10318 10319 10320
    qemudGetCapabilities, /* getCapabilities */
    qemudListDomains, /* listDomains */
    qemudNumDomains, /* numOfDomains */
10321
    qemudDomainCreate, /* domainCreateXML */
10322 10323 10324 10325 10326
    qemudDomainLookupByID, /* domainLookupByID */
    qemudDomainLookupByUUID, /* domainLookupByUUID */
    qemudDomainLookupByName, /* domainLookupByName */
    qemudDomainSuspend, /* domainSuspend */
    qemudDomainResume, /* domainResume */
10327
    qemudDomainShutdown, /* domainShutdown */
10328 10329 10330
    NULL, /* domainReboot */
    qemudDomainDestroy, /* domainDestroy */
    qemudDomainGetOSType, /* domainGetOSType */
10331
    qemudDomainGetMaxMemory, /* domainGetMaxMemory */
10332
    NULL, /* domainSetMaxMemory */
10333
    qemudDomainSetMemory, /* domainSetMemory */
10334 10335 10336
    qemudDomainGetInfo, /* domainGetInfo */
    qemudDomainSave, /* domainSave */
    qemudDomainRestore, /* domainRestore */
P
Paolo Bonzini 已提交
10337
    qemudDomainCoreDump, /* domainCoreDump */
10338
    qemudDomainSetVcpus, /* domainSetVcpus */
10339 10340
    qemudDomainSetVcpusFlags, /* domainSetVcpusFlags */
    qemudDomainGetVcpusFlags, /* domainGetVcpusFlags */
10341 10342
    qemudDomainPinVcpu, /* domainPinVcpu */
    qemudDomainGetVcpus, /* domainGetVcpus */
10343
    qemudDomainGetMaxVcpus, /* domainGetMaxVcpus */
10344 10345
    qemudDomainGetSecurityLabel, /* domainGetSecurityLabel */
    qemudNodeGetSecurityModel, /* nodeGetSecurityModel */
10346
    qemudDomainDumpXML, /* domainDumpXML */
10347
    qemuDomainXMLFromNative, /* domainXmlFromNative */
10348
    qemuDomainXMLToNative, /* domainXMLToNative */
10349 10350
    qemudListDefinedDomains, /* listDefinedDomains */
    qemudNumDefinedDomains, /* numOfDefinedDomains */
10351
    qemudDomainStart, /* domainCreate */
10352
    qemudDomainStartWithFlags, /* domainCreateWithFlags */
10353 10354
    qemudDomainDefine, /* domainDefineXML */
    qemudDomainUndefine, /* domainUndefine */
10355
    qemudDomainAttachDevice, /* domainAttachDevice */
10356
    qemudDomainAttachDeviceFlags, /* domainAttachDeviceFlags */
10357
    qemudDomainDetachDevice, /* domainDetachDevice */
10358
    qemudDomainDetachDeviceFlags, /* domainDetachDeviceFlags */
10359
    qemuDomainUpdateDeviceFlags, /* domainUpdateDeviceFlags */
10360 10361
    qemudDomainGetAutostart, /* domainGetAutostart */
    qemudDomainSetAutostart, /* domainSetAutostart */
10362 10363 10364
    qemuGetSchedulerType, /* domainGetSchedulerType */
    qemuGetSchedulerParameters, /* domainGetSchedulerParameters */
    qemuSetSchedulerParameters, /* domainSetSchedulerParameters */
D
Daniel Veillard 已提交
10365 10366
    NULL, /* domainMigratePrepare (v1) */
    qemudDomainMigratePerform, /* domainMigratePerform */
10367
    NULL, /* domainMigrateFinish */
10368
    qemudDomainBlockStats, /* domainBlockStats */
10369
    qemudDomainInterfaceStats, /* domainInterfaceStats */
10370
    qemudDomainMemoryStats, /* domainMemoryStats */
10371
    qemudDomainBlockPeek, /* domainBlockPeek */
R
Richard W.M. Jones 已提交
10372
    qemudDomainMemoryPeek, /* domainMemoryPeek */
10373
    qemuDomainGetBlockInfo, /* domainGetBlockInfo */
10374 10375
    nodeGetCellsFreeMemory, /* nodeGetCellsFreeMemory */
    nodeGetFreeMemory,  /* getFreeMemory */
10376 10377
    qemuDomainEventRegister, /* domainEventRegister */
    qemuDomainEventDeregister, /* domainEventDeregister */
D
Daniel Veillard 已提交
10378 10379
    qemudDomainMigratePrepare2, /* domainMigratePrepare2 */
    qemudDomainMigrateFinish2, /* domainMigrateFinish2 */
10380 10381 10382
    qemudNodeDeviceDettach, /* nodeDeviceDettach */
    qemudNodeDeviceReAttach, /* nodeDeviceReAttach */
    qemudNodeDeviceReset, /* nodeDeviceReset */
C
Chris Lalancette 已提交
10383
    qemudDomainMigratePrepareTunnel, /* domainMigratePrepareTunnel */
10384 10385 10386 10387
    qemuIsEncrypted, /* isEncrypted */
    qemuIsSecure, /* isSecure */
    qemuDomainIsActive, /* domainIsActive */
    qemuDomainIsPersistent, /* domainIsPersistent */
10388
    qemuDomainIsUpdated, /* domainIsUpdated */
10389
    qemuCPUCompare, /* cpuCompare */
10390
    qemuCPUBaseline, /* cpuBaseline */
10391
    qemuDomainGetJobInfo, /* domainGetJobInfo */
10392
    qemuDomainAbortJob, /* domainAbortJob */
10393
    qemuDomainMigrateSetMaxDowntime, /* domainMigrateSetMaxDowntime */
10394 10395
    qemuDomainEventRegisterAny, /* domainEventRegisterAny */
    qemuDomainEventDeregisterAny, /* domainEventDeregisterAny */
10396 10397 10398
    qemuDomainManagedSave, /* domainManagedSave */
    qemuDomainHasManagedSaveImage, /* domainHasManagedSaveImage */
    qemuDomainManagedSaveRemove, /* domainManagedSaveRemove */
C
Chris Lalancette 已提交
10399 10400 10401 10402 10403 10404 10405 10406 10407
    qemuDomainSnapshotCreateXML, /* domainSnapshotCreateXML */
    qemuDomainSnapshotDumpXML, /* domainSnapshotDumpXML */
    qemuDomainSnapshotNum, /* domainSnapshotNum */
    qemuDomainSnapshotListNames, /* domainSnapshotListNames */
    qemuDomainSnapshotLookupByName, /* domainSnapshotLookupByName */
    qemuDomainHasCurrentSnapshot, /* domainHasCurrentSnapshot */
    qemuDomainSnapshotCurrent, /* domainSnapshotCurrent */
    qemuDomainRevertToSnapshot, /* domainRevertToSnapshot */
    qemuDomainSnapshotDelete, /* domainSnapshotDelete */
10408
    qemuDomainMonitorCommand, /* qemuDomainMonitorCommand */
10409
    qemuDomainSetMemoryParameters, /* domainSetMemoryParameters */
10410
    qemuDomainGetMemoryParameters, /* domainGetMemoryParameters */
10411
    qemuDomainOpenConsole, /* domainOpenConsole */
10412 10413 10414
};


10415
static virStateDriver qemuStateDriver = {
10416
    .name = "QEMU",
10417 10418 10419 10420
    .initialize = qemudStartup,
    .cleanup = qemudShutdown,
    .reload = qemudReload,
    .active = qemudActive,
10421
};
10422

S
Stefan Berger 已提交
10423
static int
10424
qemudVMFilterRebuild(virConnectPtr conn ATTRIBUTE_UNUSED,
S
Stefan Berger 已提交
10425 10426 10427
                     virHashIterator iter, void *data)
{
    virHashForEach(qemu_driver->domains.objs, iter, data);
10428

S
Stefan Berger 已提交
10429 10430 10431
    return 0;
}

10432 10433 10434 10435 10436 10437 10438 10439 10440 10441 10442 10443 10444 10445 10446 10447 10448 10449 10450 10451 10452 10453
static int
qemudVMFiltersInstantiate(virConnectPtr conn,
                          virDomainDefPtr def)
{
    int err = 0;
    int i;

    if (!conn)
        return 1;

    for (i = 0 ; i < def->nnets ; i++) {
        virDomainNetDefPtr net = def->nets[i];
        if ((net->filter) && (net->ifname)) {
           if (virDomainConfNWFilterInstantiate(conn, net)) {
                err = 1;
                break;
            }
        }
    }

    return err;
}
S
Stefan Berger 已提交
10454

10455 10456 10457 10458 10459 10460 10461 10462 10463 10464 10465 10466 10467

static void
qemudVMDriverLock(void) {
    qemuDriverLock(qemu_driver);
};


static void
qemudVMDriverUnlock(void) {
    qemuDriverUnlock(qemu_driver);
};


S
Stefan Berger 已提交
10468 10469 10470
static virNWFilterCallbackDriver qemuCallbackDriver = {
    .name = "QEMU",
    .vmFilterRebuild = qemudVMFilterRebuild,
10471 10472
    .vmDriverLock = qemudVMDriverLock,
    .vmDriverUnlock = qemudVMDriverUnlock,
S
Stefan Berger 已提交
10473 10474
};

10475
int qemuRegister(void) {
10476 10477
    virRegisterDriver(&qemuDriver);
    virRegisterStateDriver(&qemuStateDriver);
S
Stefan Berger 已提交
10478
    virNWFilterRegisterCallbackDriver(&qemuCallbackDriver);
10479 10480
    return 0;
}