qemu_driver.c 320.2 KB
Newer Older
D
Daniel P. Berrange 已提交
1 2 3
/*
 * driver.c: core driver methods for managing qemu guests
 *
4
 * Copyright (C) 2006-2011 Red Hat, Inc.
D
Daniel P. Berrange 已提交
5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23
 * Copyright (C) 2006 Daniel P. Berrange
 *
 * This library is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * This library is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with this library; if not, write to the Free Software
 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307  USA
 *
 * Author: Daniel P. Berrange <berrange@redhat.com>
 */

24
#include <config.h>
25

D
Daniel P. Berrange 已提交
26 27
#include <sys/types.h>
#include <sys/poll.h>
28
#include <sys/time.h>
D
Daniel P. Berrange 已提交
29 30 31
#include <dirent.h>
#include <limits.h>
#include <string.h>
32
#include <stdbool.h>
D
Daniel P. Berrange 已提交
33 34 35 36 37
#include <stdio.h>
#include <stdarg.h>
#include <stdlib.h>
#include <unistd.h>
#include <errno.h>
38
#include <sys/utsname.h>
39 40 41 42
#include <sys/stat.h>
#include <fcntl.h>
#include <signal.h>
#include <paths.h>
43
#include <stdio.h>
44
#include <sys/wait.h>
45
#include <sys/ioctl.h>
46
#include <sys/un.h>
D
Daniel P. Berrange 已提交
47

48

49
#include "virterror_internal.h"
50
#include "logging.h"
51
#include "datatypes.h"
52 53
#include "qemu_driver.h"
#include "qemu_conf.h"
54
#include "qemu_capabilities.h"
55
#include "qemu_command.h"
56
#include "qemu_cgroup.h"
57
#include "qemu_hostdev.h"
58
#include "qemu_hotplug.h"
59
#include "qemu_monitor.h"
60
#include "qemu_bridge_filter.h"
61
#include "qemu_audit.h"
J
Jim Meyering 已提交
62
#include "c-ctype.h"
63
#include "event.h"
64
#include "buf.h"
65
#include "util.h"
66
#include "nodeinfo.h"
67
#include "stats_linux.h"
68
#include "capabilities.h"
69
#include "memory.h"
70
#include "uuid.h"
71
#include "domain_conf.h"
72 73
#include "node_device_conf.h"
#include "pci.h"
74
#include "hostusb.h"
75
#include "processinfo.h"
C
Chris Lalancette 已提交
76
#include "libvirt_internal.h"
77
#include "xml.h"
78
#include "cpu/cpu.h"
79
#include "macvtap.h"
80
#include "sysinfo.h"
81
#include "domain_nwfilter.h"
82
#include "hooks.h"
83
#include "storage_file.h"
84
#include "files.h"
85
#include "fdstream.h"
86
#include "configmake.h"
H
Hu Tao 已提交
87
#include "threadpool.h"
88

89 90
#define VIR_FROM_THIS VIR_FROM_QEMU

91 92 93
#define QEMU_VNC_PORT_MIN  5900
#define QEMU_VNC_PORT_MAX  65535

94 95
#define QEMU_NB_MEM_PARAM  3

96

97 98
#define timeval_to_ms(tv)       (((tv).tv_sec * 1000ull) + ((tv).tv_usec / 1000))

H
Hu Tao 已提交
99 100 101 102 103 104 105 106
struct watchdogEvent
{
    virDomainObjPtr vm;
    int action;
};

static void processWatchdogEvent(void *data, void *opaque);

107 108
static int qemudShutdown(void);

109 110 111
static void qemuDomainEventFlush(int timer, void *opaque);
static void qemuDomainEventQueue(struct qemud_driver *driver,
                                 virDomainEventPtr event);
112

J
Jiri Denemark 已提交
113 114
static int qemudDomainObjStart(virConnectPtr conn,
                               struct qemud_driver *driver,
115 116
                               virDomainObjPtr vm,
                               bool start_paused);
J
Jiri Denemark 已提交
117

118 119
static int qemudStartVMDaemon(virConnectPtr conn,
                              struct qemud_driver *driver,
120
                              virDomainObjPtr vm,
121
                              const char *migrateFrom,
122
                              bool start_paused,
123
                              int stdin_fd,
124 125
                              const char *stdin_path,
                              enum virVMOperationType vmop);
126

127
static void qemudShutdownVMDaemon(struct qemud_driver *driver,
128 129
                                  virDomainObjPtr vm,
                                  int migrated);
130

131
static int qemudDomainGetMaxVcpus(virDomainPtr dom);
132

133
static int qemuDetectVcpuPIDs(struct qemud_driver *driver,
134
                              virDomainObjPtr vm);
135

136 137 138
static int qemudVMFiltersInstantiate(virConnectPtr conn,
                                     virDomainDefPtr def);

J
Jim Meyering 已提交
139
static struct qemud_driver *qemu_driver = NULL;
140

141

H
Hu Tao 已提交
142 143 144 145 146 147 148 149 150 151 152 153 154 155 156
static int doStartCPUs(struct qemud_driver *driver, virDomainObjPtr vm, virConnectPtr conn)
{
    int ret;
    qemuDomainObjPrivatePtr priv = vm->privateData;

    qemuDomainObjEnterMonitorWithDriver(driver, vm);
    ret = qemuMonitorStartCPUs(priv->mon, conn);
    if (ret == 0) {
        vm->state = VIR_DOMAIN_RUNNING;
    }
    qemuDomainObjExitMonitorWithDriver(driver, vm);

    return ret;
}

H
Hu Tao 已提交
157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172
static int doStopCPUs(struct qemud_driver *driver, virDomainObjPtr vm)
{
    int ret;
    int oldState = vm->state;
    qemuDomainObjPrivatePtr priv = vm->privateData;

    vm->state = VIR_DOMAIN_PAUSED;
    qemuDomainObjEnterMonitorWithDriver(driver, vm);
    ret = qemuMonitorStopCPUs(priv->mon);
    qemuDomainObjExitMonitorWithDriver(driver, vm);
    if (ret < 0) {
        vm->state = oldState;
    }
    return ret;
}

173

174
static int
175
qemudLogFD(struct qemud_driver *driver, const char* name, bool append)
176
{
177
    char *logfile;
178
    mode_t logmode;
179
    int fd = -1;
180

181
    if (virAsprintf(&logfile, "%s/%s.log", driver->logDir, name) < 0) {
182
        virReportOOMError();
183 184 185 186
        return -1;
    }

    logmode = O_CREAT | O_WRONLY;
187
    /* Only logrotate files in /var/log, so only append if running privileged */
188
    if (driver->privileged || append)
189
        logmode |= O_APPEND;
190 191 192
    else
        logmode |= O_TRUNC;

193
    if ((fd = open(logfile, logmode, S_IRUSR | S_IWUSR)) < 0) {
194
        virReportSystemError(errno,
195 196
                             _("failed to create logfile %s"),
                             logfile);
197
        VIR_FREE(logfile);
198 199
        return -1;
    }
200
    VIR_FREE(logfile);
201
    if (virSetCloseExec(fd) < 0) {
202
        virReportSystemError(errno, "%s",
203
                             _("Unable to set VM logfile close-on-exec flag"));
204
        VIR_FORCE_CLOSE(fd);
205 206 207 208 209 210
        return -1;
    }
    return fd;
}


211
static int
212
qemudLogReadFD(const char* logDir, const char* name, off_t pos)
213
{
214
    char *logfile;
215
    mode_t logmode = O_RDONLY;
216
    int fd = -1;
217

218
    if (virAsprintf(&logfile, "%s/%s.log", logDir, name) < 0) {
219 220 221
        qemuReportError(VIR_ERR_INTERNAL_ERROR,
                        _("failed to build logfile name %s/%s.log"),
                        logDir, name);
222 223 224 225
        return -1;
    }

    if ((fd = open(logfile, logmode)) < 0) {
226
        virReportSystemError(errno,
227 228
                             _("failed to create logfile %s"),
                             logfile);
229
        VIR_FREE(logfile);
230 231
        return -1;
    }
232
    if (virSetCloseExec(fd) < 0) {
233
        virReportSystemError(errno, "%s",
234
                             _("Unable to set VM logfile close-on-exec flag"));
235
        VIR_FORCE_CLOSE(fd);
236
        VIR_FREE(logfile);
237 238
        return -1;
    }
239
    if (pos < 0 || lseek(fd, pos, SEEK_SET) < 0) {
240
        virReportSystemError(pos < 0 ? 0 : errno,
241 242
                             _("Unable to seek to %lld in %s"),
                             (long long) pos, logfile);
243
        VIR_FORCE_CLOSE(fd);
244
    }
245
    VIR_FREE(logfile);
246 247 248 249
    return fd;
}


250 251 252 253 254 255 256 257 258
struct qemuAutostartData {
    struct qemud_driver *driver;
    virConnectPtr conn;
};
static void
qemuAutostartDomain(void *payload, const char *name ATTRIBUTE_UNUSED, void *opaque)
{
    virDomainObjPtr vm = payload;
    struct qemuAutostartData *data = opaque;
259
    virErrorPtr err;
260 261

    virDomainObjLock(vm);
262 263 264 265 266 267 268 269 270
    virResetLastError();
    if (qemuDomainObjBeginJobWithDriver(data->driver, vm) < 0) {
        err = virGetLastError();
        VIR_ERROR(_("Failed to start job on VM '%s': %s"),
                  vm->def->name,
                  err ? err->message : _("unknown error"));
    } else {
        if (vm->autostart &&
            !virDomainObjIsActive(vm) &&
271
            qemudDomainObjStart(data->conn, data->driver, vm, false) < 0) {
272
            err = virGetLastError();
273
            VIR_ERROR(_("Failed to autostart VM '%s': %s"),
274
                      vm->def->name,
275
                      err ? err->message : _("unknown error"));
276
        }
277 278 279

        if (qemuDomainObjEndJob(vm) == 0)
            vm = NULL;
280
    }
281 282 283

    if (vm)
        virDomainObjUnlock(vm);
284 285
}

286 287
static void
qemudAutostartConfigs(struct qemud_driver *driver) {
288 289 290 291 292
    /* XXX: Figure out a better way todo this. The domain
     * startup code needs a connection handle in order
     * to lookup the bridge associated with a virtual
     * network
     */
293 294 295
    virConnectPtr conn = virConnectOpen(driver->privileged ?
                                        "qemu:///system" :
                                        "qemu:///session");
296
    /* Ignoring NULL conn which is mostly harmless here */
297
    struct qemuAutostartData data = { driver, conn };
298

299
    qemuDriverLock(driver);
300
    virHashForEach(driver->domains.objs, qemuAutostartDomain, &data);
301
    qemuDriverUnlock(driver);
302

303 304
    if (conn)
        virConnectClose(conn);
305 306
}

307 308 309 310 311 312 313 314 315

/**
 * qemudRemoveDomainStatus
 *
 * remove all state files of a domain from statedir
 *
 * Returns 0 on success
 */
static int
316
qemudRemoveDomainStatus(struct qemud_driver *driver,
317 318
                        virDomainObjPtr vm)
{
319
    char ebuf[1024];
320 321 322
    char *file = NULL;

    if (virAsprintf(&file, "%s/%s.xml", driver->stateDir, vm->def->name) < 0) {
323
        virReportOOMError();
D
Daniel Veillard 已提交
324
        return(-1);
325 326
    }

327
    if (unlink(file) < 0 && errno != ENOENT && errno != ENOTDIR)
328
        VIR_WARN("Failed to remove domain XML for %s: %s",
D
Daniel Veillard 已提交
329 330 331
                 vm->def->name, virStrerror(errno, ebuf, sizeof(ebuf)));
    VIR_FREE(file);

332
    if (virFileDeletePid(driver->stateDir, vm->def->name) != 0)
333
        VIR_WARN("Failed to remove PID file for %s: %s",
334
                 vm->def->name, virStrerror(errno, ebuf, sizeof(ebuf)));
335

D
Daniel Veillard 已提交
336

337
    return 0;
338 339
}

340 341 342 343 344 345 346 347 348 349 350 351 352

/*
 * This is a callback registered with a qemuMonitorPtr  instance,
 * and to be invoked when the monitor console hits an end of file
 * condition, or error, thus indicating VM shutdown should be
 * performed
 */
static void
qemuHandleMonitorEOF(qemuMonitorPtr mon ATTRIBUTE_UNUSED,
                     virDomainObjPtr vm,
                     int hasError) {
    struct qemud_driver *driver = qemu_driver;
    virDomainEventPtr event = NULL;
353
    qemuDomainObjPrivatePtr priv;
354

355
    VIR_DEBUG("Received EOF on %p '%s'", vm, vm->def->name);
356

357 358
    virDomainObjLock(vm);

359 360 361 362 363 364
    if (!virDomainObjIsActive(vm)) {
        VIR_DEBUG("Domain %p is not active, ignoring EOF", vm);
        virDomainObjUnlock(vm);
        return;
    }

365 366 367 368 369 370 371
    priv = vm->privateData;
    if (!hasError && priv->monJSON && !priv->gotShutdown) {
        VIR_DEBUG("Monitor connection to '%s' closed without SHUTDOWN event; "
                  "assuming the domain crashed", vm->def->name);
        hasError = 1;
    }

372 373 374 375 376 377
    event = virDomainEventNewFromObj(vm,
                                     VIR_DOMAIN_EVENT_STOPPED,
                                     hasError ?
                                     VIR_DOMAIN_EVENT_STOPPED_FAILED :
                                     VIR_DOMAIN_EVENT_STOPPED_SHUTDOWN);

378
    qemudShutdownVMDaemon(driver, vm, 0);
379 380
    qemuDomainStopAudit(vm, hasError ? "failed" : "shutdown");

381 382 383 384 385 386 387 388 389 390 391 392 393
    if (!vm->persistent)
        virDomainRemoveInactive(&driver->domains, vm);
    else
        virDomainObjUnlock(vm);

    if (event) {
        qemuDriverLock(driver);
        qemuDomainEventQueue(driver, event);
        qemuDriverUnlock(driver);
    }
}


394 395 396
static virDomainDiskDefPtr
findDomainDiskByPath(virDomainObjPtr vm,
                     const char *path)
397 398 399 400 401 402 403
{
    int i;

    for (i = 0; i < vm->def->ndisks; i++) {
        virDomainDiskDefPtr disk;

        disk = vm->def->disks[i];
404 405
        if (disk->src != NULL && STREQ(disk->src, path))
            return disk;
406
    }
407 408 409 410

    qemuReportError(VIR_ERR_INTERNAL_ERROR,
                    _("no disk found with path %s"),
                    path);
411 412 413
    return NULL;
}

414 415 416 417 418 419
static virDomainDiskDefPtr
findDomainDiskByAlias(virDomainObjPtr vm,
                      const char *alias)
{
    int i;

420 421 422
    if (STRPREFIX(alias, QEMU_DRIVE_HOST_PREFIX))
        alias += strlen(QEMU_DRIVE_HOST_PREFIX);

423 424 425 426 427 428 429 430 431 432 433 434 435 436
    for (i = 0; i < vm->def->ndisks; i++) {
        virDomainDiskDefPtr disk;

        disk = vm->def->disks[i];
        if (disk->info.alias != NULL && STREQ(disk->info.alias, alias))
            return disk;
    }

    qemuReportError(VIR_ERR_INTERNAL_ERROR,
                    _("no disk found with alias %s"),
                    alias);
    return NULL;
}

437
static int
438 439 440 441
getVolumeQcowPassphrase(virConnectPtr conn,
                        virDomainDiskDefPtr disk,
                        char **secretRet,
                        size_t *secretLen)
442 443 444 445 446
{
    virSecretPtr secret;
    char *passphrase;
    unsigned char *data;
    size_t size;
447
    int ret = -1;
448
    virStorageEncryptionPtr enc;
449

450 451 452 453 454 455 456
    if (!disk->encryption) {
        qemuReportError(VIR_ERR_INTERNAL_ERROR,
                        _("disk %s does not have any encryption information"),
                        disk->src);
        return -1;
    }
    enc = disk->encryption;
457 458

    if (!conn) {
459
        qemuReportError(VIR_ERR_INTERNAL_ERROR,
460
                        "%s", _("cannot find secrets without a connection"));
461
        goto cleanup;
462 463 464 465 466
    }

    if (conn->secretDriver == NULL ||
        conn->secretDriver->lookupByUUID == NULL ||
        conn->secretDriver->getValue == NULL) {
467 468
        qemuReportError(VIR_ERR_NO_SUPPORT, "%s",
                        _("secret storage not supported"));
469
        goto cleanup;
470 471 472 473 474 475
    }

    if (enc->format != VIR_STORAGE_ENCRYPTION_FORMAT_QCOW ||
        enc->nsecrets != 1 ||
        enc->secrets[0]->type !=
        VIR_STORAGE_ENCRYPTION_SECRET_TYPE_PASSPHRASE) {
476
        qemuReportError(VIR_ERR_XML_ERROR,
477
                        _("invalid <encryption> for volume %s"), disk->src);
478
        goto cleanup;
479 480 481 482 483
    }

    secret = conn->secretDriver->lookupByUUID(conn,
                                              enc->secrets[0]->uuid);
    if (secret == NULL)
484
        goto cleanup;
485 486 487 488
    data = conn->secretDriver->getValue(secret, &size,
                                        VIR_SECRET_GET_VALUE_INTERNAL_CALL);
    virUnrefSecret(secret);
    if (data == NULL)
489
        goto cleanup;
490 491 492 493

    if (memchr(data, '\0', size) != NULL) {
        memset(data, 0, size);
        VIR_FREE(data);
494
        qemuReportError(VIR_ERR_XML_ERROR,
495
                        _("format='qcow' passphrase for %s must not contain a "
496
                          "'\\0'"), disk->src);
497
        goto cleanup;
498 499 500 501 502
    }

    if (VIR_ALLOC_N(passphrase, size + 1) < 0) {
        memset(data, 0, size);
        VIR_FREE(data);
503
        virReportOOMError();
504
        goto cleanup;
505 506 507 508 509 510 511 512 513 514
    }
    memcpy(passphrase, data, size);
    passphrase[size] = '\0';

    memset(data, 0, size);
    VIR_FREE(data);

    *secretRet = passphrase;
    *secretLen = size;

515 516 517
    ret = 0;

cleanup:
518 519
    return ret;
}
520

521 522 523 524 525 526 527 528 529 530 531 532 533 534 535 536 537 538 539 540 541
static int
findVolumeQcowPassphrase(qemuMonitorPtr mon ATTRIBUTE_UNUSED,
                         virConnectPtr conn,
                         virDomainObjPtr vm,
                         const char *path,
                         char **secretRet,
                         size_t *secretLen)
{
    virDomainDiskDefPtr disk;
    int ret = -1;

    virDomainObjLock(vm);
    disk = findDomainDiskByPath(vm, path);

    if (!disk)
        goto cleanup;

    ret = getVolumeQcowPassphrase(conn, disk, secretRet, secretLen);

cleanup:
    virDomainObjUnlock(vm);
542
    return ret;
543 544
}

545 546 547 548 549 550 551 552 553 554 555 556 557 558 559 560 561 562 563 564 565 566

static int
qemuHandleDomainReset(qemuMonitorPtr mon ATTRIBUTE_UNUSED,
                      virDomainObjPtr vm)
{
    struct qemud_driver *driver = qemu_driver;
    virDomainEventPtr event;

    virDomainObjLock(vm);
    event = virDomainEventRebootNewFromObj(vm);
    virDomainObjUnlock(vm);

    if (event) {
        qemuDriverLock(driver);
        qemuDomainEventQueue(driver, event);
        qemuDriverUnlock(driver);
    }

    return 0;
}


567 568 569 570 571 572 573 574 575 576 577 578
static int
qemuHandleDomainShutdown(qemuMonitorPtr mon ATTRIBUTE_UNUSED,
                         virDomainObjPtr vm)
{
    virDomainObjLock(vm);
    ((qemuDomainObjPrivatePtr) vm->privateData)->gotShutdown = true;
    virDomainObjUnlock(vm);

    return 0;
}


579 580 581 582 583 584 585 586 587 588 589 590 591 592 593 594 595 596 597 598 599 600 601 602 603 604 605 606 607 608 609 610
static int
qemuHandleDomainStop(qemuMonitorPtr mon ATTRIBUTE_UNUSED,
                     virDomainObjPtr vm)
{
    struct qemud_driver *driver = qemu_driver;
    virDomainEventPtr event = NULL;

    virDomainObjLock(vm);
    if (vm->state == VIR_DOMAIN_RUNNING) {
        VIR_DEBUG("Transitioned guest %s to paused state due to unknown event", vm->def->name);

        vm->state = VIR_DOMAIN_PAUSED;
        event = virDomainEventNewFromObj(vm,
                                         VIR_DOMAIN_EVENT_SUSPENDED,
                                         VIR_DOMAIN_EVENT_SUSPENDED_PAUSED);

        if (virDomainSaveStatus(driver->caps, driver->stateDir, vm) < 0)
            VIR_WARN("Unable to save status on vm %s after IO error", vm->def->name);
    }
    virDomainObjUnlock(vm);

    if (event) {
        qemuDriverLock(driver);
        if (event)
            qemuDomainEventQueue(driver, event);
        qemuDriverUnlock(driver);
    }

    return 0;
}


611 612 613 614 615 616 617 618 619 620 621 622 623 624 625 626 627 628 629 630 631 632 633 634 635 636 637 638 639
static int
qemuHandleDomainRTCChange(qemuMonitorPtr mon ATTRIBUTE_UNUSED,
                          virDomainObjPtr vm,
                          long long offset)
{
    struct qemud_driver *driver = qemu_driver;
    virDomainEventPtr event;

    virDomainObjLock(vm);
    event = virDomainEventRTCChangeNewFromObj(vm, offset);

    if (vm->def->clock.offset == VIR_DOMAIN_CLOCK_OFFSET_VARIABLE)
        vm->def->clock.data.adjustment = offset;

    if (virDomainSaveStatus(driver->caps, driver->stateDir, vm) < 0)
        VIR_WARN0("unable to save domain status with RTC change");

    virDomainObjUnlock(vm);

    if (event) {
        qemuDriverLock(driver);
        qemuDomainEventQueue(driver, event);
        qemuDriverUnlock(driver);
    }

    return 0;
}


640 641 642 643 644 645
static int
qemuHandleDomainWatchdog(qemuMonitorPtr mon ATTRIBUTE_UNUSED,
                         virDomainObjPtr vm,
                         int action)
{
    struct qemud_driver *driver = qemu_driver;
646 647
    virDomainEventPtr watchdogEvent = NULL;
    virDomainEventPtr lifecycleEvent = NULL;
648 649

    virDomainObjLock(vm);
650 651 652 653 654 655 656 657 658 659 660 661 662 663
    watchdogEvent = virDomainEventWatchdogNewFromObj(vm, action);

    if (action == VIR_DOMAIN_EVENT_WATCHDOG_PAUSE &&
        vm->state == VIR_DOMAIN_RUNNING) {
        VIR_DEBUG("Transitioned guest %s to paused state due to watchdog", vm->def->name);

        vm->state = VIR_DOMAIN_PAUSED;
        lifecycleEvent = virDomainEventNewFromObj(vm,
                                                  VIR_DOMAIN_EVENT_SUSPENDED,
                                                  VIR_DOMAIN_EVENT_SUSPENDED_WATCHDOG);

        if (virDomainSaveStatus(driver->caps, driver->stateDir, vm) < 0)
            VIR_WARN("Unable to save status on vm %s after IO error", vm->def->name);
    }
H
Hu Tao 已提交
664 665 666 667 668 669 670 671 672 673 674

    if (vm->def->watchdog->action == VIR_DOMAIN_WATCHDOG_ACTION_DUMP) {
        struct watchdogEvent *wdEvent;
        if (VIR_ALLOC(wdEvent) == 0) {
            wdEvent->action = VIR_DOMAIN_WATCHDOG_ACTION_DUMP;
            wdEvent->vm = vm;
            ignore_value(virThreadPoolSendJob(driver->workerPool, wdEvent));
        } else
            virReportOOMError();
    }

675 676
    virDomainObjUnlock(vm);

677
    if (watchdogEvent || lifecycleEvent) {
678
        qemuDriverLock(driver);
679 680 681 682
        if (watchdogEvent)
            qemuDomainEventQueue(driver, watchdogEvent);
        if (lifecycleEvent)
            qemuDomainEventQueue(driver, lifecycleEvent);
683 684 685 686 687 688 689
        qemuDriverUnlock(driver);
    }

    return 0;
}


690 691 692 693
static int
qemuHandleDomainIOError(qemuMonitorPtr mon ATTRIBUTE_UNUSED,
                        virDomainObjPtr vm,
                        const char *diskAlias,
694 695
                        int action,
                        const char *reason)
696 697
{
    struct qemud_driver *driver = qemu_driver;
698
    virDomainEventPtr ioErrorEvent = NULL;
699
    virDomainEventPtr ioErrorEvent2 = NULL;
700
    virDomainEventPtr lifecycleEvent = NULL;
701 702 703 704 705 706 707 708 709 710 711 712 713 714 715
    const char *srcPath;
    const char *devAlias;
    virDomainDiskDefPtr disk;

    virDomainObjLock(vm);
    disk = findDomainDiskByAlias(vm, diskAlias);

    if (disk) {
        srcPath = disk->src;
        devAlias = disk->info.alias;
    } else {
        srcPath = "";
        devAlias = "";
    }

716
    ioErrorEvent = virDomainEventIOErrorNewFromObj(vm, srcPath, devAlias, action);
717
    ioErrorEvent2 = virDomainEventIOErrorReasonNewFromObj(vm, srcPath, devAlias, action, reason);
718 719 720 721 722 723 724 725 726 727 728 729 730

    if (action == VIR_DOMAIN_EVENT_IO_ERROR_PAUSE &&
        vm->state == VIR_DOMAIN_RUNNING) {
        VIR_DEBUG("Transitioned guest %s to paused state due to IO error", vm->def->name);

        vm->state = VIR_DOMAIN_PAUSED;
        lifecycleEvent = virDomainEventNewFromObj(vm,
                                                  VIR_DOMAIN_EVENT_SUSPENDED,
                                                  VIR_DOMAIN_EVENT_SUSPENDED_IOERROR);

        if (virDomainSaveStatus(driver->caps, driver->stateDir, vm) < 0)
            VIR_WARN("Unable to save status on vm %s after IO error", vm->def->name);
    }
731 732
    virDomainObjUnlock(vm);

733
    if (ioErrorEvent || ioErrorEvent2 || lifecycleEvent) {
734
        qemuDriverLock(driver);
735 736
        if (ioErrorEvent)
            qemuDomainEventQueue(driver, ioErrorEvent);
737 738
        if (ioErrorEvent2)
            qemuDomainEventQueue(driver, ioErrorEvent2);
739 740
        if (lifecycleEvent)
            qemuDomainEventQueue(driver, lifecycleEvent);
741 742 743 744 745 746 747
        qemuDriverUnlock(driver);
    }

    return 0;
}


748 749 750 751 752 753 754 755 756 757 758 759 760 761 762 763 764 765 766 767 768 769 770 771 772 773 774 775 776 777 778 779 780 781 782 783 784 785 786 787 788 789 790 791 792 793 794 795 796 797 798 799 800 801 802 803 804 805 806 807 808 809 810 811 812 813 814 815 816 817 818 819 820 821 822 823 824 825 826 827 828 829 830 831 832 833 834 835 836 837 838 839
static int
qemuHandleDomainGraphics(qemuMonitorPtr mon ATTRIBUTE_UNUSED,
                         virDomainObjPtr vm,
                         int phase,
                         int localFamily,
                         const char *localNode,
                         const char *localService,
                         int remoteFamily,
                         const char *remoteNode,
                         const char *remoteService,
                         const char *authScheme,
                         const char *x509dname,
                         const char *saslUsername)
{
    struct qemud_driver *driver = qemu_driver;
    virDomainEventPtr event;
    virDomainEventGraphicsAddressPtr localAddr = NULL;
    virDomainEventGraphicsAddressPtr remoteAddr = NULL;
    virDomainEventGraphicsSubjectPtr subject = NULL;
    int i;

    virDomainObjLock(vm);

    if (VIR_ALLOC(localAddr) < 0)
        goto no_memory;
    localAddr->family = localFamily;
    if (!(localAddr->service = strdup(localService)) ||
        !(localAddr->node = strdup(localNode)))
        goto no_memory;

    if (VIR_ALLOC(remoteAddr) < 0)
        goto no_memory;
    remoteAddr->family = remoteFamily;
    if (!(remoteAddr->service = strdup(remoteService)) ||
        !(remoteAddr->node = strdup(remoteNode)))
        goto no_memory;

    if (VIR_ALLOC(subject) < 0)
        goto no_memory;
    if (x509dname) {
        if (VIR_REALLOC_N(subject->identities, subject->nidentity+1) < 0)
            goto no_memory;
        if (!(subject->identities[subject->nidentity].type = strdup("x509dname")) ||
            !(subject->identities[subject->nidentity].name = strdup(x509dname)))
            goto no_memory;
        subject->nidentity++;
    }
    if (saslUsername) {
        if (VIR_REALLOC_N(subject->identities, subject->nidentity+1) < 0)
            goto no_memory;
        if (!(subject->identities[subject->nidentity].type = strdup("saslUsername")) ||
            !(subject->identities[subject->nidentity].name = strdup(saslUsername)))
            goto no_memory;
        subject->nidentity++;
    }

    event = virDomainEventGraphicsNewFromObj(vm, phase, localAddr, remoteAddr, authScheme, subject);
    virDomainObjUnlock(vm);

    if (event) {
        qemuDriverLock(driver);
        qemuDomainEventQueue(driver, event);
        qemuDriverUnlock(driver);
    }

    return 0;

no_memory:
    virReportOOMError();
    if (localAddr) {
        VIR_FREE(localAddr->service);
        VIR_FREE(localAddr->node);
        VIR_FREE(localAddr);
    }
    if (remoteAddr) {
        VIR_FREE(remoteAddr->service);
        VIR_FREE(remoteAddr->node);
        VIR_FREE(remoteAddr);
    }
    if (subject) {
        for (i = 0 ; i < subject->nidentity ; i++) {
            VIR_FREE(subject->identities[i].type);
            VIR_FREE(subject->identities[i].name);
        }
        VIR_FREE(subject->identities);
        VIR_FREE(subject);
    }

    return -1;
}


840 841 842 843 844 845 846 847 848
static void qemuHandleMonitorDestroy(qemuMonitorPtr mon,
                                     virDomainObjPtr vm)
{
    qemuDomainObjPrivatePtr priv = vm->privateData;
    if (priv->mon == mon)
        priv->mon = NULL;
    virDomainObjUnref(vm);
}

849
static qemuMonitorCallbacks monitorCallbacks = {
850
    .destroy = qemuHandleMonitorDestroy,
851 852
    .eofNotify = qemuHandleMonitorEOF,
    .diskSecretLookup = findVolumeQcowPassphrase,
853
    .domainShutdown = qemuHandleDomainShutdown,
854
    .domainStop = qemuHandleDomainStop,
855
    .domainReset = qemuHandleDomainReset,
856
    .domainRTCChange = qemuHandleDomainRTCChange,
857
    .domainWatchdog = qemuHandleDomainWatchdog,
858
    .domainIOError = qemuHandleDomainIOError,
859
    .domainGraphics = qemuHandleDomainGraphics,
860 861
};

862
static int
863
qemuConnectMonitor(struct qemud_driver *driver, virDomainObjPtr vm)
864
{
865
    qemuDomainObjPrivatePtr priv = vm->privateData;
866
    int ret = -1;
867

868
    if (virSecurityManagerSetSocketLabel(driver->securityManager, vm) < 0) {
869 870
        VIR_ERROR(_("Failed to set security context for monitor for %s"),
                  vm->def->name);
871 872 873
        goto error;
    }

874 875 876 877 878 879 880 881 882 883 884
    /* Hold an extra reference because we can't allow 'vm' to be
     * deleted while the monitor is active */
    virDomainObjRef(vm);

    priv->mon = qemuMonitorOpen(vm,
                                priv->monConfig,
                                priv->monJSON,
                                &monitorCallbacks);

    if (priv->mon == NULL)
        virDomainObjUnref(vm);
885

886
    if (virSecurityManagerClearSocketLabel(driver->securityManager, vm) < 0) {
887 888
        VIR_ERROR(_("Failed to clear security context for monitor for %s"),
                  vm->def->name);
889
        goto error;
890
    }
891

892 893 894 895 896 897
    if (priv->mon == NULL) {
        VIR_INFO("Failed to connect monitor for %s", vm->def->name);
        goto error;
    }


898 899 900 901
    qemuDomainObjEnterMonitorWithDriver(driver, vm);
    ret = qemuMonitorSetCapabilities(priv->mon);
    qemuDomainObjExitMonitorWithDriver(driver, vm);

902
error:
903
    if (ret < 0)
904 905 906
        qemuMonitorClose(priv->mon);

    return ret;
907
}
908

909 910 911 912
struct virReconnectDomainData {
    virConnectPtr conn;
    struct qemud_driver *driver;
};
913 914 915
/*
 * Open an existing VM's monitor, re-detect VCPU threads
 * and re-reserve the security labels in use
916
 */
917 918
static void
qemuReconnectDomain(void *payload, const char *name ATTRIBUTE_UNUSED, void *opaque)
919
{
920
    virDomainObjPtr obj = payload;
921 922
    struct virReconnectDomainData *data = opaque;
    struct qemud_driver *driver = data->driver;
923
    qemuDomainObjPrivatePtr priv;
924
    unsigned long long qemuCmdFlags;
925
    virConnectPtr conn = data->conn;
926 927

    virDomainObjLock(obj);
928

929 930
    VIR_DEBUG("Reconnect monitor to %p '%s'", obj, obj->def->name);

931 932
    priv = obj->privateData;

933
    /* XXX check PID liveliness & EXE path */
934
    if (qemuConnectMonitor(driver, obj) < 0)
935
        goto error;
936

937 938 939 940
    if (qemuUpdateActivePciHostdevs(driver, obj->def) < 0) {
        goto error;
    }

941 942 943
    /* XXX we should be persisting the original flags in the XML
     * not re-detecting them, since the binary may have changed
     * since launch time */
944 945 946
    if (qemuCapsExtractVersionInfo(obj->def->emulator,
                                   NULL,
                                   &qemuCmdFlags) >= 0 &&
947
        (qemuCmdFlags & QEMUD_CMD_FLAG_DEVICE)) {
948 949
        priv->persistentAddrs = 1;

950 951 952 953
        if (!(priv->pciaddrs = qemuDomainPCIAddressSetCreate(obj->def)) ||
            qemuAssignDevicePCISlots(obj->def, priv->pciaddrs) < 0)
            goto error;
    }
954

955
    if (virSecurityManagerReserveLabel(driver->securityManager, obj) < 0)
956
        goto error;
957

958 959 960
    if (qemudVMFiltersInstantiate(conn, obj->def))
        goto error;

961 962
    if (obj->def->id >= driver->nextvmid)
        driver->nextvmid = obj->def->id + 1;
963

964 965
    virDomainObjUnlock(obj);
    return;
966

967
error:
968 969 970
    /* We can't get the monitor back, so must kill the VM
     * to remove danger of it ending up running twice if
     * user tries to start it again later */
971
    qemudShutdownVMDaemon(driver, obj, 0);
972 973 974 975
    if (!obj->persistent)
        virDomainRemoveInactive(&driver->domains, obj);
    else
        virDomainObjUnlock(obj);
976
}
977

978
/**
979
 * qemudReconnectDomains
980 981 982 983 984
 *
 * Try to re-open the resources for live VMs that we care
 * about.
 */
static void
985
qemuReconnectDomains(virConnectPtr conn, struct qemud_driver *driver)
986
{
987 988
    struct virReconnectDomainData data = {conn, driver};
    virHashForEach(driver->domains.objs, qemuReconnectDomain, &data);
989 990
}

991

992
static int
993
qemuSecurityInit(struct qemud_driver *driver)
994
{
995 996 997 998
    virSecurityManagerPtr mgr = virSecurityManagerNew(driver->securityDriverName,
                                                      driver->allowDiskFormatProbing);
    if (!mgr)
        goto error;
999

1000 1001 1002 1003 1004 1005 1006
    if (driver->privileged) {
        virSecurityManagerPtr dac = virSecurityManagerNewDAC(driver->user,
                                                             driver->group,
                                                             driver->allowDiskFormatProbing,
                                                             driver->dynamicOwnership);
        if (!dac)
            goto error;
1007

1008 1009 1010
        if (!(driver->securityManager = virSecurityManagerNewStack(mgr,
                                                                   dac)))
            goto error;
1011
    } else {
1012
        driver->securityManager = mgr;
1013 1014
    }

1015
    return 0;
1016 1017 1018 1019 1020

error:
    VIR_ERROR0(_("Failed to initialize security drivers"));
    virSecurityManagerFree(mgr);
    return -1;
1021
}
1022 1023


1024 1025
static virCapsPtr
qemuCreateCapabilities(virCapsPtr oldcaps,
1026
                       struct qemud_driver *driver)
1027 1028 1029 1030
{
    virCapsPtr caps;

    /* Basic host arch / guest machine capabilities */
1031
    if (!(caps = qemuCapsInit(oldcaps))) {
1032
        virReportOOMError();
1033 1034 1035
        return NULL;
    }

1036 1037 1038 1039 1040 1041 1042 1043
    if (driver->allowDiskFormatProbing) {
        caps->defaultDiskDriverName = NULL;
        caps->defaultDiskDriverType = NULL;
    } else {
        caps->defaultDiskDriverName = "qemu";
        caps->defaultDiskDriverType = "raw";
    }

1044 1045
    qemuDomainSetPrivateDataHooks(caps);
    qemuDomainSetNamespaceHooks(caps);
1046

1047 1048 1049 1050 1051
    if (virGetHostUUID(caps->host.host_uuid)) {
        qemuReportError(VIR_ERR_INTERNAL_ERROR,
                         "%s", _("cannot get the host uuid"));
        goto err_exit;
    }
1052 1053

    /* Security driver data */
1054
    const char *doi, *model;
1055

1056 1057 1058
    doi = virSecurityManagerGetDOI(driver->securityManager);
    model = virSecurityManagerGetModel(driver->securityManager);
    if (STRNEQ(model, "none")) {
1059 1060 1061 1062 1063 1064
        if (!(caps->host.secModel.model = strdup(model)))
            goto no_memory;
        if (!(caps->host.secModel.doi = strdup(doi)))
            goto no_memory;
    }

1065 1066 1067
    VIR_DEBUG("Initialized caps for security driver \"%s\" with "
              "DOI \"%s\"", model, doi);

1068 1069 1070
    return caps;

no_memory:
1071
    virReportOOMError();
1072
err_exit:
1073 1074 1075
    virCapabilitiesFree(caps);
    return NULL;
}
1076

C
Chris Lalancette 已提交
1077 1078 1079 1080 1081 1082 1083 1084 1085 1086 1087 1088 1089 1090 1091 1092 1093
static void qemuDomainSnapshotLoad(void *payload,
                                   const char *name ATTRIBUTE_UNUSED,
                                   void *data)
{
    virDomainObjPtr vm = (virDomainObjPtr)payload;
    char *baseDir = (char *)data;
    char *snapDir = NULL;
    DIR *dir = NULL;
    struct dirent *entry;
    char *xmlStr;
    int ret;
    char *fullpath;
    virDomainSnapshotDefPtr def = NULL;
    char ebuf[1024];

    virDomainObjLock(vm);
    if (virAsprintf(&snapDir, "%s/%s", baseDir, vm->def->name) < 0) {
1094
        VIR_ERROR(_("Failed to allocate memory for snapshot directory for domain %s"),
C
Chris Lalancette 已提交
1095 1096 1097 1098 1099 1100 1101 1102 1103
                   vm->def->name);
        goto cleanup;
    }

    VIR_INFO("Scanning for snapshots for domain %s in %s", vm->def->name,
             snapDir);

    if (!(dir = opendir(snapDir))) {
        if (errno != ENOENT)
1104
            VIR_ERROR(_("Failed to open snapshot directory %s for domain %s: %s"),
C
Chris Lalancette 已提交
1105 1106 1107 1108 1109 1110 1111 1112 1113 1114 1115 1116 1117 1118
                      snapDir, vm->def->name,
                      virStrerror(errno, ebuf, sizeof(ebuf)));
        goto cleanup;
    }

    while ((entry = readdir(dir))) {
        if (entry->d_name[0] == '.')
            continue;

        /* NB: ignoring errors, so one malformed config doesn't
           kill the whole process */
        VIR_INFO("Loading snapshot file '%s'", entry->d_name);

        if (virAsprintf(&fullpath, "%s/%s", snapDir, entry->d_name) < 0) {
1119
            VIR_ERROR0(_("Failed to allocate memory for path"));
C
Chris Lalancette 已提交
1120 1121 1122 1123 1124 1125
            continue;
        }

        ret = virFileReadAll(fullpath, 1024*1024*1, &xmlStr);
        if (ret < 0) {
            /* Nothing we can do here, skip this one */
1126
            VIR_ERROR(_("Failed to read snapshot file %s: %s"), fullpath,
C
Chris Lalancette 已提交
1127
                      virStrerror(errno, ebuf, sizeof(ebuf)));
1128
            VIR_FREE(fullpath);
C
Chris Lalancette 已提交
1129 1130 1131 1132 1133 1134
            continue;
        }

        def = virDomainSnapshotDefParseString(xmlStr, 0);
        if (def == NULL) {
            /* Nothing we can do here, skip this one */
1135
            VIR_ERROR(_("Failed to parse snapshot XML from file '%s'"), fullpath);
1136
            VIR_FREE(fullpath);
C
Chris Lalancette 已提交
1137 1138 1139 1140
            VIR_FREE(xmlStr);
            continue;
        }

1141
        virDomainSnapshotAssignDef(&vm->snapshots, def);
C
Chris Lalancette 已提交
1142

1143
        VIR_FREE(fullpath);
C
Chris Lalancette 已提交
1144 1145 1146 1147 1148 1149 1150 1151 1152 1153 1154 1155 1156 1157 1158 1159 1160 1161 1162 1163 1164
        VIR_FREE(xmlStr);
    }

    /* FIXME: qemu keeps internal track of snapshots.  We can get access
     * to this info via the "info snapshots" monitor command for running
     * domains, or via "qemu-img snapshot -l" for shutoff domains.  It would
     * be nice to update our internal state based on that, but there is a
     * a problem.  qemu doesn't track all of the same metadata that we do.
     * In particular we wouldn't be able to fill in the <parent>, which is
     * pretty important in our metadata.
     */

    virResetLastError();

cleanup:
    if (dir)
        closedir(dir);
    VIR_FREE(snapDir);
    virDomainObjUnlock(vm);
}

1165 1166 1167 1168 1169 1170
/**
 * qemudStartup:
 *
 * Initialization function for the QEmu daemon
 */
static int
1171
qemudStartup(int privileged) {
1172
    char *base = NULL;
1173
    char *driverConf = NULL;
1174
    int rc;
1175
    virConnectPtr conn = NULL;
1176

1177
    if (VIR_ALLOC(qemu_driver) < 0)
1178 1179
        return -1;

1180
    if (virMutexInit(&qemu_driver->lock) < 0) {
1181
        VIR_ERROR0(_("cannot initialize mutex"));
1182 1183 1184
        VIR_FREE(qemu_driver);
        return -1;
    }
1185
    qemuDriverLock(qemu_driver);
1186
    qemu_driver->privileged = privileged;
1187

1188 1189 1190
    /* Don't have a dom0 so start from 1 */
    qemu_driver->nextvmid = 1;

1191 1192 1193
    if (virDomainObjListInit(&qemu_driver->domains) < 0)
        goto out_of_memory;

1194
    /* Init callback list */
1195
    if (VIR_ALLOC(qemu_driver->domainEventCallbacks) < 0)
1196
        goto out_of_memory;
1197 1198 1199 1200 1201 1202
    if (!(qemu_driver->domainEventQueue = virDomainEventQueueNew()))
        goto out_of_memory;

    if ((qemu_driver->domainEventTimer =
         virEventAddTimeout(-1, qemuDomainEventFlush, qemu_driver, NULL)) < 0)
        goto error;
1203

1204 1205 1206 1207 1208
    /* Allocate bitmap for vnc port reservation */
    if ((qemu_driver->reservedVNCPorts =
         virBitmapAlloc(QEMU_VNC_PORT_MAX - QEMU_VNC_PORT_MIN)) == NULL)
        goto out_of_memory;

1209 1210 1211 1212
    /* read the host sysinfo */
    if (privileged)
        qemu_driver->hostsysinfo = virSysinfoRead();

1213
    if (privileged) {
1214
        if (virAsprintf(&qemu_driver->logDir,
1215
                        "%s/log/libvirt/qemu", LOCALSTATEDIR) == -1)
1216
            goto out_of_memory;
1217

1218
        if ((base = strdup (SYSCONFDIR "/libvirt")) == NULL)
1219
            goto out_of_memory;
1220 1221

        if (virAsprintf(&qemu_driver->stateDir,
1222
                      "%s/run/libvirt/qemu", LOCALSTATEDIR) == -1)
1223
            goto out_of_memory;
1224 1225

        if (virAsprintf(&qemu_driver->libDir,
1226
                      "%s/lib/libvirt/qemu", LOCALSTATEDIR) == -1)
1227 1228 1229
            goto out_of_memory;

        if (virAsprintf(&qemu_driver->cacheDir,
1230
                      "%s/cache/libvirt/qemu", LOCALSTATEDIR) == -1)
1231
            goto out_of_memory;
1232
        if (virAsprintf(&qemu_driver->saveDir,
1233
                      "%s/lib/libvirt/qemu/save", LOCALSTATEDIR) == -1)
1234
            goto out_of_memory;
C
Chris Lalancette 已提交
1235
        if (virAsprintf(&qemu_driver->snapshotDir,
1236
                        "%s/lib/libvirt/qemu/snapshot", LOCALSTATEDIR) == -1)
C
Chris Lalancette 已提交
1237
            goto out_of_memory;
H
Hu Tao 已提交
1238 1239 1240
        if (virAsprintf(&qemu_driver->autoDumpPath,
                        "%s/lib/libvirt/qemu/dump", LOCALSTATEDIR) == -1)
            goto out_of_memory;
1241
    } else {
1242
        uid_t uid = geteuid();
1243
        char *userdir = virGetUserDirectory(uid);
1244
        if (!userdir)
1245
            goto error;
1246

1247
        if (virAsprintf(&qemu_driver->logDir,
1248 1249
                        "%s/.libvirt/qemu/log", userdir) == -1) {
            VIR_FREE(userdir);
1250
            goto out_of_memory;
1251
        }
1252

1253 1254
        if (virAsprintf(&base, "%s/.libvirt", userdir) == -1) {
            VIR_FREE(userdir);
1255
            goto out_of_memory;
1256 1257
        }
        VIR_FREE(userdir);
1258 1259 1260

        if (virAsprintf(&qemu_driver->stateDir, "%s/qemu/run", base) == -1)
            goto out_of_memory;
1261 1262 1263 1264
        if (virAsprintf(&qemu_driver->libDir, "%s/qemu/lib", base) == -1)
            goto out_of_memory;
        if (virAsprintf(&qemu_driver->cacheDir, "%s/qemu/cache", base) == -1)
            goto out_of_memory;
1265 1266
        if (virAsprintf(&qemu_driver->saveDir, "%s/qemu/save", base) == -1)
            goto out_of_memory;
C
Chris Lalancette 已提交
1267 1268
        if (virAsprintf(&qemu_driver->snapshotDir, "%s/qemu/snapshot", base) == -1)
            goto out_of_memory;
H
Hu Tao 已提交
1269 1270
        if (virAsprintf(&qemu_driver->autoDumpPath, "%s/qemu/dump", base) == -1)
            goto out_of_memory;
1271 1272
    }

L
Laine Stump 已提交
1273
    if (virFileMakePath(qemu_driver->stateDir) != 0) {
1274
        char ebuf[1024];
1275
        VIR_ERROR(_("Failed to create state dir '%s': %s"),
1276
                  qemu_driver->stateDir, virStrerror(errno, ebuf, sizeof ebuf));
1277
        goto error;
1278
    }
L
Laine Stump 已提交
1279
    if (virFileMakePath(qemu_driver->libDir) != 0) {
1280
        char ebuf[1024];
1281
        VIR_ERROR(_("Failed to create lib dir '%s': %s"),
1282 1283 1284
                  qemu_driver->libDir, virStrerror(errno, ebuf, sizeof ebuf));
        goto error;
    }
L
Laine Stump 已提交
1285
    if (virFileMakePath(qemu_driver->cacheDir) != 0) {
1286
        char ebuf[1024];
1287
        VIR_ERROR(_("Failed to create cache dir '%s': %s"),
1288 1289 1290
                  qemu_driver->cacheDir, virStrerror(errno, ebuf, sizeof ebuf));
        goto error;
    }
1291 1292 1293 1294 1295 1296
    if (virFileMakePath(qemu_driver->saveDir) != 0) {
        char ebuf[1024];
        VIR_ERROR(_("Failed to create save dir '%s': %s"),
                  qemu_driver->saveDir, virStrerror(errno, ebuf, sizeof ebuf));
        goto error;
    }
C
Chris Lalancette 已提交
1297 1298 1299 1300 1301 1302
    if (virFileMakePath(qemu_driver->snapshotDir) != 0) {
        char ebuf[1024];
        VIR_ERROR(_("Failed to create save dir '%s': %s"),
                  qemu_driver->snapshotDir, virStrerror(errno, ebuf, sizeof ebuf));
        goto error;
    }
H
Hu Tao 已提交
1303 1304 1305 1306 1307 1308
    if (virFileMakePath(qemu_driver->autoDumpPath) != 0) {
        char ebuf[1024];
        VIR_ERROR(_("Failed to create dump dir '%s': %s"),
                  qemu_driver->autoDumpPath, virStrerror(errno, ebuf, sizeof ebuf));
        goto error;
    }
1309 1310 1311 1312

    /* Configuration paths are either ~/.libvirt/qemu/... (session) or
     * /etc/libvirt/qemu/... (system).
     */
1313 1314 1315
    if (virAsprintf(&driverConf, "%s/qemu.conf", base) < 0 ||
        virAsprintf(&qemu_driver->configDir, "%s/qemu", base) < 0 ||
        virAsprintf(&qemu_driver->autostartDir, "%s/qemu/autostart", base) < 0)
1316 1317
        goto out_of_memory;

1318
    VIR_FREE(base);
1319

1320 1321 1322 1323 1324 1325 1326
    rc = virCgroupForDriver("qemu", &qemu_driver->cgroup, privileged, 1);
    if (rc < 0) {
        char buf[1024];
        VIR_WARN("Unable to create cgroup for driver: %s",
                 virStrerror(-rc, buf, sizeof(buf)));
    }

1327 1328 1329
    if (qemudLoadDriverConfig(qemu_driver, driverConf) < 0) {
        goto error;
    }
1330
    VIR_FREE(driverConf);
1331

1332
    if (qemuSecurityInit(qemu_driver) < 0)
1333
        goto error;
D
Daniel P. Berrange 已提交
1334

1335
    if ((qemu_driver->caps = qemuCreateCapabilities(NULL,
1336
                                                    qemu_driver)) == NULL)
1337
        goto error;
1338

1339
    if ((qemu_driver->activePciHostdevs = pciDeviceListNew()) == NULL)
1340 1341
        goto error;

1342 1343
    if (privileged) {
        if (chown(qemu_driver->libDir, qemu_driver->user, qemu_driver->group) < 0) {
1344
            virReportSystemError(errno,
1345 1346 1347 1348 1349
                                 _("unable to set ownership of '%s' to user %d:%d"),
                                 qemu_driver->libDir, qemu_driver->user, qemu_driver->group);
            goto error;
        }
        if (chown(qemu_driver->cacheDir, qemu_driver->user, qemu_driver->group) < 0) {
1350
            virReportSystemError(errno,
1351 1352 1353 1354
                                 _("unable to set ownership of '%s' to %d:%d"),
                                 qemu_driver->cacheDir, qemu_driver->user, qemu_driver->group);
            goto error;
        }
1355 1356 1357 1358 1359 1360
        if (chown(qemu_driver->saveDir, qemu_driver->user, qemu_driver->group) < 0) {
            virReportSystemError(errno,
                                 _("unable to set ownership of '%s' to %d:%d"),
                                 qemu_driver->saveDir, qemu_driver->user, qemu_driver->group);
            goto error;
        }
C
Chris Lalancette 已提交
1361 1362 1363 1364 1365 1366
        if (chown(qemu_driver->snapshotDir, qemu_driver->user, qemu_driver->group) < 0) {
            virReportSystemError(errno,
                                 _("unable to set ownership of '%s' to %d:%d"),
                                 qemu_driver->snapshotDir, qemu_driver->user, qemu_driver->group);
            goto error;
        }
1367 1368
    }

1369 1370 1371 1372 1373 1374 1375 1376 1377 1378 1379 1380 1381 1382
    /* If hugetlbfs is present, then we need to create a sub-directory within
     * it, since we can't assume the root mount point has permissions that
     * will let our spawned QEMU instances use it.
     *
     * NB the check for '/', since user may config "" to disable hugepages
     * even when mounted
     */
    if (qemu_driver->hugetlbfs_mount &&
        qemu_driver->hugetlbfs_mount[0] == '/') {
        char *mempath = NULL;
        if (virAsprintf(&mempath, "%s/libvirt/qemu", qemu_driver->hugetlbfs_mount) < 0)
            goto out_of_memory;

        if ((rc = virFileMakePath(mempath)) != 0) {
1383
            virReportSystemError(rc,
1384 1385 1386 1387 1388 1389
                                 _("unable to create hugepage path %s"), mempath);
            VIR_FREE(mempath);
            goto error;
        }
        if (qemu_driver->privileged &&
            chown(mempath, qemu_driver->user, qemu_driver->group) < 0) {
1390
            virReportSystemError(errno,
1391 1392 1393 1394 1395 1396 1397 1398 1399
                                 _("unable to set ownership on %s to %d:%d"),
                                 mempath, qemu_driver->user, qemu_driver->group);
            VIR_FREE(mempath);
            goto error;
        }

        qemu_driver->hugepage_path = mempath;
    }

1400
    /* Get all the running persistent or transient configs first */
1401
    if (virDomainLoadAllConfigs(qemu_driver->caps,
1402 1403 1404 1405 1406 1407
                                &qemu_driver->domains,
                                qemu_driver->stateDir,
                                NULL,
                                1, NULL, NULL) < 0)
        goto error;

1408 1409 1410 1411 1412
    conn = virConnectOpen(qemu_driver->privileged ?
                          "qemu:///system" :
                          "qemu:///session");

    qemuReconnectDomains(conn, qemu_driver);
1413 1414

    /* Then inactive persistent configs */
1415
    if (virDomainLoadAllConfigs(qemu_driver->caps,
1416 1417
                                &qemu_driver->domains,
                                qemu_driver->configDir,
1418
                                qemu_driver->autostartDir,
1419
                                0, NULL, NULL) < 0)
1420
        goto error;
C
Chris Lalancette 已提交
1421 1422 1423 1424 1425


    virHashForEach(qemu_driver->domains.objs, qemuDomainSnapshotLoad,
                   qemu_driver->snapshotDir);

1426 1427
    qemuDriverUnlock(qemu_driver);

1428 1429
    qemudAutostartConfigs(qemu_driver);

H
Hu Tao 已提交
1430 1431 1432 1433
    qemu_driver->workerPool = virThreadPoolNew(0, 1, processWatchdogEvent, qemu_driver);
    if (!qemu_driver->workerPool)
        goto error;

1434 1435
    if (conn)
        virConnectClose(conn);
1436

1437 1438
    return 0;

1439
out_of_memory:
1440
    virReportOOMError();
1441 1442 1443
error:
    if (qemu_driver)
        qemuDriverUnlock(qemu_driver);
1444 1445
    if (conn)
        virConnectClose(conn);
1446
    VIR_FREE(base);
1447
    VIR_FREE(driverConf);
1448
    qemudShutdown();
1449 1450 1451
    return -1;
}

1452 1453 1454 1455
static void qemudNotifyLoadDomain(virDomainObjPtr vm, int newVM, void *opaque)
{
    struct qemud_driver *driver = opaque;

1456 1457 1458 1459 1460 1461 1462 1463
    if (newVM) {
        virDomainEventPtr event =
            virDomainEventNewFromObj(vm,
                                     VIR_DOMAIN_EVENT_DEFINED,
                                     VIR_DOMAIN_EVENT_DEFINED_ADDED);
        if (event)
            qemuDomainEventQueue(driver, event);
    }
1464 1465
}

1466 1467 1468 1469 1470 1471 1472 1473
/**
 * qemudReload:
 *
 * Function to restart the QEmu daemon, it will recheck the configuration
 * files and update its state and the networking
 */
static int
qemudReload(void) {
1474 1475 1476
    if (!qemu_driver)
        return 0;

1477
    qemuDriverLock(qemu_driver);
1478
    virDomainLoadAllConfigs(qemu_driver->caps,
1479 1480
                            &qemu_driver->domains,
                            qemu_driver->configDir,
1481
                            qemu_driver->autostartDir,
1482
                            0, qemudNotifyLoadDomain, qemu_driver);
1483
    qemuDriverUnlock(qemu_driver);
1484

1485
    qemudAutostartConfigs(qemu_driver);
1486 1487

    return 0;
1488 1489
}

1490 1491 1492 1493 1494 1495 1496 1497 1498 1499
/**
 * qemudActive:
 *
 * Checks if the QEmu daemon is active, i.e. has an active domain or
 * an active network
 *
 * Returns 1 if active, 0 otherwise
 */
static int
qemudActive(void) {
1500
    int active = 0;
1501

1502 1503 1504
    if (!qemu_driver)
        return 0;

1505
    /* XXX having to iterate here is not great because it requires many locks */
1506
    qemuDriverLock(qemu_driver);
1507
    active = virDomainObjListNumOfDomains(&qemu_driver->domains, 1);
1508 1509
    qemuDriverUnlock(qemu_driver);
    return active;
1510 1511
}

1512 1513 1514 1515 1516 1517 1518
/**
 * qemudShutdown:
 *
 * Shutdown the QEmu daemon, it will stop all active domains and networks
 */
static int
qemudShutdown(void) {
1519
    int i;
1520

1521
    if (!qemu_driver)
1522
        return -1;
1523

1524
    qemuDriverLock(qemu_driver);
1525
    pciDeviceListFree(qemu_driver->activePciHostdevs);
1526 1527
    virCapabilitiesFree(qemu_driver->caps);

1528
    virDomainObjListDeinit(&qemu_driver->domains);
1529
    virBitmapFree(qemu_driver->reservedVNCPorts);
1530

1531 1532
    virSysinfoDefFree(qemu_driver->hostsysinfo);

1533 1534
    VIR_FREE(qemu_driver->configDir);
    VIR_FREE(qemu_driver->autostartDir);
E
Eric Blake 已提交
1535
    VIR_FREE(qemu_driver->logDir);
1536
    VIR_FREE(qemu_driver->stateDir);
1537 1538
    VIR_FREE(qemu_driver->libDir);
    VIR_FREE(qemu_driver->cacheDir);
1539
    VIR_FREE(qemu_driver->saveDir);
C
Chris Lalancette 已提交
1540
    VIR_FREE(qemu_driver->snapshotDir);
H
Hu Tao 已提交
1541
    VIR_FREE(qemu_driver->autoDumpPath);
1542
    VIR_FREE(qemu_driver->vncTLSx509certdir);
J
Jim Meyering 已提交
1543
    VIR_FREE(qemu_driver->vncListen);
1544
    VIR_FREE(qemu_driver->vncPassword);
1545
    VIR_FREE(qemu_driver->vncSASLdir);
E
Eric Blake 已提交
1546 1547 1548
    VIR_FREE(qemu_driver->spiceTLSx509certdir);
    VIR_FREE(qemu_driver->spiceListen);
    VIR_FREE(qemu_driver->spicePassword);
1549 1550
    VIR_FREE(qemu_driver->hugetlbfs_mount);
    VIR_FREE(qemu_driver->hugepage_path);
E
Eric Blake 已提交
1551 1552 1553
    VIR_FREE(qemu_driver->saveImageFormat);
    VIR_FREE(qemu_driver->dumpImageFormat);

1554 1555
    virSecurityManagerFree(qemu_driver->securityManager);

E
Eric Blake 已提交
1556
    ebtablesContextFree(qemu_driver->ebtables);
D
Daniel P. Berrange 已提交
1557

1558 1559 1560 1561 1562 1563
    if (qemu_driver->cgroupDeviceACL) {
        for (i = 0 ; qemu_driver->cgroupDeviceACL[i] != NULL ; i++)
            VIR_FREE(qemu_driver->cgroupDeviceACL[i]);
        VIR_FREE(qemu_driver->cgroupDeviceACL);
    }

1564 1565
    /* Free domain callback list */
    virDomainEventCallbackListFree(qemu_driver->domainEventCallbacks);
1566 1567 1568 1569
    virDomainEventQueueFree(qemu_driver->domainEventQueue);

    if (qemu_driver->domainEventTimer != -1)
        virEventRemoveTimeout(qemu_driver->domainEventTimer);
1570

1571 1572 1573
    if (qemu_driver->brctl)
        brShutdown(qemu_driver->brctl);

1574 1575
    virCgroupFree(&qemu_driver->cgroup);

1576
    qemuDriverUnlock(qemu_driver);
1577
    virMutexDestroy(&qemu_driver->lock);
H
Hu Tao 已提交
1578
    virThreadPoolFree(qemu_driver->workerPool);
1579
    VIR_FREE(qemu_driver);
1580 1581

    return 0;
1582 1583
}

1584
typedef int qemuLogHandleOutput(virDomainObjPtr vm,
1585 1586
                                const char *output,
                                int fd);
1587 1588 1589 1590 1591

/*
 * Returns -1 for error, 0 on success
 */
static int
1592
qemudReadLogOutput(virDomainObjPtr vm,
1593 1594
                   int fd,
                   char *buf,
G
Guido Günther 已提交
1595
                   size_t buflen,
1596
                   qemuLogHandleOutput func,
1597 1598 1599
                   const char *what,
                   int timeout)
{
1600
    int retries = (timeout*10);
1601
    int got = 0;
1602 1603 1604
    buf[0] = '\0';

    while (retries) {
1605
        ssize_t func_ret, ret;
1606
        int isdead = 0;
G
Guido Günther 已提交
1607

1608
        func_ret = func(vm, buf, fd);
1609

1610 1611
        if (kill(vm->pid, 0) == -1 && errno == ESRCH)
            isdead = 1;
1612

1613 1614
        /* Any failures should be detected before we read the log, so we
         * always have something useful to report on failure. */
1615 1616
        ret = saferead(fd, buf+got, buflen-got-1);
        if (ret < 0) {
1617
            virReportSystemError(errno,
1618 1619 1620 1621 1622
                                 _("Failure while reading %s log output"),
                                 what);
            return -1;
        }

1623 1624 1625
        got += ret;
        buf[got] = '\0';
        if (got == buflen-1) {
1626
            qemuReportError(VIR_ERR_INTERNAL_ERROR,
1627 1628
                            _("Out of space while reading %s log output: %s"),
                            what, buf);
1629 1630 1631 1632
            return -1;
        }

        if (isdead) {
1633
            qemuReportError(VIR_ERR_INTERNAL_ERROR,
1634 1635
                            _("Process exited while reading %s log output: %s"),
                            what, buf);
1636 1637 1638
            return -1;
        }

1639 1640
        if (func_ret <= 0)
            return func_ret;
1641 1642 1643 1644

        usleep(100*1000);
        retries--;
    }
1645

1646
    qemuReportError(VIR_ERR_INTERNAL_ERROR,
1647 1648
                    _("Timed out while reading %s log output: %s"),
                    what, buf);
1649 1650 1651
    return -1;
}

1652

1653 1654 1655 1656 1657 1658 1659 1660
/*
 * Look at a chunk of data from the QEMU stdout logs and try to
 * find a TTY device, as indicated by a line like
 *
 * char device redirected to /dev/pts/3
 *
 * Returns -1 for error, 0 success, 1 continue reading
 */
1661
static int
1662
qemudExtractTTYPath(const char *haystack,
1663 1664
                    size_t *offset,
                    char **path)
1665
{
1666
    static const char needle[] = "char device redirected to";
1667
    char *tmp, *dev;
1668

1669
    VIR_FREE(*path);
1670
    /* First look for our magic string */
1671 1672 1673 1674 1675
    if (!(tmp = strstr(haystack + *offset, needle))) {
        return 1;
    }
    tmp += sizeof(needle);
    dev = tmp;
1676

1677 1678 1679 1680 1681
    /*
     * And look for first whitespace character and nul terminate
     * to mark end of the pty path
     */
    while (*tmp) {
1682
        if (c_isspace(*tmp)) {
1683 1684
            *path = strndup(dev, tmp-dev);
            if (*path == NULL) {
1685
                virReportOOMError();
1686 1687
                return -1;
            }
1688

1689
            /* ... now further update offset till we get EOL */
1690
            *offset = tmp - haystack;
1691 1692
            return 0;
        }
1693
        tmp++;
1694 1695 1696 1697 1698
    }

    /*
     * We found a path, but didn't find any whitespace,
     * so it must be still incomplete - we should at
1699 1700
     * least see a \n - indicate that we want to carry
     * on trying again
1701
     */
1702
    return 1;
1703 1704
}

1705
static int
1706
qemudFindCharDevicePTYsMonitor(virDomainObjPtr vm,
1707 1708 1709 1710 1711 1712 1713
                               virHashTablePtr paths)
{
    int i;

#define LOOKUP_PTYS(array, arraylen, idprefix)                            \
    for (i = 0 ; i < (arraylen) ; i++) {                                  \
        virDomainChrDefPtr chr = (array)[i];                              \
1714
        if (chr->source.type == VIR_DOMAIN_CHR_TYPE_PTY) {                \
1715 1716 1717 1718 1719 1720 1721
            char id[16];                                                  \
                                                                          \
            if (snprintf(id, sizeof(id), idprefix "%i", i) >= sizeof(id)) \
                return -1;                                                \
                                                                          \
            const char *path = (const char *) virHashLookup(paths, id);   \
            if (path == NULL) {                                           \
1722
                if (chr->source.data.file.path == NULL) {                 \
1723 1724
                    /* neither the log output nor 'info chardev' had a */ \
                    /* pty path for this chardev, report an error */      \
1725 1726 1727
                    qemuReportError(VIR_ERR_INTERNAL_ERROR,               \
                                    _("no assigned pty for device %s"), id); \
                    return -1;                                            \
1728 1729 1730 1731 1732
                } else {                                                  \
                    /* 'info chardev' had no pty path for this chardev, */\
                    /* but the log output had, so we're fine */           \
                    continue;                                             \
                }                                                         \
1733 1734
            }                                                             \
                                                                          \
1735 1736
            VIR_FREE(chr->source.data.file.path);                         \
            chr->source.data.file.path = strdup(path);                    \
1737
                                                                          \
1738
            if (chr->source.data.file.path == NULL) {                     \
1739
                virReportOOMError();                                      \
1740 1741
                return -1;                                                \
            }                                                             \
1742 1743 1744 1745 1746 1747
        }                                                                 \
    }

    LOOKUP_PTYS(vm->def->serials,   vm->def->nserials,   "serial");
    LOOKUP_PTYS(vm->def->parallels, vm->def->nparallels, "parallel");
    LOOKUP_PTYS(vm->def->channels,  vm->def->nchannels,  "channel");
C
Cole Robinson 已提交
1748 1749
    if (vm->def->console)
        LOOKUP_PTYS(&vm->def->console, 1,  "console");
1750
#undef LOOKUP_PTYS
1751 1752 1753 1754

    return 0;
}

1755
static int
1756
qemudFindCharDevicePTYs(virDomainObjPtr vm,
1757 1758
                        const char *output,
                        int fd ATTRIBUTE_UNUSED)
1759
{
1760
    size_t offset = 0;
1761
    int ret, i;
1762 1763

    /* The order in which QEMU prints out the PTY paths is
1764 1765
       the order in which it procsses its serial and parallel
       device args. This code must match that ordering.... */
1766

1767
    /* first comes the serial devices */
1768 1769
    for (i = 0 ; i < vm->def->nserials ; i++) {
        virDomainChrDefPtr chr = vm->def->serials[i];
1770
        if (chr->source.type == VIR_DOMAIN_CHR_TYPE_PTY) {
1771
            if ((ret = qemudExtractTTYPath(output, &offset,
1772
                                           &chr->source.data.file.path)) != 0)
1773
                return ret;
1774 1775 1776
        }
    }

1777
    /* then the parallel devices */
1778 1779
    for (i = 0 ; i < vm->def->nparallels ; i++) {
        virDomainChrDefPtr chr = vm->def->parallels[i];
1780
        if (chr->source.type == VIR_DOMAIN_CHR_TYPE_PTY) {
1781
            if ((ret = qemudExtractTTYPath(output, &offset,
1782
                                           &chr->source.data.file.path)) != 0)
1783
                return ret;
1784 1785 1786
        }
    }

1787 1788 1789
    /* then the channel devices */
    for (i = 0 ; i < vm->def->nchannels ; i++) {
        virDomainChrDefPtr chr = vm->def->channels[i];
1790
        if (chr->source.type == VIR_DOMAIN_CHR_TYPE_PTY) {
1791
            if ((ret = qemudExtractTTYPath(output, &offset,
1792
                                           &chr->source.data.file.path)) != 0)
1793 1794 1795 1796
                return ret;
        }
    }

1797
    return 0;
1798 1799
}

1800 1801 1802 1803 1804
static void qemudFreePtyPath(void *payload, const char *name ATTRIBUTE_UNUSED)
{
    VIR_FREE(payload);
}

1805 1806 1807 1808 1809 1810 1811 1812 1813 1814 1815 1816 1817 1818
static void
qemuReadLogFD(int logfd, char *buf, int maxlen, int off)
{
    int ret;
    char *tmpbuf = buf + off;

    ret = saferead(logfd, tmpbuf, maxlen - off - 1);
    if (ret < 0) {
        ret = 0;
    }

    tmpbuf[ret] = '\0';
}

1819
static int
1820
qemudWaitForMonitor(struct qemud_driver* driver,
1821
                    virDomainObjPtr vm, off_t pos)
1822
{
1823
    char buf[4096] = ""; /* Plenty of space to get startup greeting */
1824
    int logfd;
1825
    int ret = -1;
1826
    virHashTablePtr paths = NULL;
1827

1828
    if ((logfd = qemudLogReadFD(driver->logDir, vm->def->name, pos)) < 0)
1829
        return -1;
1830

1831 1832 1833 1834
    if (qemudReadLogOutput(vm, logfd, buf, sizeof(buf),
                           qemudFindCharDevicePTYs,
                           "console", 30) < 0)
        goto closelog;
1835

1836
    VIR_DEBUG("Connect monitor to %p '%s'", vm, vm->def->name);
1837 1838 1839
    if (qemuConnectMonitor(driver, vm) < 0) {
        goto cleanup;
    }
1840

1841 1842 1843 1844
    /* Try to get the pty path mappings again via the monitor. This is much more
     * reliable if it's available.
     * Note that the monitor itself can be on a pty, so we still need to try the
     * log output method. */
1845
    paths = virHashCreate(0);
1846
    if (paths == NULL) {
1847
        virReportOOMError();
1848 1849 1850
        goto cleanup;
    }

1851
    qemuDomainObjEnterMonitorWithDriver(driver, vm);
1852 1853
    qemuDomainObjPrivatePtr priv = vm->privateData;
    ret = qemuMonitorGetPtyPaths(priv->mon, paths);
1854
    qemuDomainObjExitMonitorWithDriver(driver, vm);
1855 1856 1857

    VIR_DEBUG("qemuMonitorGetPtyPaths returned %i", ret);
    if (ret == 0) {
1858
        ret = qemudFindCharDevicePTYsMonitor(vm, paths);
1859 1860 1861 1862 1863 1864 1865
    }

cleanup:
    if (paths) {
        virHashFree(paths, qemudFreePtyPath);
    }

1866 1867 1868 1869 1870 1871 1872 1873 1874 1875 1876
    if (kill(vm->pid, 0) == -1 && errno == ESRCH) {
        /* VM is dead, any other error raised in the interim is probably
         * not as important as the qemu cmdline output */
        qemuReadLogFD(logfd, buf, sizeof(buf), strlen(buf));
        qemuReportError(VIR_ERR_INTERNAL_ERROR,
                        _("process exited while connecting to monitor: %s"),
                        buf);
        ret = -1;
    }

closelog:
1877
    if (VIR_CLOSE(logfd) < 0) {
1878
        char ebuf[4096];
1879
        VIR_WARN("Unable to close logfile: %s",
1880 1881 1882
                 virStrerror(errno, ebuf, sizeof ebuf));
    }

1883
    return ret;
1884 1885
}

1886
static int
1887
qemuDetectVcpuPIDs(struct qemud_driver *driver,
1888 1889 1890
                   virDomainObjPtr vm) {
    pid_t *cpupids = NULL;
    int ncpupids;
1891
    qemuDomainObjPrivatePtr priv = vm->privateData;
1892

1893
    if (vm->def->virtType != VIR_DOMAIN_VIRT_KVM) {
1894 1895
        priv->nvcpupids = 1;
        if (VIR_ALLOC_N(priv->vcpupids, priv->nvcpupids) < 0) {
1896
            virReportOOMError();
1897 1898
            return -1;
        }
1899
        priv->vcpupids[0] = vm->pid;
1900 1901 1902
        return 0;
    }

1903
    /* What follows is now all KVM specific */
1904

1905
    qemuDomainObjEnterMonitorWithDriver(driver, vm);
1906
    if ((ncpupids = qemuMonitorGetCPUInfo(priv->mon, &cpupids)) < 0) {
1907
        qemuDomainObjExitMonitorWithDriver(driver, vm);
1908
        return -1;
1909
    }
1910
    qemuDomainObjExitMonitorWithDriver(driver, vm);
1911

1912 1913 1914
    /* Treat failure to get VCPU<->PID mapping as non-fatal */
    if (ncpupids == 0)
        return 0;
1915

1916
    if (ncpupids != vm->def->vcpus) {
1917
        qemuReportError(VIR_ERR_INTERNAL_ERROR,
E
Eric Blake 已提交
1918 1919 1920
                        _("got wrong number of vCPU pids from QEMU monitor. "
                          "got %d, wanted %d"),
                        ncpupids, vm->def->vcpus);
1921 1922 1923
        VIR_FREE(cpupids);
        return -1;
    }
1924

1925 1926
    priv->nvcpupids = ncpupids;
    priv->vcpupids = cpupids;
1927 1928 1929
    return 0;
}

1930 1931 1932
/*
 * To be run between fork/exec of QEMU only
 */
1933
static int
1934 1935
qemudInitCpuAffinity(virDomainObjPtr vm)
{
1936
    int i, hostcpus, maxcpu = QEMUD_CPUMASK_LEN;
1937
    virNodeInfo nodeinfo;
1938 1939
    unsigned char *cpumap;
    int cpumaplen;
1940 1941

    DEBUG0("Setting CPU affinity");
1942

1943
    if (nodeGetInfo(NULL, &nodeinfo) < 0)
1944 1945 1946 1947
        return -1;

    /* setaffinity fails if you set bits for CPUs which
     * aren't present, so we have to limit ourselves */
1948 1949 1950
    hostcpus = VIR_NODEINFO_MAXCPUS(nodeinfo);
    if (maxcpu > hostcpus)
        maxcpu = hostcpus;
1951

1952 1953
    cpumaplen = VIR_CPU_MAPLEN(maxcpu);
    if (VIR_ALLOC_N(cpumap, cpumaplen) < 0) {
1954
        virReportOOMError();
1955 1956 1957
        return -1;
    }

D
Daniel P. Berrange 已提交
1958
    if (vm->def->cpumask) {
1959 1960 1961
        /* XXX why don't we keep 'cpumask' in the libvirt cpumap
         * format to start with ?!?! */
        for (i = 0 ; i < maxcpu && i < vm->def->cpumasklen ; i++)
D
Daniel P. Berrange 已提交
1962
            if (vm->def->cpumask[i])
1963
                VIR_USE_CPU(cpumap, i);
D
Daniel P. Berrange 已提交
1964
    } else {
1965 1966 1967 1968
        /* You may think this is redundant, but we can't assume libvirtd
         * itself is running on all pCPUs, so we need to explicitly set
         * the spawned QEMU instance to all pCPUs if no map is given in
         * its config file */
D
Daniel P. Berrange 已提交
1969
        for (i = 0 ; i < maxcpu ; i++)
1970
            VIR_USE_CPU(cpumap, i);
D
Daniel P. Berrange 已提交
1971
    }
1972

1973 1974 1975 1976 1977 1978 1979 1980
    /* We are pressuming we are running between fork/exec of QEMU
     * so use '0' to indicate our own process ID. No threads are
     * running at this point
     */
    if (virProcessInfoSetAffinity(0, /* Self */
                                  cpumap, cpumaplen, maxcpu) < 0) {
        VIR_FREE(cpumap);
        return -1;
1981
    }
1982
    VIR_FREE(cpumap);
1983 1984 1985 1986 1987

    return 0;
}


1988
static int
1989 1990 1991 1992
qemuInitPasswords(virConnectPtr conn,
                  struct qemud_driver *driver,
                  virDomainObjPtr vm,
                  unsigned long long qemuCmdFlags) {
1993
    int ret = 0;
1994
    qemuDomainObjPrivatePtr priv = vm->privateData;
1995

1996 1997 1998 1999 2000 2001 2002 2003 2004 2005 2006 2007
    if (vm->def->ngraphics == 1) {
        if (vm->def->graphics[0]->type == VIR_DOMAIN_GRAPHICS_TYPE_VNC) {
            ret = qemuDomainChangeGraphicsPasswords(driver, vm,
                                                    VIR_DOMAIN_GRAPHICS_TYPE_VNC,
                                                    &vm->def->graphics[0]->data.vnc.auth,
                                                    driver->vncPassword);
        } else if (vm->def->graphics[0]->type == VIR_DOMAIN_GRAPHICS_TYPE_SPICE) {
            ret = qemuDomainChangeGraphicsPasswords(driver, vm,
                                                    VIR_DOMAIN_GRAPHICS_TYPE_SPICE,
                                                    &vm->def->graphics[0]->data.spice.auth,
                                                    driver->spicePassword);
        }
2008 2009
    }

2010 2011 2012 2013 2014 2015 2016 2017 2018 2019 2020 2021 2022 2023 2024 2025 2026 2027 2028 2029 2030 2031 2032
    if (ret < 0)
        goto cleanup;

    if (qemuCmdFlags & QEMUD_CMD_FLAG_DEVICE) {
        int i;

        for (i = 0 ; i < vm->def->ndisks ; i++) {
            char *secret;
            size_t secretLen;

            if (!vm->def->disks[i]->encryption ||
                !vm->def->disks[i]->src)
                continue;

            if (getVolumeQcowPassphrase(conn,
                                        vm->def->disks[i],
                                        &secret, &secretLen) < 0)
                goto cleanup;

            qemuDomainObjEnterMonitorWithDriver(driver, vm);
            ret = qemuMonitorSetDrivePassphrase(priv->mon,
                                                vm->def->disks[i]->info.alias,
                                                secret);
2033
            VIR_FREE(secret);
2034 2035 2036 2037 2038 2039 2040
            qemuDomainObjExitMonitorWithDriver(driver, vm);
            if (ret < 0)
                goto cleanup;
        }
    }

cleanup:
2041
    return ret;
2042 2043 2044
}


2045 2046 2047 2048 2049 2050 2051 2052 2053 2054 2055 2056
#define QEMU_PCI_VENDOR_INTEL     0x8086
#define QEMU_PCI_VENDOR_LSI_LOGIC 0x1000
#define QEMU_PCI_VENDOR_REDHAT    0x1af4
#define QEMU_PCI_VENDOR_CIRRUS    0x1013
#define QEMU_PCI_VENDOR_REALTEK   0x10ec
#define QEMU_PCI_VENDOR_AMD       0x1022
#define QEMU_PCI_VENDOR_ENSONIQ   0x1274
#define QEMU_PCI_VENDOR_VMWARE    0x15ad
#define QEMU_PCI_VENDOR_QEMU      0x1234

#define QEMU_PCI_PRODUCT_DISK_VIRTIO 0x1001

2057 2058
#define QEMU_PCI_PRODUCT_BALLOON_VIRTIO 0x1002

2059 2060 2061 2062 2063 2064 2065 2066 2067 2068 2069 2070 2071 2072 2073 2074 2075 2076 2077 2078 2079 2080 2081 2082 2083 2084 2085 2086 2087 2088 2089 2090 2091 2092 2093 2094 2095 2096 2097 2098 2099 2100 2101 2102 2103 2104 2105 2106 2107 2108 2109 2110 2111 2112 2113 2114 2115 2116 2117 2118 2119 2120 2121 2122 2123 2124 2125 2126 2127 2128 2129 2130 2131 2132 2133 2134 2135 2136 2137 2138 2139 2140 2141 2142 2143 2144 2145 2146 2147 2148 2149 2150 2151 2152 2153 2154 2155 2156 2157 2158 2159 2160 2161 2162 2163 2164 2165 2166 2167 2168 2169 2170 2171 2172 2173 2174 2175 2176 2177 2178 2179 2180 2181 2182 2183 2184 2185 2186 2187 2188 2189 2190 2191 2192 2193 2194 2195 2196 2197 2198 2199 2200 2201 2202 2203 2204 2205 2206 2207 2208 2209 2210 2211 2212 2213 2214 2215 2216 2217 2218 2219 2220 2221 2222 2223 2224 2225 2226 2227 2228 2229 2230 2231 2232 2233 2234 2235 2236 2237 2238 2239 2240 2241 2242 2243 2244 2245 2246 2247 2248 2249 2250 2251 2252 2253 2254 2255 2256 2257 2258 2259 2260 2261 2262 2263 2264 2265 2266
#define QEMU_PCI_PRODUCT_NIC_NE2K     0x8029
#define QEMU_PCI_PRODUCT_NIC_PCNET    0x2000
#define QEMU_PCI_PRODUCT_NIC_RTL8139  0x8139
#define QEMU_PCI_PRODUCT_NIC_E1000    0x100E
#define QEMU_PCI_PRODUCT_NIC_VIRTIO   0x1000

#define QEMU_PCI_PRODUCT_VGA_CIRRUS 0x00b8
#define QEMU_PCI_PRODUCT_VGA_VMWARE 0x0405
#define QEMU_PCI_PRODUCT_VGA_STDVGA 0x1111

#define QEMU_PCI_PRODUCT_AUDIO_AC97    0x2415
#define QEMU_PCI_PRODUCT_AUDIO_ES1370  0x5000

#define QEMU_PCI_PRODUCT_CONTROLLER_PIIX 0x7010
#define QEMU_PCI_PRODUCT_CONTROLLER_LSI  0x0012

#define QEMU_PCI_PRODUCT_WATCHDOG_I63000ESB 0x25ab

static int
qemuAssignNextPCIAddress(virDomainDeviceInfo *info,
                         int vendor,
                         int product,
                         qemuMonitorPCIAddress *addrs,
                         int naddrs)
{
    int found = 0;
    int i;

    VIR_DEBUG("Look for %x:%x out of %d", vendor, product, naddrs);

    for (i = 0 ; (i < naddrs) && !found; i++) {
        VIR_DEBUG("Maybe %x:%x", addrs[i].vendor, addrs[i].product);
        if (addrs[i].vendor == vendor &&
            addrs[i].product == product) {
            VIR_DEBUG("Match %d", i);
            found = 1;
            break;
        }
    }
    if (!found) {
        return -1;
    }

    /* Blank it out so this device isn't matched again */
    addrs[i].vendor = 0;
    addrs[i].product = 0;

    if (info->type == VIR_DOMAIN_DEVICE_ADDRESS_TYPE_NONE)
        info->type = VIR_DOMAIN_DEVICE_ADDRESS_TYPE_PCI;

    if (info->type == VIR_DOMAIN_DEVICE_ADDRESS_TYPE_PCI) {
        info->addr.pci.domain = addrs[i].addr.domain;
        info->addr.pci.bus = addrs[i].addr.bus;
        info->addr.pci.slot = addrs[i].addr.slot;
        info->addr.pci.function = addrs[i].addr.function;
    }

    return 0;
}

static int
qemuGetPCIDiskVendorProduct(virDomainDiskDefPtr def,
                            unsigned *vendor,
                            unsigned *product)
{
    switch (def->bus) {
    case VIR_DOMAIN_DISK_BUS_VIRTIO:
        *vendor = QEMU_PCI_VENDOR_REDHAT;
        *product = QEMU_PCI_PRODUCT_DISK_VIRTIO;
        break;

    default:
        return -1;
    }

    return 0;
}

static int
qemuGetPCINetVendorProduct(virDomainNetDefPtr def,
                            unsigned *vendor,
                            unsigned *product)
{
    if (!def->model)
        return -1;

    if (STREQ(def->model, "ne2k_pci")) {
        *vendor = QEMU_PCI_VENDOR_REALTEK;
        *product = QEMU_PCI_PRODUCT_NIC_NE2K;
    } else if (STREQ(def->model, "pcnet")) {
        *vendor = QEMU_PCI_VENDOR_AMD;
        *product = QEMU_PCI_PRODUCT_NIC_PCNET;
    } else if (STREQ(def->model, "rtl8139")) {
        *vendor = QEMU_PCI_VENDOR_REALTEK;
        *product = QEMU_PCI_PRODUCT_NIC_RTL8139;
    } else if (STREQ(def->model, "e1000")) {
        *vendor = QEMU_PCI_VENDOR_INTEL;
        *product = QEMU_PCI_PRODUCT_NIC_E1000;
    } else if (STREQ(def->model, "virtio")) {
        *vendor = QEMU_PCI_VENDOR_REDHAT;
        *product = QEMU_PCI_PRODUCT_NIC_VIRTIO;
    } else {
        VIR_INFO("Unexpected NIC model %s, cannot get PCI address",
                 def->model);
        return -1;
    }
    return 0;
}

static int
qemuGetPCIControllerVendorProduct(virDomainControllerDefPtr def,
                                  unsigned *vendor,
                                  unsigned *product)
{
    switch (def->type) {
    case VIR_DOMAIN_CONTROLLER_TYPE_SCSI:
        *vendor = QEMU_PCI_VENDOR_LSI_LOGIC;
        *product = QEMU_PCI_PRODUCT_CONTROLLER_LSI;
        break;

    case VIR_DOMAIN_CONTROLLER_TYPE_FDC:
        /* XXX we could put in the ISA bridge address, but
           that's not technically the FDC's address */
        return -1;

    case VIR_DOMAIN_CONTROLLER_TYPE_IDE:
        *vendor = QEMU_PCI_VENDOR_INTEL;
        *product = QEMU_PCI_PRODUCT_CONTROLLER_PIIX;
        break;

    default:
        VIR_INFO("Unexpected controller type %s, cannot get PCI address",
                 virDomainControllerTypeToString(def->type));
        return -1;
    }

    return 0;
}

static int
qemuGetPCIVideoVendorProduct(virDomainVideoDefPtr def,
                             unsigned *vendor,
                             unsigned *product)
{
    switch (def->type) {
    case VIR_DOMAIN_VIDEO_TYPE_CIRRUS:
        *vendor = QEMU_PCI_VENDOR_CIRRUS;
        *product = QEMU_PCI_PRODUCT_VGA_CIRRUS;
        break;

    case VIR_DOMAIN_VIDEO_TYPE_VGA:
        *vendor = QEMU_PCI_VENDOR_QEMU;
        *product = QEMU_PCI_PRODUCT_VGA_STDVGA;
        break;

    case VIR_DOMAIN_VIDEO_TYPE_VMVGA:
        *vendor = QEMU_PCI_VENDOR_VMWARE;
        *product = QEMU_PCI_PRODUCT_VGA_VMWARE;
        break;

    default:
        return -1;
    }
    return 0;
}

static int
qemuGetPCISoundVendorProduct(virDomainSoundDefPtr def,
                             unsigned *vendor,
                             unsigned *product)
{
    switch (def->model) {
    case VIR_DOMAIN_SOUND_MODEL_ES1370:
        *vendor = QEMU_PCI_VENDOR_ENSONIQ;
        *product = QEMU_PCI_PRODUCT_AUDIO_ES1370;
        break;

    case VIR_DOMAIN_SOUND_MODEL_AC97:
        *vendor = QEMU_PCI_VENDOR_INTEL;
        *product = QEMU_PCI_PRODUCT_AUDIO_AC97;
        break;

    default:
        return -1;
    }

    return 0;
}

static int
qemuGetPCIWatchdogVendorProduct(virDomainWatchdogDefPtr def,
                                unsigned *vendor,
                                unsigned *product)
{
    switch (def->model) {
    case VIR_DOMAIN_WATCHDOG_MODEL_I6300ESB:
        *vendor = QEMU_PCI_VENDOR_INTEL;
        *product = QEMU_PCI_PRODUCT_WATCHDOG_I63000ESB;
        break;

    default:
        return -1;
    }

    return 0;
}


2267 2268 2269 2270 2271 2272 2273 2274 2275 2276 2277 2278 2279 2280 2281 2282 2283 2284 2285
static int
qemuGetPCIMemballoonVendorProduct(virDomainMemballoonDefPtr def,
                                  unsigned *vendor,
                                  unsigned *product)
{
    switch (def->model) {
    case VIR_DOMAIN_MEMBALLOON_MODEL_VIRTIO:
        *vendor = QEMU_PCI_VENDOR_REDHAT;
        *product = QEMU_PCI_PRODUCT_BALLOON_VIRTIO;
        break;

    default:
        return -1;
    }

    return 0;
}


2286 2287 2288 2289 2290 2291 2292 2293 2294
/*
 * This entire method assumes that PCI devices in 'info pci'
 * match ordering of devices specified on the command line
 * wrt to devices of matching vendor+product
 *
 * XXXX this might not be a valid assumption if we assign
 * some static addrs on CLI. Have to check that...
 */
static int
2295
qemuDetectPCIAddresses(virDomainObjPtr vm,
2296 2297 2298 2299 2300 2301 2302 2303 2304 2305 2306 2307 2308 2309 2310 2311 2312
                       qemuMonitorPCIAddress *addrs,
                       int naddrs)
{
    unsigned int vendor = 0, product = 0;
    int i;

    /* XXX should all these vendor/product IDs be kept in the
     * actual device data structure instead ?
     */

    for (i = 0 ; i < vm->def->ndisks ; i++) {
        if (qemuGetPCIDiskVendorProduct(vm->def->disks[i], &vendor, &product) < 0)
            continue;

        if (qemuAssignNextPCIAddress(&(vm->def->disks[i]->info),
                                     vendor, product,
                                     addrs, naddrs) < 0) {
2313 2314 2315
            qemuReportError(VIR_ERR_INTERNAL_ERROR,
                            _("cannot find PCI address for VirtIO disk %s"),
                            vm->def->disks[i]->dst);
2316 2317 2318 2319 2320 2321 2322 2323 2324 2325 2326
            return -1;
        }
    }

    for (i = 0 ; i < vm->def->nnets ; i++) {
        if (qemuGetPCINetVendorProduct(vm->def->nets[i], &vendor, &product) < 0)
            continue;

        if (qemuAssignNextPCIAddress(&(vm->def->nets[i]->info),
                                     vendor, product,
                                     addrs,  naddrs) < 0) {
2327 2328 2329
            qemuReportError(VIR_ERR_INTERNAL_ERROR,
                            _("cannot find PCI address for %s NIC"),
                            vm->def->nets[i]->model);
2330 2331 2332 2333 2334 2335 2336 2337 2338 2339 2340
            return -1;
        }
    }

    for (i = 0 ; i < vm->def->ncontrollers ; i++) {
        if (qemuGetPCIControllerVendorProduct(vm->def->controllers[i], &vendor, &product) < 0)
            continue;

        if (qemuAssignNextPCIAddress(&(vm->def->controllers[i]->info),
                                     vendor, product,
                                     addrs,  naddrs) < 0) {
2341 2342 2343
            qemuReportError(VIR_ERR_INTERNAL_ERROR,
                            _("cannot find PCI address for controller %s"),
                            virDomainControllerTypeToString(vm->def->controllers[i]->type));
2344 2345 2346 2347 2348 2349 2350 2351 2352 2353 2354
            return -1;
        }
    }

    for (i = 0 ; i < vm->def->nvideos ; i++) {
        if (qemuGetPCIVideoVendorProduct(vm->def->videos[i], &vendor, &product) < 0)
            continue;

        if (qemuAssignNextPCIAddress(&(vm->def->videos[i]->info),
                                     vendor, product,
                                     addrs,  naddrs) < 0) {
2355 2356 2357
            qemuReportError(VIR_ERR_INTERNAL_ERROR,
                            _("cannot find PCI address for video adapter %s"),
                            virDomainVideoTypeToString(vm->def->videos[i]->type));
2358 2359 2360 2361 2362 2363 2364 2365 2366
            return -1;
        }
    }

    for (i = 0 ; i < vm->def->nsounds ; i++) {
        if (qemuGetPCISoundVendorProduct(vm->def->sounds[i], &vendor, &product) < 0)
            continue;

        if (qemuAssignNextPCIAddress(&(vm->def->sounds[i]->info),
2367
                                    vendor, product,
2368
                                     addrs,  naddrs) < 0) {
2369 2370 2371
            qemuReportError(VIR_ERR_INTERNAL_ERROR,
                            _("cannot find PCI address for sound adapter %s"),
                            virDomainSoundModelTypeToString(vm->def->sounds[i]->model));
2372 2373 2374 2375 2376 2377 2378 2379 2380 2381
            return -1;
        }
    }


    if (vm->def->watchdog &&
        qemuGetPCIWatchdogVendorProduct(vm->def->watchdog, &vendor, &product) == 0) {
        if (qemuAssignNextPCIAddress(&(vm->def->watchdog->info),
                                     vendor, product,
                                     addrs,  naddrs) < 0) {
2382 2383 2384
            qemuReportError(VIR_ERR_INTERNAL_ERROR,
                            _("cannot find PCI address for watchdog %s"),
                            virDomainWatchdogModelTypeToString(vm->def->watchdog->model));
2385 2386 2387 2388
            return -1;
        }
    }

2389 2390 2391 2392 2393 2394 2395 2396 2397 2398 2399 2400
    if (vm->def->memballoon &&
        qemuGetPCIMemballoonVendorProduct(vm->def->memballoon, &vendor, &product) == 0) {
        if (qemuAssignNextPCIAddress(&(vm->def->memballoon->info),
                                     vendor, product,
                                     addrs, naddrs) < 0) {
            qemuReportError(VIR_ERR_INTERNAL_ERROR,
                            _("cannot find PCI address for balloon %s"),
                            virDomainMemballoonModelTypeToString(vm->def->memballoon->model));
            return -1;
        }
    }

2401 2402 2403 2404 2405 2406 2407 2408 2409 2410 2411 2412 2413 2414 2415 2416 2417 2418 2419 2420 2421 2422 2423 2424 2425 2426
    /* XXX console (virtio) */


    /* ... and now things we don't have in our xml */

    /* XXX USB controller ? */

    /* XXX what about other PCI devices (ie bridges) */

    return 0;
}

static int
qemuInitPCIAddresses(struct qemud_driver *driver,
                     virDomainObjPtr vm)
{
    qemuDomainObjPrivatePtr priv = vm->privateData;
    int naddrs;
    int ret;
    qemuMonitorPCIAddress *addrs = NULL;

    qemuDomainObjEnterMonitorWithDriver(driver, vm);
    naddrs = qemuMonitorGetAllPCIAddresses(priv->mon,
                                           &addrs);
    qemuDomainObjExitMonitorWithDriver(driver, vm);

2427
    ret = qemuDetectPCIAddresses(vm, addrs, naddrs);
2428 2429 2430 2431 2432 2433

    VIR_FREE(addrs);

    return ret;
}

2434 2435 2436

static int qemudNextFreePort(struct qemud_driver *driver,
                             int startPort) {
2437 2438
    int i;

2439
    for (i = startPort ; i < QEMU_VNC_PORT_MAX; i++) {
2440 2441 2442
        int fd;
        int reuse = 1;
        struct sockaddr_in addr;
2443 2444 2445 2446 2447 2448 2449 2450 2451
        bool used = false;

        if (virBitmapGetBit(driver->reservedVNCPorts,
                            i - QEMU_VNC_PORT_MIN, &used) < 0)
            VIR_DEBUG("virBitmapGetBit failed on bit %d", i - QEMU_VNC_PORT_MIN);

        if (used)
            continue;

2452 2453 2454 2455 2456 2457 2458 2459
        addr.sin_family = AF_INET;
        addr.sin_port = htons(i);
        addr.sin_addr.s_addr = htonl(INADDR_ANY);
        fd = socket(PF_INET, SOCK_STREAM, 0);
        if (fd < 0)
            return -1;

        if (setsockopt(fd, SOL_SOCKET, SO_REUSEADDR, (void*)&reuse, sizeof(reuse)) < 0) {
2460
            VIR_FORCE_CLOSE(fd);
2461 2462 2463 2464 2465
            break;
        }

        if (bind(fd, (struct sockaddr*)&addr, sizeof(addr)) == 0) {
            /* Not in use, lets grab it */
2466
            VIR_FORCE_CLOSE(fd);
2467 2468 2469 2470 2471 2472
            /* Add port to bitmap of reserved ports */
            if (virBitmapSetBit(driver->reservedVNCPorts,
                                i - QEMU_VNC_PORT_MIN) < 0) {
                VIR_DEBUG("virBitmapSetBit failed on bit %d",
                          i - QEMU_VNC_PORT_MIN);
            }
2473 2474
            return i;
        }
2475
        VIR_FORCE_CLOSE(fd);
2476 2477 2478 2479 2480 2481 2482 2483 2484 2485 2486

        if (errno == EADDRINUSE) {
            /* In use, try next */
            continue;
        }
        /* Some other bad failure, get out.. */
        break;
    }
    return -1;
}

2487

2488 2489 2490 2491 2492 2493 2494 2495 2496 2497 2498 2499 2500
static void
qemuReturnPort(struct qemud_driver *driver,
                int port)
{
    if (port < QEMU_VNC_PORT_MIN)
        return;

    if (virBitmapClearBit(driver->reservedVNCPorts,
                          port - QEMU_VNC_PORT_MIN) < 0)
        VIR_DEBUG("Could not mark port %d as unused", port);
}


2501 2502 2503 2504 2505 2506 2507
static int
qemuAssignPCIAddresses(virDomainDefPtr def)
{
    int ret = -1;
    unsigned long long qemuCmdFlags = 0;
    qemuDomainPCIAddressSetPtr addrs = NULL;

2508 2509 2510
    if (qemuCapsExtractVersionInfo(def->emulator,
                                   NULL,
                                   &qemuCmdFlags) < 0)
2511 2512 2513 2514 2515 2516 2517 2518 2519 2520 2521 2522 2523 2524 2525 2526 2527 2528 2529
        goto cleanup;

    if (qemuCmdFlags & QEMUD_CMD_FLAG_DEVICE) {
        if (!(addrs = qemuDomainPCIAddressSetCreate(def)))
            goto cleanup;

        if (qemuAssignDevicePCISlots(def, addrs) < 0)
            goto cleanup;
    }

    ret = 0;

cleanup:
    qemuDomainPCIAddressSetFree(addrs);

    return ret;
}


2530 2531 2532 2533 2534 2535
static int
qemuPrepareChardevDevice(virDomainDefPtr def ATTRIBUTE_UNUSED,
                         virDomainChrDefPtr dev,
                         void *opaque ATTRIBUTE_UNUSED)
{
    int fd;
2536
    if (dev->source.type != VIR_DOMAIN_CHR_TYPE_FILE)
2537 2538
        return 0;

2539 2540
    if ((fd = open(dev->source.data.file.path,
                   O_CREAT | O_APPEND, S_IRUSR|S_IWUSR)) < 0) {
2541 2542
        virReportSystemError(errno,
                             _("Unable to pre-create chardev file '%s'"),
2543
                             dev->source.data.file.path);
2544 2545 2546
        return -1;
    }

2547
    VIR_FORCE_CLOSE(fd);
2548 2549 2550 2551 2552

    return 0;
}


2553 2554 2555 2556
struct qemudHookData {
    virConnectPtr conn;
    virDomainObjPtr vm;
    struct qemud_driver *driver;
2557 2558 2559
};

static int qemudSecurityHook(void *data) {
2560 2561
    struct qemudHookData *h = data;

2562 2563 2564
    /* This must take place before exec(), so that all QEMU
     * memory allocation is on the correct NUMA node
     */
2565
    if (qemuAddToCgroup(h->driver, h->vm->def) < 0)
2566 2567
        return -1;

2568 2569 2570
    /* This must be done after cgroup placement to avoid resetting CPU
     * affinity */
    if (qemudInitCpuAffinity(h->vm) < 0)
2571
        return -1;
2572

2573
    if (virSecurityManagerSetProcessLabel(h->driver->securityManager, h->vm) < 0)
2574 2575 2576
        return -1;

    return 0;
2577 2578
}

2579
static int
2580
qemuPrepareMonitorChr(struct qemud_driver *driver,
2581
                      virDomainChrSourceDefPtr monConfig,
2582 2583
                      const char *vm)
{
2584 2585
    monConfig->type = VIR_DOMAIN_CHR_TYPE_UNIX;
    monConfig->data.nix.listen = true;
2586

2587
    if (virAsprintf(&monConfig->data.nix.path, "%s/%s.monitor",
2588
                    driver->libDir, vm) < 0) {
2589
        virReportOOMError();
2590 2591 2592 2593 2594 2595
        return -1;
    }

    return 0;
}

2596 2597 2598 2599
static int qemuDomainSnapshotSetCurrentActive(virDomainObjPtr vm,
                                              char *snapshotDir);
static int qemuDomainSnapshotSetCurrentInactive(virDomainObjPtr vm,
                                                char *snapshotDir);
C
Chris Lalancette 已提交
2600

2601

2602 2603
#define START_POSTFIX ": starting up\n"
#define SHUTDOWN_POSTFIX ": shutting down\n"
2604

2605 2606
static int qemudStartVMDaemon(virConnectPtr conn,
                              struct qemud_driver *driver,
2607
                              virDomainObjPtr vm,
2608
                              const char *migrateFrom,
2609
                              bool start_paused,
2610
                              int stdin_fd,
2611 2612
                              const char *stdin_path,
                              enum virVMOperationType vmop) {
E
Eric Blake 已提交
2613
    int ret;
2614
    unsigned long long qemuCmdFlags;
2615
    off_t pos = -1;
2616
    char ebuf[1024];
2617
    char *pidfile = NULL;
2618
    int logfile = -1;
2619
    char *timestamp;
2620
    qemuDomainObjPrivatePtr priv = vm->privateData;
E
Eric Blake 已提交
2621
    virCommandPtr cmd = NULL;
2622

2623
    struct qemudHookData hookData;
2624 2625 2626 2627
    hookData.conn = conn;
    hookData.vm = vm;
    hookData.driver = driver;

2628 2629
    DEBUG0("Beginning VM startup process");

D
Daniel P. Berrange 已提交
2630
    if (virDomainObjIsActive(vm)) {
2631 2632
        qemuReportError(VIR_ERR_OPERATION_INVALID,
                        "%s", _("VM is already active"));
2633 2634 2635
        return -1;
    }

2636 2637 2638 2639 2640 2641 2642 2643
    /* Do this upfront, so any part of the startup process can add
     * runtime state to vm->def that won't be persisted. This let's us
     * report implicit runtime defaults in the XML, like vnc listen/socket
     */
    DEBUG0("Setting current domain def as transient");
    if (virDomainObjSetDefTransient(driver->caps, vm, true) < 0)
        goto cleanup;

2644 2645 2646 2647 2648
    /* Must be run before security labelling */
    DEBUG0("Preparing host devices");
    if (qemuPrepareHostDevices(driver, vm->def) < 0)
        goto cleanup;

2649 2650 2651 2652 2653 2654 2655
    DEBUG0("Preparing chr devices");
    if (virDomainChrDefForeach(vm->def,
                               true,
                               qemuPrepareChardevDevice,
                               NULL) < 0)
        goto cleanup;

2656 2657
    /* If you are using a SecurityDriver with dynamic labelling,
       then generate a security label for isolation */
2658
    DEBUG0("Generating domain security label (if required)");
2659 2660 2661
    if (virSecurityManagerGenLabel(driver->securityManager, vm) < 0) {
        qemuDomainSecurityLabelAudit(vm, false);
        goto cleanup;
2662
    }
2663
    qemuDomainSecurityLabelAudit(vm, true);
2664

2665
    DEBUG0("Generating setting domain security labels (if required)");
2666 2667
    if (virSecurityManagerSetAllLabel(driver->securityManager,
                                      vm, stdin_path) < 0)
2668
        goto cleanup;
2669

2670 2671 2672
    /* Ensure no historical cgroup for this VM is lying around bogus
     * settings */
    DEBUG0("Ensuring no historical cgroup is lying around");
2673
    qemuRemoveCgroup(driver, vm, 1);
2674

2675 2676
    if (vm->def->ngraphics == 1) {
        if (vm->def->graphics[0]->type == VIR_DOMAIN_GRAPHICS_TYPE_VNC &&
2677
            !vm->def->graphics[0]->data.vnc.socket &&
2678
            vm->def->graphics[0]->data.vnc.autoport) {
2679
            int port = qemudNextFreePort(driver, QEMU_VNC_PORT_MIN);
2680 2681 2682 2683 2684 2685 2686 2687
            if (port < 0) {
                qemuReportError(VIR_ERR_INTERNAL_ERROR,
                                "%s", _("Unable to find an unused VNC port"));
                goto cleanup;
            }
            vm->def->graphics[0]->data.vnc.port = port;
        } else if (vm->def->graphics[0]->type == VIR_DOMAIN_GRAPHICS_TYPE_SPICE &&
                   vm->def->graphics[0]->data.spice.autoport) {
2688
            int port = qemudNextFreePort(driver, QEMU_VNC_PORT_MIN);
2689 2690
            int tlsPort = -1;
            if (port < 0) {
2691
                qemuReportError(VIR_ERR_INTERNAL_ERROR,
2692
                                "%s", _("Unable to find an unused SPICE port"));
2693 2694 2695
                goto cleanup;
            }

2696 2697 2698 2699 2700
            if (driver->spiceTLS) {
                tlsPort = qemudNextFreePort(driver, port + 1);
                if (tlsPort < 0) {
                    qemuReportError(VIR_ERR_INTERNAL_ERROR,
                                    "%s", _("Unable to find an unused SPICE TLS port"));
2701
                    qemuReturnPort(driver, port);
2702 2703 2704 2705
                    goto cleanup;
                }
            }

2706 2707
            vm->def->graphics[0]->data.spice.port = port;
            vm->def->graphics[0]->data.spice.tlsPort = tlsPort;
2708
        }
2709
    }
2710

L
Laine Stump 已提交
2711
    if (virFileMakePath(driver->logDir) != 0) {
2712
        virReportSystemError(errno,
2713 2714
                             _("cannot create log directory %s"),
                             driver->logDir);
2715
        goto cleanup;
2716 2717
    }

2718
    DEBUG0("Creating domain log file");
2719
    if ((logfile = qemudLogFD(driver, vm->def->name, false)) < 0)
2720
        goto cleanup;
2721

E
Eric Blake 已提交
2722
    DEBUG0("Determining emulator version");
2723 2724 2725
    if (qemuCapsExtractVersionInfo(vm->def->emulator,
                                   NULL,
                                   &qemuCmdFlags) < 0)
2726
        goto cleanup;
2727

2728
    DEBUG0("Setting up domain cgroup (if required)");
2729
    if (qemuSetupCgroup(driver, vm) < 0)
2730 2731
        goto cleanup;

2732
    if (VIR_ALLOC(priv->monConfig) < 0) {
2733
        virReportOOMError();
2734 2735 2736
        goto cleanup;
    }

2737
    DEBUG0("Preparing monitor state");
2738
    if (qemuPrepareMonitorChr(driver, priv->monConfig, vm->def->name) < 0)
2739
        goto cleanup;
2740

D
Daniel P. Berrange 已提交
2741 2742 2743
#if HAVE_YAJL
    if (qemuCmdFlags & QEMUD_CMD_FLAG_MONITOR_JSON)
        priv->monJSON = 1;
2744
    else
D
Daniel P. Berrange 已提交
2745
#endif
2746
        priv->monJSON = 0;
D
Daniel P. Berrange 已提交
2747

2748
    priv->monitor_warned = 0;
2749
    priv->gotShutdown = false;
2750

D
Daniel P. Berrange 已提交
2751
    if ((ret = virFileDeletePid(driver->stateDir, vm->def->name)) != 0) {
2752
        virReportSystemError(ret,
D
Daniel P. Berrange 已提交
2753 2754 2755 2756 2757
                             _("Cannot remove stale PID file for %s"),
                             vm->def->name);
        goto cleanup;
    }

2758
    if (!(pidfile = virFilePid(driver->stateDir, vm->def->name))) {
2759
        virReportSystemError(errno,
2760 2761 2762
                             "%s", _("Failed to build pidfile path."));
        goto cleanup;
    }
D
Daniel P. Berrange 已提交
2763

2764
    /*
M
Matthew Booth 已提交
2765
     * Normally PCI addresses are assigned in the virDomainCreate
2766 2767 2768 2769 2770
     * or virDomainDefine methods. We might still need to assign
     * some here to cope with the question of upgrades. Regardless
     * we also need to populate the PCi address set cache for later
     * use in hotplug
     */
2771
    if (qemuCmdFlags & QEMUD_CMD_FLAG_DEVICE) {
2772
        DEBUG0("Assigning domain PCI addresses");
2773
        /* Populate cache with current addresses */
2774 2775 2776 2777 2778 2779 2780
        if (priv->pciaddrs) {
            qemuDomainPCIAddressSetFree(priv->pciaddrs);
            priv->pciaddrs = NULL;
        }
        if (!(priv->pciaddrs = qemuDomainPCIAddressSetCreate(vm->def)))
            goto cleanup;

2781 2782

        /* Assign any remaining addresses */
2783 2784
        if (qemuAssignDevicePCISlots(vm->def, priv->pciaddrs) < 0)
            goto cleanup;
2785 2786 2787 2788

        priv->persistentAddrs = 1;
    } else {
        priv->persistentAddrs = 0;
2789 2790
    }

2791
    DEBUG0("Building emulator command line");
2792
    vm->def->id = driver->nextvmid++;
2793 2794
    if (!(cmd = qemuBuildCommandLine(conn, driver, vm->def, priv->monConfig,
                                     priv->monJSON != 0, qemuCmdFlags,
2795
                                     migrateFrom, stdin_fd,
2796
                                     vm->current_snapshot, vmop)))
C
Chris Lalancette 已提交
2797 2798
        goto cleanup;

2799
    if (qemuDomainSnapshotSetCurrentInactive(vm, driver->snapshotDir) < 0)
2800
        goto cleanup;
2801

2802 2803 2804 2805 2806 2807 2808 2809 2810 2811 2812 2813 2814 2815 2816 2817
    /* now that we know it is about to start call the hook if present */
    if (virHookPresent(VIR_HOOK_DRIVER_QEMU)) {
        char *xml = virDomainDefFormat(vm->def, 0);
        int hookret;

        hookret = virHookCall(VIR_HOOK_DRIVER_QEMU, vm->def->name,
                    VIR_HOOK_QEMU_OP_START, VIR_HOOK_SUBOP_BEGIN, NULL, xml);
        VIR_FREE(xml);

        /*
         * If the script raised an error abort the launch
         */
        if (hookret < 0)
            goto cleanup;
    }

2818 2819 2820 2821 2822 2823 2824 2825 2826 2827 2828 2829 2830
    if ((timestamp = virTimestamp()) == NULL) {
        virReportOOMError();
        goto cleanup;
    } else {
        if (safewrite(logfile, timestamp, strlen(timestamp)) < 0 ||
            safewrite(logfile, START_POSTFIX, strlen(START_POSTFIX)) < 0) {
            VIR_WARN("Unable to write timestamp to logfile: %s",
                     virStrerror(errno, ebuf, sizeof ebuf));
        }

        VIR_FREE(timestamp);
    }

E
Eric Blake 已提交
2831
    virCommandWriteArgLog(cmd, logfile);
2832

2833
    if ((pos = lseek(logfile, 0, SEEK_END)) < 0)
2834
        VIR_WARN("Unable to seek to end of logfile: %s",
2835
                 virStrerror(errno, ebuf, sizeof ebuf));
2836

2837 2838
    VIR_DEBUG("Clear emulator capabilities: %d",
              driver->clearEmulatorCapabilities);
E
Eric Blake 已提交
2839 2840 2841 2842 2843
    if (driver->clearEmulatorCapabilities)
        virCommandClearCaps(cmd);

    VIR_WARN("Executing %s", vm->def->emulator);
    virCommandSetPreExecHook(cmd, qemudSecurityHook, &hookData);
2844

E
Eric Blake 已提交
2845 2846 2847 2848 2849 2850 2851 2852
    virCommandSetOutputFD(cmd, &logfile);
    virCommandSetErrorFD(cmd, &logfile);
    virCommandNonblockingFDs(cmd);
    virCommandSetPidFile(cmd, pidfile);
    virCommandDaemonize(cmd);

    ret = virCommandRun(cmd, NULL);
    VIR_WARN("Executing done %s", vm->def->emulator);
2853
    VIR_FREE(pidfile);
G
Guido Günther 已提交
2854 2855 2856

    /* wait for qemu process to to show up */
    if (ret == 0) {
2857
        if (virFileReadPid(driver->stateDir, vm->def->name, &vm->pid)) {
2858 2859
            qemuReportError(VIR_ERR_INTERNAL_ERROR,
                            _("Domain %s didn't show up\n"), vm->def->name);
2860
            ret = -1;
G
Guido Günther 已提交
2861
        }
E
Eric Blake 已提交
2862
#if 0
2863
    } else if (ret == -2) {
E
Eric Blake 已提交
2864 2865 2866 2867 2868
        /*
         * XXX this is bogus. It isn't safe to set vm->pid = child
         * because the child no longer exists.
         */

2869 2870 2871 2872 2873 2874 2875 2876 2877
        /* The virExec process that launches the daemon failed. Pending on
         * when it failed (we can't determine for sure), there may be
         * extra info in the domain log (if the hook failed for example).
         *
         * Pretend like things succeeded, and let 'WaitForMonitor' report
         * the log contents for us.
         */
        vm->pid = child;
        ret = 0;
E
Eric Blake 已提交
2878
#endif
2879
    }
2880

2881 2882 2883
    if (migrateFrom)
        start_paused = true;
    vm->state = start_paused ? VIR_DOMAIN_PAUSED : VIR_DOMAIN_RUNNING;
2884

2885
    if (ret == -1) /* The VM failed to start; tear filters before taps */
2886
        virDomainConfVMNWFilterTeardown(vm);
2887

2888
    if (ret == -1) /* The VM failed to start */
2889 2890
        goto cleanup;

2891
    DEBUG0("Waiting for monitor to show up");
2892
    if (qemudWaitForMonitor(driver, vm, pos) < 0)
2893
        goto cleanup;
2894

2895
    DEBUG0("Detecting VCPU PIDs");
2896
    if (qemuDetectVcpuPIDs(driver, vm) < 0)
2897
        goto cleanup;
2898

2899
    DEBUG0("Setting any required VM passwords");
2900
    if (qemuInitPasswords(conn, driver, vm, qemuCmdFlags) < 0)
2901
        goto cleanup;
2902

D
Daniel P. Berrange 已提交
2903 2904 2905
    /* If we have -device, then addresses are assigned explicitly.
     * If not, then we have to detect dynamic ones here */
    if (!(qemuCmdFlags & QEMUD_CMD_FLAG_DEVICE)) {
2906
        DEBUG0("Determining domain device PCI addresses");
D
Daniel P. Berrange 已提交
2907
        if (qemuInitPCIAddresses(driver, vm) < 0)
2908
            goto cleanup;
D
Daniel P. Berrange 已提交
2909
    }
2910

2911
    DEBUG0("Setting initial memory amount");
2912
    qemuDomainObjEnterMonitorWithDriver(driver, vm);
2913
    if (qemuMonitorSetBalloon(priv->mon, vm->def->mem.cur_balloon) < 0) {
2914
        qemuDomainObjExitMonitorWithDriver(driver, vm);
2915
        goto cleanup;
2916
    }
H
Hu Tao 已提交
2917
    qemuDomainObjExitMonitorWithDriver(driver, vm);
2918

2919
    if (!start_paused) {
2920
        DEBUG0("Starting domain CPUs");
2921
        /* Allow the CPUS to start executing */
H
Hu Tao 已提交
2922
        if (doStartCPUs(driver, vm, conn) < 0) {
2923
            if (virGetLastError() == NULL)
2924 2925
                qemuReportError(VIR_ERR_INTERNAL_ERROR,
                                "%s", _("resume operation failed"));
2926
            goto cleanup;
2927 2928
        }
    }
2929

2930

2931
    DEBUG0("Writing domain status to disk");
2932
    if (virDomainSaveStatus(driver->caps, driver->stateDir, vm) < 0)
2933 2934
        goto cleanup;

E
Eric Blake 已提交
2935
    virCommandFree(cmd);
2936
    VIR_FORCE_CLOSE(logfile);
2937

2938
    return 0;
2939 2940

cleanup:
2941 2942 2943
    /* We jump here if we failed to start the VM for any reason, or
     * if we failed to initialize the now running VM. kill it off and
     * pretend we never started it */
E
Eric Blake 已提交
2944
    virCommandFree(cmd);
2945
    VIR_FORCE_CLOSE(logfile);
E
Eric Blake 已提交
2946
    qemudShutdownVMDaemon(driver, vm, 0);
2947 2948

    return -1;
2949 2950
}

2951
static void qemudShutdownVMDaemon(struct qemud_driver *driver,
2952 2953
                                  virDomainObjPtr vm,
                                  int migrated) {
D
Daniel P. Berrange 已提交
2954
    int ret;
2955
    int retries = 0;
2956
    qemuDomainObjPrivatePtr priv = vm->privateData;
2957
    virErrorPtr orig_err;
2958 2959
    virDomainDefPtr def;
    int i;
2960 2961 2962
    int logfile = -1;
    char *timestamp;
    char ebuf[1024];
D
Daniel P. Berrange 已提交
2963

2964 2965
    VIR_DEBUG("Shutting down VM '%s' pid=%d migrated=%d",
              vm->def->name, vm->pid, migrated);
2966

2967
    if ((logfile = qemudLogFD(driver, vm->def->name, true)) < 0) {
2968 2969 2970 2971 2972 2973 2974 2975 2976 2977 2978 2979 2980 2981 2982 2983 2984 2985 2986 2987 2988 2989 2990
        /* To not break the normal domain shutdown process, skip the
         * timestamp log writing if failed on opening log file. */
        VIR_WARN("Unable to open logfile: %s",
                  virStrerror(errno, ebuf, sizeof ebuf));
    } else {
        if ((timestamp = virTimestamp()) == NULL) {
            virReportOOMError();
        } else {
            if (safewrite(logfile, timestamp, strlen(timestamp)) < 0 ||
                safewrite(logfile, SHUTDOWN_POSTFIX,
                          strlen(SHUTDOWN_POSTFIX)) < 0) {
                VIR_WARN("Unable to write timestamp to logfile: %s",
                         virStrerror(errno, ebuf, sizeof ebuf));
            }

            VIR_FREE(timestamp);
        }

        if (VIR_CLOSE(logfile) < 0)
             VIR_WARN("Unable to close logfile: %s",
                      virStrerror(errno, ebuf, sizeof ebuf));
    }

2991 2992 2993 2994
    /* This method is routinely used in clean up paths. Disable error
     * reporting so we don't squash a legit error. */
    orig_err = virSaveLastError();

2995
    virDomainConfVMNWFilterTeardown(vm);
S
Stefan Berger 已提交
2996

2997
    if (driver->macFilter) {
2998
        def = vm->def;
2999 3000 3001 3002
        for (i = 0 ; i < def->nnets ; i++) {
            virDomainNetDefPtr net = def->nets[i];
            if (net->ifname == NULL)
                continue;
3003
            if ((errno = networkDisallowMacOnPort(driver, net->ifname,
3004
                                                  net->mac))) {
3005
                virReportSystemError(errno,
3006 3007 3008 3009 3010 3011
             _("failed to remove ebtables rule to allow MAC address on  '%s'"),
                                     net->ifname);
            }
        }
    }

3012
    /* This will safely handle a non-running guest with pid=0 or pid=-1*/
G
Guido Günther 已提交
3013 3014
    if (virKillProcess(vm->pid, 0) == 0 &&
        virKillProcess(vm->pid, SIGTERM) < 0)
3015
        virReportSystemError(errno,
3016 3017
                             _("Failed to send SIGTERM to %s (%d)"),
                             vm->def->name, vm->pid);
3018

3019 3020
    if (priv->mon)
        qemuMonitorClose(priv->mon);
3021

3022
    if (priv->monConfig) {
3023 3024 3025
        if (priv->monConfig->type == VIR_DOMAIN_CHR_TYPE_UNIX)
            unlink(priv->monConfig->data.nix.path);
        virDomainChrSourceDefFree(priv->monConfig);
3026
        priv->monConfig = NULL;
3027 3028
    }

G
Guido Günther 已提交
3029 3030
    /* shut it off for sure */
    virKillProcess(vm->pid, SIGKILL);
3031

3032 3033 3034 3035 3036 3037 3038 3039 3040 3041
    /* now that we know it's stopped call the hook if present */
    if (virHookPresent(VIR_HOOK_DRIVER_QEMU)) {
        char *xml = virDomainDefFormat(vm->def, 0);

        /* we can't stop the operation even if the script raised an error */
        virHookCall(VIR_HOOK_DRIVER_QEMU, vm->def->name,
                    VIR_HOOK_QEMU_OP_STOPPED, VIR_HOOK_SUBOP_END, NULL, xml);
        VIR_FREE(xml);
    }

3042
    /* Reset Security Labels */
3043 3044 3045
    virSecurityManagerRestoreAllLabel(driver->securityManager,
                                      vm, migrated);
    virSecurityManagerReleaseLabel(driver->securityManager, vm);
3046

3047 3048 3049 3050 3051 3052 3053
    /* Clear out dynamically assigned labels */
    if (vm->def->seclabel.type == VIR_DOMAIN_SECLABEL_DYNAMIC) {
        VIR_FREE(vm->def->seclabel.model);
        VIR_FREE(vm->def->seclabel.label);
        VIR_FREE(vm->def->seclabel.imagelabel);
    }

D
Daniel P. Berrange 已提交
3054
    virDomainDefClearDeviceAliases(vm->def);
3055 3056 3057 3058 3059
    if (!priv->persistentAddrs) {
        virDomainDefClearPCIAddresses(vm->def);
        qemuDomainPCIAddressSetFree(priv->pciaddrs);
        priv->pciaddrs = NULL;
    }
3060

3061
    qemuDomainReAttachHostDevices(driver, vm->def);
3062

S
Stefan Berger 已提交
3063 3064 3065 3066
#if WITH_MACVTAP
    def = vm->def;
    for (i = 0; i < def->nnets; i++) {
        virDomainNetDefPtr net = def->nets[i];
3067
        if (net->type == VIR_DOMAIN_NET_TYPE_DIRECT) {
3068
            delMacvtap(net->ifname, net->mac, net->data.direct.linkdev,
3069
                       &net->data.direct.virtPortProfile);
3070 3071
            VIR_FREE(net->ifname);
        }
S
Stefan Berger 已提交
3072 3073 3074
    }
#endif

3075
retry:
3076
    if ((ret = qemuRemoveCgroup(driver, vm, 0)) < 0) {
3077 3078 3079 3080 3081 3082 3083 3084
        if (ret == -EBUSY && (retries++ < 5)) {
            usleep(200*1000);
            goto retry;
        }
        VIR_WARN("Failed to remove cgroup for %s",
                 vm->def->name);
    }

3085
    qemudRemoveDomainStatus(driver, vm);
D
Daniel P. Berrange 已提交
3086

3087 3088 3089 3090 3091
    /* Remove VNC port from port reservation bitmap, but only if it was
       reserved by the driver (autoport=yes)
    */
    if ((vm->def->ngraphics == 1) &&
        vm->def->graphics[0]->type == VIR_DOMAIN_GRAPHICS_TYPE_VNC &&
3092 3093 3094 3095 3096 3097 3098 3099
        vm->def->graphics[0]->data.vnc.autoport) {
        qemuReturnPort(driver, vm->def->graphics[0]->data.vnc.port);
    }
    if ((vm->def->ngraphics == 1) &&
        vm->def->graphics[0]->type == VIR_DOMAIN_GRAPHICS_TYPE_SPICE &&
        vm->def->graphics[0]->data.spice.autoport) {
        qemuReturnPort(driver, vm->def->graphics[0]->data.spice.port);
        qemuReturnPort(driver, vm->def->graphics[0]->data.spice.tlsPort);
3100 3101
    }

3102
    vm->pid = -1;
3103
    vm->def->id = -1;
3104
    vm->state = VIR_DOMAIN_SHUTOFF;
3105 3106
    VIR_FREE(priv->vcpupids);
    priv->nvcpupids = 0;
3107 3108

    if (vm->newDef) {
3109
        virDomainDefFree(vm->def);
3110
        vm->def = vm->newDef;
3111
        vm->def->id = -1;
3112 3113
        vm->newDef = NULL;
    }
3114 3115 3116 3117 3118

    if (orig_err) {
        virSetError(orig_err);
        virFreeError(orig_err);
    }
3119 3120
}

3121
static virDrvOpenStatus qemudOpen(virConnectPtr conn,
3122
                                  virConnectAuthPtr auth ATTRIBUTE_UNUSED,
3123
                                  int flags ATTRIBUTE_UNUSED) {
3124
    if (conn->uri == NULL) {
3125 3126 3127
        if (qemu_driver == NULL)
            return VIR_DRV_OPEN_DECLINED;

3128
        conn->uri = xmlParseURI(qemu_driver->privileged ?
3129 3130
                                "qemu:///system" :
                                "qemu:///session");
3131
        if (!conn->uri) {
3132
            virReportOOMError();
3133 3134
            return VIR_DRV_OPEN_ERROR;
        }
3135 3136 3137 3138 3139 3140 3141 3142 3143 3144
    } else {
        /* If URI isn't 'qemu' its definitely not for us */
        if (conn->uri->scheme == NULL ||
            STRNEQ(conn->uri->scheme, "qemu"))
            return VIR_DRV_OPEN_DECLINED;

        /* Allow remote driver to deal with URIs with hostname server */
        if (conn->uri->server != NULL)
            return VIR_DRV_OPEN_DECLINED;

3145
        if (qemu_driver == NULL) {
3146 3147
            qemuReportError(VIR_ERR_INTERNAL_ERROR, "%s",
                            _("qemu state driver is not active"));
3148 3149 3150
            return VIR_DRV_OPEN_ERROR;
        }

3151
        if (conn->uri->path == NULL) {
3152 3153 3154 3155 3156
            qemuReportError(VIR_ERR_INTERNAL_ERROR,
                            _("no QEMU URI path given, try %s"),
                            qemu_driver->privileged
                            ? "qemu:///system"
                            : "qemu:///session");
3157 3158 3159
                return VIR_DRV_OPEN_ERROR;
        }

3160
        if (qemu_driver->privileged) {
3161 3162
            if (STRNEQ (conn->uri->path, "/system") &&
                STRNEQ (conn->uri->path, "/session")) {
3163 3164 3165
                qemuReportError(VIR_ERR_INTERNAL_ERROR,
                                _("unexpected QEMU URI path '%s', try qemu:///system"),
                                conn->uri->path);
3166 3167 3168 3169
                return VIR_DRV_OPEN_ERROR;
            }
        } else {
            if (STRNEQ (conn->uri->path, "/session")) {
3170 3171 3172
                qemuReportError(VIR_ERR_INTERNAL_ERROR,
                                _("unexpected QEMU URI path '%s', try qemu:///session"),
                                conn->uri->path);
3173 3174 3175
                return VIR_DRV_OPEN_ERROR;
            }
        }
3176 3177 3178 3179 3180 3181 3182
    }
    conn->privateData = qemu_driver;

    return VIR_DRV_OPEN_SUCCESS;
}

static int qemudClose(virConnectPtr conn) {
3183
    struct qemud_driver *driver = conn->privateData;
3184 3185

    /* Get rid of callbacks registered for this conn */
3186
    qemuDriverLock(driver);
3187
    virDomainEventCallbackListRemoveConn(conn, driver->domainEventCallbacks);
3188
    qemuDriverUnlock(driver);
3189 3190 3191 3192 3193 3194

    conn->privateData = NULL;

    return 0;
}

D
Daniel Veillard 已提交
3195 3196 3197 3198 3199
/* Which features are supported by this driver? */
static int
qemudSupportsFeature (virConnectPtr conn ATTRIBUTE_UNUSED, int feature)
{
    switch (feature) {
3200 3201 3202 3203 3204
    case VIR_DRV_FEATURE_MIGRATION_V2:
    case VIR_DRV_FEATURE_MIGRATION_P2P:
        return 1;
    default:
        return 0;
D
Daniel Veillard 已提交
3205 3206 3207
    }
}

3208
static const char *qemudGetType(virConnectPtr conn ATTRIBUTE_UNUSED) {
3209
    return "QEMU";
3210 3211
}

3212

3213 3214 3215 3216 3217 3218 3219 3220 3221 3222 3223 3224 3225
static int qemuIsSecure(virConnectPtr conn ATTRIBUTE_UNUSED)
{
    /* Trivially secure, since always inside the daemon */
    return 1;
}

static int qemuIsEncrypted(virConnectPtr conn ATTRIBUTE_UNUSED)
{
    /* Not encrypted, but remote driver takes care of that */
    return 0;
}


3226 3227 3228 3229
static int kvmGetMaxVCPUs(void) {
    int maxvcpus = 1;

    int r, fd;
3230

3231 3232
    fd = open(KVM_DEVICE, O_RDONLY);
    if (fd < 0) {
3233
        virReportSystemError(errno, _("Unable to open %s"), KVM_DEVICE);
3234
        return -1;
3235 3236 3237 3238 3239 3240
    }

    r = ioctl(fd, KVM_CHECK_EXTENSION, KVM_CAP_NR_VCPUS);
    if (r > 0)
        maxvcpus = r;

3241
    VIR_FORCE_CLOSE(fd);
3242 3243 3244 3245
    return maxvcpus;
}


3246
static int qemudGetMaxVCPUs(virConnectPtr conn ATTRIBUTE_UNUSED, const char *type) {
3247 3248 3249
    if (!type)
        return 16;

3250
    if (STRCASEEQ(type, "qemu"))
3251 3252
        return 16;

3253
    if (STRCASEEQ(type, "kvm"))
3254
        return kvmGetMaxVCPUs();
3255

3256
    if (STRCASEEQ(type, "kqemu"))
3257
        return 1;
3258

3259 3260
    qemuReportError(VIR_ERR_INVALID_ARG,
                    _("unknown type '%s'"), type);
3261 3262 3263
    return -1;
}

3264

3265
static char *qemudGetCapabilities(virConnectPtr conn) {
3266
    struct qemud_driver *driver = conn->privateData;
3267
    virCapsPtr caps = NULL;
3268
    char *xml = NULL;
3269

3270
    qemuDriverLock(driver);
3271

3272
    if ((caps = qemuCreateCapabilities(qemu_driver->caps,
3273
                                       qemu_driver)) == NULL) {
3274 3275 3276
        virCapabilitiesFree(caps);
        goto cleanup;
    }
3277

3278
    virCapabilitiesFree(qemu_driver->caps);
3279 3280 3281
    qemu_driver->caps = caps;

    if ((xml = virCapabilitiesFormatXML(driver->caps)) == NULL)
3282
        virReportOOMError();
3283 3284

cleanup:
3285
    qemuDriverUnlock(driver);
3286

3287
    return xml;
3288 3289 3290
}


3291 3292 3293 3294 3295
static int
qemudGetProcessInfo(unsigned long long *cpuTime, int *lastCpu, int pid,
                    int tid)
{
    char *proc;
D
Daniel P. Berrange 已提交
3296
    FILE *pidinfo;
3297
    unsigned long long usertime, systime;
3298 3299
    int cpu;
    int ret;
D
Daniel P. Berrange 已提交
3300

3301
    if (tid)
3302
        ret = virAsprintf(&proc, "/proc/%d/task/%d/stat", pid, tid);
3303
    else
3304 3305
        ret = virAsprintf(&proc, "/proc/%d/stat", pid);
    if (ret < 0)
D
Daniel P. Berrange 已提交
3306 3307 3308 3309
        return -1;

    if (!(pidinfo = fopen(proc, "r"))) {
        /* VM probably shut down, so fake 0 */
3310 3311 3312 3313
        if (cpuTime)
            *cpuTime = 0;
        if (lastCpu)
            *lastCpu = 0;
3314
        VIR_FREE(proc);
D
Daniel P. Berrange 已提交
3315 3316
        return 0;
    }
3317
    VIR_FREE(proc);
D
Daniel P. Berrange 已提交
3318

3319 3320 3321 3322 3323 3324 3325 3326 3327 3328
    /* See 'man proc' for information about what all these fields are. We're
     * only interested in a very few of them */
    if (fscanf(pidinfo,
               /* pid -> stime */
               "%*d %*s %*c %*d %*d %*d %*d %*d %*u %*u %*u %*u %*u %llu %llu"
               /* cutime -> endcode */
               "%*d %*d %*d %*d %*d %*u %*u %*d %*u %*u %*u %*u"
               /* startstack -> processor */
               "%*u %*u %*u %*u %*u %*u %*u %*u %*u %*u %*d %d",
               &usertime, &systime, &cpu) != 3) {
3329
        VIR_FORCE_FCLOSE(pidinfo);
3330 3331
        VIR_WARN0("cannot parse process status data");
        errno = -EINVAL;
D
Daniel P. Berrange 已提交
3332 3333 3334 3335 3336 3337 3338 3339
        return -1;
    }

    /* We got jiffies
     * We want nanoseconds
     * _SC_CLK_TCK is jiffies per second
     * So calulate thus....
     */
3340 3341 3342 3343 3344
    if (cpuTime)
        *cpuTime = 1000ull * 1000ull * 1000ull * (usertime + systime) / (unsigned long long)sysconf(_SC_CLK_TCK);
    if (lastCpu)
        *lastCpu = cpu;

D
Daniel P. Berrange 已提交
3345

3346 3347
    VIR_DEBUG("Got status for %d/%d user=%llu sys=%llu cpu=%d",
              pid, tid, usertime, systime, cpu);
D
Daniel P. Berrange 已提交
3348

3349
    VIR_FORCE_FCLOSE(pidinfo);
D
Daniel P. Berrange 已提交
3350 3351 3352 3353 3354

    return 0;
}


3355
static virDomainPtr qemudDomainLookupByID(virConnectPtr conn,
3356
                                          int id) {
3357 3358 3359 3360
    struct qemud_driver *driver = conn->privateData;
    virDomainObjPtr vm;
    virDomainPtr dom = NULL;

3361
    qemuDriverLock(driver);
3362
    vm  = virDomainFindByID(&driver->domains, id);
3363
    qemuDriverUnlock(driver);
3364 3365

    if (!vm) {
3366 3367
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching id %d"), id);
3368
        goto cleanup;
3369 3370
    }

3371
    dom = virGetDomain(conn, vm->def->name, vm->def->uuid);
3372
    if (dom) dom->id = vm->def->id;
3373 3374

cleanup:
3375 3376
    if (vm)
        virDomainObjUnlock(vm);
3377 3378
    return dom;
}
3379

3380
static virDomainPtr qemudDomainLookupByUUID(virConnectPtr conn,
3381
                                            const unsigned char *uuid) {
3382 3383 3384
    struct qemud_driver *driver = conn->privateData;
    virDomainObjPtr vm;
    virDomainPtr dom = NULL;
3385

3386
    qemuDriverLock(driver);
3387
    vm = virDomainFindByUUID(&driver->domains, uuid);
3388 3389
    qemuDriverUnlock(driver);

3390
    if (!vm) {
3391 3392
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(uuid, uuidstr);
3393 3394
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
3395
        goto cleanup;
3396 3397
    }

3398
    dom = virGetDomain(conn, vm->def->name, vm->def->uuid);
3399
    if (dom) dom->id = vm->def->id;
3400 3401

cleanup:
3402 3403
    if (vm)
        virDomainObjUnlock(vm);
3404 3405
    return dom;
}
3406

3407
static virDomainPtr qemudDomainLookupByName(virConnectPtr conn,
3408
                                            const char *name) {
3409 3410 3411
    struct qemud_driver *driver = conn->privateData;
    virDomainObjPtr vm;
    virDomainPtr dom = NULL;
3412

3413
    qemuDriverLock(driver);
3414
    vm = virDomainFindByName(&driver->domains, name);
3415 3416
    qemuDriverUnlock(driver);

3417
    if (!vm) {
3418 3419
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching name '%s'"), name);
3420
        goto cleanup;
3421 3422
    }

3423
    dom = virGetDomain(conn, vm->def->name, vm->def->uuid);
3424
    if (dom) dom->id = vm->def->id;
3425 3426

cleanup:
3427 3428
    if (vm)
        virDomainObjUnlock(vm);
3429 3430 3431
    return dom;
}

3432 3433 3434 3435 3436 3437 3438 3439 3440 3441 3442

static int qemuDomainIsActive(virDomainPtr dom)
{
    struct qemud_driver *driver = dom->conn->privateData;
    virDomainObjPtr obj;
    int ret = -1;

    qemuDriverLock(driver);
    obj = virDomainFindByUUID(&driver->domains, dom->uuid);
    qemuDriverUnlock(driver);
    if (!obj) {
3443
        qemuReportError(VIR_ERR_NO_DOMAIN, NULL);
3444 3445 3446 3447 3448 3449 3450 3451 3452 3453 3454 3455 3456 3457 3458 3459 3460 3461 3462 3463
        goto cleanup;
    }
    ret = virDomainObjIsActive(obj);

cleanup:
    if (obj)
        virDomainObjUnlock(obj);
    return ret;
}

static int qemuDomainIsPersistent(virDomainPtr dom)
{
    struct qemud_driver *driver = dom->conn->privateData;
    virDomainObjPtr obj;
    int ret = -1;

    qemuDriverLock(driver);
    obj = virDomainFindByUUID(&driver->domains, dom->uuid);
    qemuDriverUnlock(driver);
    if (!obj) {
3464
        qemuReportError(VIR_ERR_NO_DOMAIN, NULL);
3465 3466 3467 3468 3469 3470 3471 3472 3473 3474
        goto cleanup;
    }
    ret = obj->persistent;

cleanup:
    if (obj)
        virDomainObjUnlock(obj);
    return ret;
}

3475 3476 3477 3478 3479 3480 3481 3482 3483 3484 3485 3486 3487 3488 3489 3490 3491 3492 3493 3494
static int qemuDomainIsUpdated(virDomainPtr dom)
{
    struct qemud_driver *driver = dom->conn->privateData;
    virDomainObjPtr obj;
    int ret = -1;

    qemuDriverLock(driver);
    obj = virDomainFindByUUID(&driver->domains, dom->uuid);
    qemuDriverUnlock(driver);
    if (!obj) {
        qemuReportError(VIR_ERR_NO_DOMAIN, NULL);
        goto cleanup;
    }
    ret = obj->updated;

cleanup:
    if (obj)
        virDomainObjUnlock(obj);
    return ret;
}
3495

3496
static int qemudGetVersion(virConnectPtr conn, unsigned long *version) {
3497 3498 3499
    struct qemud_driver *driver = conn->privateData;
    int ret = -1;

3500
    qemuDriverLock(driver);
3501
    if (qemuCapsExtractVersion(driver->caps, &driver->qemuVersion) < 0)
3502
        goto cleanup;
3503

3504
    *version = driver->qemuVersion;
3505 3506 3507
    ret = 0;

cleanup:
3508
    qemuDriverUnlock(driver);
3509
    return ret;
D
Daniel P. Berrange 已提交
3510 3511
}

3512
static int qemudListDomains(virConnectPtr conn, int *ids, int nids) {
3513
    struct qemud_driver *driver = conn->privateData;
3514
    int n;
3515

3516
    qemuDriverLock(driver);
3517
    n = virDomainObjListGetActiveIDs(&driver->domains, ids, nids);
3518
    qemuDriverUnlock(driver);
3519

3520
    return n;
D
Daniel P. Berrange 已提交
3521
}
3522

3523
static int qemudNumDomains(virConnectPtr conn) {
3524
    struct qemud_driver *driver = conn->privateData;
3525
    int n;
3526

3527
    qemuDriverLock(driver);
3528
    n = virDomainObjListNumOfDomains(&driver->domains, 1);
3529
    qemuDriverUnlock(driver);
3530

3531
    return n;
D
Daniel P. Berrange 已提交
3532
}
3533

3534
static virDomainPtr qemudDomainCreate(virConnectPtr conn, const char *xml,
3535
                                      unsigned int flags) {
3536
    struct qemud_driver *driver = conn->privateData;
3537
    virDomainDefPtr def;
3538
    virDomainObjPtr vm = NULL;
3539
    virDomainPtr dom = NULL;
3540
    virDomainEventPtr event = NULL;
D
Daniel P. Berrange 已提交
3541

3542
    virCheckFlags(VIR_DOMAIN_START_PAUSED, NULL);
3543

3544
    qemuDriverLock(driver);
3545
    if (!(def = virDomainDefParseString(driver->caps, xml,
3546
                                        VIR_DOMAIN_XML_INACTIVE)))
3547
        goto cleanup;
3548

3549
    if (virSecurityManagerVerify(driver->securityManager, def) < 0)
3550 3551
        goto cleanup;

3552 3553
    if (virDomainObjIsDuplicate(&driver->domains, def, 1) < 0)
        goto cleanup;
3554

3555 3556 3557 3558 3559 3560
    if (qemudCanonicalizeMachine(driver, def) < 0)
        goto cleanup;

    if (qemuAssignPCIAddresses(def) < 0)
        goto cleanup;

3561
    if (!(vm = virDomainAssignDef(driver->caps,
3562
                                  &driver->domains,
3563
                                  def, false)))
3564 3565 3566
        goto cleanup;

    def = NULL;
D
Daniel P. Berrange 已提交
3567

3568 3569 3570
    if (qemuDomainObjBeginJobWithDriver(driver, vm) < 0)
        goto cleanup; /* XXXX free the 'vm' we created ? */

3571 3572
    if (qemudStartVMDaemon(conn, driver, vm, NULL,
                           (flags & VIR_DOMAIN_START_PAUSED) != 0,
3573
                           -1, NULL, VIR_VM_OP_CREATE) < 0) {
3574
        qemuDomainStartAudit(vm, "booted", false);
3575 3576 3577
        if (qemuDomainObjEndJob(vm) > 0)
            virDomainRemoveInactive(&driver->domains,
                                    vm);
3578
        vm = NULL;
3579
        goto cleanup;
D
Daniel P. Berrange 已提交
3580
    }
3581 3582 3583 3584

    event = virDomainEventNewFromObj(vm,
                                     VIR_DOMAIN_EVENT_STARTED,
                                     VIR_DOMAIN_EVENT_STARTED_BOOTED);
3585
    qemuDomainStartAudit(vm, "booted", true);
D
Daniel P. Berrange 已提交
3586

3587
    dom = virGetDomain(conn, vm->def->name, vm->def->uuid);
3588
    if (dom) dom->id = vm->def->id;
3589

3590 3591 3592
    if (vm &&
        qemuDomainObjEndJob(vm) == 0)
        vm = NULL;
3593

3594 3595
cleanup:
    virDomainDefFree(def);
3596 3597
    if (vm)
        virDomainObjUnlock(vm);
3598 3599
    if (event)
        qemuDomainEventQueue(driver, event);
3600
    qemuDriverUnlock(driver);
3601
    return dom;
D
Daniel P. Berrange 已提交
3602 3603 3604
}


3605
static int qemudDomainSuspend(virDomainPtr dom) {
3606 3607 3608
    struct qemud_driver *driver = dom->conn->privateData;
    virDomainObjPtr vm;
    int ret = -1;
3609
    virDomainEventPtr event = NULL;
3610
    qemuDomainObjPrivatePtr priv;
3611

3612
    qemuDriverLock(driver);
3613
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
3614

D
Daniel P. Berrange 已提交
3615
    if (!vm) {
3616 3617
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
3618 3619
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
3620
        goto cleanup;
D
Daniel P. Berrange 已提交
3621
    }
D
Daniel P. Berrange 已提交
3622
    if (!virDomainObjIsActive(vm)) {
3623 3624
        qemuReportError(VIR_ERR_OPERATION_INVALID,
                        "%s", _("domain is not running"));
3625
        goto cleanup;
D
Daniel P. Berrange 已提交
3626
    }
3627 3628 3629

    priv = vm->privateData;

3630
    if (priv->jobActive == QEMU_JOB_MIGRATION_OUT) {
3631 3632 3633 3634 3635 3636 3637 3638 3639 3640 3641 3642 3643 3644
        if (vm->state != VIR_DOMAIN_PAUSED) {
            VIR_DEBUG("Requesting domain pause on %s",
                      vm->def->name);
            priv->jobSignals |= QEMU_JOB_SIGNAL_SUSPEND;
        }
        ret = 0;
        goto cleanup;
    } else {
        if (qemuDomainObjBeginJobWithDriver(driver, vm) < 0)
            goto cleanup;

        if (!virDomainObjIsActive(vm)) {
            qemuReportError(VIR_ERR_OPERATION_INVALID,
                            "%s", _("domain is not running"));
3645
            goto endjob;
3646
        }
3647
        if (vm->state != VIR_DOMAIN_PAUSED) {
H
Hu Tao 已提交
3648
            if (doStopCPUs(driver, vm) < 0) {
3649
                goto endjob;
3650
            }
3651 3652 3653 3654 3655 3656 3657
            event = virDomainEventNewFromObj(vm,
                                             VIR_DOMAIN_EVENT_SUSPENDED,
                                             VIR_DOMAIN_EVENT_SUSPENDED_PAUSED);
        }
        if (virDomainSaveStatus(driver->caps, driver->stateDir, vm) < 0)
            goto endjob;
        ret = 0;
D
Daniel P. Berrange 已提交
3658
    }
3659

3660
endjob:
3661 3662
    if (qemuDomainObjEndJob(vm) == 0)
        vm = NULL;
3663

3664
cleanup:
3665 3666
    if (vm)
        virDomainObjUnlock(vm);
3667

3668
    if (event)
3669
        qemuDomainEventQueue(driver, event);
3670
    qemuDriverUnlock(driver);
3671
    return ret;
D
Daniel P. Berrange 已提交
3672 3673 3674
}


3675
static int qemudDomainResume(virDomainPtr dom) {
3676 3677 3678
    struct qemud_driver *driver = dom->conn->privateData;
    virDomainObjPtr vm;
    int ret = -1;
3679
    virDomainEventPtr event = NULL;
3680

3681
    qemuDriverLock(driver);
3682
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
3683

D
Daniel P. Berrange 已提交
3684
    if (!vm) {
3685 3686
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
3687 3688
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
3689
        goto cleanup;
D
Daniel P. Berrange 已提交
3690
    }
3691 3692 3693 3694

    if (qemuDomainObjBeginJobWithDriver(driver, vm) < 0)
        goto cleanup;

D
Daniel P. Berrange 已提交
3695
    if (!virDomainObjIsActive(vm)) {
3696 3697
        qemuReportError(VIR_ERR_OPERATION_INVALID,
                        "%s", _("domain is not running"));
3698
        goto endjob;
D
Daniel P. Berrange 已提交
3699
    }
3700
    if (vm->state == VIR_DOMAIN_PAUSED) {
H
Hu Tao 已提交
3701
        if (doStartCPUs(driver, vm, dom->conn) < 0) {
3702
            if (virGetLastError() == NULL)
3703 3704
                qemuReportError(VIR_ERR_OPERATION_FAILED,
                                "%s", _("resume operation failed"));
3705
            goto endjob;
3706
        }
3707 3708 3709
        event = virDomainEventNewFromObj(vm,
                                         VIR_DOMAIN_EVENT_RESUMED,
                                         VIR_DOMAIN_EVENT_RESUMED_UNPAUSED);
D
Daniel P. Berrange 已提交
3710
    }
3711
    if (virDomainSaveStatus(driver->caps, driver->stateDir, vm) < 0)
3712
        goto endjob;
3713 3714
    ret = 0;

3715
endjob:
3716 3717
    if (qemuDomainObjEndJob(vm) == 0)
        vm = NULL;
3718

3719
cleanup:
3720 3721
    if (vm)
        virDomainObjUnlock(vm);
3722
    if (event)
3723
        qemuDomainEventQueue(driver, event);
3724
    qemuDriverUnlock(driver);
3725
    return ret;
D
Daniel P. Berrange 已提交
3726 3727 3728
}


3729
static int qemudDomainShutdown(virDomainPtr dom) {
3730 3731 3732
    struct qemud_driver *driver = dom->conn->privateData;
    virDomainObjPtr vm;
    int ret = -1;
3733

3734
    qemuDriverLock(driver);
3735
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
3736 3737
    qemuDriverUnlock(driver);

3738
    if (!vm) {
3739 3740
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
3741 3742
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
3743
        goto cleanup;
3744 3745
    }

3746 3747 3748
    if (qemuDomainObjBeginJob(vm) < 0)
        goto cleanup;

D
Daniel P. Berrange 已提交
3749
    if (!virDomainObjIsActive(vm)) {
3750 3751
        qemuReportError(VIR_ERR_OPERATION_INVALID,
                        "%s", _("domain is not running"));
3752
        goto endjob;
3753 3754
    }

3755
    qemuDomainObjPrivatePtr priv = vm->privateData;
3756 3757 3758
    qemuDomainObjEnterMonitor(vm);
    ret = qemuMonitorSystemPowerdown(priv->mon);
    qemuDomainObjExitMonitor(vm);
3759

3760
endjob:
3761 3762
    if (qemuDomainObjEndJob(vm) == 0)
        vm = NULL;
3763

3764
cleanup:
3765 3766
    if (vm)
        virDomainObjUnlock(vm);
3767
    return ret;
3768 3769 3770
}


3771
static int qemudDomainDestroy(virDomainPtr dom) {
3772 3773 3774
    struct qemud_driver *driver = dom->conn->privateData;
    virDomainObjPtr vm;
    int ret = -1;
3775
    virDomainEventPtr event = NULL;
3776

3777
    qemuDriverLock(driver);
3778
    vm  = virDomainFindByUUID(&driver->domains, dom->uuid);
D
Daniel P. Berrange 已提交
3779
    if (!vm) {
3780 3781
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
3782 3783
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
3784
        goto cleanup;
D
Daniel P. Berrange 已提交
3785
    }
3786 3787 3788 3789

    if (qemuDomainObjBeginJobWithDriver(driver, vm) < 0)
        goto cleanup;

D
Daniel P. Berrange 已提交
3790
    if (!virDomainObjIsActive(vm)) {
3791 3792
        qemuReportError(VIR_ERR_OPERATION_INVALID,
                        "%s", _("domain is not running"));
3793
        goto endjob;
3794
    }
3795

3796
    qemudShutdownVMDaemon(driver, vm, 0);
3797 3798 3799
    event = virDomainEventNewFromObj(vm,
                                     VIR_DOMAIN_EVENT_STOPPED,
                                     VIR_DOMAIN_EVENT_STOPPED_DESTROYED);
3800 3801
    qemuDomainStopAudit(vm, "destroyed");

3802
    if (!vm->persistent) {
3803 3804 3805
        if (qemuDomainObjEndJob(vm) > 0)
            virDomainRemoveInactive(&driver->domains,
                                    vm);
3806 3807
        vm = NULL;
    }
3808 3809
    ret = 0;

3810
endjob:
3811 3812 3813
    if (vm &&
        qemuDomainObjEndJob(vm) == 0)
        vm = NULL;
3814

3815
cleanup:
3816 3817
    if (vm)
        virDomainObjUnlock(vm);
3818 3819
    if (event)
        qemuDomainEventQueue(driver, event);
3820
    qemuDriverUnlock(driver);
3821
    return ret;
D
Daniel P. Berrange 已提交
3822 3823 3824
}


3825
static char *qemudDomainGetOSType(virDomainPtr dom) {
3826 3827 3828
    struct qemud_driver *driver = dom->conn->privateData;
    virDomainObjPtr vm;
    char *type = NULL;
3829

3830
    qemuDriverLock(driver);
3831
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
3832
    qemuDriverUnlock(driver);
3833
    if (!vm) {
3834 3835
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
3836 3837
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
3838
        goto cleanup;
3839 3840
    }

3841
    if (!(type = strdup(vm->def->os.type)))
3842
        virReportOOMError();
3843 3844

cleanup:
3845 3846
    if (vm)
        virDomainObjUnlock(vm);
3847 3848 3849
    return type;
}

3850 3851
/* Returns max memory in kb, 0 if error */
static unsigned long qemudDomainGetMaxMemory(virDomainPtr dom) {
3852 3853 3854
    struct qemud_driver *driver = dom->conn->privateData;
    virDomainObjPtr vm;
    unsigned long ret = 0;
3855

3856
    qemuDriverLock(driver);
3857
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
3858 3859
    qemuDriverUnlock(driver);

3860
    if (!vm) {
3861 3862
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
3863 3864
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
3865
        goto cleanup;
3866 3867
    }

3868
    ret = vm->def->mem.max_balloon;
3869 3870

cleanup:
3871 3872
    if (vm)
        virDomainObjUnlock(vm);
3873
    return ret;
3874 3875 3876
}

static int qemudDomainSetMemory(virDomainPtr dom, unsigned long newmem) {
3877
    struct qemud_driver *driver = dom->conn->privateData;
3878
    qemuDomainObjPrivatePtr priv;
3879
    virDomainObjPtr vm;
3880
    int ret = -1, r;
3881

3882
    qemuDriverLock(driver);
3883
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
3884
    qemuDriverUnlock(driver);
3885
    if (!vm) {
3886 3887
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
3888 3889
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
3890
        goto cleanup;
3891 3892
    }

3893
    if (newmem > vm->def->mem.max_balloon) {
3894 3895
        qemuReportError(VIR_ERR_INVALID_ARG,
                        "%s", _("cannot set memory higher than max memory"));
3896
        goto cleanup;
3897 3898
    }

3899 3900 3901
    if (qemuDomainObjBeginJob(vm) < 0)
        goto cleanup;

3902 3903 3904 3905 3906 3907
    if (!virDomainObjIsActive(vm)) {
        qemuReportError(VIR_ERR_OPERATION_INVALID,
                        "%s", _("domain is not running"));
        goto endjob;
    }

3908 3909 3910 3911 3912 3913
    priv = vm->privateData;
    qemuDomainObjEnterMonitor(vm);
    r = qemuMonitorSetBalloon(priv->mon, newmem);
    qemuDomainObjExitMonitor(vm);
    if (r < 0)
        goto endjob;
3914

3915 3916 3917 3918 3919
    /* Lack of balloon support is a fatal error */
    if (r == 0) {
        qemuReportError(VIR_ERR_NO_SUPPORT,
                        "%s", _("cannot set memory of an active domain"));
        goto endjob;
3920
    }
3921

3922
    ret = 0;
3923
endjob:
3924 3925
    if (qemuDomainObjEndJob(vm) == 0)
        vm = NULL;
3926

3927
cleanup:
3928 3929
    if (vm)
        virDomainObjUnlock(vm);
3930
    return ret;
3931 3932
}

3933
static int qemudDomainGetInfo(virDomainPtr dom,
3934
                              virDomainInfoPtr info) {
3935 3936 3937
    struct qemud_driver *driver = dom->conn->privateData;
    virDomainObjPtr vm;
    int ret = -1;
3938 3939
    int err;
    unsigned long balloon;
3940

3941
    qemuDriverLock(driver);
3942
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
3943
    qemuDriverUnlock(driver);
D
Daniel P. Berrange 已提交
3944
    if (!vm) {
3945 3946
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
3947 3948
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
3949
        goto cleanup;
D
Daniel P. Berrange 已提交
3950 3951
    }

3952
    info->state = vm->state;
D
Daniel P. Berrange 已提交
3953

D
Daniel P. Berrange 已提交
3954
    if (!virDomainObjIsActive(vm)) {
3955
        info->cpuTime = 0;
D
Daniel P. Berrange 已提交
3956
    } else {
3957
        if (qemudGetProcessInfo(&(info->cpuTime), NULL, vm->pid, 0) < 0) {
3958
            qemuReportError(VIR_ERR_OPERATION_FAILED, ("cannot read cputime for domain"));
3959
            goto cleanup;
D
Daniel P. Berrange 已提交
3960 3961 3962
        }
    }

3963
    info->maxMem = vm->def->mem.max_balloon;
3964

D
Daniel P. Berrange 已提交
3965
    if (virDomainObjIsActive(vm)) {
3966
        qemuDomainObjPrivatePtr priv = vm->privateData;
3967 3968 3969

        if ((vm->def->memballoon != NULL) &&
            (vm->def->memballoon->model == VIR_DOMAIN_MEMBALLOON_MODEL_NONE)) {
3970
            info->memory = vm->def->mem.max_balloon;
3971
        } else if (!priv->jobActive) {
3972 3973
            if (qemuDomainObjBeginJob(vm) < 0)
                goto cleanup;
3974 3975 3976 3977 3978 3979 3980 3981 3982
            if (!virDomainObjIsActive(vm))
                err = 0;
            else {
                qemuDomainObjEnterMonitor(vm);
                err = qemuMonitorGetBalloonInfo(priv->mon, &balloon);
                qemuDomainObjExitMonitor(vm);
            }
            if (qemuDomainObjEndJob(vm) == 0) {
                vm = NULL;
3983 3984 3985
                goto cleanup;
            }

3986 3987
            if (err < 0)
                goto cleanup;
3988 3989
            if (err == 0)
                /* Balloon not supported, so maxmem is always the allocation */
3990
                info->memory = vm->def->mem.max_balloon;
3991 3992 3993
            else
                info->memory = balloon;
        } else {
3994
            info->memory = vm->def->mem.cur_balloon;
3995
        }
3996
    } else {
3997
        info->memory = vm->def->mem.cur_balloon;
3998 3999
    }

4000
    info->nrVirtCpu = vm->def->vcpus;
4001 4002 4003
    ret = 0;

cleanup:
4004 4005
    if (vm)
        virDomainObjUnlock(vm);
4006
    return ret;
D
Daniel P. Berrange 已提交
4007 4008 4009
}


4010 4011 4012 4013 4014 4015 4016 4017 4018
/** qemuDomainMigrateOffline:
 * Pause domain for non-live migration.
 */
static int
qemuDomainMigrateOffline(struct qemud_driver *driver,
                         virDomainObjPtr vm)
{
    int ret;

H
Hu Tao 已提交
4019
    ret = doStopCPUs(driver, vm);
4020 4021 4022 4023 4024 4025 4026 4027
    if (ret == 0) {
        virDomainEventPtr event;

        event = virDomainEventNewFromObj(vm,
                                         VIR_DOMAIN_EVENT_SUSPENDED,
                                         VIR_DOMAIN_EVENT_SUSPENDED_MIGRATED);
        if (event)
            qemuDomainEventQueue(driver, event);
H
Hu Tao 已提交
4028
    }
4029 4030 4031 4032 4033

    return ret;
}


4034 4035 4036 4037 4038 4039 4040 4041 4042 4043 4044 4045 4046 4047
static int
qemuDomainWaitForMigrationComplete(struct qemud_driver *driver, virDomainObjPtr vm)
{
    int ret = -1;
    int status;
    unsigned long long memProcessed;
    unsigned long long memRemaining;
    unsigned long long memTotal;
    qemuDomainObjPrivatePtr priv = vm->privateData;

    priv->jobInfo.type = VIR_DOMAIN_JOB_UNBOUNDED;

    while (priv->jobInfo.type == VIR_DOMAIN_JOB_UNBOUNDED) {
        /* Poll every 50ms for progress & to allow cancellation */
4048
        struct timespec ts = { .tv_sec = 0, .tv_nsec = 50 * 1000 * 1000ull };
4049 4050
        struct timeval now;
        int rc;
O
Osier Yang 已提交
4051 4052 4053 4054 4055 4056 4057 4058 4059 4060 4061 4062 4063 4064 4065 4066
        const char *job;

        switch (priv->jobActive) {
            case QEMU_JOB_MIGRATION_OUT:
                job = _("migration job");
                break;
            case QEMU_JOB_SAVE:
                job = _("domain save job");
                break;
            case QEMU_JOB_DUMP:
                job = _("domain core dump job");
                break;
            default:
                job = _("job");
        }

4067

4068
        if (!virDomainObjIsActive(vm)) {
O
Osier Yang 已提交
4069 4070
            qemuReportError(VIR_ERR_INTERNAL_ERROR, "%s: %s",
                            job, _("guest unexpectedly quit"));
4071 4072 4073
            goto cleanup;
        }

4074 4075
        if (priv->jobSignals & QEMU_JOB_SIGNAL_CANCEL) {
            priv->jobSignals ^= QEMU_JOB_SIGNAL_CANCEL;
O
Osier Yang 已提交
4076
            VIR_DEBUG0("Cancelling job at client request");
4077 4078 4079 4080
            qemuDomainObjEnterMonitorWithDriver(driver, vm);
            rc = qemuMonitorMigrateCancel(priv->mon);
            qemuDomainObjExitMonitorWithDriver(driver, vm);
            if (rc < 0) {
O
Osier Yang 已提交
4081
                VIR_WARN0("Unable to cancel job");
4082
            }
4083 4084 4085 4086 4087
        } else if (priv->jobSignals & QEMU_JOB_SIGNAL_SUSPEND) {
            priv->jobSignals ^= QEMU_JOB_SIGNAL_SUSPEND;
            VIR_DEBUG0("Pausing domain for non-live migration");
            if (qemuDomainMigrateOffline(driver, vm) < 0)
                VIR_WARN0("Unable to pause domain");
4088 4089 4090 4091 4092 4093 4094 4095 4096 4097 4098
        } else if (priv->jobSignals & QEMU_JOB_SIGNAL_MIGRATE_DOWNTIME) {
            unsigned long long ms = priv->jobSignalsData.migrateDowntime;

            priv->jobSignals ^= QEMU_JOB_SIGNAL_MIGRATE_DOWNTIME;
            priv->jobSignalsData.migrateDowntime = 0;
            VIR_DEBUG("Setting migration downtime to %llums", ms);
            qemuDomainObjEnterMonitorWithDriver(driver, vm);
            rc = qemuMonitorSetMigrationDowntime(priv->mon, ms);
            qemuDomainObjExitMonitorWithDriver(driver, vm);
            if (rc < 0)
                VIR_WARN0("Unable to set migration downtime");
4099 4100
        }

4101 4102 4103 4104
        /* Repeat check because the job signals might have caused
         * guest to die
         */
        if (!virDomainObjIsActive(vm)) {
O
Osier Yang 已提交
4105 4106
            qemuReportError(VIR_ERR_INTERNAL_ERROR, "%s: %s",
                            job, _("guest unexpectedly quit"));
4107 4108 4109
            goto cleanup;
        }

4110 4111 4112 4113 4114 4115 4116 4117 4118 4119 4120 4121 4122 4123 4124 4125 4126 4127 4128
        qemuDomainObjEnterMonitorWithDriver(driver, vm);
        rc = qemuMonitorGetMigrationStatus(priv->mon,
                                           &status,
                                           &memProcessed,
                                           &memRemaining,
                                           &memTotal);
        qemuDomainObjExitMonitorWithDriver(driver, vm);

        if (rc < 0) {
            priv->jobInfo.type = VIR_DOMAIN_JOB_FAILED;
            goto cleanup;
        }

        if (gettimeofday(&now, NULL) < 0) {
            priv->jobInfo.type = VIR_DOMAIN_JOB_FAILED;
            virReportSystemError(errno, "%s",
                                 _("cannot get time of day"));
            goto cleanup;
        }
4129
        priv->jobInfo.timeElapsed = timeval_to_ms(now) - priv->jobStart;
4130 4131 4132 4133 4134

        switch (status) {
        case QEMU_MONITOR_MIGRATION_STATUS_INACTIVE:
            priv->jobInfo.type = VIR_DOMAIN_JOB_NONE;
            qemuReportError(VIR_ERR_OPERATION_FAILED,
O
Osier Yang 已提交
4135
                            "%s: %s", job, _("is not active"));
4136 4137 4138 4139 4140 4141 4142 4143 4144 4145 4146 4147 4148 4149 4150 4151 4152 4153 4154 4155
            break;

        case QEMU_MONITOR_MIGRATION_STATUS_ACTIVE:
            priv->jobInfo.dataTotal = memTotal;
            priv->jobInfo.dataRemaining = memRemaining;
            priv->jobInfo.dataProcessed = memProcessed;

            priv->jobInfo.memTotal = memTotal;
            priv->jobInfo.memRemaining = memRemaining;
            priv->jobInfo.memProcessed = memProcessed;
            break;

        case QEMU_MONITOR_MIGRATION_STATUS_COMPLETED:
            priv->jobInfo.type = VIR_DOMAIN_JOB_COMPLETED;
            ret = 0;
            break;

        case QEMU_MONITOR_MIGRATION_STATUS_ERROR:
            priv->jobInfo.type = VIR_DOMAIN_JOB_FAILED;
            qemuReportError(VIR_ERR_OPERATION_FAILED,
O
Osier Yang 已提交
4156
                            "%s: %s", job, _("unexpectedly failed"));
4157 4158 4159 4160 4161
            break;

        case QEMU_MONITOR_MIGRATION_STATUS_CANCELLED:
            priv->jobInfo.type = VIR_DOMAIN_JOB_CANCELLED;
            qemuReportError(VIR_ERR_OPERATION_FAILED,
O
Osier Yang 已提交
4162
                            "%s: %s", job, _("canceled by client"));
4163 4164 4165 4166 4167 4168 4169 4170 4171 4172 4173 4174 4175 4176 4177 4178 4179
            break;
        }

        virDomainObjUnlock(vm);
        qemuDriverUnlock(driver);

        nanosleep(&ts, NULL);

        qemuDriverLock(driver);
        virDomainObjLock(vm);
    }

cleanup:
    return ret;
}


4180
#define QEMUD_SAVE_MAGIC "LibvirtQemudSave"
4181 4182 4183
#define QEMUD_SAVE_VERSION 2

enum qemud_save_formats {
4184 4185 4186
    QEMUD_SAVE_FORMAT_RAW = 0,
    QEMUD_SAVE_FORMAT_GZIP = 1,
    QEMUD_SAVE_FORMAT_BZIP2 = 2,
4187 4188
    /*
     * Deprecated by xz and never used as part of a release
4189
     * QEMUD_SAVE_FORMAT_LZMA
4190 4191
     */
    QEMUD_SAVE_FORMAT_XZ = 3,
4192
    QEMUD_SAVE_FORMAT_LZOP = 4,
4193 4194 4195
    /* Note: add new members only at the end.
       These values are used in the on-disk format.
       Do not change or re-use numbers. */
4196 4197

    QEMUD_SAVE_FORMAT_LAST
4198
};
4199

4200 4201 4202 4203 4204
VIR_ENUM_DECL(qemudSaveCompression)
VIR_ENUM_IMPL(qemudSaveCompression, QEMUD_SAVE_FORMAT_LAST,
              "raw",
              "gzip",
              "bzip2",
4205 4206
              "xz",
              "lzop")
4207

4208 4209 4210 4211 4212
struct qemud_save_header {
    char magic[sizeof(QEMUD_SAVE_MAGIC)-1];
    int version;
    int xml_len;
    int was_running;
4213 4214
    int compressed;
    int unused[15];
4215 4216
};

4217 4218 4219 4220 4221 4222 4223
struct fileOpHookData {
    virDomainPtr dom;
    const char *path;
    char *xml;
    struct qemud_save_header *header;
};

4224
/* return -errno on failure, or 0 on success */
4225 4226 4227 4228 4229
static int qemudDomainSaveFileOpHook(int fd, void *data) {
    struct fileOpHookData *hdata = data;
    int ret = 0;

    if (safewrite(fd, hdata->header, sizeof(*hdata->header)) != sizeof(*hdata->header)) {
4230
        ret = -errno;
4231
        qemuReportError(VIR_ERR_OPERATION_FAILED,
4232 4233
                        _("failed to write header to domain save file '%s'"),
                        hdata->path);
4234 4235 4236 4237
        goto endjob;
    }

    if (safewrite(fd, hdata->xml, hdata->header->xml_len) != hdata->header->xml_len) {
4238
        ret = -errno;
4239 4240 4241 4242 4243 4244 4245 4246
        qemuReportError(VIR_ERR_OPERATION_FAILED,
                         _("failed to write xml to '%s'"), hdata->path);
        goto endjob;
    }
endjob:
    return ret;
}

4247 4248 4249
/* this internal function expects the driver lock to already be held on entry */
static int qemudDomainSaveFlag(struct qemud_driver *driver, virDomainPtr dom,
                               virDomainObjPtr vm, const char *path,
4250
                               int compressed)
4251
{
4252
    char *xml = NULL;
4253
    struct qemud_save_header header;
4254 4255
    struct fileOpHookData hdata;
    int bypassSecurityDriver = 0;
4256
    int ret = -1;
4257
    int rc;
4258
    virDomainEventPtr event = NULL;
4259
    qemuDomainObjPrivatePtr priv;
4260 4261
    struct stat sb;
    int is_reg = 0;
4262
    unsigned long long offset;
4263
    virCgroupPtr cgroup = NULL;
4264 4265 4266 4267 4268

    memset(&header, 0, sizeof(header));
    memcpy(header.magic, QEMUD_SAVE_MAGIC, sizeof(header.magic));
    header.version = QEMUD_SAVE_VERSION;

4269
    header.compressed = compressed;
4270

4271
    priv = vm->privateData;
4272

4273 4274 4275
    if (qemuDomainObjBeginJobWithDriver(driver, vm) < 0)
        goto cleanup;

D
Daniel P. Berrange 已提交
4276
    if (!virDomainObjIsActive(vm)) {
4277 4278
        qemuReportError(VIR_ERR_OPERATION_INVALID,
                        "%s", _("domain is not running"));
4279
        goto endjob;
D
Daniel P. Berrange 已提交
4280
    }
4281

O
Osier Yang 已提交
4282 4283
    priv->jobActive = QEMU_JOB_SAVE;

4284 4285 4286
    memset(&priv->jobInfo, 0, sizeof(priv->jobInfo));
    priv->jobInfo.type = VIR_DOMAIN_JOB_UNBOUNDED;

4287 4288 4289
    /* Pause */
    if (vm->state == VIR_DOMAIN_RUNNING) {
        header.was_running = 1;
H
Hu Tao 已提交
4290
        if (doStopCPUs(driver, vm) < 0)
4291
            goto endjob;
4292 4293 4294 4295 4296 4297

        if (!virDomainObjIsActive(vm)) {
            qemuReportError(VIR_ERR_INTERNAL_ERROR, "%s",
                            _("guest unexpectedly quit"));
            goto endjob;
        }
4298 4299 4300
    }

    /* Get XML for the domain */
4301
    xml = virDomainDefFormat(vm->def, VIR_DOMAIN_XML_SECURE);
4302
    if (!xml) {
4303 4304
        qemuReportError(VIR_ERR_OPERATION_FAILED,
                        "%s", _("failed to get domain xml"));
4305
        goto endjob;
4306 4307 4308
    }
    header.xml_len = strlen(xml) + 1;

4309 4310 4311 4312 4313 4314 4315 4316 4317 4318 4319 4320 4321
    /* path might be a pre-existing block dev, in which case
     * we need to skip the create step, and also avoid unlink
     * in the failure case */
    if (stat(path, &sb) < 0) {
        /* Avoid throwing an error here, since it is possible
         * that with NFS we can't actually stat() the file.
         * The subsequent codepaths will still raise an error
         * if a truely fatal problem is hit */
        is_reg = 1;
    } else {
        is_reg = S_ISREG(sb.st_mode);
    }

4322 4323 4324 4325 4326
    offset = sizeof(header) + header.xml_len;

    /* Due to way we append QEMU state on our header with dd,
     * we need to ensure there's a 512 byte boundary. Unfortunately
     * we don't have an explicit offset in the header, so we fake
4327 4328
     * it by padding the XML string with NULLs.
     */
4329 4330 4331 4332 4333 4334 4335 4336 4337 4338 4339 4340 4341
    if (offset % QEMU_MONITOR_MIGRATE_TO_FILE_BS) {
        unsigned long long pad =
            QEMU_MONITOR_MIGRATE_TO_FILE_BS -
            (offset % QEMU_MONITOR_MIGRATE_TO_FILE_BS);

        if (VIR_REALLOC_N(xml, header.xml_len + pad) < 0) {
            virReportOOMError();
            goto endjob;
        }
        memset(xml + header.xml_len, 0, pad);
        offset += pad;
        header.xml_len += pad;
    }
4342

4343 4344 4345 4346 4347 4348
    /* Setup hook data needed by virFileOperation hook function */
    hdata.dom = dom;
    hdata.path = path;
    hdata.xml = xml;
    hdata.header = &header;

4349 4350
    /* Write header to file, followed by XML */

4351
    /* First try creating the file as root */
4352 4353 4354 4355
    if (!is_reg) {
        int fd = open(path, O_WRONLY | O_TRUNC);
        if (fd < 0) {
            virReportSystemError(errno, _("unable to open %s"), path);
4356 4357
            goto endjob;
        }
4358
        if (qemudDomainSaveFileOpHook(fd, &hdata) < 0) {
4359
            VIR_FORCE_CLOSE(fd);
4360 4361
            goto endjob;
        }
4362
        if (VIR_CLOSE(fd) < 0) {
4363
            virReportSystemError(errno, _("unable to close %s"), path);
4364 4365
            goto endjob;
        }
4366 4367 4368 4369 4370
    } else {
        if ((rc = virFileOperation(path, O_CREAT|O_TRUNC|O_WRONLY,
                                  S_IRUSR|S_IWUSR,
                                  getuid(), getgid(),
                                  qemudDomainSaveFileOpHook, &hdata,
4371
                                  0)) < 0) {
4372
            /* If we failed as root, and the error was permission-denied
4373 4374
               (EACCES or EPERM), assume it's on a network-connected share
               where root access is restricted (eg, root-squashed NFS). If the
4375 4376 4377 4378
               qemu user (driver->user) is non-root, just set a flag to
               bypass security driver shenanigans, and retry the operation
               after doing setuid to qemu user */

4379
            if (((rc != -EACCES) && (rc != -EPERM)) ||
4380
                driver->user == getuid()) {
4381
                virReportSystemError(-rc, _("Failed to create domain save file '%s'"),
4382 4383 4384
                                     path);
                goto endjob;
            }
4385

4386
            /* On Linux we can also verify the FS-type of the directory. */
4387 4388 4389 4390 4391 4392 4393 4394 4395 4396 4397 4398 4399 4400 4401 4402 4403 4404
            switch (virStorageFileIsSharedFS(path)) {
                case 1:
                   /* it was on a network share, so we'll continue
                    * as outlined above
                    */
                   break;

                case -1:
                   virReportSystemError(errno,
                                        _("Failed to create domain save file "
                                          "'%s': couldn't determine fs type"),
                                        path);
                   goto endjob;
                   break;

                case 0:
                default:
                   /* local file - log the error returned by virFileOperation */
4405
                   virReportSystemError(-rc,
4406 4407 4408 4409
                                        _("Failed to create domain save file '%s'"),
                                        path);
                   goto endjob;
                   break;
4410 4411 4412

            }

4413
            /* Retry creating the file as driver->user */
4414

4415 4416 4417 4418
            if ((rc = virFileOperation(path, O_CREAT|O_TRUNC|O_WRONLY,
                                       S_IRUSR|S_IWUSR|S_IRGRP|S_IWGRP,
                                       driver->user, driver->group,
                                       qemudDomainSaveFileOpHook, &hdata,
4419 4420
                                       VIR_FILE_OP_AS_UID)) < 0) {
                virReportSystemError(-rc, _("Error from child process creating '%s'"),
4421
                                 path);
4422 4423
                goto endjob;
            }
4424

4425 4426 4427
            /* Since we had to setuid to create the file, and the fstype
               is NFS, we assume it's a root-squashing NFS share, and that
               the security driver stuff would have failed anyway */
4428

4429 4430
            bypassSecurityDriver = 1;
        }
4431
    }
4432

4433

4434 4435 4436 4437 4438 4439 4440 4441 4442 4443 4444 4445 4446 4447 4448 4449 4450
    if (!is_reg &&
        qemuCgroupControllerActive(driver, VIR_CGROUP_CONTROLLER_DEVICES)) {
        if (virCgroupForDomain(driver->cgroup, vm->def->name, &cgroup, 0) != 0) {
            qemuReportError(VIR_ERR_INTERNAL_ERROR,
                            _("Unable to find cgroup for %s\n"),
                            vm->def->name);
            goto endjob;
        }
        rc = virCgroupAllowDevicePath(cgroup, path);
        if (rc != 0) {
            virReportSystemError(-rc,
                                 _("Unable to allow device %s for %s"),
                                 path, vm->def->name);
            goto endjob;
        }
    }

4451
    if ((!bypassSecurityDriver) &&
4452 4453
        virSecurityManagerSetSavedStateLabel(driver->securityManager,
                                             vm, path) < 0)
4454 4455
        goto endjob;

4456 4457
    if (header.compressed == QEMUD_SAVE_FORMAT_RAW) {
        const char *args[] = { "cat", NULL };
M
Matthias Bolte 已提交
4458
        qemuDomainObjEnterMonitorWithDriver(driver, vm);
4459 4460 4461
        rc = qemuMonitorMigrateToFile(priv->mon,
                                      QEMU_MONITOR_MIGRATE_BACKGROUND,
                                      args, path, offset);
M
Matthias Bolte 已提交
4462
        qemuDomainObjExitMonitorWithDriver(driver, vm);
4463
    } else {
4464
        const char *prog = qemudSaveCompressionTypeToString(header.compressed);
4465 4466 4467 4468 4469
        const char *args[] = {
            prog,
            "-c",
            NULL
        };
M
Matthias Bolte 已提交
4470
        qemuDomainObjEnterMonitorWithDriver(driver, vm);
4471 4472 4473
        rc = qemuMonitorMigrateToFile(priv->mon,
                                      QEMU_MONITOR_MIGRATE_BACKGROUND,
                                      args, path, offset);
M
Matthias Bolte 已提交
4474
        qemuDomainObjExitMonitorWithDriver(driver, vm);
4475 4476
    }

4477 4478 4479 4480 4481
    if (rc < 0)
        goto endjob;

    rc = qemuDomainWaitForMigrationComplete(driver, vm);

4482
    if (rc < 0)
4483
        goto endjob;
4484

4485
    if ((!bypassSecurityDriver) &&
4486 4487
        virSecurityManagerRestoreSavedStateLabel(driver->securityManager,
                                                 vm, path) < 0)
4488
        VIR_WARN("failed to restore save state label on %s", path);
4489

4490 4491
    if (cgroup != NULL) {
        rc = virCgroupDenyDevicePath(cgroup, path);
4492 4493 4494
        if (rc != 0)
            VIR_WARN("Unable to deny device %s for %s %d",
                     path, vm->def->name, rc);
4495 4496
    }

4497 4498
    ret = 0;

4499
    /* Shut it down */
4500
    qemudShutdownVMDaemon(driver, vm, 0);
4501
    qemuDomainStopAudit(vm, "saved");
4502 4503 4504
    event = virDomainEventNewFromObj(vm,
                                     VIR_DOMAIN_EVENT_STOPPED,
                                     VIR_DOMAIN_EVENT_STOPPED_SAVED);
4505
    if (!vm->persistent) {
4506 4507 4508
        if (qemuDomainObjEndJob(vm) > 0)
            virDomainRemoveInactive(&driver->domains,
                                    vm);
4509 4510
        vm = NULL;
    }
4511

4512
endjob:
4513
    if (vm) {
4514
        if (ret != 0) {
4515
            if (header.was_running && virDomainObjIsActive(vm)) {
H
Hu Tao 已提交
4516
                rc = doStartCPUs(driver, vm, dom->conn);
4517 4518 4519
                if (rc < 0)
                    VIR_WARN0("Unable to resume guest CPUs after save failure");
            }
4520

4521 4522 4523 4524 4525
            if (cgroup != NULL) {
                rc = virCgroupDenyDevicePath(cgroup, path);
                if (rc != 0)
                    VIR_WARN("Unable to deny device %s for %s: %d",
                             path, vm->def->name, rc);
4526
            }
4527 4528

            if ((!bypassSecurityDriver) &&
4529 4530
                virSecurityManagerRestoreSavedStateLabel(driver->securityManager,
                                                         vm, path) < 0)
4531
                VIR_WARN("failed to restore save state label on %s", path);
4532 4533
        }

4534
        if (qemuDomainObjEndJob(vm) == 0)
4535
            vm = NULL;
4536
    }
4537

4538 4539
cleanup:
    VIR_FREE(xml);
4540
    if (ret != 0 && is_reg)
4541
        unlink(path);
4542 4543
    if (event)
        qemuDomainEventQueue(driver, event);
4544
    virCgroupFree(&cgroup);
4545
    return ret;
D
Daniel P. Berrange 已提交
4546 4547
}

4548 4549 4550 4551 4552 4553 4554 4555 4556 4557 4558 4559 4560 4561 4562 4563
/* Returns true if a compression program is available in PATH */
static bool qemudCompressProgramAvailable(enum qemud_save_formats compress)
{
    const char *prog;
    char *c;

    if (compress == QEMUD_SAVE_FORMAT_RAW)
        return true;
    prog = qemudSaveCompressionTypeToString(compress);
    c = virFindFileInPath(prog);
    if (!c)
        return false;
    VIR_FREE(c);
    return true;
}

4564 4565 4566 4567
static int qemudDomainSave(virDomainPtr dom, const char *path)
{
    struct qemud_driver *driver = dom->conn->privateData;
    int compressed;
4568 4569 4570 4571
    int ret = -1;
    virDomainObjPtr vm = NULL;

    qemuDriverLock(driver);
4572 4573 4574 4575 4576 4577 4578 4579 4580 4581 4582

    if (driver->saveImageFormat == NULL)
        compressed = QEMUD_SAVE_FORMAT_RAW;
    else {
        compressed = qemudSaveCompressionTypeFromString(driver->saveImageFormat);
        if (compressed < 0) {
            qemuReportError(VIR_ERR_OPERATION_FAILED,
                            "%s", _("Invalid save image format specified "
                                    "in configuration file"));
            return -1;
        }
4583 4584 4585 4586 4587 4588
        if (!qemudCompressProgramAvailable(compressed)) {
            qemuReportError(VIR_ERR_OPERATION_FAILED,
                            "%s", _("Compression program for image format "
                                    "in configuration file isn't available"));
            return -1;
        }
4589 4590
    }

4591 4592 4593 4594 4595 4596 4597 4598 4599 4600 4601 4602 4603 4604 4605 4606 4607
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
    if (!vm) {
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
        goto cleanup;
    }

    ret = qemudDomainSaveFlag(driver, dom, vm, path, compressed);

cleanup:
    if (vm)
        virDomainObjUnlock(vm);
    qemuDriverUnlock(driver);

    return ret;
4608 4609 4610 4611 4612 4613 4614 4615 4616 4617 4618 4619 4620 4621 4622 4623 4624 4625 4626 4627 4628 4629 4630
}

static char *
qemuDomainManagedSavePath(struct qemud_driver *driver, virDomainObjPtr vm) {
    char *ret;

    if (virAsprintf(&ret, "%s/%s.save", driver->saveDir, vm->def->name) < 0) {
        virReportOOMError();
        return(NULL);
    }

    return(ret);
}

static int
qemuDomainManagedSave(virDomainPtr dom, unsigned int flags)
{
    struct qemud_driver *driver = dom->conn->privateData;
    virDomainObjPtr vm = NULL;
    char *name = NULL;
    int ret = -1;
    int compressed;

4631
    virCheckFlags(0, -1);
4632 4633 4634 4635 4636 4637 4638 4639

    qemuDriverLock(driver);
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
    if (!vm) {
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
4640
        goto cleanup;
4641 4642
    }

4643 4644 4645 4646 4647 4648
    if (!virDomainObjIsActive(vm)) {
        qemuReportError(VIR_ERR_OPERATION_INVALID,
                        "%s", _("domain is not running"));
        goto cleanup;
    }

4649 4650
    name = qemuDomainManagedSavePath(driver, vm);
    if (name == NULL)
4651
        goto cleanup;
4652 4653 4654 4655

    VIR_DEBUG("Saving state to %s", name);

    compressed = QEMUD_SAVE_FORMAT_RAW;
4656
    ret = qemudDomainSaveFlag(driver, dom, vm, name, compressed);
4657 4658 4659 4660 4661

cleanup:
    if (vm)
        virDomainObjUnlock(vm);
    qemuDriverUnlock(driver);
4662 4663 4664
    VIR_FREE(name);

    return ret;
4665 4666 4667 4668 4669 4670 4671 4672 4673 4674
}

static int
qemuDomainHasManagedSaveImage(virDomainPtr dom, unsigned int flags)
{
    struct qemud_driver *driver = dom->conn->privateData;
    virDomainObjPtr vm = NULL;
    int ret = -1;
    char *name = NULL;

4675
    virCheckFlags(0, -1);
4676 4677 4678 4679 4680 4681 4682 4683 4684 4685 4686 4687 4688 4689 4690 4691 4692 4693 4694 4695 4696 4697 4698 4699 4700 4701 4702 4703 4704 4705 4706 4707 4708

    qemuDriverLock(driver);
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
    if (!vm) {
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
        goto cleanup;
    }

    name = qemuDomainManagedSavePath(driver, vm);
    if (name == NULL)
        goto cleanup;

    ret = virFileExists(name);

cleanup:
    VIR_FREE(name);
    if (vm)
        virDomainObjUnlock(vm);
    qemuDriverUnlock(driver);
    return ret;
}

static int
qemuDomainManagedSaveRemove(virDomainPtr dom, unsigned int flags)
{
    struct qemud_driver *driver = dom->conn->privateData;
    virDomainObjPtr vm = NULL;
    int ret = -1;
    char *name = NULL;

4709
    virCheckFlags(0, -1);
4710 4711 4712 4713 4714 4715 4716 4717 4718 4719 4720 4721 4722 4723 4724 4725 4726 4727 4728 4729 4730 4731 4732 4733

    qemuDriverLock(driver);
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
    if (!vm) {
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
        goto cleanup;
    }

    name = qemuDomainManagedSavePath(driver, vm);
    if (name == NULL)
        goto cleanup;

    ret = unlink(name);

cleanup:
    VIR_FREE(name);
    if (vm)
        virDomainObjUnlock(vm);
    qemuDriverUnlock(driver);
    return ret;
}
D
Daniel P. Berrange 已提交
4734

H
Hu Tao 已提交
4735 4736 4737 4738 4739 4740 4741 4742 4743 4744 4745 4746 4747 4748 4749 4750 4751 4752 4753 4754 4755 4756 4757 4758 4759
static int doCoreDump(struct qemud_driver *driver,
                      virDomainObjPtr vm,
                      const char *path,
                      enum qemud_save_formats compress)
{
    int fd = -1;
    int ret = -1;
    qemuDomainObjPrivatePtr priv;

    priv = vm->privateData;

    /* Create an empty file with appropriate ownership.  */
    if ((fd = open(path, O_CREAT|O_TRUNC|O_WRONLY, S_IRUSR|S_IWUSR)) < 0) {
        qemuReportError(VIR_ERR_OPERATION_FAILED,
                        _("failed to create '%s'"), path);
        goto cleanup;
    }

    if (VIR_CLOSE(fd) < 0) {
        virReportSystemError(errno,
                             _("unable to save file %s"),
                             path);
        goto cleanup;
    }

4760 4761
    if (virSecurityManagerSetSavedStateLabel(driver->securityManager,
                                             vm, path) < 0)
H
Hu Tao 已提交
4762 4763 4764 4765 4766 4767 4768 4769 4770 4771 4772 4773 4774 4775 4776 4777 4778 4779 4780 4781 4782 4783 4784 4785 4786 4787 4788 4789 4790 4791 4792
        goto cleanup;

    qemuDomainObjEnterMonitorWithDriver(driver, vm);
    if (compress == QEMUD_SAVE_FORMAT_RAW) {
        const char *args[] = {
            "cat",
            NULL,
        };
        ret = qemuMonitorMigrateToFile(priv->mon,
                                       QEMU_MONITOR_MIGRATE_BACKGROUND,
                                       args, path, 0);
    } else {
        const char *prog = qemudSaveCompressionTypeToString(compress);
        const char *args[] = {
            prog,
            "-c",
            NULL,
        };
        ret = qemuMonitorMigrateToFile(priv->mon,
                                       QEMU_MONITOR_MIGRATE_BACKGROUND,
                                       args, path, 0);
    }
    qemuDomainObjExitMonitorWithDriver(driver, vm);
    if (ret < 0)
        goto cleanup;

    ret = qemuDomainWaitForMigrationComplete(driver, vm);

    if (ret < 0)
        goto cleanup;

4793 4794
    if (virSecurityManagerRestoreSavedStateLabel(driver->securityManager,
                                                 vm, path) < 0)
H
Hu Tao 已提交
4795 4796 4797 4798 4799 4800 4801 4802
        goto cleanup;

cleanup:
    if (ret != 0)
        unlink(path);
    return ret;
}

4803 4804 4805 4806 4807
static enum qemud_save_formats
getCompressionType(struct qemud_driver *driver)
{
    int compress = QEMUD_SAVE_FORMAT_RAW;

4808 4809 4810 4811 4812 4813 4814
    /*
     * We reuse "save" flag for "dump" here. Then, we can support the same
     * format in "save" and "dump".
     */
    if (driver->dumpImageFormat) {
        compress = qemudSaveCompressionTypeFromString(driver->dumpImageFormat);
        if (compress < 0) {
4815 4816 4817 4818
            qemuReportError(VIR_ERR_OPERATION_FAILED, "%s",
                            _("Invalid dump image format specified in "
                              "configuration file, using raw"));
            return QEMUD_SAVE_FORMAT_RAW;
4819
        }
4820 4821 4822
        if (!qemudCompressProgramAvailable(compress)) {
            qemuReportError(VIR_ERR_OPERATION_FAILED,
                            "%s", _("Compression program for dump image format "
4823 4824 4825
                                    "in configuration file isn't available, "
                                    "using raw"));
            return QEMUD_SAVE_FORMAT_RAW;
4826
        }
4827
    }
4828 4829 4830 4831 4832 4833 4834 4835 4836
    return compress;
}

static int qemudDomainCoreDump(virDomainPtr dom,
                               const char *path,
                               int flags ATTRIBUTE_UNUSED) {
    struct qemud_driver *driver = dom->conn->privateData;
    virDomainObjPtr vm;
    int resume = 0, paused = 0;
H
Hu Tao 已提交
4837
    int ret = -1;
4838 4839 4840
    virDomainEventPtr event = NULL;
    qemuDomainObjPrivatePtr priv;

P
Paolo Bonzini 已提交
4841 4842 4843 4844 4845 4846
    qemuDriverLock(driver);
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);

    if (!vm) {
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
4847 4848
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
P
Paolo Bonzini 已提交
4849 4850
        goto cleanup;
    }
4851
    priv = vm->privateData;
P
Paolo Bonzini 已提交
4852

4853
    if (qemuDomainObjBeginJobWithDriver(driver, vm) < 0)
4854 4855
        goto cleanup;

D
Daniel P. Berrange 已提交
4856
    if (!virDomainObjIsActive(vm)) {
4857 4858
        qemuReportError(VIR_ERR_OPERATION_INVALID,
                        "%s", _("domain is not running"));
4859
        goto endjob;
P
Paolo Bonzini 已提交
4860 4861
    }

O
Osier Yang 已提交
4862 4863
    priv->jobActive = QEMU_JOB_DUMP;

P
Paolo Bonzini 已提交
4864 4865
    /* Migrate will always stop the VM, so the resume condition is
       independent of whether the stop command is issued.  */
P
Paolo Bonzini 已提交
4866 4867 4868
    resume = (vm->state == VIR_DOMAIN_RUNNING);

    /* Pause domain for non-live dump */
P
Paolo Bonzini 已提交
4869
    if (!(flags & VIR_DUMP_LIVE) && vm->state == VIR_DOMAIN_RUNNING) {
H
Hu Tao 已提交
4870
        if (doStopCPUs(driver, vm) < 0)
4871
            goto endjob;
P
Paolo Bonzini 已提交
4872
        paused = 1;
4873 4874 4875 4876 4877 4878

        if (!virDomainObjIsActive(vm)) {
            qemuReportError(VIR_ERR_INTERNAL_ERROR, "%s",
                            _("guest unexpectedly quit"));
            goto endjob;
        }
P
Paolo Bonzini 已提交
4879 4880
    }

H
Hu Tao 已提交
4881
    ret = doCoreDump(driver, vm, path, getCompressionType(driver));
4882 4883 4884 4885
    if (ret < 0)
        goto endjob;

    paused = 1;
4886 4887

endjob:
4888
    if ((ret == 0) && (flags & VIR_DUMP_CRASH)) {
4889
        qemudShutdownVMDaemon(driver, vm, 0);
4890
        qemuDomainStopAudit(vm, "crashed");
4891 4892 4893 4894 4895
        event = virDomainEventNewFromObj(vm,
                                         VIR_DOMAIN_EVENT_STOPPED,
                                         VIR_DOMAIN_EVENT_STOPPED_CRASHED);
    }

P
Paolo Bonzini 已提交
4896 4897 4898
    /* Since the monitor is always attached to a pty for libvirt, it
       will support synchronous operations so we always get here after
       the migration is complete.  */
4899
    else if (resume && paused && virDomainObjIsActive(vm)) {
H
Hu Tao 已提交
4900
        if (doStartCPUs(driver, vm, dom->conn) < 0) {
4901
            if (virGetLastError() == NULL)
4902 4903
                qemuReportError(VIR_ERR_OPERATION_FAILED,
                                "%s", _("resuming after dump failed"));
P
Paolo Bonzini 已提交
4904 4905
        }
    }
4906

4907 4908
    if (qemuDomainObjEndJob(vm) == 0)
        vm = NULL;
4909
    else if ((ret == 0) && (flags & VIR_DUMP_CRASH) && !vm->persistent) {
4910 4911 4912 4913
        virDomainRemoveInactive(&driver->domains,
                                vm);
        vm = NULL;
    }
4914 4915

cleanup:
P
Paolo Bonzini 已提交
4916 4917
    if (vm)
        virDomainObjUnlock(vm);
4918 4919
    if (event)
        qemuDomainEventQueue(driver, event);
4920
    qemuDriverUnlock(driver);
P
Paolo Bonzini 已提交
4921 4922 4923
    return ret;
}

H
Hu Tao 已提交
4924 4925 4926 4927 4928 4929 4930 4931 4932 4933 4934 4935 4936 4937 4938 4939 4940 4941 4942 4943 4944 4945 4946 4947 4948 4949 4950 4951 4952 4953 4954 4955 4956 4957 4958 4959 4960
static void processWatchdogEvent(void *data, void *opaque)
{
    int ret;
    struct watchdogEvent *wdEvent = data;
    struct qemud_driver *driver = opaque;

    switch (wdEvent->action) {
    case VIR_DOMAIN_WATCHDOG_ACTION_DUMP:
        {
            char *dumpfile;
            int i;

            i = virAsprintf(&dumpfile, "%s/%s-%u",
                            driver->autoDumpPath,
                            wdEvent->vm->def->name,
                            (unsigned int)time(NULL));

            qemuDriverLock(driver);
            virDomainObjLock(wdEvent->vm);

            if (qemuDomainObjBeginJobWithDriver(driver, wdEvent->vm) < 0)
                break;

            if (!virDomainObjIsActive(wdEvent->vm)) {
                qemuReportError(VIR_ERR_OPERATION_INVALID,
                                "%s", _("domain is not running"));
                break;
            }

            ret = doCoreDump(driver,
                             wdEvent->vm,
                             dumpfile,
                             getCompressionType(driver));
            if (ret < 0)
                qemuReportError(VIR_ERR_OPERATION_FAILED,
                                "%s", _("Dump failed"));

H
Hu Tao 已提交
4961
            ret = doStartCPUs(driver, wdEvent->vm, NULL);
H
Hu Tao 已提交
4962 4963 4964 4965 4966 4967 4968 4969 4970 4971 4972 4973 4974 4975 4976 4977 4978

            if (ret < 0)
                qemuReportError(VIR_ERR_OPERATION_FAILED,
                                "%s", _("Resuming after dump failed"));

            if (qemuDomainObjEndJob(wdEvent->vm) > 0)
                virDomainObjUnlock(wdEvent->vm);

            qemuDriverUnlock(driver);

            VIR_FREE(dumpfile);
        }
        break;
    }

    VIR_FREE(wdEvent);
}
P
Paolo Bonzini 已提交
4979

4980 4981 4982 4983 4984 4985
static int qemudDomainHotplugVcpus(virDomainObjPtr vm, unsigned int nvcpus)
{
    qemuDomainObjPrivatePtr priv = vm->privateData;
    int i, rc;
    int ret = -1;

4986 4987
    qemuDomainObjEnterMonitor(vm);

4988 4989 4990 4991 4992 4993 4994 4995 4996 4997 4998 4999 5000 5001 5002 5003 5004 5005 5006 5007 5008 5009 5010 5011 5012 5013 5014 5015 5016 5017
    /* We need different branches here, because we want to offline
     * in reverse order to onlining, so any partial fail leaves us in a
     * reasonably sensible state */
    if (nvcpus > vm->def->vcpus) {
        for (i = vm->def->vcpus ; i < nvcpus ; i++) {
            /* Online new CPU */
            rc = qemuMonitorSetCPU(priv->mon, i, 1);
            if (rc == 0)
                goto unsupported;
            if (rc < 0)
                goto cleanup;

            vm->def->vcpus++;
        }
    } else {
        for (i = vm->def->vcpus - 1 ; i >= nvcpus ; i--) {
            /* Offline old CPU */
            rc = qemuMonitorSetCPU(priv->mon, i, 0);
            if (rc == 0)
                goto unsupported;
            if (rc < 0)
                goto cleanup;

            vm->def->vcpus--;
        }
    }

    ret = 0;

cleanup:
5018
    qemuDomainObjExitMonitor(vm);
5019 5020 5021 5022 5023 5024 5025 5026 5027
    return ret;

unsupported:
    qemuReportError(VIR_ERR_INTERNAL_ERROR, "%s",
                    _("cannot change vcpu count of this domain"));
    goto cleanup;
}


5028 5029 5030 5031
static int
qemudDomainSetVcpusFlags(virDomainPtr dom, unsigned int nvcpus,
                         unsigned int flags)
{
5032 5033
    struct qemud_driver *driver = dom->conn->privateData;
    virDomainObjPtr vm;
5034
    virDomainDefPtr persistentDef;
5035 5036
    const char * type;
    int max;
5037
    int ret = -1;
5038

5039 5040 5041 5042 5043 5044 5045 5046 5047 5048 5049 5050 5051 5052 5053 5054
    virCheckFlags(VIR_DOMAIN_VCPU_LIVE |
                  VIR_DOMAIN_VCPU_CONFIG |
                  VIR_DOMAIN_VCPU_MAXIMUM, -1);

    /* At least one of LIVE or CONFIG must be set.  MAXIMUM cannot be
     * mixed with LIVE.  */
    if ((flags & (VIR_DOMAIN_VCPU_LIVE | VIR_DOMAIN_VCPU_CONFIG)) == 0 ||
        (flags & (VIR_DOMAIN_VCPU_MAXIMUM | VIR_DOMAIN_VCPU_LIVE)) ==
         (VIR_DOMAIN_VCPU_MAXIMUM | VIR_DOMAIN_VCPU_LIVE)) {
        qemuReportError(VIR_ERR_INVALID_ARG,
                        _("invalid flag combination: (0x%x)"), flags);
        return -1;
    }
    if (!nvcpus || (unsigned short) nvcpus != nvcpus) {
        qemuReportError(VIR_ERR_INVALID_ARG,
                        _("argument out of range: %d"), nvcpus);
5055 5056 5057
        return -1;
    }

5058
    qemuDriverLock(driver);
5059
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
5060 5061
    qemuDriverUnlock(driver);

5062
    if (!vm) {
5063 5064
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
5065 5066
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
5067
        goto cleanup;
5068 5069
    }

5070 5071 5072
    if (qemuDomainObjBeginJob(vm) < 0)
        goto cleanup;

5073
    if (!virDomainObjIsActive(vm) && (flags & VIR_DOMAIN_VCPU_LIVE)) {
5074 5075
        qemuReportError(VIR_ERR_OPERATION_INVALID,
                         "%s", _("domain is not running"));
5076
        goto endjob;
5077 5078
    }

5079 5080 5081 5082 5083 5084
    if (!vm->persistent && (flags & VIR_DOMAIN_VCPU_CONFIG)) {
        qemuReportError(VIR_ERR_OPERATION_INVALID, "%s",
                        _("cannot change persistent config of a transient domain"));
        goto endjob;
    }

5085 5086 5087 5088 5089 5090 5091 5092 5093 5094 5095 5096 5097
    if (!(type = virDomainVirtTypeToString(vm->def->virtType))) {
        qemuReportError(VIR_ERR_INTERNAL_ERROR,
                        _("unknown virt type in domain definition '%d'"),
                        vm->def->virtType);
        goto endjob;
    }

    if ((max = qemudGetMaxVCPUs(NULL, type)) < 0) {
        qemuReportError(VIR_ERR_INTERNAL_ERROR, "%s",
                        _("could not determine max vcpus for the domain"));
        goto endjob;
    }

C
Cole Robinson 已提交
5098
    if (!(flags & VIR_DOMAIN_VCPU_MAXIMUM) && vm->def->maxvcpus < max) {
5099 5100 5101
        max = vm->def->maxvcpus;
    }

5102 5103 5104 5105 5106 5107 5108
    if (nvcpus > max) {
        qemuReportError(VIR_ERR_INVALID_ARG,
                        _("requested vcpus is greater than max allowable"
                          " vcpus for the domain: %d > %d"), nvcpus, max);
        goto endjob;
    }

5109 5110 5111
    if (!(persistentDef = virDomainObjGetPersistentDef(driver->caps, vm)))
        goto endjob;

5112 5113
    switch (flags) {
    case VIR_DOMAIN_VCPU_MAXIMUM | VIR_DOMAIN_VCPU_CONFIG:
5114 5115 5116
        persistentDef->maxvcpus = nvcpus;
        if (nvcpus < persistentDef->vcpus)
            persistentDef->vcpus = nvcpus;
5117 5118 5119 5120
        ret = 0;
        break;

    case VIR_DOMAIN_VCPU_CONFIG:
5121
        persistentDef->vcpus = nvcpus;
5122 5123 5124 5125 5126 5127 5128 5129 5130
        ret = 0;
        break;

    case VIR_DOMAIN_VCPU_LIVE:
        ret = qemudDomainHotplugVcpus(vm, nvcpus);
        break;

    case VIR_DOMAIN_VCPU_LIVE | VIR_DOMAIN_VCPU_CONFIG:
        ret = qemudDomainHotplugVcpus(vm, nvcpus);
5131 5132 5133
        if (ret == 0) {
            persistentDef->vcpus = nvcpus;
        }
5134 5135
        break;
    }
5136

5137 5138 5139 5140
    /* Save the persistent config to disk */
    if (flags & VIR_DOMAIN_VCPU_CONFIG)
        ret = virDomainSaveConfig(driver->configDir, persistentDef);

5141 5142 5143
endjob:
    if (qemuDomainObjEndJob(vm) == 0)
        vm = NULL;
5144

5145
cleanup:
5146 5147
    if (vm)
        virDomainObjUnlock(vm);
5148
    return ret;
5149 5150
}

5151 5152 5153 5154 5155 5156
static int
qemudDomainSetVcpus(virDomainPtr dom, unsigned int nvcpus)
{
    return qemudDomainSetVcpusFlags(dom, nvcpus, VIR_DOMAIN_VCPU_LIVE);
}

5157 5158 5159 5160 5161 5162

static int
qemudDomainPinVcpu(virDomainPtr dom,
                   unsigned int vcpu,
                   unsigned char *cpumap,
                   int maplen) {
5163 5164
    struct qemud_driver *driver = dom->conn->privateData;
    virDomainObjPtr vm;
5165
    int maxcpu, hostcpus;
5166
    virNodeInfo nodeinfo;
5167
    int ret = -1;
5168
    qemuDomainObjPrivatePtr priv;
5169

5170
    qemuDriverLock(driver);
5171
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
5172 5173
    qemuDriverUnlock(driver);

5174 5175 5176
    if (!vm) {
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
5177 5178
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
5179 5180 5181
        goto cleanup;
    }

D
Daniel P. Berrange 已提交
5182
    if (!virDomainObjIsActive(vm)) {
5183 5184
        qemuReportError(VIR_ERR_OPERATION_INVALID,
                        "%s",_("cannot pin vcpus on an inactive domain"));
5185
        goto cleanup;
5186 5187
    }

5188 5189 5190
    priv = vm->privateData;

    if (vcpu > (priv->nvcpupids-1)) {
5191 5192 5193
        qemuReportError(VIR_ERR_INVALID_ARG,
                        _("vcpu number out of range %d > %d"),
                        vcpu, priv->nvcpupids);
5194
        goto cleanup;
5195 5196
    }

5197
    if (nodeGetInfo(dom->conn, &nodeinfo) < 0)
5198
        goto cleanup;
5199

5200
    hostcpus = VIR_NODEINFO_MAXCPUS(nodeinfo);
5201
    maxcpu = maplen * 8;
5202 5203
    if (maxcpu > hostcpus)
        maxcpu = hostcpus;
5204

5205 5206
    if (priv->vcpupids != NULL) {
        if (virProcessInfoSetAffinity(priv->vcpupids[vcpu],
5207
                                      cpumap, maplen, maxcpu) < 0)
5208
            goto cleanup;
5209
    } else {
5210 5211
        qemuReportError(VIR_ERR_NO_SUPPORT,
                        "%s", _("cpu affinity is not supported"));
5212
        goto cleanup;
5213
    }
5214
    ret = 0;
5215

5216
cleanup:
5217 5218
    if (vm)
        virDomainObjUnlock(vm);
5219
    return ret;
5220 5221 5222 5223 5224 5225 5226 5227
}

static int
qemudDomainGetVcpus(virDomainPtr dom,
                    virVcpuInfoPtr info,
                    int maxinfo,
                    unsigned char *cpumaps,
                    int maplen) {
5228 5229
    struct qemud_driver *driver = dom->conn->privateData;
    virDomainObjPtr vm;
5230
    virNodeInfo nodeinfo;
5231
    int i, v, maxcpu, hostcpus;
5232
    int ret = -1;
5233
    qemuDomainObjPrivatePtr priv;
5234

5235
    qemuDriverLock(driver);
5236
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
5237 5238
    qemuDriverUnlock(driver);

5239 5240 5241
    if (!vm) {
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
5242 5243
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
5244 5245 5246
        goto cleanup;
    }

D
Daniel P. Berrange 已提交
5247
    if (!virDomainObjIsActive(vm)) {
5248 5249 5250
        qemuReportError(VIR_ERR_OPERATION_INVALID,
                        "%s",
                        _("cannot list vcpu pinning for an inactive domain"));
5251
        goto cleanup;
5252 5253
    }

5254 5255
    priv = vm->privateData;

5256
    if (nodeGetInfo(dom->conn, &nodeinfo) < 0)
5257
        goto cleanup;
5258

5259
    hostcpus = VIR_NODEINFO_MAXCPUS(nodeinfo);
5260
    maxcpu = maplen * 8;
5261 5262
    if (maxcpu > hostcpus)
        maxcpu = hostcpus;
5263 5264

    /* Clamp to actual number of vcpus */
5265 5266
    if (maxinfo > priv->nvcpupids)
        maxinfo = priv->nvcpupids;
5267

5268 5269 5270 5271 5272 5273
    if (maxinfo >= 1) {
        if (info != NULL) {
            memset(info, 0, sizeof(*info) * maxinfo);
            for (i = 0 ; i < maxinfo ; i++) {
                info[i].number = i;
                info[i].state = VIR_VCPU_RUNNING;
5274

5275
                if (priv->vcpupids != NULL &&
5276 5277 5278
                    qemudGetProcessInfo(&(info[i].cpuTime),
                                        &(info[i].cpu),
                                        vm->pid,
5279
                                        priv->vcpupids[i]) < 0) {
5280
                    virReportSystemError(errno, "%s",
5281 5282 5283
                                         _("cannot get vCPU placement & pCPU time"));
                    goto cleanup;
                }
5284
            }
5285 5286
        }

5287 5288
        if (cpumaps != NULL) {
            memset(cpumaps, 0, maplen * maxinfo);
5289
            if (priv->vcpupids != NULL) {
5290 5291 5292
                for (v = 0 ; v < maxinfo ; v++) {
                    unsigned char *cpumap = VIR_GET_CPUMAP(cpumaps, maplen, v);

5293
                    if (virProcessInfoGetAffinity(priv->vcpupids[v],
5294
                                                  cpumap, maplen, maxcpu) < 0)
5295
                        goto cleanup;
5296
                }
5297
            } else {
5298 5299
                qemuReportError(VIR_ERR_NO_SUPPORT,
                                "%s", _("cpu affinity is not available"));
5300
                goto cleanup;
5301 5302 5303
            }
        }
    }
5304
    ret = maxinfo;
5305

5306
cleanup:
5307 5308
    if (vm)
        virDomainObjUnlock(vm);
5309
    return ret;
5310 5311 5312
}


5313 5314 5315
static int
qemudDomainGetVcpusFlags(virDomainPtr dom, unsigned int flags)
{
5316 5317
    struct qemud_driver *driver = dom->conn->privateData;
    virDomainObjPtr vm;
5318
    virDomainDefPtr def;
5319
    int ret = -1;
5320

5321 5322 5323 5324 5325 5326 5327 5328
    virCheckFlags(VIR_DOMAIN_VCPU_LIVE |
                  VIR_DOMAIN_VCPU_CONFIG |
                  VIR_DOMAIN_VCPU_MAXIMUM, -1);

    /* Exactly one of LIVE or CONFIG must be set.  */
    if (!(flags & VIR_DOMAIN_VCPU_LIVE) == !(flags & VIR_DOMAIN_VCPU_CONFIG)) {
        qemuReportError(VIR_ERR_INVALID_ARG,
                        _("invalid flag combination: (0x%x)"), flags);
5329 5330 5331
        return -1;
    }

5332
    qemuDriverLock(driver);
5333
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
5334 5335
    qemuDriverUnlock(driver);

5336
    if (!vm) {
5337 5338
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
5339 5340
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
5341
        goto cleanup;
5342 5343
    }

5344 5345 5346 5347 5348 5349 5350 5351 5352
    if (flags & VIR_DOMAIN_VCPU_LIVE) {
        if (!virDomainObjIsActive(vm)) {
            qemuReportError(VIR_ERR_OPERATION_INVALID, "%s",
                            _("domain not active"));
            goto cleanup;
        }
        def = vm->def;
    } else {
        def = vm->newDef ? vm->newDef : vm->def;
5353 5354
    }

5355
    ret = (flags & VIR_DOMAIN_VCPU_MAXIMUM) ? def->maxvcpus : def->vcpus;
5356

5357
cleanup:
5358 5359
    if (vm)
        virDomainObjUnlock(vm);
5360 5361 5362
    return ret;
}

5363 5364 5365 5366 5367 5368 5369
static int
qemudDomainGetMaxVcpus(virDomainPtr dom)
{
    return qemudDomainGetVcpusFlags(dom, (VIR_DOMAIN_VCPU_LIVE |
                                          VIR_DOMAIN_VCPU_MAXIMUM));
}

5370 5371 5372 5373 5374 5375 5376 5377 5378
static int qemudDomainGetSecurityLabel(virDomainPtr dom, virSecurityLabelPtr seclabel)
{
    struct qemud_driver *driver = (struct qemud_driver *)dom->conn->privateData;
    virDomainObjPtr vm;
    int ret = -1;

    qemuDriverLock(driver);
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);

5379 5380
    memset(seclabel, 0, sizeof(*seclabel));

5381 5382 5383
    if (!vm) {
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
5384 5385
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
5386 5387 5388
        goto cleanup;
    }

5389
    if (!virDomainVirtTypeToString(vm->def->virtType)) {
5390 5391 5392
        qemuReportError(VIR_ERR_INTERNAL_ERROR,
                        _("unknown virt type in domain definition '%d'"),
                        vm->def->virtType);
5393 5394 5395 5396 5397 5398 5399 5400 5401 5402 5403 5404 5405 5406 5407 5408 5409
        goto cleanup;
    }

    /*
     * Theoretically, the pid can be replaced during this operation and
     * return the label of a different process.  If atomicity is needed,
     * further validation will be required.
     *
     * Comment from Dan Berrange:
     *
     *   Well the PID as stored in the virDomainObjPtr can't be changed
     *   because you've got a locked object.  The OS level PID could have
     *   exited, though and in extreme circumstances have cycled through all
     *   PIDs back to ours. We could sanity check that our PID still exists
     *   after reading the label, by checking that our FD connecting to the
     *   QEMU monitor hasn't seen SIGHUP/ERR on poll().
     */
D
Daniel P. Berrange 已提交
5410
    if (virDomainObjIsActive(vm)) {
5411 5412
        if (virSecurityManagerGetProcessLabel(driver->securityManager,
                                              vm, seclabel) < 0) {
5413 5414 5415
            qemuReportError(VIR_ERR_INTERNAL_ERROR,
                            "%s", _("Failed to get security label"));
            goto cleanup;
5416 5417 5418 5419 5420 5421 5422 5423
        }
    }

    ret = 0;

cleanup:
    if (vm)
        virDomainObjUnlock(vm);
5424
    qemuDriverUnlock(driver);
5425 5426 5427
    return ret;
}

5428 5429
static int qemudNodeGetSecurityModel(virConnectPtr conn,
                                     virSecurityModelPtr secmodel)
5430 5431 5432
{
    struct qemud_driver *driver = (struct qemud_driver *)conn->privateData;
    char *p;
5433
    int ret = 0;
5434

5435
    qemuDriverLock(driver);
5436 5437 5438 5439 5440
    memset(secmodel, 0, sizeof(*secmodel));

    /* NULL indicates no driver, which we treat as
     * success, but simply return no data in *secmodel */
    if (driver->caps->host.secModel.model == NULL)
5441
        goto cleanup;
5442

5443 5444
    p = driver->caps->host.secModel.model;
    if (strlen(p) >= VIR_SECURITY_MODEL_BUFLEN-1) {
5445 5446 5447
        qemuReportError(VIR_ERR_INTERNAL_ERROR,
                        _("security model string exceeds max %d bytes"),
                        VIR_SECURITY_MODEL_BUFLEN-1);
5448 5449
        ret = -1;
        goto cleanup;
5450 5451 5452 5453 5454
    }
    strcpy(secmodel->model, p);

    p = driver->caps->host.secModel.doi;
    if (strlen(p) >= VIR_SECURITY_DOI_BUFLEN-1) {
5455 5456 5457
        qemuReportError(VIR_ERR_INTERNAL_ERROR,
                        _("security DOI string exceeds max %d bytes"),
                        VIR_SECURITY_DOI_BUFLEN-1);
5458 5459
        ret = -1;
        goto cleanup;
5460 5461
    }
    strcpy(secmodel->doi, p);
5462 5463 5464 5465

cleanup:
    qemuDriverUnlock(driver);
    return ret;
5466 5467
}

5468 5469 5470 5471 5472 5473
/* qemudOpenAsUID() - pipe/fork/setuid/open a file, and return the
   pipe fd to caller, so that it can read from the file. Also return
   the pid of the child process, so the caller can wait for it to exit
   after it's finished reading (to avoid a zombie, if nothing
   else). */

5474 5475 5476
static int
qemudOpenAsUID(const char *path, uid_t uid, gid_t gid, pid_t *child_pid)
{
5477 5478 5479 5480 5481 5482 5483 5484 5485 5486 5487 5488 5489 5490 5491 5492 5493 5494 5495 5496 5497 5498 5499 5500 5501 5502 5503
    int pipefd[2];
    int fd = -1;

    *child_pid = -1;

    if (pipe(pipefd) < 0) {
        virReportSystemError(errno,
                             _("failed to create pipe to read '%s'"),
                             path);
        pipefd[0] = pipefd[1] = -1;
        goto parent_cleanup;
    }

    int forkRet = virFork(child_pid);

    if (*child_pid < 0) {
        virReportSystemError(errno,
                             _("failed to fork child to read '%s'"),
                             path);
        goto parent_cleanup;
    }

    if (*child_pid > 0) {

        /* parent */

        /* parent doesn't need the write side of the pipe */
5504
        VIR_FORCE_CLOSE(pipefd[1]);
5505 5506 5507 5508 5509 5510 5511 5512 5513 5514 5515

        if (forkRet < 0) {
            virReportSystemError(errno,
                                 _("failed in parent after forking child to read '%s'"),
                                 path);
            goto parent_cleanup;
        }
        /* caller gets the read side of the pipe */
        fd = pipefd[0];
        pipefd[0] = -1;
parent_cleanup:
5516 5517
        VIR_FORCE_CLOSE(pipefd[0]);
        VIR_FORCE_CLOSE(pipefd[1]);
5518 5519 5520 5521 5522 5523 5524 5525 5526 5527 5528 5529 5530 5531 5532 5533 5534 5535 5536 5537 5538 5539 5540 5541
        if ((fd < 0) && (*child_pid > 0)) {
            /* a child process was started and subsequently an error
               occurred in the parent, so we need to wait for it to
               exit, but its status is inconsequential. */
            while ((waitpid(*child_pid, NULL, 0) == -1)
                   && (errno == EINTR)) {
                /* empty */
            }
            *child_pid = -1;
        }
        return fd;
    }

    /* child */

    /* setuid to the qemu user, then open the file, read it,
       and stuff it into the pipe for the parent process to
       read */
    int exit_code;
    char *buf = NULL;
    size_t bufsize = 1024 * 1024;
    int bytesread;

    /* child doesn't need the read side of the pipe */
5542
    VIR_FORCE_CLOSE(pipefd[0]);
5543 5544 5545 5546 5547 5548 5549 5550 5551

    if (forkRet < 0) {
        exit_code = errno;
        virReportSystemError(errno,
                             _("failed in child after forking to read '%s'"),
                             path);
        goto child_cleanup;
    }

5552 5553 5554
    if (virSetUIDGID(uid, gid) < 0) {
       exit_code = errno;
       goto child_cleanup;
5555 5556
    }

5557 5558 5559 5560 5561 5562 5563 5564
    if ((fd = open(path, O_RDONLY)) < 0) {
        exit_code = errno;
        virReportSystemError(errno,
                             _("cannot open '%s' as uid %d"),
                             path, uid);
        goto child_cleanup;
    }

5565 5566 5567 5568 5569 5570
    if (VIR_ALLOC_N(buf, bufsize) < 0) {
        exit_code = ENOMEM;
        virReportOOMError();
        goto child_cleanup;
    }

5571 5572 5573 5574 5575 5576 5577 5578 5579 5580 5581 5582 5583 5584 5585 5586 5587 5588 5589 5590
    /* read from fd and write to pipefd[1] until EOF */
    do {
        if ((bytesread = saferead(fd, buf, bufsize)) < 0) {
            exit_code = errno;
            virReportSystemError(errno,
                                 _("child failed reading from '%s'"),
                                 path);
            goto child_cleanup;
        }
        if (safewrite(pipefd[1], buf, bytesread) != bytesread) {
            exit_code = errno;
            virReportSystemError(errno, "%s",
                                 _("child failed writing to pipe"));
            goto child_cleanup;
        }
    } while (bytesread > 0);
    exit_code = 0;

child_cleanup:
    VIR_FREE(buf);
5591 5592
    VIR_FORCE_CLOSE(fd);
    VIR_FORCE_CLOSE(pipefd[1]);
5593 5594 5595
    _exit(exit_code);
}

J
Jiri Denemark 已提交
5596 5597 5598 5599
static int qemudDomainSaveImageClose(int fd, pid_t read_pid, int *status)
{
    int ret = 0;

5600 5601 5602 5603
    if (VIR_CLOSE(fd) < 0) {
        virReportSystemError(errno, "%s",
                             _("cannot close file"));
    }
J
Jiri Denemark 已提交
5604 5605 5606 5607 5608 5609 5610 5611 5612 5613 5614 5615 5616 5617 5618 5619

    if (read_pid != -1) {
        /* reap the process that read the file */
        while ((ret = waitpid(read_pid, status, 0)) == -1
               && errno == EINTR) {
            /* empty */
        }
    } else if (status) {
        *status = 0;
    }

    return ret;
}

static int ATTRIBUTE_NONNULL(3) ATTRIBUTE_NONNULL(4) ATTRIBUTE_NONNULL(5)
qemudDomainSaveImageOpen(struct qemud_driver *driver,
5620 5621 5622 5623
                         const char *path,
                         virDomainDefPtr *ret_def,
                         struct qemud_save_header *ret_header,
                         pid_t *ret_read_pid)
J
Jiri Denemark 已提交
5624 5625
{
    int fd;
5626
    pid_t read_pid = -1;
5627
    struct qemud_save_header header;
J
Jiri Denemark 已提交
5628 5629
    char *xml = NULL;
    virDomainDefPtr def = NULL;
5630 5631

    if ((fd = open(path, O_RDONLY)) < 0) {
5632 5633 5634
        if ((driver->user == 0) || (getuid() != 0)) {
            qemuReportError(VIR_ERR_OPERATION_FAILED,
                            "%s", _("cannot read domain image"));
J
Jiri Denemark 已提交
5635
            goto error;
5636 5637 5638 5639 5640 5641
        }

        /* Opening as root failed, but qemu runs as a different user
           that might have better luck. Create a pipe, then fork a
           child process to run as the qemu user, which will hopefully
           have the necessary authority to read the file. */
5642 5643
        if ((fd = qemudOpenAsUID(path,
                                 driver->user, driver->group, &read_pid)) < 0) {
5644
            /* error already reported */
J
Jiri Denemark 已提交
5645
            goto error;
5646
        }
5647 5648 5649
    }

    if (saferead(fd, &header, sizeof(header)) != sizeof(header)) {
5650 5651
        qemuReportError(VIR_ERR_OPERATION_FAILED,
                        "%s", _("failed to read qemu header"));
J
Jiri Denemark 已提交
5652
        goto error;
5653 5654 5655
    }

    if (memcmp(header.magic, QEMUD_SAVE_MAGIC, sizeof(header.magic)) != 0) {
5656 5657
        qemuReportError(VIR_ERR_OPERATION_FAILED,
                        "%s", _("image magic is incorrect"));
J
Jiri Denemark 已提交
5658
        goto error;
5659 5660 5661
    }

    if (header.version > QEMUD_SAVE_VERSION) {
5662 5663 5664
        qemuReportError(VIR_ERR_OPERATION_FAILED,
                        _("image version is not supported (%d > %d)"),
                        header.version, QEMUD_SAVE_VERSION);
J
Jiri Denemark 已提交
5665
        goto error;
5666 5667
    }

5668 5669 5670
    if (header.xml_len <= 0) {
        qemuReportError(VIR_ERR_OPERATION_FAILED,
                        _("invalid XML length: %d"), header.xml_len);
J
Jiri Denemark 已提交
5671
        goto error;
5672 5673
    }

5674 5675
    if (VIR_ALLOC_N(xml, header.xml_len) < 0) {
        virReportOOMError();
J
Jiri Denemark 已提交
5676
        goto error;
5677 5678 5679
    }

    if (saferead(fd, xml, header.xml_len) != header.xml_len) {
5680 5681
        qemuReportError(VIR_ERR_OPERATION_FAILED,
                        "%s", _("failed to read XML"));
J
Jiri Denemark 已提交
5682
        goto error;
5683 5684 5685
    }

    /* Create a domain from this XML */
5686
    if (!(def = virDomainDefParseString(driver->caps, xml,
5687
                                        VIR_DOMAIN_XML_INACTIVE))) {
5688 5689
        qemuReportError(VIR_ERR_OPERATION_FAILED,
                        "%s", _("failed to parse XML"));
J
Jiri Denemark 已提交
5690
        goto error;
5691 5692
    }

J
Jiri Denemark 已提交
5693
    VIR_FREE(xml);
5694

J
Jiri Denemark 已提交
5695 5696 5697
    *ret_def = def;
    *ret_header = header;
    *ret_read_pid = read_pid;
5698

J
Jiri Denemark 已提交
5699
    return fd;
5700

J
Jiri Denemark 已提交
5701 5702 5703 5704 5705 5706 5707 5708 5709 5710 5711 5712 5713 5714 5715 5716 5717 5718 5719 5720 5721 5722 5723 5724 5725 5726
error:
    virDomainDefFree(def);
    VIR_FREE(xml);
    qemudDomainSaveImageClose(fd, read_pid, NULL);

    return -1;
}

static int ATTRIBUTE_NONNULL(6)
qemudDomainSaveImageStartVM(virConnectPtr conn,
                            struct qemud_driver *driver,
                            virDomainObjPtr vm,
                            int fd,
                            pid_t read_pid,
                            const struct qemud_save_header *header,
                            const char *path)
{
    int ret = -1;
    virDomainEventPtr event;
    int intermediatefd = -1;
    pid_t intermediate_pid = -1;
    int childstat;
    int wait_ret;
    int status;

    if (header->version == 2) {
5727
        const char *intermediate_argv[3] = { NULL, "-dc", NULL };
J
Jiri Denemark 已提交
5728
        const char *prog = qemudSaveCompressionTypeToString(header->compressed);
5729
        if (prog == NULL) {
5730 5731
            qemuReportError(VIR_ERR_OPERATION_FAILED,
                            _("Invalid compressed save format %d"),
J
Jiri Denemark 已提交
5732 5733
                            header->compressed);
            goto out;
5734
        }
5735

J
Jiri Denemark 已提交
5736
        if (header->compressed != QEMUD_SAVE_FORMAT_RAW) {
5737
            intermediate_argv[0] = prog;
5738 5739
            intermediatefd = fd;
            fd = -1;
5740
            if (virExec(intermediate_argv, NULL, NULL,
5741
                        &intermediate_pid, intermediatefd, &fd, NULL, 0) < 0) {
5742 5743 5744
                qemuReportError(VIR_ERR_INTERNAL_ERROR,
                                _("Failed to start decompression binary %s"),
                                intermediate_argv[0]);
J
Jiri Denemark 已提交
5745
                goto out;
5746 5747 5748
            }
        }
    }
J
Jiri Denemark 已提交
5749

5750
    /* Set the migration source and start it up. */
5751 5752
    ret = qemudStartVMDaemon(conn, driver, vm, "stdio", true, fd, path,
                             VIR_VM_OP_RESTORE);
J
Jiri Denemark 已提交
5753

5754 5755 5756
    if (intermediate_pid != -1) {
        /* Wait for intermediate process to exit */
        while (waitpid(intermediate_pid, &childstat, 0) == -1 &&
J
Jiri Denemark 已提交
5757 5758 5759
               errno == EINTR) {
            /* empty */
        }
5760
    }
5761
    VIR_FORCE_CLOSE(intermediatefd);
J
Jiri Denemark 已提交
5762 5763

    wait_ret = qemudDomainSaveImageClose(fd, read_pid, &status);
5764
    fd = -1;
5765 5766 5767 5768 5769 5770 5771 5772 5773 5774 5775 5776 5777 5778 5779 5780 5781 5782 5783 5784 5785
    if (read_pid != -1) {
        if (wait_ret == -1) {
            virReportSystemError(errno,
                                 _("failed to wait for process reading '%s'"),
                                 path);
            ret = -1;
        } else if (!WIFEXITED(status)) {
            qemuReportError(VIR_ERR_OPERATION_FAILED,
                            _("child process exited abnormally reading '%s'"),
                            path);
            ret = -1;
        } else {
            int exit_status = WEXITSTATUS(status);
            if (exit_status != 0) {
                virReportSystemError(exit_status,
                                     _("child process returned error reading '%s'"),
                                     path);
                ret = -1;
            }
        }
    }
J
Jiri Denemark 已提交
5786

5787 5788
    if (ret < 0) {
        qemuDomainStartAudit(vm, "restored", false);
J
Jiri Denemark 已提交
5789
        goto out;
5790
    }
5791

5792 5793 5794
    event = virDomainEventNewFromObj(vm,
                                     VIR_DOMAIN_EVENT_STARTED,
                                     VIR_DOMAIN_EVENT_STARTED_RESTORED);
5795
    qemuDomainStartAudit(vm, "restored", true);
J
Jiri Denemark 已提交
5796 5797 5798
    if (event)
        qemuDomainEventQueue(driver, event);

5799

5800
    /* If it was running before, resume it now. */
J
Jiri Denemark 已提交
5801
    if (header->was_running) {
H
Hu Tao 已提交
5802
        if (doStartCPUs(driver, vm, conn) < 0) {
5803
            if (virGetLastError() == NULL)
5804 5805
                qemuReportError(VIR_ERR_OPERATION_FAILED,
                                "%s", _("failed to resume domain"));
J
Jiri Denemark 已提交
5806
            goto out;
5807
        }
5808 5809
        if (virDomainSaveStatus(driver->caps, driver->stateDir, vm) < 0) {
            VIR_WARN("Failed to save status on vm %s", vm->def->name);
J
Jiri Denemark 已提交
5810
            goto out;
5811
        }
5812
    }
J
Jiri Denemark 已提交
5813

5814
    ret = 0;
5815

J
Jiri Denemark 已提交
5816
out:
5817 5818
    if (virSecurityManagerRestoreSavedStateLabel(driver->securityManager,
                                                 vm, path) < 0)
5819 5820
        VIR_WARN("failed to restore save state label on %s", path);

J
Jiri Denemark 已提交
5821 5822 5823 5824 5825 5826 5827 5828 5829 5830 5831 5832 5833 5834 5835 5836 5837 5838 5839 5840 5841 5842 5843 5844 5845
    return ret;
}

static int qemudDomainRestore(virConnectPtr conn,
                              const char *path) {
    struct qemud_driver *driver = conn->privateData;
    virDomainDefPtr def = NULL;
    virDomainObjPtr vm = NULL;
    int fd = -1;
    pid_t read_pid = -1;
    int ret = -1;
    struct qemud_save_header header;

    qemuDriverLock(driver);

    fd = qemudDomainSaveImageOpen(driver, path, &def, &header, &read_pid);
    if (fd < 0)
        goto cleanup;

    if (virDomainObjIsDuplicate(&driver->domains, def, 1) < 0)
        goto cleanup;

    if (!(vm = virDomainAssignDef(driver->caps,
                                  &driver->domains,
                                  def, true))) {
5846
        /* virDomainAssignDef already set the error */
J
Jiri Denemark 已提交
5847 5848 5849 5850 5851 5852 5853 5854 5855 5856 5857
        goto cleanup;
    }
    def = NULL;

    if (qemuDomainObjBeginJobWithDriver(driver, vm) < 0)
        goto cleanup;

    ret = qemudDomainSaveImageStartVM(conn, driver, vm, fd,
                                      read_pid, &header, path);

    if (qemuDomainObjEndJob(vm) == 0)
5858
        vm = NULL;
J
Jiri Denemark 已提交
5859 5860 5861 5862
    else if (ret < 0 && !vm->persistent) {
        virDomainRemoveInactive(&driver->domains, vm);
        vm = NULL;
    }
5863

5864 5865
cleanup:
    virDomainDefFree(def);
J
Jiri Denemark 已提交
5866
    qemudDomainSaveImageClose(fd, read_pid, NULL);
5867 5868 5869
    if (vm)
        virDomainObjUnlock(vm);
    qemuDriverUnlock(driver);
5870
    return ret;
D
Daniel P. Berrange 已提交
5871 5872
}

J
Jiri Denemark 已提交
5873 5874 5875 5876 5877 5878 5879 5880 5881 5882 5883 5884 5885 5886 5887 5888 5889 5890 5891 5892 5893 5894 5895 5896 5897 5898 5899 5900 5901 5902 5903 5904 5905 5906 5907 5908 5909 5910 5911 5912 5913
static int qemudDomainObjRestore(virConnectPtr conn,
                                 struct qemud_driver *driver,
                                 virDomainObjPtr vm,
                                 const char *path)
{
    virDomainDefPtr def = NULL;
    int fd = -1;
    pid_t read_pid = -1;
    int ret = -1;
    struct qemud_save_header header;

    fd = qemudDomainSaveImageOpen(driver, path, &def, &header, &read_pid);
    if (fd < 0)
        goto cleanup;

    if (STRNEQ(vm->def->name, def->name) ||
        memcmp(vm->def->uuid, def->uuid, VIR_UUID_BUFLEN)) {
        char vm_uuidstr[VIR_UUID_STRING_BUFLEN];
        char def_uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(vm->def->uuid, vm_uuidstr);
        virUUIDFormat(def->uuid, def_uuidstr);
        qemuReportError(VIR_ERR_OPERATION_FAILED,
                        _("cannot restore domain '%s' uuid %s from a file"
                          " which belongs to domain '%s' uuid %s"),
                        vm->def->name, vm_uuidstr,
                        def->name, def_uuidstr);
        goto cleanup;
    }

    virDomainObjAssignDef(vm, def, true);
    def = NULL;

    ret = qemudDomainSaveImageStartVM(conn, driver, vm, fd,
                                      read_pid, &header, path);

cleanup:
    virDomainDefFree(def);
    qemudDomainSaveImageClose(fd, read_pid, NULL);
    return ret;
}

D
Daniel P. Berrange 已提交
5914

5915 5916 5917 5918 5919 5920 5921 5922 5923 5924 5925 5926 5927 5928 5929 5930 5931 5932 5933 5934 5935 5936 5937 5938 5939 5940 5941 5942 5943 5944 5945 5946 5947 5948 5949 5950 5951 5952
static char *qemudVMDumpXML(struct qemud_driver *driver,
                            virDomainObjPtr vm,
                            int flags)
{
    char *ret = NULL;
    virCPUDefPtr cpu = NULL;
    virDomainDefPtr def;
    virCPUDefPtr def_cpu;

    if ((flags & VIR_DOMAIN_XML_INACTIVE) && vm->newDef)
        def = vm->newDef;
    else
        def = vm->def;
    def_cpu = def->cpu;

    /* Update guest CPU requirements according to host CPU */
    if ((flags & VIR_DOMAIN_XML_UPDATE_CPU) && def_cpu && def_cpu->model) {
        if (!driver->caps || !driver->caps->host.cpu) {
            qemuReportError(VIR_ERR_OPERATION_FAILED,
                            "%s", _("cannot get host CPU capabilities"));
            goto cleanup;
        }

        if (!(cpu = virCPUDefCopy(def_cpu))
            || cpuUpdate(cpu, driver->caps->host.cpu))
            goto cleanup;
        def->cpu = cpu;
    }

    ret = virDomainDefFormat(def, flags);

cleanup:
    def->cpu = def_cpu;
    virCPUDefFree(cpu);
    return ret;
}


5953
static char *qemudDomainDumpXML(virDomainPtr dom,
5954
                                int flags) {
5955 5956 5957
    struct qemud_driver *driver = dom->conn->privateData;
    virDomainObjPtr vm;
    char *ret = NULL;
5958 5959
    unsigned long balloon;
    int err;
5960

5961
    qemuDriverLock(driver);
5962
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
5963

D
Daniel P. Berrange 已提交
5964
    if (!vm) {
5965 5966
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
5967 5968
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
5969
        goto cleanup;
D
Daniel P. Berrange 已提交
5970 5971
    }

5972 5973 5974 5975
    /* Refresh current memory based on balloon info if supported */
    if ((vm->def->memballoon != NULL) &&
        (vm->def->memballoon->model != VIR_DOMAIN_MEMBALLOON_MODEL_NONE) &&
        (virDomainObjIsActive(vm))) {
5976
        qemuDomainObjPrivatePtr priv = vm->privateData;
5977 5978 5979
        /* Don't delay if someone's using the monitor, just use
         * existing most recent data instead */
        if (!priv->jobActive) {
5980
            if (qemuDomainObjBeginJobWithDriver(driver, vm) < 0)
5981 5982
                goto cleanup;

5983
            qemuDomainObjEnterMonitorWithDriver(driver, vm);
5984
            err = qemuMonitorGetBalloonInfo(priv->mon, &balloon);
5985
            qemuDomainObjExitMonitorWithDriver(driver, vm);
5986 5987 5988 5989
            if (qemuDomainObjEndJob(vm) == 0) {
                vm = NULL;
                goto cleanup;
            }
5990 5991 5992
            if (err < 0)
                goto cleanup;
            if (err > 0)
5993
                vm->def->mem.cur_balloon = balloon;
5994 5995
            /* err == 0 indicates no balloon support, so ignore it */
        }
5996
    }
5997

5998
    ret = qemudVMDumpXML(driver, vm, flags);
5999 6000

cleanup:
6001 6002
    if (vm)
        virDomainObjUnlock(vm);
6003
    qemuDriverUnlock(driver);
6004
    return ret;
D
Daniel P. Berrange 已提交
6005 6006 6007
}


6008 6009 6010 6011
static char *qemuDomainXMLFromNative(virConnectPtr conn,
                                     const char *format,
                                     const char *config,
                                     unsigned int flags ATTRIBUTE_UNUSED) {
6012
    struct qemud_driver *driver = conn->privateData;
6013 6014 6015 6016
    virDomainDefPtr def = NULL;
    char *xml = NULL;

    if (STRNEQ(format, QEMU_CONFIG_FORMAT_ARGV)) {
6017 6018
        qemuReportError(VIR_ERR_INVALID_ARG,
                        _("unsupported config type %s"), format);
6019 6020 6021
        goto cleanup;
    }

6022
    qemuDriverLock(driver);
6023
    def = qemuParseCommandLineString(driver->caps, config);
6024
    qemuDriverUnlock(driver);
6025 6026 6027
    if (!def)
        goto cleanup;

6028
    xml = virDomainDefFormat(def, VIR_DOMAIN_XML_INACTIVE);
6029 6030 6031 6032 6033 6034

cleanup:
    virDomainDefFree(def);
    return xml;
}

6035 6036 6037 6038 6039 6040
static char *qemuDomainXMLToNative(virConnectPtr conn,
                                   const char *format,
                                   const char *xmlData,
                                   unsigned int flags ATTRIBUTE_UNUSED) {
    struct qemud_driver *driver = conn->privateData;
    virDomainDefPtr def = NULL;
6041
    virDomainChrSourceDef monConfig;
6042
    unsigned long long qemuCmdFlags;
E
Eric Blake 已提交
6043
    virCommandPtr cmd = NULL;
6044 6045 6046
    char *ret = NULL;
    int i;

6047 6048
    qemuDriverLock(driver);

6049
    if (STRNEQ(format, QEMU_CONFIG_FORMAT_ARGV)) {
6050 6051
        qemuReportError(VIR_ERR_INVALID_ARG,
                        _("unsupported config type %s"), format);
6052 6053 6054
        goto cleanup;
    }

6055
    def = virDomainDefParseString(driver->caps, xmlData, 0);
6056 6057 6058
    if (!def)
        goto cleanup;

6059 6060
    /* Since we're just exporting args, we can't do bridge/network/direct
     * setups, since libvirt will normally create TAP/macvtap devices
6061 6062 6063 6064 6065
     * directly. We convert those configs into generic 'ethernet'
     * config and assume the user has suitable 'ifup-qemu' scripts
     */
    for (i = 0 ; i < def->nnets ; i++) {
        virDomainNetDefPtr net = def->nets[i];
6066
        int bootIndex = net->bootIndex;
6067 6068
        if (net->type == VIR_DOMAIN_NET_TYPE_NETWORK ||
            net->type == VIR_DOMAIN_NET_TYPE_DIRECT) {
6069 6070 6071 6072 6073 6074 6075 6076 6077 6078 6079 6080 6081 6082 6083 6084 6085 6086 6087 6088
            VIR_FREE(net->data.network.name);

            memset(net, 0, sizeof *net);

            net->type = VIR_DOMAIN_NET_TYPE_ETHERNET;
            net->data.ethernet.dev = NULL;
            net->data.ethernet.script = NULL;
            net->data.ethernet.ipaddr = NULL;
        } else if (net->type == VIR_DOMAIN_NET_TYPE_BRIDGE) {
            char *brname = net->data.bridge.brname;
            char *script = net->data.bridge.script;
            char *ipaddr = net->data.bridge.ipaddr;

            memset(net, 0, sizeof *net);

            net->type = VIR_DOMAIN_NET_TYPE_ETHERNET;
            net->data.ethernet.dev = brname;
            net->data.ethernet.script = script;
            net->data.ethernet.ipaddr = ipaddr;
        }
6089
        net->bootIndex = bootIndex;
6090 6091 6092 6093
    }
    for (i = 0 ; i < def->ngraphics ; i++) {
        if (def->graphics[i]->type == VIR_DOMAIN_GRAPHICS_TYPE_VNC &&
            def->graphics[i]->data.vnc.autoport)
6094
            def->graphics[i]->data.vnc.port = QEMU_VNC_PORT_MIN;
6095 6096
    }

6097 6098 6099
    if (qemuCapsExtractVersionInfo(def->emulator,
                                   NULL,
                                   &qemuCmdFlags) < 0)
6100 6101
        goto cleanup;

6102
    if (qemuPrepareMonitorChr(driver, &monConfig, def->name) < 0)
6103
        goto cleanup;
6104

6105 6106
    if (!(cmd = qemuBuildCommandLine(conn, driver, def,
                                     &monConfig, false, qemuCmdFlags,
6107
                                     NULL, -1, NULL, VIR_VM_OP_NO_OP)))
6108 6109
        goto cleanup;

E
Eric Blake 已提交
6110
    ret = virCommandToString(cmd);
6111 6112

cleanup:
6113
    qemuDriverUnlock(driver);
6114

E
Eric Blake 已提交
6115
    virCommandFree(cmd);
6116 6117 6118 6119 6120
    virDomainDefFree(def);
    return ret;
}


6121
static int qemudListDefinedDomains(virConnectPtr conn,
6122
                            char **const names, int nnames) {
6123
    struct qemud_driver *driver = conn->privateData;
6124
    int n;
6125

6126
    qemuDriverLock(driver);
6127
    n = virDomainObjListGetInactiveNames(&driver->domains, names, nnames);
6128
    qemuDriverUnlock(driver);
6129
    return n;
D
Daniel P. Berrange 已提交
6130 6131
}

6132
static int qemudNumDefinedDomains(virConnectPtr conn) {
6133
    struct qemud_driver *driver = conn->privateData;
6134
    int n;
6135

6136
    qemuDriverLock(driver);
6137
    n = virDomainObjListNumOfDomains(&driver->domains, 0);
6138
    qemuDriverUnlock(driver);
6139

6140
    return n;
D
Daniel P. Berrange 已提交
6141 6142 6143
}


J
Jiri Denemark 已提交
6144 6145
static int qemudDomainObjStart(virConnectPtr conn,
                               struct qemud_driver *driver,
6146 6147
                               virDomainObjPtr vm,
                               bool start_paused)
J
Jiri Denemark 已提交
6148 6149 6150 6151 6152 6153 6154 6155 6156 6157 6158 6159 6160 6161 6162 6163 6164 6165 6166 6167
{
    int ret = -1;
    char *managed_save;

    /*
     * If there is a managed saved state restore it instead of starting
     * from scratch. In any case the old state is removed.
     */
    managed_save = qemuDomainManagedSavePath(driver, vm);
    if ((managed_save) && (virFileExists(managed_save))) {
        ret = qemudDomainObjRestore(conn, driver, vm, managed_save);

        if (unlink(managed_save) < 0) {
            VIR_WARN("Failed to remove the managed state %s", managed_save);
        }

        if (ret == 0)
            goto cleanup;
    }

6168 6169
    ret = qemudStartVMDaemon(conn, driver, vm, NULL, start_paused, -1, NULL,
                             VIR_VM_OP_CREATE);
6170 6171
    qemuDomainStartAudit(vm, "booted", ret >= 0);
    if (ret >= 0) {
J
Jiri Denemark 已提交
6172 6173 6174 6175 6176 6177 6178 6179 6180 6181 6182 6183 6184
        virDomainEventPtr event =
            virDomainEventNewFromObj(vm,
                                     VIR_DOMAIN_EVENT_STARTED,
                                     VIR_DOMAIN_EVENT_STARTED_BOOTED);
        if (event)
            qemuDomainEventQueue(driver, event);
    }

cleanup:
    VIR_FREE(managed_save);
    return ret;
}

6185 6186 6187
static int
qemudDomainStartWithFlags(virDomainPtr dom, unsigned int flags)
{
6188 6189 6190
    struct qemud_driver *driver = dom->conn->privateData;
    virDomainObjPtr vm;
    int ret = -1;
6191

6192
    virCheckFlags(VIR_DOMAIN_START_PAUSED, -1);
6193

6194
    qemuDriverLock(driver);
6195
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
6196

6197
    if (!vm) {
6198 6199
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
6200 6201
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
6202
        goto cleanup;
6203 6204
    }

6205 6206 6207 6208
    if (qemuDomainObjBeginJobWithDriver(driver, vm) < 0)
        goto cleanup;

    if (virDomainObjIsActive(vm)) {
6209 6210
        qemuReportError(VIR_ERR_OPERATION_INVALID,
                        "%s", _("domain is already running"));
6211 6212 6213
        goto endjob;
    }

6214 6215
    ret = qemudDomainObjStart(dom->conn, driver, vm,
                              (flags & VIR_DOMAIN_START_PAUSED) != 0);
6216

6217
endjob:
6218 6219
    if (qemuDomainObjEndJob(vm) == 0)
        vm = NULL;
6220

6221
cleanup:
6222 6223
    if (vm)
        virDomainObjUnlock(vm);
6224
    qemuDriverUnlock(driver);
6225
    return ret;
D
Daniel P. Berrange 已提交
6226 6227
}

6228 6229 6230 6231 6232 6233
static int
qemudDomainStart(virDomainPtr dom)
{
    return qemudDomainStartWithFlags(dom, 0);
}

6234 6235 6236 6237 6238 6239 6240 6241 6242 6243 6244 6245 6246 6247 6248
static int
qemudCanonicalizeMachineFromInfo(virDomainDefPtr def,
                                 virCapsGuestDomainInfoPtr info,
                                 char **canonical)
{
    int i;

    *canonical = NULL;

    for (i = 0; i < info->nmachines; i++) {
        virCapsGuestMachinePtr machine = info->machines[i];

        if (!machine->canonical)
            continue;

6249
        if (STRNEQ(def->os.machine, machine->name))
6250 6251 6252
            continue;

        if (!(*canonical = strdup(machine->canonical))) {
6253
            virReportOOMError();
6254 6255 6256 6257 6258 6259 6260 6261 6262
            return -1;
        }

        break;
    }

    return 0;
}

6263 6264 6265 6266 6267 6268
static int
qemudCanonicalizeMachineDirect(virDomainDefPtr def, char **canonical)
{
    virCapsGuestMachinePtr *machines = NULL;
    int i, nmachines = 0;

6269
    if (qemuCapsProbeMachineTypes(def->emulator, &machines, &nmachines) < 0)
6270 6271 6272 6273 6274 6275
        return -1;

    for (i = 0; i < nmachines; i++) {
        if (!machines[i]->canonical)
            continue;

6276
        if (STRNEQ(def->os.machine, machines[i]->name))
6277 6278 6279 6280 6281 6282 6283 6284 6285 6286 6287 6288
            continue;

        *canonical = machines[i]->canonical;
        machines[i]->canonical = NULL;
        break;
    }

    virCapabilitiesFreeMachines(machines, nmachines);

    return 0;
}

6289 6290
int
qemudCanonicalizeMachine(struct qemud_driver *driver, virDomainDefPtr def)
6291 6292 6293 6294 6295 6296
{
    char *canonical = NULL;
    int i;

    for (i = 0; i < driver->caps->nguests; i++) {
        virCapsGuestPtr guest = driver->caps->guests[i];
6297
        virCapsGuestDomainInfoPtr info;
6298 6299 6300
        int j;

        for (j = 0; j < guest->arch.ndomains; j++) {
6301
            info = &guest->arch.domains[j]->info;
6302

6303 6304 6305 6306 6307 6308 6309 6310 6311
            if (!info->emulator || !STREQ(info->emulator, def->emulator))
                continue;

            if (!info->nmachines)
                info = &guest->arch.defaultInfo;

            if (qemudCanonicalizeMachineFromInfo(def, info, &canonical) < 0)
                return -1;
            goto out;
6312 6313
        }

6314 6315 6316 6317
        info = &guest->arch.defaultInfo;

        if (info->emulator && STREQ(info->emulator, def->emulator)) {
            if (qemudCanonicalizeMachineFromInfo(def, info, &canonical) < 0)
6318 6319 6320 6321
                return -1;
            goto out;
        }
    }
6322 6323 6324 6325

    if (qemudCanonicalizeMachineDirect(def, &canonical) < 0)
        return -1;

6326 6327 6328 6329 6330 6331 6332
out:
    if (canonical) {
        VIR_FREE(def->os.machine);
        def->os.machine = canonical;
    }
    return 0;
}
D
Daniel P. Berrange 已提交
6333

6334
static virDomainPtr qemudDomainDefine(virConnectPtr conn, const char *xml) {
6335
    struct qemud_driver *driver = conn->privateData;
6336
    virDomainDefPtr def;
6337
    virDomainObjPtr vm = NULL;
6338
    virDomainPtr dom = NULL;
6339
    virDomainEventPtr event = NULL;
6340
    int dupVM;
6341

6342
    qemuDriverLock(driver);
6343
    if (!(def = virDomainDefParseString(driver->caps, xml,
6344
                                        VIR_DOMAIN_XML_INACTIVE)))
6345
        goto cleanup;
6346

6347
    if (virSecurityManagerVerify(driver->securityManager, def) < 0)
6348 6349
        goto cleanup;

6350 6351
    if ((dupVM = virDomainObjIsDuplicate(&driver->domains, def, 0)) < 0)
        goto cleanup;
6352

6353
    if (qemudCanonicalizeMachine(driver, def) < 0)
6354 6355
        goto cleanup;

6356 6357 6358
    if (qemuAssignPCIAddresses(def) < 0)
        goto cleanup;

6359
    if (!(vm = virDomainAssignDef(driver->caps,
6360
                                  &driver->domains,
6361
                                  def, false))) {
6362
        goto cleanup;
6363
    }
6364
    def = NULL;
6365
    vm->persistent = 1;
6366

6367
    if (virDomainSaveConfig(driver->configDir,
6368
                            vm->newDef ? vm->newDef : vm->def) < 0) {
6369 6370
        virDomainRemoveInactive(&driver->domains,
                                vm);
6371
        vm = NULL;
6372
        goto cleanup;
6373 6374
    }

6375 6376
    event = virDomainEventNewFromObj(vm,
                                     VIR_DOMAIN_EVENT_DEFINED,
6377
                                     !dupVM ?
6378 6379
                                     VIR_DOMAIN_EVENT_DEFINED_ADDED :
                                     VIR_DOMAIN_EVENT_DEFINED_UPDATED);
6380

6381
    dom = virGetDomain(conn, vm->def->name, vm->def->uuid);
6382
    if (dom) dom->id = vm->def->id;
6383 6384

cleanup:
6385
    virDomainDefFree(def);
6386 6387
    if (vm)
        virDomainObjUnlock(vm);
6388 6389
    if (event)
        qemuDomainEventQueue(driver, event);
6390
    qemuDriverUnlock(driver);
6391
    return dom;
D
Daniel P. Berrange 已提交
6392 6393
}

6394
static int qemudDomainUndefine(virDomainPtr dom) {
6395 6396
    struct qemud_driver *driver = dom->conn->privateData;
    virDomainObjPtr vm;
6397
    virDomainEventPtr event = NULL;
6398
    int ret = -1;
D
Daniel P. Berrange 已提交
6399

6400
    qemuDriverLock(driver);
6401
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
6402

D
Daniel P. Berrange 已提交
6403
    if (!vm) {
6404 6405
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
6406 6407
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
6408
        goto cleanup;
D
Daniel P. Berrange 已提交
6409 6410
    }

D
Daniel P. Berrange 已提交
6411
    if (virDomainObjIsActive(vm)) {
6412 6413
        qemuReportError(VIR_ERR_OPERATION_INVALID,
                        "%s", _("cannot delete active domain"));
6414
        goto cleanup;
D
Daniel P. Berrange 已提交
6415 6416
    }

6417
    if (!vm->persistent) {
6418
        qemuReportError(VIR_ERR_OPERATION_INVALID,
6419
                        "%s", _("cannot undefine transient domain"));
6420
        goto cleanup;
6421 6422
    }

6423
    if (virDomainDeleteConfig(driver->configDir, driver->autostartDir, vm) < 0)
6424
        goto cleanup;
D
Daniel P. Berrange 已提交
6425

6426 6427 6428
    event = virDomainEventNewFromObj(vm,
                                     VIR_DOMAIN_EVENT_UNDEFINED,
                                     VIR_DOMAIN_EVENT_UNDEFINED_REMOVED);
6429

6430 6431
    virDomainRemoveInactive(&driver->domains,
                            vm);
6432
    vm = NULL;
6433
    ret = 0;
D
Daniel P. Berrange 已提交
6434

6435
cleanup:
6436 6437
    if (vm)
        virDomainObjUnlock(vm);
6438 6439
    if (event)
        qemuDomainEventQueue(driver, event);
6440
    qemuDriverUnlock(driver);
6441
    return ret;
D
Daniel P. Berrange 已提交
6442 6443
}

6444

6445 6446
static int qemudDomainAttachDevice(virDomainPtr dom,
                                   const char *xml)
6447
{
6448 6449 6450 6451
    struct qemud_driver *driver = dom->conn->privateData;
    virDomainObjPtr vm;
    virDomainDeviceDefPtr dev = NULL;
    unsigned long long qemuCmdFlags;
6452
    virCgroupPtr cgroup = NULL;
6453
    int ret = -1;
6454

6455 6456 6457 6458 6459 6460 6461
    qemuDriverLock(driver);
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
    if (!vm) {
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
6462 6463 6464
        goto cleanup;
    }

6465 6466
    if (qemuDomainObjBeginJobWithDriver(driver, vm) < 0)
        goto cleanup;
6467

6468 6469 6470 6471 6472
    if (!virDomainObjIsActive(vm)) {
        qemuReportError(VIR_ERR_OPERATION_INVALID,
                        "%s", _("cannot attach device on inactive domain"));
        goto endjob;
    }
6473

6474 6475 6476 6477
    dev = virDomainDeviceDefParse(driver->caps, vm->def, xml,
                                  VIR_DOMAIN_XML_INACTIVE);
    if (dev == NULL)
        goto endjob;
6478

6479 6480 6481 6482
    if (qemuCapsExtractVersionInfo(vm->def->emulator,
                                   NULL,
                                   &qemuCmdFlags) < 0)
        goto endjob;
6483

6484 6485 6486 6487 6488 6489 6490 6491 6492 6493
    if (dev->type == VIR_DOMAIN_DEVICE_DISK) {
        if (qemuCgroupControllerActive(driver, VIR_CGROUP_CONTROLLER_DEVICES)) {
            if (virCgroupForDomain(driver->cgroup, vm->def->name, &cgroup, 0) !=0 ) {
                qemuReportError(VIR_ERR_INTERNAL_ERROR,
                                _("Unable to find cgroup for %s\n"),
                                vm->def->name);
                goto endjob;
            }
            if (qemuSetupDiskCgroup(driver, cgroup, dev->data.disk) < 0)
                goto endjob;
6494 6495
        }

6496 6497 6498 6499 6500 6501 6502 6503 6504 6505
        switch (dev->data.disk->device) {
        case VIR_DOMAIN_DISK_DEVICE_CDROM:
        case VIR_DOMAIN_DISK_DEVICE_FLOPPY:
            ret = qemuDomainChangeEjectableMedia(driver, vm,
                                                 dev->data.disk,
                                                 qemuCmdFlags,
                                                 false);
            if (ret == 0)
                dev->data.disk = NULL;
            break;
6506

6507 6508 6509 6510 6511 6512 6513 6514 6515 6516 6517 6518 6519 6520 6521 6522 6523 6524 6525 6526 6527 6528 6529
        case VIR_DOMAIN_DISK_DEVICE_DISK:
            if (dev->data.disk->bus == VIR_DOMAIN_DISK_BUS_USB) {
                ret = qemuDomainAttachUsbMassstorageDevice(driver, vm,
                                                           dev->data.disk, qemuCmdFlags);
                if (ret == 0)
                    dev->data.disk = NULL;
            } else if (dev->data.disk->bus == VIR_DOMAIN_DISK_BUS_VIRTIO) {
                ret = qemuDomainAttachPciDiskDevice(driver, vm,
                                                    dev->data.disk, qemuCmdFlags);
                if (ret == 0)
                    dev->data.disk = NULL;
            } else if (dev->data.disk->bus == VIR_DOMAIN_DISK_BUS_SCSI) {
                ret = qemuDomainAttachSCSIDisk(driver, vm,
                                               dev->data.disk, qemuCmdFlags);
                if (ret == 0)
                    dev->data.disk = NULL;
            } else {
                qemuReportError(VIR_ERR_CONFIG_UNSUPPORTED,
                                _("disk bus '%s' cannot be hotplugged."),
                                virDomainDiskBusTypeToString(dev->data.disk->bus));
                /* fallthrough */
            }
            break;
6530

6531 6532 6533 6534 6535
        default:
            qemuReportError(VIR_ERR_CONFIG_UNSUPPORTED,
                            _("disk device type '%s' cannot be hotplugged"),
                            virDomainDiskDeviceTypeToString(dev->data.disk->device));
            /* Fallthrough */
6536
        }
6537 6538 6539 6540
        if (ret != 0 && cgroup) {
            if (qemuTeardownDiskCgroup(driver, cgroup, dev->data.disk) < 0)
                VIR_WARN("Failed to teardown cgroup for disk path %s",
                         NULLSTR(dev->data.disk->src));
6541
        }
6542 6543 6544 6545 6546 6547 6548 6549 6550 6551 6552
    } else if (dev->type == VIR_DOMAIN_DEVICE_CONTROLLER) {
        if (dev->data.controller->type == VIR_DOMAIN_CONTROLLER_TYPE_SCSI) {
            ret = qemuDomainAttachPciControllerDevice(driver, vm,
                                                      dev->data.controller, qemuCmdFlags);
            if (ret == 0)
                dev->data.controller = NULL;
        } else {
            qemuReportError(VIR_ERR_CONFIG_UNSUPPORTED,
                            _("disk controller bus '%s' cannot be hotplugged."),
                            virDomainControllerTypeToString(dev->data.controller->type));
            /* fallthrough */
6553
        }
6554 6555 6556 6557 6558 6559 6560 6561 6562 6563
    } else if (dev->type == VIR_DOMAIN_DEVICE_NET) {
        ret = qemuDomainAttachNetDevice(dom->conn, driver, vm,
                                        dev->data.net, qemuCmdFlags);
        if (ret == 0)
            dev->data.net = NULL;
    } else if (dev->type == VIR_DOMAIN_DEVICE_HOSTDEV) {
        ret = qemuDomainAttachHostDevice(driver, vm,
                                         dev->data.hostdev, qemuCmdFlags);
        if (ret == 0)
            dev->data.hostdev = NULL;
6564
    } else {
6565 6566 6567 6568
        qemuReportError(VIR_ERR_CONFIG_UNSUPPORTED,
                        _("device type '%s' cannot be attached"),
                        virDomainDeviceTypeToString(dev->type));
        goto endjob;
6569 6570
    }

6571 6572 6573 6574 6575 6576 6577 6578 6579 6580 6581 6582 6583 6584 6585
    if (!ret && virDomainSaveStatus(driver->caps, driver->stateDir, vm) < 0)
        ret = -1;

endjob:
    if (qemuDomainObjEndJob(vm) == 0)
        vm = NULL;

cleanup:
    if (cgroup)
        virCgroupFree(&cgroup);

    virDomainDeviceDefFree(dev);
    if (vm)
        virDomainObjUnlock(vm);
    qemuDriverUnlock(driver);
6586 6587 6588
    return ret;
}

6589 6590 6591 6592 6593 6594 6595 6596
static int qemudDomainAttachDeviceFlags(virDomainPtr dom,
                                        const char *xml,
                                        unsigned int flags) {
    if (flags & VIR_DOMAIN_DEVICE_MODIFY_CONFIG) {
        qemuReportError(VIR_ERR_OPERATION_INVALID,
                        "%s", _("cannot modify the persistent configuration of a domain"));
        return -1;
    }
6597

6598 6599
    return qemudDomainAttachDevice(dom, xml);
}
6600

6601

6602 6603 6604 6605 6606 6607 6608 6609 6610 6611 6612
static int qemuDomainUpdateDeviceFlags(virDomainPtr dom,
                                       const char *xml,
                                       unsigned int flags)
{
    struct qemud_driver *driver = dom->conn->privateData;
    virDomainObjPtr vm;
    virDomainDeviceDefPtr dev = NULL;
    unsigned long long qemuCmdFlags;
    virCgroupPtr cgroup = NULL;
    int ret = -1;
    bool force = (flags & VIR_DOMAIN_DEVICE_MODIFY_FORCE) != 0;
6613

6614 6615 6616 6617
    virCheckFlags(VIR_DOMAIN_DEVICE_MODIFY_CURRENT |
                  VIR_DOMAIN_DEVICE_MODIFY_LIVE |
                  VIR_DOMAIN_DEVICE_MODIFY_CONFIG |
                  VIR_DOMAIN_DEVICE_MODIFY_FORCE, -1);
6618

6619 6620 6621
    if (flags & VIR_DOMAIN_DEVICE_MODIFY_CONFIG) {
        qemuReportError(VIR_ERR_OPERATION_INVALID,
                        "%s", _("cannot modify the persistent configuration of a domain"));
6622 6623 6624
        return -1;
    }

6625 6626 6627 6628 6629 6630 6631 6632
    qemuDriverLock(driver);
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
    if (!vm) {
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
        goto cleanup;
6633 6634
    }

6635 6636 6637 6638 6639 6640 6641
    if (qemuDomainObjBeginJobWithDriver(driver, vm) < 0)
        goto cleanup;

    if (!virDomainObjIsActive(vm)) {
        qemuReportError(VIR_ERR_OPERATION_INVALID,
                        "%s", _("cannot attach device on inactive domain"));
        goto endjob;
6642 6643
    }

6644 6645 6646 6647 6648 6649 6650 6651 6652
    dev = virDomainDeviceDefParse(driver->caps, vm->def, xml,
                                  VIR_DOMAIN_XML_INACTIVE);
    if (dev == NULL)
        goto endjob;

    if (qemuCapsExtractVersionInfo(vm->def->emulator,
                                   NULL,
                                   &qemuCmdFlags) < 0)
        goto endjob;
6653

6654 6655 6656 6657 6658 6659 6660 6661 6662 6663 6664
    switch (dev->type) {
    case VIR_DOMAIN_DEVICE_DISK:
        if (qemuCgroupControllerActive(driver, VIR_CGROUP_CONTROLLER_DEVICES)) {
            if (virCgroupForDomain(driver->cgroup, vm->def->name, &cgroup, 0) !=0 ) {
                qemuReportError(VIR_ERR_INTERNAL_ERROR,
                                _("Unable to find cgroup for %s\n"),
                                vm->def->name);
                goto endjob;
            }
            if (qemuSetupDiskCgroup(driver, cgroup, dev->data.disk) < 0)
                goto endjob;
6665 6666
        }

6667 6668 6669 6670 6671 6672 6673 6674 6675 6676
        switch (dev->data.disk->device) {
        case VIR_DOMAIN_DISK_DEVICE_CDROM:
        case VIR_DOMAIN_DISK_DEVICE_FLOPPY:
            ret = qemuDomainChangeEjectableMedia(driver, vm,
                                                 dev->data.disk,
                                                 qemuCmdFlags,
                                                 force);
            if (ret == 0)
                dev->data.disk = NULL;
            break;
6677

6678

6679 6680 6681 6682 6683 6684
        default:
            qemuReportError(VIR_ERR_CONFIG_UNSUPPORTED,
                            _("disk bus '%s' cannot be updated."),
                            virDomainDiskBusTypeToString(dev->data.disk->bus));
            break;
        }
6685

6686 6687 6688 6689 6690
        if (ret != 0 && cgroup) {
            if (qemuTeardownDiskCgroup(driver, cgroup, dev->data.disk) < 0)
                VIR_WARN("Failed to teardown cgroup for disk path %s",
                         NULLSTR(dev->data.disk->src));
        }
6691
        break;
6692 6693 6694

    case VIR_DOMAIN_DEVICE_GRAPHICS:
        ret = qemuDomainChangeGraphics(driver, vm, dev->data.graphics);
6695
        break;
6696

6697
    default:
6698
        qemuReportError(VIR_ERR_CONFIG_UNSUPPORTED,
6699 6700 6701
                        _("disk device type '%s' cannot be updated"),
                        virDomainDiskDeviceTypeToString(dev->data.disk->device));
        break;
6702 6703
    }

6704 6705 6706 6707 6708 6709 6710 6711 6712 6713
    if (!ret && virDomainSaveStatus(driver->caps, driver->stateDir, vm) < 0)
        ret = -1;

endjob:
    if (qemuDomainObjEndJob(vm) == 0)
        vm = NULL;

cleanup:
    if (cgroup)
        virCgroupFree(&cgroup);
6714

6715 6716 6717 6718
    virDomainDeviceDefFree(dev);
    if (vm)
        virDomainObjUnlock(vm);
    qemuDriverUnlock(driver);
6719 6720 6721
    return ret;
}

6722

6723 6724
static int qemudDomainDetachDevice(virDomainPtr dom,
                                   const char *xml) {
6725 6726
    struct qemud_driver *driver = dom->conn->privateData;
    virDomainObjPtr vm;
6727
    unsigned long long qemuCmdFlags;
6728 6729
    virDomainDeviceDefPtr dev = NULL;
    int ret = -1;
6730

6731
    qemuDriverLock(driver);
6732
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
6733
    if (!vm) {
6734 6735
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
6736 6737
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
6738
        goto cleanup;
6739 6740
    }

6741 6742 6743
    if (qemuDomainObjBeginJobWithDriver(driver, vm) < 0)
        goto cleanup;

D
Daniel P. Berrange 已提交
6744
    if (!virDomainObjIsActive(vm)) {
6745 6746
        qemuReportError(VIR_ERR_OPERATION_INVALID,
                        "%s", _("cannot detach device on inactive domain"));
6747
        goto endjob;
6748 6749
    }

6750
    dev = virDomainDeviceDefParse(driver->caps, vm->def, xml,
6751
                                  VIR_DOMAIN_XML_INACTIVE);
6752
    if (dev == NULL)
6753
        goto endjob;
6754

6755 6756 6757
    if (qemuCapsExtractVersionInfo(vm->def->emulator,
                                   NULL,
                                   &qemuCmdFlags) < 0)
6758
        goto endjob;
6759 6760

    if (dev->type == VIR_DOMAIN_DEVICE_DISK &&
6761 6762
        dev->data.disk->device == VIR_DOMAIN_DISK_DEVICE_DISK) {
        if (dev->data.disk->bus == VIR_DOMAIN_DISK_BUS_VIRTIO) {
6763
            ret = qemuDomainDetachPciDiskDevice(driver, vm, dev, qemuCmdFlags);
6764 6765
        }
        else if (dev->data.disk->bus == VIR_DOMAIN_DISK_BUS_SCSI) {
6766 6767
            ret = qemuDomainDetachSCSIDiskDevice(driver, vm, dev,
                                                 qemuCmdFlags);
6768 6769
        }
        else {
6770
            qemuReportError(VIR_ERR_CONFIG_UNSUPPORTED, "%s",
6771 6772
                            _("This type of disk cannot be hot unplugged"));
        }
6773
    } else if (dev->type == VIR_DOMAIN_DEVICE_NET) {
6774
        ret = qemuDomainDetachNetDevice(driver, vm, dev, qemuCmdFlags);
6775 6776
    } else if (dev->type == VIR_DOMAIN_DEVICE_CONTROLLER) {
        if (dev->data.controller->type == VIR_DOMAIN_CONTROLLER_TYPE_SCSI) {
6777 6778
            ret = qemuDomainDetachPciControllerDevice(driver, vm, dev,
                                                      qemuCmdFlags);
6779
        } else {
6780
            qemuReportError(VIR_ERR_CONFIG_UNSUPPORTED,
6781 6782
                            _("disk controller bus '%s' cannot be hotunplugged."),
                            virDomainControllerTypeToString(dev->data.controller->type));
6783 6784
            /* fallthrough */
        }
6785
    } else if (dev->type == VIR_DOMAIN_DEVICE_HOSTDEV) {
6786
        ret = qemuDomainDetachHostDevice(driver, vm, dev, qemuCmdFlags);
6787
    } else {
6788
        qemuReportError(VIR_ERR_CONFIG_UNSUPPORTED,
6789
                        "%s", _("This type of device cannot be hot unplugged"));
6790
    }
6791

6792
    if (!ret && virDomainSaveStatus(driver->caps, driver->stateDir, vm) < 0)
6793 6794
        ret = -1;

6795
endjob:
6796 6797
    if (qemuDomainObjEndJob(vm) == 0)
        vm = NULL;
6798

6799 6800
cleanup:
    virDomainDeviceDefFree(dev);
6801 6802
    if (vm)
        virDomainObjUnlock(vm);
6803
    qemuDriverUnlock(driver);
6804 6805 6806
    return ret;
}

6807 6808 6809 6810
static int qemudDomainDetachDeviceFlags(virDomainPtr dom,
                                        const char *xml,
                                        unsigned int flags) {
    if (flags & VIR_DOMAIN_DEVICE_MODIFY_CONFIG) {
6811 6812
        qemuReportError(VIR_ERR_OPERATION_INVALID,
                        "%s", _("cannot modify the persistent configuration of a domain"));
6813 6814 6815 6816 6817 6818
        return -1;
    }

    return qemudDomainDetachDevice(dom, xml);
}

6819
static int qemudDomainGetAutostart(virDomainPtr dom,
6820
                                   int *autostart) {
6821 6822 6823
    struct qemud_driver *driver = dom->conn->privateData;
    virDomainObjPtr vm;
    int ret = -1;
6824

6825
    qemuDriverLock(driver);
6826
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
6827 6828
    qemuDriverUnlock(driver);

6829
    if (!vm) {
6830 6831
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
6832 6833
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
6834
        goto cleanup;
6835 6836 6837
    }

    *autostart = vm->autostart;
6838
    ret = 0;
6839

6840
cleanup:
6841 6842
    if (vm)
        virDomainObjUnlock(vm);
6843
    return ret;
6844 6845
}

6846
static int qemudDomainSetAutostart(virDomainPtr dom,
6847
                                   int autostart) {
6848 6849
    struct qemud_driver *driver = dom->conn->privateData;
    virDomainObjPtr vm;
6850 6851
    char *configFile = NULL, *autostartLink = NULL;
    int ret = -1;
6852

6853
    qemuDriverLock(driver);
6854
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
6855

6856
    if (!vm) {
6857 6858
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
6859 6860
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
6861
        goto cleanup;
6862 6863
    }

6864
    if (!vm->persistent) {
6865
        qemuReportError(VIR_ERR_OPERATION_INVALID,
6866
                        "%s", _("cannot set autostart for transient domain"));
6867
        goto cleanup;
6868 6869
    }

6870 6871
    autostart = (autostart != 0);

6872
    if (vm->autostart != autostart) {
6873
        if ((configFile = virDomainConfigFile(driver->configDir, vm->def->name)) == NULL)
6874
            goto cleanup;
6875
        if ((autostartLink = virDomainConfigFile(driver->autostartDir, vm->def->name)) == NULL)
6876
            goto cleanup;
6877

6878 6879
        if (autostart) {
            int err;
6880

6881
            if ((err = virFileMakePath(driver->autostartDir))) {
6882
                virReportSystemError(err,
6883 6884
                                     _("cannot create autostart directory %s"),
                                     driver->autostartDir);
6885 6886
                goto cleanup;
            }
6887

6888
            if (symlink(configFile, autostartLink) < 0) {
6889
                virReportSystemError(errno,
6890 6891
                                     _("Failed to create symlink '%s to '%s'"),
                                     autostartLink, configFile);
6892 6893 6894 6895
                goto cleanup;
            }
        } else {
            if (unlink(autostartLink) < 0 && errno != ENOENT && errno != ENOTDIR) {
6896
                virReportSystemError(errno,
6897 6898
                                     _("Failed to delete symlink '%s'"),
                                     autostartLink);
6899 6900
                goto cleanup;
            }
6901 6902
        }

6903
        vm->autostart = autostart;
6904
    }
6905
    ret = 0;
6906

6907 6908 6909
cleanup:
    VIR_FREE(configFile);
    VIR_FREE(autostartLink);
6910 6911
    if (vm)
        virDomainObjUnlock(vm);
6912
    qemuDriverUnlock(driver);
6913
    return ret;
6914 6915
}

6916 6917 6918 6919 6920

static char *qemuGetSchedulerType(virDomainPtr dom,
                                  int *nparams)
{
    struct qemud_driver *driver = dom->conn->privateData;
6921
    char *ret = NULL;
6922

6923
    qemuDriverLock(driver);
6924
    if (!qemuCgroupControllerActive(driver, VIR_CGROUP_CONTROLLER_CPU)) {
6925 6926
        qemuReportError(VIR_ERR_NO_SUPPORT,
                        __FUNCTION__);
6927
        goto cleanup;
6928 6929 6930 6931 6932 6933 6934
    }

    if (nparams)
        *nparams = 1;

    ret = strdup("posix");
    if (!ret)
6935
        virReportOOMError();
6936 6937 6938

cleanup:
    qemuDriverUnlock(driver);
6939 6940 6941
    return ret;
}

6942 6943 6944 6945 6946 6947 6948 6949 6950 6951 6952 6953 6954 6955 6956 6957 6958 6959 6960 6961 6962 6963 6964 6965 6966 6967 6968 6969 6970 6971 6972 6973 6974 6975 6976 6977 6978 6979 6980 6981 6982 6983 6984 6985 6986 6987 6988 6989 6990 6991 6992 6993 6994 6995 6996 6997 6998 6999 7000 7001 7002 7003 7004 7005 7006 7007 7008

static int qemuDomainSetMemoryParameters(virDomainPtr dom,
                                         virMemoryParameterPtr params,
                                         int nparams,
                                         unsigned int flags ATTRIBUTE_UNUSED)
{
    struct qemud_driver *driver = dom->conn->privateData;
    int i;
    virCgroupPtr group = NULL;
    virDomainObjPtr vm = NULL;
    int ret = -1;

    qemuDriverLock(driver);
    if (!qemuCgroupControllerActive(driver, VIR_CGROUP_CONTROLLER_MEMORY)) {
        qemuReportError(VIR_ERR_NO_SUPPORT,
                        __FUNCTION__);
        goto cleanup;
    }

    vm = virDomainFindByUUID(&driver->domains, dom->uuid);

    if (vm == NULL) {
        qemuReportError(VIR_ERR_INTERNAL_ERROR,
                        _("No such domain %s"), dom->uuid);
        goto cleanup;
    }

    if (virCgroupForDomain(driver->cgroup, vm->def->name, &group, 0) != 0) {
        qemuReportError(VIR_ERR_INTERNAL_ERROR,
                        _("cannot find cgroup for domain %s"), vm->def->name);
        goto cleanup;
    }

    ret = 0;
    for (i = 0; i < nparams; i++) {
        virMemoryParameterPtr param = &params[i];

        if (STREQ(param->field, VIR_DOMAIN_MEMORY_HARD_LIMIT)) {
            int rc;
            if (param->type != VIR_DOMAIN_MEMORY_PARAM_ULLONG) {
                qemuReportError(VIR_ERR_INVALID_ARG, "%s",
                                _("invalid type for memory hard_limit tunable, expected a 'ullong'"));
                ret = -1;
                continue;
            }

            rc = virCgroupSetMemoryHardLimit(group, params[i].value.ul);
            if (rc != 0) {
                virReportSystemError(-rc, "%s",
                                     _("unable to set memory hard_limit tunable"));
                ret = -1;
            }
        } else if (STREQ(param->field, VIR_DOMAIN_MEMORY_SOFT_LIMIT)) {
            int rc;
            if (param->type != VIR_DOMAIN_MEMORY_PARAM_ULLONG) {
                qemuReportError(VIR_ERR_INVALID_ARG, "%s",
                                _("invalid type for memory soft_limit tunable, expected a 'ullong'"));
                ret = -1;
                continue;
            }

            rc = virCgroupSetMemorySoftLimit(group, params[i].value.ul);
            if (rc != 0) {
                virReportSystemError(-rc, "%s",
                                     _("unable to set memory soft_limit tunable"));
                ret = -1;
            }
7009
        } else if (STREQ(param->field, VIR_DOMAIN_MEMORY_SWAP_HARD_LIMIT)) {
7010 7011 7012 7013 7014 7015 7016 7017 7018 7019 7020 7021 7022 7023 7024 7025 7026 7027 7028 7029 7030 7031 7032 7033 7034 7035 7036 7037 7038 7039 7040 7041 7042
            int rc;
            if (param->type != VIR_DOMAIN_MEMORY_PARAM_ULLONG) {
                qemuReportError(VIR_ERR_INVALID_ARG, "%s",
                                _("invalid type for swap_hard_limit tunable, expected a 'ullong'"));
                ret = -1;
                continue;
            }

            rc = virCgroupSetSwapHardLimit(group, params[i].value.ul);
            if (rc != 0) {
                virReportSystemError(-rc, "%s",
                                     _("unable to set swap_hard_limit tunable"));
                ret = -1;
            }
        } else if (STREQ(param->field, VIR_DOMAIN_MEMORY_MIN_GUARANTEE)) {
            qemuReportError(VIR_ERR_INVALID_ARG,
                            _("Memory tunable `%s' not implemented"), param->field);
            ret = -1;
        } else {
            qemuReportError(VIR_ERR_INVALID_ARG,
                            _("Parameter `%s' not supported"), param->field);
            ret = -1;
        }
    }

cleanup:
    virCgroupFree(&group);
    if (vm)
        virDomainObjUnlock(vm);
    qemuDriverUnlock(driver);
    return ret;
}

7043 7044 7045 7046 7047 7048 7049 7050 7051
static int qemuDomainGetMemoryParameters(virDomainPtr dom,
                                         virMemoryParameterPtr params,
                                         int *nparams,
                                         unsigned int flags ATTRIBUTE_UNUSED)
{
    struct qemud_driver *driver = dom->conn->privateData;
    int i;
    virCgroupPtr group = NULL;
    virDomainObjPtr vm = NULL;
7052
    unsigned long long val;
7053 7054 7055 7056 7057 7058 7059 7060 7061 7062 7063 7064 7065 7066 7067 7068 7069 7070 7071 7072 7073 7074 7075 7076 7077 7078 7079 7080 7081 7082 7083 7084 7085 7086 7087 7088 7089 7090 7091 7092 7093 7094 7095 7096 7097 7098 7099 7100 7101 7102
    int ret = -1;
    int rc;

    qemuDriverLock(driver);

    if (!qemuCgroupControllerActive(driver, VIR_CGROUP_CONTROLLER_MEMORY)) {
        qemuReportError(VIR_ERR_NO_SUPPORT,
                        __FUNCTION__);
        goto cleanup;
    }

    vm = virDomainFindByUUID(&driver->domains, dom->uuid);

    if (vm == NULL) {
        qemuReportError(VIR_ERR_INTERNAL_ERROR,
                        _("No such domain %s"), dom->uuid);
        goto cleanup;
    }

    if ((*nparams) == 0) {
        /* Current number of memory parameters supported by cgroups */
        *nparams = QEMU_NB_MEM_PARAM;
        ret = 0;
        goto cleanup;
    }

    if ((*nparams) != QEMU_NB_MEM_PARAM) {
        qemuReportError(VIR_ERR_INVALID_ARG,
                        "%s", _("Invalid parameter count"));
        goto cleanup;
    }

    if (virCgroupForDomain(driver->cgroup, vm->def->name, &group, 0) != 0) {
        qemuReportError(VIR_ERR_INTERNAL_ERROR,
                        _("cannot find cgroup for domain %s"), vm->def->name);
        goto cleanup;
    }

    for (i = 0; i < *nparams; i++) {
        virMemoryParameterPtr param = &params[i];
        val = 0;
        param->value.ul = 0;
        param->type = VIR_DOMAIN_MEMORY_PARAM_ULLONG;

        switch(i) {
        case 0: /* fill memory hard limit here */
            rc = virCgroupGetMemoryHardLimit(group, &val);
            if (rc != 0) {
                virReportSystemError(-rc, "%s",
                                     _("unable to get memory hard limit"));
7103
                goto cleanup;
7104 7105 7106 7107
            }
            if (virStrcpyStatic(param->field, VIR_DOMAIN_MEMORY_HARD_LIMIT) == NULL) {
                qemuReportError(VIR_ERR_INTERNAL_ERROR,
                                "%s", _("Field memory hard limit too long for destination"));
7108
                goto cleanup;
7109 7110 7111 7112 7113 7114 7115 7116 7117
            }
            param->value.ul = val;
            break;

        case 1: /* fill memory soft limit here */
            rc = virCgroupGetMemorySoftLimit(group, &val);
            if (rc != 0) {
                virReportSystemError(-rc, "%s",
                                     _("unable to get memory soft limit"));
7118
                goto cleanup;
7119 7120 7121 7122
            }
            if (virStrcpyStatic(param->field, VIR_DOMAIN_MEMORY_SOFT_LIMIT) == NULL) {
                qemuReportError(VIR_ERR_INTERNAL_ERROR,
                                "%s", _("Field memory soft limit too long for destination"));
7123
                goto cleanup;
7124 7125 7126 7127 7128 7129 7130 7131 7132
            }
            param->value.ul = val;
            break;

        case 2: /* fill swap hard limit here */
            rc = virCgroupGetSwapHardLimit(group, &val);
            if (rc != 0) {
                virReportSystemError(-rc, "%s",
                                     _("unable to get swap hard limit"));
7133
                goto cleanup;
7134
            }
7135
            if (virStrcpyStatic(param->field, VIR_DOMAIN_MEMORY_SWAP_HARD_LIMIT) == NULL) {
7136 7137
                qemuReportError(VIR_ERR_INTERNAL_ERROR,
                                "%s", _("Field swap hard limit too long for destination"));
7138
                goto cleanup;
7139 7140 7141 7142 7143 7144 7145 7146 7147 7148
            }
            param->value.ul = val;
            break;

        default:
            break;
            /* should not hit here */
        }
    }

7149 7150
    ret = 0;

7151 7152 7153 7154 7155 7156 7157 7158 7159
cleanup:
    if (group)
        virCgroupFree(&group);
    if (vm)
        virDomainObjUnlock(vm);
    qemuDriverUnlock(driver);
    return ret;
}

7160 7161 7162 7163 7164 7165 7166 7167 7168 7169
static int qemuSetSchedulerParameters(virDomainPtr dom,
                                      virSchedParameterPtr params,
                                      int nparams)
{
    struct qemud_driver *driver = dom->conn->privateData;
    int i;
    virCgroupPtr group = NULL;
    virDomainObjPtr vm = NULL;
    int ret = -1;

7170
    qemuDriverLock(driver);
7171
    if (!qemuCgroupControllerActive(driver, VIR_CGROUP_CONTROLLER_CPU)) {
7172 7173
        qemuReportError(VIR_ERR_NO_SUPPORT,
                        __FUNCTION__);
7174
        goto cleanup;
7175 7176 7177 7178 7179
    }

    vm = virDomainFindByUUID(&driver->domains, dom->uuid);

    if (vm == NULL) {
7180 7181
        qemuReportError(VIR_ERR_INTERNAL_ERROR,
                        _("No such domain %s"), dom->uuid);
7182 7183 7184 7185
        goto cleanup;
    }

    if (virCgroupForDomain(driver->cgroup, vm->def->name, &group, 0) != 0) {
7186 7187
        qemuReportError(VIR_ERR_INTERNAL_ERROR,
                        _("cannot find cgroup for domain %s"), vm->def->name);
7188 7189 7190 7191 7192 7193 7194 7195 7196
        goto cleanup;
    }

    for (i = 0; i < nparams; i++) {
        virSchedParameterPtr param = &params[i];

        if (STREQ(param->field, "cpu_shares")) {
            int rc;
            if (param->type != VIR_DOMAIN_SCHED_FIELD_ULLONG) {
7197 7198
                qemuReportError(VIR_ERR_INVALID_ARG, "%s",
                                _("invalid type for cpu_shares tunable, expected a 'ullong'"));
7199 7200 7201 7202 7203
                goto cleanup;
            }

            rc = virCgroupSetCpuShares(group, params[i].value.ul);
            if (rc != 0) {
7204
                virReportSystemError(-rc, "%s",
7205 7206 7207 7208
                                     _("unable to set cpu shares tunable"));
                goto cleanup;
            }
        } else {
7209 7210
            qemuReportError(VIR_ERR_INVALID_ARG,
                            _("Invalid parameter `%s'"), param->field);
7211 7212 7213 7214 7215 7216 7217 7218 7219
            goto cleanup;
        }
    }
    ret = 0;

cleanup:
    virCgroupFree(&group);
    if (vm)
        virDomainObjUnlock(vm);
7220
    qemuDriverUnlock(driver);
7221 7222 7223 7224 7225 7226 7227 7228 7229 7230 7231 7232 7233 7234
    return ret;
}

static int qemuGetSchedulerParameters(virDomainPtr dom,
                                      virSchedParameterPtr params,
                                      int *nparams)
{
    struct qemud_driver *driver = dom->conn->privateData;
    virCgroupPtr group = NULL;
    virDomainObjPtr vm = NULL;
    unsigned long long val;
    int ret = -1;
    int rc;

7235
    qemuDriverLock(driver);
7236
    if (!qemuCgroupControllerActive(driver, VIR_CGROUP_CONTROLLER_CPU)) {
7237 7238
        qemuReportError(VIR_ERR_NO_SUPPORT,
                        __FUNCTION__);
7239
        goto cleanup;
7240 7241 7242
    }

    if ((*nparams) != 1) {
7243 7244
        qemuReportError(VIR_ERR_INVALID_ARG,
                        "%s", _("Invalid parameter count"));
7245
        goto cleanup;
7246 7247 7248 7249 7250
    }

    vm = virDomainFindByUUID(&driver->domains, dom->uuid);

    if (vm == NULL) {
7251 7252
        qemuReportError(VIR_ERR_INTERNAL_ERROR,
                        _("No such domain %s"), dom->uuid);
7253 7254 7255 7256
        goto cleanup;
    }

    if (virCgroupForDomain(driver->cgroup, vm->def->name, &group, 0) != 0) {
7257 7258
        qemuReportError(VIR_ERR_INTERNAL_ERROR,
                        _("cannot find cgroup for domain %s"), vm->def->name);
7259 7260 7261 7262 7263
        goto cleanup;
    }

    rc = virCgroupGetCpuShares(group, &val);
    if (rc != 0) {
7264
        virReportSystemError(-rc, "%s",
7265 7266 7267 7268 7269
                             _("unable to get cpu shares tunable"));
        goto cleanup;
    }
    params[0].value.ul = val;
    params[0].type = VIR_DOMAIN_SCHED_FIELD_ULLONG;
C
Chris Lalancette 已提交
7270
    if (virStrcpyStatic(params[0].field, "cpu_shares") == NULL) {
7271 7272
        qemuReportError(VIR_ERR_INTERNAL_ERROR,
                        "%s", _("Field cpu_shares too long for destination"));
C
Chris Lalancette 已提交
7273 7274
        goto cleanup;
    }
7275 7276 7277 7278 7279 7280 7281

    ret = 0;

cleanup:
    virCgroupFree(&group);
    if (vm)
        virDomainObjUnlock(vm);
7282
    qemuDriverUnlock(driver);
7283 7284 7285 7286
    return ret;
}


7287 7288 7289 7290 7291 7292 7293 7294 7295
/* This uses the 'info blockstats' monitor command which was
 * integrated into both qemu & kvm in late 2007.  If the command is
 * not supported we detect this and return the appropriate error.
 */
static int
qemudDomainBlockStats (virDomainPtr dom,
                       const char *path,
                       struct _virDomainBlockStats *stats)
{
7296
    struct qemud_driver *driver = dom->conn->privateData;
7297
    int i, ret = -1;
7298
    virDomainObjPtr vm;
7299
    virDomainDiskDefPtr disk = NULL;
7300

7301
    qemuDriverLock(driver);
7302
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
7303
    qemuDriverUnlock(driver);
7304
    if (!vm) {
7305 7306
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
7307 7308
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
7309
        goto cleanup;
7310
    }
7311 7312 7313 7314

    if (qemuDomainObjBeginJob(vm) < 0)
        goto cleanup;

D
Daniel P. Berrange 已提交
7315
    if (!virDomainObjIsActive (vm)) {
7316 7317
        qemuReportError(VIR_ERR_OPERATION_INVALID,
                        "%s", _("domain is not running"));
7318
        goto endjob;
7319 7320
    }

7321 7322 7323 7324 7325 7326 7327 7328
    for (i = 0 ; i < vm->def->ndisks ; i++) {
        if (STREQ(path, vm->def->disks[i]->dst)) {
            disk = vm->def->disks[i];
            break;
        }
    }

    if (!disk) {
7329 7330
        qemuReportError(VIR_ERR_INVALID_ARG,
                        _("invalid path: %s"), path);
7331
        goto endjob;
7332 7333
    }

7334
    if (!disk->info.alias) {
7335 7336
        qemuReportError(VIR_ERR_INTERNAL_ERROR,
                        _("missing disk device alias name for %s"), disk->dst);
7337
        goto endjob;
7338
    }
7339

7340
    qemuDomainObjPrivatePtr priv = vm->privateData;
7341 7342
    qemuDomainObjEnterMonitor(vm);
    ret = qemuMonitorGetBlockStatsInfo(priv->mon,
7343
                                       disk->info.alias,
7344 7345 7346 7347 7348 7349
                                       &stats->rd_req,
                                       &stats->rd_bytes,
                                       &stats->wr_req,
                                       &stats->wr_bytes,
                                       &stats->errs);
    qemuDomainObjExitMonitor(vm);
7350

7351
endjob:
7352 7353
    if (qemuDomainObjEndJob(vm) == 0)
        vm = NULL;
7354

7355
cleanup:
7356 7357
    if (vm)
        virDomainObjUnlock(vm);
7358
    return ret;
7359 7360
}

7361
#ifdef __linux__
7362 7363 7364 7365 7366
static int
qemudDomainInterfaceStats (virDomainPtr dom,
                           const char *path,
                           struct _virDomainInterfaceStats *stats)
{
7367 7368
    struct qemud_driver *driver = dom->conn->privateData;
    virDomainObjPtr vm;
7369
    int i;
7370
    int ret = -1;
7371

7372
    qemuDriverLock(driver);
7373
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
7374 7375
    qemuDriverUnlock(driver);

7376
    if (!vm) {
7377 7378
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
7379 7380
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
7381
        goto cleanup;
7382 7383
    }

D
Daniel P. Berrange 已提交
7384
    if (!virDomainObjIsActive(vm)) {
7385 7386
        qemuReportError(VIR_ERR_OPERATION_INVALID,
                        "%s", _("domain is not running"));
7387
        goto cleanup;
7388 7389 7390
    }

    /* Check the path is one of the domain's network interfaces. */
7391 7392
    for (i = 0 ; i < vm->def->nnets ; i++) {
        if (vm->def->nets[i]->ifname &&
7393 7394 7395 7396
            STREQ (vm->def->nets[i]->ifname, path)) {
            ret = 0;
            break;
        }
7397 7398
    }

7399
    if (ret == 0)
7400
        ret = linuxDomainInterfaceStats(path, stats);
7401
    else
7402 7403
        qemuReportError(VIR_ERR_INVALID_ARG,
                        _("invalid path, '%s' is not a known interface"), path);
7404

7405
cleanup:
7406 7407
    if (vm)
        virDomainObjUnlock(vm);
7408 7409
    return ret;
}
7410
#else
7411 7412 7413 7414
static int
qemudDomainInterfaceStats (virDomainPtr dom,
                           const char *path ATTRIBUTE_UNUSED,
                           struct _virDomainInterfaceStats *stats ATTRIBUTE_UNUSED)
7415 7416
    qemuReportError(VIR_ERR_NO_SUPPORT,
                    "%s", __FUNCTION__);
7417 7418
    return -1;
}
7419
#endif
7420

7421 7422 7423 7424 7425 7426 7427 7428 7429 7430 7431 7432 7433 7434 7435 7436
static int
qemudDomainMemoryStats (virDomainPtr dom,
                        struct _virDomainMemoryStat *stats,
                        unsigned int nr_stats)
{
    struct qemud_driver *driver = dom->conn->privateData;
    virDomainObjPtr vm;
    unsigned int ret = -1;

    qemuDriverLock(driver);
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
    qemuDriverUnlock(driver);

    if (!vm) {
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
7437 7438
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
7439 7440 7441
        goto cleanup;
    }

7442 7443 7444
    if (qemuDomainObjBeginJob(vm) < 0)
        goto cleanup;

7445 7446 7447
    if (virDomainObjIsActive(vm)) {
        qemuDomainObjPrivatePtr priv = vm->privateData;
        qemuDomainObjEnterMonitor(vm);
7448
        ret = qemuMonitorGetMemoryStats(priv->mon, stats, nr_stats);
7449 7450
        qemuDomainObjExitMonitor(vm);
    } else {
7451 7452
        qemuReportError(VIR_ERR_OPERATION_INVALID,
                        "%s", _("domain is not running"));
7453 7454
    }

7455 7456 7457
    if (qemuDomainObjEndJob(vm) == 0)
        vm = NULL;

7458 7459 7460 7461 7462 7463
cleanup:
    if (vm)
        virDomainObjUnlock(vm);
    return ret;
}

7464 7465 7466 7467 7468 7469 7470
static int
qemudDomainBlockPeek (virDomainPtr dom,
                      const char *path,
                      unsigned long long offset, size_t size,
                      void *buffer,
                      unsigned int flags ATTRIBUTE_UNUSED)
{
7471 7472 7473
    struct qemud_driver *driver = dom->conn->privateData;
    virDomainObjPtr vm;
    int fd = -1, ret = -1, i;
7474

7475
    qemuDriverLock(driver);
7476
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
7477 7478
    qemuDriverUnlock(driver);

7479
    if (!vm) {
7480 7481
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
7482 7483
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
7484
        goto cleanup;
7485 7486 7487
    }

    if (!path || path[0] == '\0') {
7488 7489
        qemuReportError(VIR_ERR_INVALID_ARG,
                        "%s", _("NULL or empty path"));
7490
        goto cleanup;
7491 7492 7493
    }

    /* Check the path belongs to this domain. */
7494 7495
    for (i = 0 ; i < vm->def->ndisks ; i++) {
        if (vm->def->disks[i]->src != NULL &&
7496 7497 7498 7499
            STREQ (vm->def->disks[i]->src, path)) {
            ret = 0;
            break;
        }
7500 7501
    }

7502 7503 7504 7505 7506
    if (ret == 0) {
        ret = -1;
        /* The path is correct, now try to open it and get its size. */
        fd = open (path, O_RDONLY);
        if (fd == -1) {
7507 7508
            virReportSystemError(errno,
                                 _("%s: failed to open"), path);
7509 7510
            goto cleanup;
        }
7511

7512 7513 7514 7515 7516 7517
        /* Seek and read. */
        /* NB. Because we configure with AC_SYS_LARGEFILE, off_t should
         * be 64 bits on all platforms.
         */
        if (lseek (fd, offset, SEEK_SET) == (off_t) -1 ||
            saferead (fd, buffer, size) == (ssize_t) -1) {
7518 7519
            virReportSystemError(errno,
                                 _("%s: failed to seek or read"), path);
7520 7521 7522 7523 7524
            goto cleanup;
        }

        ret = 0;
    } else {
7525 7526
        qemuReportError(VIR_ERR_INVALID_ARG,
                        "%s", _("invalid path"));
7527 7528
    }

7529
cleanup:
7530
    VIR_FORCE_CLOSE(fd);
7531 7532
    if (vm)
        virDomainObjUnlock(vm);
7533 7534 7535
    return ret;
}

R
Richard W.M. Jones 已提交
7536 7537 7538 7539 7540 7541
static int
qemudDomainMemoryPeek (virDomainPtr dom,
                       unsigned long long offset, size_t size,
                       void *buffer,
                       unsigned int flags)
{
7542 7543
    struct qemud_driver *driver = dom->conn->privateData;
    virDomainObjPtr vm;
7544
    char *tmp = NULL;
R
Richard W.M. Jones 已提交
7545 7546
    int fd = -1, ret = -1;

7547
    qemuDriverLock(driver);
7548
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
7549
    qemuDriverUnlock(driver);
R
Richard W.M. Jones 已提交
7550 7551

    if (!vm) {
7552 7553
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
7554 7555
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
7556 7557 7558
        goto cleanup;
    }

7559
    if (flags != VIR_MEMORY_VIRTUAL && flags != VIR_MEMORY_PHYSICAL) {
7560 7561
        qemuReportError(VIR_ERR_INVALID_ARG,
                        "%s", _("flags parameter must be VIR_MEMORY_VIRTUAL or VIR_MEMORY_PHYSICAL"));
7562
        goto cleanup;
R
Richard W.M. Jones 已提交
7563 7564
    }

7565 7566 7567
    if (qemuDomainObjBeginJob(vm) < 0)
        goto cleanup;

D
Daniel P. Berrange 已提交
7568
    if (!virDomainObjIsActive(vm)) {
7569 7570
        qemuReportError(VIR_ERR_OPERATION_INVALID,
                        "%s", _("domain is not running"));
7571
        goto endjob;
R
Richard W.M. Jones 已提交
7572 7573
    }

7574
    if (virAsprintf(&tmp, "%s/qemu.mem.XXXXXX", driver->cacheDir) < 0) {
7575
        virReportOOMError();
7576
        goto endjob;
7577 7578
    }

R
Richard W.M. Jones 已提交
7579 7580
    /* Create a temporary filename. */
    if ((fd = mkstemp (tmp)) == -1) {
7581 7582
        virReportSystemError(errno,
                             _("mkstemp(\"%s\") failed"), tmp);
7583
        goto endjob;
R
Richard W.M. Jones 已提交
7584 7585
    }

7586
    qemuDomainObjPrivatePtr priv = vm->privateData;
7587
    qemuDomainObjEnterMonitor(vm);
7588
    if (flags == VIR_MEMORY_VIRTUAL) {
7589 7590
        if (qemuMonitorSaveVirtualMemory(priv->mon, offset, size, tmp) < 0) {
            qemuDomainObjExitMonitor(vm);
7591
            goto endjob;
7592
        }
7593
    } else {
7594 7595
        if (qemuMonitorSavePhysicalMemory(priv->mon, offset, size, tmp) < 0) {
            qemuDomainObjExitMonitor(vm);
7596
            goto endjob;
7597
        }
R
Richard W.M. Jones 已提交
7598
    }
7599
    qemuDomainObjExitMonitor(vm);
R
Richard W.M. Jones 已提交
7600 7601 7602

    /* Read the memory file into buffer. */
    if (saferead (fd, buffer, size) == (ssize_t) -1) {
7603 7604 7605
        virReportSystemError(errno,
                             _("failed to read temporary file "
                               "created with template %s"), tmp);
7606
        goto endjob;
R
Richard W.M. Jones 已提交
7607 7608 7609
    }

    ret = 0;
7610

7611
endjob:
7612 7613
    if (qemuDomainObjEndJob(vm) == 0)
        vm = NULL;
7614

7615
cleanup:
7616
    VIR_FREE(tmp);
7617
    VIR_FORCE_CLOSE(fd);
R
Richard W.M. Jones 已提交
7618
    unlink (tmp);
7619 7620
    if (vm)
        virDomainObjUnlock(vm);
R
Richard W.M. Jones 已提交
7621 7622 7623
    return ret;
}

7624

7625 7626 7627 7628 7629 7630 7631 7632 7633 7634
static int qemuDomainGetBlockInfo(virDomainPtr dom,
                                  const char *path,
                                  virDomainBlockInfoPtr info,
                                  unsigned int flags) {
    struct qemud_driver *driver = dom->conn->privateData;
    virDomainObjPtr vm;
    int ret = -1;
    int fd = -1;
    off_t end;
    virStorageFileMetadata meta;
7635
    virDomainDiskDefPtr disk = NULL;
7636 7637
    struct stat sb;
    int i;
7638
    int format;
7639 7640 7641 7642 7643 7644 7645 7646 7647 7648 7649 7650 7651 7652 7653 7654 7655 7656 7657 7658 7659 7660 7661 7662

    virCheckFlags(0, -1);

    qemuDriverLock(driver);
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
    qemuDriverUnlock(driver);
    if (!vm) {
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
        goto cleanup;
    }

    if (!path || path[0] == '\0') {
        qemuReportError(VIR_ERR_INVALID_ARG,
                        "%s", _("NULL or empty path"));
        goto cleanup;
    }

    /* Check the path belongs to this domain. */
    for (i = 0 ; i < vm->def->ndisks ; i++) {
        if (vm->def->disks[i]->src != NULL &&
            STREQ (vm->def->disks[i]->src, path)) {
7663
            disk = vm->def->disks[i];
7664 7665 7666 7667
            break;
        }
    }

7668
    if (!disk) {
7669 7670 7671 7672 7673 7674 7675 7676 7677 7678 7679 7680 7681 7682
        qemuReportError(VIR_ERR_INVALID_ARG,
                        _("invalid path %s not assigned to domain"), path);
        goto cleanup;
    }

    /* The path is correct, now try to open it and get its size. */
    fd = open (path, O_RDONLY);
    if (fd == -1) {
        virReportSystemError(errno,
                             _("failed to open path '%s'"), path);
        goto cleanup;
    }

    /* Probe for magic formats */
7683 7684 7685 7686 7687 7688 7689 7690
    if (disk->driverType) {
        if ((format = virStorageFileFormatTypeFromString(disk->driverType)) < 0) {
            qemuReportError(VIR_ERR_INTERNAL_ERROR,
                            _("unknown disk format %s for %s"),
                            disk->driverType, disk->src);
            goto cleanup;
        }
    } else {
7691 7692 7693 7694 7695 7696 7697
        if (driver->allowDiskFormatProbing) {
            if ((format = virStorageFileProbeFormat(disk->src)) < 0)
                goto cleanup;
        } else {
            qemuReportError(VIR_ERR_INTERNAL_ERROR,
                            _("no disk format for %s and probing is disabled"),
                            disk->src);
7698
            goto cleanup;
7699
        }
7700 7701 7702 7703 7704
    }

    if (virStorageFileGetMetadataFromFD(path, fd,
                                        format,
                                        &meta) < 0)
7705 7706 7707 7708 7709 7710 7711 7712 7713 7714
        goto cleanup;

    /* Get info for normal formats */
    if (fstat(fd, &sb) < 0) {
        virReportSystemError(errno,
                             _("cannot stat file '%s'"), path);
        goto cleanup;
    }

    if (S_ISREG(sb.st_mode)) {
7715
#ifndef WIN32
7716 7717 7718 7719 7720 7721 7722 7723 7724 7725 7726 7727 7728 7729 7730 7731 7732 7733 7734 7735 7736 7737 7738 7739 7740 7741 7742 7743
        info->physical = (unsigned long long)sb.st_blocks *
            (unsigned long long)DEV_BSIZE;
#else
        info->physical = sb.st_size;
#endif
        /* Regular files may be sparse, so logical size (capacity) is not same
         * as actual physical above
         */
        info->capacity = sb.st_size;
    } else {
        /* NB. Because we configure with AC_SYS_LARGEFILE, off_t should
         * be 64 bits on all platforms.
         */
        end = lseek (fd, 0, SEEK_END);
        if (end == (off_t)-1) {
            virReportSystemError(errno,
                                 _("failed to seek to end of %s"), path);
            goto cleanup;
        }
        info->physical = end;
        info->capacity = end;
    }

    /* If the file we probed has a capacity set, then override
     * what we calculated from file/block extents */
    if (meta.capacity)
        info->capacity = meta.capacity;

7744
    /* Set default value .. */
7745 7746
    info->allocation = info->physical;

7747 7748 7749
    /* ..but if guest is running & not using raw
       disk format and on a block device, then query
       highest allocated extent from QEMU */
7750
    if (disk->type == VIR_DOMAIN_DISK_TYPE_BLOCK &&
7751
        format != VIR_STORAGE_FILE_RAW &&
7752 7753 7754 7755
        S_ISBLK(sb.st_mode)) {
        qemuDomainObjPrivatePtr priv = vm->privateData;
        if (qemuDomainObjBeginJob(vm) < 0)
            goto cleanup;
7756 7757 7758 7759 7760 7761 7762 7763 7764
        if (!virDomainObjIsActive(vm))
            ret = 0;
        else {
            qemuDomainObjEnterMonitor(vm);
            ret = qemuMonitorGetBlockExtent(priv->mon,
                                            disk->info.alias,
                                            &info->allocation);
            qemuDomainObjExitMonitor(vm);
        }
7765 7766 7767 7768 7769 7770

        if (qemuDomainObjEndJob(vm) == 0)
            vm = NULL;
    } else {
        ret = 0;
    }
7771 7772

cleanup:
7773
    VIR_FORCE_CLOSE(fd);
7774 7775 7776 7777 7778 7779
    if (vm)
        virDomainObjUnlock(vm);
    return ret;
}


7780
static int
7781 7782 7783 7784
qemuDomainEventRegister(virConnectPtr conn,
                        virConnectDomainEventCallback callback,
                        void *opaque,
                        virFreeCallback freecb)
7785
{
7786 7787 7788
    struct qemud_driver *driver = conn->privateData;
    int ret;

7789
    qemuDriverLock(driver);
7790 7791
    ret = virDomainEventCallbackListAdd(conn, driver->domainEventCallbacks,
                                        callback, opaque, freecb);
7792
    qemuDriverUnlock(driver);
7793

7794
    return ret;
7795 7796
}

7797

7798
static int
7799 7800
qemuDomainEventDeregister(virConnectPtr conn,
                          virConnectDomainEventCallback callback)
7801
{
7802 7803 7804
    struct qemud_driver *driver = conn->privateData;
    int ret;

7805
    qemuDriverLock(driver);
7806 7807 7808 7809 7810 7811
    if (driver->domainEventDispatching)
        ret = virDomainEventCallbackListMarkDelete(conn, driver->domainEventCallbacks,
                                                   callback);
    else
        ret = virDomainEventCallbackListRemove(conn, driver->domainEventCallbacks,
                                               callback);
7812
    qemuDriverUnlock(driver);
7813

7814
    return ret;
7815 7816
}

7817 7818 7819 7820 7821 7822 7823 7824 7825 7826 7827 7828 7829 7830 7831 7832 7833 7834 7835 7836 7837 7838 7839 7840 7841 7842 7843 7844 7845 7846 7847 7848 7849 7850 7851 7852 7853 7854 7855 7856 7857 7858 7859

static int
qemuDomainEventRegisterAny(virConnectPtr conn,
                           virDomainPtr dom,
                           int eventID,
                           virConnectDomainEventGenericCallback callback,
                           void *opaque,
                           virFreeCallback freecb)
{
    struct qemud_driver *driver = conn->privateData;
    int ret;

    qemuDriverLock(driver);
    ret = virDomainEventCallbackListAddID(conn,
                                          driver->domainEventCallbacks,
                                          dom, eventID,
                                          callback, opaque, freecb);
    qemuDriverUnlock(driver);

    return ret;
}


static int
qemuDomainEventDeregisterAny(virConnectPtr conn,
                             int callbackID)
{
    struct qemud_driver *driver = conn->privateData;
    int ret;

    qemuDriverLock(driver);
    if (driver->domainEventDispatching)
        ret = virDomainEventCallbackListMarkDeleteID(conn, driver->domainEventCallbacks,
                                                     callbackID);
    else
        ret = virDomainEventCallbackListRemoveID(conn, driver->domainEventCallbacks,
                                                 callbackID);
    qemuDriverUnlock(driver);

    return ret;
}


7860 7861
static void qemuDomainEventDispatchFunc(virConnectPtr conn,
                                        virDomainEventPtr event,
7862
                                        virConnectDomainEventGenericCallback cb,
7863 7864
                                        void *cbopaque,
                                        void *opaque)
7865
{
7866
    struct qemud_driver *driver = opaque;
7867

7868 7869 7870 7871 7872 7873 7874 7875 7876 7877 7878 7879 7880 7881 7882 7883 7884 7885 7886 7887 7888 7889 7890 7891 7892 7893 7894 7895 7896 7897 7898 7899 7900 7901 7902 7903 7904 7905 7906 7907 7908 7909 7910 7911
    /* Drop the lock whle dispatching, for sake of re-entrancy */
    qemuDriverUnlock(driver);
    virDomainEventDispatchDefaultFunc(conn, event, cb, cbopaque, NULL);
    qemuDriverLock(driver);
}

static void qemuDomainEventFlush(int timer ATTRIBUTE_UNUSED, void *opaque)
{
    struct qemud_driver *driver = opaque;
    virDomainEventQueue tempQueue;

    qemuDriverLock(driver);

    driver->domainEventDispatching = 1;

    /* Copy the queue, so we're reentrant safe */
    tempQueue.count = driver->domainEventQueue->count;
    tempQueue.events = driver->domainEventQueue->events;
    driver->domainEventQueue->count = 0;
    driver->domainEventQueue->events = NULL;

    virEventUpdateTimeout(driver->domainEventTimer, -1);
    virDomainEventQueueDispatch(&tempQueue,
                                driver->domainEventCallbacks,
                                qemuDomainEventDispatchFunc,
                                driver);

    /* Purge any deleted callbacks */
    virDomainEventCallbackListPurgeMarked(driver->domainEventCallbacks);

    driver->domainEventDispatching = 0;
    qemuDriverUnlock(driver);
}


/* driver must be locked before calling */
static void qemuDomainEventQueue(struct qemud_driver *driver,
                                 virDomainEventPtr event)
{
    if (virDomainEventQueuePush(driver->domainEventQueue,
                                event) < 0)
        virDomainEventFree(event);
    if (qemu_driver->domainEventQueue->count == 1)
        virEventUpdateTimeout(driver->domainEventTimer, 0);
7912 7913
}

D
Daniel Veillard 已提交
7914 7915
/* Migration support. */

7916 7917 7918 7919 7920
static bool ATTRIBUTE_NONNULL(1)
qemuDomainIsMigratable(virDomainDefPtr def)
{
    if (def->nhostdevs > 0) {
        qemuReportError(VIR_ERR_OPERATION_INVALID,
7921
            "%s", _("Domain with assigned host devices cannot be migrated"));
7922 7923 7924 7925 7926 7927
        return false;
    }

    return true;
}

C
Chris Lalancette 已提交
7928 7929 7930 7931 7932 7933 7934 7935 7936 7937 7938 7939 7940 7941 7942 7943 7944 7945 7946 7947 7948
/* Prepare is the first step, and it runs on the destination host.
 *
 * This version starts an empty VM listening on a localhost TCP port, and
 * sets up the corresponding virStream to handle the incoming data.
 */
static int
qemudDomainMigratePrepareTunnel(virConnectPtr dconn,
                                virStreamPtr st,
                                unsigned long flags,
                                const char *dname,
                                unsigned long resource ATTRIBUTE_UNUSED,
                                const char *dom_xml)
{
    struct qemud_driver *driver = dconn->privateData;
    virDomainDefPtr def = NULL;
    virDomainObjPtr vm = NULL;
    char *migrateFrom;
    virDomainEventPtr event = NULL;
    int ret = -1;
    int internalret;
    char *unixfile = NULL;
7949
    unsigned long long qemuCmdFlags;
7950 7951 7952 7953 7954 7955 7956 7957
    qemuDomainObjPrivatePtr priv = NULL;
    struct timeval now;

    if (gettimeofday(&now, NULL) < 0) {
        virReportSystemError(errno, "%s",
                             _("cannot get time of day"));
        return -1;
    }
C
Chris Lalancette 已提交
7958 7959 7960

    qemuDriverLock(driver);
    if (!dom_xml) {
7961 7962
        qemuReportError(VIR_ERR_INTERNAL_ERROR,
                        "%s", _("no domain XML passed"));
C
Chris Lalancette 已提交
7963 7964 7965
        goto cleanup;
    }
    if (!(flags & VIR_MIGRATE_TUNNELLED)) {
7966
        qemuReportError(VIR_ERR_INTERNAL_ERROR,
C
Chris Lalancette 已提交
7967 7968 7969 7970
                         "%s", _("PrepareTunnel called but no TUNNELLED flag set"));
        goto cleanup;
    }
    if (st == NULL) {
7971 7972
        qemuReportError(VIR_ERR_INTERNAL_ERROR,
                        "%s", _("tunnelled migration requested but NULL stream passed"));
C
Chris Lalancette 已提交
7973 7974 7975 7976
        goto cleanup;
    }

    /* Parse the domain XML. */
7977
    if (!(def = virDomainDefParseString(driver->caps, dom_xml,
C
Chris Lalancette 已提交
7978
                                        VIR_DOMAIN_XML_INACTIVE))) {
7979 7980
        qemuReportError(VIR_ERR_OPERATION_FAILED,
                        "%s", _("failed to parse XML"));
C
Chris Lalancette 已提交
7981 7982 7983
        goto cleanup;
    }

7984 7985 7986
    if (!qemuDomainIsMigratable(def))
        goto cleanup;

C
Chris Lalancette 已提交
7987
    /* Target domain name, maybe renamed. */
7988 7989 7990 7991 7992 7993
    if (dname) {
        VIR_FREE(def->name);
        def->name = strdup(dname);
        if (def->name == NULL)
            goto cleanup;
    }
C
Chris Lalancette 已提交
7994

7995 7996
    if (virDomainObjIsDuplicate(&driver->domains, def, 1) < 0)
        goto cleanup;
C
Chris Lalancette 已提交
7997

7998
    if (!(vm = virDomainAssignDef(driver->caps,
C
Chris Lalancette 已提交
7999
                                  &driver->domains,
8000
                                  def, true))) {
8001
        /* virDomainAssignDef already set the error */
C
Chris Lalancette 已提交
8002 8003 8004
        goto cleanup;
    }
    def = NULL;
8005
    priv = vm->privateData;
C
Chris Lalancette 已提交
8006

8007 8008
    if (qemuDomainObjBeginJobWithDriver(driver, vm) < 0)
        goto cleanup;
8009
    priv->jobActive = QEMU_JOB_MIGRATION_OUT;
8010

C
Chris Lalancette 已提交
8011 8012 8013 8014
    /* Domain starts inactive, even if the domain XML had an id field. */
    vm->def->id = -1;

    if (virAsprintf(&unixfile, "%s/qemu.tunnelmigrate.dest.%s",
8015
                    driver->libDir, vm->def->name) < 0) {
8016
        virReportOOMError();
8017
        goto endjob;
C
Chris Lalancette 已提交
8018 8019 8020 8021
    }
    unlink(unixfile);

    /* check that this qemu version supports the interactive exec */
8022
    if (qemuCapsExtractVersionInfo(vm->def->emulator, NULL, &qemuCmdFlags) < 0) {
8023 8024 8025
        qemuReportError(VIR_ERR_INTERNAL_ERROR,
                        _("Cannot determine QEMU argv syntax %s"),
                        vm->def->emulator);
8026
        goto endjob;
C
Chris Lalancette 已提交
8027 8028 8029 8030 8031 8032
    }
    if (qemuCmdFlags & QEMUD_CMD_FLAG_MIGRATE_QEMU_UNIX)
        internalret = virAsprintf(&migrateFrom, "unix:%s", unixfile);
    else if (qemuCmdFlags & QEMUD_CMD_FLAG_MIGRATE_QEMU_EXEC)
        internalret = virAsprintf(&migrateFrom, "exec:nc -U -l %s", unixfile);
    else {
8033 8034
        qemuReportError(VIR_ERR_OPERATION_FAILED,
                        "%s", _("Destination qemu is too old to support tunnelled migration"));
8035
        goto endjob;
C
Chris Lalancette 已提交
8036 8037
    }
    if (internalret < 0) {
8038
        virReportOOMError();
8039
        goto endjob;
C
Chris Lalancette 已提交
8040 8041 8042 8043
    }
    /* Start the QEMU daemon, with the same command-line arguments plus
     * -incoming unix:/path/to/file or exec:nc -U /path/to/file
     */
8044
    internalret = qemudStartVMDaemon(dconn, driver, vm, migrateFrom, true,
8045
                                     -1, NULL, VIR_VM_OP_MIGRATE_IN_START);
C
Chris Lalancette 已提交
8046 8047
    VIR_FREE(migrateFrom);
    if (internalret < 0) {
8048
        qemuDomainStartAudit(vm, "migrated", false);
C
Chris Lalancette 已提交
8049 8050 8051 8052 8053 8054 8055
        /* Note that we don't set an error here because qemudStartVMDaemon
         * should have already done that.
         */
        if (!vm->persistent) {
            virDomainRemoveInactive(&driver->domains, vm);
            vm = NULL;
        }
8056
        goto endjob;
C
Chris Lalancette 已提交
8057 8058
    }

8059 8060 8061
    if (virFDStreamConnectUNIX(st,
                               unixfile,
                               false) < 0) {
8062
        qemuDomainStartAudit(vm, "migrated", false);
8063
        qemudShutdownVMDaemon(driver, vm, 0);
8064
        if (!vm->persistent) {
8065 8066
            if (qemuDomainObjEndJob(vm) > 0)
                virDomainRemoveInactive(&driver->domains, vm);
8067 8068
            vm = NULL;
        }
8069
        virReportSystemError(errno,
C
Chris Lalancette 已提交
8070 8071
                             _("cannot open unix socket '%s' for tunnelled migration"),
                             unixfile);
8072
        goto endjob;
C
Chris Lalancette 已提交
8073 8074
    }

8075
    qemuDomainStartAudit(vm, "migrated", true);
8076

C
Chris Lalancette 已提交
8077 8078 8079 8080 8081
    event = virDomainEventNewFromObj(vm,
                                     VIR_DOMAIN_EVENT_STARTED,
                                     VIR_DOMAIN_EVENT_STARTED_MIGRATED);
    ret = 0;

8082
endjob:
8083 8084 8085
    if (vm &&
        qemuDomainObjEndJob(vm) == 0)
        vm = NULL;
8086

8087 8088 8089 8090 8091 8092 8093 8094 8095
    /* We set a fake job active which is held across
     * API calls until the finish() call. This prevents
     * any other APIs being invoked while incoming
     * migration is taking place
     */
    if (vm &&
        virDomainObjIsActive(vm)) {
        priv->jobActive = QEMU_JOB_MIGRATION_IN;
        priv->jobInfo.type = VIR_DOMAIN_JOB_UNBOUNDED;
8096
        priv->jobStart = timeval_to_ms(now);
8097 8098
    }

C
Chris Lalancette 已提交
8099 8100
cleanup:
    virDomainDefFree(def);
8101 8102
    if (unixfile)
        unlink(unixfile);
C
Chris Lalancette 已提交
8103 8104 8105 8106 8107 8108 8109 8110 8111
    VIR_FREE(unixfile);
    if (vm)
        virDomainObjUnlock(vm);
    if (event)
        qemuDomainEventQueue(driver, event);
    qemuDriverUnlock(driver);
    return ret;
}

D
Daniel Veillard 已提交
8112 8113 8114 8115
/* Prepare is the first step, and it runs on the destination host.
 *
 * This starts an empty VM listening on a TCP port.
 */
8116
static int ATTRIBUTE_NONNULL (5)
D
Daniel Veillard 已提交
8117 8118 8119 8120 8121
qemudDomainMigratePrepare2 (virConnectPtr dconn,
                            char **cookie ATTRIBUTE_UNUSED,
                            int *cookielen ATTRIBUTE_UNUSED,
                            const char *uri_in,
                            char **uri_out,
C
Chris Lalancette 已提交
8122
                            unsigned long flags,
D
Daniel Veillard 已提交
8123 8124 8125 8126 8127
                            const char *dname,
                            unsigned long resource ATTRIBUTE_UNUSED,
                            const char *dom_xml)
{
    static int port = 0;
8128 8129
    struct qemud_driver *driver = dconn->privateData;
    virDomainDefPtr def = NULL;
D
Daniel Veillard 已提交
8130 8131
    virDomainObjPtr vm = NULL;
    int this_port;
C
Chris Lalancette 已提交
8132
    char *hostname = NULL;
D
Daniel Veillard 已提交
8133 8134
    char migrateFrom [64];
    const char *p;
8135
    virDomainEventPtr event = NULL;
8136
    int ret = -1;
8137
    int internalret;
8138 8139 8140 8141 8142 8143 8144 8145
    qemuDomainObjPrivatePtr priv = NULL;
    struct timeval now;

    if (gettimeofday(&now, NULL) < 0) {
        virReportSystemError(errno, "%s",
                             _("cannot get time of day"));
        return -1;
    }
8146

C
Chris Lalancette 已提交
8147 8148 8149 8150 8151 8152 8153 8154 8155
    virCheckFlags(VIR_MIGRATE_LIVE |
                  VIR_MIGRATE_PEER2PEER |
                  VIR_MIGRATE_TUNNELLED |
                  VIR_MIGRATE_PERSIST_DEST |
                  VIR_MIGRATE_UNDEFINE_SOURCE |
                  VIR_MIGRATE_PAUSED |
                  VIR_MIGRATE_NON_SHARED_DISK |
                  VIR_MIGRATE_NON_SHARED_INC, -1);

8156
    *uri_out = NULL;
D
Daniel Veillard 已提交
8157

8158
    qemuDriverLock(driver);
C
Chris Lalancette 已提交
8159 8160 8161 8162
    if (flags & VIR_MIGRATE_TUNNELLED) {
        /* this is a logical error; we never should have gotten here with
         * VIR_MIGRATE_TUNNELLED set
         */
8163 8164
        qemuReportError(VIR_ERR_INTERNAL_ERROR,
                        "%s", _("Tunnelled migration requested but invalid RPC method called"));
C
Chris Lalancette 已提交
8165 8166 8167
        goto cleanup;
    }

D
Daniel Veillard 已提交
8168
    if (!dom_xml) {
8169 8170
        qemuReportError(VIR_ERR_INTERNAL_ERROR,
                        "%s", _("no domain XML passed"));
8171
        goto cleanup;
D
Daniel Veillard 已提交
8172 8173 8174 8175 8176 8177 8178 8179 8180 8181 8182 8183 8184 8185 8186 8187 8188
    }

    /* The URI passed in may be NULL or a string "tcp://somehostname:port".
     *
     * If the URI passed in is NULL then we allocate a port number
     * from our pool of port numbers and return a URI of
     * "tcp://ourhostname:port".
     *
     * If the URI passed in is not NULL then we try to parse out the
     * port number and use that (note that the hostname is assumed
     * to be a correct hostname which refers to the target machine).
     */
    if (uri_in == NULL) {
        this_port = QEMUD_MIGRATION_FIRST_PORT + port++;
        if (port == QEMUD_MIGRATION_NUM_PORTS) port = 0;

        /* Get hostname */
C
Chris Lalancette 已提交
8189
        if ((hostname = virGetHostname(NULL)) == NULL)
8190
            goto cleanup;
D
Daniel Veillard 已提交
8191

C
Chris Lalancette 已提交
8192 8193 8194 8195 8196 8197
        if (STRPREFIX(hostname, "localhost")) {
            qemuReportError(VIR_ERR_INTERNAL_ERROR, "%s",
                            _("hostname on destination resolved to localhost, but migration requires an FQDN"));
            goto cleanup;
        }

8198 8199 8200 8201 8202
        /* XXX this really should have been a properly well-formed
         * URI, but we can't add in tcp:// now without breaking
         * compatability with old targets. We at least make the
         * new targets accept both syntaxes though.
         */
D
Daniel Veillard 已提交
8203
        /* Caller frees */
8204 8205
        internalret = virAsprintf(uri_out, "tcp:%s:%d", hostname, this_port);
        if (internalret < 0) {
8206
            virReportOOMError();
8207
            goto cleanup;
D
Daniel Veillard 已提交
8208 8209 8210 8211 8212 8213
        }
    } else {
        /* Check the URI starts with "tcp:".  We will escape the
         * URI when passing it to the qemu monitor, so bad
         * characters in hostname part don't matter.
         */
8214
        if (!STRPREFIX (uri_in, "tcp:")) {
8215 8216
            qemuReportError (VIR_ERR_INVALID_ARG,
                             "%s", _("only tcp URIs are supported for KVM/QEMU migrations"));
8217
            goto cleanup;
D
Daniel Veillard 已提交
8218 8219 8220 8221
        }

        /* Get the port number. */
        p = strrchr (uri_in, ':');
8222 8223 8224 8225 8226 8227 8228 8229
        if (p == strchr(uri_in, ':')) {
            /* Generate a port */
            this_port = QEMUD_MIGRATION_FIRST_PORT + port++;
            if (port == QEMUD_MIGRATION_NUM_PORTS)
                port = 0;

            /* Caller frees */
            if (virAsprintf(uri_out, "%s:%d", uri_in, this_port) < 0) {
8230
                virReportOOMError();
8231 8232 8233 8234 8235 8236 8237
                goto cleanup;
            }

        } else {
            p++; /* definitely has a ':' in it, see above */
            this_port = virParseNumber (&p);
            if (this_port == -1 || p-uri_in != strlen (uri_in)) {
8238 8239
                qemuReportError(VIR_ERR_INVALID_ARG,
                                "%s", _("URI ended with incorrect ':port'"));
8240 8241
                goto cleanup;
            }
D
Daniel Veillard 已提交
8242 8243 8244
        }
    }

8245
    if (*uri_out)
8246 8247
        VIR_DEBUG("Generated uri_out=%s", *uri_out);

D
Daniel Veillard 已提交
8248
    /* Parse the domain XML. */
8249
    if (!(def = virDomainDefParseString(driver->caps, dom_xml,
8250
                                        VIR_DOMAIN_XML_INACTIVE))) {
8251 8252
        qemuReportError(VIR_ERR_OPERATION_FAILED,
                        "%s", _("failed to parse XML"));
8253
        goto cleanup;
D
Daniel Veillard 已提交
8254 8255
    }

8256 8257 8258
    if (!qemuDomainIsMigratable(def))
        goto cleanup;

D
Daniel Veillard 已提交
8259
    /* Target domain name, maybe renamed. */
8260 8261 8262 8263 8264 8265
    if (dname) {
        VIR_FREE(def->name);
        def->name = strdup(dname);
        if (def->name == NULL)
            goto cleanup;
    }
D
Daniel Veillard 已提交
8266

8267 8268
    if (virDomainObjIsDuplicate(&driver->domains, def, 1) < 0)
        goto cleanup;
D
Daniel Veillard 已提交
8269

8270
    if (!(vm = virDomainAssignDef(driver->caps,
D
Daniel Veillard 已提交
8271
                                  &driver->domains,
8272
                                  def, true))) {
8273
        /* virDomainAssignDef already set the error */
8274
        goto cleanup;
D
Daniel Veillard 已提交
8275
    }
8276
    def = NULL;
8277
    priv = vm->privateData;
D
Daniel Veillard 已提交
8278

8279 8280
    if (qemuDomainObjBeginJobWithDriver(driver, vm) < 0)
        goto cleanup;
8281
    priv->jobActive = QEMU_JOB_MIGRATION_OUT;
8282

D
Daniel Veillard 已提交
8283 8284 8285 8286 8287 8288 8289
    /* Domain starts inactive, even if the domain XML had an id field. */
    vm->def->id = -1;

    /* Start the QEMU daemon, with the same command-line arguments plus
     * -incoming tcp:0.0.0.0:port
     */
    snprintf (migrateFrom, sizeof (migrateFrom), "tcp:0.0.0.0:%d", this_port);
8290
    if (qemudStartVMDaemon (dconn, driver, vm, migrateFrom, true,
8291
                            -1, NULL, VIR_VM_OP_MIGRATE_IN_START) < 0) {
8292
        qemuDomainStartAudit(vm, "migrated", false);
8293 8294 8295
        /* Note that we don't set an error here because qemudStartVMDaemon
         * should have already done that.
         */
8296
        if (!vm->persistent) {
8297 8298
            if (qemuDomainObjEndJob(vm) > 0)
                virDomainRemoveInactive(&driver->domains, vm);
8299 8300
            vm = NULL;
        }
8301
        goto endjob;
D
Daniel Veillard 已提交
8302
    }
8303

8304
    qemuDomainStartAudit(vm, "migrated", true);
8305 8306 8307
    event = virDomainEventNewFromObj(vm,
                                     VIR_DOMAIN_EVENT_STARTED,
                                     VIR_DOMAIN_EVENT_STARTED_MIGRATED);
8308
    ret = 0;
D
Daniel Veillard 已提交
8309

8310
endjob:
8311 8312 8313
    if (vm &&
        qemuDomainObjEndJob(vm) == 0)
        vm = NULL;
8314

8315 8316 8317 8318 8319 8320 8321 8322 8323
    /* We set a fake job active which is held across
     * API calls until the finish() call. This prevents
     * any other APIs being invoked while incoming
     * migration is taking place
     */
    if (vm &&
        virDomainObjIsActive(vm)) {
        priv->jobActive = QEMU_JOB_MIGRATION_IN;
        priv->jobInfo.type = VIR_DOMAIN_JOB_UNBOUNDED;
8324
        priv->jobStart = timeval_to_ms(now);
8325 8326
    }

8327
cleanup:
C
Chris Lalancette 已提交
8328
    VIR_FREE(hostname);
8329
    virDomainDefFree(def);
C
Chris Lalancette 已提交
8330
    if (ret != 0)
8331
        VIR_FREE(*uri_out);
8332 8333
    if (vm)
        virDomainObjUnlock(vm);
8334 8335
    if (event)
        qemuDomainEventQueue(driver, event);
8336
    qemuDriverUnlock(driver);
8337
    return ret;
C
Chris Lalancette 已提交
8338 8339 8340

}

8341 8342 8343 8344

/* Perform migration using QEMU's native TCP migrate support,
 * not encrypted obviously
 */
8345
static int doNativeMigrate(struct qemud_driver *driver,
8346 8347
                           virDomainObjPtr vm,
                           const char *uri,
8348
                           unsigned int flags,
8349 8350 8351 8352
                           const char *dname ATTRIBUTE_UNUSED,
                           unsigned long resource)
{
    int ret = -1;
8353
    xmlURIPtr uribits = NULL;
8354
    qemuDomainObjPrivatePtr priv = vm->privateData;
8355
    unsigned int background_flags = QEMU_MONITOR_MIGRATE_BACKGROUND;
8356

8357 8358 8359 8360 8361
    /* Issue the migrate command. */
    if (STRPREFIX(uri, "tcp:") && !STRPREFIX(uri, "tcp://")) {
        /* HACK: source host generates bogus URIs, so fix them up */
        char *tmpuri;
        if (virAsprintf(&tmpuri, "tcp://%s", uri + strlen("tcp:")) < 0) {
8362
            virReportOOMError();
8363 8364 8365 8366 8367 8368 8369 8370
            goto cleanup;
        }
        uribits = xmlParseURI(tmpuri);
        VIR_FREE(tmpuri);
    } else {
        uribits = xmlParseURI(uri);
    }
    if (!uribits) {
8371 8372
        qemuReportError(VIR_ERR_INTERNAL_ERROR,
                        _("cannot parse URI %s"), uri);
8373 8374 8375
        goto cleanup;
    }

8376
    qemuDomainObjEnterMonitorWithDriver(driver, vm);
8377
    if (resource > 0 &&
8378
        qemuMonitorSetMigrationSpeed(priv->mon, resource) < 0) {
8379
        qemuDomainObjExitMonitorWithDriver(driver, vm);
8380
        goto cleanup;
8381
    }
8382

8383 8384 8385 8386 8387 8388 8389 8390
    if (flags & VIR_MIGRATE_NON_SHARED_DISK)
        background_flags |= QEMU_MONITOR_MIGRATE_NON_SHARED_DISK;

    if (flags & VIR_MIGRATE_NON_SHARED_INC)
        background_flags |= QEMU_MONITOR_MIGRATE_NON_SHARED_INC;

    if (qemuMonitorMigrateToHost(priv->mon, background_flags, uribits->server,
                                 uribits->port) < 0) {
8391
        qemuDomainObjExitMonitorWithDriver(driver, vm);
8392 8393
        goto cleanup;
    }
8394
    qemuDomainObjExitMonitorWithDriver(driver, vm);
8395

8396
    if (qemuDomainWaitForMigrationComplete(driver, vm) < 0)
8397 8398 8399 8400 8401 8402 8403 8404 8405 8406
        goto cleanup;

    ret = 0;

cleanup:
    xmlFreeURI(uribits);
    return ret;
}


8407 8408
#define TUNNEL_SEND_BUF_SIZE 65536

8409
static int doTunnelSendAll(virStreamPtr st,
8410 8411
                           int sock)
{
8412 8413 8414 8415 8416 8417 8418 8419
    char *buffer;
    int nbytes = TUNNEL_SEND_BUF_SIZE;

    if (VIR_ALLOC_N(buffer, TUNNEL_SEND_BUF_SIZE) < 0) {
        virReportOOMError();
        virStreamAbort(st);
        return -1;
    }
8420 8421 8422 8423 8424

    /* XXX should honour the 'resource' parameter here */
    for (;;) {
        nbytes = saferead(sock, buffer, nbytes);
        if (nbytes < 0) {
8425
            virReportSystemError(errno, "%s",
8426
                                 _("tunnelled migration failed to read from qemu"));
8427 8428
            virStreamAbort(st);
            VIR_FREE(buffer);
8429 8430 8431 8432 8433 8434 8435
            return -1;
        }
        else if (nbytes == 0)
            /* EOF; get out of here */
            break;

        if (virStreamSend(st, buffer, nbytes) < 0) {
8436 8437
            qemuReportError(VIR_ERR_OPERATION_FAILED, "%s",
                            _("Failed to write migration data to remote libvirtd"));
8438
            VIR_FREE(buffer);
8439 8440 8441 8442
            return -1;
        }
    }

8443 8444
    VIR_FREE(buffer);

8445 8446 8447 8448 8449 8450 8451
    if (virStreamFinish(st) < 0)
        /* virStreamFinish set the error for us */
        return -1;

    return 0;
}

C
Chris Lalancette 已提交
8452
static int doTunnelMigrate(virDomainPtr dom,
8453
                           struct qemud_driver *driver,
8454
                           virConnectPtr dconn,
C
Chris Lalancette 已提交
8455
                           virDomainObjPtr vm,
8456
                           const char *dom_xml,
C
Chris Lalancette 已提交
8457 8458 8459 8460 8461
                           const char *uri,
                           unsigned long flags,
                           const char *dname,
                           unsigned long resource)
{
8462
    qemuDomainObjPrivatePtr priv = vm->privateData;
8463 8464
    int client_sock = -1;
    int qemu_sock = -1;
C
Chris Lalancette 已提交
8465 8466
    struct sockaddr_un sa_qemu, sa_client;
    socklen_t addrlen;
8467
    virDomainPtr ddomain = NULL;
C
Chris Lalancette 已提交
8468
    int retval = -1;
8469
    virStreamPtr st = NULL;
C
Chris Lalancette 已提交
8470 8471
    char *unixfile = NULL;
    int internalret;
8472
    unsigned long long qemuCmdFlags;
C
Chris Lalancette 已提交
8473 8474
    int status;
    unsigned long long transferred, remaining, total;
8475
    unsigned int background_flags = QEMU_MONITOR_MIGRATE_BACKGROUND;
C
Chris Lalancette 已提交
8476

8477 8478 8479 8480 8481 8482 8483 8484
    /*
     * The order of operations is important here to avoid touching
     * the source VM until we are very sure we can successfully
     * start the migration operation.
     *
     *   1. setup local support infrastructure (eg sockets)
     *   2. setup destination fully
     *   3. start migration on source
C
Chris Lalancette 已提交
8485 8486
     */

8487

8488
    /* Stage 1. setup local support infrastructure */
C
Chris Lalancette 已提交
8489 8490

    if (virAsprintf(&unixfile, "%s/qemu.tunnelmigrate.src.%s",
8491
                    driver->libDir, vm->def->name) < 0) {
8492
        virReportOOMError();
8493
        goto cleanup;
C
Chris Lalancette 已提交
8494 8495 8496 8497
    }

    qemu_sock = socket(AF_UNIX, SOCK_STREAM, 0);
    if (qemu_sock < 0) {
8498
        virReportSystemError(errno, "%s",
C
Chris Lalancette 已提交
8499
                             _("cannot open tunnelled migration socket"));
8500
        goto cleanup;
C
Chris Lalancette 已提交
8501 8502 8503 8504 8505
    }
    memset(&sa_qemu, 0, sizeof(sa_qemu));
    sa_qemu.sun_family = AF_UNIX;
    if (virStrcpy(sa_qemu.sun_path, unixfile,
                  sizeof(sa_qemu.sun_path)) == NULL) {
8506 8507 8508
        qemuReportError(VIR_ERR_INTERNAL_ERROR,
                        _("Unix socket '%s' too big for destination"),
                        unixfile);
8509
        goto cleanup;
C
Chris Lalancette 已提交
8510 8511 8512
    }
    unlink(unixfile);
    if (bind(qemu_sock, (struct sockaddr *)&sa_qemu, sizeof(sa_qemu)) < 0) {
8513
        virReportSystemError(errno,
C
Chris Lalancette 已提交
8514 8515
                             _("Cannot bind to unix socket '%s' for tunnelled migration"),
                             unixfile);
8516
        goto cleanup;
C
Chris Lalancette 已提交
8517 8518
    }
    if (listen(qemu_sock, 1) < 0) {
8519
        virReportSystemError(errno,
C
Chris Lalancette 已提交
8520 8521
                             _("Cannot listen on unix socket '%s' for tunnelled migration"),
                             unixfile);
8522
        goto cleanup;
C
Chris Lalancette 已提交
8523 8524
    }

8525 8526 8527 8528 8529 8530 8531
    if (chown(unixfile, qemu_driver->user, qemu_driver->group) < 0) {
        virReportSystemError(errno,
                             _("Cannot change unix socket '%s' owner"),
                             unixfile);
        goto cleanup;
    }

C
Chris Lalancette 已提交
8532
    /* check that this qemu version supports the unix migration */
8533
    if (qemuCapsExtractVersionInfo(vm->def->emulator, NULL, &qemuCmdFlags) < 0) {
8534 8535 8536
        qemuReportError(VIR_ERR_INTERNAL_ERROR,
                        _("Cannot extract Qemu version from '%s'"),
                        vm->def->emulator);
8537 8538 8539 8540 8541
        goto cleanup;
    }

    if (!(qemuCmdFlags & QEMUD_CMD_FLAG_MIGRATE_QEMU_UNIX) &&
        !(qemuCmdFlags & QEMUD_CMD_FLAG_MIGRATE_QEMU_EXEC)) {
8542 8543
        qemuReportError(VIR_ERR_OPERATION_FAILED,
                        "%s", _("Source qemu is too old to support tunnelled migration"));
8544
        goto cleanup;
C
Chris Lalancette 已提交
8545
    }
8546 8547 8548 8549 8550 8551 8552 8553 8554 8555 8556 8557


    /* Stage 2. setup destination fully
     *
     * Once stage 2 has completed successfully, we *must* call finish
     * to cleanup the target whether we succeed or fail
     */
    st = virStreamNew(dconn, 0);
    if (st == NULL)
        /* virStreamNew only fails on OOM, and it reports the error itself */
        goto cleanup;

8558
    qemuDomainObjEnterRemoteWithDriver(driver, vm);
8559 8560 8561
    internalret = dconn->driver->domainMigratePrepareTunnel(dconn, st,
                                                            flags, dname,
                                                            resource, dom_xml);
8562
    qemuDomainObjExitRemoteWithDriver(driver, vm);
8563 8564 8565 8566 8567

    if (internalret < 0)
        /* domainMigratePrepareTunnel sets the error for us */
        goto cleanup;

8568 8569 8570 8571 8572 8573 8574 8575 8576
    /* the domain may have shutdown or crashed while we had the locks dropped
     * in qemuDomainObjEnterRemoteWithDriver, so check again
     */
    if (!virDomainObjIsActive(vm)) {
        qemuReportError(VIR_ERR_INTERNAL_ERROR, "%s",
                        _("guest unexpectedly quit"));
        goto cleanup;
    }

8577
    /*   3. start migration on source */
8578
    qemuDomainObjEnterMonitorWithDriver(driver, vm);
8579 8580 8581 8582 8583 8584 8585 8586
    if (flags & VIR_MIGRATE_NON_SHARED_DISK)
        background_flags |= QEMU_MONITOR_MIGRATE_NON_SHARED_DISK;
    if (flags & VIR_MIGRATE_NON_SHARED_INC)
        background_flags |= QEMU_MONITOR_MIGRATE_NON_SHARED_INC;
    if (qemuCmdFlags & QEMUD_CMD_FLAG_MIGRATE_QEMU_UNIX){
        internalret = qemuMonitorMigrateToUnix(priv->mon, background_flags,
                                               unixfile);
    }
C
Chris Lalancette 已提交
8587 8588
    else if (qemuCmdFlags & QEMUD_CMD_FLAG_MIGRATE_QEMU_EXEC) {
        const char *args[] = { "nc", "-U", unixfile, NULL };
8589
        internalret = qemuMonitorMigrateToCommand(priv->mon, QEMU_MONITOR_MIGRATE_BACKGROUND, args);
8590 8591
    } else {
        internalret = -1;
C
Chris Lalancette 已提交
8592
    }
8593
    qemuDomainObjExitMonitorWithDriver(driver, vm);
C
Chris Lalancette 已提交
8594
    if (internalret < 0) {
8595 8596
        qemuReportError(VIR_ERR_OPERATION_FAILED,
                        "%s", _("tunnelled migration monitor command failed"));
8597
        goto finish;
C
Chris Lalancette 已提交
8598 8599
    }

8600 8601 8602 8603 8604 8605
    if (!virDomainObjIsActive(vm)) {
        qemuReportError(VIR_ERR_INTERNAL_ERROR, "%s",
                        _("guest unexpectedly quit"));
        goto cleanup;
    }

8606 8607 8608
    /* From this point onwards we *must* call cancel to abort the
     * migration on source if anything goes wrong */

C
Chris Lalancette 已提交
8609 8610 8611
    /* it is also possible that the migrate didn't fail initially, but
     * rather failed later on.  Check the output of "info migrate"
     */
8612
    qemuDomainObjEnterMonitorWithDriver(driver, vm);
8613 8614
    if (qemuMonitorGetMigrationStatus(priv->mon,
                                      &status,
C
Chris Lalancette 已提交
8615 8616 8617
                                      &transferred,
                                      &remaining,
                                      &total) < 0) {
8618
        qemuDomainObjExitMonitorWithDriver(driver, vm);
8619
        goto cancel;
C
Chris Lalancette 已提交
8620
    }
8621
    qemuDomainObjExitMonitorWithDriver(driver, vm);
C
Chris Lalancette 已提交
8622 8623

    if (status == QEMU_MONITOR_MIGRATION_STATUS_ERROR) {
8624 8625
        qemuReportError(VIR_ERR_OPERATION_FAILED,
                        "%s",_("migrate failed"));
8626
        goto cancel;
C
Chris Lalancette 已提交
8627 8628 8629 8630 8631 8632
    }

    addrlen = sizeof(sa_client);
    while ((client_sock = accept(qemu_sock, (struct sockaddr *)&sa_client, &addrlen)) < 0) {
        if (errno == EAGAIN || errno == EINTR)
            continue;
8633
        virReportSystemError(errno, "%s",
C
Chris Lalancette 已提交
8634
                             _("tunnelled migration failed to accept from qemu"));
8635
        goto cancel;
C
Chris Lalancette 已提交
8636 8637
    }

8638
    retval = doTunnelSendAll(st, client_sock);
8639

8640
cancel:
8641
    if (retval != 0 && virDomainObjIsActive(vm)) {
8642
        qemuDomainObjEnterMonitorWithDriver(driver, vm);
8643
        qemuMonitorMigrateCancel(priv->mon);
8644
        qemuDomainObjExitMonitorWithDriver(driver, vm);
8645
    }
C
Chris Lalancette 已提交
8646

8647
finish:
C
Chris Lalancette 已提交
8648
    dname = dname ? dname : dom->name;
8649
    qemuDomainObjEnterRemoteWithDriver(driver, vm);
C
Chris Lalancette 已提交
8650 8651
    ddomain = dconn->driver->domainMigrateFinish2
        (dconn, dname, NULL, 0, uri, flags, retval);
8652
    qemuDomainObjExitRemoteWithDriver(driver, vm);
8653 8654

cleanup:
8655 8656
    VIR_FORCE_CLOSE(client_sock);
    VIR_FORCE_CLOSE(qemu_sock);
8657

C
Chris Lalancette 已提交
8658 8659 8660
    if (ddomain)
        virUnrefDomain(ddomain);

8661 8662 8663 8664
    if (unixfile) {
        unlink(unixfile);
        VIR_FREE(unixfile);
    }
C
Chris Lalancette 已提交
8665

8666 8667 8668
    if (st)
        /* don't call virStreamFree(), because that resets any pending errors */
        virUnrefStream(st);
8669 8670 8671 8672
    return retval;
}


8673 8674 8675 8676
/* This is essentially a simplified re-impl of
 * virDomainMigrateVersion2 from libvirt.c, but running in source
 * libvirtd context, instead of client app context */
static int doNonTunnelMigrate(virDomainPtr dom,
8677
                              struct qemud_driver *driver,
8678 8679 8680 8681 8682 8683 8684 8685 8686 8687 8688
                              virConnectPtr dconn,
                              virDomainObjPtr vm,
                              const char *dom_xml,
                              const char *uri ATTRIBUTE_UNUSED,
                              unsigned long flags,
                              const char *dname,
                              unsigned long resource)
{
    virDomainPtr ddomain = NULL;
    int retval = -1;
    char *uri_out = NULL;
8689
    int rc;
8690

8691
    qemuDomainObjEnterRemoteWithDriver(driver, vm);
8692 8693
    /* NB we don't pass 'uri' into this, since that's the libvirtd
     * URI in this context - so we let dest pick it */
8694 8695 8696 8697 8698 8699 8700 8701 8702
    rc = dconn->driver->domainMigratePrepare2(dconn,
                                              NULL, /* cookie */
                                              0, /* cookielen */
                                              NULL, /* uri */
                                              &uri_out,
                                              flags, dname,
                                              resource, dom_xml);
    qemuDomainObjExitRemoteWithDriver(driver, vm);
    if (rc < 0)
8703 8704 8705
        /* domainMigratePrepare2 sets the error for us */
        goto cleanup;

8706 8707 8708 8709 8710 8711 8712 8713 8714
    /* the domain may have shutdown or crashed while we had the locks dropped
     * in qemuDomainObjEnterRemoteWithDriver, so check again
     */
    if (!virDomainObjIsActive(vm)) {
        qemuReportError(VIR_ERR_INTERNAL_ERROR, "%s",
                        _("guest unexpectedly quit"));
        goto cleanup;
    }

8715
    if (uri_out == NULL) {
8716 8717
        qemuReportError(VIR_ERR_INTERNAL_ERROR, "%s",
                        _("domainMigratePrepare2 did not set uri"));
8718
        goto cleanup;
8719 8720
    }

8721
    if (doNativeMigrate(driver, vm, uri_out, flags, dname, resource) < 0)
8722 8723 8724 8725 8726 8727
        goto finish;

    retval = 0;

finish:
    dname = dname ? dname : dom->name;
8728
    qemuDomainObjEnterRemoteWithDriver(driver, vm);
8729 8730
    ddomain = dconn->driver->domainMigrateFinish2
        (dconn, dname, NULL, 0, uri_out, flags, retval);
8731
    qemuDomainObjExitRemoteWithDriver(driver, vm);
8732 8733 8734 8735 8736 8737 8738 8739 8740

    if (ddomain)
        virUnrefDomain(ddomain);

cleanup:
    return retval;
}


8741
static int doPeer2PeerMigrate(virDomainPtr dom,
8742
                              struct qemud_driver *driver,
8743 8744 8745 8746 8747 8748 8749 8750 8751
                              virDomainObjPtr vm,
                              const char *uri,
                              unsigned long flags,
                              const char *dname,
                              unsigned long resource)
{
    int ret = -1;
    virConnectPtr dconn = NULL;
    char *dom_xml;
8752
    bool p2p;
8753 8754 8755 8756 8757

    /* the order of operations is important here; we make sure the
     * destination side is completely setup before we touch the source
     */

8758
    qemuDomainObjEnterRemoteWithDriver(driver, vm);
8759
    dconn = virConnectOpen(uri);
8760
    qemuDomainObjExitRemoteWithDriver(driver, vm);
8761
    if (dconn == NULL) {
8762 8763
        qemuReportError(VIR_ERR_OPERATION_FAILED,
                        _("Failed to connect to remote libvirt URI %s"), uri);
8764 8765
        return -1;
    }
8766 8767 8768 8769 8770 8771

    qemuDomainObjEnterRemoteWithDriver(driver, vm);
    p2p = VIR_DRV_SUPPORTS_FEATURE(dconn->driver, dconn,
                                   VIR_DRV_FEATURE_MIGRATION_P2P);
    qemuDomainObjExitRemoteWithDriver(driver, vm);
    if (!p2p) {
8772 8773
        qemuReportError(VIR_ERR_OPERATION_FAILED, "%s",
                        _("Destination libvirt does not support peer-to-peer migration protocol"));
8774 8775 8776
        goto cleanup;
    }

8777 8778 8779 8780 8781 8782 8783
    /* domain may have been stopped while we were talking to remote daemon */
    if (!virDomainObjIsActive(vm)) {
        qemuReportError(VIR_ERR_INTERNAL_ERROR, "%s",
                        _("guest unexpectedly quit"));
        goto cleanup;
    }

8784 8785 8786
    dom_xml = qemudVMDumpXML(driver, vm,
                             VIR_DOMAIN_XML_SECURE |
                             VIR_DOMAIN_XML_UPDATE_CPU);
8787
    if (!dom_xml) {
8788 8789
        qemuReportError(VIR_ERR_OPERATION_FAILED,
                        "%s", _("failed to get domain xml"));
8790 8791 8792
        goto cleanup;
    }

8793
    if (flags & VIR_MIGRATE_TUNNELLED)
8794
        ret = doTunnelMigrate(dom, driver, dconn, vm, dom_xml, uri, flags, dname, resource);
8795
    else
8796
        ret = doNonTunnelMigrate(dom, driver, dconn, vm, dom_xml, uri, flags, dname, resource);
8797 8798 8799

cleanup:
    VIR_FREE(dom_xml);
C
Chris Lalancette 已提交
8800
    /* don't call virConnectClose(), because that resets any pending errors */
8801
    qemuDomainObjEnterRemoteWithDriver(driver, vm);
C
Chris Lalancette 已提交
8802
    virUnrefConnect(dconn);
8803
    qemuDomainObjExitRemoteWithDriver(driver, vm);
C
Chris Lalancette 已提交
8804

8805
    return ret;
D
Daniel Veillard 已提交
8806 8807
}

8808

D
Daniel Veillard 已提交
8809 8810 8811 8812 8813 8814
/* Perform is the second step, and it runs on the source host. */
static int
qemudDomainMigratePerform (virDomainPtr dom,
                           const char *cookie ATTRIBUTE_UNUSED,
                           int cookielen ATTRIBUTE_UNUSED,
                           const char *uri,
8815
                           unsigned long flags,
8816
                           const char *dname,
D
Daniel Veillard 已提交
8817 8818
                           unsigned long resource)
{
8819 8820
    struct qemud_driver *driver = dom->conn->privateData;
    virDomainObjPtr vm;
8821
    virDomainEventPtr event = NULL;
8822
    int ret = -1;
8823
    int resume = 0;
8824
    qemuDomainObjPrivatePtr priv;
D
Daniel Veillard 已提交
8825

C
Chris Lalancette 已提交
8826 8827 8828 8829 8830 8831 8832 8833 8834
    virCheckFlags(VIR_MIGRATE_LIVE |
                  VIR_MIGRATE_PEER2PEER |
                  VIR_MIGRATE_TUNNELLED |
                  VIR_MIGRATE_PERSIST_DEST |
                  VIR_MIGRATE_UNDEFINE_SOURCE |
                  VIR_MIGRATE_PAUSED |
                  VIR_MIGRATE_NON_SHARED_DISK |
                  VIR_MIGRATE_NON_SHARED_INC, -1);

8835
    qemuDriverLock(driver);
8836
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
D
Daniel Veillard 已提交
8837
    if (!vm) {
8838 8839
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
8840 8841
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
8842
        goto cleanup;
D
Daniel Veillard 已提交
8843
    }
8844
    priv = vm->privateData;
D
Daniel Veillard 已提交
8845

8846 8847
    if (qemuDomainObjBeginJobWithDriver(driver, vm) < 0)
        goto cleanup;
8848
    priv->jobActive = QEMU_JOB_MIGRATION_OUT;
8849

D
Daniel P. Berrange 已提交
8850
    if (!virDomainObjIsActive(vm)) {
8851 8852
        qemuReportError(VIR_ERR_OPERATION_INVALID,
                        "%s", _("domain is not running"));
8853
        goto endjob;
D
Daniel Veillard 已提交
8854 8855
    }

8856 8857 8858
    memset(&priv->jobInfo, 0, sizeof(priv->jobInfo));
    priv->jobInfo.type = VIR_DOMAIN_JOB_UNBOUNDED;

8859
    resume = vm->state == VIR_DOMAIN_RUNNING;
8860
    if (!(flags & VIR_MIGRATE_LIVE) && vm->state == VIR_DOMAIN_RUNNING) {
8861
        if (qemuDomainMigrateOffline(driver, vm) < 0)
8862
            goto endjob;
8863 8864
    }

8865
    if ((flags & (VIR_MIGRATE_TUNNELLED | VIR_MIGRATE_PEER2PEER))) {
8866
        if (doPeer2PeerMigrate(dom, driver, vm, uri, flags, dname, resource) < 0)
8867
            /* doPeer2PeerMigrate already set the error, so just get out */
8868
            goto endjob;
8869
    } else {
8870
        if (doNativeMigrate(driver, vm, uri, flags, dname, resource) < 0)
8871
            goto endjob;
8872 8873
    }

D
Daniel Veillard 已提交
8874
    /* Clean up the source domain. */
8875
    qemudShutdownVMDaemon(driver, vm, 1);
8876
    qemuDomainStopAudit(vm, "migrated");
8877
    resume = 0;
8878 8879 8880 8881

    event = virDomainEventNewFromObj(vm,
                                     VIR_DOMAIN_EVENT_STOPPED,
                                     VIR_DOMAIN_EVENT_STOPPED_MIGRATED);
C
Chris Lalancette 已提交
8882
    if (!vm->persistent || (flags & VIR_MIGRATE_UNDEFINE_SOURCE)) {
8883
        virDomainDeleteConfig(driver->configDir, driver->autostartDir, vm);
8884 8885
        if (qemuDomainObjEndJob(vm) > 0)
            virDomainRemoveInactive(&driver->domains, vm);
8886 8887
        vm = NULL;
    }
8888
    ret = 0;
D
Daniel Veillard 已提交
8889

8890
endjob:
8891
    if (resume && vm->state == VIR_DOMAIN_PAUSED) {
8892
        /* we got here through some sort of failure; start the domain again */
H
Hu Tao 已提交
8893
        if (doStartCPUs(driver, vm, dom->conn) < 0) {
8894 8895 8896 8897
            /* Hm, we already know we are in error here.  We don't want to
             * overwrite the previous error, though, so we just throw something
             * to the logs and hope for the best
             */
8898
            VIR_ERROR(_("Failed to resume guest %s after failure"),
8899
                      vm->def->name);
8900 8901 8902 8903 8904 8905
        }

        event = virDomainEventNewFromObj(vm,
                                         VIR_DOMAIN_EVENT_RESUMED,
                                         VIR_DOMAIN_EVENT_RESUMED_MIGRATED);
    }
8906 8907 8908
    if (vm &&
        qemuDomainObjEndJob(vm) == 0)
        vm = NULL;
8909

8910
cleanup:
8911 8912
    if (vm)
        virDomainObjUnlock(vm);
8913 8914
    if (event)
        qemuDomainEventQueue(driver, event);
8915
    qemuDriverUnlock(driver);
8916
    return ret;
D
Daniel Veillard 已提交
8917 8918
}

8919
#if WITH_MACVTAP
8920 8921 8922 8923 8924 8925 8926 8927 8928 8929 8930 8931 8932 8933 8934 8935 8936 8937 8938 8939 8940 8941 8942 8943 8944 8945 8946 8947 8948 8949 8950 8951 8952 8953
static void
qemudVPAssociatePortProfiles(virDomainDefPtr def) {
    int i;
    int last_good_net = -1;
    virDomainNetDefPtr net;

    for (i = 0; i < def->nnets; i++) {
        net = def->nets[i];
        if (net->type == VIR_DOMAIN_NET_TYPE_DIRECT) {
            if (vpAssociatePortProfileId(net->ifname,
                                         net->mac,
                                         net->data.direct.linkdev,
                                         &net->data.direct.virtPortProfile,
                                         def->uuid,
                                         VIR_VM_OP_MIGRATE_IN_FINISH) != 0)
                goto err_exit;
        }
        last_good_net = i;
    }

    return;

err_exit:
    for (i = 0; i < last_good_net; i++) {
        net = def->nets[i];
        if (net->type == VIR_DOMAIN_NET_TYPE_DIRECT) {
            vpDisassociatePortProfileId(net->ifname,
                                        net->mac,
                                        net->data.direct.linkdev,
                                        &net->data.direct.virtPortProfile,
                                        VIR_VM_OP_MIGRATE_IN_FINISH);
        }
    }
}
8954 8955 8956 8957
#else /* !WITH_MACVTAP */
static void
qemudVPAssociatePortProfiles(virDomainDefPtr def ATTRIBUTE_UNUSED) { }
#endif /* WITH_MACVTAP */
8958

D
Daniel Veillard 已提交
8959 8960 8961 8962 8963 8964 8965
/* Finish is the third and final step, and it runs on the destination host. */
static virDomainPtr
qemudDomainMigrateFinish2 (virConnectPtr dconn,
                           const char *dname,
                           const char *cookie ATTRIBUTE_UNUSED,
                           int cookielen ATTRIBUTE_UNUSED,
                           const char *uri ATTRIBUTE_UNUSED,
C
Chris Lalancette 已提交
8966
                           unsigned long flags,
D
Daniel Veillard 已提交
8967 8968
                           int retcode)
{
8969 8970 8971
    struct qemud_driver *driver = dconn->privateData;
    virDomainObjPtr vm;
    virDomainPtr dom = NULL;
8972
    virDomainEventPtr event = NULL;
8973
    virErrorPtr orig_err;
C
Chris Lalancette 已提交
8974
    int newVM = 1;
8975
    qemuDomainObjPrivatePtr priv = NULL;
D
Daniel Veillard 已提交
8976

C
Chris Lalancette 已提交
8977 8978 8979 8980 8981 8982 8983 8984 8985
    virCheckFlags(VIR_MIGRATE_LIVE |
                  VIR_MIGRATE_PEER2PEER |
                  VIR_MIGRATE_TUNNELLED |
                  VIR_MIGRATE_PERSIST_DEST |
                  VIR_MIGRATE_UNDEFINE_SOURCE |
                  VIR_MIGRATE_PAUSED |
                  VIR_MIGRATE_NON_SHARED_DISK |
                  VIR_MIGRATE_NON_SHARED_INC, NULL);

8986 8987 8988
    /* Migration failed. Save the current error so nothing squashes it */
    orig_err = virSaveLastError();

8989
    qemuDriverLock(driver);
8990
    vm = virDomainFindByName(&driver->domains, dname);
D
Daniel Veillard 已提交
8991
    if (!vm) {
8992 8993
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching name '%s'"), dname);
8994
        goto cleanup;
D
Daniel Veillard 已提交
8995 8996
    }

8997 8998 8999 9000 9001 9002 9003 9004 9005
    priv = vm->privateData;
    if (priv->jobActive != QEMU_JOB_MIGRATION_IN) {
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("domain '%s' is not processing incoming migration"), dname);
        goto cleanup;
    }
    priv->jobActive = QEMU_JOB_NONE;
    memset(&priv->jobInfo, 0, sizeof(priv->jobInfo));

9006 9007 9008
    if (qemuDomainObjBeginJobWithDriver(driver, vm) < 0)
        goto cleanup;

D
Daniel Veillard 已提交
9009 9010 9011 9012
    /* Did the migration go as planned?  If yes, return the domain
     * object, but if no, clean up the empty qemu process.
     */
    if (retcode == 0) {
9013 9014 9015 9016 9017 9018
        if (!virDomainObjIsActive(vm)) {
            qemuReportError(VIR_ERR_INTERNAL_ERROR, "%s",
                            _("guest unexpectedly quit"));
            goto cleanup;
        }

9019 9020
        qemudVPAssociatePortProfiles(vm->def);

C
Chris Lalancette 已提交
9021 9022 9023 9024 9025
        if (flags & VIR_MIGRATE_PERSIST_DEST) {
            if (vm->persistent)
                newVM = 0;
            vm->persistent = 1;

9026
            if (virDomainSaveConfig(driver->configDir, vm->def) < 0) {
C
Chris Lalancette 已提交
9027 9028 9029 9030 9031 9032 9033 9034 9035 9036
                /* Hmpf.  Migration was successful, but making it persistent
                 * was not.  If we report successful, then when this domain
                 * shuts down, management tools are in for a surprise.  On the
                 * other hand, if we report failure, then the management tools
                 * might try to restart the domain on the source side, even
                 * though the domain is actually running on the destination.
                 * Return a NULL dom pointer, and hope that this is a rare
                 * situation and management tools are smart.
                 */
                vm = NULL;
9037
                goto endjob;
C
Chris Lalancette 已提交
9038 9039 9040 9041 9042 9043 9044 9045 9046
            }

            event = virDomainEventNewFromObj(vm,
                                             VIR_DOMAIN_EVENT_DEFINED,
                                             newVM ?
                                             VIR_DOMAIN_EVENT_DEFINED_ADDED :
                                             VIR_DOMAIN_EVENT_DEFINED_UPDATED);
            if (event)
                qemuDomainEventQueue(driver, event);
9047
            event = NULL;
C
Chris Lalancette 已提交
9048 9049

        }
D
Daniel Veillard 已提交
9050
        dom = virGetDomain (dconn, vm->def->name, vm->def->uuid);
9051

9052 9053 9054 9055 9056
        if (!(flags & VIR_MIGRATE_PAUSED)) {
            /* run 'cont' on the destination, which allows migration on qemu
             * >= 0.10.6 to work properly.  This isn't strictly necessary on
             * older qemu's, but it also doesn't hurt anything there
             */
H
Hu Tao 已提交
9057
            if (doStartCPUs(driver, vm, dconn) < 0) {
9058
                if (virGetLastError() == NULL)
9059 9060
                    qemuReportError(VIR_ERR_INTERNAL_ERROR,
                                    "%s", _("resume operation failed"));
9061 9062
                goto endjob;
            }
9063 9064
        }

9065 9066 9067
        event = virDomainEventNewFromObj(vm,
                                         VIR_DOMAIN_EVENT_RESUMED,
                                         VIR_DOMAIN_EVENT_RESUMED_MIGRATED);
9068 9069 9070 9071 9072 9073
        if (vm->state == VIR_DOMAIN_PAUSED) {
            qemuDomainEventQueue(driver, event);
            event = virDomainEventNewFromObj(vm,
                                             VIR_DOMAIN_EVENT_SUSPENDED,
                                             VIR_DOMAIN_EVENT_SUSPENDED_PAUSED);
        }
9074 9075 9076 9077
        if (virDomainSaveStatus(driver->caps, driver->stateDir, vm) < 0) {
            VIR_WARN("Failed to save status on vm %s", vm->def->name);
            goto endjob;
        }
D
Daniel Veillard 已提交
9078
    } else {
9079
        qemudShutdownVMDaemon(driver, vm, 1);
9080
        qemuDomainStopAudit(vm, "failed");
9081 9082 9083
        event = virDomainEventNewFromObj(vm,
                                         VIR_DOMAIN_EVENT_STOPPED,
                                         VIR_DOMAIN_EVENT_STOPPED_FAILED);
9084
        if (!vm->persistent) {
9085 9086
            if (qemuDomainObjEndJob(vm) > 0)
                virDomainRemoveInactive(&driver->domains, vm);
9087 9088
            vm = NULL;
        }
D
Daniel Veillard 已提交
9089
    }
9090

9091
endjob:
9092 9093 9094
    if (vm &&
        qemuDomainObjEndJob(vm) == 0)
        vm = NULL;
9095

9096
cleanup:
9097 9098 9099 9100
    if (orig_err) {
        virSetError(orig_err);
        virFreeError(orig_err);
    }
9101 9102
    if (vm)
        virDomainObjUnlock(vm);
9103 9104
    if (event)
        qemuDomainEventQueue(driver, event);
9105
    qemuDriverUnlock(driver);
9106
    return dom;
D
Daniel Veillard 已提交
9107 9108
}

9109 9110 9111 9112 9113 9114 9115 9116 9117 9118 9119 9120 9121 9122 9123 9124
static int
qemudNodeDeviceGetPciInfo (virNodeDevicePtr dev,
                           unsigned *domain,
                           unsigned *bus,
                           unsigned *slot,
                           unsigned *function)
{
    virNodeDeviceDefPtr def = NULL;
    virNodeDevCapsDefPtr cap;
    char *xml = NULL;
    int ret = -1;

    xml = virNodeDeviceGetXMLDesc(dev, 0);
    if (!xml)
        goto out;

9125
    def = virNodeDeviceDefParseString(xml, EXISTING_DEVICE);
9126 9127 9128 9129 9130 9131 9132 9133 9134 9135 9136 9137 9138 9139 9140 9141 9142
    if (!def)
        goto out;

    cap = def->caps;
    while (cap) {
        if (cap->type == VIR_NODE_DEV_CAP_PCI_DEV) {
            *domain   = cap->data.pci_dev.domain;
            *bus      = cap->data.pci_dev.bus;
            *slot     = cap->data.pci_dev.slot;
            *function = cap->data.pci_dev.function;
            break;
        }

        cap = cap->next;
    }

    if (!cap) {
9143 9144
        qemuReportError(VIR_ERR_INVALID_ARG,
                        _("device %s is not a PCI device"), dev->name);
9145 9146 9147 9148 9149 9150 9151 9152 9153 9154 9155 9156 9157
        goto out;
    }

    ret = 0;
out:
    virNodeDeviceDefFree(def);
    VIR_FREE(xml);
    return ret;
}

static int
qemudNodeDeviceDettach (virNodeDevicePtr dev)
{
9158
    struct qemud_driver *driver = dev->conn->privateData;
9159 9160 9161 9162 9163 9164 9165
    pciDevice *pci;
    unsigned domain, bus, slot, function;
    int ret = -1;

    if (qemudNodeDeviceGetPciInfo(dev, &domain, &bus, &slot, &function) < 0)
        return -1;

9166
    pci = pciGetDevice(domain, bus, slot, function);
9167 9168 9169
    if (!pci)
        return -1;

9170 9171
    qemuDriverLock(driver);
    if (pciDettachDevice(pci, driver->activePciHostdevs) < 0)
9172 9173 9174 9175
        goto out;

    ret = 0;
out:
9176
    qemuDriverUnlock(driver);
9177
    pciFreeDevice(pci);
9178 9179 9180 9181 9182 9183
    return ret;
}

static int
qemudNodeDeviceReAttach (virNodeDevicePtr dev)
{
9184
    struct qemud_driver *driver = dev->conn->privateData;
9185 9186 9187 9188 9189 9190 9191
    pciDevice *pci;
    unsigned domain, bus, slot, function;
    int ret = -1;

    if (qemudNodeDeviceGetPciInfo(dev, &domain, &bus, &slot, &function) < 0)
        return -1;

9192
    pci = pciGetDevice(domain, bus, slot, function);
9193 9194 9195
    if (!pci)
        return -1;

9196 9197
    qemuDriverLock(driver);
    if (pciReAttachDevice(pci, driver->activePciHostdevs) < 0)
9198 9199 9200 9201
        goto out;

    ret = 0;
out:
9202
    qemuDriverUnlock(driver);
9203
    pciFreeDevice(pci);
9204 9205 9206 9207 9208 9209
    return ret;
}

static int
qemudNodeDeviceReset (virNodeDevicePtr dev)
{
9210
    struct qemud_driver *driver = dev->conn->privateData;
9211 9212 9213 9214 9215 9216 9217
    pciDevice *pci;
    unsigned domain, bus, slot, function;
    int ret = -1;

    if (qemudNodeDeviceGetPciInfo(dev, &domain, &bus, &slot, &function) < 0)
        return -1;

9218
    pci = pciGetDevice(domain, bus, slot, function);
9219 9220 9221
    if (!pci)
        return -1;

9222 9223
    qemuDriverLock(driver);

9224
    if (pciResetDevice(pci, driver->activePciHostdevs, NULL) < 0)
9225 9226 9227 9228
        goto out;

    ret = 0;
out:
9229
    qemuDriverUnlock(driver);
9230
    pciFreeDevice(pci);
9231 9232 9233
    return ret;
}

9234 9235 9236 9237 9238 9239 9240 9241 9242 9243 9244
static int
qemuCPUCompare(virConnectPtr conn,
               const char *xmlDesc,
               unsigned int flags ATTRIBUTE_UNUSED)
{
    struct qemud_driver *driver = conn->privateData;
    int ret = VIR_CPU_COMPARE_ERROR;

    qemuDriverLock(driver);

    if (!driver->caps || !driver->caps->host.cpu) {
9245 9246
        qemuReportError(VIR_ERR_NO_SUPPORT,
                        "%s", _("cannot get host CPU capabilities"));
9247 9248
    }
    else
9249
        ret = cpuCompareXML(driver->caps->host.cpu, xmlDesc);
9250 9251 9252 9253 9254 9255

    qemuDriverUnlock(driver);

    return ret;
}

9256

9257 9258 9259 9260 9261 9262 9263 9264 9265 9266 9267 9268 9269
static char *
qemuCPUBaseline(virConnectPtr conn ATTRIBUTE_UNUSED,
                const char **xmlCPUs,
                unsigned int ncpus,
                unsigned int flags ATTRIBUTE_UNUSED)
{
    char *cpu;

    cpu = cpuBaselineXML(xmlCPUs, ncpus, NULL, 0);

    return cpu;
}

9270 9271 9272 9273 9274 9275 9276 9277 9278 9279 9280 9281 9282 9283 9284 9285 9286 9287 9288 9289 9290 9291 9292

static int qemuDomainGetJobInfo(virDomainPtr dom,
                                virDomainJobInfoPtr info) {
    struct qemud_driver *driver = dom->conn->privateData;
    virDomainObjPtr vm;
    int ret = -1;
    qemuDomainObjPrivatePtr priv;

    qemuDriverLock(driver);
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
    qemuDriverUnlock(driver);
    if (!vm) {
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
        goto cleanup;
    }

    priv = vm->privateData;

    if (virDomainObjIsActive(vm)) {
        if (priv->jobActive) {
9293 9294
            struct timeval now;

9295
            memcpy(info, &priv->jobInfo, sizeof(*info));
9296 9297 9298 9299 9300 9301 9302 9303 9304 9305 9306

            /* Refresh elapsed time again just to ensure it
             * is fully updated. This is primarily for benefit
             * of incoming migration which we don't currently
             * monitor actively in the background thread
             */
            if (gettimeofday(&now, NULL) < 0) {
                virReportSystemError(errno, "%s",
                                     _("cannot get time of day"));
                goto cleanup;
            }
9307
            info->timeElapsed = timeval_to_ms(now) - priv->jobStart;
9308 9309 9310 9311 9312 9313 9314 9315 9316 9317 9318 9319 9320 9321 9322 9323 9324 9325 9326
        } else {
            memset(info, 0, sizeof(*info));
            info->type = VIR_DOMAIN_JOB_NONE;
        }
    } else {
        qemuReportError(VIR_ERR_OPERATION_INVALID,
                        "%s", _("domain is not running"));
        goto cleanup;
    }

    ret = 0;

cleanup:
    if (vm)
        virDomainObjUnlock(vm);
    return ret;
}


9327 9328 9329 9330 9331 9332 9333 9334 9335 9336 9337 9338 9339 9340 9341 9342 9343 9344 9345 9346 9347 9348
static int qemuDomainAbortJob(virDomainPtr dom) {
    struct qemud_driver *driver = dom->conn->privateData;
    virDomainObjPtr vm;
    int ret = -1;
    qemuDomainObjPrivatePtr priv;

    qemuDriverLock(driver);
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
    qemuDriverUnlock(driver);
    if (!vm) {
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
        goto cleanup;
    }

    priv = vm->privateData;

    if (virDomainObjIsActive(vm)) {
        if (priv->jobActive) {
            VIR_DEBUG("Requesting cancellation of job on vm %s", vm->def->name);
9349
            priv->jobSignals |= QEMU_JOB_SIGNAL_CANCEL;
9350 9351 9352 9353 9354 9355 9356 9357 9358 9359 9360 9361 9362 9363 9364 9365 9366 9367 9368 9369
        } else {
            qemuReportError(VIR_ERR_OPERATION_INVALID,
                            "%s", _("no job is active on the domain"));
            goto cleanup;
        }
    } else {
        qemuReportError(VIR_ERR_OPERATION_INVALID,
                        "%s", _("domain is not running"));
        goto cleanup;
    }

    ret = 0;

cleanup:
    if (vm)
        virDomainObjUnlock(vm);
    return ret;
}


9370 9371 9372 9373 9374 9375 9376 9377 9378 9379
static int
qemuDomainMigrateSetMaxDowntime(virDomainPtr dom,
                                unsigned long long downtime,
                                unsigned int flags)
{
    struct qemud_driver *driver = dom->conn->privateData;
    virDomainObjPtr vm;
    qemuDomainObjPrivatePtr priv;
    int ret = -1;

9380
    virCheckFlags(0, -1);
9381 9382 9383 9384 9385 9386 9387 9388 9389 9390 9391 9392 9393 9394 9395 9396 9397 9398 9399 9400

    qemuDriverLock(driver);
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);

    if (!vm) {
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(dom->uuid, uuidstr);
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
        goto cleanup;
    }

    if (!virDomainObjIsActive(vm)) {
        qemuReportError(VIR_ERR_OPERATION_INVALID,
                        "%s", _("domain is not running"));
        goto cleanup;
    }

    priv = vm->privateData;

9401
    if (priv->jobActive != QEMU_JOB_MIGRATION_OUT) {
9402 9403 9404 9405 9406 9407 9408 9409 9410 9411 9412 9413 9414 9415 9416 9417 9418
        qemuReportError(VIR_ERR_OPERATION_INVALID,
                        "%s", _("domain is not being migrated"));
        goto cleanup;
    }

    VIR_DEBUG("Requesting migration downtime change to %llums", downtime);
    priv->jobSignals |= QEMU_JOB_SIGNAL_MIGRATE_DOWNTIME;
    priv->jobSignalsData.migrateDowntime = downtime;
    ret = 0;

cleanup:
    if (vm)
        virDomainObjUnlock(vm);
    qemuDriverUnlock(driver);
    return ret;
}

C
Chris Lalancette 已提交
9419 9420 9421 9422 9423 9424 9425 9426 9427 9428 9429 9430 9431 9432
static char *qemuFindQemuImgBinary(void)
{
    char *ret;

    ret = virFindFileInPath("kvm-img");
    if (ret == NULL)
        ret = virFindFileInPath("qemu-img");
    if (ret == NULL)
        qemuReportError(VIR_ERR_INTERNAL_ERROR,
                        "%s", _("unable to find kvm-img or qemu-img"));

    return ret;
}

9433 9434 9435
static int qemuDomainSnapshotWriteMetadata(virDomainObjPtr vm,
                                           virDomainSnapshotObjPtr snapshot,
                                           char *snapshotDir)
C
Chris Lalancette 已提交
9436 9437 9438 9439 9440 9441 9442 9443 9444 9445
{
    int fd = -1;
    char *newxml = NULL;
    int ret = -1;
    char *snapDir = NULL;
    char *snapFile = NULL;
    int err;
    char uuidstr[VIR_UUID_STRING_BUFLEN];

    virUUIDFormat(vm->def->uuid, uuidstr);
9446
    newxml = virDomainSnapshotDefFormat(uuidstr, snapshot->def, 1);
C
Chris Lalancette 已提交
9447 9448 9449 9450 9451 9452 9453 9454 9455 9456 9457 9458 9459 9460 9461 9462
    if (newxml == NULL) {
        virReportOOMError();
        return -1;
    }

    if (virAsprintf(&snapDir, "%s/%s", snapshotDir, vm->def->name) < 0) {
        virReportOOMError();
        goto cleanup;
    }
    err = virFileMakePath(snapDir);
    if (err < 0) {
        virReportSystemError(err, _("cannot create snapshot directory '%s'"),
                             snapDir);
        goto cleanup;
    }

9463
    if (virAsprintf(&snapFile, "%s/%s.xml", snapDir, snapshot->def->name) < 0) {
C
Chris Lalancette 已提交
9464 9465 9466 9467 9468 9469 9470 9471 9472 9473 9474 9475 9476 9477 9478 9479 9480 9481 9482 9483 9484
        virReportOOMError();
        goto cleanup;
    }
    fd = open(snapFile, O_CREAT|O_TRUNC|O_WRONLY, S_IRUSR|S_IWUSR);
    if (fd < 0) {
        qemuReportError(VIR_ERR_OPERATION_FAILED,
                        _("failed to create snapshot file '%s'"), snapFile);
        goto cleanup;
    }
    if (safewrite(fd, newxml, strlen(newxml)) != strlen(newxml)) {
        virReportSystemError(errno, _("Failed to write snapshot data to %s"),
                             snapFile);
        goto cleanup;
    }

    ret = 0;

cleanup:
    VIR_FREE(snapFile);
    VIR_FREE(snapDir);
    VIR_FREE(newxml);
9485
    VIR_FORCE_CLOSE(fd);
C
Chris Lalancette 已提交
9486 9487 9488
    return ret;
}

9489 9490
static int qemuDomainSnapshotSetCurrentActive(virDomainObjPtr vm,
                                              char *snapshotDir)
C
Chris Lalancette 已提交
9491 9492 9493 9494
{
    if (vm->current_snapshot) {
        vm->current_snapshot->def->active = 1;

9495 9496
        return qemuDomainSnapshotWriteMetadata(vm, vm->current_snapshot,
                                               snapshotDir);
C
Chris Lalancette 已提交
9497 9498 9499 9500 9501
    }

    return 0;
}

9502 9503
static int qemuDomainSnapshotSetCurrentInactive(virDomainObjPtr vm,
                                                char *snapshotDir)
C
Chris Lalancette 已提交
9504 9505 9506 9507
{
    if (vm->current_snapshot) {
        vm->current_snapshot->def->active = 0;

9508 9509
        return qemuDomainSnapshotWriteMetadata(vm, vm->current_snapshot,
                                               snapshotDir);
C
Chris Lalancette 已提交
9510 9511 9512 9513 9514 9515 9516 9517 9518 9519 9520 9521 9522 9523 9524 9525 9526 9527 9528
    }

    return 0;
}


static int qemuDomainSnapshotIsAllowed(virDomainObjPtr vm)
{
    int i;

    /* FIXME: we need to figure out what else here might succeed; in
     * particular, if it's a raw device but on LVM, we could probably make
     * that succeed as well
     */
    for (i = 0; i < vm->def->ndisks; i++) {
        if (vm->def->disks[i]->device == VIR_DOMAIN_DISK_DEVICE_DISK &&
            (!vm->def->disks[i]->driverType ||
             STRNEQ(vm->def->disks[i]->driverType, "qcow2"))) {
            qemuReportError(VIR_ERR_OPERATION_INVALID,
9529 9530
                            _("Disk '%s' does not support snapshotting"),
                            vm->def->disks[i]->src);
C
Chris Lalancette 已提交
9531 9532 9533 9534 9535 9536 9537 9538 9539
            return 0;
        }
    }

    return 1;
}

static virDomainSnapshotPtr qemuDomainSnapshotCreateXML(virDomainPtr domain,
                                                        const char *xmlDesc,
9540
                                                        unsigned int flags)
C
Chris Lalancette 已提交
9541 9542 9543 9544 9545 9546 9547 9548 9549 9550
{
    struct qemud_driver *driver = domain->conn->privateData;
    virDomainObjPtr vm = NULL;
    virDomainSnapshotObjPtr snap = NULL;
    virDomainSnapshotPtr snapshot = NULL;
    char uuidstr[VIR_UUID_STRING_BUFLEN];
    virDomainSnapshotDefPtr def;
    const char *qemuimgarg[] = { NULL, "snapshot", "-c", NULL, NULL, NULL };
    int i;

9551 9552
    virCheckFlags(0, NULL);

C
Chris Lalancette 已提交
9553 9554 9555 9556 9557 9558 9559 9560 9561 9562 9563 9564 9565 9566 9567 9568 9569 9570 9571 9572 9573 9574 9575 9576 9577 9578 9579 9580 9581 9582 9583 9584 9585 9586 9587 9588 9589 9590 9591 9592 9593 9594 9595 9596 9597 9598 9599 9600 9601 9602 9603 9604 9605 9606 9607 9608 9609 9610 9611 9612 9613
    qemuDriverLock(driver);
    virUUIDFormat(domain->uuid, uuidstr);
    vm = virDomainFindByUUID(&driver->domains, domain->uuid);
    if (!vm) {
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
        goto cleanup;
    }

    /* in a perfect world, we would allow qemu to tell us this.  The problem
     * is that qemu only does this check device-by-device; so if you had a
     * domain that booted from a large qcow2 device, but had a secondary raw
     * device attached, you wouldn't find out that you can't snapshot your
     * guest until *after* it had spent the time to snapshot the boot device.
     * This is probably a bug in qemu, but we'll work around it here for now.
     */
    if (!qemuDomainSnapshotIsAllowed(vm))
        goto cleanup;

    if (!(def = virDomainSnapshotDefParseString(xmlDesc, 1)))
        goto cleanup;

    if (!(snap = virDomainSnapshotAssignDef(&vm->snapshots, def)))
        goto cleanup;

    /* actually do the snapshot */
    if (!virDomainObjIsActive(vm)) {
        qemuimgarg[0] = qemuFindQemuImgBinary();
        if (qemuimgarg[0] == NULL)
            /* qemuFindQemuImgBinary set the error */
            goto cleanup;

        qemuimgarg[3] = snap->def->name;

        for (i = 0; i < vm->def->ndisks; i++) {
            /* FIXME: we also need to handle LVM here */
            /* FIXME: if we fail halfway through this loop, we are in an
             * inconsistent state.  I'm not quite sure what to do about that
             */
            if (vm->def->disks[i]->device == VIR_DOMAIN_DISK_DEVICE_DISK) {
                if (!vm->def->disks[i]->driverType ||
                    STRNEQ(vm->def->disks[i]->driverType, "qcow2")) {
                    qemuReportError(VIR_ERR_OPERATION_INVALID,
                                    _("Disk device '%s' does not support snapshotting"),
                                    vm->def->disks[i]->info.alias);
                    goto cleanup;
                }

                qemuimgarg[4] = vm->def->disks[i]->src;

                if (virRun(qemuimgarg, NULL) < 0) {
                    virReportSystemError(errno,
                                         _("Failed to run '%s' to create snapshot '%s' from disk '%s'"),
                                         qemuimgarg[0], snap->def->name,
                                         vm->def->disks[i]->src);
                    goto cleanup;
                }
            }
        }
    }
    else {
9614 9615 9616 9617 9618
        qemuDomainObjPrivatePtr priv;
        int ret;

        if (qemuDomainObjBeginJobWithDriver(driver, vm) < 0)
            goto cleanup;
C
Chris Lalancette 已提交
9619 9620
        priv = vm->privateData;
        qemuDomainObjEnterMonitorWithDriver(driver, vm);
9621
        ret = qemuMonitorCreateSnapshot(priv->mon, def->name);
C
Chris Lalancette 已提交
9622
        qemuDomainObjExitMonitorWithDriver(driver, vm);
9623
        if (qemuDomainObjEndJob(vm) == 0) {
9624
            vm = NULL;
9625 9626
            goto cleanup;
        }
9627 9628
        if (ret < 0)
            goto cleanup;
C
Chris Lalancette 已提交
9629 9630 9631 9632 9633 9634 9635 9636 9637 9638 9639 9640 9641 9642 9643 9644 9645 9646 9647 9648
    }

    snap->def->state = vm->state;

    /* FIXME: if we fail after this point, there's not a whole lot we can
     * do; we've successfully taken the snapshot, and we are now running
     * on it, so we have to go forward the best we can
     */

    if (vm->current_snapshot) {
        def->parent = strdup(vm->current_snapshot->def->name);
        if (def->parent == NULL) {
            virReportOOMError();
            goto cleanup;
        }
    }

    /* Now we set the new current_snapshot for the domain */
    vm->current_snapshot = snap;

9649 9650 9651
    if (qemuDomainSnapshotWriteMetadata(vm, vm->current_snapshot,
                                        driver->snapshotDir) < 0)
        /* qemuDomainSnapshotWriteMetadata set the error */
C
Chris Lalancette 已提交
9652 9653 9654 9655 9656 9657 9658 9659 9660 9661 9662 9663 9664 9665
        goto cleanup;

    snapshot = virGetDomainSnapshot(domain, snap->def->name);

cleanup:
    VIR_FREE(qemuimgarg[0]);
    if (vm)
        virDomainObjUnlock(vm);
    qemuDriverUnlock(driver);
    return snapshot;
}

static int qemuDomainSnapshotListNames(virDomainPtr domain, char **names,
                                       int nameslen,
9666
                                       unsigned int flags)
C
Chris Lalancette 已提交
9667 9668 9669 9670 9671
{
    struct qemud_driver *driver = domain->conn->privateData;
    virDomainObjPtr vm = NULL;
    int n = -1;

9672 9673
    virCheckFlags(0, -1);

C
Chris Lalancette 已提交
9674 9675 9676 9677 9678 9679 9680 9681 9682 9683 9684 9685 9686 9687 9688 9689 9690 9691 9692 9693
    qemuDriverLock(driver);
    vm = virDomainFindByUUID(&driver->domains, domain->uuid);
    if (!vm) {
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(domain->uuid, uuidstr);
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
        goto cleanup;
    }

    n = virDomainSnapshotObjListGetNames(&vm->snapshots, names, nameslen);

cleanup:
    if (vm)
        virDomainObjUnlock(vm);
    qemuDriverUnlock(driver);
    return n;
}

static int qemuDomainSnapshotNum(virDomainPtr domain,
9694
                                 unsigned int flags)
C
Chris Lalancette 已提交
9695 9696 9697 9698 9699
{
    struct qemud_driver *driver = domain->conn->privateData;
    virDomainObjPtr vm = NULL;
    int n = -1;

9700 9701
    virCheckFlags(0, -1);

C
Chris Lalancette 已提交
9702 9703 9704 9705 9706 9707 9708 9709 9710 9711 9712 9713 9714 9715 9716 9717 9718 9719 9720 9721 9722
    qemuDriverLock(driver);
    vm = virDomainFindByUUID(&driver->domains, domain->uuid);
    if (!vm) {
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(domain->uuid, uuidstr);
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
        goto cleanup;
    }

    n = virDomainSnapshotObjListNum(&vm->snapshots);

cleanup:
    if (vm)
        virDomainObjUnlock(vm);
    qemuDriverUnlock(driver);
    return n;
}

static virDomainSnapshotPtr qemuDomainSnapshotLookupByName(virDomainPtr domain,
                                                           const char *name,
9723
                                                           unsigned int flags)
C
Chris Lalancette 已提交
9724 9725 9726 9727 9728 9729
{
    struct qemud_driver *driver = domain->conn->privateData;
    virDomainObjPtr vm;
    virDomainSnapshotObjPtr snap = NULL;
    virDomainSnapshotPtr snapshot = NULL;

9730 9731
    virCheckFlags(0, NULL);

C
Chris Lalancette 已提交
9732 9733 9734 9735 9736 9737 9738 9739 9740 9741 9742 9743 9744 9745 9746 9747 9748 9749 9750 9751 9752 9753 9754 9755 9756 9757 9758
    qemuDriverLock(driver);
    vm = virDomainFindByUUID(&driver->domains, domain->uuid);
    if (!vm) {
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(domain->uuid, uuidstr);
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
        goto cleanup;
    }

    snap = virDomainSnapshotFindByName(&vm->snapshots, name);
    if (!snap) {
        qemuReportError(VIR_ERR_NO_DOMAIN_SNAPSHOT,
                        _("no snapshot with matching name '%s'"), name);
        goto cleanup;
    }

    snapshot = virGetDomainSnapshot(domain, snap->def->name);

cleanup:
    if (vm)
        virDomainObjUnlock(vm);
    qemuDriverUnlock(driver);
    return snapshot;
}

static int qemuDomainHasCurrentSnapshot(virDomainPtr domain,
9759
                                        unsigned int flags)
C
Chris Lalancette 已提交
9760 9761 9762 9763 9764
{
    struct qemud_driver *driver = domain->conn->privateData;
    virDomainObjPtr vm;
    int ret = -1;

9765 9766
    virCheckFlags(0, -1);

C
Chris Lalancette 已提交
9767 9768 9769 9770 9771 9772 9773 9774 9775 9776 9777 9778 9779 9780 9781 9782 9783 9784 9785 9786
    qemuDriverLock(driver);
    vm = virDomainFindByUUID(&driver->domains, domain->uuid);
    if (!vm) {
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(domain->uuid, uuidstr);
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
        goto cleanup;
    }

    ret = (vm->current_snapshot != NULL);

cleanup:
    if (vm)
        virDomainObjUnlock(vm);
    qemuDriverUnlock(driver);
    return ret;
}

static virDomainSnapshotPtr qemuDomainSnapshotCurrent(virDomainPtr domain,
9787
                                                      unsigned int flags)
C
Chris Lalancette 已提交
9788 9789 9790 9791 9792
{
    struct qemud_driver *driver = domain->conn->privateData;
    virDomainObjPtr vm;
    virDomainSnapshotPtr snapshot = NULL;

9793 9794
    virCheckFlags(0, NULL);

C
Chris Lalancette 已提交
9795 9796 9797 9798 9799 9800 9801 9802 9803 9804 9805 9806 9807 9808 9809 9810 9811 9812 9813 9814 9815 9816 9817 9818 9819 9820
    qemuDriverLock(driver);
    vm = virDomainFindByUUID(&driver->domains, domain->uuid);
    if (!vm) {
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(domain->uuid, uuidstr);
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
        goto cleanup;
    }

    if (!vm->current_snapshot) {
        qemuReportError(VIR_ERR_NO_DOMAIN_SNAPSHOT, "%s",
                        _("the domain does not have a current snapshot"));
        goto cleanup;
    }

    snapshot = virGetDomainSnapshot(domain, vm->current_snapshot->def->name);

cleanup:
    if (vm)
        virDomainObjUnlock(vm);
    qemuDriverUnlock(driver);
    return snapshot;
}

static char *qemuDomainSnapshotDumpXML(virDomainSnapshotPtr snapshot,
9821
                                       unsigned int flags)
C
Chris Lalancette 已提交
9822 9823 9824 9825 9826 9827 9828
{
    struct qemud_driver *driver = snapshot->domain->conn->privateData;
    virDomainObjPtr vm = NULL;
    char *xml = NULL;
    virDomainSnapshotObjPtr snap = NULL;
    char uuidstr[VIR_UUID_STRING_BUFLEN];

9829 9830
    virCheckFlags(0, NULL);

C
Chris Lalancette 已提交
9831 9832 9833 9834 9835 9836 9837 9838 9839 9840 9841 9842 9843 9844 9845 9846 9847 9848 9849 9850 9851 9852 9853 9854 9855 9856 9857
    qemuDriverLock(driver);
    virUUIDFormat(snapshot->domain->uuid, uuidstr);
    vm = virDomainFindByUUID(&driver->domains, snapshot->domain->uuid);
    if (!vm) {
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
        goto cleanup;
    }

    snap = virDomainSnapshotFindByName(&vm->snapshots, snapshot->name);
    if (!snap) {
        qemuReportError(VIR_ERR_NO_DOMAIN_SNAPSHOT,
                        _("no domain snapshot with matching name '%s'"),
                        snapshot->name);
        goto cleanup;
    }

    xml = virDomainSnapshotDefFormat(uuidstr, snap->def, 0);

cleanup:
    if (vm)
        virDomainObjUnlock(vm);
    qemuDriverUnlock(driver);
    return xml;
}

static int qemuDomainRevertToSnapshot(virDomainSnapshotPtr snapshot,
9858
                                      unsigned int flags)
C
Chris Lalancette 已提交
9859 9860 9861 9862 9863 9864 9865 9866 9867 9868
{
    struct qemud_driver *driver = snapshot->domain->conn->privateData;
    virDomainObjPtr vm = NULL;
    int ret = -1;
    virDomainSnapshotObjPtr snap = NULL;
    char uuidstr[VIR_UUID_STRING_BUFLEN];
    virDomainEventPtr event = NULL;
    qemuDomainObjPrivatePtr priv;
    int rc;

9869 9870
    virCheckFlags(0, -1);

C
Chris Lalancette 已提交
9871 9872 9873 9874 9875 9876 9877 9878 9879 9880 9881 9882 9883 9884 9885 9886 9887 9888 9889 9890 9891 9892 9893 9894 9895 9896 9897 9898 9899 9900 9901
    qemuDriverLock(driver);
    virUUIDFormat(snapshot->domain->uuid, uuidstr);
    vm = virDomainFindByUUID(&driver->domains, snapshot->domain->uuid);
    if (!vm) {
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
        goto cleanup;
    }

    snap = virDomainSnapshotFindByName(&vm->snapshots, snapshot->name);
    if (!snap) {
        qemuReportError(VIR_ERR_NO_DOMAIN_SNAPSHOT,
                        _("no domain snapshot with matching name '%s'"),
                        snapshot->name);
        goto cleanup;
    }

    vm->current_snapshot = snap;

    if (qemuDomainObjBeginJobWithDriver(driver, vm) < 0)
        goto cleanup;

    if (snap->def->state == VIR_DOMAIN_RUNNING
        || snap->def->state == VIR_DOMAIN_PAUSED) {

        if (virDomainObjIsActive(vm)) {
            priv = vm->privateData;
            qemuDomainObjEnterMonitorWithDriver(driver, vm);
            rc = qemuMonitorLoadSnapshot(priv->mon, snap->def->name);
            qemuDomainObjExitMonitorWithDriver(driver, vm);
            if (rc < 0)
9902
                goto endjob;
C
Chris Lalancette 已提交
9903 9904
        }
        else {
9905
            if (qemuDomainSnapshotSetCurrentActive(vm, driver->snapshotDir) < 0)
9906
                goto endjob;
C
Chris Lalancette 已提交
9907 9908

            rc = qemudStartVMDaemon(snapshot->domain->conn, driver, vm, NULL,
9909
                                    false, -1, NULL, VIR_VM_OP_CREATE);
9910
            qemuDomainStartAudit(vm, "from-snapshot", rc >= 0);
9911
            if (qemuDomainSnapshotSetCurrentInactive(vm, driver->snapshotDir) < 0)
9912
                goto endjob;
C
Chris Lalancette 已提交
9913
            if (rc < 0)
9914
                goto endjob;
C
Chris Lalancette 已提交
9915 9916 9917 9918 9919 9920
        }

        if (snap->def->state == VIR_DOMAIN_PAUSED) {
            /* qemu unconditionally starts the domain running again after
             * loadvm, so let's pause it to keep consistency
             */
H
Hu Tao 已提交
9921 9922
            rc = doStopCPUs(driver, vm);
            if (rc < 0)
9923
                goto endjob;
C
Chris Lalancette 已提交
9924 9925 9926 9927 9928 9929 9930 9931 9932 9933 9934 9935 9936 9937 9938 9939 9940 9941
        }

        event = virDomainEventNewFromObj(vm,
                                         VIR_DOMAIN_EVENT_STARTED,
                                         VIR_DOMAIN_EVENT_STARTED_FROM_SNAPSHOT);
    }
    else {
        /* qemu is a little funny with running guests and the restoration
         * of snapshots.  If the snapshot was taken online,
         * then after a "loadvm" monitor command, the VM is set running
         * again.  If the snapshot was taken offline, then after a "loadvm"
         * monitor command the VM is left paused.  Unpausing it leads to
         * the memory state *before* the loadvm with the disk *after* the
         * loadvm, which obviously is bound to corrupt something.
         * Therefore we destroy the domain and set it to "off" in this case.
         */

        if (virDomainObjIsActive(vm)) {
9942
            qemudShutdownVMDaemon(driver, vm, 0);
9943
            qemuDomainStopAudit(vm, "from-snapshot");
C
Chris Lalancette 已提交
9944 9945 9946
            event = virDomainEventNewFromObj(vm,
                                             VIR_DOMAIN_EVENT_STOPPED,
                                             VIR_DOMAIN_EVENT_STOPPED_FROM_SNAPSHOT);
9947 9948 9949 9950
            if (!vm->persistent) {
                if (qemuDomainObjEndJob(vm) > 0)
                    virDomainRemoveInactive(&driver->domains, vm);
                vm = NULL;
9951
                goto cleanup;
9952
            }
C
Chris Lalancette 已提交
9953 9954
        }

9955
        if (qemuDomainSnapshotSetCurrentActive(vm, driver->snapshotDir) < 0)
9956
            goto endjob;
C
Chris Lalancette 已提交
9957 9958 9959 9960 9961 9962
    }

    vm->state = snap->def->state;

    ret = 0;

9963
endjob:
C
Chris Lalancette 已提交
9964 9965 9966
    if (vm && qemuDomainObjEndJob(vm) == 0)
        vm = NULL;

9967
cleanup:
C
Chris Lalancette 已提交
9968 9969 9970 9971 9972 9973 9974 9975 9976 9977 9978 9979 9980 9981 9982 9983 9984 9985 9986 9987 9988 9989 9990 9991 9992 9993 9994 9995 9996 9997 9998 9999 10000 10001 10002 10003 10004 10005 10006 10007 10008 10009 10010 10011 10012 10013 10014 10015 10016 10017 10018 10019 10020 10021 10022 10023 10024 10025 10026 10027 10028 10029 10030 10031 10032 10033 10034 10035 10036 10037 10038 10039 10040 10041 10042 10043 10044 10045 10046 10047 10048 10049 10050 10051 10052 10053 10054 10055 10056 10057 10058 10059 10060 10061 10062 10063 10064 10065 10066 10067 10068 10069 10070 10071 10072 10073 10074 10075 10076 10077 10078 10079 10080 10081 10082 10083 10084 10085 10086 10087 10088 10089 10090 10091
    if (event)
        qemuDomainEventQueue(driver, event);
    if (vm)
        virDomainObjUnlock(vm);
    qemuDriverUnlock(driver);

    return ret;
}

static int qemuDomainSnapshotDiscard(struct qemud_driver *driver,
                                     virDomainObjPtr vm,
                                     virDomainSnapshotObjPtr snap)
{
    const char *qemuimgarg[] = { NULL, "snapshot", "-d", NULL, NULL, NULL };
    char *snapFile = NULL;
    int ret = -1;
    int i;
    qemuDomainObjPrivatePtr priv;
    virDomainSnapshotObjPtr parentsnap;

    if (!virDomainObjIsActive(vm)) {
        qemuimgarg[0] = qemuFindQemuImgBinary();
        if (qemuimgarg[0] == NULL)
            /* qemuFindQemuImgBinary set the error */
            goto cleanup;

        qemuimgarg[3] = snap->def->name;

        for (i = 0; i < vm->def->ndisks; i++) {
            /* FIXME: we also need to handle LVM here */
            if (vm->def->disks[i]->device == VIR_DOMAIN_DISK_DEVICE_DISK) {
                if (!vm->def->disks[i]->driverType ||
                    STRNEQ(vm->def->disks[i]->driverType, "qcow2")) {
                    /* we continue on even in the face of error, since other
                     * disks in this VM may have this snapshot in place
                     */
                    continue;
                }

                qemuimgarg[4] = vm->def->disks[i]->src;

                if (virRun(qemuimgarg, NULL) < 0) {
                    /* we continue on even in the face of error, since other
                     * disks in this VM may have this snapshot in place
                     */
                    continue;
                }
            }
        }
    }
    else {
        priv = vm->privateData;
        qemuDomainObjEnterMonitorWithDriver(driver, vm);
        /* we continue on even in the face of error */
        qemuMonitorDeleteSnapshot(priv->mon, snap->def->name);
        qemuDomainObjExitMonitorWithDriver(driver, vm);
    }

    if (snap == vm->current_snapshot) {
        if (snap->def->parent) {
            parentsnap = virDomainSnapshotFindByName(&vm->snapshots,
                                                     snap->def->parent);
            if (!parentsnap) {
                qemuReportError(VIR_ERR_NO_DOMAIN_SNAPSHOT,
                                _("no domain snapshot parent with matching name '%s'"),
                                snap->def->parent);
                goto cleanup;
            }

            /* Now we set the new current_snapshot for the domain */
            vm->current_snapshot = parentsnap;
        }
        else
            vm->current_snapshot = NULL;
    }

    if (virAsprintf(&snapFile, "%s/%s/%s.xml", driver->snapshotDir,
                    vm->def->name, snap->def->name) < 0) {
        virReportOOMError();
        goto cleanup;
    }
    unlink(snapFile);

    virDomainSnapshotObjListRemove(&vm->snapshots, snap);

    ret = 0;

cleanup:
    VIR_FREE(snapFile);
    VIR_FREE(qemuimgarg[0]);

    return ret;
}

struct snap_remove {
    struct qemud_driver *driver;
    virDomainObjPtr vm;
    char *parent;
    int err;
};

static void qemuDomainSnapshotDiscardChildren(void *payload,
                                              const char *name ATTRIBUTE_UNUSED,
                                              void *data)
{
    virDomainSnapshotObjPtr snap = payload;
    struct snap_remove *curr = data;
    struct snap_remove this;

    if (snap->def->parent && STREQ(snap->def->parent, curr->parent)) {
        this.driver = curr->driver;
        this.vm = curr->vm;
        this.parent = snap->def->name;
        this.err = 0;
        virHashForEach(curr->vm->snapshots.objs,
                       qemuDomainSnapshotDiscardChildren, &this);

        if (this.err)
            curr->err = this.err;
        else
            this.err = qemuDomainSnapshotDiscard(curr->driver, curr->vm, snap);
    }
}

10092 10093 10094 10095 10096 10097 10098 10099 10100 10101 10102 10103 10104 10105 10106 10107 10108 10109 10110 10111 10112 10113 10114 10115 10116 10117 10118 10119 10120 10121 10122 10123 10124 10125 10126 10127 10128
struct snap_reparent {
    struct qemud_driver *driver;
    virDomainSnapshotObjPtr snap;
    virDomainObjPtr vm;
    int err;
};

static void
qemuDomainSnapshotReparentChildren(void *payload,
                                   const char *name ATTRIBUTE_UNUSED,
                                   void *data)
{
    virDomainSnapshotObjPtr snap = payload;
    struct snap_reparent *rep = data;

    if (rep->err < 0) {
        return;
    }

    if (snap->def->parent && STREQ(snap->def->parent, rep->snap->def->name)) {
        VIR_FREE(snap->def->parent);

        if (rep->snap->def->parent != NULL) {
            snap->def->parent = strdup(rep->snap->def->parent);

            if (snap->def->parent == NULL) {
                virReportOOMError();
                rep->err = -1;
                return;
            }
        }

        rep->err = qemuDomainSnapshotWriteMetadata(rep->vm, snap,
                                                   rep->driver->snapshotDir);
    }
}

C
Chris Lalancette 已提交
10129 10130 10131 10132 10133 10134 10135 10136 10137
static int qemuDomainSnapshotDelete(virDomainSnapshotPtr snapshot,
                                    unsigned int flags)
{
    struct qemud_driver *driver = snapshot->domain->conn->privateData;
    virDomainObjPtr vm = NULL;
    int ret = -1;
    virDomainSnapshotObjPtr snap = NULL;
    char uuidstr[VIR_UUID_STRING_BUFLEN];
    struct snap_remove rem;
10138
    struct snap_reparent rep;
C
Chris Lalancette 已提交
10139

10140 10141
    virCheckFlags(VIR_DOMAIN_SNAPSHOT_DELETE_CHILDREN, -1);

C
Chris Lalancette 已提交
10142 10143 10144 10145 10146 10147 10148 10149 10150 10151 10152 10153 10154 10155 10156 10157 10158
    qemuDriverLock(driver);
    virUUIDFormat(snapshot->domain->uuid, uuidstr);
    vm = virDomainFindByUUID(&driver->domains, snapshot->domain->uuid);
    if (!vm) {
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
        goto cleanup;
    }

    snap = virDomainSnapshotFindByName(&vm->snapshots, snapshot->name);
    if (!snap) {
        qemuReportError(VIR_ERR_NO_DOMAIN_SNAPSHOT,
                        _("no domain snapshot with matching name '%s'"),
                        snapshot->name);
        goto cleanup;
    }

10159 10160 10161
    if (qemuDomainObjBeginJobWithDriver(driver, vm) < 0)
        goto cleanup;

C
Chris Lalancette 已提交
10162 10163 10164 10165 10166 10167 10168 10169
    if (flags & VIR_DOMAIN_SNAPSHOT_DELETE_CHILDREN) {
        rem.driver = driver;
        rem.vm = vm;
        rem.parent = snap->def->name;
        rem.err = 0;
        virHashForEach(vm->snapshots.objs, qemuDomainSnapshotDiscardChildren,
                       &rem);
        if (rem.err < 0)
10170
            goto endjob;
10171 10172 10173 10174 10175 10176 10177 10178 10179
    } else {
        rep.driver = driver;
        rep.snap = snap;
        rep.vm = vm;
        rep.err = 0;
        virHashForEach(vm->snapshots.objs, qemuDomainSnapshotReparentChildren,
                       &rep);
        if (rep.err < 0)
            goto endjob;
C
Chris Lalancette 已提交
10180 10181 10182 10183
    }

    ret = qemuDomainSnapshotDiscard(driver, vm, snap);

10184 10185 10186 10187
endjob:
    if (qemuDomainObjEndJob(vm) == 0)
        vm = NULL;

C
Chris Lalancette 已提交
10188 10189 10190 10191 10192 10193
cleanup:
    if (vm)
        virDomainObjUnlock(vm);
    qemuDriverUnlock(driver);
    return ret;
}
10194

10195 10196 10197 10198 10199 10200 10201 10202 10203 10204 10205 10206 10207 10208 10209 10210 10211 10212 10213 10214 10215 10216 10217 10218 10219 10220 10221 10222 10223 10224 10225 10226 10227 10228 10229 10230 10231 10232 10233 10234 10235 10236 10237 10238 10239 10240 10241 10242 10243 10244 10245
static int qemuDomainMonitorCommand(virDomainPtr domain, const char *cmd,
                                    char **result, unsigned int flags)
{
    struct qemud_driver *driver = domain->conn->privateData;
    virDomainObjPtr vm = NULL;
    int ret = -1;
    qemuDomainObjPrivatePtr priv;

    virCheckFlags(0, -1);

    qemuDriverLock(driver);
    vm = virDomainFindByUUID(&driver->domains, domain->uuid);
    if (!vm) {
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(domain->uuid, uuidstr);
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
        goto cleanup;
    }

    if (!virDomainObjIsActive(vm)) {
        qemuReportError(VIR_ERR_OPERATION_INVALID,
                        "%s", _("domain is not running"));
        goto cleanup;
   }

    priv = vm->privateData;

    if (!priv->monitor_warned) {
        VIR_INFO("Qemu monitor command '%s' executed; libvirt results may be unpredictable!",
                 cmd);
        priv->monitor_warned = 1;
    }

    if (qemuDomainObjBeginJobWithDriver(driver, vm) < 0)
        goto cleanup;
    qemuDomainObjEnterMonitorWithDriver(driver, vm);
    ret = qemuMonitorArbitraryCommand(priv->mon, cmd, result);
    qemuDomainObjExitMonitorWithDriver(driver, vm);
    if (qemuDomainObjEndJob(vm) == 0) {
        vm = NULL;
        goto cleanup;
    }

cleanup:
    if (vm)
        virDomainObjUnlock(vm);
    qemuDriverUnlock(driver);
    return ret;
}

10246 10247 10248 10249 10250 10251 10252 10253 10254 10255 10256 10257 10258 10259 10260 10261 10262 10263 10264 10265 10266 10267 10268 10269 10270 10271 10272 10273 10274 10275 10276 10277 10278 10279 10280 10281 10282 10283 10284 10285 10286 10287 10288 10289 10290 10291 10292 10293 10294 10295 10296 10297 10298 10299 10300 10301 10302

static int
qemuDomainOpenConsole(virDomainPtr dom,
                      const char *devname,
                      virStreamPtr st,
                      unsigned int flags)
{
    struct qemud_driver *driver = dom->conn->privateData;
    virDomainObjPtr vm = NULL;
    char uuidstr[VIR_UUID_STRING_BUFLEN];
    int ret = -1;
    int i;
    virDomainChrDefPtr chr = NULL;

    virCheckFlags(0, -1);

    qemuDriverLock(driver);
    virUUIDFormat(dom->uuid, uuidstr);
    vm = virDomainFindByUUID(&driver->domains, dom->uuid);
    if (!vm) {
        qemuReportError(VIR_ERR_NO_DOMAIN,
                        _("no domain with matching uuid '%s'"), uuidstr);
        goto cleanup;
    }

    if (!virDomainObjIsActive(vm)) {
        qemuReportError(VIR_ERR_OPERATION_INVALID,
                        "%s", _("domain is not running"));
        goto cleanup;
    }

    if (devname) {
        if (vm->def->console &&
            STREQ(devname, vm->def->console->info.alias))
            chr = vm->def->console;
        for (i = 0 ; !chr && i < vm->def->nserials ; i++) {
            if (STREQ(devname, vm->def->serials[i]->info.alias))
                chr = vm->def->serials[i];
        }
        for (i = 0 ; !chr && i < vm->def->nparallels ; i++) {
            if (STREQ(devname, vm->def->parallels[i]->info.alias))
                chr = vm->def->parallels[i];
        }
    } else {
        if (vm->def->console)
            chr = vm->def->console;
        else if (vm->def->nserials)
            chr = vm->def->serials[0];
    }

    if (!chr) {
        qemuReportError(VIR_ERR_INTERNAL_ERROR,
                        _("cannot find character device %s"),
                        NULLSTR(devname));
        goto cleanup;
    }

10303
    if (chr->source.type != VIR_DOMAIN_CHR_TYPE_PTY) {
10304 10305 10306 10307 10308 10309
        qemuReportError(VIR_ERR_INTERNAL_ERROR,
                        _("character device %s is not using a PTY"),
                        NULLSTR(devname));
        goto cleanup;
    }

10310
    if (virFDStreamOpenFile(st, chr->source.data.file.path, O_RDWR) < 0)
10311 10312 10313 10314 10315 10316 10317 10318 10319 10320 10321
        goto cleanup;

    ret = 0;
cleanup:
    if (vm)
        virDomainObjUnlock(vm);
    qemuDriverUnlock(driver);
    return ret;
}


10322 10323 10324 10325 10326
static virDriver qemuDriver = {
    VIR_DRV_QEMU,
    "QEMU",
    qemudOpen, /* open */
    qemudClose, /* close */
D
Daniel Veillard 已提交
10327
    qemudSupportsFeature, /* supports_feature */
10328 10329
    qemudGetType, /* type */
    qemudGetVersion, /* version */
10330
    NULL, /* libvirtVersion (impl. in libvirt.c) */
10331
    virGetHostname, /* getHostname */
10332
    qemudGetMaxVCPUs, /* getMaxVcpus */
10333
    nodeGetInfo, /* nodeGetInfo */
10334 10335 10336
    qemudGetCapabilities, /* getCapabilities */
    qemudListDomains, /* listDomains */
    qemudNumDomains, /* numOfDomains */
10337
    qemudDomainCreate, /* domainCreateXML */
10338 10339 10340 10341 10342
    qemudDomainLookupByID, /* domainLookupByID */
    qemudDomainLookupByUUID, /* domainLookupByUUID */
    qemudDomainLookupByName, /* domainLookupByName */
    qemudDomainSuspend, /* domainSuspend */
    qemudDomainResume, /* domainResume */
10343
    qemudDomainShutdown, /* domainShutdown */
10344 10345 10346
    NULL, /* domainReboot */
    qemudDomainDestroy, /* domainDestroy */
    qemudDomainGetOSType, /* domainGetOSType */
10347
    qemudDomainGetMaxMemory, /* domainGetMaxMemory */
10348
    NULL, /* domainSetMaxMemory */
10349
    qemudDomainSetMemory, /* domainSetMemory */
10350 10351 10352
    qemudDomainGetInfo, /* domainGetInfo */
    qemudDomainSave, /* domainSave */
    qemudDomainRestore, /* domainRestore */
P
Paolo Bonzini 已提交
10353
    qemudDomainCoreDump, /* domainCoreDump */
10354
    qemudDomainSetVcpus, /* domainSetVcpus */
10355 10356
    qemudDomainSetVcpusFlags, /* domainSetVcpusFlags */
    qemudDomainGetVcpusFlags, /* domainGetVcpusFlags */
10357 10358
    qemudDomainPinVcpu, /* domainPinVcpu */
    qemudDomainGetVcpus, /* domainGetVcpus */
10359
    qemudDomainGetMaxVcpus, /* domainGetMaxVcpus */
10360 10361
    qemudDomainGetSecurityLabel, /* domainGetSecurityLabel */
    qemudNodeGetSecurityModel, /* nodeGetSecurityModel */
10362
    qemudDomainDumpXML, /* domainDumpXML */
10363
    qemuDomainXMLFromNative, /* domainXmlFromNative */
10364
    qemuDomainXMLToNative, /* domainXMLToNative */
10365 10366
    qemudListDefinedDomains, /* listDefinedDomains */
    qemudNumDefinedDomains, /* numOfDefinedDomains */
10367
    qemudDomainStart, /* domainCreate */
10368
    qemudDomainStartWithFlags, /* domainCreateWithFlags */
10369 10370
    qemudDomainDefine, /* domainDefineXML */
    qemudDomainUndefine, /* domainUndefine */
10371
    qemudDomainAttachDevice, /* domainAttachDevice */
10372
    qemudDomainAttachDeviceFlags, /* domainAttachDeviceFlags */
10373
    qemudDomainDetachDevice, /* domainDetachDevice */
10374
    qemudDomainDetachDeviceFlags, /* domainDetachDeviceFlags */
10375
    qemuDomainUpdateDeviceFlags, /* domainUpdateDeviceFlags */
10376 10377
    qemudDomainGetAutostart, /* domainGetAutostart */
    qemudDomainSetAutostart, /* domainSetAutostart */
10378 10379 10380
    qemuGetSchedulerType, /* domainGetSchedulerType */
    qemuGetSchedulerParameters, /* domainGetSchedulerParameters */
    qemuSetSchedulerParameters, /* domainSetSchedulerParameters */
D
Daniel Veillard 已提交
10381 10382
    NULL, /* domainMigratePrepare (v1) */
    qemudDomainMigratePerform, /* domainMigratePerform */
10383
    NULL, /* domainMigrateFinish */
10384
    qemudDomainBlockStats, /* domainBlockStats */
10385
    qemudDomainInterfaceStats, /* domainInterfaceStats */
10386
    qemudDomainMemoryStats, /* domainMemoryStats */
10387
    qemudDomainBlockPeek, /* domainBlockPeek */
R
Richard W.M. Jones 已提交
10388
    qemudDomainMemoryPeek, /* domainMemoryPeek */
10389
    qemuDomainGetBlockInfo, /* domainGetBlockInfo */
10390 10391
    nodeGetCellsFreeMemory, /* nodeGetCellsFreeMemory */
    nodeGetFreeMemory,  /* getFreeMemory */
10392 10393
    qemuDomainEventRegister, /* domainEventRegister */
    qemuDomainEventDeregister, /* domainEventDeregister */
D
Daniel Veillard 已提交
10394 10395
    qemudDomainMigratePrepare2, /* domainMigratePrepare2 */
    qemudDomainMigrateFinish2, /* domainMigrateFinish2 */
10396 10397 10398
    qemudNodeDeviceDettach, /* nodeDeviceDettach */
    qemudNodeDeviceReAttach, /* nodeDeviceReAttach */
    qemudNodeDeviceReset, /* nodeDeviceReset */
C
Chris Lalancette 已提交
10399
    qemudDomainMigratePrepareTunnel, /* domainMigratePrepareTunnel */
10400 10401 10402 10403
    qemuIsEncrypted, /* isEncrypted */
    qemuIsSecure, /* isSecure */
    qemuDomainIsActive, /* domainIsActive */
    qemuDomainIsPersistent, /* domainIsPersistent */
10404
    qemuDomainIsUpdated, /* domainIsUpdated */
10405
    qemuCPUCompare, /* cpuCompare */
10406
    qemuCPUBaseline, /* cpuBaseline */
10407
    qemuDomainGetJobInfo, /* domainGetJobInfo */
10408
    qemuDomainAbortJob, /* domainAbortJob */
10409
    qemuDomainMigrateSetMaxDowntime, /* domainMigrateSetMaxDowntime */
10410 10411
    qemuDomainEventRegisterAny, /* domainEventRegisterAny */
    qemuDomainEventDeregisterAny, /* domainEventDeregisterAny */
10412 10413 10414
    qemuDomainManagedSave, /* domainManagedSave */
    qemuDomainHasManagedSaveImage, /* domainHasManagedSaveImage */
    qemuDomainManagedSaveRemove, /* domainManagedSaveRemove */
C
Chris Lalancette 已提交
10415 10416 10417 10418 10419 10420 10421 10422 10423
    qemuDomainSnapshotCreateXML, /* domainSnapshotCreateXML */
    qemuDomainSnapshotDumpXML, /* domainSnapshotDumpXML */
    qemuDomainSnapshotNum, /* domainSnapshotNum */
    qemuDomainSnapshotListNames, /* domainSnapshotListNames */
    qemuDomainSnapshotLookupByName, /* domainSnapshotLookupByName */
    qemuDomainHasCurrentSnapshot, /* domainHasCurrentSnapshot */
    qemuDomainSnapshotCurrent, /* domainSnapshotCurrent */
    qemuDomainRevertToSnapshot, /* domainRevertToSnapshot */
    qemuDomainSnapshotDelete, /* domainSnapshotDelete */
10424
    qemuDomainMonitorCommand, /* qemuDomainMonitorCommand */
10425
    qemuDomainSetMemoryParameters, /* domainSetMemoryParameters */
10426
    qemuDomainGetMemoryParameters, /* domainGetMemoryParameters */
10427
    qemuDomainOpenConsole, /* domainOpenConsole */
10428 10429 10430
};


10431
static virStateDriver qemuStateDriver = {
10432
    .name = "QEMU",
10433 10434 10435 10436
    .initialize = qemudStartup,
    .cleanup = qemudShutdown,
    .reload = qemudReload,
    .active = qemudActive,
10437
};
10438

S
Stefan Berger 已提交
10439
static int
10440
qemudVMFilterRebuild(virConnectPtr conn ATTRIBUTE_UNUSED,
S
Stefan Berger 已提交
10441 10442 10443
                     virHashIterator iter, void *data)
{
    virHashForEach(qemu_driver->domains.objs, iter, data);
10444

S
Stefan Berger 已提交
10445 10446 10447
    return 0;
}

10448 10449 10450 10451 10452 10453 10454 10455 10456 10457 10458 10459 10460 10461 10462 10463 10464 10465 10466 10467 10468 10469
static int
qemudVMFiltersInstantiate(virConnectPtr conn,
                          virDomainDefPtr def)
{
    int err = 0;
    int i;

    if (!conn)
        return 1;

    for (i = 0 ; i < def->nnets ; i++) {
        virDomainNetDefPtr net = def->nets[i];
        if ((net->filter) && (net->ifname)) {
           if (virDomainConfNWFilterInstantiate(conn, net)) {
                err = 1;
                break;
            }
        }
    }

    return err;
}
S
Stefan Berger 已提交
10470

10471 10472 10473 10474 10475 10476 10477 10478 10479 10480 10481 10482 10483

static void
qemudVMDriverLock(void) {
    qemuDriverLock(qemu_driver);
};


static void
qemudVMDriverUnlock(void) {
    qemuDriverUnlock(qemu_driver);
};


S
Stefan Berger 已提交
10484 10485 10486
static virNWFilterCallbackDriver qemuCallbackDriver = {
    .name = "QEMU",
    .vmFilterRebuild = qemudVMFilterRebuild,
10487 10488
    .vmDriverLock = qemudVMDriverLock,
    .vmDriverUnlock = qemudVMDriverUnlock,
S
Stefan Berger 已提交
10489 10490
};

10491
int qemuRegister(void) {
10492 10493
    virRegisterDriver(&qemuDriver);
    virRegisterStateDriver(&qemuStateDriver);
S
Stefan Berger 已提交
10494
    virNWFilterRegisterCallbackDriver(&qemuCallbackDriver);
10495 10496
    return 0;
}