qemu_domain.c 64.5 KB
Newer Older
1 2 3
/*
 * qemu_domain.h: QEMU domain private state
 *
4
 * Copyright (C) 2006-2013 Red Hat, Inc.
5 6 7 8 9 10 11 12 13 14 15 16 17
 * Copyright (C) 2006 Daniel P. Berrange
 *
 * This library is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * This library is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
18
 * License along with this library.  If not, see
O
Osier Yang 已提交
19
 * <http://www.gnu.org/licenses/>.
20 21 22 23 24 25 26 27
 *
 * Author: Daniel P. Berrange <berrange@redhat.com>
 */

#include <config.h>

#include "qemu_domain.h"
#include "qemu_command.h"
28
#include "qemu_capabilities.h"
29
#include "qemu_migration.h"
30
#include "viralloc.h"
31
#include "virlog.h"
32
#include "virerror.h"
33
#include "c-ctype.h"
34
#include "cpu/cpu.h"
35
#include "viruuid.h"
E
Eric Blake 已提交
36
#include "virfile.h"
37
#include "domain_event.h"
38
#include "virtime.h"
39
#include "virstoragefile.h"
40
#include "virstring.h"
41

42
#include <sys/time.h>
43
#include <fcntl.h>
44

45 46 47 48 49 50
#include <libxml/xpathInternals.h>

#define VIR_FROM_THIS VIR_FROM_QEMU

#define QEMU_NAMESPACE_HREF "http://libvirt.org/schemas/domain/qemu/1.0"

51 52 53 54 55 56
VIR_ENUM_IMPL(qemuDomainJob, QEMU_JOB_LAST,
              "none",
              "query",
              "destroy",
              "suspend",
              "modify",
57
              "abort",
58
              "migration operation",
59 60 61 62 63 64 65 66 67 68
              "none",   /* async job is never stored in job.active */
              "async nested",
);

VIR_ENUM_IMPL(qemuDomainAsyncJob, QEMU_ASYNC_JOB_LAST,
              "none",
              "migration out",
              "migration in",
              "save",
              "dump",
69
              "snapshot",
70 71
);

72

J
Jiri Denemark 已提交
73 74 75 76 77 78 79
const char *
qemuDomainAsyncJobPhaseToString(enum qemuDomainAsyncJob job,
                                int phase ATTRIBUTE_UNUSED)
{
    switch (job) {
    case QEMU_ASYNC_JOB_MIGRATION_OUT:
    case QEMU_ASYNC_JOB_MIGRATION_IN:
80 81
        return qemuMigrationJobPhaseTypeToString(phase);

J
Jiri Denemark 已提交
82 83
    case QEMU_ASYNC_JOB_SAVE:
    case QEMU_ASYNC_JOB_DUMP:
84
    case QEMU_ASYNC_JOB_SNAPSHOT:
J
Jiri Denemark 已提交
85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102
    case QEMU_ASYNC_JOB_NONE:
    case QEMU_ASYNC_JOB_LAST:
        ; /* fall through */
    }

    return "none";
}

int
qemuDomainAsyncJobPhaseFromString(enum qemuDomainAsyncJob job,
                                  const char *phase)
{
    if (!phase)
        return 0;

    switch (job) {
    case QEMU_ASYNC_JOB_MIGRATION_OUT:
    case QEMU_ASYNC_JOB_MIGRATION_IN:
103 104
        return qemuMigrationJobPhaseTypeFromString(phase);

J
Jiri Denemark 已提交
105 106
    case QEMU_ASYNC_JOB_SAVE:
    case QEMU_ASYNC_JOB_DUMP:
107
    case QEMU_ASYNC_JOB_SNAPSHOT:
J
Jiri Denemark 已提交
108 109 110 111 112 113 114 115 116 117 118
    case QEMU_ASYNC_JOB_NONE:
    case QEMU_ASYNC_JOB_LAST:
        ; /* fall through */
    }

    if (STREQ(phase, "none"))
        return 0;
    else
        return -1;
}

119

120
void qemuDomainEventQueue(virQEMUDriverPtr driver,
121 122
                          virDomainEventPtr event)
{
123
    virDomainEventStateQueue(driver->domainEventState, event);
124 125 126
}


127 128 129 130 131 132 133 134
static int
qemuDomainObjInitJob(qemuDomainObjPrivatePtr priv)
{
    memset(&priv->job, 0, sizeof(priv->job));

    if (virCondInit(&priv->job.cond) < 0)
        return -1;

135
    if (virCondInit(&priv->job.asyncCond) < 0) {
136
        virCondDestroy(&priv->job.cond);
137 138 139
        return -1;
    }

140 141 142 143 144 145 146 147 148
    return 0;
}

static void
qemuDomainObjResetJob(qemuDomainObjPrivatePtr priv)
{
    struct qemuDomainJobObj *job = &priv->job;

    job->active = QEMU_JOB_NONE;
149
    job->owner = 0;
150 151 152 153 154 155 156 157
}

static void
qemuDomainObjResetAsyncJob(qemuDomainObjPrivatePtr priv)
{
    struct qemuDomainJobObj *job = &priv->job;

    job->asyncJob = QEMU_ASYNC_JOB_NONE;
158
    job->asyncOwner = 0;
J
Jiri Denemark 已提交
159
    job->phase = 0;
160
    job->mask = DEFAULT_JOB_MASK;
161
    job->start = 0;
162
    job->dump_memory_only = false;
163
    job->asyncAbort = false;
164
    memset(&job->status, 0, sizeof(job->status));
165 166 167
    memset(&job->info, 0, sizeof(job->info));
}

168 169 170 171 172 173 174 175
void
qemuDomainObjRestoreJob(virDomainObjPtr obj,
                        struct qemuDomainJobObj *job)
{
    qemuDomainObjPrivatePtr priv = obj->privateData;

    memset(job, 0, sizeof(*job));
    job->active = priv->job.active;
176
    job->owner = priv->job.owner;
177
    job->asyncJob = priv->job.asyncJob;
178
    job->asyncOwner = priv->job.asyncOwner;
J
Jiri Denemark 已提交
179
    job->phase = priv->job.phase;
180 181 182 183 184

    qemuDomainObjResetJob(priv);
    qemuDomainObjResetAsyncJob(priv);
}

185 186 187 188 189
void
qemuDomainObjTransferJob(virDomainObjPtr obj)
{
    qemuDomainObjPrivatePtr priv = obj->privateData;

190
    VIR_DEBUG("Changing job owner from %llu to %llu",
191 192 193 194
              priv->job.owner, virThreadSelfID());
    priv->job.owner = virThreadSelfID();
}

195 196 197
static void
qemuDomainObjFreeJob(qemuDomainObjPrivatePtr priv)
{
198 199
    virCondDestroy(&priv->job.cond);
    virCondDestroy(&priv->job.asyncCond);
200 201
}

202 203 204 205 206 207
static bool
qemuDomainTrackJob(enum qemuDomainJob job)
{
    return (QEMU_DOMAIN_TRACK_JOBS & JOB_MASK(job)) != 0;
}

208

209 210
static void
*qemuDomainObjPrivateAlloc(void)
211 212 213 214 215 216
{
    qemuDomainObjPrivatePtr priv;

    if (VIR_ALLOC(priv) < 0)
        return NULL;

217
    if (qemuDomainObjInitJob(priv) < 0)
218
        goto error;
219

220
    if (!(priv->devs = virChrdevAlloc()))
221 222
        goto error;

223
    priv->migMaxBandwidth = QEMU_DOMAIN_MIG_BANDWIDTH_MAX;
224

225
    return priv;
226 227 228 229

error:
    VIR_FREE(priv);
    return NULL;
230 231
}

232 233
static void
qemuDomainObjPrivateFree(void *data)
234 235 236
{
    qemuDomainObjPrivatePtr priv = data;

237
    virObjectUnref(priv->qemuCaps);
238

239
    virCgroupFree(&priv->cgroup);
240
    qemuDomainPCIAddressSetFree(priv->pciaddrs);
241
    qemuDomainCCWAddressSetFree(priv->ccwaddrs);
242
    virDomainChrSourceDefFree(priv->monConfig);
243
    qemuDomainObjFreeJob(priv);
244
    VIR_FREE(priv->vcpupids);
245
    VIR_FREE(priv->lockState);
J
Jiri Denemark 已提交
246
    VIR_FREE(priv->origname);
247

248
    virChrdevFree(priv->devs);
249

250 251
    /* This should never be non-NULL if we get here, but just in case... */
    if (priv->mon) {
252
        VIR_ERROR(_("Unexpected QEMU monitor still active during domain deletion"));
253 254
        qemuMonitorClose(priv->mon);
    }
D
Daniel P. Berrange 已提交
255 256 257 258
    if (priv->agent) {
        VIR_ERROR(_("Unexpected QEMU agent still active during domain deletion"));
        qemuAgentClose(priv->agent);
    }
259
    VIR_FREE(priv->cleanupCallbacks);
260 261 262 263
    VIR_FREE(priv);
}


264 265
static int
qemuDomainObjPrivateXMLFormat(virBufferPtr buf, void *data)
266 267 268
{
    qemuDomainObjPrivatePtr priv = data;
    const char *monitorpath;
269
    enum qemuDomainJob job;
270 271 272

    /* priv->monitor_chr is set only for qemu */
    if (priv->monConfig) {
273
        switch (priv->monConfig->type) {
274
        case VIR_DOMAIN_CHR_TYPE_UNIX:
275
            monitorpath = priv->monConfig->data.nix.path;
276 277 278
            break;
        default:
        case VIR_DOMAIN_CHR_TYPE_PTY:
279
            monitorpath = priv->monConfig->data.file.path;
280 281 282 283 284 285
            break;
        }

        virBufferEscapeString(buf, "  <monitor path='%s'", monitorpath);
        if (priv->monJSON)
            virBufferAddLit(buf, " json='1'");
286
        virBufferAsprintf(buf, " type='%s'/>\n",
287
                          virDomainChrTypeToString(priv->monConfig->type));
288 289 290 291 292 293
    }


    if (priv->nvcpupids) {
        int i;
        virBufferAddLit(buf, "  <vcpus>\n");
294
        for (i = 0; i < priv->nvcpupids; i++) {
295
            virBufferAsprintf(buf, "    <vcpu pid='%d'/>\n", priv->vcpupids[i]);
296 297 298 299
        }
        virBufferAddLit(buf, "  </vcpus>\n");
    }

300
    if (priv->qemuCaps) {
301 302
        int i;
        virBufferAddLit(buf, "  <qemuCaps>\n");
303
        for (i = 0; i < QEMU_CAPS_LAST; i++) {
304
            if (virQEMUCapsGet(priv->qemuCaps, i)) {
305
                virBufferAsprintf(buf, "    <flag name='%s'/>\n",
306
                                  virQEMUCapsTypeToString(i));
307 308 309 310 311
            }
        }
        virBufferAddLit(buf, "  </qemuCaps>\n");
    }

312 313 314
    if (priv->lockState)
        virBufferAsprintf(buf, "  <lockstate>%s</lockstate>\n", priv->lockState);

315 316 317 318
    job = priv->job.active;
    if (!qemuDomainTrackJob(job))
        priv->job.active = QEMU_JOB_NONE;

319
    if (priv->job.active || priv->job.asyncJob) {
J
Jiri Denemark 已提交
320
        virBufferAsprintf(buf, "  <job type='%s' async='%s'",
321 322
                          qemuDomainJobTypeToString(priv->job.active),
                          qemuDomainAsyncJobTypeToString(priv->job.asyncJob));
J
Jiri Denemark 已提交
323 324 325 326 327 328
        if (priv->job.phase) {
            virBufferAsprintf(buf, " phase='%s'",
                              qemuDomainAsyncJobPhaseToString(
                                    priv->job.asyncJob, priv->job.phase));
        }
        virBufferAddLit(buf, "/>\n");
329
    }
330
    priv->job.active = job;
331

332
    if (priv->fakeReboot)
333
        virBufferAddLit(buf, "  <fakereboot/>\n");
334

335 336 337
    return 0;
}

338 339
static int
qemuDomainObjPrivateXMLParse(xmlXPathContextPtr ctxt, void *data)
340 341 342 343 344 345
{
    qemuDomainObjPrivatePtr priv = data;
    char *monitorpath;
    char *tmp;
    int n, i;
    xmlNodePtr *nodes = NULL;
346
    virQEMUCapsPtr qemuCaps = NULL;
347 348 349 350 351 352 353 354

    if (VIR_ALLOC(priv->monConfig) < 0) {
        virReportOOMError();
        goto error;
    }

    if (!(monitorpath =
          virXPathString("string(./monitor[1]/@path)", ctxt))) {
355 356
        virReportError(VIR_ERR_INTERNAL_ERROR,
                       "%s", _("no monitor path"));
357 358 359 360 361
        goto error;
    }

    tmp = virXPathString("string(./monitor[1]/@type)", ctxt);
    if (tmp)
362
        priv->monConfig->type = virDomainChrTypeFromString(tmp);
363
    else
364
        priv->monConfig->type = VIR_DOMAIN_CHR_TYPE_PTY;
365 366
    VIR_FREE(tmp);

E
Eric Blake 已提交
367 368
    priv->monJSON = virXPathBoolean("count(./monitor[@json = '1']) > 0",
                                    ctxt) > 0;
369

370
    switch (priv->monConfig->type) {
371
    case VIR_DOMAIN_CHR_TYPE_PTY:
372
        priv->monConfig->data.file.path = monitorpath;
373 374
        break;
    case VIR_DOMAIN_CHR_TYPE_UNIX:
375
        priv->monConfig->data.nix.path = monitorpath;
376 377 378
        break;
    default:
        VIR_FREE(monitorpath);
379 380 381
        virReportError(VIR_ERR_INTERNAL_ERROR,
                       _("unsupported monitor type '%s'"),
                       virDomainChrTypeToString(priv->monConfig->type));
382 383 384 385 386 387 388 389 390 391 392 393 394
        goto error;
    }

    n = virXPathNodeSet("./vcpus/vcpu", ctxt, &nodes);
    if (n < 0)
        goto error;
    if (n) {
        priv->nvcpupids = n;
        if (VIR_REALLOC_N(priv->vcpupids, priv->nvcpupids) < 0) {
            virReportOOMError();
            goto error;
        }

395
        for (i = 0; i < n; i++) {
396 397 398 399 400 401 402 403 404 405 406 407 408
            char *pidstr = virXMLPropString(nodes[i], "pid");
            if (!pidstr)
                goto error;

            if (virStrToLong_i(pidstr, NULL, 10, &(priv->vcpupids[i])) < 0) {
                VIR_FREE(pidstr);
                goto error;
            }
            VIR_FREE(pidstr);
        }
        VIR_FREE(nodes);
    }

409
    if ((n = virXPathNodeSet("./qemuCaps/flag", ctxt, &nodes)) < 0) {
410 411
        virReportError(VIR_ERR_INTERNAL_ERROR,
                       "%s", _("failed to parse qemu capabilities flags"));
412 413 414
        goto error;
    }
    if (n > 0) {
415
        if (!(qemuCaps = virQEMUCapsNew()))
416 417
            goto error;

418
        for (i = 0; i < n; i++) {
419 420
            char *str = virXMLPropString(nodes[i], "name");
            if (str) {
421
                int flag = virQEMUCapsTypeFromString(str);
422
                if (flag < 0) {
423 424
                    virReportError(VIR_ERR_INTERNAL_ERROR,
                                   _("Unknown qemu capabilities flag %s"), str);
425
                    VIR_FREE(str);
426 427
                    goto error;
                }
428
                VIR_FREE(str);
429
                virQEMUCapsSet(qemuCaps, flag);
430 431 432
            }
        }

433
        priv->qemuCaps = qemuCaps;
434 435 436
    }
    VIR_FREE(nodes);

437
    priv->lockState = virXPathString("string(./lockstate)", ctxt);
438

439 440 441 442
    if ((tmp = virXPathString("string(./job[1]/@type)", ctxt))) {
        int type;

        if ((type = qemuDomainJobTypeFromString(tmp)) < 0) {
443 444
            virReportError(VIR_ERR_INTERNAL_ERROR,
                           _("Unknown job type %s"), tmp);
445 446 447 448 449 450 451 452 453 454 455
            VIR_FREE(tmp);
            goto error;
        }
        VIR_FREE(tmp);
        priv->job.active = type;
    }

    if ((tmp = virXPathString("string(./job[1]/@async)", ctxt))) {
        int async;

        if ((async = qemuDomainAsyncJobTypeFromString(tmp)) < 0) {
456 457
            virReportError(VIR_ERR_INTERNAL_ERROR,
                           _("Unknown async job type %s"), tmp);
458 459 460 461 462
            VIR_FREE(tmp);
            goto error;
        }
        VIR_FREE(tmp);
        priv->job.asyncJob = async;
J
Jiri Denemark 已提交
463 464 465 466

        if ((tmp = virXPathString("string(./job[1]/@phase)", ctxt))) {
            priv->job.phase = qemuDomainAsyncJobPhaseFromString(async, tmp);
            if (priv->job.phase < 0) {
467 468
                virReportError(VIR_ERR_INTERNAL_ERROR,
                               _("Unknown job phase %s"), tmp);
J
Jiri Denemark 已提交
469 470 471 472 473
                VIR_FREE(tmp);
                goto error;
            }
            VIR_FREE(tmp);
        }
474 475
    }

476 477
    priv->fakeReboot = virXPathBoolean("boolean(./fakereboot)", ctxt) == 1;

478 479 480
    return 0;

error:
481
    virDomainChrSourceDefFree(priv->monConfig);
482 483
    priv->monConfig = NULL;
    VIR_FREE(nodes);
484
    virObjectUnref(qemuCaps);
485 486 487 488
    return -1;
}


489 490 491 492 493 494 495 496
virDomainXMLPrivateDataCallbacks virQEMUDriverPrivateDataCallbacks = {
    .alloc = qemuDomainObjPrivateAlloc,
    .free = qemuDomainObjPrivateFree,
    .parse = qemuDomainObjPrivateXMLParse,
    .format = qemuDomainObjPrivateXMLFormat,
};


497 498 499 500 501 502 503 504 505 506 507 508 509 510 511 512 513 514 515 516 517 518
static void
qemuDomainDefNamespaceFree(void *nsdata)
{
    qemuDomainCmdlineDefPtr cmd = nsdata;
    unsigned int i;

    if (!cmd)
        return;

    for (i = 0; i < cmd->num_args; i++)
        VIR_FREE(cmd->args[i]);
    for (i = 0; i < cmd->num_env; i++) {
        VIR_FREE(cmd->env_name[i]);
        VIR_FREE(cmd->env_value[i]);
    }
    VIR_FREE(cmd->args);
    VIR_FREE(cmd->env_name);
    VIR_FREE(cmd->env_value);
    VIR_FREE(cmd);
}

static int
P
Philipp Hahn 已提交
519 520
qemuDomainDefNamespaceParse(xmlDocPtr xml ATTRIBUTE_UNUSED,
                            xmlNodePtr root ATTRIBUTE_UNUSED,
521 522 523 524
                            xmlXPathContextPtr ctxt,
                            void **data)
{
    qemuDomainCmdlineDefPtr cmd = NULL;
P
Philipp Hahn 已提交
525
    bool uses_qemu_ns = false;
526 527 528
    xmlNodePtr *nodes = NULL;
    int n, i;

P
Philipp Hahn 已提交
529
    if (xmlXPathRegisterNs(ctxt, BAD_CAST "qemu", BAD_CAST QEMU_NAMESPACE_HREF) < 0) {
530 531 532
        virReportError(VIR_ERR_INTERNAL_ERROR,
                       _("Failed to register xml namespace '%s'"),
                       QEMU_NAMESPACE_HREF);
533 534 535 536 537 538 539 540 541 542 543 544
        return -1;
    }

    if (VIR_ALLOC(cmd) < 0) {
        virReportOOMError();
        return -1;
    }

    /* first handle the extra command-line arguments */
    n = virXPathNodeSet("./qemu:commandline/qemu:arg", ctxt, &nodes);
    if (n < 0)
        goto error;
P
Philipp Hahn 已提交
545
    uses_qemu_ns |= n > 0;
546 547 548 549 550 551 552

    if (n && VIR_ALLOC_N(cmd->args, n) < 0)
        goto no_memory;

    for (i = 0; i < n; i++) {
        cmd->args[cmd->num_args] = virXMLPropString(nodes[i], "value");
        if (cmd->args[cmd->num_args] == NULL) {
553 554
            virReportError(VIR_ERR_INTERNAL_ERROR,
                           "%s", _("No qemu command-line argument specified"));
555 556 557 558 559 560 561 562 563 564 565
            goto error;
        }
        cmd->num_args++;
    }

    VIR_FREE(nodes);

    /* now handle the extra environment variables */
    n = virXPathNodeSet("./qemu:commandline/qemu:env", ctxt, &nodes);
    if (n < 0)
        goto error;
P
Philipp Hahn 已提交
566
    uses_qemu_ns |= n > 0;
567 568 569 570 571 572 573 574 575 576 577 578

    if (n && VIR_ALLOC_N(cmd->env_name, n) < 0)
        goto no_memory;

    if (n && VIR_ALLOC_N(cmd->env_value, n) < 0)
        goto no_memory;

    for (i = 0; i < n; i++) {
        char *tmp;

        tmp = virXMLPropString(nodes[i], "name");
        if (tmp == NULL) {
579 580
            virReportError(VIR_ERR_INTERNAL_ERROR,
                           "%s", _("No qemu environment name specified"));
581 582 583
            goto error;
        }
        if (tmp[0] == '\0') {
584 585
            virReportError(VIR_ERR_INTERNAL_ERROR,
                           "%s", _("Empty qemu environment name specified"));
586 587 588
            goto error;
        }
        if (!c_isalpha(tmp[0]) && tmp[0] != '_') {
589 590
            virReportError(VIR_ERR_INTERNAL_ERROR,
                           "%s", _("Invalid environment name, it must begin with a letter or underscore"));
591 592 593
            goto error;
        }
        if (strspn(tmp, "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789_") != strlen(tmp)) {
594 595
            virReportError(VIR_ERR_INTERNAL_ERROR,
                           "%s", _("Invalid environment name, it must contain only alphanumerics and underscore"));
596 597 598 599 600 601 602 603 604 605 606 607
            goto error;
        }

        cmd->env_name[cmd->num_env] = tmp;

        cmd->env_value[cmd->num_env] = virXMLPropString(nodes[i], "value");
        /* a NULL value for command is allowed, since it might be empty */
        cmd->num_env++;
    }

    VIR_FREE(nodes);

P
Philipp Hahn 已提交
608 609 610 611
    if (uses_qemu_ns)
        *data = cmd;
    else
        VIR_FREE(cmd);
612 613 614 615 616 617 618 619 620 621 622 623 624 625 626 627 628 629 630 631 632 633 634 635 636 637 638

    return 0;

no_memory:
    virReportOOMError();

error:
    VIR_FREE(nodes);
    qemuDomainDefNamespaceFree(cmd);
    return -1;
}

static int
qemuDomainDefNamespaceFormatXML(virBufferPtr buf,
                                void *nsdata)
{
    qemuDomainCmdlineDefPtr cmd = nsdata;
    unsigned int i;

    if (!cmd->num_args && !cmd->num_env)
        return 0;

    virBufferAddLit(buf, "  <qemu:commandline>\n");
    for (i = 0; i < cmd->num_args; i++)
        virBufferEscapeString(buf, "    <qemu:arg value='%s'/>\n",
                              cmd->args[i]);
    for (i = 0; i < cmd->num_env; i++) {
639
        virBufferAsprintf(buf, "    <qemu:env name='%s'", cmd->env_name[i]);
640 641 642 643 644 645 646 647 648 649 650 651 652 653 654 655
        if (cmd->env_value[i])
            virBufferEscapeString(buf, " value='%s'", cmd->env_value[i]);
        virBufferAddLit(buf, "/>\n");
    }
    virBufferAddLit(buf, "  </qemu:commandline>\n");

    return 0;
}

static const char *
qemuDomainDefNamespaceHref(void)
{
    return "xmlns:qemu='" QEMU_NAMESPACE_HREF "'";
}


656 657 658 659 660 661
virDomainXMLNamespace virQEMUDriverDomainXMLNamespace = {
    .parse = qemuDomainDefNamespaceParse,
    .free = qemuDomainDefNamespaceFree,
    .format = qemuDomainDefNamespaceFormatXML,
    .href = qemuDomainDefNamespaceHref,
};
662

663

664 665 666 667 668
static int
qemuDomainDefPostParse(virDomainDefPtr def,
                       virCapsPtr caps,
                       void *opaque ATTRIBUTE_UNUSED)
{
669 670
    bool addPCIRoot = false;

671 672 673 674 675
    /* check for emulator and create a default one if needed */
    if (!def->emulator &&
        !(def->emulator = virDomainDefGetDefaultEmulator(def, caps)))
        return -1;

676 677 678 679 680 681 682 683 684 685 686 687
    /* Add implicit PCI root controller if the machine has one */
    switch (def->os.arch) {
    case VIR_ARCH_I686:
    case VIR_ARCH_X86_64:
        if (!def->os.machine)
            break;
        if (STRPREFIX(def->os.machine, "pc-q35") ||
            STREQ(def->os.machine, "q35") ||
            STREQ(def->os.machine, "isapc"))
            break;
        if (!STRPREFIX(def->os.machine, "pc-0.") &&
            !STRPREFIX(def->os.machine, "pc-1.") &&
688
            !STRPREFIX(def->os.machine, "pc-i440") &&
689 690 691 692 693 694 695 696 697 698 699 700 701 702 703 704 705 706 707 708 709 710 711 712
            !STREQ(def->os.machine, "pc") &&
            !STRPREFIX(def->os.machine, "rhel"))
            break;
        addPCIRoot = true;
        break;

    case VIR_ARCH_ALPHA:
    case VIR_ARCH_PPC:
    case VIR_ARCH_PPC64:
    case VIR_ARCH_PPCEMB:
    case VIR_ARCH_SH4:
    case VIR_ARCH_SH4EB:
        addPCIRoot = true;
        break;
    default:
        break;
    }

    if (addPCIRoot &&
        virDomainDefMaybeAddController(
            def, VIR_DOMAIN_CONTROLLER_TYPE_PCI, 0,
            VIR_DOMAIN_CONTROLLER_MODEL_PCI_ROOT) < 0)
        return -1;

713 714 715 716
    return 0;
}


717 718
static int
qemuDomainDeviceDefPostParse(virDomainDeviceDefPtr dev,
719
                             virDomainDefPtr def,
720
                             virCapsPtr caps ATTRIBUTE_UNUSED,
721
                             void *opaque)
722
{
723 724 725 726
    int ret = -1;
    virQEMUDriverPtr driver = opaque;
    virQEMUDriverConfigPtr cfg = NULL;

727
    if (dev->type == VIR_DOMAIN_DEVICE_NET &&
728 729
        dev->data.net->type != VIR_DOMAIN_NET_TYPE_HOSTDEV &&
        !dev->data.net->model) {
730 731 732 733
        if (VIR_STRDUP(dev->data.net->model,
                       def->os.arch == VIR_ARCH_S390 ||
                       def->os.arch == VIR_ARCH_S390X ? "virtio" : "rtl8139") < 0)
            goto cleanup;
734
    }
735

736 737 738 739 740 741 742 743 744 745 746 747 748 749 750 751 752 753 754 755 756
    /* set default disk types and drivers */
    if (dev->type == VIR_DOMAIN_DEVICE_DISK) {
        virDomainDiskDefPtr disk = dev->data.disk;

        /* both of these require data from the driver config */
        if (driver && (cfg = virQEMUDriverGetConfig(driver))) {
            /* assign default storage format and driver according to config */
            if (cfg->allowDiskFormatProbing) {
                /* default disk format for drives */
                if (disk->format == VIR_STORAGE_FILE_NONE &&
                    (disk->type == VIR_DOMAIN_DISK_TYPE_FILE ||
                     disk->type == VIR_DOMAIN_DISK_TYPE_BLOCK))
                    disk->format = VIR_STORAGE_FILE_AUTO;

                 /* default disk format for mirrored drive */
                if (disk->mirror &&
                    disk->mirrorFormat == VIR_STORAGE_FILE_NONE)
                    disk->mirrorFormat = VIR_STORAGE_FILE_AUTO;
            } else {
                /* default driver if probing is forbidden */
                if (!disk->driverName &&
757 758
                    VIR_STRDUP(disk->driverName, "qemu") < 0)
                        goto cleanup;
759 760 761 762 763 764 765 766 767 768 769 770

                /* default disk format for drives */
                if (disk->format == VIR_STORAGE_FILE_NONE &&
                    (disk->type == VIR_DOMAIN_DISK_TYPE_FILE ||
                     disk->type == VIR_DOMAIN_DISK_TYPE_BLOCK))
                    disk->format = VIR_STORAGE_FILE_RAW;

                 /* default disk format for mirrored drive */
                if (disk->mirror &&
                    disk->mirrorFormat == VIR_STORAGE_FILE_NONE)
                    disk->mirrorFormat = VIR_STORAGE_FILE_RAW;
            }
771 772 773
        }
    }

774 775 776 777 778 779 780
    /* set the default console type for S390 arches */
    if (dev->type == VIR_DOMAIN_DEVICE_CHR &&
        dev->data.chr->deviceType == VIR_DOMAIN_CHR_DEVICE_TYPE_CONSOLE &&
        dev->data.chr->targetType == VIR_DOMAIN_CHR_CONSOLE_TARGET_TYPE_NONE &&
        (def->os.arch == VIR_ARCH_S390 || def->os.arch == VIR_ARCH_S390X))
        dev->data.chr->targetType = VIR_DOMAIN_CHR_CONSOLE_TARGET_TYPE_VIRTIO;

781 782 783 784 785 786 787 788
    /* set the default USB model to none for s390 unless an address is found */
    if (dev->type == VIR_DOMAIN_DEVICE_CONTROLLER &&
        dev->data.controller->type == VIR_DOMAIN_CONTROLLER_TYPE_USB &&
        dev->data.controller->model == -1 &&
        dev->data.controller->info.type == VIR_DOMAIN_DEVICE_ADDRESS_TYPE_NONE &&
        (def->os.arch == VIR_ARCH_S390 || def->os.arch == VIR_ARCH_S390X))
        dev->data.controller->model = VIR_DOMAIN_CONTROLLER_MODEL_USB_NONE;

789 790 791 792 793 794 795 796 797 798 799
    /* auto generate unix socket path */
    if (dev->type == VIR_DOMAIN_DEVICE_CHR &&
        dev->data.chr->deviceType == VIR_DOMAIN_CHR_DEVICE_TYPE_CHANNEL &&
        dev->data.chr->targetType == VIR_DOMAIN_CHR_CHANNEL_TARGET_TYPE_VIRTIO &&
        dev->data.chr->source.type == VIR_DOMAIN_CHR_TYPE_UNIX &&
        !dev->data.chr->source.data.nix.path &&
        (driver && (cfg = virQEMUDriverGetConfig(driver)))) {

        if (virAsprintf(&dev->data.chr->source.data.nix.path,
                        "%s/channel/target/%s.%s",
                        cfg->libDir, def->name,
800 801 802 803
                        dev->data.chr->target.name) < 0) {
            virReportOOMError();
            goto cleanup;
        }
804 805 806
        dev->data.chr->source.data.nix.listen = true;
    }

807 808 809 810 811
    ret = 0;

cleanup:
    virObjectUnref(cfg);
    return ret;
812 813 814 815 816
}


virDomainDefParserConfig virQEMUDriverDomainDefParserConfig = {
    .devicesPostParseCallback = qemuDomainDeviceDefPostParse,
817
    .domainPostParseCallback = qemuDomainDefPostParse,
818 819 820
};


821
static void
822
qemuDomainObjSaveJob(virQEMUDriverPtr driver, virDomainObjPtr obj)
823
{
824 825 826
    virQEMUDriverConfigPtr cfg = virQEMUDriverGetConfig(driver);

    if (virDomainObjIsActive(obj)) {
827
        if (virDomainSaveStatus(driver->xmlopt, cfg->stateDir, obj) < 0)
828
            VIR_WARN("Failed to save status on vm %s", obj->def->name);
829
    }
830

831
    virObjectUnref(cfg);
832 833
}

J
Jiri Denemark 已提交
834
void
835
qemuDomainObjSetJobPhase(virQEMUDriverPtr driver,
J
Jiri Denemark 已提交
836 837 838 839
                         virDomainObjPtr obj,
                         int phase)
{
    qemuDomainObjPrivatePtr priv = obj->privateData;
840
    unsigned long long me = virThreadSelfID();
J
Jiri Denemark 已提交
841 842 843 844

    if (!priv->job.asyncJob)
        return;

845 846 847 848 849
    VIR_DEBUG("Setting '%s' phase to '%s'",
              qemuDomainAsyncJobTypeToString(priv->job.asyncJob),
              qemuDomainAsyncJobPhaseToString(priv->job.asyncJob, phase));

    if (priv->job.asyncOwner && me != priv->job.asyncOwner) {
850
        VIR_WARN("'%s' async job is owned by thread %llu",
851 852 853 854
                 qemuDomainAsyncJobTypeToString(priv->job.asyncJob),
                 priv->job.asyncOwner);
    }

J
Jiri Denemark 已提交
855
    priv->job.phase = phase;
856
    priv->job.asyncOwner = me;
J
Jiri Denemark 已提交
857 858 859
    qemuDomainObjSaveJob(driver, obj);
}

860
void
861 862
qemuDomainObjSetAsyncJobMask(virDomainObjPtr obj,
                             unsigned long long allowedJobs)
863 864 865
{
    qemuDomainObjPrivatePtr priv = obj->privateData;

866 867 868 869 870 871 872
    if (!priv->job.asyncJob)
        return;

    priv->job.mask = allowedJobs | JOB_MASK(QEMU_JOB_DESTROY);
}

void
873
qemuDomainObjDiscardAsyncJob(virQEMUDriverPtr driver, virDomainObjPtr obj)
874 875 876 877 878 879
{
    qemuDomainObjPrivatePtr priv = obj->privateData;

    if (priv->job.active == QEMU_JOB_ASYNC_NESTED)
        qemuDomainObjResetJob(priv);
    qemuDomainObjResetAsyncJob(priv);
880
    qemuDomainObjSaveJob(driver, obj);
881 882
}

883 884 885 886 887 888 889 890 891
void
qemuDomainObjReleaseAsyncJob(virDomainObjPtr obj)
{
    qemuDomainObjPrivatePtr priv = obj->privateData;

    VIR_DEBUG("Releasing ownership of '%s' async job",
              qemuDomainAsyncJobTypeToString(priv->job.asyncJob));

    if (priv->job.asyncOwner != virThreadSelfID()) {
892
        VIR_WARN("'%s' async job is owned by thread %llu",
893 894 895 896 897 898
                 qemuDomainAsyncJobTypeToString(priv->job.asyncJob),
                 priv->job.asyncOwner);
    }
    priv->job.asyncOwner = 0;
}

899
static bool
900
qemuDomainNestedJobAllowed(qemuDomainObjPrivatePtr priv, enum qemuDomainJob job)
901 902
{
    return !priv->job.asyncJob || (priv->job.mask & JOB_MASK(job)) != 0;
903 904
}

905 906 907 908 909 910
bool
qemuDomainJobAllowed(qemuDomainObjPrivatePtr priv, enum qemuDomainJob job)
{
    return !priv->job.active && qemuDomainNestedJobAllowed(priv, job);
}

911 912 913
/* Give up waiting for mutex after 30 seconds */
#define QEMU_JOB_WAIT_TIME (1000ull * 30)

914
/*
915
 * obj must be locked before calling
916
 */
917
static int ATTRIBUTE_NONNULL(1)
918
qemuDomainObjBeginJobInternal(virQEMUDriverPtr driver,
919 920 921
                              virDomainObjPtr obj,
                              enum qemuDomainJob job,
                              enum qemuDomainAsyncJob asyncJob)
922 923
{
    qemuDomainObjPrivatePtr priv = obj->privateData;
J
Jiri Denemark 已提交
924
    unsigned long long now;
925
    unsigned long long then;
926
    bool nested = job == QEMU_JOB_ASYNC_NESTED;
927
    virQEMUDriverConfigPtr cfg = virQEMUDriverGetConfig(driver);
928

929 930
    priv->jobs_queued++;

931 932
    if (virTimeMillisNow(&now) < 0) {
        virObjectUnref(cfg);
933
        return -1;
934 935
    }

J
Jiri Denemark 已提交
936
    then = now + QEMU_JOB_WAIT_TIME;
937

938
    virObjectRef(obj);
939

940
retry:
941 942
    if (cfg->maxQueuedJobs &&
        priv->jobs_queued > cfg->maxQueuedJobs) {
943 944 945
        goto error;
    }

946
    while (!nested && !qemuDomainNestedJobAllowed(priv, job)) {
947
        if (virCondWaitUntil(&priv->job.asyncCond, &obj->parent.lock, then) < 0)
948 949 950
            goto error;
    }

951
    while (priv->job.active) {
952
        if (virCondWaitUntil(&priv->job.cond, &obj->parent.lock, then) < 0)
953
            goto error;
954
    }
955 956 957

    /* No job is active but a new async job could have been started while obj
     * was unlocked, so we need to recheck it. */
958
    if (!nested && !qemuDomainNestedJobAllowed(priv, job))
959 960
        goto retry;

961
    qemuDomainObjResetJob(priv);
962 963

    if (job != QEMU_JOB_ASYNC) {
964 965 966
        VIR_DEBUG("Starting job: %s (async=%s)",
                   qemuDomainJobTypeToString(job),
                   qemuDomainAsyncJobTypeToString(priv->job.asyncJob));
967
        priv->job.active = job;
968
        priv->job.owner = virThreadSelfID();
969
    } else {
970 971
        VIR_DEBUG("Starting async job: %s",
                  qemuDomainAsyncJobTypeToString(asyncJob));
972 973
        qemuDomainObjResetAsyncJob(priv);
        priv->job.asyncJob = asyncJob;
974
        priv->job.asyncOwner = virThreadSelfID();
975 976
        priv->job.start = now;
    }
977

978 979
    if (qemuDomainTrackJob(job))
        qemuDomainObjSaveJob(driver, obj);
980

981
    virObjectUnref(cfg);
982
    return 0;
983 984

error:
985
    VIR_WARN("Cannot start job (%s, %s) for domain %s;"
986
             " current job is (%s, %s) owned by (%llu, %llu)",
987 988 989 990 991 992 993
             qemuDomainJobTypeToString(job),
             qemuDomainAsyncJobTypeToString(asyncJob),
             obj->def->name,
             qemuDomainJobTypeToString(priv->job.active),
             qemuDomainAsyncJobTypeToString(priv->job.asyncJob),
             priv->job.owner, priv->job.asyncOwner);

994
    if (errno == ETIMEDOUT)
995 996
        virReportError(VIR_ERR_OPERATION_TIMEOUT,
                       "%s", _("cannot acquire state change lock"));
997 998
    else if (cfg->maxQueuedJobs &&
             priv->jobs_queued > cfg->maxQueuedJobs)
999 1000 1001
        virReportError(VIR_ERR_OPERATION_FAILED,
                       "%s", _("cannot acquire state change lock "
                               "due to max_queued limit"));
1002 1003 1004
    else
        virReportSystemError(errno,
                             "%s", _("cannot acquire job mutex"));
1005
    priv->jobs_queued--;
1006
    virObjectUnref(obj);
1007
    virObjectUnref(cfg);
1008
    return -1;
1009 1010 1011
}

/*
1012
 * obj must be locked before calling
1013 1014 1015 1016 1017 1018 1019
 *
 * This must be called by anything that will change the VM state
 * in any way, or anything that will use the QEMU monitor.
 *
 * Upon successful return, the object will have its ref count increased,
 * successful calls must be followed by EndJob eventually
 */
1020
int qemuDomainObjBeginJob(virQEMUDriverPtr driver,
1021 1022
                          virDomainObjPtr obj,
                          enum qemuDomainJob job)
1023
{
1024
    return qemuDomainObjBeginJobInternal(driver, obj, job,
1025 1026 1027
                                         QEMU_ASYNC_JOB_NONE);
}

1028
int qemuDomainObjBeginAsyncJob(virQEMUDriverPtr driver,
1029
                               virDomainObjPtr obj,
1030
                               enum qemuDomainAsyncJob asyncJob)
1031
{
1032
    return qemuDomainObjBeginJobInternal(driver, obj, QEMU_JOB_ASYNC,
1033
                                         asyncJob);
1034 1035
}

1036 1037 1038 1039 1040 1041 1042 1043 1044 1045 1046 1047 1048 1049
int
qemuDomainObjBeginNestedJob(virQEMUDriverPtr driver,
                            virDomainObjPtr obj,
                            enum qemuDomainAsyncJob asyncJob)
{
    qemuDomainObjPrivatePtr priv = obj->privateData;

    if (asyncJob != priv->job.asyncJob) {
        virReportError(VIR_ERR_INTERNAL_ERROR,
                       _("unexpected async job %d"), asyncJob);
        return -1;
    }

    if (priv->job.asyncOwner != virThreadSelfID()) {
1050
        VIR_WARN("This thread doesn't seem to be the async job owner: %llu",
1051 1052 1053 1054 1055 1056 1057 1058
                 priv->job.asyncOwner);
    }

    return qemuDomainObjBeginJobInternal(driver, obj,
                                         QEMU_JOB_ASYNC_NESTED,
                                         QEMU_ASYNC_JOB_NONE);
}

1059

1060
/*
1061
 * obj must be locked before calling
1062 1063 1064 1065
 *
 * To be called after completing the work associated with the
 * earlier qemuDomainBeginJob() call
 *
1066 1067
 * Returns true if @obj was still referenced, false if it was
 * disposed of.
1068
 */
1069
bool qemuDomainObjEndJob(virQEMUDriverPtr driver, virDomainObjPtr obj)
1070 1071
{
    qemuDomainObjPrivatePtr priv = obj->privateData;
1072
    enum qemuDomainJob job = priv->job.active;
1073

1074 1075
    priv->jobs_queued--;

1076
    VIR_DEBUG("Stopping job: %s (async=%s)",
1077
              qemuDomainJobTypeToString(job),
1078 1079
              qemuDomainAsyncJobTypeToString(priv->job.asyncJob));

1080
    qemuDomainObjResetJob(priv);
1081 1082
    if (qemuDomainTrackJob(job))
        qemuDomainObjSaveJob(driver, obj);
1083
    virCondSignal(&priv->job.cond);
1084

1085
    return virObjectUnref(obj);
1086 1087
}

1088
bool
1089
qemuDomainObjEndAsyncJob(virQEMUDriverPtr driver, virDomainObjPtr obj)
1090 1091
{
    qemuDomainObjPrivatePtr priv = obj->privateData;
1092

1093 1094
    priv->jobs_queued--;

1095 1096 1097
    VIR_DEBUG("Stopping async job: %s",
              qemuDomainAsyncJobTypeToString(priv->job.asyncJob));

1098
    qemuDomainObjResetAsyncJob(priv);
1099
    qemuDomainObjSaveJob(driver, obj);
1100 1101
    virCondBroadcast(&priv->job.asyncCond);

1102
    return virObjectUnref(obj);
1103 1104
}

1105 1106 1107 1108 1109 1110 1111 1112 1113 1114 1115
void
qemuDomainObjAbortAsyncJob(virDomainObjPtr obj)
{
    qemuDomainObjPrivatePtr priv = obj->privateData;

    VIR_DEBUG("Requesting abort of async job: %s",
              qemuDomainAsyncJobTypeToString(priv->job.asyncJob));

    priv->job.asyncAbort = true;
}

1116 1117 1118 1119 1120 1121 1122 1123 1124
/*
 * obj must be locked before calling
 *
 * To be called immediately before any QEMU monitor API call
 * Must have already either called qemuDomainObjBeginJob() and checked
 * that the VM is still active; may not be used for nested async jobs.
 *
 * To be followed with qemuDomainObjExitMonitor() once complete
 */
1125
static int
1126
qemuDomainObjEnterMonitorInternal(virQEMUDriverPtr driver,
1127 1128
                                  virDomainObjPtr obj,
                                  enum qemuDomainAsyncJob asyncJob)
1129 1130 1131
{
    qemuDomainObjPrivatePtr priv = obj->privateData;

1132
    if (asyncJob != QEMU_ASYNC_JOB_NONE) {
1133
        if (qemuDomainObjBeginNestedJob(driver, obj, asyncJob) < 0)
1134 1135
            return -1;
        if (!virDomainObjIsActive(obj)) {
1136 1137
            virReportError(VIR_ERR_OPERATION_FAILED, "%s",
                           _("domain is no longer running"));
1138 1139
            /* Still referenced by the containing async job.  */
            ignore_value(qemuDomainObjEndJob(driver, obj));
1140 1141
            return -1;
        }
1142 1143 1144
    } else if (priv->job.asyncOwner == virThreadSelfID()) {
        VIR_WARN("This thread seems to be the async job owner; entering"
                 " monitor without asking for a nested job is dangerous");
1145 1146
    }

1147
    virObjectLock(priv->mon);
1148
    virObjectRef(priv->mon);
1149
    ignore_value(virTimeMillisNow(&priv->monStart));
1150
    virObjectUnlock(obj);
1151 1152

    return 0;
1153 1154
}

1155
static void ATTRIBUTE_NONNULL(1)
1156
qemuDomainObjExitMonitorInternal(virQEMUDriverPtr driver,
1157
                                 virDomainObjPtr obj)
1158 1159
{
    qemuDomainObjPrivatePtr priv = obj->privateData;
1160
    bool hasRefs;
1161

1162
    hasRefs = virObjectUnref(priv->mon);
1163

1164
    if (hasRefs)
1165
        virObjectUnlock(priv->mon);
1166

1167
    virObjectLock(obj);
1168

1169
    priv->monStart = 0;
1170
    if (!hasRefs)
1171
        priv->mon = NULL;
1172

1173 1174 1175 1176 1177
    if (priv->job.active == QEMU_JOB_ASYNC_NESTED) {
        qemuDomainObjResetJob(priv);
        qemuDomainObjSaveJob(driver, obj);
        virCondSignal(&priv->job.cond);

1178
        virObjectUnref(obj);
1179
    }
1180 1181
}

1182
void qemuDomainObjEnterMonitor(virQEMUDriverPtr driver,
1183
                               virDomainObjPtr obj)
1184
{
1185
    ignore_value(qemuDomainObjEnterMonitorInternal(driver, obj,
1186
                                                   QEMU_ASYNC_JOB_NONE));
1187 1188
}

1189
/* obj must NOT be locked before calling
1190 1191 1192
 *
 * Should be paired with an earlier qemuDomainObjEnterMonitor() call
 */
1193
void qemuDomainObjExitMonitor(virQEMUDriverPtr driver,
1194
                              virDomainObjPtr obj)
1195
{
1196
    qemuDomainObjExitMonitorInternal(driver, obj);
1197
}
1198 1199

/*
1200
 * obj must be locked before calling
1201 1202
 *
 * To be called immediately before any QEMU monitor API call.
1203
 * Must have already either called qemuDomainObjBeginJob()
1204 1205 1206 1207 1208
 * and checked that the VM is still active, with asyncJob of
 * QEMU_ASYNC_JOB_NONE; or already called qemuDomainObjBeginAsyncJob,
 * with the same asyncJob.
 *
 * Returns 0 if job was started, in which case this must be followed with
1209
 * qemuDomainObjExitMonitor(); or -1 if the job could not be
1210 1211 1212
 * started (probably because the vm exited in the meantime).
 */
int
1213
qemuDomainObjEnterMonitorAsync(virQEMUDriverPtr driver,
1214 1215
                               virDomainObjPtr obj,
                               enum qemuDomainAsyncJob asyncJob)
1216
{
1217
    return qemuDomainObjEnterMonitorInternal(driver, obj, asyncJob);
1218 1219
}

D
Daniel P. Berrange 已提交
1220 1221


1222 1223 1224 1225 1226 1227 1228 1229 1230 1231 1232
/*
 * obj must be locked before calling
 *
 * To be called immediately before any QEMU agent API call.
 * Must have already called qemuDomainObjBeginJob() and checked
 * that the VM is still active.
 *
 * To be followed with qemuDomainObjExitAgent() once complete
 */
void
qemuDomainObjEnterAgent(virDomainObjPtr obj)
D
Daniel P. Berrange 已提交
1233 1234 1235
{
    qemuDomainObjPrivatePtr priv = obj->privateData;

1236
    virObjectLock(priv->agent);
1237
    virObjectRef(priv->agent);
D
Daniel P. Berrange 已提交
1238
    ignore_value(virTimeMillisNow(&priv->agentStart));
1239
    virObjectUnlock(obj);
D
Daniel P. Berrange 已提交
1240 1241
}

1242 1243 1244 1245 1246 1247 1248

/* obj must NOT be locked before calling
 *
 * Should be paired with an earlier qemuDomainObjEnterAgent() call
 */
void
qemuDomainObjExitAgent(virDomainObjPtr obj)
D
Daniel P. Berrange 已提交
1249 1250
{
    qemuDomainObjPrivatePtr priv = obj->privateData;
1251
    bool hasRefs;
D
Daniel P. Berrange 已提交
1252

1253
    hasRefs = virObjectUnref(priv->agent);
D
Daniel P. Berrange 已提交
1254

1255
    if (hasRefs)
1256
        virObjectUnlock(priv->agent);
D
Daniel P. Berrange 已提交
1257

1258
    virObjectLock(obj);
D
Daniel P. Berrange 已提交
1259 1260

    priv->agentStart = 0;
1261
    if (!hasRefs)
D
Daniel P. Berrange 已提交
1262 1263 1264
        priv->agent = NULL;
}

1265
void qemuDomainObjEnterRemote(virDomainObjPtr obj)
1266
{
1267
    virObjectRef(obj);
1268
    virObjectUnlock(obj);
1269 1270
}

1271
void qemuDomainObjExitRemote(virDomainObjPtr obj)
1272
{
1273
    virObjectLock(obj);
1274
    virObjectUnref(obj);
1275
}
1276 1277


1278 1279 1280 1281 1282 1283 1284 1285 1286 1287 1288 1289 1290 1291 1292 1293 1294 1295 1296 1297 1298 1299 1300 1301 1302 1303 1304 1305 1306
virDomainDefPtr
qemuDomainDefCopy(virQEMUDriverPtr driver,
                  virDomainDefPtr src,
                  unsigned int flags)
{
    virBuffer buf = VIR_BUFFER_INITIALIZER;
    virDomainDefPtr ret = NULL;
    virCapsPtr caps = NULL;
    const char *xml = NULL;

    if (qemuDomainDefFormatBuf(driver, src, flags, &buf) < 0)
        goto cleanup;

    xml = virBufferContentAndReset(&buf);

    if (!(caps = virQEMUDriverGetCapabilities(driver, false)))
        goto cleanup;

    if (!(ret = virDomainDefParseString(xml, caps, driver->xmlopt,
                                        QEMU_EXPECTED_VIRT_TYPES,
                                        VIR_DOMAIN_XML_INACTIVE)))
        goto cleanup;

cleanup:
    VIR_FREE(xml);
    virObjectUnref(caps);
    return ret;
}

1307
int
1308
qemuDomainDefFormatBuf(virQEMUDriverPtr driver,
1309 1310 1311
                       virDomainDefPtr def,
                       unsigned int flags,
                       virBuffer *buf)
1312
{
1313
    int ret = -1;
1314
    virCPUDefPtr cpu = NULL;
1315
    virCPUDefPtr def_cpu = def->cpu;
1316 1317
    virDomainControllerDefPtr *controllers = NULL;
    int ncontrollers = 0;
1318 1319 1320 1321
    virCapsPtr caps = NULL;

    if (!(caps = virQEMUDriverGetCapabilities(driver, false)))
        goto cleanup;
1322 1323

    /* Update guest CPU requirements according to host CPU */
1324 1325 1326
    if ((flags & VIR_DOMAIN_XML_UPDATE_CPU) &&
        def_cpu &&
        (def_cpu->mode != VIR_CPU_MODE_CUSTOM || def_cpu->model)) {
1327 1328
        if (!caps->host.cpu ||
            !caps->host.cpu->model) {
1329 1330
            virReportError(VIR_ERR_OPERATION_FAILED,
                           "%s", _("cannot get host CPU capabilities"));
1331 1332 1333
            goto cleanup;
        }

1334
        if (!(cpu = virCPUDefCopy(def_cpu)) ||
1335
            cpuUpdate(cpu, caps->host.cpu) < 0)
1336 1337 1338 1339
            goto cleanup;
        def->cpu = cpu;
    }

1340
    if ((flags & VIR_DOMAIN_XML_MIGRATABLE)) {
1341
        int i;
1342
        int toremove = 0;
1343
        virDomainControllerDefPtr usb = NULL, pci = NULL;
1344 1345 1346 1347 1348 1349 1350 1351 1352 1353 1354 1355 1356 1357 1358 1359 1360 1361

        /* If only the default USB controller is present, we can remove it
         * and make the XML compatible with older versions of libvirt which
         * didn't support USB controllers in the XML but always added the
         * default one to qemu anyway.
         */
        for (i = 0; i < def->ncontrollers; i++) {
            if (def->controllers[i]->type == VIR_DOMAIN_CONTROLLER_TYPE_USB) {
                if (usb) {
                    usb = NULL;
                    break;
                }
                usb = def->controllers[i];
            }
        }
        if (usb && usb->idx == 0 && usb->model == -1) {
            VIR_DEBUG("Removing default USB controller from domain '%s'"
                      " for migration compatibility", def->name);
1362
            toremove++;
1363 1364 1365 1366 1367 1368 1369 1370 1371 1372 1373 1374 1375 1376 1377 1378 1379 1380 1381 1382
        } else {
            usb = NULL;
        }

        /* Remove the default PCI controller if there is only one present
         * and its model is pci-root */
        for (i = 0; i < def->ncontrollers; i++) {
            if (def->controllers[i]->type == VIR_DOMAIN_CONTROLLER_TYPE_PCI) {
                if (pci) {
                    pci = NULL;
                    break;
                }
                pci = def->controllers[i];
            }
        }

        if (pci && pci->idx == 0 &&
            pci->model == VIR_DOMAIN_CONTROLLER_MODEL_PCI_ROOT) {
            VIR_DEBUG("Removing default 'pci-root' from domain '%s'"
                      " for migration compatibility", def->name);
1383
            toremove++;
1384 1385 1386 1387
        } else {
            pci = NULL;
        }

1388
        if (toremove) {
1389 1390
            controllers = def->controllers;
            ncontrollers = def->ncontrollers;
1391
            if (VIR_ALLOC_N(def->controllers, ncontrollers - toremove) < 0) {
1392 1393 1394 1395 1396 1397 1398
                controllers = NULL;
                virReportOOMError();
                goto cleanup;
            }

            def->ncontrollers = 0;
            for (i = 0; i < ncontrollers; i++) {
1399
                if (controllers[i] != usb && controllers[i] != pci)
1400 1401 1402
                    def->controllers[def->ncontrollers++] = controllers[i];
            }
        }
1403 1404


1405 1406
    }

1407
    ret = virDomainDefFormatInternal(def, flags, buf);
1408 1409 1410 1411

cleanup:
    def->cpu = def_cpu;
    virCPUDefFree(cpu);
1412 1413 1414 1415 1416
    if (controllers) {
        VIR_FREE(def->controllers);
        def->controllers = controllers;
        def->ncontrollers = ncontrollers;
    }
1417
    virObjectUnref(caps);
1418 1419
    return ret;
}
1420

1421
char *qemuDomainDefFormatXML(virQEMUDriverPtr driver,
1422
                             virDomainDefPtr def,
1423
                             unsigned int flags)
1424 1425 1426
{
    virBuffer buf = VIR_BUFFER_INITIALIZER;

1427
    if (qemuDomainDefFormatBuf(driver, def, flags, &buf) < 0) {
1428 1429 1430 1431 1432 1433 1434 1435 1436 1437 1438 1439 1440
        virBufferFreeAndReset(&buf);
        return NULL;
    }

    if (virBufferError(&buf)) {
        virReportOOMError();
        virBufferFreeAndReset(&buf);
        return NULL;
    }

    return virBufferContentAndReset(&buf);
}

1441
char *qemuDomainFormatXML(virQEMUDriverPtr driver,
1442
                          virDomainObjPtr vm,
1443
                          unsigned int flags)
1444 1445 1446 1447 1448 1449 1450 1451
{
    virDomainDefPtr def;

    if ((flags & VIR_DOMAIN_XML_INACTIVE) && vm->newDef)
        def = vm->newDef;
    else
        def = vm->def;

1452
    return qemuDomainDefFormatXML(driver, def, flags);
1453 1454
}

1455
char *
1456
qemuDomainDefFormatLive(virQEMUDriverPtr driver,
1457
                        virDomainDefPtr def,
1458 1459
                        bool inactive,
                        bool compatible)
1460 1461 1462 1463 1464
{
    unsigned int flags = QEMU_DOMAIN_FORMAT_LIVE_FLAGS;

    if (inactive)
        flags |= VIR_DOMAIN_XML_INACTIVE;
1465 1466
    if (compatible)
        flags |= VIR_DOMAIN_XML_MIGRATABLE;
1467

1468
    return qemuDomainDefFormatXML(driver, def, flags);
1469 1470
}

1471

1472
void qemuDomainObjTaint(virQEMUDriverPtr driver,
1473
                        virDomainObjPtr obj,
1474 1475
                        enum virDomainTaintFlags taint,
                        int logFD)
1476
{
1477 1478
    virErrorPtr orig_err = NULL;

1479 1480 1481 1482 1483 1484 1485 1486 1487
    if (virDomainObjTaint(obj, taint)) {
        char uuidstr[VIR_UUID_STRING_BUFLEN];
        virUUIDFormat(obj->def->uuid, uuidstr);

        VIR_WARN("Domain id=%d name='%s' uuid=%s is tainted: %s",
                 obj->def->id,
                 obj->def->name,
                 uuidstr,
                 virDomainTaintTypeToString(taint));
1488 1489 1490 1491 1492 1493 1494 1495 1496 1497 1498 1499 1500 1501

        /* We don't care about errors logging taint info, so
         * preserve original error, and clear any error that
         * is raised */
        orig_err = virSaveLastError();
        if (qemuDomainAppendLog(driver, obj, logFD,
                                "Domain id=%d is tainted: %s\n",
                                obj->def->id,
                                virDomainTaintTypeToString(taint)) < 0)
            virResetLastError();
        if (orig_err) {
            virSetError(orig_err);
            virFreeError(orig_err);
        }
1502 1503 1504 1505
    }
}


1506
void qemuDomainObjCheckTaint(virQEMUDriverPtr driver,
1507 1508
                             virDomainObjPtr obj,
                             int logFD)
1509 1510
{
    int i;
1511
    virQEMUDriverConfigPtr cfg = virQEMUDriverGetConfig(driver);
1512

1513 1514 1515 1516
    if (cfg->privileged &&
        (!cfg->clearEmulatorCapabilities ||
         cfg->user == 0 ||
         cfg->group == 0))
1517
        qemuDomainObjTaint(driver, obj, VIR_DOMAIN_TAINT_HIGH_PRIVILEGES, logFD);
1518 1519 1520 1521

    if (obj->def->namespaceData) {
        qemuDomainCmdlineDefPtr qemucmd = obj->def->namespaceData;
        if (qemucmd->num_args || qemucmd->num_env)
1522
            qemuDomainObjTaint(driver, obj, VIR_DOMAIN_TAINT_CUSTOM_ARGV, logFD);
1523 1524
    }

1525 1526 1527
    if (obj->def->cpu && obj->def->cpu->mode == VIR_CPU_MODE_HOST_PASSTHROUGH)
        qemuDomainObjTaint(driver, obj, VIR_DOMAIN_TAINT_HOST_CPU, logFD);

1528
    for (i = 0; i < obj->def->ndisks; i++)
1529
        qemuDomainObjCheckDiskTaint(driver, obj, obj->def->disks[i], logFD);
1530

1531
    for (i = 0; i < obj->def->nnets; i++)
1532
        qemuDomainObjCheckNetTaint(driver, obj, obj->def->nets[i], logFD);
1533 1534

    virObjectUnref(cfg);
1535 1536 1537
}


1538
void qemuDomainObjCheckDiskTaint(virQEMUDriverPtr driver,
1539
                                 virDomainObjPtr obj,
1540 1541
                                 virDomainDiskDefPtr disk,
                                 int logFD)
1542
{
1543 1544
    virQEMUDriverConfigPtr cfg = virQEMUDriverGetConfig(driver);

1545
    if ((!disk->format || disk->format == VIR_STORAGE_FILE_AUTO) &&
1546
        cfg->allowDiskFormatProbing)
1547
        qemuDomainObjTaint(driver, obj, VIR_DOMAIN_TAINT_DISK_PROBING, logFD);
1548

1549
    if (disk->rawio == 1)
1550
        qemuDomainObjTaint(driver, obj, VIR_DOMAIN_TAINT_HIGH_PRIVILEGES, logFD);
1551 1552

    virObjectUnref(cfg);
1553 1554 1555
}


1556
void qemuDomainObjCheckNetTaint(virQEMUDriverPtr driver,
1557
                                virDomainObjPtr obj,
1558 1559
                                virDomainNetDefPtr net,
                                int logFD)
1560
{
1561 1562 1563 1564 1565 1566
    /* script is only useful for NET_TYPE_ETHERNET (qemu) and
     * NET_TYPE_BRIDGE (xen), but could be (incorrectly) specified for
     * any interface type. In any case, it's adding user sauce into
     * the soup, so it should taint the domain.
     */
    if (net->script != NULL)
1567
        qemuDomainObjTaint(driver, obj, VIR_DOMAIN_TAINT_SHELL_SCRIPTS, logFD);
1568
}
1569 1570 1571


static int
1572
qemuDomainOpenLogHelper(virQEMUDriverConfigPtr cfg,
1573
                        virDomainObjPtr vm,
E
Eric Blake 已提交
1574
                        int oflags,
1575 1576 1577 1578
                        mode_t mode)
{
    char *logfile;
    int fd = -1;
1579
    bool trunc = false;
1580

1581
    if (virAsprintf(&logfile, "%s/%s.log", cfg->logDir, vm->def->name) < 0) {
1582 1583 1584 1585
        virReportOOMError();
        return -1;
    }

1586 1587 1588 1589 1590 1591 1592 1593 1594
    /* To make SELinux happy we always need to open in append mode.
     * So we fake O_TRUNC by calling ftruncate after open instead
     */
    if (oflags & O_TRUNC) {
        oflags &= ~O_TRUNC;
        oflags |= O_APPEND;
        trunc = true;
    }

E
Eric Blake 已提交
1595
    if ((fd = open(logfile, oflags, mode)) < 0) {
1596 1597 1598 1599 1600 1601 1602
        virReportSystemError(errno, _("failed to create logfile %s"),
                             logfile);
        goto cleanup;
    }
    if (virSetCloseExec(fd) < 0) {
        virReportSystemError(errno, _("failed to set close-on-exec flag on %s"),
                             logfile);
1603 1604 1605 1606 1607 1608 1609
        VIR_FORCE_CLOSE(fd);
        goto cleanup;
    }
    if (trunc &&
        ftruncate(fd, 0) < 0) {
        virReportSystemError(errno, _("failed to truncate %s"),
                             logfile);
1610 1611 1612 1613 1614 1615 1616 1617 1618 1619 1620
        VIR_FORCE_CLOSE(fd);
        goto cleanup;
    }

cleanup:
    VIR_FREE(logfile);
    return fd;
}


int
1621
qemuDomainCreateLog(virQEMUDriverPtr driver, virDomainObjPtr vm,
E
Eric Blake 已提交
1622
                    bool append)
1623
{
1624
    virQEMUDriverConfigPtr cfg = virQEMUDriverGetConfig(driver);
E
Eric Blake 已提交
1625
    int oflags;
1626
    int ret;
1627

E
Eric Blake 已提交
1628
    oflags = O_CREAT | O_WRONLY;
1629
    /* Only logrotate files in /var/log, so only append if running privileged */
1630
    if (cfg->privileged || append)
E
Eric Blake 已提交
1631
        oflags |= O_APPEND;
1632
    else
E
Eric Blake 已提交
1633
        oflags |= O_TRUNC;
1634

1635 1636 1637
    ret = qemuDomainOpenLogHelper(cfg, vm, oflags, S_IRUSR | S_IWUSR);
    virObjectUnref(cfg);
    return ret;
1638 1639 1640 1641
}


int
1642
qemuDomainOpenLog(virQEMUDriverPtr driver, virDomainObjPtr vm, off_t pos)
1643
{
1644
    virQEMUDriverConfigPtr cfg = virQEMUDriverGetConfig(driver);
1645 1646 1647 1648
    int fd;
    off_t off;
    int whence;

1649 1650 1651
    fd = qemuDomainOpenLogHelper(cfg, vm, O_RDONLY, 0);
    virObjectUnref(cfg);
    if (fd < 0)
1652 1653 1654 1655 1656 1657 1658 1659 1660 1661 1662 1663 1664 1665 1666 1667 1668 1669 1670 1671 1672 1673 1674 1675 1676 1677
        return -1;

    if (pos < 0) {
        off = 0;
        whence = SEEK_END;
    } else {
        off = pos;
        whence = SEEK_SET;
    }

    if (lseek(fd, off, whence) < 0) {
        if (whence == SEEK_END)
            virReportSystemError(errno,
                                 _("unable to seek to end of log for %s"),
                                 vm->def->name);
        else
            virReportSystemError(errno,
                                 _("unable to seek to %lld from start for %s"),
                                 (long long)off, vm->def->name);
        VIR_FORCE_CLOSE(fd);
    }

    return fd;
}


1678
int qemuDomainAppendLog(virQEMUDriverPtr driver,
1679 1680 1681 1682 1683 1684 1685 1686 1687 1688 1689 1690 1691 1692 1693 1694 1695 1696 1697 1698 1699 1700 1701 1702 1703 1704 1705 1706 1707 1708 1709 1710 1711
                        virDomainObjPtr obj,
                        int logFD,
                        const char *fmt, ...)
{
    int fd = logFD;
    va_list argptr;
    char *message = NULL;
    int ret = -1;

    va_start(argptr, fmt);

    if ((fd == -1) &&
        (fd = qemuDomainCreateLog(driver, obj, true)) < 0)
        goto cleanup;

    if (virVasprintf(&message, fmt, argptr) < 0) {
        virReportOOMError();
        goto cleanup;
    }
    if (safewrite(fd, message, strlen(message)) < 0) {
        virReportSystemError(errno, _("Unable to write to domain logfile %s"),
                             obj->def->name);
        goto cleanup;
    }

    ret = 0;

cleanup:
    va_end(argptr);

    if (fd != logFD)
        VIR_FORCE_CLOSE(fd);

O
Osier Yang 已提交
1712
    VIR_FREE(message);
1713 1714
    return ret;
}
1715 1716 1717

/* Locate an appropriate 'qemu-img' binary.  */
const char *
1718
qemuFindQemuImgBinary(virQEMUDriverPtr driver)
1719
{
1720 1721 1722
    if (!driver->qemuImgBinary)
        virReportError(VIR_ERR_INTERNAL_ERROR,
                       "%s", _("unable to find kvm-img or qemu-img"));
1723 1724 1725 1726 1727 1728 1729 1730 1731 1732 1733 1734 1735 1736 1737 1738 1739

    return driver->qemuImgBinary;
}

int
qemuDomainSnapshotWriteMetadata(virDomainObjPtr vm,
                                virDomainSnapshotObjPtr snapshot,
                                char *snapshotDir)
{
    char *newxml = NULL;
    int ret = -1;
    char *snapDir = NULL;
    char *snapFile = NULL;
    char uuidstr[VIR_UUID_STRING_BUFLEN];

    virUUIDFormat(vm->def->uuid, uuidstr);
    newxml = virDomainSnapshotDefFormat(uuidstr, snapshot->def,
1740 1741
                                        QEMU_DOMAIN_FORMAT_LIVE_FLAGS, 1);
    if (newxml == NULL)
1742 1743 1744 1745 1746 1747 1748 1749 1750 1751 1752 1753 1754 1755 1756 1757 1758
        return -1;

    if (virAsprintf(&snapDir, "%s/%s", snapshotDir, vm->def->name) < 0) {
        virReportOOMError();
        goto cleanup;
    }
    if (virFileMakePath(snapDir) < 0) {
        virReportSystemError(errno, _("cannot create snapshot directory '%s'"),
                             snapDir);
        goto cleanup;
    }

    if (virAsprintf(&snapFile, "%s/%s.xml", snapDir, snapshot->def->name) < 0) {
        virReportOOMError();
        goto cleanup;
    }

J
Ján Tomko 已提交
1759
    ret = virXMLSaveFile(snapFile, NULL, "snapshot-edit", newxml);
1760 1761 1762 1763 1764 1765 1766 1767 1768 1769

cleanup:
    VIR_FREE(snapFile);
    VIR_FREE(snapDir);
    VIR_FREE(newxml);
    return ret;
}

/* The domain is expected to be locked and inactive. Return -1 on normal
 * failure, 1 if we skipped a disk due to try_all.  */
1770
static int
1771
qemuDomainSnapshotForEachQcow2Raw(virQEMUDriverPtr driver,
1772 1773 1774 1775 1776
                                  virDomainDefPtr def,
                                  const char *name,
                                  const char *op,
                                  bool try_all,
                                  int ndisks)
1777 1778 1779 1780 1781 1782 1783 1784 1785 1786 1787 1788
{
    const char *qemuimgarg[] = { NULL, "snapshot", NULL, NULL, NULL, NULL };
    int i;
    bool skipped = false;

    qemuimgarg[0] = qemuFindQemuImgBinary(driver);
    if (qemuimgarg[0] == NULL) {
        /* qemuFindQemuImgBinary set the error */
        return -1;
    }

    qemuimgarg[2] = op;
1789
    qemuimgarg[3] = name;
1790

1791
    for (i = 0; i < ndisks; i++) {
1792
        /* FIXME: we also need to handle LVM here */
1793
        if (def->disks[i]->device == VIR_DOMAIN_DISK_DEVICE_DISK) {
1794 1795
            if (def->disks[i]->format > 0 &&
                def->disks[i]->format != VIR_STORAGE_FILE_QCOW2) {
1796 1797 1798 1799 1800
                if (try_all) {
                    /* Continue on even in the face of error, since other
                     * disks in this VM may have the same snapshot name.
                     */
                    VIR_WARN("skipping snapshot action on %s",
1801
                             def->disks[i]->dst);
1802 1803
                    skipped = true;
                    continue;
1804 1805 1806 1807 1808
                } else if (STREQ(op, "-c") && i) {
                    /* We must roll back partial creation by deleting
                     * all earlier snapshots.  */
                    qemuDomainSnapshotForEachQcow2Raw(driver, def, name,
                                                      "-d", false, i);
1809
                }
1810 1811 1812 1813
                virReportError(VIR_ERR_OPERATION_INVALID,
                               _("Disk device '%s' does not support"
                                 " snapshotting"),
                               def->disks[i]->dst);
1814 1815 1816
                return -1;
            }

1817
            qemuimgarg[4] = def->disks[i]->src;
1818 1819 1820 1821

            if (virRun(qemuimgarg, NULL) < 0) {
                if (try_all) {
                    VIR_WARN("skipping snapshot action on %s",
1822
                             def->disks[i]->dst);
1823 1824
                    skipped = true;
                    continue;
1825 1826 1827 1828 1829
                } else if (STREQ(op, "-c") && i) {
                    /* We must roll back partial creation by deleting
                     * all earlier snapshots.  */
                    qemuDomainSnapshotForEachQcow2Raw(driver, def, name,
                                                      "-d", false, i);
1830 1831 1832 1833 1834 1835 1836 1837 1838
                }
                return -1;
            }
        }
    }

    return skipped ? 1 : 0;
}

1839 1840 1841
/* The domain is expected to be locked and inactive. Return -1 on normal
 * failure, 1 if we skipped a disk due to try_all.  */
int
1842
qemuDomainSnapshotForEachQcow2(virQEMUDriverPtr driver,
1843 1844 1845 1846 1847 1848 1849 1850 1851 1852 1853 1854 1855 1856 1857 1858
                               virDomainObjPtr vm,
                               virDomainSnapshotObjPtr snap,
                               const char *op,
                               bool try_all)
{
    /* Prefer action on the disks in use at the time the snapshot was
     * created; but fall back to current definition if dealing with a
     * snapshot created prior to libvirt 0.9.5.  */
    virDomainDefPtr def = snap->def->dom;

    if (!def)
        def = vm->def;
    return qemuDomainSnapshotForEachQcow2Raw(driver, def, snap->def->name,
                                             op, try_all, def->ndisks);
}

1859 1860
/* Discard one snapshot (or its metadata), without reparenting any children.  */
int
1861
qemuDomainSnapshotDiscard(virQEMUDriverPtr driver,
1862 1863 1864 1865 1866 1867 1868 1869 1870
                          virDomainObjPtr vm,
                          virDomainSnapshotObjPtr snap,
                          bool update_current,
                          bool metadata_only)
{
    char *snapFile = NULL;
    int ret = -1;
    qemuDomainObjPrivatePtr priv;
    virDomainSnapshotObjPtr parentsnap = NULL;
1871
    virQEMUDriverConfigPtr cfg = virQEMUDriverGetConfig(driver);
1872 1873 1874 1875 1876 1877 1878 1879 1880

    if (!metadata_only) {
        if (!virDomainObjIsActive(vm)) {
            /* Ignore any skipped disks */
            if (qemuDomainSnapshotForEachQcow2(driver, vm, snap, "-d",
                                               true) < 0)
                goto cleanup;
        } else {
            priv = vm->privateData;
1881
            qemuDomainObjEnterMonitor(driver, vm);
1882 1883
            /* we continue on even in the face of error */
            qemuMonitorDeleteSnapshot(priv->mon, snap->def->name);
1884
            qemuDomainObjExitMonitor(driver, vm);
1885 1886 1887
        }
    }

1888
    if (virAsprintf(&snapFile, "%s/%s/%s.xml", cfg->snapshotDir,
1889 1890 1891 1892 1893 1894 1895
                    vm->def->name, snap->def->name) < 0) {
        virReportOOMError();
        goto cleanup;
    }

    if (snap == vm->current_snapshot) {
        if (update_current && snap->def->parent) {
1896
            parentsnap = virDomainSnapshotFindByName(vm->snapshots,
1897 1898 1899 1900 1901 1902 1903
                                                     snap->def->parent);
            if (!parentsnap) {
                VIR_WARN("missing parent snapshot matching name '%s'",
                         snap->def->parent);
            } else {
                parentsnap->def->current = true;
                if (qemuDomainSnapshotWriteMetadata(vm, parentsnap,
1904
                                                    cfg->snapshotDir) < 0) {
1905 1906 1907 1908 1909 1910 1911 1912 1913 1914 1915 1916
                    VIR_WARN("failed to set parent snapshot '%s' as current",
                             snap->def->parent);
                    parentsnap->def->current = false;
                    parentsnap = NULL;
                }
            }
        }
        vm->current_snapshot = parentsnap;
    }

    if (unlink(snapFile) < 0)
        VIR_WARN("Failed to unlink %s", snapFile);
1917
    virDomainSnapshotObjListRemove(vm->snapshots, snap);
1918 1919 1920 1921 1922

    ret = 0;

cleanup:
    VIR_FREE(snapFile);
1923
    virObjectUnref(cfg);
1924 1925 1926 1927 1928 1929 1930 1931 1932
    return ret;
}

/* Hash iterator callback to discard multiple snapshots.  */
void qemuDomainSnapshotDiscardAll(void *payload,
                                  const void *name ATTRIBUTE_UNUSED,
                                  void *data)
{
    virDomainSnapshotObjPtr snap = payload;
1933
    virQEMUSnapRemovePtr curr = data;
1934 1935 1936 1937 1938 1939 1940 1941 1942 1943 1944
    int err;

    if (snap->def->current)
        curr->current = true;
    err = qemuDomainSnapshotDiscard(curr->driver, curr->vm, snap, false,
                                    curr->metadata_only);
    if (err && !curr->err)
        curr->err = err;
}

int
1945
qemuDomainSnapshotDiscardAllMetadata(virQEMUDriverPtr driver,
1946 1947
                                     virDomainObjPtr vm)
{
1948
    virQEMUSnapRemove rem;
1949 1950 1951 1952 1953

    rem.driver = driver;
    rem.vm = vm;
    rem.metadata_only = true;
    rem.err = 0;
1954 1955
    virDomainSnapshotForEach(vm->snapshots, qemuDomainSnapshotDiscardAll,
                             &rem);
1956 1957 1958 1959 1960

    return rem.err;
}

/*
1961
 * The caller must hold a lock the vm and there must
1962 1963 1964
 * be no remaining references to vm.
 */
void
1965
qemuDomainRemoveInactive(virQEMUDriverPtr driver,
1966 1967
                         virDomainObjPtr vm)
{
1968
    char *snapDir;
1969
    virQEMUDriverConfigPtr cfg = virQEMUDriverGetConfig(driver);
1970

1971 1972 1973 1974 1975
    /* Remove any snapshot metadata prior to removing the domain */
    if (qemuDomainSnapshotDiscardAllMetadata(driver, vm) < 0) {
        VIR_WARN("unable to remove all snapshots for domain %s",
                 vm->def->name);
    }
1976
    else if (virAsprintf(&snapDir, "%s/%s", cfg->snapshotDir,
1977 1978
                         vm->def->name) < 0) {
        VIR_WARN("unable to remove snapshot directory %s/%s",
1979
                 cfg->snapshotDir, vm->def->name);
1980 1981 1982 1983 1984
    } else {
        if (rmdir(snapDir) < 0 && errno != ENOENT)
            VIR_WARN("unable to remove snapshot directory %s", snapDir);
        VIR_FREE(snapDir);
    }
1985
    virDomainObjListRemove(driver->domains, vm);
1986
    virObjectUnref(cfg);
1987
}
1988 1989

void
1990
qemuDomainSetFakeReboot(virQEMUDriverPtr driver,
1991 1992 1993 1994
                        virDomainObjPtr vm,
                        bool value)
{
    qemuDomainObjPrivatePtr priv = vm->privateData;
1995
    virQEMUDriverConfigPtr cfg = virQEMUDriverGetConfig(driver);
1996 1997

    if (priv->fakeReboot == value)
1998
        goto cleanup;
1999 2000 2001

    priv->fakeReboot = value;

2002
    if (virDomainSaveStatus(driver->xmlopt, cfg->stateDir, vm) < 0)
2003
        VIR_WARN("Failed to save status on vm %s", vm->def->name);
2004

2005
cleanup:
2006
    virObjectUnref(cfg);
2007
}
M
Michal Privoznik 已提交
2008 2009

int
2010
qemuDomainCheckDiskPresence(virQEMUDriverPtr driver,
M
Michal Privoznik 已提交
2011
                            virDomainObjPtr vm,
2012
                            bool cold_boot)
M
Michal Privoznik 已提交
2013 2014 2015 2016
{
    int ret = -1;
    int i;
    virDomainDiskDefPtr disk;
M
Michal Privoznik 已提交
2017
    char uuid[VIR_UUID_STRING_BUFLEN];
2018
    virDomainEventPtr event = NULL;
2019
    virQEMUDriverConfigPtr cfg = virQEMUDriverGetConfig(driver);
M
Michal Privoznik 已提交
2020 2021 2022 2023 2024 2025 2026 2027 2028

    virUUIDFormat(vm->def->uuid, uuid);

    for (i = 0; i < vm->def->ndisks; i++) {
        disk = vm->def->disks[i];

        if (!disk->startupPolicy || !disk->src)
            continue;

M
Michal Privoznik 已提交
2029
        if (virFileAccessibleAs(disk->src, F_OK,
2030 2031
                                cfg->user,
                                cfg->group) >= 0) {
M
Michal Privoznik 已提交
2032
            /* disk accessible */
M
Michal Privoznik 已提交
2033 2034 2035 2036 2037 2038 2039 2040
            continue;
        }

        switch ((enum virDomainStartupPolicy) disk->startupPolicy) {
            case VIR_DOMAIN_STARTUP_POLICY_OPTIONAL:
                break;

            case VIR_DOMAIN_STARTUP_POLICY_MANDATORY:
M
Michal Privoznik 已提交
2041
                virReportSystemError(errno,
M
Michal Privoznik 已提交
2042 2043 2044 2045 2046 2047
                                     _("cannot access file '%s'"),
                                     disk->src);
                goto cleanup;
                break;

            case VIR_DOMAIN_STARTUP_POLICY_REQUISITE:
2048
                if (cold_boot) {
M
Michal Privoznik 已提交
2049
                    virReportSystemError(errno,
M
Michal Privoznik 已提交
2050 2051 2052 2053 2054 2055 2056 2057 2058 2059 2060 2061
                                         _("cannot access file '%s'"),
                                         disk->src);
                    goto cleanup;
                }
                break;

            case VIR_DOMAIN_STARTUP_POLICY_DEFAULT:
            case VIR_DOMAIN_STARTUP_POLICY_LAST:
                /* this should never happen */
                break;
        }

M
Michal Privoznik 已提交
2062 2063
        VIR_DEBUG("Dropping disk '%s' on domain '%s' (UUID '%s') "
                  "due to inaccessible source '%s'",
M
Michal Privoznik 已提交
2064 2065
                  disk->dst, vm->def->name, uuid, disk->src);

2066
        event = virDomainEventDiskChangeNewFromObj(vm, disk->src, NULL, disk->info.alias,
2067
                                                   VIR_DOMAIN_EVENT_DISK_CHANGE_MISSING_ON_START);
2068 2069 2070
        if (event)
            qemuDomainEventQueue(driver, event);

M
Michal Privoznik 已提交
2071 2072 2073 2074 2075 2076
        VIR_FREE(disk->src);
    }

    ret = 0;

cleanup:
2077
    virObjectUnref(cfg);
M
Michal Privoznik 已提交
2078 2079
    return ret;
}
2080 2081 2082 2083 2084 2085 2086 2087 2088 2089 2090 2091 2092 2093 2094 2095 2096 2097 2098 2099 2100 2101 2102 2103 2104 2105 2106 2107 2108 2109 2110 2111 2112 2113 2114 2115 2116 2117 2118 2119 2120 2121 2122 2123 2124 2125 2126 2127 2128 2129 2130 2131 2132 2133

/*
 * The vm must be locked when any of the following cleanup functions is
 * called.
 */
int
qemuDomainCleanupAdd(virDomainObjPtr vm,
                     qemuDomainCleanupCallback cb)
{
    qemuDomainObjPrivatePtr priv = vm->privateData;
    int i;

    VIR_DEBUG("vm=%s, cb=%p", vm->def->name, cb);

    for (i = 0; i < priv->ncleanupCallbacks; i++) {
        if (priv->cleanupCallbacks[i] == cb)
            return 0;
    }

    if (VIR_RESIZE_N(priv->cleanupCallbacks,
                     priv->ncleanupCallbacks_max,
                     priv->ncleanupCallbacks, 1) < 0) {
        virReportOOMError();
        return -1;
    }

    priv->cleanupCallbacks[priv->ncleanupCallbacks++] = cb;
    return 0;
}

void
qemuDomainCleanupRemove(virDomainObjPtr vm,
                        qemuDomainCleanupCallback cb)
{
    qemuDomainObjPrivatePtr priv = vm->privateData;
    int i;

    VIR_DEBUG("vm=%s, cb=%p", vm->def->name, cb);

    for (i = 0; i < priv->ncleanupCallbacks; i++) {
        if (priv->cleanupCallbacks[i] == cb) {
            memmove(priv->cleanupCallbacks + i,
                    priv->cleanupCallbacks + i + 1,
                    priv->ncleanupCallbacks - i - 1);
            priv->ncleanupCallbacks--;
        }
    }

    VIR_SHRINK_N(priv->cleanupCallbacks,
                 priv->ncleanupCallbacks_max,
                 priv->ncleanupCallbacks_max - priv->ncleanupCallbacks);
}

void
2134
qemuDomainCleanupRun(virQEMUDriverPtr driver,
2135 2136 2137 2138 2139 2140 2141 2142 2143 2144 2145 2146 2147 2148 2149 2150 2151
                     virDomainObjPtr vm)
{
    qemuDomainObjPrivatePtr priv = vm->privateData;
    int i;

    VIR_DEBUG("driver=%p, vm=%s", driver, vm->def->name);

    /* run cleanup callbacks in reverse order */
    for (i = priv->ncleanupCallbacks - 1; i >= 0; i--) {
        if (priv->cleanupCallbacks[i])
            priv->cleanupCallbacks[i](driver, vm);
    }

    VIR_FREE(priv->cleanupCallbacks);
    priv->ncleanupCallbacks = 0;
    priv->ncleanupCallbacks_max = 0;
}
2152 2153

int
2154
qemuDomainDetermineDiskChain(virQEMUDriverPtr driver,
2155 2156 2157
                             virDomainDiskDefPtr disk,
                             bool force)
{
2158 2159
    virQEMUDriverConfigPtr cfg = virQEMUDriverGetConfig(driver);
    int ret = 0;
2160

2161 2162 2163
    if (!disk->src ||
        disk->type == VIR_DOMAIN_DISK_TYPE_NETWORK ||
        disk->type == VIR_DOMAIN_DISK_TYPE_VOLUME)
2164
        goto cleanup;
2165 2166 2167 2168 2169 2170

    if (disk->backingChain) {
        if (force) {
            virStorageFileFreeMetadata(disk->backingChain);
            disk->backingChain = NULL;
        } else {
2171
            goto cleanup;
2172 2173 2174
        }
    }
    disk->backingChain = virStorageFileGetMetadata(disk->src, disk->format,
2175 2176
                                                   cfg->user, cfg->group,
                                                   cfg->allowDiskFormatProbing);
2177
    if (!disk->backingChain)
2178 2179 2180 2181 2182
        ret = -1;

cleanup:
    virObjectUnref(cfg);
    return ret;
2183
}
2184 2185 2186 2187 2188 2189 2190 2191 2192 2193 2194 2195 2196 2197 2198 2199 2200 2201 2202 2203 2204 2205 2206 2207 2208 2209 2210 2211 2212 2213 2214 2215 2216


unsigned long long
qemuDomainMemoryLimit(virDomainDefPtr def)
{
    unsigned long long mem;
    int i;

    if (def->mem.hard_limit) {
        mem = def->mem.hard_limit;
    } else {
        /* If there is no hard_limit set, compute a reasonable one to avoid
         * system thrashing caused by exploited qemu.  A 'reasonable
         * limit' has been chosen:
         *     (1 + k) * (domain memory + total video memory) + (32MB for
         *     cache per each disk) + F
         * where k = 0.5 and F = 200MB.  The cache for disks is important as
         * kernel cache on the host side counts into the RSS limit.
         *
         * Technically, the disk cache does not have to be included in
         * RLIMIT_MEMLOCK but it doesn't hurt as it's just an upper limit and
         * it makes this function and its usage simpler.
         */
        mem = def->mem.max_balloon;
        for (i = 0; i < def->nvideos; i++)
            mem += def->videos[i]->vram;
        mem *= 1.5;
        mem += def->ndisks * 32768;
        mem += 204800;
    }

    return mem;
}