/*
 * qemu_capabilities.c: QEMU capabilities generation
 *
 * Copyright (C) 2006-2014 Red Hat, Inc.
 * Copyright (C) 2006 Daniel P. Berrange
 *
 * This library is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * This library is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with this library.  If not, see
 * <http://www.gnu.org/licenses/>.
 *
 * Author: Daniel P. Berrange <berrange@redhat.com>
 */

#include <config.h>

#include "qemu_capabilities.h"
27
#include "viralloc.h"
28
#include "vircrypto.h"
29
#include "virlog.h"
30
#include "virerror.h"
E
Eric Blake 已提交
31
#include "virfile.h"
32 33
#include "virpidfile.h"
#include "virprocess.h"
34 35 36
#include "nodeinfo.h"
#include "cpu/cpu.h"
#include "domain_conf.h"
37
#include "vircommand.h"
38
#include "virbitmap.h"
39
#include "virnodesuspend.h"
40
#include "virnuma.h"
41
#include "qemu_monitor.h"
42
#include "virstring.h"
43
#include "qemu_hostdev.h"
44

45
#include <fcntl.h>
46 47 48
#include <sys/stat.h>
#include <unistd.h>
#include <sys/wait.h>
49
#include <stdarg.h>
50 51 52

#define VIR_FROM_THIS VIR_FROM_QEMU

53 54
VIR_LOG_INIT("qemu.qemu_capabilities");

55 56 57 58
/* While not public, these strings must not change. They
 * are used in domain status files which are read on
 * daemon restarts
 */
59
VIR_ENUM_IMPL(virQEMUCaps, QEMU_CAPS_LAST,
60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
              "kqemu",  /* 0 */
              "vnc-colon",
              "no-reboot",
              "drive",
              "drive-boot",

              "name", /* 5 */
              "uuid",
              "domid",
              "vnet-hdr",
              "migrate-kvm-stdio",

              "migrate-qemu-tcp", /* 10 */
              "migrate-qemu-exec",
              "drive-cache-v2",
              "kvm",
              "drive-format",

              "vga", /* 15 */
              "0.10",
              "pci-device",
              "mem-path",
              "drive-serial",

              "xen-domid", /* 20 */
              "migrate-qemu-unix",
              "chardev",
              "enable-kvm",
              "monitor-json",

              "balloon", /* 25 */
              "device",
              "sdl",
              "smp-topology",
              "netdev",

              "rtc", /* 30 */
97
              "vhost-net",
98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130
              "rtc-td-hack",
              "no-hpet",
              "no-kvm-pit",

              "tdf", /* 35 */
              "pci-configfd",
              "nodefconfig",
              "boot-menu",
              "enable-kqemu",

              "fsdev", /* 40 */
              "nesting",
              "name-process",
              "drive-readonly",
              "smbios-type",

              "vga-qxl", /* 45 */
              "spice",
              "vga-none",
              "migrate-qemu-fd",
              "boot-index",

              "hda-duplex", /* 50 */
              "drive-aio",
              "pci-multibus",
              "pci-bootindex",
              "ccid-emulated",

              "ccid-passthru", /* 55 */
              "chardev-spicevmc",
              "device-spicevmc",
              "virtio-tx-alg",
              "device-qxl-vga",
131 132

              "pci-multifunction", /* 60 */
133
              "virtio-blk-pci.ioeventfd",
M
Michal Privoznik 已提交
134
              "sga",
135 136
              "virtio-blk-pci.event_idx",
              "virtio-net-pci.event_idx",
137 138 139 140 141 142 143 144 145 146

              "cache-directsync", /* 65 */
              "piix3-usb-uhci",
              "piix4-usb-uhci",
              "usb-ehci",
              "ich9-usb-ehci1",

              "vt82c686b-usb-uhci", /* 70 */
              "pci-ohci",
              "usb-redir",
M
Marc-André Lureau 已提交
147
              "usb-hub",
148
              "no-shutdown",
149 150

              "cache-unsafe", /* 75 */
151
              "rombar",
J
Jim Fehlig 已提交
152
              "ich9-ahci",
153
              "no-acpi",
154
              "fsdev-readonly",
155

156
              "virtio-blk-pci.scsi", /* 80 */
157
              "blk-sg-io",
O
Osier Yang 已提交
158
              "drive-copy-on-read",
159
              "cpu-host",
160
              "fsdev-writeout",
161 162

              "drive-iotune", /* 85 */
163
              "system_wakeup",
164
              "scsi-disk.channel",
165
              "scsi-block",
166
              "transaction",
167 168 169

              "block-job-sync", /* 90 */
              "block-job-async",
170
              "scsi-cd",
171
              "ide-cd",
172
              "no-user-config",
M
Marc-André Lureau 已提交
173 174

              "hda-micro", /* 95 */
175
              "dump-guest-memory",
G
Gerd Hoffmann 已提交
176
              "nec-usb-xhci",
177
              "virtio-s390",
178
              "balloon-event",
M
Marc-André Lureau 已提交
179

R
Richa Marwaha 已提交
180
              "bridge", /* 100 */
181 182
              "lsi",
              "virtio-scsi-pci",
V
Viktor Mihajlovski 已提交
183
              "blockio",
184
              "disable-s3",
R
Richa Marwaha 已提交
185

186
              "disable-s4", /* 105 */
187
              "usb-redir.filter",
188 189
              "ide-drive.wwn",
              "scsi-disk.wwn",
190
              "seccomp-sandbox",
191 192

              "reboot-timeout", /* 110 */
193
              "dump-guest-core",
194
              "seamless-migration",
195
              "block-commit",
196
              "vnc",
197 198

              "drive-mirror", /* 115 */
199 200
              "usb-redir.bootindex",
              "usb-host.bootindex",
201
              "blockdev-snapshot-sync",
202 203 204 205 206 207
              "qxl",

              "VGA", /* 120 */
              "cirrus-vga",
              "vmware-svga",
              "device-video-primary",
208
              "s390-sclp",
209 210

              "usb-serial", /* 125 */
G
Guannan Ren 已提交
211
              "usb-net",
212
              "add-fd",
213
              "nbd-server",
214 215 216
              "virtio-rng",

              "rng-random", /* 130 */
217
              "rng-egd",
O
Olivia Yin 已提交
218 219
              "virtio-ccw",
              "dtb",
220
              "megasas",
J
Ján Tomko 已提交
221 222

              "ipv6-migration", /* 135 */
223
              "machine-opt",
L
Li Zhang 已提交
224
              "machine-usb-opt",
S
Stefan Berger 已提交
225 226
              "tpm-passthrough",
              "tpm-tis",
227 228

              "nvram",  /* 140 */
H
Han Cheng 已提交
229 230 231 232 233 234
              "pci-bridge",
              "vfio-pci",
              "vfio-pci.bootindex",
              "scsi-generic",

              "scsi-generic.bootindex", /* 145 */
235
              "mem-merge",
236
              "vnc-websocket",
O
Osier Yang 已提交
237
              "drive-discard",
238
              "mlock",
239 240

              "vnc-share-policy", /* 150 */
241
              "device-del-event",
242
              "dmi-to-pci-bridge",
243 244
              "i440fx-pci-hole64-size",
              "q35-pci-hole64-size",
245 246

              "usb-storage", /* 155 */
247
              "usb-storage.removable",
248
              "virtio-mmio",
249
              "ich9-intel-hda",
250
              "kvm-pit-lost-tick-policy",
251 252

              "boot-strict", /* 160 */
253 254
              "pvpanic",
              "enable-fips",
255 256
              "spice-file-xfer-disable",
              "spiceport",
L
Li Zhang 已提交
257 258

              "usb-kbd", /* 165 */
259
              "host-pci-multidomain",
260
              "msg-timestamp",
261
              "active-commit",
262
              "change-backing-file",
263 264

              "memory-backend-ram", /* 170 */
265
              "numa",
266
              "memory-backend-file",
267
              "usb-audio",
268
              "rtc-reset-reinjection",
269 270

              "splash-timeout", /* 175 */
J
John Ferlan 已提交
271
              "iothread",
272
              "migrate-rdma",
273
              "ivshmem",
274 275
    );

276 277 278 279 280 281 282 283

/*
 * Update the XML parser/formatter when adding more
 * information to this struct so that it gets cached
 * correctly. It does not have to be ABI-stable, as
 * the cache will be discarded & repopulated if the
 * timestamp on the libvirtd binary changes.
 */
284
struct _virQEMUCaps {
285 286
    virObject object;

287 288
    bool usedQMP;

289
    char *binary;
290
    time_t ctime;
291

292
    virBitmapPtr flags;
293 294 295 296

    unsigned int version;
    unsigned int kvmVersion;

297
    virArch arch;
298 299 300 301 302 303 304

    size_t ncpuDefinitions;
    char **cpuDefinitions;

    size_t nmachineTypes;
    char **machineTypes;
    char **machineAliases;
305
    unsigned int *machineMaxCpus;
306 307
};

308
struct _virQEMUCapsCache {
309 310
    virMutex lock;
    virHashTablePtr binaries;
311
    char *libDir;
312
    char *cacheDir;
313 314
    uid_t runUid;
    gid_t runGid;
315 316
};

317 318 319 320
/* Carries a single architecture value.
 * NOTE(review): presumably passed as opaque data to a search callback
 * that matches cached capabilities by architecture -- confirm at the
 * point of use. */
struct virQEMUCapsSearchData {
    virArch arch;
};

321

322 323
/* Class handle for virQEMUCaps objects; assigned by virQEMUCapsOnceInit(). */
static virClassPtr virQEMUCapsClass;
/* Dispose callback registered with virClassNew() for that class. */
static void virQEMUCapsDispose(void *obj);
324

325
static int virQEMUCapsOnceInit(void)
326
{
327 328 329 330
    if (!(virQEMUCapsClass = virClassNew(virClassForObject(),
                                         "virQEMUCaps",
                                         sizeof(virQEMUCaps),
                                         virQEMUCapsDispose)))
331 332 333 334 335
        return -1;

    return 0;
}

336
VIR_ONCE_GLOBAL_INIT(virQEMUCaps)
337

338
static virArch virQEMUCapsArchFromString(const char *arch)
339 340 341 342 343 344 345 346 347 348
{
    if (STREQ(arch, "i386"))
        return VIR_ARCH_I686;
    if (STREQ(arch, "arm"))
        return VIR_ARCH_ARMV7L;

    return virArchFromString(arch);
}


349
/* Convert a virArch into the architecture name QEMU uses (the inverse
 * of virQEMUCapsArchFromString()).
 *
 * VIR_ARCH_I686 becomes "i386" and VIR_ARCH_ARMV7L becomes "arm"; all
 * other values use the virArchToString() spelling.
 */
static const char *virQEMUCapsArchToString(virArch arch)
{
    if (arch == VIR_ARCH_I686)
        return "i386";

    return arch == VIR_ARCH_ARMV7L ? "arm" : virArchToString(arch);
}


360
static virCommandPtr
361 362
virQEMUCapsProbeCommand(const char *qemu,
                        virQEMUCapsPtr qemuCaps,
363
                        uid_t runUid, gid_t runGid)
364 365 366
{
    virCommandPtr cmd = virCommandNew(qemu);

367 368
    if (qemuCaps) {
        if (virQEMUCapsGet(qemuCaps, QEMU_CAPS_NO_USER_CONFIG))
369
            virCommandAddArg(cmd, "-no-user-config");
370
        else if (virQEMUCapsGet(qemuCaps, QEMU_CAPS_NODEFCONFIG))
371 372 373 374 375
            virCommandAddArg(cmd, "-nodefconfig");
    }

    virCommandAddEnvPassCommon(cmd);
    virCommandClearCaps(cmd);
376 377
    virCommandSetGID(cmd, runGid);
    virCommandSetUID(cmd, runUid);
378 379 380 381 382

    return cmd;
}


383
static void
384 385
virQEMUCapsSetDefaultMachine(virQEMUCapsPtr qemuCaps,
                             size_t defIdx)
386
{
387 388
    char *name = qemuCaps->machineTypes[defIdx];
    char *alias = qemuCaps->machineAliases[defIdx];
389
    unsigned int maxCpus = qemuCaps->machineMaxCpus[defIdx];
390 391 392 393 394 395 396

    memmove(qemuCaps->machineTypes + 1,
            qemuCaps->machineTypes,
            sizeof(qemuCaps->machineTypes[0]) * defIdx);
    memmove(qemuCaps->machineAliases + 1,
            qemuCaps->machineAliases,
            sizeof(qemuCaps->machineAliases[0]) * defIdx);
397 398 399
    memmove(qemuCaps->machineMaxCpus + 1,
            qemuCaps->machineMaxCpus,
            sizeof(qemuCaps->machineMaxCpus[0]) * defIdx);
400 401
    qemuCaps->machineTypes[0] = name;
    qemuCaps->machineAliases[0] = alias;
402
    qemuCaps->machineMaxCpus[0] = maxCpus;
403 404
}

405 406 407 408
/* Format is:
 * <machine> <desc> [(default)|(alias of <canonical>)]
 */
static int
409 410
virQEMUCapsParseMachineTypesStr(const char *output,
                                virQEMUCapsPtr qemuCaps)
411 412 413
{
    const char *p = output;
    const char *next;
414
    size_t defIdx = 0;
415 416 417

    do {
        const char *t;
418 419
        char *name;
        char *canonical = NULL;
420 421 422 423 424 425 426 427 428 429

        if ((next = strchr(p, '\n')))
            ++next;

        if (STRPREFIX(p, "Supported machines are:"))
            continue;

        if (!(t = strchr(p, ' ')) || (next && t >= next))
            continue;

430 431
        if (VIR_STRNDUP(name, p, t - p) < 0)
            return -1;
432 433

        p = t;
434
        if ((t = strstr(p, "(default)")) && (!next || t < next))
435
            defIdx = qemuCaps->nmachineTypes;
436 437 438

        if ((t = strstr(p, "(alias of ")) && (!next || t < next)) {
            p = t + strlen("(alias of ");
439 440
            if (!(t = strchr(p, ')')) || (next && t >= next)) {
                VIR_FREE(name);
441
                continue;
442
            }
443

444
            if (VIR_STRNDUP(canonical, p, t - p) < 0) {
445
                VIR_FREE(name);
446
                return -1;
447 448 449
            }
        }

450
        if (VIR_REALLOC_N(qemuCaps->machineTypes, qemuCaps->nmachineTypes + 1) < 0 ||
451 452
            VIR_REALLOC_N(qemuCaps->machineAliases, qemuCaps->nmachineTypes + 1) < 0 ||
            VIR_REALLOC_N(qemuCaps->machineMaxCpus, qemuCaps->nmachineTypes + 1) < 0) {
453 454
            VIR_FREE(name);
            VIR_FREE(canonical);
455
            return -1;
456
        }
457
        qemuCaps->nmachineTypes++;
458
        if (canonical) {
459 460
            qemuCaps->machineTypes[qemuCaps->nmachineTypes-1] = canonical;
            qemuCaps->machineAliases[qemuCaps->nmachineTypes-1] = name;
461
        } else {
462 463
            qemuCaps->machineTypes[qemuCaps->nmachineTypes-1] = name;
            qemuCaps->machineAliases[qemuCaps->nmachineTypes-1] = NULL;
464
        }
465 466
        /* When parsing from command line we don't have information about maxCpus */
        qemuCaps->machineMaxCpus[qemuCaps->nmachineTypes-1] = 0;
467 468
    } while ((p = next));

469

470
    if (defIdx)
471
        virQEMUCapsSetDefaultMachine(qemuCaps, defIdx);
472 473 474 475

    return 0;
}

476
static int
477 478
virQEMUCapsProbeMachineTypes(virQEMUCapsPtr qemuCaps,
                             uid_t runUid, gid_t runGid)
479 480
{
    char *output;
481 482
    int ret = -1;
    virCommandPtr cmd;
483
    int status;
484

485 486 487 488
    /* Make sure the binary we are about to try exec'ing exists.
     * Technically we could catch the exec() failure, but that's
     * in a sub-process so it's hard to feed back a useful error.
     */
489
    if (!virFileIsExecutable(qemuCaps->binary)) {
490
        virReportSystemError(errno, _("Cannot find QEMU binary %s"),
491
                             qemuCaps->binary);
492 493 494
        return -1;
    }

495
    cmd = virQEMUCapsProbeCommand(qemuCaps->binary, qemuCaps, runUid, runGid);
496
    virCommandAddArgList(cmd, "-M", "?", NULL);
497
    virCommandSetOutputBuffer(cmd, &output);
498

499 500
    /* Ignore failure from older qemu that did not understand '-M ?'.  */
    if (virCommandRun(cmd, &status) < 0)
501 502
        goto cleanup;

503
    if (virQEMUCapsParseMachineTypesStr(output, qemuCaps) < 0)
504
        goto cleanup;
505 506 507

    ret = 0;

508
 cleanup:
509 510
    VIR_FREE(output);
    virCommandFree(cmd);
511 512 513 514 515 516

    return ret;
}


typedef int
517 518
(*virQEMUCapsParseCPUModels)(const char *output,
                             virQEMUCapsPtr qemuCaps);
519 520 521 522 523 524 525

/* Format:
 *      <arch> <model>
 * qemu-0.13 encloses some model names in []:
 *      <arch> [<model>]
 */
static int
526 527
virQEMUCapsParseX86Models(const char *output,
                          virQEMUCapsPtr qemuCaps)
528 529 530
{
    const char *p = output;
    const char *next;
531
    int ret = -1;
532 533 534

    do {
        const char *t;
535
        size_t len;
536 537 538 539 540 541 542 543 544 545 546 547 548 549 550 551 552

        if ((next = strchr(p, '\n')))
            next++;

        if (!(t = strchr(p, ' ')) || (next && t >= next))
            continue;

        if (!STRPREFIX(p, "x86"))
            continue;

        p = t;
        while (*p == ' ')
            p++;

        if (*p == '\0' || *p == '\n')
            continue;

553
        if (VIR_EXPAND_N(qemuCaps->cpuDefinitions, qemuCaps->ncpuDefinitions, 1) < 0)
554
            goto cleanup;
555

556 557 558 559
        if (next)
            len = next - p - 1;
        else
            len = strlen(p);
560

561 562 563 564
        if (len > 2 && *p == '[' && p[len - 1] == ']') {
            p++;
            len -= 2;
        }
565

566
        if (VIR_STRNDUP(qemuCaps->cpuDefinitions[qemuCaps->ncpuDefinitions - 1], p, len) < 0)
567
            goto cleanup;
568 569
    } while ((p = next));

570
    ret = 0;
571

572
 cleanup:
573
    return ret;
574 575
}

P
Prerna Saxena 已提交
576 577 578 579
/* ppc64 parser.
 * Format : PowerPC <machine> <description>
 */
static int
580 581
virQEMUCapsParsePPCModels(const char *output,
                          virQEMUCapsPtr qemuCaps)
P
Prerna Saxena 已提交
582 583 584
{
    const char *p = output;
    const char *next;
585
    int ret = -1;
P
Prerna Saxena 已提交
586 587 588

    do {
        const char *t;
589
        size_t len;
P
Prerna Saxena 已提交
590 591 592 593 594 595 596 597 598 599 600 601 602 603 604 605 606 607 608 609

        if ((next = strchr(p, '\n')))
            next++;

        if (!STRPREFIX(p, "PowerPC "))
            continue;

        /* Skip the preceding sub-string "PowerPC " */
        p += 8;

        /*Malformed string, does not obey the format 'PowerPC <model> <desc>'*/
        if (!(t = strchr(p, ' ')) || (next && t >= next))
            continue;

        if (*p == '\0')
            break;

        if (*p == '\n')
            continue;

610
        if (VIR_EXPAND_N(qemuCaps->cpuDefinitions, qemuCaps->ncpuDefinitions, 1) < 0)
611
            goto cleanup;
P
Prerna Saxena 已提交
612

613
        len = t - p - 1;
P
Prerna Saxena 已提交
614

615
        if (VIR_STRNDUP(qemuCaps->cpuDefinitions[qemuCaps->ncpuDefinitions - 1], p, len) < 0)
616
            goto cleanup;
P
Prerna Saxena 已提交
617 618
    } while ((p = next));

619
    ret = 0;
P
Prerna Saxena 已提交
620

621
 cleanup:
622
    return ret;
P
Prerna Saxena 已提交
623
}
624

625
static int
626
virQEMUCapsProbeCPUModels(virQEMUCapsPtr qemuCaps, uid_t runUid, gid_t runGid)
627 628 629
{
    char *output = NULL;
    int ret = -1;
630
    virQEMUCapsParseCPUModels parse;
631
    virCommandPtr cmd;
632

633
    if (qemuCaps->arch == VIR_ARCH_I686 ||
634
        qemuCaps->arch == VIR_ARCH_X86_64) {
635
        parse = virQEMUCapsParseX86Models;
636
    } else if (qemuCaps->arch == VIR_ARCH_PPC64) {
637
        parse = virQEMUCapsParsePPCModels;
638
    } else {
639
        VIR_DEBUG("don't know how to parse %s CPU models",
640
                  virArchToString(qemuCaps->arch));
641 642 643
        return 0;
    }

644
    cmd = virQEMUCapsProbeCommand(qemuCaps->binary, qemuCaps, runUid, runGid);
645
    virCommandAddArgList(cmd, "-cpu", "?", NULL);
646
    virCommandSetOutputBuffer(cmd, &output);
647

648
    if (virCommandRun(cmd, NULL) < 0)
649 650
        goto cleanup;

651
    if (parse(output, qemuCaps) < 0)
652 653 654 655
        goto cleanup;

    ret = 0;

656
 cleanup:
657
    VIR_FREE(output);
658
    virCommandFree(cmd);
659 660 661 662 663

    return ret;
}


664
static char *
665 666
virQEMUCapsFindBinaryForArch(virArch hostarch,
                             virArch guestarch)
667 668
{
    char *ret;
669
    const char *archstr = virQEMUCapsArchToString(guestarch);
670
    char *binary;
671

672
    if (virAsprintf(&binary, "qemu-system-%s", archstr) < 0)
673 674 675 676 677 678 679 680 681 682 683
        return NULL;

    ret = virFindFileInPath(binary);
    VIR_FREE(binary);
    if (ret && !virFileIsExecutable(ret))
        VIR_FREE(ret);

    if (guestarch == VIR_ARCH_I686 &&
        !ret &&
        hostarch == VIR_ARCH_X86_64) {
        ret = virFindFileInPath("qemu-system-x86_64");
684 685
        if (ret && !virFileIsExecutable(ret))
            VIR_FREE(ret);
686
    }
687

688 689 690 691 692
    if (guestarch == VIR_ARCH_I686 &&
        !ret) {
        ret = virFindFileInPath("qemu");
        if (ret && !virFileIsExecutable(ret))
            VIR_FREE(ret);
693
    }
694

695 696 697 698 699
    return ret;
}


static bool
700 701
virQEMUCapsIsValidForKVM(virArch hostarch,
                         virArch guestarch)
702
{
703
    if (hostarch == guestarch)
704
        return true;
705 706
    if (hostarch == VIR_ARCH_X86_64 &&
        guestarch == VIR_ARCH_I686)
707 708 709 710
        return true;
    return false;
}

711
static int
712 713 714 715
virQEMUCapsInitGuest(virCapsPtr caps,
                     virQEMUCapsCachePtr cache,
                     virArch hostarch,
                     virArch guestarch)
716
{
717
    size_t i;
718 719
    char *kvmbin = NULL;
    char *binary = NULL;
720 721
    virQEMUCapsPtr qemubinCaps = NULL;
    virQEMUCapsPtr kvmbinCaps = NULL;
722 723
    int ret = -1;

J
Ján Tomko 已提交
724
    /* Check for existence of base emulator, or alternate base
725 726
     * which can be used with magic cpu choice
     */
727
    binary = virQEMUCapsFindBinaryForArch(hostarch, guestarch);
728

729
    /* Ignore binary if extracting version info fails */
730
    if (binary) {
731
        if (!(qemubinCaps = virQEMUCapsCacheLookup(cache, binary))) {
732 733 734 735
            virResetLastError();
            VIR_FREE(binary);
        }
    }
736 737

    /* qemu-kvm/kvm binaries can only be used if
738 739 740 741 742
     *  - host & guest arches match
     * Or
     *  - hostarch is x86_64 and guest arch is i686
     * The latter simply needs "-cpu qemu32"
     */
743
    if (virQEMUCapsIsValidForKVM(hostarch, guestarch)) {
744 745 746
        const char *const kvmbins[] = { "/usr/libexec/qemu-kvm", /* RHEL */
                                        "qemu-kvm", /* Fedora */
                                        "kvm" }; /* Upstream .spec */
747

748 749
        for (i = 0; i < ARRAY_CARDINALITY(kvmbins); ++i) {
            kvmbin = virFindFileInPath(kvmbins[i]);
750

751 752
            if (!kvmbin)
                continue;
753

754
            if (!(kvmbinCaps = virQEMUCapsCacheLookup(cache, kvmbin))) {
755
                virResetLastError();
756 757 758
                VIR_FREE(kvmbin);
                continue;
            }
759

760 761
            if (!binary) {
                binary = kvmbin;
762
                qemubinCaps = kvmbinCaps;
763
                kvmbin = NULL;
764
                kvmbinCaps = NULL;
765
            }
766
            break;
767 768 769
        }
    }

770 771 772 773 774 775 776 777 778 779 780 781 782 783 784 785 786 787 788 789 790 791 792 793 794 795 796 797 798
    ret = virQEMUCapsInitGuestFromBinary(caps,
                                         binary, qemubinCaps,
                                         kvmbin, kvmbinCaps,
                                         guestarch);

    VIR_FREE(binary);
    VIR_FREE(kvmbin);
    virObjectUnref(qemubinCaps);
    virObjectUnref(kvmbinCaps);

    return ret;
}

/* Register an "hvm" guest of @guestarch in @caps.
 *
 * @binary / @qemubinCaps: base emulator and its capabilities; when
 *     @binary is NULL nothing is registered and 0 is returned
 * @kvmbin / @kvmbinCaps: optional dedicated KVM emulator
 *
 * The guest always gets a "qemu" domain. A "kqemu" domain is added if
 * /dev/kqemu exists and the binary has QEMU_CAPS_KQEMU. A "kvm" domain
 * is added if /dev/kvm exists and either the binary has one of the KVM
 * capabilities or @kvmbin is set.
 *
 * Returns 0 on success, -1 on failure.
 */
int
virQEMUCapsInitGuestFromBinary(virCapsPtr caps,
                               const char *binary,
                               virQEMUCapsPtr qemubinCaps,
                               const char *kvmbin,
                               virQEMUCapsPtr kvmbinCaps,
                               virArch guestarch)
{
    virCapsGuestPtr guest;
    virCapsGuestMachinePtr *machines = NULL;
    size_t nmachines = 0;
    bool haskvm;
    bool haskqemu;
    bool hasdisksnapshot;
    int ret = -1;

    if (!binary)
        return 0;

    haskvm = virFileExists("/dev/kvm") &&
             (virQEMUCapsGet(qemubinCaps, QEMU_CAPS_KVM) ||
              virQEMUCapsGet(qemubinCaps, QEMU_CAPS_ENABLE_KVM) ||
              kvmbin);

    haskqemu = virFileExists("/dev/kqemu") &&
               virQEMUCapsGet(qemubinCaps, QEMU_CAPS_KQEMU);

    if (virQEMUCapsGetMachineTypesCaps(qemubinCaps, &nmachines, &machines) < 0)
        goto cleanup;

    /* We register kvm as the base emulator too, since we can
     * just give -no-kvm to disable acceleration if required */
    guest = virCapabilitiesAddGuest(caps,
                                    "hvm",
                                    guestarch,
                                    binary,
                                    NULL,
                                    nmachines,
                                    machines);
    if (!guest)
        goto cleanup;

    /* Cleared so that the cleanup path no longer frees the list */
    machines = NULL;
    nmachines = 0;

    if (caps->host.cpu &&
        caps->host.cpu->model &&
        virQEMUCapsGetCPUDefinitions(qemubinCaps, NULL) > 0 &&
        !virCapabilitiesAddGuestFeature(guest, "cpuselection", true, false))
        goto cleanup;

    if (virQEMUCapsGet(qemubinCaps, QEMU_CAPS_BOOTINDEX) &&
        !virCapabilitiesAddGuestFeature(guest, "deviceboot", true, false))
        goto cleanup;

    /* "disksnapshot" is always listed; only its default state varies */
    hasdisksnapshot = virQEMUCapsGet(qemubinCaps, QEMU_CAPS_DISK_SNAPSHOT);
    if (!virCapabilitiesAddGuestFeature(guest, "disksnapshot", hasdisksnapshot,
                                        false))
        goto cleanup;

    if (!virCapabilitiesAddGuestDomain(guest, "qemu", NULL, NULL, 0, NULL))
        goto cleanup;

    if (haskqemu &&
        !virCapabilitiesAddGuestDomain(guest, "kqemu", NULL, NULL, 0, NULL))
        goto cleanup;

    if (haskvm) {
        /* A dedicated KVM binary brings its own machine list */
        if (kvmbin &&
            virQEMUCapsGetMachineTypesCaps(kvmbinCaps, &nmachines, &machines) < 0)
            goto cleanup;

        if (!virCapabilitiesAddGuestDomain(guest,
                                           "kvm",
                                           kvmbin ? kvmbin : binary,
                                           NULL,
                                           nmachines,
                                           machines))
            goto cleanup;

        machines = NULL;
        nmachines = 0;
    }

    if (guestarch == VIR_ARCH_I686 || guestarch == VIR_ARCH_X86_64) {
        if (!virCapabilitiesAddGuestFeature(guest, "acpi", true, true) ||
            !virCapabilitiesAddGuestFeature(guest, "apic", true, false))
            goto cleanup;
    }

    if (guestarch == VIR_ARCH_I686) {
        if (!virCapabilitiesAddGuestFeature(guest, "pae", true, false) ||
            !virCapabilitiesAddGuestFeature(guest, "nonpae", true, false))
            goto cleanup;
    }

    ret = 0;

 cleanup:
    virCapabilitiesFreeMachines(machines, nmachines);

    return ret;
}


static int
906 907
virQEMUCapsInitCPU(virCapsPtr caps,
                   virArch arch)
908 909
{
    virCPUDefPtr cpu = NULL;
910
    virCPUDataPtr data = NULL;
911 912 913
    virNodeInfo nodeinfo;
    int ret = -1;

914
    if (VIR_ALLOC(cpu) < 0)
915 916
        goto error;

917 918
    cpu->arch = arch;

919
    if (nodeGetInfo(&nodeinfo))
920 921 922 923 924 925
        goto error;

    cpu->type = VIR_CPU_TYPE_HOST;
    cpu->sockets = nodeinfo.sockets;
    cpu->cores = nodeinfo.cores;
    cpu->threads = nodeinfo.threads;
J
Jiri Denemark 已提交
926
    caps->host.cpu = cpu;
927

928
    if (!(data = cpuNodeData(arch))
929
        || cpuDecode(cpu, data, NULL, 0, NULL) < 0)
J
Jiri Denemark 已提交
930
        goto cleanup;
931 932 933

    ret = 0;

934
 cleanup:
J
Jiri Denemark 已提交
935
    cpuDataFree(data);
936 937 938

    return ret;

939
 error:
940 941 942 943 944
    virCPUDefFree(cpu);
    goto cleanup;
}


M
Michal Privoznik 已提交
945 946 947 948 949 950 951 952 953 954 955 956 957 958 959 960 961 962 963 964 965 966 967
/* Store the page sizes reported by virNumaGetPages() for the host as a
 * whole in caps->host.pagesSize / caps->host.nPagesSize.
 *
 * Returns 0 on success, -1 on failure.
 */
static int
virQEMUCapsInitPages(virCapsPtr caps)
{
    unsigned int *sizes = NULL;
    size_t nsizes;

    if (virNumaGetPages(-1 /* Magic constant for overall info */,
                        &sizes, NULL, NULL, &nsizes) < 0) {
        VIR_FREE(sizes);
        return -1;
    }

    /* The array is handed over to caps */
    caps->host.pagesSize = sizes;
    caps->host.nPagesSize = nsizes;

    return 0;
}


968
/* Build the capabilities object for the QEMU driver.
 *
 * Host information (NUMA topology, CPU, power management, page sizes)
 * is collected on a best-effort basis: a failure there is logged as a
 * warning only. Guests are then probed for every known architecture.
 *
 * Returns the new capabilities, or NULL if the object could not be
 * created or a guest could not be initialized.
 */
virCapsPtr virQEMUCapsInit(virQEMUCapsCachePtr cache)
{
    virArch hostarch = virArchFromHost();
    virCapsPtr caps = virCapabilitiesNew(hostarch, true, true);
    size_t i;

    if (!caps)
        goto error;

    /* Some machines have problematic NUMA topology causing
     * unexpected failures. We don't want to break the QEMU
     * driver in this scenario, so log errors & carry on
     */
    if (nodeCapsInitNUMA(caps) < 0) {
        virCapabilitiesFreeNUMAInfo(caps);
        VIR_WARN("Failed to query host NUMA topology, disabling NUMA capabilities");
    }

    if (virQEMUCapsInitCPU(caps, hostarch) < 0)
        VIR_WARN("Failed to get host CPU");

    /* Power management features of the host */
    if (virNodeSuspendGetTargetMask(&caps->host.powerMgmt) < 0)
        VIR_WARN("Failed to get host power management capabilities");

    /* Huge pages info */
    if (virQEMUCapsInitPages(caps) < 0)
        VIR_WARN("Failed to get pages info");

    /* Domain migration transport URIs */
    virCapabilitiesAddHostMigrateTransport(caps, "tcp");
    virCapabilitiesAddHostMigrateTransport(caps, "rdma");

    /* QEMU can support pretty much every arch that exists,
     * so just probe for them all - we gracefully fail
     * if a qemu-system-$ARCH binary can't be found
     */
    for (i = 0; i < VIR_ARCH_LAST; i++) {
        if (virQEMUCapsInitGuest(caps, cache, hostarch, i) < 0)
            goto error;
    }

    return caps;

 error:
    virObjectUnref(caps);
    return NULL;
}


1020
static int
1021 1022
virQEMUCapsComputeCmdFlags(const char *help,
                           unsigned int version,
1023
                           bool is_kvm,
1024 1025 1026
                           unsigned int kvm_version,
                           virQEMUCapsPtr qemuCaps,
                           bool check_yajl ATTRIBUTE_UNUSED)
1027 1028
{
    const char *p;
R
Richa Marwaha 已提交
1029
    const char *fsdev, *netdev;
1030 1031

    if (strstr(help, "-no-kqemu"))
1032
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_KQEMU);
1033
    if (strstr(help, "-enable-kqemu"))
1034
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_ENABLE_KQEMU);
1035
    if (strstr(help, "-no-kvm"))
1036
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_KVM);
1037
    if (strstr(help, "-enable-kvm"))
1038
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_ENABLE_KVM);
1039
    if (strstr(help, "-no-reboot"))
1040
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_NO_REBOOT);
1041
    if (strstr(help, "-name")) {
1042
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_NAME);
1043
        if (strstr(help, ",process="))
1044
            virQEMUCapsSet(qemuCaps, QEMU_CAPS_NAME_PROCESS);
1045 1046
    }
    if (strstr(help, "-uuid"))
1047
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_UUID);
1048
    if (strstr(help, "-xen-domid"))
1049
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_XEN_DOMID);
1050
    else if (strstr(help, "-domid"))
1051
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_DOMID);
1052
    if (strstr(help, "-drive")) {
1053 1054
        const char *cache = strstr(help, "cache=");

1055
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_DRIVE);
1056 1057
        if (cache && (p = strchr(cache, ']'))) {
            if (memmem(cache, p - cache, "on|off", sizeof("on|off") - 1) == NULL)
1058
                virQEMUCapsSet(qemuCaps, QEMU_CAPS_DRIVE_CACHE_V2);
1059
            if (memmem(cache, p - cache, "directsync", sizeof("directsync") - 1))
1060
                virQEMUCapsSet(qemuCaps, QEMU_CAPS_DRIVE_CACHE_DIRECTSYNC);
1061
            if (memmem(cache, p - cache, "unsafe", sizeof("unsafe") - 1))
1062
                virQEMUCapsSet(qemuCaps, QEMU_CAPS_DRIVE_CACHE_UNSAFE);
1063
        }
1064
        if (strstr(help, "format="))
1065
            virQEMUCapsSet(qemuCaps, QEMU_CAPS_DRIVE_FORMAT);
1066
        if (strstr(help, "readonly="))
1067
            virQEMUCapsSet(qemuCaps, QEMU_CAPS_DRIVE_READONLY);
1068
        if (strstr(help, "aio=threads|native"))
1069
            virQEMUCapsSet(qemuCaps, QEMU_CAPS_DRIVE_AIO);
O
Osier Yang 已提交
1070
        if (strstr(help, "copy-on-read=on|off"))
1071
            virQEMUCapsSet(qemuCaps, QEMU_CAPS_DRIVE_COPY_ON_READ);
1072
        if (strstr(help, "bps="))
1073
            virQEMUCapsSet(qemuCaps, QEMU_CAPS_DRIVE_IOTUNE);
1074 1075 1076 1077
    }
    if ((p = strstr(help, "-vga")) && !strstr(help, "-std-vga")) {
        const char *nl = strstr(p, "\n");

1078
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_VGA);
1079 1080

        if (strstr(p, "|qxl"))
1081
            virQEMUCapsSet(qemuCaps, QEMU_CAPS_VGA_QXL);
1082
        if ((p = strstr(p, "|none")) && p < nl)
1083
            virQEMUCapsSet(qemuCaps, QEMU_CAPS_VGA_NONE);
1084 1085
    }
    if (strstr(help, "-spice"))
1086
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_SPICE);
1087
    if (strstr(help, "-vnc"))
1088
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_VNC);
1089
    if (strstr(help, "seamless-migration="))
1090
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_SEAMLESS_MIGRATION);
1091
    if (strstr(help, "boot=on"))
1092
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_DRIVE_BOOT);
1093
    if (strstr(help, "serial=s"))
1094
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_DRIVE_SERIAL);
1095
    if (strstr(help, "-pcidevice"))
1096
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_PCIDEVICE);
1097 1098
    if (strstr(help, "host=[seg:]bus"))
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_HOST_PCI_MULTIDOMAIN);
1099
    if (strstr(help, "-mem-path"))
1100
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_MEM_PATH);
1101
    if (strstr(help, "-chardev")) {
1102
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_CHARDEV);
1103
        if (strstr(help, "-chardev spicevmc"))
1104
            virQEMUCapsSet(qemuCaps, QEMU_CAPS_CHARDEV_SPICEVMC);
1105 1106
        if (strstr(help, "-chardev spiceport"))
            virQEMUCapsSet(qemuCaps, QEMU_CAPS_CHARDEV_SPICEPORT);
1107
    }
1108
    if (strstr(help, "-balloon"))
1109
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_BALLOON);
1110
    if (strstr(help, "-device")) {
1111
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_DEVICE);
1112 1113 1114 1115
        /*
         * When -device was introduced, qemu already supported drive's
         * readonly option but didn't advertise that.
         */
1116
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_DRIVE_READONLY);
1117 1118
    }
    if (strstr(help, "-nodefconfig"))
1119
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_NODEFCONFIG);
1120
    if (strstr(help, "-no-user-config"))
1121
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_NO_USER_CONFIG);
1122 1123
    /* The trailing ' ' is important to avoid a bogus match */
    if (strstr(help, "-rtc "))
1124
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_RTC);
1125 1126
    /* to wit */
    if (strstr(help, "-rtc-td-hack"))
1127
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_RTC_TD_HACK);
1128
    if (strstr(help, "-no-hpet"))
1129
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_NO_HPET);
1130
    if (strstr(help, "-no-acpi"))
1131
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_NO_ACPI);
1132
    if (strstr(help, "-no-kvm-pit-reinjection"))
1133
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_NO_KVM_PIT);
1134
    if (strstr(help, "-tdf"))
1135
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_TDF);
1136
    if (strstr(help, "-enable-nesting"))
1137
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_NESTING);
1138
    if (strstr(help, ",menu=on"))
1139
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_BOOT_MENU);
1140
    if (strstr(help, ",reboot-timeout=rb_time"))
1141
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_REBOOT_TIMEOUT);
1142 1143
    if (strstr(help, ",splash-time=sp_time"))
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_SPLASH_TIMEOUT);
1144
    if ((fsdev = strstr(help, "-fsdev"))) {
1145
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_FSDEV);
1146
        if (strstr(fsdev, "readonly"))
1147
            virQEMUCapsSet(qemuCaps, QEMU_CAPS_FSDEV_READONLY);
1148
        if (strstr(fsdev, "writeout"))
1149
            virQEMUCapsSet(qemuCaps, QEMU_CAPS_FSDEV_WRITEOUT);
1150
    }
1151
    if (strstr(help, "-smbios type"))
1152
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_SMBIOS_TYPE);
1153
    if (strstr(help, "-sandbox"))
1154
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_SECCOMP_SANDBOX);
1155

R
Richa Marwaha 已提交
1156
    if ((netdev = strstr(help, "-netdev"))) {
1157 1158
        /* Disable -netdev on 0.12 since although it exists,
         * the corresponding netdev_add/remove monitor commands
1159 1160
         * do not, and we need them to be able to do hotplug.
         * But see below about RHEL build. */
R
Richa Marwaha 已提交
1161 1162
        if (version >= 13000) {
            if (strstr(netdev, "bridge"))
1163 1164
                virQEMUCapsSet(qemuCaps, QEMU_CAPS_NETDEV_BRIDGE);
           virQEMUCapsSet(qemuCaps, QEMU_CAPS_NETDEV);
R
Richa Marwaha 已提交
1165
        }
1166 1167 1168
    }

    if (strstr(help, "-sdl"))
1169
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_SDL);
1170 1171 1172
    if (strstr(help, "cores=") &&
        strstr(help, "threads=") &&
        strstr(help, "sockets="))
1173
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_SMP_TOPOLOGY);
1174 1175

    if (version >= 9000)
1176
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_VNC_COLON);
1177 1178

    if (is_kvm && (version >= 10000 || kvm_version >= 74))
1179
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_VNET_HDR);
1180

1181
    if (strstr(help, ",vhost=")) {
1182
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_VHOST_NET);
1183 1184
    }

1185 1186
    /* Do not use -no-shutdown if qemu doesn't support it or SIGTERM handling
     * is most likely buggy when used with -no-shutdown (which applies for qemu
1187
     * 0.14.* and 0.15.0)
1188
     */
1189
    if (strstr(help, "-no-shutdown") && (version < 14000 || version > 15000))
1190
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_NO_SHUTDOWN);
1191

1192
    if (strstr(help, "dump-guest-core=on|off"))
1193
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_DUMP_GUEST_CORE);
1194

O
Olivia Yin 已提交
1195 1196 1197
    if (strstr(help, "-dtb"))
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_DTB);

1198 1199 1200
    if (strstr(help, "-machine"))
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_MACHINE_OPT);

1201 1202 1203 1204
    /*
     * Handling of -incoming arg with varying features
     *  -incoming tcp    (kvm >= 79, qemu >= 0.10.0)
     *  -incoming exec   (kvm >= 80, qemu >= 0.10.0)
1205 1206
     *  -incoming unix   (qemu >= 0.12.0)
     *  -incoming fd     (qemu >= 0.12.0)
1207 1208 1209 1210 1211 1212 1213
     *  -incoming stdio  (all earlier kvm)
     *
     * NB, there was a pre-kvm-79 'tcp' support, but it
     * was broken, because it blocked the monitor console
     * while waiting for data, so pretend it doesn't exist
     */
    if (version >= 10000) {
1214 1215
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_MIGRATE_QEMU_TCP);
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_MIGRATE_QEMU_EXEC);
1216
        if (version >= 12000) {
1217 1218
            virQEMUCapsSet(qemuCaps, QEMU_CAPS_MIGRATE_QEMU_UNIX);
            virQEMUCapsSet(qemuCaps, QEMU_CAPS_MIGRATE_QEMU_FD);
1219
        }
1220
    } else if (kvm_version >= 79) {
1221
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_MIGRATE_QEMU_TCP);
1222
        if (kvm_version >= 80)
1223
            virQEMUCapsSet(qemuCaps, QEMU_CAPS_MIGRATE_QEMU_EXEC);
1224
    } else if (kvm_version > 0) {
1225
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_MIGRATE_KVM_STDIO);
1226 1227 1228
    }

    if (version >= 10000)
1229
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_0_10);
1230

1231
    if (version >= 11000)
1232
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_VIRTIO_BLK_SG_IO);
1233

1234 1235 1236
    /* While JSON mode was available in 0.12.0, it was too
     * incomplete to contemplate using. The 0.13.0 release
     * is good enough to use, even though it lacks one or
1237 1238 1239 1240 1241
     * two features. This is also true of versions of qemu
     * built for RHEL, labeled 0.12.1, but with extra text
     * in the help output that mentions that features were
     * backported for libvirt. The benefits of JSON mode now
     * outweigh the downside.
1242
     */
1243
#if WITH_YAJL
1244
    if (version >= 13000) {
1245
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_MONITOR_JSON);
1246 1247
    } else if (version >= 12000 &&
               strstr(help, "libvirt")) {
1248 1249
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_MONITOR_JSON);
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_NETDEV);
1250
    }
1251 1252 1253 1254 1255 1256 1257
#else
    /* Starting with qemu 0.15 and newer, upstream qemu no longer
     * promises to keep the human interface stable, but requests that
     * we use QMP (the JSON interface) for everything.  If the user
     * forgot to include YAJL libraries when building their own
     * libvirt but is targetting a newer qemu, we are better off
     * telling them to recompile (the spec file includes the
1258
     * dependency, so distros won't hit this).  This check is
1259
     * also in m4/virt-yajl.m4 (see $with_yajl).  */
1260 1261 1262
    if (version >= 15000 ||
        (version >= 12000 && strstr(help, "libvirt"))) {
        if (check_yajl) {
1263 1264 1265
            virReportError(VIR_ERR_CONFIG_UNSUPPORTED, "%s",
                           _("this qemu binary requires libvirt to be "
                             "compiled with yajl"));
1266 1267
            return -1;
        }
1268
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_NETDEV);
1269
    }
E
Eric Blake 已提交
1270
#endif
1271 1272

    if (version >= 13000)
1273
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_PCI_MULTIFUNCTION);
1274 1275 1276 1277 1278 1279 1280 1281 1282 1283 1284 1285

    /* Although very new versions of qemu advertise the presence of
     * the rombar option in the output of "qemu -device pci-assign,?",
     * this advertisement was added to the code long after the option
     * itself. According to qemu developers, though, rombar is
     * available in all qemu binaries from release 0.12 onward.
     * Setting the capability this way makes it available in more
     * cases where it might be needed, and shouldn't cause any false
     * positives (in the case that it did, qemu would produce an error
     * log and refuse to start, so it would be immediately obvious).
     */
    if (version >= 12000)
1286
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_PCI_ROMBAR);
1287 1288

    if (version >= 11000)
1289
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_CPU_HOST);
1290

1291
    if (version >= 1001000) {
J
Ján Tomko 已提交
1292
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_IPV6_MIGRATION);
1293 1294
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_VNC_SHARE_POLICY);
    }
J
Ján Tomko 已提交
1295

1296
    return 0;
1297 1298 1299 1300 1301 1302 1303 1304 1305 1306 1307 1308 1309 1310 1311 1312 1313 1314 1315 1316 1317 1318 1319 1320 1321 1322
}

/* We parse the output of 'qemu -help' to get the QEMU
 * version number. The first bit is easy, just parse
 * 'QEMU PC emulator version x.y.z'
 * or
 * 'QEMU emulator version x.y.z'.
 *
 * With qemu-kvm, however, that is followed by a string
 * in parentheses as follows:
 *  - qemu-kvm-x.y.z in stable releases
 *  - kvm-XX for kvm versions up to kvm-85
 *  - qemu-kvm-devel-XX for kvm version kvm-86 and later
 *
 * For qemu-kvm versions before 0.10.z, we need to detect
 * the KVM version number for some features. With 0.10.z
 * and later, we just need the QEMU version number and
 * whether it is KVM QEMU or mainline QEMU.
 */
/* Leading text of the first help line for the two recognised binary
 * flavours; the version number follows it. */
#define QEMU_VERSION_STR_1  "QEMU emulator version"
#define QEMU_VERSION_STR_2  "QEMU PC emulator version"
/* Markers looked for after the version number to identify a KVM
 * build; only the second one is followed by a KVM version number
 * that gets parsed. */
#define QEMU_KVM_VER_PREFIX "(qemu-kvm-"
#define KVM_VER_PREFIX      "(kvm-"

/* Advance the pointer lvalue p past any run of spaces and tabs.
 * p is evaluated more than once, so it must be free of side effects. */
#define SKIP_BLANKS(p) do { while ((*(p) == ' ') || (*(p) == '\t')) (p)++; } while (0)

1323 1324 1325 1326
/**
 * virQEMUCapsParseHelpStr:
 * @qemu: name of the binary; only used in the error message
 * @help: complete text of the 'qemu -help' output
 * @qemuCaps: capabilities object that receives the detected flags
 * @version: filled with major * 1000000 + minor * 1000 + micro
 * @is_kvm: set to true if a "(qemu-kvm-" or "(kvm-" marker follows
 *          the version number
 * @kvm_version: filled with the number following "(kvm-", else 0
 * @check_yajl: passed through to virQEMUCapsComputeCmdFlags()
 *
 * Parse the version banner at the start of @help and then derive the
 * capability flags from the rest of the help text.  All three output
 * values are reset before parsing starts.
 *
 * Returns 0 on success, -1 on failure.  An error is reported here when
 * the version banner cannot be parsed; a failure of
 * virQEMUCapsComputeCmdFlags() is passed on without a further report.
 */
int virQEMUCapsParseHelpStr(const char *qemu,
                            const char *help,
                            virQEMUCapsPtr qemuCaps,
                            unsigned int *version,
                            bool *is_kvm,
                            unsigned int *kvm_version,
                            bool check_yajl)
{
    /* The virParseNumber() results are stored in unsigned variables, so
     * the "== -1" checks below compare against the converted value. */
    unsigned major, minor, micro;
    const char *p = help;
    char *strflags;

    *version = *kvm_version = 0;
    *is_kvm = false;

    if (STRPREFIX(p, QEMU_VERSION_STR_1))
        p += strlen(QEMU_VERSION_STR_1);
    else if (STRPREFIX(p, QEMU_VERSION_STR_2))
        p += strlen(QEMU_VERSION_STR_2);
    else
        goto fail;

    SKIP_BLANKS(p);

    major = virParseNumber(&p);
    if (major == -1 || *p != '.')
        goto fail;

    ++p;

    minor = virParseNumber(&p);
    if (minor == -1)
        goto fail;

    /* The micro component is optional: "x.y" is treated as "x.y.0" */
    if (*p != '.') {
        micro = 0;
    } else {
        ++p;
        micro = virParseNumber(&p);
        if (micro == -1)
            goto fail;
    }

    SKIP_BLANKS(p);

    if (STRPREFIX(p, QEMU_KVM_VER_PREFIX)) {
        *is_kvm = true;
        p += strlen(QEMU_KVM_VER_PREFIX);
    } else if (STRPREFIX(p, KVM_VER_PREFIX)) {
        int ret;

        *is_kvm = true;
        p += strlen(KVM_VER_PREFIX);

        ret = virParseNumber(&p);
        if (ret == -1)
            goto fail;

        *kvm_version = ret;
    }

    *version = (major * 1000 * 1000) + (minor * 1000) + micro;

    if (virQEMUCapsComputeCmdFlags(help, *version, *is_kvm, *kvm_version,
                                   qemuCaps, check_yajl) < 0)
        goto cleanup;

    strflags = virBitmapString(qemuCaps->flags);
    VIR_DEBUG("Version %u.%u.%u, cooked version %u, flags %s",
              major, minor, micro, *version, NULLSTR(strflags));
    VIR_FREE(strflags);

    /* *kvm_version is unsigned, so it is printed with %u */
    if (*kvm_version)
        VIR_DEBUG("KVM version %u detected", *kvm_version);
    else if (*is_kvm)
        VIR_DEBUG("qemu-kvm version %u.%u.%u detected", major, minor, micro);

    return 0;

 fail:
    /* Quote only the first line of the help text in the error */
    p = strchr(help, '\n');
    if (!p)
        p = strchr(help, '\0');

    virReportError(VIR_ERR_INTERNAL_ERROR,
                   _("cannot parse %s version number in '%.*s'"),
                   qemu, (int) (p - help), help);

 cleanup:
    return -1;
}

1415

1416
/* One entry of a lookup table that maps a string reported by QEMU
 * to the capability flag that is set when that string is seen. */
struct virQEMUCapsStringFlags {
    const char *value;  /* string to match exactly */
    int flag;           /* QEMU_CAPS_* value passed to virQEMUCapsSet() */
};


1422 1423 1424
struct virQEMUCapsStringFlags virQEMUCapsCommands[] = {
    { "system_wakeup", QEMU_CAPS_WAKEUP },
    { "transaction", QEMU_CAPS_TRANSACTION },
1425 1426
    { "block_stream", QEMU_CAPS_BLOCKJOB_SYNC },
    { "block-stream", QEMU_CAPS_BLOCKJOB_ASYNC },
1427 1428 1429 1430 1431 1432 1433 1434 1435
    { "dump-guest-memory", QEMU_CAPS_DUMP_GUEST_MEMORY },
    { "query-spice", QEMU_CAPS_SPICE },
    { "query-kvm", QEMU_CAPS_KVM },
    { "block-commit", QEMU_CAPS_BLOCK_COMMIT },
    { "query-vnc", QEMU_CAPS_VNC },
    { "drive-mirror", QEMU_CAPS_DRIVE_MIRROR },
    { "blockdev-snapshot-sync", QEMU_CAPS_DISK_SNAPSHOT },
    { "add-fd", QEMU_CAPS_ADD_FD },
    { "nbd-server-start", QEMU_CAPS_NBD_SERVER },
1436
    { "change-backing-file", QEMU_CAPS_CHANGE_BACKING_FILE },
1437
    { "rtc-reset-reinjection", QEMU_CAPS_RTC_RESET_REINJECTION },
1438 1439
};

1440 1441 1442 1443
/* Migration-related name -> capability flag.
 * NOTE(review): presumably matched against migration capability names
 * reported by the monitor; the consumer is not in this part of the
 * file - confirm. */
struct virQEMUCapsStringFlags virQEMUCapsMigration[] = {
    { "rdma-pin-all", QEMU_CAPS_MIGRATE_RDMA },
};

1444 1445 1446
struct virQEMUCapsStringFlags virQEMUCapsEvents[] = {
    { "BALLOON_CHANGE", QEMU_CAPS_BALLOON_EVENT },
    { "SPICE_MIGRATE_COMPLETED", QEMU_CAPS_SEAMLESS_MIGRATION },
1447
    { "DEVICE_DELETED", QEMU_CAPS_DEVICE_DEL_EVENT },
1448 1449
};

1450
struct virQEMUCapsStringFlags virQEMUCapsObjectTypes[] = {
1451 1452 1453 1454 1455 1456 1457 1458 1459 1460 1461 1462 1463 1464 1465
    { "hda-duplex", QEMU_CAPS_HDA_DUPLEX },
    { "hda-micro", QEMU_CAPS_HDA_MICRO },
    { "ccid-card-emulated", QEMU_CAPS_CCID_EMULATED },
    { "ccid-card-passthru", QEMU_CAPS_CCID_PASSTHRU },
    { "piix3-usb-uhci", QEMU_CAPS_PIIX3_USB_UHCI },
    { "piix4-usb-uhci", QEMU_CAPS_PIIX4_USB_UHCI },
    { "usb-ehci", QEMU_CAPS_USB_EHCI },
    { "ich9-usb-ehci1", QEMU_CAPS_ICH9_USB_EHCI1 },
    { "vt82c686b-usb-uhci", QEMU_CAPS_VT82C686B_USB_UHCI },
    { "pci-ohci", QEMU_CAPS_PCI_OHCI },
    { "nec-usb-xhci", QEMU_CAPS_NEC_USB_XHCI },
    { "usb-redir", QEMU_CAPS_USB_REDIR },
    { "usb-hub", QEMU_CAPS_USB_HUB },
    { "ich9-ahci", QEMU_CAPS_ICH9_AHCI },
    { "virtio-blk-s390", QEMU_CAPS_VIRTIO_S390 },
1466
    { "virtio-blk-ccw", QEMU_CAPS_VIRTIO_CCW },
1467
    { "sclpconsole", QEMU_CAPS_SCLP_S390 },
1468
    { "lsi53c895a", QEMU_CAPS_SCSI_LSI },
1469
    { "virtio-scsi-pci", QEMU_CAPS_VIRTIO_SCSI },
1470 1471
    { "virtio-scsi-s390", QEMU_CAPS_VIRTIO_SCSI },
    { "virtio-scsi-ccw", QEMU_CAPS_VIRTIO_SCSI },
1472
    { "megasas", QEMU_CAPS_SCSI_MEGASAS },
1473 1474
    { "spicevmc", QEMU_CAPS_DEVICE_SPICEVMC },
    { "qxl-vga", QEMU_CAPS_DEVICE_QXL_VGA },
1475
    { "qxl", QEMU_CAPS_DEVICE_QXL },
1476 1477 1478 1479
    { "sga", QEMU_CAPS_SGA },
    { "scsi-block", QEMU_CAPS_SCSI_BLOCK },
    { "scsi-cd", QEMU_CAPS_SCSI_CD },
    { "ide-cd", QEMU_CAPS_IDE_CD },
1480 1481 1482
    { "VGA", QEMU_CAPS_DEVICE_VGA },
    { "cirrus-vga", QEMU_CAPS_DEVICE_CIRRUS_VGA },
    { "vmware-svga", QEMU_CAPS_DEVICE_VMWARE_SVGA },
H
Han Cheng 已提交
1483 1484
    { "usb-serial", QEMU_CAPS_DEVICE_USB_SERIAL },
    { "usb-net", QEMU_CAPS_DEVICE_USB_NET },
1485
    { "virtio-rng-pci", QEMU_CAPS_DEVICE_VIRTIO_RNG },
1486 1487
    { "virtio-rng-s390", QEMU_CAPS_DEVICE_VIRTIO_RNG },
    { "virtio-rng-ccw", QEMU_CAPS_DEVICE_VIRTIO_RNG },
1488
    { "rng-random", QEMU_CAPS_OBJECT_RNG_RANDOM },
1489
    { "rng-egd", QEMU_CAPS_OBJECT_RNG_EGD },
1490
    { "spapr-nvram", QEMU_CAPS_DEVICE_NVRAM },
1491
    { "pci-bridge", QEMU_CAPS_DEVICE_PCI_BRIDGE },
1492
    { "vfio-pci", QEMU_CAPS_DEVICE_VFIO_PCI },
H
Han Cheng 已提交
1493
    { "scsi-generic", QEMU_CAPS_DEVICE_SCSI_GENERIC },
1494
    { "i82801b11-bridge", QEMU_CAPS_DEVICE_DMI_TO_PCI_BRIDGE },
1495
    { "usb-storage", QEMU_CAPS_DEVICE_USB_STORAGE },
1496
    { "virtio-mmio", QEMU_CAPS_DEVICE_VIRTIO_MMIO },
1497
    { "ich9-intel-hda", QEMU_CAPS_DEVICE_ICH9_INTEL_HDA },
H
Hu Tao 已提交
1498
    { "pvpanic", QEMU_CAPS_DEVICE_PANIC },
L
Li Zhang 已提交
1499
    { "usb-kbd", QEMU_CAPS_DEVICE_USB_KBD },
1500
    { "memory-backend-ram", QEMU_CAPS_OBJECT_MEMORY_RAM },
1501
    { "memory-backend-file", QEMU_CAPS_OBJECT_MEMORY_FILE },
1502
    { "usb-audio", QEMU_CAPS_OBJECT_USB_AUDIO },
J
John Ferlan 已提交
1503
    { "iothread", QEMU_CAPS_OBJECT_IOTHREAD},
1504
    { "ivshmem", QEMU_CAPS_DEVICE_IVSHMEM },
1505 1506
};

1507
static struct virQEMUCapsStringFlags virQEMUCapsObjectPropsVirtioBlk[] = {
1508 1509 1510 1511 1512 1513 1514 1515
    { "multifunction", QEMU_CAPS_PCI_MULTIFUNCTION },
    { "bootindex", QEMU_CAPS_BOOTINDEX },
    { "ioeventfd", QEMU_CAPS_VIRTIO_IOEVENTFD },
    { "event_idx", QEMU_CAPS_VIRTIO_BLK_EVENT_IDX },
    { "scsi", QEMU_CAPS_VIRTIO_BLK_SCSI },
    { "logical_block_size", QEMU_CAPS_BLOCKIO },
};

1516
static struct virQEMUCapsStringFlags virQEMUCapsObjectPropsVirtioNet[] = {
1517 1518 1519 1520
    { "tx", QEMU_CAPS_VIRTIO_TX_ALG },
    { "event_idx", QEMU_CAPS_VIRTIO_NET_EVENT_IDX },
};

1521
static struct virQEMUCapsStringFlags virQEMUCapsObjectPropsPCIAssign[] = {
1522
    { "rombar", QEMU_CAPS_PCI_ROMBAR },
1523 1524 1525 1526
    { "configfd", QEMU_CAPS_PCI_CONFIGFD },
    { "bootindex", QEMU_CAPS_PCI_BOOTINDEX },
};

1527
static struct virQEMUCapsStringFlags virQEMUCapsObjectPropsVfioPCI[] = {
1528 1529 1530
    { "bootindex", QEMU_CAPS_VFIO_PCI_BOOTINDEX },
};

1531
static struct virQEMUCapsStringFlags virQEMUCapsObjectPropsSCSIDisk[] = {
1532 1533 1534 1535
    { "channel", QEMU_CAPS_SCSI_DISK_CHANNEL },
    { "wwn", QEMU_CAPS_SCSI_DISK_WWN },
};

1536
static struct virQEMUCapsStringFlags virQEMUCapsObjectPropsIDEDrive[] = {
1537 1538 1539
    { "wwn", QEMU_CAPS_IDE_DRIVE_WWN },
};

1540
static struct virQEMUCapsStringFlags virQEMUCapsObjectPropsPixx4PM[] = {
1541 1542 1543 1544
    { "disable_s3", QEMU_CAPS_DISABLE_S3 },
    { "disable_s4", QEMU_CAPS_DISABLE_S4 },
};

1545
static struct virQEMUCapsStringFlags virQEMUCapsObjectPropsUSBRedir[] = {
1546
    { "filter", QEMU_CAPS_USB_REDIR_FILTER },
1547 1548 1549
    { "bootindex", QEMU_CAPS_USB_REDIR_BOOTINDEX },
};

1550
static struct virQEMUCapsStringFlags virQEMUCapsObjectPropsUSBHost[] = {
1551
    { "bootindex", QEMU_CAPS_USB_HOST_BOOTINDEX },
1552 1553
};

1554
static struct virQEMUCapsStringFlags virQEMUCapsObjectPropsSCSIGeneric[] = {
H
Han Cheng 已提交
1555 1556 1557
    { "bootindex", QEMU_CAPS_DEVICE_SCSI_GENERIC_BOOTINDEX },
};

1558
static struct virQEMUCapsStringFlags virQEMUCapsObjectPropsI440FXPCIHost[] = {
1559 1560 1561
    { "pci-hole64-size", QEMU_CAPS_I440FX_PCI_HOLE64_SIZE },
};

1562
static struct virQEMUCapsStringFlags virQEMUCapsObjectPropsQ35PCIHost[] = {
1563 1564 1565
    { "pci-hole64-size", QEMU_CAPS_Q35_PCI_HOLE64_SIZE },
};

1566
static struct virQEMUCapsStringFlags virQEMUCapsObjectPropsUSBStorage[] = {
1567 1568 1569
    { "removable", QEMU_CAPS_USB_STORAGE_REMOVABLE },
};

1570 1571 1572 1573
static struct virQEMUCapsStringFlags virQEMUCapsObjectPropsKVMPit[] = {
    { "lost_tick_policy", QEMU_CAPS_KVM_PIT_TICK_POLICY },
};

1574
/* Associates one device type name with the table of property names
 * that are probed for it. */
struct virQEMUCapsObjectTypeProps {
    const char *type;                       /* device type name */
    struct virQEMUCapsStringFlags *props;   /* property -> flag table */
    size_t nprops;                          /* number of entries in @props */
};

1580 1581 1582 1583
static struct virQEMUCapsObjectTypeProps virQEMUCapsObjectProps[] = {
    { "virtio-blk-pci", virQEMUCapsObjectPropsVirtioBlk,
      ARRAY_CARDINALITY(virQEMUCapsObjectPropsVirtioBlk) },
    { "virtio-net-pci", virQEMUCapsObjectPropsVirtioNet,
1584 1585 1586 1587
      ARRAY_CARDINALITY(virQEMUCapsObjectPropsVirtioNet) },
    { "virtio-blk-ccw", virQEMUCapsObjectPropsVirtioBlk,
      ARRAY_CARDINALITY(virQEMUCapsObjectPropsVirtioBlk) },
    { "virtio-net-ccw", virQEMUCapsObjectPropsVirtioNet,
1588 1589 1590 1591 1592
      ARRAY_CARDINALITY(virQEMUCapsObjectPropsVirtioNet) },
    { "virtio-blk-s390", virQEMUCapsObjectPropsVirtioBlk,
      ARRAY_CARDINALITY(virQEMUCapsObjectPropsVirtioBlk) },
    { "virtio-net-s390", virQEMUCapsObjectPropsVirtioNet,
      ARRAY_CARDINALITY(virQEMUCapsObjectPropsVirtioNet) },
1593 1594 1595 1596 1597 1598
    { "pci-assign", virQEMUCapsObjectPropsPCIAssign,
      ARRAY_CARDINALITY(virQEMUCapsObjectPropsPCIAssign) },
    { "kvm-pci-assign", virQEMUCapsObjectPropsPCIAssign,
      ARRAY_CARDINALITY(virQEMUCapsObjectPropsPCIAssign) },
    { "vfio-pci", virQEMUCapsObjectPropsVfioPCI,
      ARRAY_CARDINALITY(virQEMUCapsObjectPropsVfioPCI) },
1599 1600
    { "scsi-disk", virQEMUCapsObjectPropsSCSIDisk,
      ARRAY_CARDINALITY(virQEMUCapsObjectPropsSCSIDisk) },
1601 1602 1603 1604
    { "ide-drive", virQEMUCapsObjectPropsIDEDrive,
      ARRAY_CARDINALITY(virQEMUCapsObjectPropsIDEDrive) },
    { "PIIX4_PM", virQEMUCapsObjectPropsPixx4PM,
      ARRAY_CARDINALITY(virQEMUCapsObjectPropsPixx4PM) },
1605 1606 1607 1608
    { "usb-redir", virQEMUCapsObjectPropsUSBRedir,
      ARRAY_CARDINALITY(virQEMUCapsObjectPropsUSBRedir) },
    { "usb-host", virQEMUCapsObjectPropsUSBHost,
      ARRAY_CARDINALITY(virQEMUCapsObjectPropsUSBHost) },
1609 1610
    { "scsi-generic", virQEMUCapsObjectPropsSCSIGeneric,
      ARRAY_CARDINALITY(virQEMUCapsObjectPropsSCSIGeneric) },
1611 1612 1613 1614
    { "i440FX-pcihost", virQEMUCapsObjectPropsI440FXPCIHost,
      ARRAY_CARDINALITY(virQEMUCapsObjectPropsI440FXPCIHost) },
    { "q35-pcihost", virQEMUCapsObjectPropsQ35PCIHost,
      ARRAY_CARDINALITY(virQEMUCapsObjectPropsQ35PCIHost) },
1615 1616
    { "usb-storage", virQEMUCapsObjectPropsUSBStorage,
      ARRAY_CARDINALITY(virQEMUCapsObjectPropsUSBStorage) },
1617 1618
    { "kvm-pit", virQEMUCapsObjectPropsKVMPit,
      ARRAY_CARDINALITY(virQEMUCapsObjectPropsKVMPit) },
1619 1620 1621 1622
};


static void
1623 1624 1625 1626 1627
virQEMUCapsProcessStringFlags(virQEMUCapsPtr qemuCaps,
                              size_t nflags,
                              struct virQEMUCapsStringFlags *flags,
                              size_t nvalues,
                              char *const*values)
1628 1629
{
    size_t i, j;
1630 1631
    for (i = 0; i < nflags; i++) {
        for (j = 0; j < nvalues; j++) {
1632
            if (STREQ(values[j], flags[i].value)) {
1633
                virQEMUCapsSet(qemuCaps, flags[i].flag);
1634 1635 1636 1637 1638 1639 1640 1641
                break;
            }
        }
    }
}


/**
 * virQEMUCapsFreeStringList:
 * @len: number of entries in @values
 * @values: array of allocated strings, may be NULL
 *
 * Free every string of the list and then the array itself.  A NULL
 * @values is accepted and ignored whatever @len says.
 */
static void
virQEMUCapsFreeStringList(size_t len,
                          char **values)
{
    size_t i;

    if (!values)
        return;

    for (i = 0; i < len; i++)
        VIR_FREE(values[i]);
    VIR_FREE(values);
}


/* Text that precedes each device type name in the device list output;
 * the name itself runs up to the next double quote. */
#define OBJECT_TYPE_PREFIX "name \""

static int
1655 1656
virQEMUCapsParseDeviceStrObjectTypes(const char *str,
                                     char ***types)
1657 1658 1659 1660 1661 1662 1663 1664 1665 1666 1667 1668 1669 1670 1671 1672 1673 1674
{
    const char *tmp = str;
    int ret = -1;
    size_t ntypelist = 0;
    char **typelist = NULL;

    *types = NULL;

    while ((tmp = strstr(tmp, OBJECT_TYPE_PREFIX))) {
        char *end;
        tmp += strlen(OBJECT_TYPE_PREFIX);
        end = strstr(tmp, "\"");
        if (!end) {
            virReportError(VIR_ERR_INTERNAL_ERROR, "%s",
                           _("Malformed QEMU device list string, missing quote"));
            goto cleanup;
        }

1675
        if (VIR_EXPAND_N(typelist, ntypelist, 1) < 0)
1676
            goto cleanup;
1677
        if (VIR_STRNDUP(typelist[ntypelist - 1], tmp, end-tmp) < 0)
1678 1679 1680 1681 1682 1683
            goto cleanup;
    }

    *types = typelist;
    ret = ntypelist;

1684
 cleanup:
1685
    if (ret < 0)
1686
        virQEMUCapsFreeStringList(ntypelist, typelist);
1687 1688 1689 1690 1691
    return ret;
}


static int
1692 1693 1694
virQEMUCapsParseDeviceStrObjectProps(const char *str,
                                     const char *type,
                                     char ***props)
1695 1696 1697 1698 1699 1700 1701 1702 1703 1704 1705 1706 1707 1708 1709 1710 1711 1712 1713 1714 1715 1716 1717 1718 1719 1720 1721 1722 1723 1724 1725 1726 1727
{
    const char *tmp = str;
    int ret = -1;
    size_t nproplist = 0;
    char **proplist = NULL;

    VIR_DEBUG("Extract type %s", type);
    *props = NULL;

    while ((tmp = strchr(tmp, '\n'))) {
        char *end;
        tmp += 1;

        if (*tmp == '\0')
            break;

        if (STRPREFIX(tmp, OBJECT_TYPE_PREFIX))
            continue;

        if (!STRPREFIX(tmp, type))
            continue;

        tmp += strlen(type);
        if (*tmp != '.')
            continue;
        tmp++;

        end = strstr(tmp, "=");
        if (!end) {
            virReportError(VIR_ERR_INTERNAL_ERROR, "%s",
                           _("Malformed QEMU device list string, missing '='"));
            goto cleanup;
        }
1728
        if (VIR_EXPAND_N(proplist, nproplist, 1) < 0)
1729
            goto cleanup;
1730
        if (VIR_STRNDUP(proplist[nproplist - 1], tmp, end-tmp) < 0)
1731 1732 1733 1734 1735 1736
            goto cleanup;
    }

    *props = proplist;
    ret = nproplist;

1737
 cleanup:
1738
    if (ret < 0 && proplist)
1739
        virQEMUCapsFreeStringList(nproplist, proplist);
1740 1741 1742 1743 1744
    return ret;
}


int
1745
virQEMUCapsParseDeviceStr(virQEMUCapsPtr qemuCaps, const char *str)
1746 1747 1748 1749 1750
{
    int nvalues;
    char **values;
    size_t i;

1751
    if ((nvalues = virQEMUCapsParseDeviceStrObjectTypes(str, &values)) < 0)
1752
        return -1;
1753 1754 1755 1756 1757 1758
    virQEMUCapsProcessStringFlags(qemuCaps,
                                  ARRAY_CARDINALITY(virQEMUCapsObjectTypes),
                                  virQEMUCapsObjectTypes,
                                  nvalues, values);
    virQEMUCapsFreeStringList(nvalues, values);

1759
    for (i = 0; i < ARRAY_CARDINALITY(virQEMUCapsObjectProps); i++) {
1760 1761 1762 1763
        const char *type = virQEMUCapsObjectProps[i].type;
        if ((nvalues = virQEMUCapsParseDeviceStrObjectProps(str,
                                                            type,
                                                            &values)) < 0)
1764
            return -1;
1765 1766 1767 1768 1769
        virQEMUCapsProcessStringFlags(qemuCaps,
                                      virQEMUCapsObjectProps[i].nprops,
                                      virQEMUCapsObjectProps[i].props,
                                      nvalues, values);
        virQEMUCapsFreeStringList(nvalues, values);
1770 1771 1772
    }

    /* Prefer -chardev spicevmc (detected earlier) over -device spicevmc */
1773 1774
    if (virQEMUCapsGet(qemuCaps, QEMU_CAPS_CHARDEV_SPICEVMC))
        virQEMUCapsClear(qemuCaps, QEMU_CAPS_DEVICE_SPICEVMC);
1775 1776 1777 1778 1779

    return 0;
}


E
Eric Blake 已提交
1780
static int
1781 1782
virQEMUCapsExtractDeviceStr(const char *qemu,
                            virQEMUCapsPtr qemuCaps,
1783
                            uid_t runUid, gid_t runGid)
1784
{
E
Eric Blake 已提交
1785
    char *output = NULL;
1786
    virCommandPtr cmd;
E
Eric Blake 已提交
1787
    int ret = -1;
1788

E
Eric Blake 已提交
1789 1790
    /* Cram together all device-related queries into one invocation;
     * the output format makes it possible to distinguish what we
1791 1792
     * need.  With qemu 0.13.0 and later, unrecognized '-device
     * bogus,?' cause an error in isolation, but are silently ignored
1793
     * in combination with '-device ?'.  Upstream qemu 0.12.x doesn't
1794 1795
     * understand '-device name,?', and always exits with status 1 for
     * the simpler '-device ?', so this function is really only useful
1796
     * if -help includes "device driver,?".  */
1797
    cmd = virQEMUCapsProbeCommand(qemu, qemuCaps, runUid, runGid);
1798 1799 1800 1801 1802 1803
    virCommandAddArgList(cmd,
                         "-device", "?",
                         "-device", "pci-assign,?",
                         "-device", "virtio-blk-pci,?",
                         "-device", "virtio-net-pci,?",
                         "-device", "scsi-disk,?",
1804
                         "-device", "PIIX4_PM,?",
1805
                         "-device", "usb-redir,?",
1806
                         "-device", "ide-drive,?",
1807
                         "-device", "usb-host,?",
H
Han Cheng 已提交
1808
                         "-device", "scsi-generic,?",
1809
                         "-device", "usb-storage,?",
1810
                         NULL);
1811
    /* qemu -help goes to stdout, but qemu -device ? goes to stderr.  */
E
Eric Blake 已提交
1812
    virCommandSetErrorBuffer(cmd, &output);
1813

1814
    if (virCommandRun(cmd, NULL) < 0)
1815 1816
        goto cleanup;

1817
    ret = virQEMUCapsParseDeviceStr(qemuCaps, output);
1818

1819
 cleanup:
E
Eric Blake 已提交
1820
    VIR_FREE(output);
1821
    virCommandFree(cmd);
E
Eric Blake 已提交
1822 1823 1824
    return ret;
}

1825

1826 1827 1828
/*
 * virQEMUCapsGetDefaultVersion:
 * @caps: driver capabilities used to find the default emulator
 * @capsCache: cache used to look up that emulator's capabilities
 * @version: in/out; left untouched when already non-zero
 *
 * When *@version is 0, fills it with the version of the default "hvm"
 * "qemu" emulator for the host architecture.
 *
 * Returns 0 on success, -1 if no emulator is found or the cache lookup
 * fails.
 */
int virQEMUCapsGetDefaultVersion(virCapsPtr caps,
                                 virQEMUCapsCachePtr capsCache,
                                 unsigned int *version)
{
    virArch arch;
    const char *emulator;
    virQEMUCapsPtr emulatorCaps;

    /* Caller already knows the version; nothing to do */
    if (*version > 0)
        return 0;

    arch = virArchFromHost();
    emulator = virCapabilitiesDefaultGuestEmulator(caps, "hvm", arch, "qemu");
    if (emulator == NULL) {
        virReportError(VIR_ERR_INTERNAL_ERROR,
                       _("Cannot find suitable emulator for %s"),
                       virArchToString(arch));
        return -1;
    }

    emulatorCaps = virQEMUCapsCacheLookup(capsCache, emulator);
    if (!emulatorCaps)
        return -1;

    *version = virQEMUCapsGetVersion(emulatorCaps);
    /* Drop the reference obtained from the cache lookup */
    virObjectUnref(emulatorCaps);
    return 0;
}
1855 1856


1857 1858


1859 1860
virQEMUCapsPtr
virQEMUCapsNew(void)
1861
{
1862
    virQEMUCapsPtr qemuCaps;
1863

1864
    if (virQEMUCapsInitialize() < 0)
1865 1866
        return NULL;

1867
    if (!(qemuCaps = virObjectNew(virQEMUCapsClass)))
1868 1869
        return NULL;

1870
    if (!(qemuCaps->flags = virBitmapNew(QEMU_CAPS_LAST)))
1871
        goto error;
1872

1873
    return qemuCaps;
1874

1875
 error:
1876
    virObjectUnref(qemuCaps);
1877
    return NULL;
1878 1879 1880
}


1881
/*
 * virQEMUCapsNewCopy:
 * @qemuCaps: object to duplicate
 *
 * Builds a new capabilities object carrying the flag bitmap, usedQMP,
 * version, kvmVersion and arch values of @qemuCaps plus deep copies of
 * its CPU definition and machine type/alias/maxCpus arrays.
 *
 * Returns the copy, or NULL on allocation failure.
 */
virQEMUCapsPtr virQEMUCapsNewCopy(virQEMUCapsPtr qemuCaps)
{
    virQEMUCapsPtr copy = virQEMUCapsNew();
    size_t n;

    if (copy == NULL)
        return NULL;

    virBitmapCopy(copy->flags, qemuCaps->flags);

    copy->usedQMP = qemuCaps->usedQMP;
    copy->version = qemuCaps->version;
    copy->kvmVersion = qemuCaps->kvmVersion;
    copy->arch = qemuCaps->arch;

    /* CPU model names */
    if (VIR_ALLOC_N(copy->cpuDefinitions, qemuCaps->ncpuDefinitions) < 0)
        goto error;
    copy->ncpuDefinitions = qemuCaps->ncpuDefinitions;
    for (n = 0; n < qemuCaps->ncpuDefinitions; n++)
        if (VIR_STRDUP(copy->cpuDefinitions[n], qemuCaps->cpuDefinitions[n]) < 0)
            goto error;

    /* Machine types: three parallel arrays sharing one element count */
    if (VIR_ALLOC_N(copy->machineTypes, qemuCaps->nmachineTypes) < 0 ||
        VIR_ALLOC_N(copy->machineAliases, qemuCaps->nmachineTypes) < 0 ||
        VIR_ALLOC_N(copy->machineMaxCpus, qemuCaps->nmachineTypes) < 0)
        goto error;
    copy->nmachineTypes = qemuCaps->nmachineTypes;
    for (n = 0; n < qemuCaps->nmachineTypes; n++) {
        if (VIR_STRDUP(copy->machineTypes[n], qemuCaps->machineTypes[n]) < 0)
            goto error;
        if (VIR_STRDUP(copy->machineAliases[n], qemuCaps->machineAliases[n]) < 0)
            goto error;
        copy->machineMaxCpus[n] = qemuCaps->machineMaxCpus[n];
    }

    return copy;

 error:
    virObjectUnref(copy);
    return NULL;
}


1926
void virQEMUCapsDispose(void *obj)
1927
{
1928
    virQEMUCapsPtr qemuCaps = obj;
1929 1930
    size_t i;

1931
    for (i = 0; i < qemuCaps->nmachineTypes; i++) {
1932 1933
        VIR_FREE(qemuCaps->machineTypes[i]);
        VIR_FREE(qemuCaps->machineAliases[i]);
1934
    }
1935 1936
    VIR_FREE(qemuCaps->machineTypes);
    VIR_FREE(qemuCaps->machineAliases);
1937
    VIR_FREE(qemuCaps->machineMaxCpus);
1938

1939
    for (i = 0; i < qemuCaps->ncpuDefinitions; i++) {
1940
        VIR_FREE(qemuCaps->cpuDefinitions[i]);
1941
    }
1942
    VIR_FREE(qemuCaps->cpuDefinitions);
1943

1944
    virBitmapFree(qemuCaps->flags);
1945

1946
    VIR_FREE(qemuCaps->binary);
1947 1948
}

1949
void
1950
virQEMUCapsSet(virQEMUCapsPtr qemuCaps,
1951
               virQEMUCapsFlags flag)
1952
{
1953
    ignore_value(virBitmapSetBit(qemuCaps->flags, flag));
1954 1955 1956 1957
}


void
1958
virQEMUCapsSetList(virQEMUCapsPtr qemuCaps, ...)
1959 1960 1961 1962
{
    va_list list;
    int flag;

1963
    va_start(list, qemuCaps);
1964
    while ((flag = va_arg(list, int)) < QEMU_CAPS_LAST)
1965
        ignore_value(virBitmapSetBit(qemuCaps->flags, flag));
1966
    va_end(list);
1967 1968 1969 1970
}


void
1971
virQEMUCapsClear(virQEMUCapsPtr qemuCaps,
1972
                 virQEMUCapsFlags flag)
1973
{
1974
    ignore_value(virBitmapClearBit(qemuCaps->flags, flag));
1975 1976 1977
}


1978
/*
 * virQEMUCapsFlagsString:
 * @qemuCaps: capabilities object to describe
 *
 * Returns whatever virBitmapString() produces for the flag bitmap.
 */
char *
virQEMUCapsFlagsString(virQEMUCapsPtr qemuCaps)
{
    return virBitmapString(qemuCaps->flags);
}


bool
1985
virQEMUCapsGet(virQEMUCapsPtr qemuCaps,
1986
               virQEMUCapsFlags flag)
1987
{
1988 1989
    bool b;

1990
    if (!qemuCaps || virBitmapGetBit(qemuCaps->flags, flag, &b) < 0)
1991 1992 1993
        return false;
    else
        return b;
1994
}
1995 1996


D
Daniel P. Berrange 已提交
1997 1998 1999 2000 2001 2002 2003 2004 2005 2006 2007 2008 2009 2010 2011 2012 2013 2014 2015 2016 2017 2018 2019 2020 2021 2022 2023 2024 2025 2026 2027 2028 2029 2030 2031 2032 2033 2034 2035 2036 2037 2038 2039 2040 2041 2042 2043 2044 2045 2046
/*
 * virQEMUCapsHasPCIMultiBus:
 * @qemuCaps: capabilities of the emulator
 * @def: domain definition supplying architecture and machine type
 *
 * Returns true when QEMU_CAPS_PCI_MULTIBUS is set, or when the guest
 * is PPC/PPC64 and the emulator version / machine type combination
 * is one listed in the table below; false otherwise.
 */
bool virQEMUCapsHasPCIMultiBus(virQEMUCapsPtr qemuCaps,
                               virDomainDefPtr def)
{
    if (virQEMUCapsGet(qemuCaps, QEMU_CAPS_PCI_MULTIBUS))
        return true;

    /* Only the PPC family gets the version/machine based fallback */
    if (def->os.arch != VIR_ARCH_PPC &&
        def->os.arch != VIR_ARCH_PPC64)
        return false;

    /*
     * Usage of pci.0 naming:
     *
     *    ref405ep: no pci
     *       taihu: no pci
     *      bamboo: 1.1.0
     *       mac99: 2.0.0
     *     g3beige: 2.0.0
     *        prep: 1.4.0
     *     pseries: 2.0.0
     *   mpc8544ds: forever
     * virtex-m507: no pci
     *     ppce500: 1.6.0
     */

    if (qemuCaps->version >= 2000000)
        return true;

    if (qemuCaps->version >= 1006000 &&
        STREQ(def->os.machine, "ppce500"))
        return true;

    if (qemuCaps->version >= 1004000 &&
        STREQ(def->os.machine, "prep"))
        return true;

    if (qemuCaps->version >= 1001000 &&
        STREQ(def->os.machine, "bamboo"))
        return true;

    /* The one machine type that qualifies regardless of version */
    if (STREQ(def->os.machine, "mpc8544ds"))
        return true;

    return false;
}


2047
/*
 * virQEMUCapsGetBinary:
 * @qemuCaps: capabilities object to query
 *
 * Returns the object's 'binary' string; the pointer still belongs to
 * @qemuCaps (it is released in virQEMUCapsDispose()).
 */
const char *
virQEMUCapsGetBinary(virQEMUCapsPtr qemuCaps)
{
    return qemuCaps->binary;
}

2052
/*
 * virQEMUCapsGetArch:
 * @qemuCaps: capabilities object to query
 *
 * Returns the architecture stored in the object.
 */
virArch
virQEMUCapsGetArch(virQEMUCapsPtr qemuCaps)
{
    return qemuCaps->arch;
}


2058
/*
 * virQEMUCapsGetVersion:
 * @qemuCaps: capabilities object to query
 *
 * Returns the emulator version number stored in the object.
 */
unsigned int
virQEMUCapsGetVersion(virQEMUCapsPtr qemuCaps)
{
    return qemuCaps->version;
}


2064
/*
 * virQEMUCapsGetKVMVersion:
 * @qemuCaps: capabilities object to query
 *
 * Returns the KVM version number stored in the object.
 */
unsigned int
virQEMUCapsGetKVMVersion(virQEMUCapsPtr qemuCaps)
{
    return qemuCaps->kvmVersion;
}


2070 2071
/*
 * virQEMUCapsAddCPUDefinition:
 * @qemuCaps: capabilities object to extend
 * @name: CPU model name to append (copied)
 *
 * Appends a duplicate of @name to the CPU definition list.
 *
 * Returns 0 on success, -1 on allocation failure, in which case the
 * list is left as it was.
 */
int virQEMUCapsAddCPUDefinition(virQEMUCapsPtr qemuCaps,
                                const char *name)
{
    char *dup;

    /* Copy first, so a failed copy never leaves an empty slot behind */
    if (VIR_STRDUP(dup, name) < 0)
        return -1;

    if (VIR_EXPAND_N(qemuCaps->cpuDefinitions,
                     qemuCaps->ncpuDefinitions, 1) < 0) {
        VIR_FREE(dup);
        return -1;
    }

    qemuCaps->cpuDefinitions[qemuCaps->ncpuDefinitions - 1] = dup;
    return 0;
}


2086 2087
/*
 * virQEMUCapsGetCPUDefinitions:
 * @qemuCaps: capabilities object to query
 * @names: optional; receives the object's own array (not a copy)
 *
 * Returns the number of CPU definitions stored in the object.
 */
size_t
virQEMUCapsGetCPUDefinitions(virQEMUCapsPtr qemuCaps,
                             char ***names)
{
    if (names != NULL)
        *names = qemuCaps->cpuDefinitions;

    return qemuCaps->ncpuDefinitions;
}


2095 2096
/*
 * virQEMUCapsGetMachineTypes:
 * @qemuCaps: capabilities object to query
 * @names: optional; receives the object's own array (not a copy)
 *
 * Returns the number of machine types stored in the object.
 */
size_t
virQEMUCapsGetMachineTypes(virQEMUCapsPtr qemuCaps,
                           char ***names)
{
    if (names != NULL)
        *names = qemuCaps->machineTypes;

    return qemuCaps->nmachineTypes;
}

2103 2104 2105
/*
 * virQEMUCapsGetMachineTypesCaps:
 * @qemuCaps: capabilities object to read
 * @nmachines: receives the number of entries in @machines
 * @machines: receives a newly allocated array of machine descriptions
 *
 * Builds one virCapsGuestMachine per known machine type.  When a
 * machine has an alias, the alias becomes the entry's name and the
 * real type its canonical name; otherwise only the name is filled in.
 *
 * Returns 0 on success; on failure returns -1 with *@machines set to
 * NULL and *@nmachines set to 0.
 */
int virQEMUCapsGetMachineTypesCaps(virQEMUCapsPtr qemuCaps,
                                   size_t *nmachines,
                                   virCapsGuestMachinePtr **machines)
{
    size_t idx;

    *machines = NULL;
    *nmachines = qemuCaps->nmachineTypes;

    /* Skip the allocation altogether when there is nothing to report */
    if (*nmachines &&
        VIR_ALLOC_N(*machines, qemuCaps->nmachineTypes) < 0)
        goto error;

    for (idx = 0; idx < qemuCaps->nmachineTypes; idx++) {
        const char *alias = qemuCaps->machineAliases[idx];
        const char *type = qemuCaps->machineTypes[idx];
        virCapsGuestMachinePtr entry;

        if (VIR_ALLOC(entry) < 0)
            goto error;
        /* Stored right away so the error path can release it */
        (*machines)[idx] = entry;

        if (alias) {
            if (VIR_STRDUP(entry->name, alias) < 0 ||
                VIR_STRDUP(entry->canonical, type) < 0)
                goto error;
        } else if (VIR_STRDUP(entry->name, type) < 0) {
            goto error;
        }

        entry->maxCpus = qemuCaps->machineMaxCpus[idx];
    }

    return 0;

 error:
    virCapabilitiesFreeMachines(*machines, *nmachines);
    *nmachines = 0;
    *machines = NULL;
    return -1;
}



2143

2144 2145
/*
 * virQEMUCapsGetCanonicalMachine:
 * @qemuCaps: capabilities object to search
 * @name: machine name, possibly an alias; may be NULL
 *
 * Returns the machine type whose alias equals @name, @name itself when
 * no alias matches, or NULL when @name is NULL.
 */
const char *virQEMUCapsGetCanonicalMachine(virQEMUCapsPtr qemuCaps,
                                           const char *name)
{
    size_t idx;

    if (name == NULL)
        return NULL;

    for (idx = 0; idx < qemuCaps->nmachineTypes; idx++) {
        const char *alias = qemuCaps->machineAliases[idx];

        if (alias && STREQ(alias, name))
            return qemuCaps->machineTypes[idx];
    }

    /* Not an alias we know about: hand the name back unchanged */
    return name;
}
2161 2162


2163 2164 2165 2166 2167 2168 2169 2170 2171 2172 2173 2174 2175 2176 2177 2178 2179 2180 2181
/*
 * virQEMUCapsGetMachineMaxCpus:
 * @qemuCaps: capabilities object to search
 * @name: machine type name; may be NULL
 *
 * Returns the recorded maxCpus value of the machine type named @name,
 * or 0 when @name is NULL, no machine type matches, or the recorded
 * value is 0.
 */
int virQEMUCapsGetMachineMaxCpus(virQEMUCapsPtr qemuCaps,
                                 const char *name)
{
    size_t idx;

    if (name == NULL)
        return 0;

    for (idx = 0; idx < qemuCaps->nmachineTypes; idx++) {
        /* Entries without a limit are skipped before comparing names */
        if (qemuCaps->machineMaxCpus[idx] &&
            STREQ(qemuCaps->machineTypes[idx], name))
            return qemuCaps->machineMaxCpus[idx];
    }

    return 0;
}


2182
static int
2183 2184
virQEMUCapsProbeQMPCommands(virQEMUCapsPtr qemuCaps,
                            qemuMonitorPtr mon)
2185 2186 2187 2188 2189 2190 2191
{
    char **commands = NULL;
    int ncommands;

    if ((ncommands = qemuMonitorGetCommands(mon, &commands)) < 0)
        return -1;

2192 2193 2194 2195 2196
    virQEMUCapsProcessStringFlags(qemuCaps,
                                  ARRAY_CARDINALITY(virQEMUCapsCommands),
                                  virQEMUCapsCommands,
                                  ncommands, commands);
    virQEMUCapsFreeStringList(ncommands, commands);
2197

2198 2199 2200 2201
    /* QMP add-fd was introduced in 1.2, but did not support
     * management control of set numbering, and did not have a
     * counterpart -add-fd command line option.  We require the
     * add-fd features from 1.3 or later.  */
2202
    if (virQEMUCapsGet(qemuCaps, QEMU_CAPS_ADD_FD)) {
2203 2204 2205 2206 2207 2208 2209
        int fd = open("/dev/null", O_RDONLY);
        if (fd < 0) {
            virReportError(VIR_ERR_INTERNAL_ERROR, "%s",
                           _("unable to probe for add-fd"));
            return -1;
        }
        if (qemuMonitorAddFd(mon, 0, fd, "/dev/null") < 0)
2210
            virQEMUCapsClear(qemuCaps, QEMU_CAPS_ADD_FD);
2211 2212 2213
        VIR_FORCE_CLOSE(fd);
    }

2214 2215 2216 2217 2218 2219
    /* Probe for active commit of qemu 2.1 (for now, we are choosing
     * to ignore the fact that qemu 2.0 can also do active commit) */
    if (virQEMUCapsGet(qemuCaps, QEMU_CAPS_BLOCK_COMMIT) &&
        qemuMonitorSupportsActiveCommit(mon))
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_ACTIVE_COMMIT);

2220 2221 2222 2223 2224
    return 0;
}


static int
2225 2226
virQEMUCapsProbeQMPEvents(virQEMUCapsPtr qemuCaps,
                          qemuMonitorPtr mon)
2227 2228 2229 2230 2231 2232 2233
{
    char **events = NULL;
    int nevents;

    if ((nevents = qemuMonitorGetEvents(mon, &events)) < 0)
        return -1;

2234 2235 2236 2237 2238
    virQEMUCapsProcessStringFlags(qemuCaps,
                                  ARRAY_CARDINALITY(virQEMUCapsEvents),
                                  virQEMUCapsEvents,
                                  nevents, events);
    virQEMUCapsFreeStringList(nevents, events);
2239 2240 2241 2242 2243

    return 0;
}


2244
static int
2245 2246
virQEMUCapsProbeQMPObjects(virQEMUCapsPtr qemuCaps,
                           qemuMonitorPtr mon)
2247 2248 2249 2250 2251 2252 2253
{
    int nvalues;
    char **values;
    size_t i;

    if ((nvalues = qemuMonitorGetObjectTypes(mon, &values)) < 0)
        return -1;
2254 2255 2256 2257 2258 2259
    virQEMUCapsProcessStringFlags(qemuCaps,
                                  ARRAY_CARDINALITY(virQEMUCapsObjectTypes),
                                  virQEMUCapsObjectTypes,
                                  nvalues, values);
    virQEMUCapsFreeStringList(nvalues, values);

2260
    for (i = 0; i < ARRAY_CARDINALITY(virQEMUCapsObjectProps); i++) {
2261
        const char *type = virQEMUCapsObjectProps[i].type;
2262 2263 2264 2265
        if ((nvalues = qemuMonitorGetObjectProps(mon,
                                                 type,
                                                 &values)) < 0)
            return -1;
2266 2267 2268 2269 2270
        virQEMUCapsProcessStringFlags(qemuCaps,
                                      virQEMUCapsObjectProps[i].nprops,
                                      virQEMUCapsObjectProps[i].props,
                                      nvalues, values);
        virQEMUCapsFreeStringList(nvalues, values);
2271 2272 2273
    }

    /* Prefer -chardev spicevmc (detected earlier) over -device spicevmc */
2274 2275
    if (virQEMUCapsGet(qemuCaps, QEMU_CAPS_CHARDEV_SPICEVMC))
        virQEMUCapsClear(qemuCaps, QEMU_CAPS_DEVICE_SPICEVMC);
2276
    /* If qemu supports newer -device qxl it supports -vga qxl as well */
2277 2278
    if (virQEMUCapsGet(qemuCaps, QEMU_CAPS_DEVICE_QXL))
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_VGA_QXL);
2279 2280 2281 2282 2283 2284

    return 0;
}


static int
2285 2286
virQEMUCapsProbeQMPMachineTypes(virQEMUCapsPtr qemuCaps,
                                qemuMonitorPtr mon)
2287 2288 2289 2290 2291
{
    qemuMonitorMachineInfoPtr *machines = NULL;
    int nmachines = 0;
    int ret = -1;
    size_t i;
2292
    size_t defIdx = 0;
2293 2294

    if ((nmachines = qemuMonitorGetMachines(mon, &machines)) < 0)
2295
        return -1;
2296

2297
    if (VIR_ALLOC_N(qemuCaps->machineTypes, nmachines) < 0)
2298
        goto cleanup;
2299
    if (VIR_ALLOC_N(qemuCaps->machineAliases, nmachines) < 0)
2300
        goto cleanup;
2301
    if (VIR_ALLOC_N(qemuCaps->machineMaxCpus, nmachines) < 0)
2302
        goto cleanup;
2303

2304
    for (i = 0; i < nmachines; i++) {
2305 2306
        if (STREQ(machines[i]->name, "none"))
            continue;
2307 2308 2309 2310 2311
        qemuCaps->nmachineTypes++;
        if (VIR_STRDUP(qemuCaps->machineAliases[qemuCaps->nmachineTypes -1],
                       machines[i]->alias) < 0 ||
            VIR_STRDUP(qemuCaps->machineTypes[qemuCaps->nmachineTypes - 1],
                       machines[i]->name) < 0)
2312
            goto cleanup;
2313
        if (machines[i]->isDefault)
2314
            defIdx = qemuCaps->nmachineTypes - 1;
2315 2316
        qemuCaps->machineMaxCpus[qemuCaps->nmachineTypes - 1] =
            machines[i]->maxCpus;
2317
    }
2318 2319

    if (defIdx)
2320
        virQEMUCapsSetDefaultMachine(qemuCaps, defIdx);
2321 2322 2323

    ret = 0;

2324
 cleanup:
2325
    for (i = 0; i < nmachines; i++)
2326 2327 2328 2329 2330 2331 2332
        qemuMonitorMachineInfoFree(machines[i]);
    VIR_FREE(machines);
    return ret;
}


static int
2333 2334
virQEMUCapsProbeQMPCPUDefinitions(virQEMUCapsPtr qemuCaps,
                                  qemuMonitorPtr mon)
2335 2336 2337 2338 2339 2340 2341
{
    int ncpuDefinitions;
    char **cpuDefinitions;

    if ((ncpuDefinitions = qemuMonitorGetCPUDefinitions(mon, &cpuDefinitions)) < 0)
        return -1;

2342 2343
    qemuCaps->ncpuDefinitions = ncpuDefinitions;
    qemuCaps->cpuDefinitions = cpuDefinitions;
2344 2345 2346 2347

    return 0;
}

2348 2349
struct tpmTypeToCaps {
    int type;
2350
    virQEMUCapsFlags caps;
2351 2352 2353 2354 2355 2356 2357 2358 2359 2360 2361 2362 2363 2364 2365 2366 2367 2368 2369 2370
};

static const struct tpmTypeToCaps virQEMUCapsTPMTypesToCaps[] = {
    {
        .type = VIR_DOMAIN_TPM_TYPE_PASSTHROUGH,
        .caps = QEMU_CAPS_DEVICE_TPM_PASSTHROUGH,
    },
};

const struct tpmTypeToCaps virQEMUCapsTPMModelsToCaps[] = {
    {
        .type = VIR_DOMAIN_TPM_MODEL_TIS,
        .caps = QEMU_CAPS_DEVICE_TPM_TIS,
    },
};

/*
 * virQEMUCapsProbeQMPTPM:
 * @qemuCaps: capabilities object to update
 * @mon: monitor to query
 *
 * Asks the monitor for the TPM models and then the TPM backend types,
 * setting the flag of every table entry whose name appears in the
 * corresponding reply.
 *
 * Returns 0 on success, -1 if either monitor query fails.
 */
static int
virQEMUCapsProbeQMPTPM(virQEMUCapsPtr qemuCaps,
                       qemuMonitorPtr mon)
{
    char **names = NULL;
    int nnames;
    size_t idx;

    /* TPM models */
    nnames = qemuMonitorGetTPMModels(mon, &names);
    if (nnames < 0)
        return -1;

    if (nnames > 0) {
        for (idx = 0; idx < ARRAY_CARDINALITY(virQEMUCapsTPMModelsToCaps); idx++) {
            const char *wanted = virDomainTPMModelTypeToString(
                virQEMUCapsTPMModelsToCaps[idx].type);

            if (virStringArrayHasString(names, wanted))
                virQEMUCapsSet(qemuCaps,
                               virQEMUCapsTPMModelsToCaps[idx].caps);
        }
    }
    virStringFreeList(names);

    /* TPM backend types */
    nnames = qemuMonitorGetTPMTypes(mon, &names);
    if (nnames < 0)
        return -1;

    if (nnames > 0) {
        for (idx = 0; idx < ARRAY_CARDINALITY(virQEMUCapsTPMTypesToCaps); idx++) {
            const char *wanted = virDomainTPMBackendTypeToString(
                virQEMUCapsTPMTypesToCaps[idx].type);

            if (virStringArrayHasString(names, wanted))
                virQEMUCapsSet(qemuCaps, virQEMUCapsTPMTypesToCaps[idx].caps);
        }
    }
    virStringFreeList(names);

    return 0;
}

2405

2406
static int
2407 2408
virQEMUCapsProbeQMPKVMState(virQEMUCapsPtr qemuCaps,
                            qemuMonitorPtr mon)
2409 2410 2411 2412
{
    bool enabled = false;
    bool present = false;

2413
    if (!virQEMUCapsGet(qemuCaps, QEMU_CAPS_KVM))
2414 2415 2416 2417 2418 2419
        return 0;

    if (qemuMonitorGetKVMState(mon, &enabled, &present) < 0)
        return -1;

    /* The QEMU_CAPS_KVM flag was initially set according to the QEMU
2420
     * reporting the recognition of 'query-kvm' QMP command. That merely
N
Nehal J Wani 已提交
2421
     * indicates existence of the command though, not whether KVM support
2422 2423 2424 2425 2426 2427
     * is actually available, nor whether it is enabled by default.
     *
     * If it is not present we need to clear the flag, and if it is
     * not enabled by default we need to change the flag.
     */
    if (!present) {
2428
        virQEMUCapsClear(qemuCaps, QEMU_CAPS_KVM);
2429
    } else if (!enabled) {
2430 2431
        virQEMUCapsClear(qemuCaps, QEMU_CAPS_KVM);
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_ENABLE_KVM);
2432 2433 2434 2435 2436
    }

    return 0;
}

2437 2438 2439 2440 2441 2442 2443 2444
struct virQEMUCapsCommandLineProps {
    const char *option;
    const char *param;
    int flag;
};

static struct virQEMUCapsCommandLineProps virQEMUCapsCommandLine[] = {
    { "machine", "mem-merge", QEMU_CAPS_MEM_MERGE },
O
Osier Yang 已提交
2445
    { "drive", "discard", QEMU_CAPS_DRIVE_DISCARD },
2446
    { "realtime", "mlock", QEMU_CAPS_MLOCK },
2447
    { "boot-opts", "strict", QEMU_CAPS_BOOT_STRICT },
2448
    { "boot-opts", "reboot-timeout", QEMU_CAPS_REBOOT_TIMEOUT },
2449
    { "boot-opts", "splash-time", QEMU_CAPS_SPLASH_TIMEOUT },
2450
    { "spice", "disable-agent-file-xfer", QEMU_CAPS_SPICE_FILE_XFER_DISABLE },
2451
    { "msg", "timestamp", QEMU_CAPS_MSG_TIMESTAMP },
2452
    { "numa", NULL, QEMU_CAPS_NUMA },
2453 2454 2455 2456 2457 2458
};

/*
 * virQEMUCapsProbeQMPCommandLine:
 * @qemuCaps: capabilities object to update
 * @mon: monitor to query
 *
 * For each entry of virQEMUCapsCommandLine, asks the monitor for the
 * parameters of the entry's option.  The entry's flag is set when the
 * option was found and the entry names no parameter, or when the
 * named parameter is among those returned.
 *
 * Returns 0 on success, -1 if a monitor query fails.
 */
static int
virQEMUCapsProbeQMPCommandLine(virQEMUCapsPtr qemuCaps,
                               qemuMonitorPtr mon)
{
    bool optionFound = false;
    char **params;
    int nparams;
    size_t opt, p;

    for (opt = 0; opt < ARRAY_CARDINALITY(virQEMUCapsCommandLine); opt++) {
        nparams = qemuMonitorGetCommandLineOptionParameters(mon,
                                                            virQEMUCapsCommandLine[opt].option,
                                                            &params,
                                                            &optionFound);
        if (nparams < 0)
            return -1;

        /* Entries without a parameter only need the option to exist */
        if (optionFound && !virQEMUCapsCommandLine[opt].param)
            virQEMUCapsSet(qemuCaps, virQEMUCapsCommandLine[opt].flag);

        for (p = 0; p < nparams; p++) {
            if (!STREQ_NULLABLE(virQEMUCapsCommandLine[opt].param, params[p]))
                continue;

            virQEMUCapsSet(qemuCaps, virQEMUCapsCommandLine[opt].flag);
            break;
        }
        virStringFreeList(params);
    }

    return 0;
}
2485

2486 2487 2488 2489 2490 2491 2492 2493 2494 2495 2496 2497 2498 2499 2500 2501 2502 2503 2504
/*
 * virQEMUCapsProbeQMPMigrationCapabilities:
 * @qemuCaps: capabilities object to update
 * @mon: monitor to query
 *
 * Fetches the migration capability list from the monitor and sets the
 * flags listed in virQEMUCapsMigration.
 *
 * Returns 0 on success, -1 if the list cannot be fetched.
 */
static int
virQEMUCapsProbeQMPMigrationCapabilities(virQEMUCapsPtr qemuCaps,
                                         qemuMonitorPtr mon)
{
    char **migCaps = NULL;
    int nmigCaps = qemuMonitorGetMigrationCapabilities(mon, &migCaps);

    if (nmigCaps < 0)
        return -1;

    virQEMUCapsProcessStringFlags(qemuCaps,
                                  ARRAY_CARDINALITY(virQEMUCapsMigration),
                                  virQEMUCapsMigration,
                                  nmigCaps, migCaps);
    virQEMUCapsFreeStringList(nmigCaps, migCaps);

    return 0;
}

2505 2506
/*
 * virQEMUCapsProbeQMP:
 * @qemuCaps: capabilities object to update
 * @mon: monitor to query
 *
 * Probes the monitor's commands and events, unless @qemuCaps is
 * already marked as having used QMP, in which case nothing is done.
 *
 * Returns 0 on success (or when skipped), -1 if a probe fails.
 */
int virQEMUCapsProbeQMP(virQEMUCapsPtr qemuCaps,
                        qemuMonitorPtr mon)
{
    VIR_DEBUG("qemuCaps=%p mon=%p", qemuCaps, mon);

    if (qemuCaps->usedQMP)
        return 0;

    /* Events are only probed once the command probe has succeeded */
    if (virQEMUCapsProbeQMPCommands(qemuCaps, mon) < 0 ||
        virQEMUCapsProbeQMPEvents(qemuCaps, mon) < 0)
        return -1;

    return 0;
}


2523 2524 2525 2526 2527 2528 2529 2530 2531 2532 2533 2534 2535 2536 2537 2538 2539 2540 2541 2542 2543 2544 2545 2546 2547 2548
/*
 * virQEMUCapsLoadCache:
 * @qemuCaps: capabilities object to fill from the cache file
 * @filename: path of the XML cache file
 * @qemuctime: receives the <qemuctime> value
 * @selfctime: receives the <selfctime> value
 *
 * Parsing a doc that looks like
 *
 * <qemuCaps>
 *   <qemuctime>234235253</qemuctime>
 *   <selfctime>234235253</selfctime>
 *   <usedQMP/>
 *   <flag name='foo'/>
 *   <flag name='bar'/>
 *   ...
 *   <version>...</version>
 *   <kvmVersion>...</kvmVersion>
 *   <arch>...</arch>
 *   <cpu name="pentium3"/>
 *   ...
 *   <machine name="pc-1.0" alias="pc" maxCpus="4"/>
 *   ...
 * </qemuCaps>
 *
 * Returns 0 on success, -1 on any parse or allocation failure.  On
 * failure @qemuCaps may be partially filled, but its element counts
 * never exceed what has actually been allocated, so it can be torn
 * down safely.
 */
static int
virQEMUCapsLoadCache(virQEMUCapsPtr qemuCaps, const char *filename,
                     time_t *qemuctime, time_t *selfctime)
{
    xmlDocPtr doc = NULL;
    int ret = -1;
    size_t i;
    int n;
    xmlNodePtr *nodes = NULL;
    xmlXPathContextPtr ctxt = NULL;
    char *str = NULL;
    long long int l;

    if (!(doc = virXMLParseFile(filename)))
        goto cleanup;

    if (!(ctxt = xmlXPathNewContext(doc))) {
        virReportOOMError();
        goto cleanup;
    }

    ctxt->node = xmlDocGetRootElement(doc);

    if (STRNEQ((const char *)ctxt->node->name, "qemuCaps")) {
        virReportError(VIR_ERR_XML_ERROR,
                       _("unexpected root element <%s>, "
                         "expecting <qemuCaps>"),
                       ctxt->node->name);
        goto cleanup;
    }

    if (virXPathLongLong("string(./qemuctime)", ctxt, &l) < 0) {
        virReportError(VIR_ERR_XML_ERROR, "%s",
                       _("missing qemuctime in QEMU capabilities XML"));
        goto cleanup;
    }
    *qemuctime = (time_t)l;

    if (virXPathLongLong("string(./selfctime)", ctxt, &l) < 0) {
        virReportError(VIR_ERR_XML_ERROR, "%s",
                       _("missing selfctime in QEMU capabilities XML"));
        goto cleanup;
    }
    *selfctime = (time_t)l;

    qemuCaps->usedQMP = virXPathBoolean("count(./usedQMP) > 0",
                                        ctxt) > 0;

    if ((n = virXPathNodeSet("./flag", ctxt, &nodes)) < 0) {
        virReportError(VIR_ERR_INTERNAL_ERROR, "%s",
                       _("failed to parse qemu capabilities flags"));
        goto cleanup;
    }
    VIR_DEBUG("Got flags %d", n);
    if (n > 0) {
        for (i = 0; i < n; i++) {
            int flag;
            if (!(str = virXMLPropString(nodes[i], "name"))) {
                virReportError(VIR_ERR_INTERNAL_ERROR, "%s",
                               _("missing flag name in QEMU capabilities cache"));
                goto cleanup;
            }
            flag = virQEMUCapsTypeFromString(str);
            if (flag < 0) {
                virReportError(VIR_ERR_INTERNAL_ERROR,
                               _("Unknown qemu capabilities flag %s"), str);
                goto cleanup;
            }
            VIR_FREE(str);
            virQEMUCapsSet(qemuCaps, flag);
        }
    }
    VIR_FREE(nodes);

    if (virXPathUInt("string(./version)", ctxt, &qemuCaps->version) < 0) {
        virReportError(VIR_ERR_INTERNAL_ERROR, "%s",
                       _("missing version in QEMU capabilities cache"));
        goto cleanup;
    }

    if (virXPathUInt("string(./kvmVersion)", ctxt, &qemuCaps->kvmVersion) < 0) {
        /* Name the element that is actually missing */
        virReportError(VIR_ERR_INTERNAL_ERROR, "%s",
                       _("missing kvmVersion in QEMU capabilities cache"));
        goto cleanup;
    }

    if (!(str = virXPathString("string(./arch)", ctxt))) {
        virReportError(VIR_ERR_INTERNAL_ERROR, "%s",
                       _("missing arch in QEMU capabilities cache"));
        goto cleanup;
    }
    if (!(qemuCaps->arch = virArchFromString(str))) {
        virReportError(VIR_ERR_INTERNAL_ERROR,
                       _("unknown arch %s in QEMU capabilities cache"), str);
        goto cleanup;
    }
    VIR_FREE(str);

    if ((n = virXPathNodeSet("./cpu", ctxt, &nodes)) < 0) {
        virReportError(VIR_ERR_INTERNAL_ERROR, "%s",
                       _("failed to parse qemu capabilities cpus"));
        goto cleanup;
    }
    if (n > 0) {
        if (VIR_ALLOC_N(qemuCaps->cpuDefinitions, n) < 0)
            goto cleanup;
        /* Publish the count only once the array exists: teardown
         * (see virQEMUCapsDispose) indexes cpuDefinitions[] for every
         * element below ncpuDefinitions, so a count without an array
         * would dereference NULL after a failed allocation. */
        qemuCaps->ncpuDefinitions = n;

        for (i = 0; i < n; i++) {
            if (!(qemuCaps->cpuDefinitions[i] = virXMLPropString(nodes[i], "name"))) {
                virReportError(VIR_ERR_INTERNAL_ERROR, "%s",
                               _("missing cpu name in QEMU capabilities cache"));
                goto cleanup;
            }
        }
    }
    VIR_FREE(nodes);


    if ((n = virXPathNodeSet("./machine", ctxt, &nodes)) < 0) {
        virReportError(VIR_ERR_INTERNAL_ERROR, "%s",
                       _("failed to parse qemu capabilities machines"));
        goto cleanup;
    }
    if (n > 0) {
        if (VIR_ALLOC_N(qemuCaps->machineTypes, n) < 0 ||
            VIR_ALLOC_N(qemuCaps->machineAliases, n) < 0 ||
            VIR_ALLOC_N(qemuCaps->machineMaxCpus, n) < 0)
            goto cleanup;
        /* Same ordering rule as for the cpu list: all three parallel
         * arrays must exist before the shared count becomes non-zero. */
        qemuCaps->nmachineTypes = n;

        for (i = 0; i < n; i++) {
            if (!(qemuCaps->machineTypes[i] = virXMLPropString(nodes[i], "name"))) {
                virReportError(VIR_ERR_INTERNAL_ERROR, "%s",
                               _("missing machine name in QEMU capabilities cache"));
                goto cleanup;
            }
            /* The alias attribute is optional; a NULL result is kept */
            qemuCaps->machineAliases[i] = virXMLPropString(nodes[i], "alias");

            /* maxCpus is optional too; the slot stays 0 when absent */
            str = virXMLPropString(nodes[i], "maxCpus");
            if (str &&
                virStrToLong_ui(str, NULL, 10, &(qemuCaps->machineMaxCpus[i])) < 0) {
                virReportError(VIR_ERR_INTERNAL_ERROR, "%s",
                               _("malformed machine cpu count in QEMU capabilities cache"));
                goto cleanup;
            }
            VIR_FREE(str);
        }
    }
    VIR_FREE(nodes);

    ret = 0;
 cleanup:
    VIR_FREE(str);
    VIR_FREE(nodes);
    xmlXPathFreeContext(ctxt);
    xmlFreeDoc(doc);
    return ret;
}


/**
 * virQEMUCapsSaveCache:
 * @qemuCaps: capabilities to serialize
 * @filename: path of the cache file to write
 *
 * Formats @qemuCaps as a <qemuCaps> XML document (timestamps, the
 * usedQMP marker, every set capability flag, versions, architecture,
 * CPU definitions and machine types) and writes it to @filename via
 * virFileWriteStr() with 0600 passed as the mode.
 *
 * Returns 0 on success, -1 on failure.
 */
static int
virQEMUCapsSaveCache(virQEMUCapsPtr qemuCaps, const char *filename)
{
    virBuffer buf = VIR_BUFFER_INITIALIZER;
    char *xml = NULL;
    int ret = -1;
    size_t i;

    virBufferAddLit(&buf, "<qemuCaps>\n");
    virBufferAdjustIndent(&buf, 2);

    /* Both timestamps are passed as (signed) long long, so the matching
     * conversion is %lld - the same one the VIR_DEBUG below uses. */
    virBufferAsprintf(&buf, "<qemuctime>%lld</qemuctime>\n",
                      (long long)qemuCaps->ctime);
    virBufferAsprintf(&buf, "<selfctime>%lld</selfctime>\n",
                      (long long)virGetSelfLastChanged());

    if (qemuCaps->usedQMP)
        virBufferAddLit(&buf, "<usedQMP/>\n");

    /* One <flag/> element per capability bit that is currently set */
    for (i = 0; i < QEMU_CAPS_LAST; i++) {
        if (virQEMUCapsGet(qemuCaps, i)) {
            virBufferAsprintf(&buf, "<flag name='%s'/>\n",
                              virQEMUCapsTypeToString(i));
        }
    }

    virBufferAsprintf(&buf, "<version>%d</version>\n",
                      qemuCaps->version);

    virBufferAsprintf(&buf, "<kvmVersion>%d</kvmVersion>\n",
                      qemuCaps->kvmVersion);

    virBufferAsprintf(&buf, "<arch>%s</arch>\n",
                      virArchToString(qemuCaps->arch));

    for (i = 0; i < qemuCaps->ncpuDefinitions; i++) {
        virBufferEscapeString(&buf, "<cpu name='%s'/>\n",
                              qemuCaps->cpuDefinitions[i]);
    }

    for (i = 0; i < qemuCaps->nmachineTypes; i++) {
        virBufferEscapeString(&buf, "<machine name='%s'",
                              qemuCaps->machineTypes[i]);
        /* The alias attribute is only emitted when an alias is recorded */
        if (qemuCaps->machineAliases[i])
            virBufferEscapeString(&buf, " alias='%s'",
                                  qemuCaps->machineAliases[i]);
        virBufferAsprintf(&buf, " maxCpus='%u'/>\n",
                          qemuCaps->machineMaxCpus[i]);
    }

    virBufferAdjustIndent(&buf, -2);
    virBufferAddLit(&buf, "</qemuCaps>\n");

    if (virBufferCheckError(&buf) < 0)
        goto cleanup;

    xml = virBufferContentAndReset(&buf);

    if (virFileWriteStr(filename, xml, 0600) < 0) {
        virReportSystemError(errno,
                             _("Failed to save '%s' for '%s'"),
                             filename, qemuCaps->binary);
        goto cleanup;
    }

    VIR_DEBUG("Saved caps '%s' for '%s' with (%lld, %lld)",
              filename, qemuCaps->binary,
              (long long)qemuCaps->ctime,
              (long long)virGetSelfLastChanged());

    ret = 0;
 cleanup:
    VIR_FREE(xml);
    return ret;
}

/**
 * virQEMUCapsRememberCached:
 * @qemuCaps: capabilities to store
 * @cacheDir: base cache directory
 *
 * Saves @qemuCaps to "<cacheDir>/capabilities/<hash>.xml", where <hash>
 * is the SHA-256 hash string of the binary path. The "capabilities"
 * directory is created first.
 *
 * Returns 0 on success, -1 on failure.
 */
static int
virQEMUCapsRememberCached(virQEMUCapsPtr qemuCaps, const char *cacheDir)
{
    char *binaryhash = NULL;
    char *capsdir = NULL;
    char *capsfile = NULL;
    int ret = -1;

    /* Build directory name, hash and file name; stop at the first failure */
    if (virAsprintf(&capsdir, "%s/capabilities", cacheDir) < 0 ||
        virCryptoHashString(VIR_CRYPTO_HASH_SHA256,
                            qemuCaps->binary,
                            &binaryhash) < 0 ||
        virAsprintf(&capsfile, "%s/%s.xml", capsdir, binaryhash) < 0)
        goto cleanup;

    if (virFileMakePath(capsdir) < 0) {
        virReportSystemError(errno,
                             _("Unable to create directory '%s'"),
                             capsdir);
        goto cleanup;
    }

    if (virQEMUCapsSaveCache(qemuCaps, capsfile) >= 0)
        ret = 0;

 cleanup:
    VIR_FREE(binaryhash);
    VIR_FREE(capsfile);
    VIR_FREE(capsdir);
    return ret;
}


/**
 * virQEMUCapsReset:
 * @qemuCaps: capabilities object to wipe
 *
 * Clears all capability flags, zeroes the versions, resets the
 * architecture and usedQMP marker, and frees the CPU definition and
 * machine type arrays.
 */
static void
virQEMUCapsReset(virQEMUCapsPtr qemuCaps)
{
    size_t idx;

    virBitmapClearAll(qemuCaps->flags);
    qemuCaps->version = 0;
    qemuCaps->kvmVersion = 0;
    qemuCaps->arch = VIR_ARCH_NONE;
    qemuCaps->usedQMP = false;

    /* CPU definitions: free each name, then the array itself */
    for (idx = 0; idx < qemuCaps->ncpuDefinitions; idx++)
        VIR_FREE(qemuCaps->cpuDefinitions[idx]);
    VIR_FREE(qemuCaps->cpuDefinitions);
    qemuCaps->ncpuDefinitions = 0;

    /* Machine types: names and aliases are strings, maxCpus is plain data */
    for (idx = 0; idx < qemuCaps->nmachineTypes; idx++) {
        VIR_FREE(qemuCaps->machineTypes[idx]);
        VIR_FREE(qemuCaps->machineAliases[idx]);
    }
    VIR_FREE(qemuCaps->machineTypes);
    VIR_FREE(qemuCaps->machineAliases);
    VIR_FREE(qemuCaps->machineMaxCpus);
    qemuCaps->nmachineTypes = 0;
}


/**
 * virQEMUCapsInitCached:
 * @qemuCaps: capabilities object to fill; its binary and ctime are read
 * @cacheDir: base cache directory
 *
 * Tries to populate @qemuCaps from "<cacheDir>/capabilities/<hash>.xml".
 *
 * Returns 1 if the cached capabilities were loaded, 0 if there is no
 * usable cache (file missing, failed to load, or outdated), -1 on error.
 */
static int
virQEMUCapsInitCached(virQEMUCapsPtr qemuCaps, const char *cacheDir)
{
    char *binaryhash = NULL;
    char *capsdir = NULL;
    char *capsfile = NULL;
    time_t qemuctime;
    time_t selfctime;
    struct stat sb;
    int ret = -1;

    if (virAsprintf(&capsdir, "%s/capabilities", cacheDir) < 0 ||
        virCryptoHashString(VIR_CRYPTO_HASH_SHA256,
                            qemuCaps->binary,
                            &binaryhash) < 0 ||
        virAsprintf(&capsfile, "%s/%s.xml", capsdir, binaryhash) < 0)
        goto cleanup;

    if (virFileMakePath(capsdir) < 0) {
        virReportSystemError(errno,
                             _("Unable to create directory '%s'"),
                             capsdir);
        goto cleanup;
    }

    if (stat(capsfile, &sb) < 0) {
        if (errno != ENOENT) {
            virReportSystemError(errno,
                                 _("Unable to access cache '%s' for '%s'"),
                                 capsfile, qemuCaps->binary);
            goto cleanup;
        }

        /* A missing cache file is not an error, just a cache miss */
        VIR_DEBUG("No cached capabilities '%s' for '%s'",
                  capsfile, qemuCaps->binary);
        ret = 0;
        goto cleanup;
    }

    if (virQEMUCapsLoadCache(qemuCaps, capsfile, &qemuctime, &selfctime) < 0) {
        virErrorPtr err = virGetLastError();

        /* An unloadable cache is treated as a miss: warn, drop the
         * error and discard whatever was partially loaded */
        VIR_WARN("Failed to load cached caps from '%s' for '%s': %s",
                 capsfile, qemuCaps->binary, err ? NULLSTR(err->message) :
                 _("unknown error"));
        virResetLastError();
        virQEMUCapsReset(qemuCaps);
        ret = 0;
        goto cleanup;
    }

    /* Discard the cache if the QEMU binary's ctime differs from the
     * recorded one, or the cache is older than virGetSelfLastChanged() */
    if (qemuctime != qemuCaps->ctime ||
        selfctime < virGetSelfLastChanged()) {
        VIR_DEBUG("Outdated cached capabilities '%s' for '%s' "
                  "(%lld vs %lld, %lld vs %lld)",
                  capsfile, qemuCaps->binary,
                  (long long)qemuctime, (long long)qemuCaps->ctime,
                  (long long)selfctime, (long long)virGetSelfLastChanged());
        ignore_value(unlink(capsfile));
        virQEMUCapsReset(qemuCaps);
        ret = 0;
        goto cleanup;
    }

    VIR_DEBUG("Loaded '%s' for '%s' ctime %lld usedQMP=%d",
              capsfile, qemuCaps->binary,
              (long long)qemuCaps->ctime, qemuCaps->usedQMP);
    ret = 1;

 cleanup:
    VIR_FREE(binaryhash);
    VIR_FREE(capsfile);
    VIR_FREE(capsdir);
    return ret;
}


2925 2926
#define QEMU_SYSTEM_PREFIX "qemu-system-"

2927
static int
2928
virQEMUCapsInitHelp(virQEMUCapsPtr qemuCaps, uid_t runUid, gid_t runGid)
2929
{
2930
    virCommandPtr cmd = NULL;
2931
    bool is_kvm;
2932
    char *help = NULL;
2933 2934
    int ret = -1;
    const char *tmp;
2935

2936
    VIR_DEBUG("qemuCaps=%p", qemuCaps);
2937

2938
    tmp = strstr(qemuCaps->binary, QEMU_SYSTEM_PREFIX);
2939 2940
    if (tmp) {
        tmp += strlen(QEMU_SYSTEM_PREFIX);
2941

2942
        qemuCaps->arch = virQEMUCapsArchFromString(tmp);
2943
    } else {
2944
        qemuCaps->arch = virArchFromHost();
2945 2946
    }

2947
    cmd = virQEMUCapsProbeCommand(qemuCaps->binary, NULL, runUid, runGid);
2948 2949 2950 2951
    virCommandAddArgList(cmd, "-help", NULL);
    virCommandSetOutputBuffer(cmd, &help);

    if (virCommandRun(cmd, NULL) < 0)
2952
        goto cleanup;
2953

2954 2955 2956 2957 2958 2959
    if (virQEMUCapsParseHelpStr(qemuCaps->binary,
                                help, qemuCaps,
                                &qemuCaps->version,
                                &is_kvm,
                                &qemuCaps->kvmVersion,
                                false) < 0)
2960
        goto cleanup;
2961

D
Daniel P. Berrange 已提交
2962 2963 2964 2965 2966 2967 2968
    /* x86_64 and i686 support PCI-multibus on all machine types
     * since forever. For other architectures, it has been changing
     * across releases, per machine type, so we can't simply detect
     * it here. Thus the rest of the logic is provided in a separate
     * helper virQEMUCapsHasPCIMultiBus() which keys off the machine
     * stored in virDomainDef and QEMU version number
     */
2969
    if (qemuCaps->arch == VIR_ARCH_X86_64 ||
D
Daniel P. Berrange 已提交
2970
        qemuCaps->arch == VIR_ARCH_I686)
2971
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_PCI_MULTIBUS);
D
Daniel P. Berrange 已提交
2972 2973 2974 2975 2976

    /* -no-acpi is not supported on non-x86
     * even if qemu reports it in -help */
    if (qemuCaps->arch != VIR_ARCH_X86_64 &&
        qemuCaps->arch != VIR_ARCH_I686)
2977
        virQEMUCapsClear(qemuCaps, QEMU_CAPS_NO_ACPI);
2978

2979
    /* virQEMUCapsExtractDeviceStr will only set additional caps if qemu
2980
     * understands the 0.13.0+ notion of "-device driver,".  */
2981
    if (virQEMUCapsGet(qemuCaps, QEMU_CAPS_DEVICE) &&
2982
        strstr(help, "-device driver,?") &&
2983 2984
        virQEMUCapsExtractDeviceStr(qemuCaps->binary,
                                    qemuCaps, runUid, runGid) < 0) {
2985
        goto cleanup;
2986
    }
2987

2988
    if (virQEMUCapsProbeCPUModels(qemuCaps, runUid, runGid) < 0)
2989
        goto cleanup;
2990

2991
    if (virQEMUCapsProbeMachineTypes(qemuCaps, runUid, runGid) < 0)
2992
        goto cleanup;
2993

2994
    ret = 0;
2995
 cleanup:
2996
    virCommandFree(cmd);
2997
    VIR_FREE(help);
2998 2999 3000 3001
    return ret;
}


3002
static void virQEMUCapsMonitorNotify(qemuMonitorPtr mon ATTRIBUTE_UNUSED,
3003 3004
                                     virDomainObjPtr vm ATTRIBUTE_UNUSED,
                                     void *opaque ATTRIBUTE_UNUSED)
3005 3006 3007 3008
{
}

static qemuMonitorCallbacks callbacks = {
3009 3010
    .eofNotify = virQEMUCapsMonitorNotify,
    .errorNotify = virQEMUCapsMonitorNotify,
3011 3012 3013 3014 3015 3016 3017
};


/* Capabilities that we assume are always enabled
 * for QEMU >= 1.2.0
 */
static void
3018
virQEMUCapsInitQMPBasic(virQEMUCapsPtr qemuCaps)
3019
{
3020 3021 3022 3023 3024 3025 3026 3027 3028 3029 3030 3031 3032 3033 3034 3035 3036 3037 3038 3039 3040 3041 3042 3043 3044 3045 3046 3047 3048 3049 3050 3051 3052 3053 3054 3055 3056 3057 3058 3059 3060 3061 3062 3063 3064 3065 3066 3067
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_VNC_COLON);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_NO_REBOOT);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_DRIVE);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_NAME);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_UUID);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_VNET_HDR);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_MIGRATE_QEMU_TCP);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_MIGRATE_QEMU_EXEC);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_DRIVE_CACHE_V2);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_DRIVE_FORMAT);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_VGA);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_0_10);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_MEM_PATH);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_DRIVE_SERIAL);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_MIGRATE_QEMU_UNIX);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_CHARDEV);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_MONITOR_JSON);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_BALLOON);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_DEVICE);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_SDL);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_SMP_TOPOLOGY);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_NETDEV);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_RTC);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_VHOST_NET);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_NODEFCONFIG);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_BOOT_MENU);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_FSDEV);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_NAME_PROCESS);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_DRIVE_READONLY);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_SMBIOS_TYPE);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_VGA_NONE);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_MIGRATE_QEMU_FD);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_DRIVE_AIO);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_CHARDEV_SPICEVMC);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_DEVICE_QXL_VGA);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_DRIVE_CACHE_DIRECTSYNC);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_NO_SHUTDOWN);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_DRIVE_CACHE_UNSAFE);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_FSDEV_READONLY);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_VIRTIO_BLK_SG_IO);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_DRIVE_COPY_ON_READ);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_CPU_HOST);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_FSDEV_WRITEOUT);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_DRIVE_IOTUNE);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_WAKEUP);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_NO_USER_CONFIG);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_NETDEV_BRIDGE);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_SECCOMP_SANDBOX);
O
Olivia Yin 已提交
3068
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_DTB);
J
Ján Tomko 已提交
3069
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_IPV6_MIGRATION);
3070 3071
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_MACHINE_OPT);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_DUMP_GUEST_CORE);
3072
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_VNC_SHARE_POLICY);
3073
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_HOST_PCI_MULTIDOMAIN);
3074 3075
}

3076 3077 3078 3079 3080 3081 3082 3083 3084 3085 3086 3087 3088 3089 3090 3091 3092 3093 3094
/* Architecture dependent capabilities.
 *
 * Queries the target architecture from @mon, stores it in @qemuCaps
 * and sets the flags that only apply to x86.
 *
 * Returns 0 on success, -1 on failure.
 */
static int
virQEMUCapsInitArchQMPBasic(virQEMUCapsPtr qemuCaps,
                            qemuMonitorPtr mon)
{
    int ret = -1;
    char *archstr = qemuMonitorGetTargetArch(mon);

    if (!archstr)
        return -1;

    qemuCaps->arch = virQEMUCapsArchFromString(archstr);
    if (qemuCaps->arch == VIR_ARCH_NONE) {
        virReportError(VIR_ERR_INTERNAL_ERROR,
                       _("Unknown QEMU arch %s"), archstr);
        goto cleanup;
    }

    /* x86_64 and i686 support PCI-multibus on all machine types
     * since forever. For other architectures, it has been changing
     * across releases, per machine type, so we can't simply detect
     * it here. Thus the rest of the logic is provided in a separate
     * helper virQEMUCapsHasPCIMultiBus() which keys off the machine
     * stored in virDomainDef and QEMU version number
     *
     * ACPI/HPET/KVM PIT are also x86 specific
     */
    if (qemuCaps->arch == VIR_ARCH_X86_64 ||
        qemuCaps->arch == VIR_ARCH_I686) {
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_PCI_MULTIBUS);
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_NO_ACPI);
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_NO_HPET);
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_NO_KVM_PIT);
    }

    ret = 0;

 cleanup:
    VIR_FREE(archstr);
    return ret;
}
3118

3119 3120 3121 3122 3123 3124 3125 3126 3127 3128 3129 3130 3131 3132 3133 3134 3135 3136 3137 3138 3139 3140 3141 3142 3143 3144 3145 3146 3147 3148 3149 3150 3151 3152 3153 3154 3155 3156 3157 3158 3159 3160 3161 3162 3163 3164 3165 3166 3167 3168 3169 3170 3171
/**
 * virQEMUCapsInitQMPMonitor:
 * @qemuCaps: capabilities object to fill
 * @mon: monitor to query
 *
 * Probes capabilities over the QMP monitor @mon. If the monitor
 * capabilities cannot be set, the version cannot be queried, or the
 * version is older than 1.2, the function returns 0 without marking
 * @qemuCaps as usedQMP. Otherwise it records the version, sets usedQMP,
 * applies the basic, architecture and version dependent flags and runs
 * the individual QMP probes.
 *
 * Returns 0 on success (or when QMP probing is skipped as described
 * above), -1 on failure.
 */
int
virQEMUCapsInitQMPMonitor(virQEMUCapsPtr qemuCaps,
                          qemuMonitorPtr mon)
{
    int ret = -1;
    int major, minor, micro;
    char *package = NULL;

    /* @mon is supposed to be locked by the caller */

    if (qemuMonitorSetCapabilities(mon) < 0) {
        virErrorPtr err = virGetLastError();
        /* err->message may be NULL; never hand NULL to %s */
        VIR_DEBUG("Failed to set monitor capabilities %s",
                  err && err->message ? err->message : "<unknown problem>");
        ret = 0;
        goto cleanup;
    }

    if (qemuMonitorGetVersion(mon,
                              &major, &minor, &micro,
                              &package) < 0) {
        virErrorPtr err = virGetLastError();
        VIR_DEBUG("Failed to query monitor version %s",
                  err && err->message ? err->message : "<unknown problem>");
        ret = 0;
        goto cleanup;
    }

    VIR_DEBUG("Got version %d.%d.%d (%s)",
              major, minor, micro, NULLSTR(package));

    if (major < 1 || (major == 1 && minor < 2)) {
        VIR_DEBUG("Not new enough for QMP capabilities detection");
        ret = 0;
        goto cleanup;
    }

    qemuCaps->version = major * 1000000 + minor * 1000 + micro;
    qemuCaps->usedQMP = true;

    virQEMUCapsInitQMPBasic(qemuCaps);

    if (virQEMUCapsInitArchQMPBasic(qemuCaps, mon) < 0)
        goto cleanup;

    /* USB option is supported v1.3.0 onwards */
    if (qemuCaps->version >= 1003000)
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_MACHINE_USB_OPT);

    /* WebSockets were introduced between 1.3.0 and 1.3.1 */
    if (qemuCaps->version >= 1003001)
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_VNC_WEBSOCKET);

    /* -chardev spiceport is supported from 1.4.0, but usable through
     * qapi only since 1.5.0, however, it still cannot be queried
     * for as a capability */
    if (qemuCaps->version >= 1005000)
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_CHARDEV_SPICEPORT);

    if (qemuCaps->version >= 1006000)
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_DEVICE_VIDEO_PRIMARY);

    if (virQEMUCapsProbeQMPCommands(qemuCaps, mon) < 0)
        goto cleanup;
    if (virQEMUCapsProbeQMPEvents(qemuCaps, mon) < 0)
        goto cleanup;
    if (virQEMUCapsProbeQMPObjects(qemuCaps, mon) < 0)
        goto cleanup;
    if (virQEMUCapsProbeQMPMachineTypes(qemuCaps, mon) < 0)
        goto cleanup;
    if (virQEMUCapsProbeQMPCPUDefinitions(qemuCaps, mon) < 0)
        goto cleanup;
    if (virQEMUCapsProbeQMPKVMState(qemuCaps, mon) < 0)
        goto cleanup;
    if (virQEMUCapsProbeQMPTPM(qemuCaps, mon) < 0)
        goto cleanup;
    if (virQEMUCapsProbeQMPCommandLine(qemuCaps, mon) < 0)
        goto cleanup;
    if (virQEMUCapsProbeQMPMigrationCapabilities(qemuCaps, mon) < 0)
        goto cleanup;

    ret = 0;
 cleanup:
    VIR_FREE(package);
    return ret;
}

3206
static int
3207 3208 3209 3210
virQEMUCapsInitQMP(virQEMUCapsPtr qemuCaps,
                   const char *libDir,
                   uid_t runUid,
                   gid_t runGid)
3211 3212 3213 3214 3215 3216 3217 3218
{
    int ret = -1;
    virCommandPtr cmd = NULL;
    qemuMonitorPtr mon = NULL;
    int status = 0;
    virDomainChrSourceDef config;
    char *monarg = NULL;
    char *monpath = NULL;
3219
    char *pidfile = NULL;
3220
    pid_t pid = 0;
3221 3222
    virDomainObjPtr vm = NULL;
    virDomainXMLOptionPtr xmlopt = NULL;
3223

3224 3225 3226
    /* the ".sock" sufix is important to avoid a possible clash with a qemu
     * domain called "capabilities"
     */
3227
    if (virAsprintf(&monpath, "%s/%s", libDir, "capabilities.monitor.sock") < 0)
3228
        goto cleanup;
3229
    if (virAsprintf(&monarg, "unix:%s,server,nowait", monpath) < 0)
3230 3231
        goto cleanup;

3232 3233
    /* ".pidfile" suffix is used rather than ".pid" to avoid a possible clash
     * with a qemu domain called "capabilities"
3234 3235 3236
     * Normally we'd use runDir for pid files, but because we're using
     * -daemonize we need QEMU to be allowed to create them, rather
     * than libvirtd. So we're using libDir which QEMU can write to
3237
     */
3238
    if (virAsprintf(&pidfile, "%s/%s", libDir, "capabilities.pidfile") < 0)
3239 3240
        goto cleanup;

3241 3242 3243 3244 3245
    memset(&config, 0, sizeof(config));
    config.type = VIR_DOMAIN_CHR_TYPE_UNIX;
    config.data.nix.path = monpath;
    config.data.nix.listen = false;

3246 3247
    virPidFileForceCleanupPath(pidfile);

3248
    VIR_DEBUG("Try to get caps via QMP qemuCaps=%p", qemuCaps);
3249

3250 3251 3252 3253 3254 3255 3256
    /*
     * We explicitly need to use -daemonize here, rather than
     * virCommandDaemonize, because we need to synchronize
     * with QEMU creating its monitor socket API. Using
     * daemonize guarantees control won't return to libvirt
     * until the socket is present.
     */
3257
    cmd = virCommandNewArgList(qemuCaps->binary,
3258 3259 3260 3261 3262 3263
                               "-S",
                               "-no-user-config",
                               "-nodefaults",
                               "-nographic",
                               "-M", "none",
                               "-qmp", monarg,
3264 3265
                               "-pidfile", pidfile,
                               "-daemonize",
3266 3267 3268
                               NULL);
    virCommandAddEnvPassCommon(cmd);
    virCommandClearCaps(cmd);
3269 3270
    virCommandSetGID(cmd, runGid);
    virCommandSetUID(cmd, runUid);
3271

3272
    /* Log, but otherwise ignore, non-zero status.  */
3273 3274 3275 3276 3277
    if (virCommandRun(cmd, &status) < 0)
        goto cleanup;

    if (status != 0) {
        ret = 0;
3278
        VIR_DEBUG("QEMU %s exited with status %d", qemuCaps->binary, status);
3279 3280 3281
        goto cleanup;
    }

3282 3283 3284 3285 3286 3287
    if (virPidFileReadPath(pidfile, &pid) < 0) {
        VIR_DEBUG("Failed to read pidfile %s", pidfile);
        ret = 0;
        goto cleanup;
    }

3288 3289 3290 3291 3292
    if (!(xmlopt = virDomainXMLOptionNew(NULL, NULL, NULL)) ||
        !(vm = virDomainObjNew(xmlopt)))
        goto cleanup;

    vm->pid = pid;
3293

3294
    if (!(mon = qemuMonitorOpen(vm, &config, true, &callbacks, NULL))) {
3295
        ret = 0;
3296
        goto cleanup;
3297
    }
3298

3299
    virObjectLock(mon);
3300

3301
    if (virQEMUCapsInitQMPMonitor(qemuCaps, mon) < 0)
3302
        goto cleanup;
3303 3304 3305

    ret = 0;

3306
 cleanup:
3307
    if (mon)
3308
        virObjectUnlock(mon);
3309 3310
    qemuMonitorClose(mon);
    virCommandAbort(cmd);
3311
    virCommandFree(cmd);
3312
    VIR_FREE(monarg);
3313 3314
    if (monpath)
        ignore_value(unlink(monpath));
3315
    VIR_FREE(monpath);
3316 3317
    virObjectUnref(vm);
    virObjectUnref(xmlopt);
3318

3319
    if (pid != 0) {
3320 3321
        char ebuf[1024];

3322 3323 3324 3325 3326 3327 3328
        VIR_DEBUG("Killing QMP caps process %lld", (long long) pid);
        if (virProcessKill(pid, SIGKILL) < 0 && errno != ESRCH)
            VIR_ERROR(_("Failed to kill process %lld: %s"),
                      (long long) pid,
                      virStrerror(errno, ebuf, sizeof(ebuf)));
    }
    if (pidfile) {
3329 3330 3331
        unlink(pidfile);
        VIR_FREE(pidfile);
    }
3332 3333 3334 3335
    return ret;
}


3336 3337 3338 3339 3340 3341 3342 3343 3344 3345 3346 3347
#define MESSAGE_ID_CAPS_PROBE_FAILURE "8ae2f3fb-2dbe-498e-8fbd-012d40afa361"

static void
virQEMUCapsLogProbeFailure(const char *binary)
{
    virLogMetadata meta[] = {
        { .key = "MESSAGE_ID", .s = MESSAGE_ID_CAPS_PROBE_FAILURE, .iv = 0 },
        { .key = "LIBVIRT_QEMU_BINARY", .s = binary, .iv = 0 },
        { .key = NULL },
    };
    virErrorPtr err = virGetLastError();

3348
    virLogMessage(&virLogSelf,
3349 3350 3351 3352 3353 3354 3355 3356 3357
                  VIR_LOG_WARN,
                  __FILE__, __LINE__, __func__,
                  meta,
                  _("Failed to probe capabilities for %s: %s"),
                  binary, err && err->message ? err->message :
                  _("unknown failure"));
}


3358 3359
virQEMUCapsPtr virQEMUCapsNewForBinary(const char *binary,
                                       const char *libDir,
3360
                                       const char *cacheDir,
3361 3362
                                       uid_t runUid,
                                       gid_t runGid)
3363
{
3364
    virQEMUCapsPtr qemuCaps;
3365 3366 3367
    struct stat sb;
    int rv;

3368 3369 3370
    if (!(qemuCaps = virQEMUCapsNew()))
        goto error;

3371 3372
    if (VIR_STRDUP(qemuCaps->binary, binary) < 0)
        goto error;
3373 3374 3375 3376 3377 3378 3379 3380

    /* We would also want to check faccessat if we cared about ACLs,
     * but we don't.  */
    if (stat(binary, &sb) < 0) {
        virReportSystemError(errno, _("Cannot check QEMU binary %s"),
                             binary);
        goto error;
    }
3381
    qemuCaps->ctime = sb.st_ctime;
3382 3383 3384 3385 3386 3387 3388 3389 3390 3391 3392

    /* Make sure the binary we are about to try exec'ing exists.
     * Technically we could catch the exec() failure, but that's
     * in a sub-process so it's hard to feed back a useful error.
     */
    if (!virFileIsExecutable(binary)) {
        virReportSystemError(errno, _("QEMU binary %s is not executable"),
                             binary);
        goto error;
    }

3393
    if ((rv = virQEMUCapsInitCached(qemuCaps, cacheDir)) < 0)
3394 3395
        goto error;

3396 3397 3398 3399 3400 3401 3402 3403 3404 3405 3406 3407 3408 3409
    if (rv == 0) {
        if (virQEMUCapsInitQMP(qemuCaps, libDir, runUid, runGid) < 0) {
            virQEMUCapsLogProbeFailure(binary);
            goto error;
        }

        if (!qemuCaps->usedQMP &&
            virQEMUCapsInitHelp(qemuCaps, runUid, runGid) < 0) {
            virQEMUCapsLogProbeFailure(binary);
            goto error;
        }

        if (virQEMUCapsRememberCached(qemuCaps, cacheDir) < 0)
            goto error;
3410
    }
3411

3412
    return qemuCaps;
3413

3414
 error:
3415 3416
    virObjectUnref(qemuCaps);
    qemuCaps = NULL;
3417
    return NULL;
3418 3419 3420
}


3421
/**
 * virQEMUCapsIsValid:
 * @qemuCaps: capabilities object to check
 *
 * Returns true when @qemuCaps has no binary recorded, or when the
 * binary can be stat()ed and its ctime equals the recorded one;
 * false otherwise.
 */
bool
virQEMUCapsIsValid(virQEMUCapsPtr qemuCaps)
{
    struct stat sb;

    if (qemuCaps->binary == NULL)
        return true;

    return stat(qemuCaps->binary, &sb) >= 0 &&
           sb.st_ctime == qemuCaps->ctime;
}
3433 3434


3435 3436
virQEMUCapsCachePtr
virQEMUCapsCacheNew(const char *libDir,
3437
                    const char *cacheDir,
3438 3439
                    uid_t runUid,
                    gid_t runGid)
3440
{
3441
    virQEMUCapsCachePtr cache;
3442

3443
    if (VIR_ALLOC(cache) < 0)
3444 3445 3446 3447 3448 3449 3450 3451 3452
        return NULL;

    if (virMutexInit(&cache->lock) < 0) {
        virReportError(VIR_ERR_INTERNAL_ERROR, "%s",
                       _("Unable to initialize mutex"));
        VIR_FREE(cache);
        return NULL;
    }

E
Eric Blake 已提交
3453
    if (!(cache->binaries = virHashCreate(10, virObjectFreeHashData)))
3454
        goto error;
3455
    if (VIR_STRDUP(cache->libDir, libDir) < 0)
3456
        goto error;
3457 3458
    if (VIR_STRDUP(cache->cacheDir, cacheDir) < 0)
        goto error;
3459

3460 3461 3462
    cache->runUid = runUid;
    cache->runGid = runGid;

3463 3464
    return cache;

3465
 error:
3466
    virQEMUCapsCacheFree(cache);
3467 3468 3469 3470
    return NULL;
}


3471 3472
/**
 * virQEMUCapsCacheLookup:
 * @cache: capabilities cache
 * @binary: path to the QEMU binary
 *
 * Looks up the capabilities for @binary while holding the cache lock.
 * An entry that is no longer valid is removed; a missing entry is
 * created with virQEMUCapsNewForBinary() and added to the cache.
 *
 * Returns the capabilities after virObjectRef() was called on them,
 * or NULL on failure.
 */
virQEMUCapsPtr
virQEMUCapsCacheLookup(virQEMUCapsCachePtr cache, const char *binary)
{
    virQEMUCapsPtr caps = NULL;

    virMutexLock(&cache->lock);

    caps = virHashLookup(cache->binaries, binary);
    if (caps != NULL && !virQEMUCapsIsValid(caps)) {
        VIR_DEBUG("Cached capabilities %p no longer valid for %s",
                  caps, binary);
        virHashRemoveEntry(cache->binaries, binary);
        caps = NULL;
    }

    if (caps == NULL) {
        VIR_DEBUG("Creating capabilities for %s",
                  binary);
        caps = virQEMUCapsNewForBinary(binary, cache->libDir,
                                       cache->cacheDir,
                                       cache->runUid, cache->runGid);
        if (caps != NULL) {
            VIR_DEBUG("Caching capabilities %p for %s",
                      caps, binary);
            /* If the table refuses the entry, drop the new object */
            if (virHashAddEntry(cache->binaries, binary, caps) < 0) {
                virObjectUnref(caps);
                caps = NULL;
            }
        }
    }

    VIR_DEBUG("Returning caps %p for %s", caps, binary);
    virObjectRef(caps);
    virMutexUnlock(&cache->lock);
    return caps;
}


3506 3507
/**
 * virQEMUCapsCacheLookupCopy:
 * @cache: capabilities cache
 * @binary: path to the QEMU binary
 *
 * Looks up @binary in @cache and returns the result of
 * virQEMUCapsNewCopy() on the entry; the looked-up reference is
 * released again.
 *
 * Returns the copy, or NULL when the lookup failed.
 */
virQEMUCapsPtr
virQEMUCapsCacheLookupCopy(virQEMUCapsCachePtr cache, const char *binary)
{
    virQEMUCapsPtr cached = virQEMUCapsCacheLookup(cache, binary);
    virQEMUCapsPtr copy = NULL;

    if (cached) {
        copy = virQEMUCapsNewCopy(cached);
        virObjectUnref(cached);
    }

    return copy;
}


3521 3522 3523 3524 3525 3526 3527 3528 3529 3530 3531 3532 3533 3534 3535 3536 3537 3538 3539 3540 3541 3542 3543 3544 3545 3546 3547 3548 3549
/* Hash search callback: non-zero when the capabilities in @payload
 * have the architecture requested in the search data @opaque. */
static int
virQEMUCapsCompareArch(const void *payload,
                       const void *name ATTRIBUTE_UNUSED,
                       const void *opaque)
{
    const struct virQEMUCapsSearchData *wanted = opaque;
    const virQEMUCaps *candidate = payload;

    return candidate->arch == wanted->arch;
}


/**
 * virQEMUCapsCacheLookupByArch:
 * @cache: capabilities cache
 * @arch: architecture to search for
 *
 * Searches the cached binaries, under the cache lock, for an entry
 * whose architecture equals @arch.
 *
 * Returns the entry found after virObjectRef() was called on it, or
 * NULL when nothing matches.
 */
virQEMUCapsPtr
virQEMUCapsCacheLookupByArch(virQEMUCapsCachePtr cache,
                             virArch arch)
{
    struct virQEMUCapsSearchData data = { .arch = arch };
    virQEMUCapsPtr match = NULL;

    virMutexLock(&cache->lock);
    match = virHashSearch(cache->binaries, virQEMUCapsCompareArch, &data);
    VIR_DEBUG("Returning caps %p for arch %s", match, virArchToString(arch));
    virObjectRef(match);
    virMutexUnlock(&cache->lock);

    return match;
}


3550
void
3551
virQEMUCapsCacheFree(virQEMUCapsCachePtr cache)
3552 3553 3554 3555
{
    if (!cache)
        return;

3556
    VIR_FREE(cache->libDir);
3557
    VIR_FREE(cache->cacheDir);
3558 3559 3560 3561
    virHashFree(cache->binaries);
    virMutexDestroy(&cache->lock);
    VIR_FREE(cache);
}
3562 3563

bool
3564
virQEMUCapsUsedQMP(virQEMUCapsPtr qemuCaps)
3565
{
3566
    return qemuCaps->usedQMP;
3567
}
3568 3569 3570 3571

bool
virQEMUCapsSupportsChardev(virDomainDefPtr def,
                           virQEMUCapsPtr qemuCaps,
3572
                           virDomainChrDefPtr chr)
3573 3574 3575 3576 3577
{
    if (!virQEMUCapsGet(qemuCaps, QEMU_CAPS_CHARDEV) ||
        !virQEMUCapsGet(qemuCaps, QEMU_CAPS_DEVICE))
        return false;

3578 3579 3580 3581 3582 3583
    if ((def->os.arch == VIR_ARCH_PPC) || (def->os.arch == VIR_ARCH_PPC64)) {
        /* only pseries need -device spapr-vty with -chardev */
        return (chr->deviceType == VIR_DOMAIN_CHR_DEVICE_TYPE_SERIAL &&
                chr->info.type == VIR_DOMAIN_DEVICE_ADDRESS_TYPE_SPAPRVIO);
    }

3584
    if ((def->os.arch != VIR_ARCH_ARMV7L) && (def->os.arch != VIR_ARCH_AARCH64))
3585
        return true;
3586

3587 3588 3589 3590 3591 3592
    /* This may not be true for all ARM machine types, but at least
     * the only supported non-virtio serial devices of vexpress and versatile
     * don't have the -chardev property wired up. */
    return (chr->info.type == VIR_DOMAIN_DEVICE_ADDRESS_TYPE_VIRTIO_MMIO ||
            (chr->deviceType == VIR_DOMAIN_CHR_DEVICE_TYPE_CONSOLE &&
             chr->targetType == VIR_DOMAIN_CHR_CONSOLE_TARGET_TYPE_VIRTIO));
3593
}
3594 3595 3596 3597 3598 3599 3600 3601 3602 3603 3604 3605 3606 3607


/**
 * virQEMUCapsIsMachineSupported:
 * @qemuCaps: QEMU capabilities
 * @canonical_machine: machine type name to look for
 *
 * Returns true when @canonical_machine equals one of the machine type
 * names stored in @qemuCaps, false otherwise.
 */
bool
virQEMUCapsIsMachineSupported(virQEMUCapsPtr qemuCaps,
                              const char *canonical_machine)
{
    size_t idx = 0;

    while (idx < qemuCaps->nmachineTypes) {
        if (STREQ(canonical_machine, qemuCaps->machineTypes[idx]))
            return true;
        idx++;
    }

    return false;
}
3608 3609 3610 3611 3612 3613 3614 3615 3616


/**
 * virQEMUCapsGetDefaultMachine:
 * @qemuCaps: QEMU capabilities holding the machine type list
 *
 * Returns the first entry of the machineTypes array of @qemuCaps, or
 * NULL when the array is empty (nmachineTypes is zero).
 */
const char *
virQEMUCapsGetDefaultMachine(virQEMUCapsPtr qemuCaps)
{
    return qemuCaps->nmachineTypes ? qemuCaps->machineTypes[0] : NULL;
}
3617 3618


3619
static int
3620
virQEMUCapsFillDomainLoaderCaps(virQEMUCapsPtr qemuCaps,
3621
                                virDomainCapsLoaderPtr capsLoader,
3622
                                virArch arch,
3623 3624
                                char **loader,
                                size_t nloader)
3625
{
3626 3627
    size_t i;

3628
    capsLoader->device.supported = true;
3629

3630
    if (VIR_ALLOC_N(capsLoader->values.values, nloader) < 0)
3631 3632
        return -1;

3633 3634
    for (i = 0; i < nloader; i++) {
        const char *filename = loader[i];
3635 3636 3637 3638 3639 3640

        if (!virFileExists(filename)) {
            VIR_DEBUG("loader filename=%s does not exist", filename);
            continue;
        }

3641
        if (VIR_STRDUP(capsLoader->values.values[capsLoader->values.nvalues],
3642 3643
                       filename) < 0)
            return -1;
3644
        capsLoader->values.nvalues++;
3645 3646
    }

3647
    VIR_DOMAIN_CAPS_ENUM_SET(capsLoader->type,
3648 3649 3650 3651 3652
                             VIR_DOMAIN_LOADER_TYPE_ROM);

    if (arch == VIR_ARCH_X86_64 &&
        virQEMUCapsGet(qemuCaps, QEMU_CAPS_DRIVE) &&
        virQEMUCapsGet(qemuCaps, QEMU_CAPS_DRIVE_FORMAT))
3653
        VIR_DOMAIN_CAPS_ENUM_SET(capsLoader->type,
3654 3655 3656 3657
                                 VIR_DOMAIN_LOADER_TYPE_PFLASH);


    if (virQEMUCapsGet(qemuCaps, QEMU_CAPS_DRIVE_READONLY))
3658
        VIR_DOMAIN_CAPS_ENUM_SET(capsLoader->readonly,
3659 3660
                                 VIR_TRISTATE_BOOL_YES,
                                 VIR_TRISTATE_BOOL_NO);
3661
    return 0;
3662 3663 3664
}


3665
static int
3666 3667
virQEMUCapsFillDomainOSCaps(virQEMUCapsPtr qemuCaps,
                            virDomainCapsOSPtr os,
3668
                            virArch arch,
3669 3670
                            char **loader,
                            size_t nloader)
3671
{
3672
    virDomainCapsLoaderPtr capsLoader = &os->loader;
3673 3674

    os->device.supported = true;
3675 3676
    if (virQEMUCapsFillDomainLoaderCaps(qemuCaps, capsLoader, arch,
                                        loader, nloader) < 0)
3677 3678
        return -1;
    return 0;
3679 3680 3681
}


3682
static int
3683 3684 3685 3686 3687 3688 3689 3690 3691 3692 3693 3694 3695 3696 3697 3698 3699 3700 3701 3702 3703 3704
virQEMUCapsFillDomainDeviceDiskCaps(virQEMUCapsPtr qemuCaps,
                                    virDomainCapsDeviceDiskPtr disk)
{
    disk->device.supported = true;
    /* QEMU supports all of these */
    VIR_DOMAIN_CAPS_ENUM_SET(disk->diskDevice,
                             VIR_DOMAIN_DISK_DEVICE_DISK,
                             VIR_DOMAIN_DISK_DEVICE_CDROM,
                             VIR_DOMAIN_DISK_DEVICE_FLOPPY);

    if (virQEMUCapsGet(qemuCaps, QEMU_CAPS_VIRTIO_BLK_SG_IO))
        VIR_DOMAIN_CAPS_ENUM_SET(disk->diskDevice, VIR_DOMAIN_DISK_DEVICE_LUN);

    VIR_DOMAIN_CAPS_ENUM_SET(disk->bus,
                             VIR_DOMAIN_DISK_BUS_IDE,
                             VIR_DOMAIN_DISK_BUS_FDC,
                             VIR_DOMAIN_DISK_BUS_SCSI,
                             VIR_DOMAIN_DISK_BUS_VIRTIO,
                             /* VIR_DOMAIN_DISK_BUS_SD */);

    if (virQEMUCapsGet(qemuCaps, QEMU_CAPS_DEVICE_USB_STORAGE))
        VIR_DOMAIN_CAPS_ENUM_SET(disk->bus, VIR_DOMAIN_DISK_BUS_USB);
3705
    return 0;
3706 3707 3708
}


3709
static int
3710 3711 3712 3713 3714 3715 3716 3717 3718 3719 3720 3721 3722 3723 3724 3725 3726 3727 3728 3729 3730 3731 3732 3733 3734 3735 3736 3737 3738 3739 3740 3741 3742 3743 3744 3745 3746 3747 3748 3749 3750 3751 3752 3753
virQEMUCapsFillDomainDeviceHostdevCaps(virQEMUCapsPtr qemuCaps,
                                       virDomainCapsDeviceHostdevPtr hostdev)
{
    bool supportsPassthroughKVM = qemuHostdevHostSupportsPassthroughLegacy();
    bool supportsPassthroughVFIO = qemuHostdevHostSupportsPassthroughVFIO();

    hostdev->device.supported = true;
    /* VIR_DOMAIN_HOSTDEV_MODE_CAPABILITIES is for containers only */
    VIR_DOMAIN_CAPS_ENUM_SET(hostdev->mode,
                             VIR_DOMAIN_HOSTDEV_MODE_SUBSYS);

    VIR_DOMAIN_CAPS_ENUM_SET(hostdev->startupPolicy,
                             VIR_DOMAIN_STARTUP_POLICY_DEFAULT,
                             VIR_DOMAIN_STARTUP_POLICY_MANDATORY,
                             VIR_DOMAIN_STARTUP_POLICY_REQUISITE,
                             VIR_DOMAIN_STARTUP_POLICY_OPTIONAL);

    VIR_DOMAIN_CAPS_ENUM_SET(hostdev->subsysType,
                             VIR_DOMAIN_HOSTDEV_SUBSYS_TYPE_USB,
                             VIR_DOMAIN_HOSTDEV_SUBSYS_TYPE_PCI);
    if (virQEMUCapsGet(qemuCaps, QEMU_CAPS_DRIVE) &&
        virQEMUCapsGet(qemuCaps, QEMU_CAPS_DEVICE) &&
        virQEMUCapsGet(qemuCaps, QEMU_CAPS_DEVICE_SCSI_GENERIC))
        VIR_DOMAIN_CAPS_ENUM_SET(hostdev->subsysType,
                                 VIR_DOMAIN_HOSTDEV_SUBSYS_TYPE_SCSI);

    /* No virDomainHostdevCapsType for QEMU */
    virDomainCapsEnumClear(&hostdev->capsType);

    virDomainCapsEnumClear(&hostdev->pciBackend);
    if (supportsPassthroughVFIO &&
        virQEMUCapsGet(qemuCaps, QEMU_CAPS_DEVICE_VFIO_PCI)) {
        VIR_DOMAIN_CAPS_ENUM_SET(hostdev->pciBackend,
                                 VIR_DOMAIN_HOSTDEV_PCI_BACKEND_DEFAULT,
                                 VIR_DOMAIN_HOSTDEV_PCI_BACKEND_VFIO);
    }

    if (supportsPassthroughKVM &&
        (virQEMUCapsGet(qemuCaps, QEMU_CAPS_PCIDEVICE) ||
         virQEMUCapsGet(qemuCaps, QEMU_CAPS_DEVICE))) {
        VIR_DOMAIN_CAPS_ENUM_SET(hostdev->pciBackend,
                                 VIR_DOMAIN_HOSTDEV_PCI_BACKEND_DEFAULT,
                                 VIR_DOMAIN_HOSTDEV_PCI_BACKEND_KVM);
    }
3754
    return 0;
3755 3756 3757
}


3758
int
3759
virQEMUCapsFillDomainCaps(virDomainCapsPtr domCaps,
3760
                          virQEMUCapsPtr qemuCaps,
3761 3762
                          char **loader,
                          size_t nloader)
3763
{
3764
    virDomainCapsOSPtr os = &domCaps->os;
3765 3766 3767 3768 3769 3770
    virDomainCapsDeviceDiskPtr disk = &domCaps->disk;
    virDomainCapsDeviceHostdevPtr hostdev = &domCaps->hostdev;
    int maxvcpus = virQEMUCapsGetMachineMaxCpus(qemuCaps, domCaps->machine);

    domCaps->maxvcpus = maxvcpus;

3771 3772
    if (virQEMUCapsFillDomainOSCaps(qemuCaps, os, domCaps->arch,
                                    loader, nloader) < 0 ||
3773 3774 3775 3776
        virQEMUCapsFillDomainDeviceDiskCaps(qemuCaps, disk) < 0 ||
        virQEMUCapsFillDomainDeviceHostdevCaps(qemuCaps, hostdev) < 0)
        return -1;
    return 0;
3777
}