/*
 * qemu_capabilities.c: QEMU capabilities generation
 *
 * Copyright (C) 2006-2013 Red Hat, Inc.
 * Copyright (C) 2006 Daniel P. Berrange
 *
 * This library is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * This library is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with this library.  If not, see
 * <http://www.gnu.org/licenses/>.
 *
 * Author: Daniel P. Berrange <berrange@redhat.com>
 */

#include <config.h>

#include "qemu_capabilities.h"
27
#include "viralloc.h"
28
#include "virlog.h"
29
#include "virerror.h"
E
Eric Blake 已提交
30
#include "virfile.h"
31 32
#include "virpidfile.h"
#include "virprocess.h"
33 34 35
#include "nodeinfo.h"
#include "cpu/cpu.h"
#include "domain_conf.h"
36
#include "vircommand.h"
37
#include "virbitmap.h"
38
#include "virnodesuspend.h"
39
#include "qemu_monitor.h"
40
#include "virstring.h"
41

42
#include <fcntl.h>
43 44 45
#include <sys/stat.h>
#include <unistd.h>
#include <sys/wait.h>
46
#include <stdarg.h>
47 48 49

#define VIR_FROM_THIS VIR_FROM_QEMU

50 51 52 53
/* While not public, these strings must not change: they are
 * written to domain status files, which are read back when
 * the daemon restarts.
 */
54
VIR_ENUM_IMPL(virQEMUCaps, QEMU_CAPS_LAST,
55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91
              "kqemu",  /* 0 */
              "vnc-colon",
              "no-reboot",
              "drive",
              "drive-boot",

              "name", /* 5 */
              "uuid",
              "domid",
              "vnet-hdr",
              "migrate-kvm-stdio",

              "migrate-qemu-tcp", /* 10 */
              "migrate-qemu-exec",
              "drive-cache-v2",
              "kvm",
              "drive-format",

              "vga", /* 15 */
              "0.10",
              "pci-device",
              "mem-path",
              "drive-serial",

              "xen-domid", /* 20 */
              "migrate-qemu-unix",
              "chardev",
              "enable-kvm",
              "monitor-json",

              "balloon", /* 25 */
              "device",
              "sdl",
              "smp-topology",
              "netdev",

              "rtc", /* 30 */
92
              "vhost-net",
93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125
              "rtc-td-hack",
              "no-hpet",
              "no-kvm-pit",

              "tdf", /* 35 */
              "pci-configfd",
              "nodefconfig",
              "boot-menu",
              "enable-kqemu",

              "fsdev", /* 40 */
              "nesting",
              "name-process",
              "drive-readonly",
              "smbios-type",

              "vga-qxl", /* 45 */
              "spice",
              "vga-none",
              "migrate-qemu-fd",
              "boot-index",

              "hda-duplex", /* 50 */
              "drive-aio",
              "pci-multibus",
              "pci-bootindex",
              "ccid-emulated",

              "ccid-passthru", /* 55 */
              "chardev-spicevmc",
              "device-spicevmc",
              "virtio-tx-alg",
              "device-qxl-vga",
126 127

              "pci-multifunction", /* 60 */
128
              "virtio-blk-pci.ioeventfd",
M
Michal Privoznik 已提交
129
              "sga",
130 131
              "virtio-blk-pci.event_idx",
              "virtio-net-pci.event_idx",
132 133 134 135 136 137 138 139 140 141

              "cache-directsync", /* 65 */
              "piix3-usb-uhci",
              "piix4-usb-uhci",
              "usb-ehci",
              "ich9-usb-ehci1",

              "vt82c686b-usb-uhci", /* 70 */
              "pci-ohci",
              "usb-redir",
M
Marc-André Lureau 已提交
142
              "usb-hub",
143
              "no-shutdown",
144 145

              "cache-unsafe", /* 75 */
146
              "rombar",
J
Jim Fehlig 已提交
147
              "ich9-ahci",
148
              "no-acpi",
149
              "fsdev-readonly",
150

151
              "virtio-blk-pci.scsi", /* 80 */
152
              "blk-sg-io",
O
Osier Yang 已提交
153
              "drive-copy-on-read",
154
              "cpu-host",
155
              "fsdev-writeout",
156 157

              "drive-iotune", /* 85 */
158
              "system_wakeup",
159
              "scsi-disk.channel",
160
              "scsi-block",
161
              "transaction",
162 163 164

              "block-job-sync", /* 90 */
              "block-job-async",
165
              "scsi-cd",
166
              "ide-cd",
167
              "no-user-config",
M
Marc-André Lureau 已提交
168 169

              "hda-micro", /* 95 */
170
              "dump-guest-memory",
G
Gerd Hoffmann 已提交
171
              "nec-usb-xhci",
172
              "virtio-s390",
173
              "balloon-event",
M
Marc-André Lureau 已提交
174

R
Richa Marwaha 已提交
175
              "bridge", /* 100 */
176 177
              "lsi",
              "virtio-scsi-pci",
V
Viktor Mihajlovski 已提交
178
              "blockio",
179
              "disable-s3",
R
Richa Marwaha 已提交
180

181
              "disable-s4", /* 105 */
182
              "usb-redir.filter",
183 184
              "ide-drive.wwn",
              "scsi-disk.wwn",
185
              "seccomp-sandbox",
186 187

              "reboot-timeout", /* 110 */
188
              "dump-guest-core",
189
              "seamless-migration",
190
              "block-commit",
191
              "vnc",
192 193

              "drive-mirror", /* 115 */
194 195
              "usb-redir.bootindex",
              "usb-host.bootindex",
196
              "blockdev-snapshot-sync",
197 198 199 200 201 202
              "qxl",

              "VGA", /* 120 */
              "cirrus-vga",
              "vmware-svga",
              "device-video-primary",
203
              "s390-sclp",
204 205

              "usb-serial", /* 125 */
G
Guannan Ren 已提交
206
              "usb-net",
207
              "add-fd",
208
              "nbd-server",
209 210 211
              "virtio-rng",

              "rng-random", /* 130 */
212
              "rng-egd",
O
Olivia Yin 已提交
213 214
              "virtio-ccw",
              "dtb",
215
              "megasas",
J
Ján Tomko 已提交
216 217

              "ipv6-migration", /* 135 */
218
              "machine-opt",
L
Li Zhang 已提交
219
              "machine-usb-opt",
S
Stefan Berger 已提交
220 221
              "tpm-passthrough",
              "tpm-tis",
222 223

              "nvram",  /* 140 */
H
Han Cheng 已提交
224 225 226 227 228 229
              "pci-bridge",
              "vfio-pci",
              "vfio-pci.bootindex",
              "scsi-generic",

              "scsi-generic.bootindex", /* 145 */
230
              "mem-merge",
231
              "vnc-websocket",
O
Osier Yang 已提交
232
              "drive-discard",
233
              "mlock",
234 235

              "vnc-share-policy", /* 150 */
236
              "device-del-event",
237 238
    );

239
struct _virQEMUCaps {
240 241
    virObject object;

242 243
    bool usedQMP;

244 245 246
    char *binary;
    time_t mtime;

247
    virBitmapPtr flags;
248 249 250 251

    unsigned int version;
    unsigned int kvmVersion;

252
    virArch arch;
253 254 255 256 257 258 259

    size_t ncpuDefinitions;
    char **cpuDefinitions;

    size_t nmachineTypes;
    char **machineTypes;
    char **machineAliases;
260
    unsigned int *machineMaxCpus;
261 262
};

263
struct _virQEMUCapsCache {
264 265
    virMutex lock;
    virHashTablePtr binaries;
266
    char *libDir;
267
    char *runDir;
268 269
    uid_t runUid;
    gid_t runGid;
270 271
};

272

273 274
static virClassPtr virQEMUCapsClass;
static void virQEMUCapsDispose(void *obj);
275

276
static int virQEMUCapsOnceInit(void)
277
{
278 279 280 281
    if (!(virQEMUCapsClass = virClassNew(virClassForObject(),
                                         "virQEMUCaps",
                                         sizeof(virQEMUCaps),
                                         virQEMUCapsDispose)))
282 283 284 285 286
        return -1;

    return 0;
}

287
VIR_ONCE_GLOBAL_INIT(virQEMUCaps)
288

289
static virArch virQEMUCapsArchFromString(const char *arch)
290 291 292 293 294 295 296 297 298 299
{
    if (STREQ(arch, "i386"))
        return VIR_ARCH_I686;
    if (STREQ(arch, "arm"))
        return VIR_ARCH_ARMV7L;

    return virArchFromString(arch);
}


300
/* Inverse of virQEMUCapsArchFromString(): i686 becomes "i386" and
 * armv7l becomes "arm"; everything else is formatted by
 * virArchToString().
 */
static const char *virQEMUCapsArchToString(virArch arch)
{
    switch (arch) {
    case VIR_ARCH_I686:
        return "i386";
    case VIR_ARCH_ARMV7L:
        return "arm";
    default:
        return virArchToString(arch);
    }
}


311
static virCommandPtr
312 313
virQEMUCapsProbeCommand(const char *qemu,
                        virQEMUCapsPtr qemuCaps,
314
                        uid_t runUid, gid_t runGid)
315 316 317
{
    virCommandPtr cmd = virCommandNew(qemu);

318 319
    if (qemuCaps) {
        if (virQEMUCapsGet(qemuCaps, QEMU_CAPS_NO_USER_CONFIG))
320
            virCommandAddArg(cmd, "-no-user-config");
321
        else if (virQEMUCapsGet(qemuCaps, QEMU_CAPS_NODEFCONFIG))
322 323 324 325 326
            virCommandAddArg(cmd, "-nodefconfig");
    }

    virCommandAddEnvPassCommon(cmd);
    virCommandClearCaps(cmd);
327 328
    virCommandSetGID(cmd, runGid);
    virCommandSetUID(cmd, runUid);
329 330 331 332 333

    return cmd;
}


334
static void
335 336
virQEMUCapsSetDefaultMachine(virQEMUCapsPtr qemuCaps,
                             size_t defIdx)
337
{
338 339
    char *name = qemuCaps->machineTypes[defIdx];
    char *alias = qemuCaps->machineAliases[defIdx];
340
    unsigned int maxCpus = qemuCaps->machineMaxCpus[defIdx];
341 342 343 344 345 346 347

    memmove(qemuCaps->machineTypes + 1,
            qemuCaps->machineTypes,
            sizeof(qemuCaps->machineTypes[0]) * defIdx);
    memmove(qemuCaps->machineAliases + 1,
            qemuCaps->machineAliases,
            sizeof(qemuCaps->machineAliases[0]) * defIdx);
348 349 350
    memmove(qemuCaps->machineMaxCpus + 1,
            qemuCaps->machineMaxCpus,
            sizeof(qemuCaps->machineMaxCpus[0]) * defIdx);
351 352
    qemuCaps->machineTypes[0] = name;
    qemuCaps->machineAliases[0] = alias;
353
    qemuCaps->machineMaxCpus[0] = maxCpus;
354 355
}

356 357 358 359
/* Format is:
 * <machine> <desc> [(default)|(alias of <canonical>)]
 */
static int
360 361
virQEMUCapsParseMachineTypesStr(const char *output,
                                virQEMUCapsPtr qemuCaps)
362 363 364
{
    const char *p = output;
    const char *next;
365
    size_t defIdx = 0;
366 367 368

    do {
        const char *t;
369 370
        char *name;
        char *canonical = NULL;
371 372 373 374 375 376 377 378 379 380

        if ((next = strchr(p, '\n')))
            ++next;

        if (STRPREFIX(p, "Supported machines are:"))
            continue;

        if (!(t = strchr(p, ' ')) || (next && t >= next))
            continue;

381 382
        if (VIR_STRNDUP(name, p, t - p) < 0)
            return -1;
383 384

        p = t;
385
        if ((t = strstr(p, "(default)")) && (!next || t < next))
386
            defIdx = qemuCaps->nmachineTypes;
387 388 389 390 391 392

        if ((t = strstr(p, "(alias of ")) && (!next || t < next)) {
            p = t + strlen("(alias of ");
            if (!(t = strchr(p, ')')) || (next && t >= next))
                continue;

393
            if (VIR_STRNDUP(canonical, p, t - p) < 0) {
394
                VIR_FREE(name);
395
                return -1;
396 397 398
            }
        }

399
        if (VIR_REALLOC_N(qemuCaps->machineTypes, qemuCaps->nmachineTypes + 1) < 0 ||
400 401
            VIR_REALLOC_N(qemuCaps->machineAliases, qemuCaps->nmachineTypes + 1) < 0 ||
            VIR_REALLOC_N(qemuCaps->machineMaxCpus, qemuCaps->nmachineTypes + 1) < 0) {
402 403
            VIR_FREE(name);
            VIR_FREE(canonical);
404
            return -1;
405
        }
406
        qemuCaps->nmachineTypes++;
407
        if (canonical) {
408 409
            qemuCaps->machineTypes[qemuCaps->nmachineTypes-1] = canonical;
            qemuCaps->machineAliases[qemuCaps->nmachineTypes-1] = name;
410
        } else {
411 412
            qemuCaps->machineTypes[qemuCaps->nmachineTypes-1] = name;
            qemuCaps->machineAliases[qemuCaps->nmachineTypes-1] = NULL;
413
        }
414 415
        /* When parsing from command line we don't have information about maxCpus */
        qemuCaps->machineMaxCpus[qemuCaps->nmachineTypes-1] = 0;
416 417
    } while ((p = next));

418

419
    if (defIdx)
420
        virQEMUCapsSetDefaultMachine(qemuCaps, defIdx);
421 422 423 424

    return 0;
}

425
static int
426 427
virQEMUCapsProbeMachineTypes(virQEMUCapsPtr qemuCaps,
                             uid_t runUid, gid_t runGid)
428 429
{
    char *output;
430 431
    int ret = -1;
    virCommandPtr cmd;
432
    int status;
433

434 435 436 437
    /* Make sure the binary we are about to try exec'ing exists.
     * Technically we could catch the exec() failure, but that's
     * in a sub-process so it's hard to feed back a useful error.
     */
438
    if (!virFileIsExecutable(qemuCaps->binary)) {
439
        virReportSystemError(errno, _("Cannot find QEMU binary %s"),
440
                             qemuCaps->binary);
441 442 443
        return -1;
    }

444
    cmd = virQEMUCapsProbeCommand(qemuCaps->binary, qemuCaps, runUid, runGid);
445
    virCommandAddArgList(cmd, "-M", "?", NULL);
446
    virCommandSetOutputBuffer(cmd, &output);
447

448 449
    /* Ignore failure from older qemu that did not understand '-M ?'.  */
    if (virCommandRun(cmd, &status) < 0)
450 451
        goto cleanup;

452
    if (virQEMUCapsParseMachineTypesStr(output, qemuCaps) < 0)
453
        goto cleanup;
454 455 456 457

    ret = 0;

cleanup:
458 459
    VIR_FREE(output);
    virCommandFree(cmd);
460 461 462 463 464 465

    return ret;
}


typedef int
466 467
(*virQEMUCapsParseCPUModels)(const char *output,
                             virQEMUCapsPtr qemuCaps);
468 469 470 471 472 473 474

/* Format:
 *      <arch> <model>
 * qemu-0.13 encloses some model names in []:
 *      <arch> [<model>]
 */
static int
475 476
virQEMUCapsParseX86Models(const char *output,
                          virQEMUCapsPtr qemuCaps)
477 478 479
{
    const char *p = output;
    const char *next;
480
    int ret = -1;
481 482 483

    do {
        const char *t;
484
        size_t len;
485 486 487 488 489 490 491 492 493 494 495 496 497 498 499 500 501

        if ((next = strchr(p, '\n')))
            next++;

        if (!(t = strchr(p, ' ')) || (next && t >= next))
            continue;

        if (!STRPREFIX(p, "x86"))
            continue;

        p = t;
        while (*p == ' ')
            p++;

        if (*p == '\0' || *p == '\n')
            continue;

502
        if (VIR_EXPAND_N(qemuCaps->cpuDefinitions, qemuCaps->ncpuDefinitions, 1) < 0)
503
            goto cleanup;
504

505 506 507 508
        if (next)
            len = next - p - 1;
        else
            len = strlen(p);
509

510 511 512 513
        if (len > 2 && *p == '[' && p[len - 1] == ']') {
            p++;
            len -= 2;
        }
514

515
        if (VIR_STRNDUP(qemuCaps->cpuDefinitions[qemuCaps->ncpuDefinitions - 1], p, len) < 0)
516
            goto cleanup;
517 518
    } while ((p = next));

519
    ret = 0;
520

521 522
cleanup:
    return ret;
523 524
}

P
Prerna Saxena 已提交
525 526 527 528
/* ppc64 parser.
 * Format : PowerPC <machine> <description>
 */
static int
529 530
virQEMUCapsParsePPCModels(const char *output,
                          virQEMUCapsPtr qemuCaps)
P
Prerna Saxena 已提交
531 532 533
{
    const char *p = output;
    const char *next;
534
    int ret = -1;
P
Prerna Saxena 已提交
535 536 537

    do {
        const char *t;
538
        size_t len;
P
Prerna Saxena 已提交
539 540 541 542 543 544 545 546 547 548 549 550 551 552 553 554 555 556 557 558

        if ((next = strchr(p, '\n')))
            next++;

        if (!STRPREFIX(p, "PowerPC "))
            continue;

        /* Skip the preceding sub-string "PowerPC " */
        p += 8;

        /*Malformed string, does not obey the format 'PowerPC <model> <desc>'*/
        if (!(t = strchr(p, ' ')) || (next && t >= next))
            continue;

        if (*p == '\0')
            break;

        if (*p == '\n')
            continue;

559
        if (VIR_EXPAND_N(qemuCaps->cpuDefinitions, qemuCaps->ncpuDefinitions, 1) < 0)
560
            goto cleanup;
P
Prerna Saxena 已提交
561

562
        len = t - p - 1;
P
Prerna Saxena 已提交
563

564
        if (VIR_STRNDUP(qemuCaps->cpuDefinitions[qemuCaps->ncpuDefinitions - 1], p, len) < 0)
565
            goto cleanup;
P
Prerna Saxena 已提交
566 567
    } while ((p = next));

568
    ret = 0;
P
Prerna Saxena 已提交
569

570 571
cleanup:
    return ret;
P
Prerna Saxena 已提交
572
}
573

574
static int
575
virQEMUCapsProbeCPUModels(virQEMUCapsPtr qemuCaps, uid_t runUid, gid_t runGid)
576 577 578
{
    char *output = NULL;
    int ret = -1;
579
    virQEMUCapsParseCPUModels parse;
580
    virCommandPtr cmd;
581

582 583 584 585 586
    if (qemuCaps->arch == VIR_ARCH_I686 ||
        qemuCaps->arch == VIR_ARCH_X86_64)
        parse = virQEMUCapsParseX86Models;
    else if (qemuCaps->arch == VIR_ARCH_PPC64)
        parse = virQEMUCapsParsePPCModels;
587
    else {
588
        VIR_DEBUG("don't know how to parse %s CPU models",
589
                  virArchToString(qemuCaps->arch));
590 591 592
        return 0;
    }

593
    cmd = virQEMUCapsProbeCommand(qemuCaps->binary, qemuCaps, runUid, runGid);
594
    virCommandAddArgList(cmd, "-cpu", "?", NULL);
595
    virCommandSetOutputBuffer(cmd, &output);
596

597
    if (virCommandRun(cmd, NULL) < 0)
598 599
        goto cleanup;

600
    if (parse(output, qemuCaps) < 0)
601 602 603 604 605 606
        goto cleanup;

    ret = 0;

cleanup:
    VIR_FREE(output);
607
    virCommandFree(cmd);
608 609 610 611 612

    return ret;
}


613
static char *
614 615
virQEMUCapsFindBinaryForArch(virArch hostarch,
                             virArch guestarch)
616 617
{
    char *ret;
618
    const char *archstr = virQEMUCapsArchToString(guestarch);
619
    char *binary;
620

621
    if (virAsprintf(&binary, "qemu-system-%s", archstr) < 0)
622 623 624 625 626 627 628 629 630 631 632
        return NULL;

    ret = virFindFileInPath(binary);
    VIR_FREE(binary);
    if (ret && !virFileIsExecutable(ret))
        VIR_FREE(ret);

    if (guestarch == VIR_ARCH_I686 &&
        !ret &&
        hostarch == VIR_ARCH_X86_64) {
        ret = virFindFileInPath("qemu-system-x86_64");
633 634
        if (ret && !virFileIsExecutable(ret))
            VIR_FREE(ret);
635
    }
636

637 638 639 640 641
    if (guestarch == VIR_ARCH_I686 &&
        !ret) {
        ret = virFindFileInPath("qemu");
        if (ret && !virFileIsExecutable(ret))
            VIR_FREE(ret);
642
    }
643

644 645 646 647 648
    return ret;
}


static bool
649 650
virQEMUCapsIsValidForKVM(virArch hostarch,
                         virArch guestarch)
651
{
652
    if (hostarch == guestarch)
653
        return true;
654 655
    if (hostarch == VIR_ARCH_X86_64 &&
        guestarch == VIR_ARCH_I686)
656 657 658 659
        return true;
    return false;
}

660
static int
661 662 663 664
virQEMUCapsInitGuest(virCapsPtr caps,
                     virQEMUCapsCachePtr cache,
                     virArch hostarch,
                     virArch guestarch)
665 666
{
    virCapsGuestPtr guest;
667
    size_t i;
668 669
    bool haskvm = false;
    bool haskqemu = false;
670 671 672
    char *kvmbin = NULL;
    char *binary = NULL;
    virCapsGuestMachinePtr *machines = NULL;
673
    size_t nmachines = 0;
674 675
    virQEMUCapsPtr qemubinCaps = NULL;
    virQEMUCapsPtr kvmbinCaps = NULL;
676 677
    int ret = -1;

J
Ján Tomko 已提交
678
    /* Check for existence of base emulator, or alternate base
679 680
     * which can be used with magic cpu choice
     */
681
    binary = virQEMUCapsFindBinaryForArch(hostarch, guestarch);
682

683
    /* Ignore binary if extracting version info fails */
684
    if (binary) {
685
        if (!(qemubinCaps = virQEMUCapsCacheLookup(cache, binary))) {
686 687 688 689
            virResetLastError();
            VIR_FREE(binary);
        }
    }
690 691

    /* qemu-kvm/kvm binaries can only be used if
692 693 694 695 696
     *  - host & guest arches match
     * Or
     *  - hostarch is x86_64 and guest arch is i686
     * The latter simply needs "-cpu qemu32"
     */
697
    if (virQEMUCapsIsValidForKVM(hostarch, guestarch)) {
698 699 700
        const char *const kvmbins[] = { "/usr/libexec/qemu-kvm", /* RHEL */
                                        "qemu-kvm", /* Fedora */
                                        "kvm" }; /* Upstream .spec */
701

702 703
        for (i = 0; i < ARRAY_CARDINALITY(kvmbins); ++i) {
            kvmbin = virFindFileInPath(kvmbins[i]);
704

705 706
            if (!kvmbin)
                continue;
707

708
            if (!(kvmbinCaps = virQEMUCapsCacheLookup(cache, kvmbin))) {
709
                virResetLastError();
710 711 712
                VIR_FREE(kvmbin);
                continue;
            }
713

714 715
            if (!binary) {
                binary = kvmbin;
716
                qemubinCaps = kvmbinCaps;
717
                kvmbin = NULL;
718
                kvmbinCaps = NULL;
719
            }
720
            break;
721 722 723 724 725 726
        }
    }

    if (!binary)
        return 0;

727
    if (access("/dev/kvm", F_OK) == 0 &&
728 729
        (virQEMUCapsGet(qemubinCaps, QEMU_CAPS_KVM) ||
         virQEMUCapsGet(qemubinCaps, QEMU_CAPS_ENABLE_KVM) ||
730
         kvmbin))
731
        haskvm = true;
732 733

    if (access("/dev/kqemu", F_OK) == 0 &&
734
        virQEMUCapsGet(qemubinCaps, QEMU_CAPS_KQEMU))
735
        haskqemu = true;
J
Jiri Denemark 已提交
736

737
    if (virQEMUCapsGetMachineTypesCaps(qemubinCaps, &nmachines, &machines) < 0)
D
Daniel P. Berrange 已提交
738
        goto error;
739 740 741 742

    /* We register kvm as the base emulator too, since we can
     * just give -no-kvm to disable acceleration if required */
    if ((guest = virCapabilitiesAddGuest(caps,
D
Daniel P. Berrange 已提交
743
                                         "hvm",
744
                                         guestarch,
745 746 747 748 749 750 751 752 753 754
                                         binary,
                                         NULL,
                                         nmachines,
                                         machines)) == NULL)
        goto error;

    machines = NULL;
    nmachines = 0;

    if (caps->host.cpu &&
J
Jiri Denemark 已提交
755
        caps->host.cpu->model &&
756
        virQEMUCapsGetCPUDefinitions(qemubinCaps, NULL) > 0 &&
757 758 759
        !virCapabilitiesAddGuestFeature(guest, "cpuselection", 1, 0))
        goto error;

760
    if (virQEMUCapsGet(qemubinCaps, QEMU_CAPS_BOOTINDEX) &&
J
Jiri Denemark 已提交
761
        !virCapabilitiesAddGuestFeature(guest, "deviceboot", 1, 0))
762 763
        goto error;

D
Daniel P. Berrange 已提交
764 765 766 767 768 769 770
    if (virCapabilitiesAddGuestDomain(guest,
                                      "qemu",
                                      NULL,
                                      NULL,
                                      0,
                                      NULL) == NULL)
        goto error;
771

D
Daniel P. Berrange 已提交
772 773 774 775 776 777 778 779
    if (haskqemu &&
        virCapabilitiesAddGuestDomain(guest,
                                      "kqemu",
                                      NULL,
                                      NULL,
                                      0,
                                      NULL) == NULL)
        goto error;
780

D
Daniel P. Berrange 已提交
781 782
    if (haskvm) {
        virCapsGuestDomainPtr dom;
783

D
Daniel P. Berrange 已提交
784
        if (kvmbin &&
785
            virQEMUCapsGetMachineTypesCaps(kvmbinCaps, &nmachines, &machines) < 0)
D
Daniel P. Berrange 已提交
786
            goto error;
787

D
Daniel P. Berrange 已提交
788 789 790 791 792 793 794 795
        if ((dom = virCapabilitiesAddGuestDomain(guest,
                                                 "kvm",
                                                 kvmbin ? kvmbin : binary,
                                                 NULL,
                                                 nmachines,
                                                 machines)) == NULL) {
            goto error;
        }
796

D
Daniel P. Berrange 已提交
797 798
        machines = NULL;
        nmachines = 0;
799 800 801

    }

802 803
    if (((guestarch == VIR_ARCH_I686) ||
         (guestarch == VIR_ARCH_X86_64)) &&
804 805 806 807
        (virCapabilitiesAddGuestFeature(guest, "acpi", 1, 1) == NULL ||
         virCapabilitiesAddGuestFeature(guest, "apic", 1, 0) == NULL))
        goto error;

808
    if ((guestarch == VIR_ARCH_I686) &&
809 810 811
        (virCapabilitiesAddGuestFeature(guest, "pae", 1, 0) == NULL ||
         virCapabilitiesAddGuestFeature(guest, "nonpae", 1, 0) == NULL))
        goto error;
812 813 814 815

    ret = 0;

cleanup:
816 817
    VIR_FREE(binary);
    VIR_FREE(kvmbin);
818 819
    virObjectUnref(qemubinCaps);
    virObjectUnref(kvmbinCaps);
820 821 822 823 824 825 826 827 828 829 830

    return ret;

error:
    virCapabilitiesFreeMachines(machines, nmachines);

    goto cleanup;
}


static int
831 832
virQEMUCapsInitCPU(virCapsPtr caps,
                   virArch arch)
833 834 835 836 837 838
{
    virCPUDefPtr cpu = NULL;
    union cpuData *data = NULL;
    virNodeInfo nodeinfo;
    int ret = -1;

839
    if (VIR_ALLOC(cpu) < 0)
840 841
        goto error;

842 843
    cpu->arch = arch;

844
    if (nodeGetInfo(&nodeinfo))
845 846 847 848 849 850
        goto error;

    cpu->type = VIR_CPU_TYPE_HOST;
    cpu->sockets = nodeinfo.sockets;
    cpu->cores = nodeinfo.cores;
    cpu->threads = nodeinfo.threads;
J
Jiri Denemark 已提交
851
    caps->host.cpu = cpu;
852

853
    if (!(data = cpuNodeData(arch))
854
        || cpuDecode(cpu, data, NULL, 0, NULL) < 0)
J
Jiri Denemark 已提交
855
        goto cleanup;
856 857 858 859

    ret = 0;

cleanup:
860
    cpuDataFree(arch, data);
861 862 863 864 865 866 867 868 869

    return ret;

error:
    virCPUDefFree(cpu);
    goto cleanup;
}


870
/* Build the driver capabilities object, probing emulator binaries
 * through @cache for every known architecture.
 *
 * Failures to query NUMA topology, host CPU or power management are
 * only logged as warnings.  Returns the new capabilities, or NULL if
 * the object cannot be created or registering a guest fails.
 */
virCapsPtr virQEMUCapsInit(virQEMUCapsCachePtr cache)
{
    virArch hostarch = virArchFromHost();
    virCapsPtr caps;
    size_t i;

    caps = virCapabilitiesNew(hostarch, 1, 1);
    if (!caps)
        goto error;

    /* Some machines have problematic NUMA topology causing
     * unexpected failures. We don't want to break the QEMU
     * driver in this scenario, so log errors & carry on
     */
    if (nodeCapsInitNUMA(caps) < 0) {
        virCapabilitiesFreeNUMAInfo(caps);
        VIR_WARN("Failed to query host NUMA topology, disabling NUMA capabilities");
    }

    if (virQEMUCapsInitCPU(caps, hostarch) < 0)
        VIR_WARN("Failed to get host CPU");

    /* Add the power management features of the host */
    if (virNodeSuspendGetTargetMask(&caps->host.powerMgmt) < 0)
        VIR_WARN("Failed to get host power management capabilities");

    virCapabilitiesAddHostMigrateTransport(caps, "tcp");

    /* QEMU can support pretty much every arch that exists,
     * so just probe for them all - we gracefully fail
     * if a qemu-system-$ARCH binary can't be found
     */
    for (i = 0; i < VIR_ARCH_LAST; i++) {
        if (virQEMUCapsInitGuest(caps, cache, hostarch, i) < 0)
            goto error;
    }

    return caps;

error:
    virObjectUnref(caps);
    return NULL;
}


918
static int
919 920
virQEMUCapsComputeCmdFlags(const char *help,
                           unsigned int version,
921
                           bool is_kvm,
922 923 924
                           unsigned int kvm_version,
                           virQEMUCapsPtr qemuCaps,
                           bool check_yajl ATTRIBUTE_UNUSED)
925 926
{
    const char *p;
R
Richa Marwaha 已提交
927
    const char *fsdev, *netdev;
928 929

    if (strstr(help, "-no-kqemu"))
930
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_KQEMU);
931
    if (strstr(help, "-enable-kqemu"))
932
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_ENABLE_KQEMU);
933
    if (strstr(help, "-no-kvm"))
934
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_KVM);
935
    if (strstr(help, "-enable-kvm"))
936
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_ENABLE_KVM);
937
    if (strstr(help, "-no-reboot"))
938
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_NO_REBOOT);
939
    if (strstr(help, "-name")) {
940
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_NAME);
941
        if (strstr(help, ",process="))
942
            virQEMUCapsSet(qemuCaps, QEMU_CAPS_NAME_PROCESS);
943 944
    }
    if (strstr(help, "-uuid"))
945
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_UUID);
946
    if (strstr(help, "-xen-domid"))
947
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_XEN_DOMID);
948
    else if (strstr(help, "-domid"))
949
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_DOMID);
950
    if (strstr(help, "-drive")) {
951 952
        const char *cache = strstr(help, "cache=");

953
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_DRIVE);
954 955
        if (cache && (p = strchr(cache, ']'))) {
            if (memmem(cache, p - cache, "on|off", sizeof("on|off") - 1) == NULL)
956
                virQEMUCapsSet(qemuCaps, QEMU_CAPS_DRIVE_CACHE_V2);
957
            if (memmem(cache, p - cache, "directsync", sizeof("directsync") - 1))
958
                virQEMUCapsSet(qemuCaps, QEMU_CAPS_DRIVE_CACHE_DIRECTSYNC);
959
            if (memmem(cache, p - cache, "unsafe", sizeof("unsafe") - 1))
960
                virQEMUCapsSet(qemuCaps, QEMU_CAPS_DRIVE_CACHE_UNSAFE);
961
        }
962
        if (strstr(help, "format="))
963
            virQEMUCapsSet(qemuCaps, QEMU_CAPS_DRIVE_FORMAT);
964
        if (strstr(help, "readonly="))
965
            virQEMUCapsSet(qemuCaps, QEMU_CAPS_DRIVE_READONLY);
966
        if (strstr(help, "aio=threads|native"))
967
            virQEMUCapsSet(qemuCaps, QEMU_CAPS_DRIVE_AIO);
O
Osier Yang 已提交
968
        if (strstr(help, "copy-on-read=on|off"))
969
            virQEMUCapsSet(qemuCaps, QEMU_CAPS_DRIVE_COPY_ON_READ);
970
        if (strstr(help, "bps="))
971
            virQEMUCapsSet(qemuCaps, QEMU_CAPS_DRIVE_IOTUNE);
972 973 974 975
    }
    if ((p = strstr(help, "-vga")) && !strstr(help, "-std-vga")) {
        const char *nl = strstr(p, "\n");

976
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_VGA);
977 978

        if (strstr(p, "|qxl"))
979
            virQEMUCapsSet(qemuCaps, QEMU_CAPS_VGA_QXL);
980
        if ((p = strstr(p, "|none")) && p < nl)
981
            virQEMUCapsSet(qemuCaps, QEMU_CAPS_VGA_NONE);
982 983
    }
    if (strstr(help, "-spice"))
984
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_SPICE);
985
    if (strstr(help, "-vnc"))
986
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_VNC);
987
    if (strstr(help, "seamless-migration="))
988
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_SEAMLESS_MIGRATION);
989
    if (strstr(help, "boot=on"))
990
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_DRIVE_BOOT);
991
    if (strstr(help, "serial=s"))
992
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_DRIVE_SERIAL);
993
    if (strstr(help, "-pcidevice"))
994
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_PCIDEVICE);
995
    if (strstr(help, "-mem-path"))
996
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_MEM_PATH);
997
    if (strstr(help, "-chardev")) {
998
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_CHARDEV);
999
        if (strstr(help, "-chardev spicevmc"))
1000
            virQEMUCapsSet(qemuCaps, QEMU_CAPS_CHARDEV_SPICEVMC);
1001
    }
1002
    if (strstr(help, "-balloon"))
1003
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_BALLOON);
1004
    if (strstr(help, "-device")) {
1005
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_DEVICE);
1006 1007 1008 1009
        /*
         * When -device was introduced, qemu already supported drive's
         * readonly option but didn't advertise that.
         */
1010
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_DRIVE_READONLY);
1011 1012
    }
    if (strstr(help, "-nodefconfig"))
1013
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_NODEFCONFIG);
1014
    if (strstr(help, "-no-user-config"))
1015
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_NO_USER_CONFIG);
1016 1017
    /* The trailing ' ' is important to avoid a bogus match */
    if (strstr(help, "-rtc "))
1018
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_RTC);
1019 1020
    /* to wit */
    if (strstr(help, "-rtc-td-hack"))
1021
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_RTC_TD_HACK);
1022
    if (strstr(help, "-no-hpet"))
1023
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_NO_HPET);
1024
    if (strstr(help, "-no-acpi"))
1025
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_NO_ACPI);
1026
    if (strstr(help, "-no-kvm-pit-reinjection"))
1027
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_NO_KVM_PIT);
1028
    if (strstr(help, "-tdf"))
1029
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_TDF);
1030
    if (strstr(help, "-enable-nesting"))
1031
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_NESTING);
1032
    if (strstr(help, ",menu=on"))
1033
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_BOOT_MENU);
1034
    if (strstr(help, ",reboot-timeout=rb_time"))
1035
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_REBOOT_TIMEOUT);
1036
    if ((fsdev = strstr(help, "-fsdev"))) {
1037
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_FSDEV);
1038
        if (strstr(fsdev, "readonly"))
1039
            virQEMUCapsSet(qemuCaps, QEMU_CAPS_FSDEV_READONLY);
1040
        if (strstr(fsdev, "writeout"))
1041
            virQEMUCapsSet(qemuCaps, QEMU_CAPS_FSDEV_WRITEOUT);
1042
    }
1043
    if (strstr(help, "-smbios type"))
1044
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_SMBIOS_TYPE);
1045
    if (strstr(help, "-sandbox"))
1046
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_SECCOMP_SANDBOX);
1047

R
Richa Marwaha 已提交
1048
    if ((netdev = strstr(help, "-netdev"))) {
1049 1050
        /* Disable -netdev on 0.12 since although it exists,
         * the corresponding netdev_add/remove monitor commands
1051 1052
         * do not, and we need them to be able to do hotplug.
         * But see below about RHEL build. */
R
Richa Marwaha 已提交
1053 1054
        if (version >= 13000) {
            if (strstr(netdev, "bridge"))
1055 1056
                virQEMUCapsSet(qemuCaps, QEMU_CAPS_NETDEV_BRIDGE);
           virQEMUCapsSet(qemuCaps, QEMU_CAPS_NETDEV);
R
Richa Marwaha 已提交
1057
        }
1058 1059 1060
    }

    if (strstr(help, "-sdl"))
1061
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_SDL);
1062 1063 1064
    if (strstr(help, "cores=") &&
        strstr(help, "threads=") &&
        strstr(help, "sockets="))
1065
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_SMP_TOPOLOGY);
1066 1067

    if (version >= 9000)
1068
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_VNC_COLON);
1069 1070

    if (is_kvm && (version >= 10000 || kvm_version >= 74))
1071
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_VNET_HDR);
1072

1073
    if (strstr(help, ",vhost=")) {
1074
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_VHOST_NET);
1075 1076
    }

1077 1078
    /* Do not use -no-shutdown if qemu doesn't support it or SIGTERM handling
     * is most likely buggy when used with -no-shutdown (which applies for qemu
1079
     * 0.14.* and 0.15.0)
1080
     */
1081
    if (strstr(help, "-no-shutdown") && (version < 14000 || version > 15000))
1082
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_NO_SHUTDOWN);
1083

1084
    if (strstr(help, "dump-guest-core=on|off"))
1085
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_DUMP_GUEST_CORE);
1086

O
Olivia Yin 已提交
1087 1088 1089
    if (strstr(help, "-dtb"))
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_DTB);

1090 1091 1092
    if (strstr(help, "-machine"))
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_MACHINE_OPT);

L
Li Zhang 已提交
1093 1094 1095 1096
     /* USB option is supported v1.3.0 onwards */
    if (qemuCaps->version >= 1003000)
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_MACHINE_USB_OPT);

1097 1098 1099 1100
    /*
     * Handling of -incoming arg with varying features
     *  -incoming tcp    (kvm >= 79, qemu >= 0.10.0)
     *  -incoming exec   (kvm >= 80, qemu >= 0.10.0)
1101 1102
     *  -incoming unix   (qemu >= 0.12.0)
     *  -incoming fd     (qemu >= 0.12.0)
1103 1104 1105 1106 1107 1108 1109
     *  -incoming stdio  (all earlier kvm)
     *
     * NB, there was a pre-kvm-79 'tcp' support, but it
     * was broken, because it blocked the monitor console
     * while waiting for data, so pretend it doesn't exist
     */
    if (version >= 10000) {
1110 1111
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_MIGRATE_QEMU_TCP);
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_MIGRATE_QEMU_EXEC);
1112
        if (version >= 12000) {
1113 1114
            virQEMUCapsSet(qemuCaps, QEMU_CAPS_MIGRATE_QEMU_UNIX);
            virQEMUCapsSet(qemuCaps, QEMU_CAPS_MIGRATE_QEMU_FD);
1115
        }
1116
    } else if (kvm_version >= 79) {
1117
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_MIGRATE_QEMU_TCP);
1118
        if (kvm_version >= 80)
1119
            virQEMUCapsSet(qemuCaps, QEMU_CAPS_MIGRATE_QEMU_EXEC);
1120
    } else if (kvm_version > 0) {
1121
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_MIGRATE_KVM_STDIO);
1122 1123 1124
    }

    if (version >= 10000)
1125
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_0_10);
1126

1127
    if (version >= 11000)
1128
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_VIRTIO_BLK_SG_IO);
1129

1130 1131 1132
    /* While JSON mode was available in 0.12.0, it was too
     * incomplete to contemplate using. The 0.13.0 release
     * is good enough to use, even though it lacks one or
1133 1134 1135 1136 1137
     * two features. This is also true of versions of qemu
     * built for RHEL, labeled 0.12.1, but with extra text
     * in the help output that mentions that features were
     * backported for libvirt. The benefits of JSON mode now
     * outweigh the downside.
1138
     */
1139
#if WITH_YAJL
1140
    if (version >= 13000) {
1141
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_MONITOR_JSON);
1142 1143
    } else if (version >= 12000 &&
               strstr(help, "libvirt")) {
1144 1145
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_MONITOR_JSON);
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_NETDEV);
1146
    }
1147 1148 1149 1150 1151 1152 1153
#else
    /* Starting with qemu 0.15 and newer, upstream qemu no longer
     * promises to keep the human interface stable, but requests that
     * we use QMP (the JSON interface) for everything.  If the user
     * forgot to include YAJL libraries when building their own
     * libvirt but is targetting a newer qemu, we are better off
     * telling them to recompile (the spec file includes the
1154
     * dependency, so distros won't hit this).  This check is
1155
     * also in m4/virt-yajl.m4 (see $with_yajl).  */
1156 1157 1158
    if (version >= 15000 ||
        (version >= 12000 && strstr(help, "libvirt"))) {
        if (check_yajl) {
1159 1160 1161
            virReportError(VIR_ERR_CONFIG_UNSUPPORTED, "%s",
                           _("this qemu binary requires libvirt to be "
                             "compiled with yajl"));
1162 1163
            return -1;
        }
1164
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_NETDEV);
1165
    }
E
Eric Blake 已提交
1166
#endif
1167 1168

    if (version >= 13000)
1169
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_PCI_MULTIFUNCTION);
1170 1171 1172 1173 1174 1175 1176 1177 1178 1179 1180 1181

    /* Although very new versions of qemu advertise the presence of
     * the rombar option in the output of "qemu -device pci-assign,?",
     * this advertisement was added to the code long after the option
     * itself. According to qemu developers, though, rombar is
     * available in all qemu binaries from release 0.12 onward.
     * Setting the capability this way makes it available in more
     * cases where it might be needed, and shouldn't cause any false
     * positives (in the case that it did, qemu would produce an error
     * log and refuse to start, so it would be immediately obvious).
     */
    if (version >= 12000)
1182
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_PCI_ROMBAR);
1183 1184

    if (version >= 11000)
1185
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_CPU_HOST);
1186

1187
    if (version >= 1001000) {
J
Ján Tomko 已提交
1188
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_IPV6_MIGRATION);
1189 1190
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_VNC_SHARE_POLICY);
    }
J
Ján Tomko 已提交
1191

1192
    if (version >= 1002000)
1193
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_DEVICE_VIDEO_PRIMARY);
1194
    return 0;
1195 1196 1197 1198 1199 1200 1201 1202 1203 1204 1205 1206 1207 1208 1209 1210 1211 1212 1213 1214 1215 1216 1217 1218 1219 1220
}

/* We parse the output of 'qemu -help' to get the QEMU
 * version number. The first bit is easy, just parse
 * 'QEMU PC emulator version x.y.z'
 * or
 * 'QEMU emulator version x.y.z'.
 *
 * With qemu-kvm, however, that is followed by a string
 * in parentheses as follows:
 *  - qemu-kvm-x.y.z in stable releases
 *  - kvm-XX for kvm versions up to kvm-85
 *  - qemu-kvm-devel-XX for kvm version kvm-86 and later
 *
 * For qemu-kvm versions before 0.10.z, we need to detect
 * the KVM version number for some features. With 0.10.z
 * and later, we just need the QEMU version number and
 * whether it is KVM QEMU or mainline QEMU.
 */
/* Prefixes accepted at the very start of the 'qemu -help' output */
#define QEMU_VERSION_STR_1  "QEMU emulator version"
#define QEMU_VERSION_STR_2  "QEMU PC emulator version"
/* Prefixes of the parenthesised string that marks a KVM build */
#define QEMU_KVM_VER_PREFIX "(qemu-kvm-"
#define KVM_VER_PREFIX      "(kvm-"

/* Advance the pointer lvalue @p past any run of spaces and tabs */
#define SKIP_BLANKS(p) \
    do { \
        while (*(p) == ' ' || *(p) == '\t') \
            (p)++; \
    } while (0)

1221 1222 1223 1224
/*
 * virQEMUCapsParseHelpStr:
 * @qemu: name of the binary, used only in the error message
 * @help: text of the 'qemu -help' output
 * @qemuCaps: capability set that receives the detected flags
 * @version: filled with major * 1000000 + minor * 1000 + micro
 * @is_kvm: set to true when a "(qemu-kvm-" or "(kvm-" marker follows
 *          the version number
 * @kvm_version: filled with the number following "(kvm-", otherwise 0
 * @check_yajl: forwarded to virQEMUCapsComputeCmdFlags()
 *
 * Parses the version banner at the start of @help and then derives
 * the capability flags from the help text and the parsed versions.
 *
 * Returns 0 on success, -1 on failure. An error is reported here when
 * the banner cannot be parsed; when flag computation fails, -1 is
 * returned without reporting anything further from this function.
 */
int virQEMUCapsParseHelpStr(const char *qemu,
                            const char *help,
                            virQEMUCapsPtr qemuCaps,
                            unsigned int *version,
                            bool *is_kvm,
                            unsigned int *kvm_version,
                            bool check_yajl)
{
    unsigned major, minor, micro;
    const char *p = help;
    char *strflags;

    *version = *kvm_version = 0;
    *is_kvm = false;

    if (STRPREFIX(p, QEMU_VERSION_STR_1))
        p += strlen(QEMU_VERSION_STR_1);
    else if (STRPREFIX(p, QEMU_VERSION_STR_2))
        p += strlen(QEMU_VERSION_STR_2);
    else
        goto fail;

    SKIP_BLANKS(p);

    /* "major.minor" is mandatory */
    major = virParseNumber(&p);
    if (major == -1 || *p != '.')
        goto fail;

    ++p;

    minor = virParseNumber(&p);
    if (minor == -1)
        goto fail;

    /* ".micro" is optional and defaults to 0 */
    if (*p != '.') {
        micro = 0;
    } else {
        ++p;
        micro = virParseNumber(&p);
        if (micro == -1)
            goto fail;
    }

    SKIP_BLANKS(p);

    if (STRPREFIX(p, QEMU_KVM_VER_PREFIX)) {
        *is_kvm = true;
        p += strlen(QEMU_KVM_VER_PREFIX);
    } else if (STRPREFIX(p, KVM_VER_PREFIX)) {
        int ret;

        *is_kvm = true;
        p += strlen(KVM_VER_PREFIX);

        ret = virParseNumber(&p);
        if (ret == -1)
            goto fail;

        *kvm_version = ret;
    }

    *version = (major * 1000 * 1000) + (minor * 1000) + micro;

    if (virQEMUCapsComputeCmdFlags(help, *version, *is_kvm, *kvm_version,
                                   qemuCaps, check_yajl) < 0)
        goto cleanup;

    strflags = virBitmapString(qemuCaps->flags);
    VIR_DEBUG("Version %u.%u.%u, cooked version %u, flags %s",
              major, minor, micro, *version, NULLSTR(strflags));
    VIR_FREE(strflags);

    /* *kvm_version is unsigned, so it is printed with %u */
    if (*kvm_version)
        VIR_DEBUG("KVM version %u detected", *kvm_version);
    else if (*is_kvm)
        VIR_DEBUG("qemu-kvm version %u.%u.%u detected", major, minor, micro);

    return 0;

fail:
    /* Quote only the first line of the help text in the error */
    p = strchr(help, '\n');
    if (!p)
        p = strchr(help, '\0');

    virReportError(VIR_ERR_INTERNAL_ERROR,
                   _("cannot parse %s version number in '%.*s'"),
                   qemu, (int) (p - help), help);

cleanup:
    return -1;
}

1313

1314
/* Associates a string with the capability flag set when it is matched */
struct virQEMUCapsStringFlags {
    const char *value;  /* string compared for exact equality */
    int flag;           /* capability flag passed to virQEMUCapsSet() */
};


1320 1321 1322 1323 1324 1325 1326 1327 1328 1329 1330 1331 1332 1333 1334 1335
/* Command name -> capability flag table.
 * NOTE(review): presumably matched against monitor command names;
 * the consumer is not visible in this part of the file. */
struct virQEMUCapsStringFlags virQEMUCapsCommands[] = {
    { "system_wakeup",          QEMU_CAPS_WAKEUP },
    { "transaction",            QEMU_CAPS_TRANSACTION },
    { "block_job_cancel",       QEMU_CAPS_BLOCKJOB_SYNC },
    { "block-job-cancel",       QEMU_CAPS_BLOCKJOB_ASYNC },
    { "dump-guest-memory",      QEMU_CAPS_DUMP_GUEST_MEMORY },
    { "query-spice",            QEMU_CAPS_SPICE },
    { "query-kvm",              QEMU_CAPS_KVM },
    { "block-commit",           QEMU_CAPS_BLOCK_COMMIT },
    { "query-vnc",              QEMU_CAPS_VNC },
    { "drive-mirror",           QEMU_CAPS_DRIVE_MIRROR },
    { "blockdev-snapshot-sync", QEMU_CAPS_DISK_SNAPSHOT },
    { "add-fd",                 QEMU_CAPS_ADD_FD },
    { "nbd-server-start",       QEMU_CAPS_NBD_SERVER },
};

1336 1337 1338
struct virQEMUCapsStringFlags virQEMUCapsEvents[] = {
    { "BALLOON_CHANGE", QEMU_CAPS_BALLOON_EVENT },
    { "SPICE_MIGRATE_COMPLETED", QEMU_CAPS_SEAMLESS_MIGRATION },
1339
    { "DEVICE_DELETED", QEMU_CAPS_DEVICE_DEL_EVENT },
1340 1341
};

1342
struct virQEMUCapsStringFlags virQEMUCapsObjectTypes[] = {
1343 1344 1345 1346 1347 1348 1349 1350 1351 1352 1353 1354 1355 1356 1357
    { "hda-duplex", QEMU_CAPS_HDA_DUPLEX },
    { "hda-micro", QEMU_CAPS_HDA_MICRO },
    { "ccid-card-emulated", QEMU_CAPS_CCID_EMULATED },
    { "ccid-card-passthru", QEMU_CAPS_CCID_PASSTHRU },
    { "piix3-usb-uhci", QEMU_CAPS_PIIX3_USB_UHCI },
    { "piix4-usb-uhci", QEMU_CAPS_PIIX4_USB_UHCI },
    { "usb-ehci", QEMU_CAPS_USB_EHCI },
    { "ich9-usb-ehci1", QEMU_CAPS_ICH9_USB_EHCI1 },
    { "vt82c686b-usb-uhci", QEMU_CAPS_VT82C686B_USB_UHCI },
    { "pci-ohci", QEMU_CAPS_PCI_OHCI },
    { "nec-usb-xhci", QEMU_CAPS_NEC_USB_XHCI },
    { "usb-redir", QEMU_CAPS_USB_REDIR },
    { "usb-hub", QEMU_CAPS_USB_HUB },
    { "ich9-ahci", QEMU_CAPS_ICH9_AHCI },
    { "virtio-blk-s390", QEMU_CAPS_VIRTIO_S390 },
1358
    { "virtio-blk-ccw", QEMU_CAPS_VIRTIO_CCW },
1359
    { "sclpconsole", QEMU_CAPS_SCLP_S390 },
1360
    { "lsi53c895a", QEMU_CAPS_SCSI_LSI },
1361
    { "virtio-scsi-pci", QEMU_CAPS_VIRTIO_SCSI },
1362 1363
    { "virtio-scsi-s390", QEMU_CAPS_VIRTIO_SCSI },
    { "virtio-scsi-ccw", QEMU_CAPS_VIRTIO_SCSI },
1364
    { "megasas", QEMU_CAPS_SCSI_MEGASAS },
1365 1366
    { "spicevmc", QEMU_CAPS_DEVICE_SPICEVMC },
    { "qxl-vga", QEMU_CAPS_DEVICE_QXL_VGA },
1367
    { "qxl", QEMU_CAPS_DEVICE_QXL },
1368 1369 1370 1371
    { "sga", QEMU_CAPS_SGA },
    { "scsi-block", QEMU_CAPS_SCSI_BLOCK },
    { "scsi-cd", QEMU_CAPS_SCSI_CD },
    { "ide-cd", QEMU_CAPS_IDE_CD },
1372 1373 1374
    { "VGA", QEMU_CAPS_DEVICE_VGA },
    { "cirrus-vga", QEMU_CAPS_DEVICE_CIRRUS_VGA },
    { "vmware-svga", QEMU_CAPS_DEVICE_VMWARE_SVGA },
H
Han Cheng 已提交
1375 1376
    { "usb-serial", QEMU_CAPS_DEVICE_USB_SERIAL },
    { "usb-net", QEMU_CAPS_DEVICE_USB_NET },
1377
    { "virtio-rng-pci", QEMU_CAPS_DEVICE_VIRTIO_RNG },
1378 1379
    { "virtio-rng-s390", QEMU_CAPS_DEVICE_VIRTIO_RNG },
    { "virtio-rng-ccw", QEMU_CAPS_DEVICE_VIRTIO_RNG },
1380
    { "rng-random", QEMU_CAPS_OBJECT_RNG_RANDOM },
1381
    { "rng-egd", QEMU_CAPS_OBJECT_RNG_EGD },
1382
    { "spapr-nvram", QEMU_CAPS_DEVICE_NVRAM },
1383
    { "pci-bridge", QEMU_CAPS_DEVICE_PCI_BRIDGE },
1384
    { "vfio-pci", QEMU_CAPS_DEVICE_VFIO_PCI },
H
Han Cheng 已提交
1385
    { "scsi-generic", QEMU_CAPS_DEVICE_SCSI_GENERIC },
1386 1387
};

1388
static struct virQEMUCapsStringFlags virQEMUCapsObjectPropsVirtioBlk[] = {
1389 1390 1391 1392 1393 1394 1395 1396
    { "multifunction", QEMU_CAPS_PCI_MULTIFUNCTION },
    { "bootindex", QEMU_CAPS_BOOTINDEX },
    { "ioeventfd", QEMU_CAPS_VIRTIO_IOEVENTFD },
    { "event_idx", QEMU_CAPS_VIRTIO_BLK_EVENT_IDX },
    { "scsi", QEMU_CAPS_VIRTIO_BLK_SCSI },
    { "logical_block_size", QEMU_CAPS_BLOCKIO },
};

1397
static struct virQEMUCapsStringFlags virQEMUCapsObjectPropsVirtioNet[] = {
1398 1399 1400 1401
    { "tx", QEMU_CAPS_VIRTIO_TX_ALG },
    { "event_idx", QEMU_CAPS_VIRTIO_NET_EVENT_IDX },
};

1402
static struct virQEMUCapsStringFlags virQEMUCapsObjectPropsPciAssign[] = {
1403
    { "rombar", QEMU_CAPS_PCI_ROMBAR },
1404 1405 1406 1407
    { "configfd", QEMU_CAPS_PCI_CONFIGFD },
    { "bootindex", QEMU_CAPS_PCI_BOOTINDEX },
};

1408 1409 1410 1411
/* Property name -> capability flag for the "vfio-pci" device type */
static struct virQEMUCapsStringFlags virQEMUCapsObjectPropsVfioPci[] = {
    {
        "bootindex",
        QEMU_CAPS_VFIO_PCI_BOOTINDEX
    },
};

1412
static struct virQEMUCapsStringFlags virQEMUCapsObjectPropsScsiDisk[] = {
1413 1414 1415 1416
    { "channel", QEMU_CAPS_SCSI_DISK_CHANNEL },
    { "wwn", QEMU_CAPS_SCSI_DISK_WWN },
};

1417
static struct virQEMUCapsStringFlags virQEMUCapsObjectPropsIDEDrive[] = {
1418 1419 1420
    { "wwn", QEMU_CAPS_IDE_DRIVE_WWN },
};

1421
static struct virQEMUCapsStringFlags virQEMUCapsObjectPropsPixx4PM[] = {
1422 1423 1424 1425
    { "disable_s3", QEMU_CAPS_DISABLE_S3 },
    { "disable_s4", QEMU_CAPS_DISABLE_S4 },
};

1426
static struct virQEMUCapsStringFlags virQEMUCapsObjectPropsUsbRedir[] = {
1427
    { "filter", QEMU_CAPS_USB_REDIR_FILTER },
1428 1429 1430
    { "bootindex", QEMU_CAPS_USB_REDIR_BOOTINDEX },
};

1431
static struct virQEMUCapsStringFlags virQEMUCapsObjectPropsUsbHost[] = {
1432
    { "bootindex", QEMU_CAPS_USB_HOST_BOOTINDEX },
1433 1434
};

H
Han Cheng 已提交
1435 1436 1437 1438
/* Property name -> capability flag for the "scsi-generic" device type */
static struct virQEMUCapsStringFlags virQEMUCapsObjectPropsScsiGeneric[] = {
    {
        "bootindex",
        QEMU_CAPS_DEVICE_SCSI_GENERIC_BOOTINDEX
    },
};

1439
/* Binds a device type name to the property table checked for it */
struct virQEMUCapsObjectTypeProps {
    const char *type;                       /* device type name */
    struct virQEMUCapsStringFlags *props;   /* property -> flag table */
    size_t nprops;                          /* number of entries in @props */
};

1445 1446 1447 1448
static struct virQEMUCapsObjectTypeProps virQEMUCapsObjectProps[] = {
    { "virtio-blk-pci", virQEMUCapsObjectPropsVirtioBlk,
      ARRAY_CARDINALITY(virQEMUCapsObjectPropsVirtioBlk) },
    { "virtio-net-pci", virQEMUCapsObjectPropsVirtioNet,
1449 1450 1451 1452
      ARRAY_CARDINALITY(virQEMUCapsObjectPropsVirtioNet) },
    { "virtio-blk-ccw", virQEMUCapsObjectPropsVirtioBlk,
      ARRAY_CARDINALITY(virQEMUCapsObjectPropsVirtioBlk) },
    { "virtio-net-ccw", virQEMUCapsObjectPropsVirtioNet,
1453 1454 1455 1456 1457 1458 1459 1460 1461
      ARRAY_CARDINALITY(virQEMUCapsObjectPropsVirtioNet) },
    { "virtio-blk-s390", virQEMUCapsObjectPropsVirtioBlk,
      ARRAY_CARDINALITY(virQEMUCapsObjectPropsVirtioBlk) },
    { "virtio-net-s390", virQEMUCapsObjectPropsVirtioNet,
      ARRAY_CARDINALITY(virQEMUCapsObjectPropsVirtioNet) },
    { "pci-assign", virQEMUCapsObjectPropsPciAssign,
      ARRAY_CARDINALITY(virQEMUCapsObjectPropsPciAssign) },
    { "kvm-pci-assign", virQEMUCapsObjectPropsPciAssign,
      ARRAY_CARDINALITY(virQEMUCapsObjectPropsPciAssign) },
1462 1463
    { "vfio-pci", virQEMUCapsObjectPropsVfioPci,
      ARRAY_CARDINALITY(virQEMUCapsObjectPropsVfioPci) },
1464 1465 1466 1467 1468 1469 1470 1471 1472 1473
    { "scsi-disk", virQEMUCapsObjectPropsScsiDisk,
      ARRAY_CARDINALITY(virQEMUCapsObjectPropsScsiDisk) },
    { "ide-drive", virQEMUCapsObjectPropsIDEDrive,
      ARRAY_CARDINALITY(virQEMUCapsObjectPropsIDEDrive) },
    { "PIIX4_PM", virQEMUCapsObjectPropsPixx4PM,
      ARRAY_CARDINALITY(virQEMUCapsObjectPropsPixx4PM) },
    { "usb-redir", virQEMUCapsObjectPropsUsbRedir,
      ARRAY_CARDINALITY(virQEMUCapsObjectPropsUsbRedir) },
    { "usb-host", virQEMUCapsObjectPropsUsbHost,
      ARRAY_CARDINALITY(virQEMUCapsObjectPropsUsbHost) },
H
Han Cheng 已提交
1474 1475
    { "scsi-generic", virQEMUCapsObjectPropsScsiGeneric,
      ARRAY_CARDINALITY(virQEMUCapsObjectPropsScsiGeneric) },
1476 1477 1478 1479
};


static void
1480 1481 1482 1483 1484
virQEMUCapsProcessStringFlags(virQEMUCapsPtr qemuCaps,
                              size_t nflags,
                              struct virQEMUCapsStringFlags *flags,
                              size_t nvalues,
                              char *const*values)
1485 1486
{
    size_t i, j;
1487 1488
    for (i = 0; i < nflags; i++) {
        for (j = 0; j < nvalues; j++) {
1489
            if (STREQ(values[j], flags[i].value)) {
1490
                virQEMUCapsSet(qemuCaps, flags[i].flag);
1491 1492 1493 1494 1495 1496 1497 1498
                break;
            }
        }
    }
}


/*
 * virQEMUCapsFreeStringList:
 * @len: number of entries in @values
 * @values: array of strings to release
 *
 * Frees each of the @len strings and then the array itself.
 */
static void
virQEMUCapsFreeStringList(size_t len,
                          char **values)
{
    size_t idx = 0;

    while (idx < len) {
        VIR_FREE(values[idx]);
        idx++;
    }

    VIR_FREE(values);
}


/* Text preceding each quoted device type name in the device list
 * output; lines starting with it are skipped when parsing properties */
#define OBJECT_TYPE_PREFIX "name \""

static int
1512 1513
virQEMUCapsParseDeviceStrObjectTypes(const char *str,
                                     char ***types)
1514 1515 1516 1517 1518 1519 1520 1521 1522 1523 1524 1525 1526 1527 1528 1529 1530 1531
{
    const char *tmp = str;
    int ret = -1;
    size_t ntypelist = 0;
    char **typelist = NULL;

    *types = NULL;

    while ((tmp = strstr(tmp, OBJECT_TYPE_PREFIX))) {
        char *end;
        tmp += strlen(OBJECT_TYPE_PREFIX);
        end = strstr(tmp, "\"");
        if (!end) {
            virReportError(VIR_ERR_INTERNAL_ERROR, "%s",
                           _("Malformed QEMU device list string, missing quote"));
            goto cleanup;
        }

1532
        if (VIR_EXPAND_N(typelist, ntypelist, 1) < 0)
1533
            goto cleanup;
1534
        if (VIR_STRNDUP(typelist[ntypelist - 1], tmp, end-tmp) < 0)
1535 1536 1537 1538 1539 1540 1541 1542
            goto cleanup;
    }

    *types = typelist;
    ret = ntypelist;

cleanup:
    if (ret < 0)
1543
        virQEMUCapsFreeStringList(ntypelist, typelist);
1544 1545 1546 1547 1548
    return ret;
}


static int
1549 1550 1551
virQEMUCapsParseDeviceStrObjectProps(const char *str,
                                     const char *type,
                                     char ***props)
1552 1553 1554 1555 1556 1557 1558 1559 1560 1561 1562 1563 1564 1565 1566 1567 1568 1569 1570 1571 1572 1573 1574 1575 1576 1577 1578 1579 1580 1581 1582 1583 1584
{
    const char *tmp = str;
    int ret = -1;
    size_t nproplist = 0;
    char **proplist = NULL;

    VIR_DEBUG("Extract type %s", type);
    *props = NULL;

    while ((tmp = strchr(tmp, '\n'))) {
        char *end;
        tmp += 1;

        if (*tmp == '\0')
            break;

        if (STRPREFIX(tmp, OBJECT_TYPE_PREFIX))
            continue;

        if (!STRPREFIX(tmp, type))
            continue;

        tmp += strlen(type);
        if (*tmp != '.')
            continue;
        tmp++;

        end = strstr(tmp, "=");
        if (!end) {
            virReportError(VIR_ERR_INTERNAL_ERROR, "%s",
                           _("Malformed QEMU device list string, missing '='"));
            goto cleanup;
        }
1585
        if (VIR_EXPAND_N(proplist, nproplist, 1) < 0)
1586
            goto cleanup;
1587
        if (VIR_STRNDUP(proplist[nproplist - 1], tmp, end-tmp) < 0)
1588 1589 1590 1591 1592 1593 1594 1595
            goto cleanup;
    }

    *props = proplist;
    ret = nproplist;

cleanup:
    if (ret < 0)
1596
        virQEMUCapsFreeStringList(nproplist, proplist);
1597 1598 1599 1600 1601
    return ret;
}


int
1602
virQEMUCapsParseDeviceStr(virQEMUCapsPtr qemuCaps, const char *str)
1603 1604 1605 1606 1607
{
    int nvalues;
    char **values;
    size_t i;

1608
    if ((nvalues = virQEMUCapsParseDeviceStrObjectTypes(str, &values)) < 0)
1609
        return -1;
1610 1611 1612 1613 1614 1615
    virQEMUCapsProcessStringFlags(qemuCaps,
                                  ARRAY_CARDINALITY(virQEMUCapsObjectTypes),
                                  virQEMUCapsObjectTypes,
                                  nvalues, values);
    virQEMUCapsFreeStringList(nvalues, values);

1616
    for (i = 0; i < ARRAY_CARDINALITY(virQEMUCapsObjectProps); i++) {
1617 1618 1619 1620
        const char *type = virQEMUCapsObjectProps[i].type;
        if ((nvalues = virQEMUCapsParseDeviceStrObjectProps(str,
                                                            type,
                                                            &values)) < 0)
1621
            return -1;
1622 1623 1624 1625 1626
        virQEMUCapsProcessStringFlags(qemuCaps,
                                      virQEMUCapsObjectProps[i].nprops,
                                      virQEMUCapsObjectProps[i].props,
                                      nvalues, values);
        virQEMUCapsFreeStringList(nvalues, values);
1627 1628 1629
    }

    /* Prefer -chardev spicevmc (detected earlier) over -device spicevmc */
1630 1631
    if (virQEMUCapsGet(qemuCaps, QEMU_CAPS_CHARDEV_SPICEVMC))
        virQEMUCapsClear(qemuCaps, QEMU_CAPS_DEVICE_SPICEVMC);
1632 1633 1634 1635 1636

    return 0;
}


E
Eric Blake 已提交
1637
static int
1638 1639
virQEMUCapsExtractDeviceStr(const char *qemu,
                            virQEMUCapsPtr qemuCaps,
1640
                            uid_t runUid, gid_t runGid)
1641
{
E
Eric Blake 已提交
1642
    char *output = NULL;
1643
    virCommandPtr cmd;
E
Eric Blake 已提交
1644
    int ret = -1;
1645

E
Eric Blake 已提交
1646 1647
    /* Cram together all device-related queries into one invocation;
     * the output format makes it possible to distinguish what we
1648 1649
     * need.  With qemu 0.13.0 and later, unrecognized '-device
     * bogus,?' cause an error in isolation, but are silently ignored
1650
     * in combination with '-device ?'.  Upstream qemu 0.12.x doesn't
1651 1652
     * understand '-device name,?', and always exits with status 1 for
     * the simpler '-device ?', so this function is really only useful
1653
     * if -help includes "device driver,?".  */
1654
    cmd = virQEMUCapsProbeCommand(qemu, qemuCaps, runUid, runGid);
1655 1656 1657 1658 1659 1660
    virCommandAddArgList(cmd,
                         "-device", "?",
                         "-device", "pci-assign,?",
                         "-device", "virtio-blk-pci,?",
                         "-device", "virtio-net-pci,?",
                         "-device", "scsi-disk,?",
1661
                         "-device", "PIIX4_PM,?",
1662
                         "-device", "usb-redir,?",
1663
                         "-device", "ide-drive,?",
1664
                         "-device", "usb-host,?",
H
Han Cheng 已提交
1665
                         "-device", "scsi-generic,?",
1666
                         NULL);
1667
    /* qemu -help goes to stdout, but qemu -device ? goes to stderr.  */
E
Eric Blake 已提交
1668
    virCommandSetErrorBuffer(cmd, &output);
1669

1670
    if (virCommandRun(cmd, NULL) < 0)
1671 1672
        goto cleanup;

1673
    ret = virQEMUCapsParseDeviceStr(qemuCaps, output);
1674 1675

cleanup:
E
Eric Blake 已提交
1676
    VIR_FREE(output);
1677
    virCommandFree(cmd);
E
Eric Blake 已提交
1678 1679 1680
    return ret;
}

1681

1682 1683 1684
/**
 * virQEMUCapsGetDefaultVersion:
 * @caps: host capabilities used to find the default "hvm"/"qemu" emulator
 * @capsCache: cache from which the emulator's capabilities are looked up
 * @version: in/out; left untouched when already non-zero, otherwise
 *           filled with the version reported for the default emulator
 *
 * Returns 0 on success (including the case where @version was already
 * set), -1 if no emulator is found for the host architecture or the
 * cache lookup fails.
 */
int virQEMUCapsGetDefaultVersion(virCapsPtr caps,
                                 virQEMUCapsCachePtr capsCache,
                                 unsigned int *version)
{
    virArch arch;
    const char *emulator;
    virQEMUCapsPtr cached;

    /* Nothing to do when the caller already has a version. */
    if (*version != 0)
        return 0;

    arch = virArchFromHost();
    emulator = virCapabilitiesDefaultGuestEmulator(caps, "hvm", arch, "qemu");
    if (emulator == NULL) {
        virReportError(VIR_ERR_INTERNAL_ERROR,
                       _("Cannot find suitable emulator for %s"),
                       virArchToString(arch));
        return -1;
    }

    cached = virQEMUCapsCacheLookup(capsCache, emulator);
    if (!cached)
        return -1;

    *version = virQEMUCapsGetVersion(cached);
    /* Drop the object obtained from the lookup once the version is read. */
    virObjectUnref(cached);
    return 0;
}
1711 1712


1713 1714


1715 1716
virQEMUCapsPtr
virQEMUCapsNew(void)
1717
{
1718
    virQEMUCapsPtr qemuCaps;
1719

1720
    if (virQEMUCapsInitialize() < 0)
1721 1722
        return NULL;

1723
    if (!(qemuCaps = virObjectNew(virQEMUCapsClass)))
1724 1725
        return NULL;

1726
    if (!(qemuCaps->flags = virBitmapNew(QEMU_CAPS_LAST)))
1727
        goto error;
1728

1729
    return qemuCaps;
1730

1731
error:
1732
    virObjectUnref(qemuCaps);
1733
    return NULL;
1734 1735 1736
}


1737
/**
 * virQEMUCapsNewCopy:
 * @qemuCaps: capabilities object to duplicate
 *
 * Builds a new object carrying the same flags, usedQMP marker, versions,
 * architecture, CPU definition names and machine type tables as
 * @qemuCaps.  The binary path and mtime are not copied by this function.
 *
 * Returns the copy, or NULL on allocation failure.
 */
virQEMUCapsPtr virQEMUCapsNewCopy(virQEMUCapsPtr qemuCaps)
{
    virQEMUCapsPtr copy = virQEMUCapsNew();
    size_t idx;

    if (copy == NULL)
        return NULL;

    virBitmapCopy(copy->flags, qemuCaps->flags);

    copy->arch = qemuCaps->arch;
    copy->kvmVersion = qemuCaps->kvmVersion;
    copy->version = qemuCaps->version;
    copy->usedQMP = qemuCaps->usedQMP;

    /* The element count is recorded only after the array exists, so the
     * error path never walks an array that was not allocated. */
    if (VIR_ALLOC_N(copy->cpuDefinitions, qemuCaps->ncpuDefinitions) < 0)
        goto error;
    copy->ncpuDefinitions = qemuCaps->ncpuDefinitions;
    for (idx = 0; idx < qemuCaps->ncpuDefinitions; idx++) {
        if (VIR_STRDUP(copy->cpuDefinitions[idx],
                       qemuCaps->cpuDefinitions[idx]) < 0)
            goto error;
    }

    /* The three machine tables are parallel arrays of the same length. */
    if (VIR_ALLOC_N(copy->machineTypes, qemuCaps->nmachineTypes) < 0 ||
        VIR_ALLOC_N(copy->machineAliases, qemuCaps->nmachineTypes) < 0 ||
        VIR_ALLOC_N(copy->machineMaxCpus, qemuCaps->nmachineTypes) < 0)
        goto error;
    copy->nmachineTypes = qemuCaps->nmachineTypes;
    for (idx = 0; idx < qemuCaps->nmachineTypes; idx++) {
        if (VIR_STRDUP(copy->machineTypes[idx],
                       qemuCaps->machineTypes[idx]) < 0)
            goto error;
        if (VIR_STRDUP(copy->machineAliases[idx],
                       qemuCaps->machineAliases[idx]) < 0)
            goto error;
        copy->machineMaxCpus[idx] = qemuCaps->machineMaxCpus[idx];
    }

    return copy;

error:
    virObjectUnref(copy);
    return NULL;
}


1782
void virQEMUCapsDispose(void *obj)
1783
{
1784
    virQEMUCapsPtr qemuCaps = obj;
1785 1786
    size_t i;

1787
    for (i = 0; i < qemuCaps->nmachineTypes; i++) {
1788 1789
        VIR_FREE(qemuCaps->machineTypes[i]);
        VIR_FREE(qemuCaps->machineAliases[i]);
1790
    }
1791 1792
    VIR_FREE(qemuCaps->machineTypes);
    VIR_FREE(qemuCaps->machineAliases);
1793
    VIR_FREE(qemuCaps->machineMaxCpus);
1794

1795
    for (i = 0; i < qemuCaps->ncpuDefinitions; i++) {
1796
        VIR_FREE(qemuCaps->cpuDefinitions[i]);
1797
    }
1798
    VIR_FREE(qemuCaps->cpuDefinitions);
1799

1800
    virBitmapFree(qemuCaps->flags);
1801

1802
    VIR_FREE(qemuCaps->binary);
1803 1804
}

1805
void
1806 1807
virQEMUCapsSet(virQEMUCapsPtr qemuCaps,
               enum virQEMUCapsFlags flag)
1808
{
1809
    ignore_value(virBitmapSetBit(qemuCaps->flags, flag));
1810 1811 1812 1813
}


void
1814
virQEMUCapsSetList(virQEMUCapsPtr qemuCaps, ...)
1815 1816 1817 1818
{
    va_list list;
    int flag;

1819
    va_start(list, qemuCaps);
1820
    while ((flag = va_arg(list, int)) < QEMU_CAPS_LAST)
1821
        ignore_value(virBitmapSetBit(qemuCaps->flags, flag));
1822
    va_end(list);
1823 1824 1825 1826
}


void
1827 1828
virQEMUCapsClear(virQEMUCapsPtr qemuCaps,
                 enum virQEMUCapsFlags flag)
1829
{
1830
    ignore_value(virBitmapClearBit(qemuCaps->flags, flag));
1831 1832 1833
}


1834
/**
 * virQEMUCapsFlagsString:
 * @qemuCaps: capabilities object to describe
 *
 * Returns whatever virBitmapString() produces for the object's flag
 * bitmap.
 */
char *
virQEMUCapsFlagsString(virQEMUCapsPtr qemuCaps)
{
    return virBitmapString(qemuCaps->flags);
}


bool
1841 1842
virQEMUCapsGet(virQEMUCapsPtr qemuCaps,
               enum virQEMUCapsFlags flag)
1843
{
1844 1845
    bool b;

1846
    if (!qemuCaps || virBitmapGetBit(qemuCaps->flags, flag, &b) < 0)
1847 1848 1849
        return false;
    else
        return b;
1850
}
1851 1852


1853
/**
 * virQEMUCapsGetBinary:
 * @qemuCaps: capabilities object to query
 *
 * Returns the binary path string stored in the object (not a copy).
 */
const char *
virQEMUCapsGetBinary(virQEMUCapsPtr qemuCaps)
{
    return qemuCaps->binary;
}

1858
/**
 * virQEMUCapsGetArch:
 * @qemuCaps: capabilities object to query
 *
 * Returns the architecture recorded in the object.
 */
virArch
virQEMUCapsGetArch(virQEMUCapsPtr qemuCaps)
{
    return qemuCaps->arch;
}


1864
/**
 * virQEMUCapsGetVersion:
 * @qemuCaps: capabilities object to query
 *
 * Returns the version number recorded in the object.
 */
unsigned int
virQEMUCapsGetVersion(virQEMUCapsPtr qemuCaps)
{
    return qemuCaps->version;
}


1870
/**
 * virQEMUCapsGetKVMVersion:
 * @qemuCaps: capabilities object to query
 *
 * Returns the KVM version number recorded in the object.
 */
unsigned int
virQEMUCapsGetKVMVersion(virQEMUCapsPtr qemuCaps)
{
    return qemuCaps->kvmVersion;
}


1876 1877
/**
 * virQEMUCapsAddCPUDefinition:
 * @qemuCaps: capabilities object to extend
 * @name: CPU definition name to append (duplicated internally)
 *
 * Appends a copy of @name to the object's CPU definition list.
 *
 * Returns 0 on success, -1 if duplicating the string or growing the
 * list fails (the list is left as it was).
 */
int virQEMUCapsAddCPUDefinition(virQEMUCapsPtr qemuCaps,
                                const char *name)
{
    char *copy;

    if (VIR_STRDUP(copy, name) < 0)
        return -1;

    if (VIR_EXPAND_N(qemuCaps->cpuDefinitions,
                     qemuCaps->ncpuDefinitions, 1) >= 0) {
        /* The freshly added slot is the last one. */
        qemuCaps->cpuDefinitions[qemuCaps->ncpuDefinitions - 1] = copy;
        return 0;
    }

    VIR_FREE(copy);
    return -1;
}


1892 1893
/**
 * virQEMUCapsGetCPUDefinitions:
 * @qemuCaps: capabilities object to query
 * @names: optional output; when non-NULL it is pointed at the object's
 *         own CPU definition array (no copy is made)
 *
 * Returns the number of CPU definitions stored in the object.
 */
size_t
virQEMUCapsGetCPUDefinitions(virQEMUCapsPtr qemuCaps,
                             char ***names)
{
    if (names != NULL)
        *names = qemuCaps->cpuDefinitions;

    return qemuCaps->ncpuDefinitions;
}


1901 1902
/**
 * virQEMUCapsGetMachineTypes:
 * @qemuCaps: capabilities object to query
 * @names: optional output; when non-NULL it is pointed at the object's
 *         own machine type name array (no copy is made)
 *
 * Returns the number of machine types stored in the object.
 */
size_t
virQEMUCapsGetMachineTypes(virQEMUCapsPtr qemuCaps,
                           char ***names)
{
    if (names != NULL)
        *names = qemuCaps->machineTypes;

    return qemuCaps->nmachineTypes;
}

1909 1910 1911
/**
 * virQEMUCapsGetMachineTypesCaps:
 * @qemuCaps: capabilities object providing the machine type tables
 * @nmachines: output; number of entries stored in @machines
 * @machines: output; newly allocated array of machine descriptions
 *
 * Builds one virCapsGuestMachine per known machine type.  When a
 * machine has an alias, the alias becomes the entry's name and the
 * machine type its canonical name; otherwise the machine type itself
 * is the name.
 *
 * Returns 0 on success.  On failure returns -1 with *@nmachines set to
 * 0 and *@machines set to NULL.
 */
int virQEMUCapsGetMachineTypesCaps(virQEMUCapsPtr qemuCaps,
                                   size_t *nmachines,
                                   virCapsGuestMachinePtr **machines)
{
    size_t i;

    *nmachines = 0;
    *machines = NULL;
    if (VIR_ALLOC_N(*machines, qemuCaps->nmachineTypes) < 0)
        goto error;
    *nmachines = qemuCaps->nmachineTypes;

    for (i = 0; i < qemuCaps->nmachineTypes; i++) {
        virCapsGuestMachinePtr mach;

        if (VIR_ALLOC(mach) < 0)
            goto error;

        /* Store the entry in the array before filling it in, so that a
         * failure below is cleaned up by the error path instead of
         * leaking the partially built entry. */
        (*machines)[i] = mach;

        if (qemuCaps->machineAliases[i]) {
            if (VIR_STRDUP(mach->name, qemuCaps->machineAliases[i]) < 0 ||
                VIR_STRDUP(mach->canonical, qemuCaps->machineTypes[i]) < 0)
                goto error;
        } else {
            if (VIR_STRDUP(mach->name, qemuCaps->machineTypes[i]) < 0)
                goto error;
        }
        mach->maxCpus = qemuCaps->machineMaxCpus[i];
    }

    return 0;

error:
    /* Slots not reached by the loop are still NULL here, exactly as in
     * the failure cases that existed before this entry was stored early. */
    virCapabilitiesFreeMachines(*machines, *nmachines);
    *nmachines = 0;
    *machines = NULL;
    return -1;
}



1948

1949 1950
/**
 * virQEMUCapsGetCanonicalMachine:
 * @qemuCaps: capabilities object providing the alias table
 * @name: machine name to resolve (may be NULL)
 *
 * Returns NULL when @name is NULL; the machine type stored alongside
 * the first alias equal to @name when there is one; otherwise @name
 * itself.
 */
const char *virQEMUCapsGetCanonicalMachine(virQEMUCapsPtr qemuCaps,
                                           const char *name)
{
    size_t idx;

    if (name == NULL)
        return NULL;

    for (idx = 0; idx < qemuCaps->nmachineTypes; idx++) {
        const char *alias = qemuCaps->machineAliases[idx];

        /* Machines without an alias can never match. */
        if (alias && STREQ(alias, name))
            return qemuCaps->machineTypes[idx];
    }

    return name;
}
1966 1967


1968 1969 1970 1971 1972 1973 1974 1975 1976 1977 1978 1979 1980 1981 1982 1983 1984 1985 1986
/**
 * virQEMUCapsGetMachineMaxCpus:
 * @qemuCaps: capabilities object providing the machine tables
 * @name: machine type name to look up (may be NULL)
 *
 * Returns the max-cpus value of the first machine type equal to @name
 * that has a non-zero value recorded; 0 when @name is NULL or no such
 * entry exists.
 */
int virQEMUCapsGetMachineMaxCpus(virQEMUCapsPtr qemuCaps,
                                 const char *name)
{
    size_t idx;

    if (name == NULL)
        return 0;

    for (idx = 0; idx < qemuCaps->nmachineTypes; idx++) {
        /* Entries with no recorded limit are skipped before comparing. */
        if (qemuCaps->machineMaxCpus[idx] != 0 &&
            STREQ(qemuCaps->machineTypes[idx], name))
            return qemuCaps->machineMaxCpus[idx];
    }

    return 0;
}


1987
static int
1988 1989
virQEMUCapsProbeQMPCommands(virQEMUCapsPtr qemuCaps,
                            qemuMonitorPtr mon)
1990 1991 1992 1993 1994 1995 1996
{
    char **commands = NULL;
    int ncommands;

    if ((ncommands = qemuMonitorGetCommands(mon, &commands)) < 0)
        return -1;

1997 1998 1999 2000 2001
    virQEMUCapsProcessStringFlags(qemuCaps,
                                  ARRAY_CARDINALITY(virQEMUCapsCommands),
                                  virQEMUCapsCommands,
                                  ncommands, commands);
    virQEMUCapsFreeStringList(ncommands, commands);
2002

2003 2004 2005 2006
    /* QMP add-fd was introduced in 1.2, but did not support
     * management control of set numbering, and did not have a
     * counterpart -add-fd command line option.  We require the
     * add-fd features from 1.3 or later.  */
2007
    if (virQEMUCapsGet(qemuCaps, QEMU_CAPS_ADD_FD)) {
2008 2009 2010 2011 2012 2013 2014
        int fd = open("/dev/null", O_RDONLY);
        if (fd < 0) {
            virReportError(VIR_ERR_INTERNAL_ERROR, "%s",
                           _("unable to probe for add-fd"));
            return -1;
        }
        if (qemuMonitorAddFd(mon, 0, fd, "/dev/null") < 0)
2015
            virQEMUCapsClear(qemuCaps, QEMU_CAPS_ADD_FD);
2016 2017 2018
        VIR_FORCE_CLOSE(fd);
    }

2019 2020 2021 2022 2023
    return 0;
}


static int
2024 2025
virQEMUCapsProbeQMPEvents(virQEMUCapsPtr qemuCaps,
                          qemuMonitorPtr mon)
2026 2027 2028 2029 2030 2031 2032
{
    char **events = NULL;
    int nevents;

    if ((nevents = qemuMonitorGetEvents(mon, &events)) < 0)
        return -1;

2033 2034 2035 2036 2037
    virQEMUCapsProcessStringFlags(qemuCaps,
                                  ARRAY_CARDINALITY(virQEMUCapsEvents),
                                  virQEMUCapsEvents,
                                  nevents, events);
    virQEMUCapsFreeStringList(nevents, events);
2038 2039 2040 2041 2042

    return 0;
}


2043
static int
2044 2045
virQEMUCapsProbeQMPObjects(virQEMUCapsPtr qemuCaps,
                           qemuMonitorPtr mon)
2046 2047 2048 2049 2050 2051 2052
{
    int nvalues;
    char **values;
    size_t i;

    if ((nvalues = qemuMonitorGetObjectTypes(mon, &values)) < 0)
        return -1;
2053 2054 2055 2056 2057 2058
    virQEMUCapsProcessStringFlags(qemuCaps,
                                  ARRAY_CARDINALITY(virQEMUCapsObjectTypes),
                                  virQEMUCapsObjectTypes,
                                  nvalues, values);
    virQEMUCapsFreeStringList(nvalues, values);

2059
    for (i = 0; i < ARRAY_CARDINALITY(virQEMUCapsObjectProps); i++) {
2060
        const char *type = virQEMUCapsObjectProps[i].type;
2061 2062 2063 2064
        if ((nvalues = qemuMonitorGetObjectProps(mon,
                                                 type,
                                                 &values)) < 0)
            return -1;
2065 2066 2067 2068 2069
        virQEMUCapsProcessStringFlags(qemuCaps,
                                      virQEMUCapsObjectProps[i].nprops,
                                      virQEMUCapsObjectProps[i].props,
                                      nvalues, values);
        virQEMUCapsFreeStringList(nvalues, values);
2070 2071 2072
    }

    /* Prefer -chardev spicevmc (detected earlier) over -device spicevmc */
2073 2074
    if (virQEMUCapsGet(qemuCaps, QEMU_CAPS_CHARDEV_SPICEVMC))
        virQEMUCapsClear(qemuCaps, QEMU_CAPS_DEVICE_SPICEVMC);
2075
    /* If qemu supports newer -device qxl it supports -vga qxl as well */
2076 2077
    if (virQEMUCapsGet(qemuCaps, QEMU_CAPS_DEVICE_QXL))
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_VGA_QXL);
2078 2079 2080 2081 2082 2083

    return 0;
}


static int
2084 2085
virQEMUCapsProbeQMPMachineTypes(virQEMUCapsPtr qemuCaps,
                                qemuMonitorPtr mon)
2086 2087 2088 2089 2090
{
    qemuMonitorMachineInfoPtr *machines = NULL;
    int nmachines = 0;
    int ret = -1;
    size_t i;
2091
    size_t defIdx = 0;
2092 2093 2094 2095

    if ((nmachines = qemuMonitorGetMachines(mon, &machines)) < 0)
        goto cleanup;

2096
    if (VIR_ALLOC_N(qemuCaps->machineTypes, nmachines) < 0)
2097
        goto cleanup;
2098
    if (VIR_ALLOC_N(qemuCaps->machineAliases, nmachines) < 0)
2099
        goto cleanup;
2100
    if (VIR_ALLOC_N(qemuCaps->machineMaxCpus, nmachines) < 0)
2101
        goto cleanup;
2102

2103
    for (i = 0; i < nmachines; i++) {
2104 2105
        if (VIR_STRDUP(qemuCaps->machineAliases[i], machines[i]->alias) < 0 ||
            VIR_STRDUP(qemuCaps->machineTypes[i], machines[i]->name) < 0)
2106
            goto cleanup;
2107 2108
        if (machines[i]->isDefault)
            defIdx = i;
2109
        qemuCaps->machineMaxCpus[i] = machines[i]->maxCpus;
2110
    }
2111
    qemuCaps->nmachineTypes = nmachines;
2112 2113

    if (defIdx)
2114
        virQEMUCapsSetDefaultMachine(qemuCaps, defIdx);
2115 2116 2117 2118

    ret = 0;

cleanup:
2119
    for (i = 0; i < nmachines; i++)
2120 2121 2122 2123 2124 2125 2126
        qemuMonitorMachineInfoFree(machines[i]);
    VIR_FREE(machines);
    return ret;
}


static int
2127 2128
virQEMUCapsProbeQMPCPUDefinitions(virQEMUCapsPtr qemuCaps,
                                  qemuMonitorPtr mon)
2129 2130 2131 2132 2133 2134 2135
{
    int ncpuDefinitions;
    char **cpuDefinitions;

    if ((ncpuDefinitions = qemuMonitorGetCPUDefinitions(mon, &cpuDefinitions)) < 0)
        return -1;

2136 2137
    qemuCaps->ncpuDefinitions = ncpuDefinitions;
    qemuCaps->cpuDefinitions = cpuDefinitions;
2138 2139 2140 2141

    return 0;
}

2142 2143 2144 2145 2146 2147 2148 2149 2150 2151 2152 2153 2154 2155 2156 2157 2158 2159 2160 2161 2162 2163 2164
/* Pairs a TPM enum value (@type) with the capability flag (@caps) that
 * is set when QEMU reports support for it. */
struct tpmTypeToCaps {
    int type;
    enum virQEMUCapsFlags caps;
};

/* TPM backend types; @type is converted with
 * virDomainTPMBackendTypeToString() when probing. */
static const struct tpmTypeToCaps virQEMUCapsTPMTypesToCaps[] = {
    {
        .type = VIR_DOMAIN_TPM_TYPE_PASSTHROUGH,
        .caps = QEMU_CAPS_DEVICE_TPM_PASSTHROUGH,
    },
};

/* TPM device models; @type is converted with
 * virDomainTPMModelTypeToString() when probing.
 * NOTE(review): unlike the table above this one is not 'static' --
 * confirm whether external linkage is intended. */
const struct tpmTypeToCaps virQEMUCapsTPMModelsToCaps[] = {
    {
        .type = VIR_DOMAIN_TPM_MODEL_TIS,
        .caps = QEMU_CAPS_DEVICE_TPM_TIS,
    },
};

/**
 * virQEMUCapsProbeQMPTPM:
 * @qemuCaps: capabilities object to update
 * @mon: monitor to query
 *
 * Queries the TPM models and then the TPM backend types known to QEMU
 * and sets the capability mapped to each table entry whose string name
 * appears in the corresponding reply.
 *
 * Returns 0 on success, -1 if either monitor query fails.
 */
static int
virQEMUCapsProbeQMPTPM(virQEMUCapsPtr qemuCaps,
                       qemuMonitorPtr mon)
{
    char **found = NULL;
    int nfound;
    size_t idx;

    nfound = qemuMonitorGetTPMModels(mon, &found);
    if (nfound < 0)
        return -1;

    /* An empty reply means there is nothing to match against. */
    for (idx = 0;
         nfound > 0 && idx < ARRAY_CARDINALITY(virQEMUCapsTPMModelsToCaps);
         idx++) {
        const char *model = virDomainTPMModelTypeToString(
            virQEMUCapsTPMModelsToCaps[idx].type);

        if (virStringArrayHasString(found, model))
            virQEMUCapsSet(qemuCaps,
                           virQEMUCapsTPMModelsToCaps[idx].caps);
    }
    virStringFreeList(found);

    nfound = qemuMonitorGetTPMTypes(mon, &found);
    if (nfound < 0)
        return -1;

    for (idx = 0;
         nfound > 0 && idx < ARRAY_CARDINALITY(virQEMUCapsTPMTypesToCaps);
         idx++) {
        const char *backend = virDomainTPMBackendTypeToString(
            virQEMUCapsTPMTypesToCaps[idx].type);

        if (virStringArrayHasString(found, backend))
            virQEMUCapsSet(qemuCaps, virQEMUCapsTPMTypesToCaps[idx].caps);
    }
    virStringFreeList(found);

    return 0;
}

2199

2200
static int
2201 2202
virQEMUCapsProbeQMPKVMState(virQEMUCapsPtr qemuCaps,
                            qemuMonitorPtr mon)
2203 2204 2205 2206
{
    bool enabled = false;
    bool present = false;

2207
    if (!virQEMUCapsGet(qemuCaps, QEMU_CAPS_KVM))
2208 2209 2210 2211 2212 2213
        return 0;

    if (qemuMonitorGetKVMState(mon, &enabled, &present) < 0)
        return -1;

    /* The QEMU_CAPS_KVM flag was initially set according to the QEMU
2214 2215 2216 2217 2218 2219 2220 2221
     * reporting the recognition of 'query-kvm' QMP command. That merely
     * indicates existance of the command though, not whether KVM support
     * is actually available, nor whether it is enabled by default.
     *
     * If it is not present we need to clear the flag, and if it is
     * not enabled by default we need to change the flag.
     */
    if (!present) {
2222
        virQEMUCapsClear(qemuCaps, QEMU_CAPS_KVM);
2223
    } else if (!enabled) {
2224 2225
        virQEMUCapsClear(qemuCaps, QEMU_CAPS_KVM);
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_ENABLE_KVM);
2226 2227 2228 2229 2230
    }

    return 0;
}

2231 2232 2233 2234 2235 2236 2237 2238
struct virQEMUCapsCommandLineProps {
    const char *option;
    const char *param;
    int flag;
};

static struct virQEMUCapsCommandLineProps virQEMUCapsCommandLine[] = {
    { "machine", "mem-merge", QEMU_CAPS_MEM_MERGE },
O
Osier Yang 已提交
2239
    { "drive", "discard", QEMU_CAPS_DRIVE_DISCARD },
2240
    { "realtime", "mlock", QEMU_CAPS_MLOCK },
2241 2242 2243 2244 2245 2246 2247 2248 2249 2250 2251 2252 2253 2254 2255 2256 2257 2258 2259 2260 2261 2262 2263 2264 2265 2266
};

/**
 * virQEMUCapsProbeQMPCommandLine:
 * @qemuCaps: capabilities object to update
 * @mon: monitor to query
 *
 * For every entry of virQEMUCapsCommandLine, asks the monitor for the
 * parameters of the entry's option and sets the entry's flag when its
 * parameter name is among them.
 *
 * Returns 0 on success, -1 if a monitor query fails.
 */
static int
virQEMUCapsProbeQMPCommandLine(virQEMUCapsPtr qemuCaps,
                               qemuMonitorPtr mon)
{
    char **params;
    int nparams;
    size_t opt, p;

    for (opt = 0; opt < ARRAY_CARDINALITY(virQEMUCapsCommandLine); opt++) {
        nparams = qemuMonitorGetCommandLineOptionParameters(
            mon, virQEMUCapsCommandLine[opt].option, &params);
        if (nparams < 0)
            return -1;

        for (p = 0; p < nparams; p++) {
            if (!STREQ(virQEMUCapsCommandLine[opt].param, params[p]))
                continue;

            /* The first match is enough. */
            virQEMUCapsSet(qemuCaps, virQEMUCapsCommandLine[opt].flag);
            break;
        }
        virStringFreeList(params);
    }

    return 0;
}
2267

2268 2269
/**
 * virQEMUCapsProbeQMP:
 * @qemuCaps: capabilities object to update
 * @mon: monitor to query
 *
 * Probes QMP commands and events through @mon, unless the object is
 * already marked as having been populated via QMP.
 *
 * Returns 0 on success (or when nothing had to be done), -1 if a probe
 * fails.
 */
int virQEMUCapsProbeQMP(virQEMUCapsPtr qemuCaps,
                        qemuMonitorPtr mon)
{
    VIR_DEBUG("qemuCaps=%p mon=%p", qemuCaps, mon);

    if (qemuCaps->usedQMP)
        return 0;

    if (virQEMUCapsProbeQMPCommands(qemuCaps, mon) < 0 ||
        virQEMUCapsProbeQMPEvents(qemuCaps, mon) < 0)
        return -1;

    return 0;
}


2286 2287
#define QEMU_SYSTEM_PREFIX "qemu-system-"

2288
static int
2289
virQEMUCapsInitHelp(virQEMUCapsPtr qemuCaps, uid_t runUid, gid_t runGid)
2290
{
2291
    virCommandPtr cmd = NULL;
2292
    bool is_kvm;
2293
    char *help = NULL;
2294 2295
    int ret = -1;
    const char *tmp;
2296

2297
    VIR_DEBUG("qemuCaps=%p", qemuCaps);
2298

2299
    tmp = strstr(qemuCaps->binary, QEMU_SYSTEM_PREFIX);
2300 2301
    if (tmp) {
        tmp += strlen(QEMU_SYSTEM_PREFIX);
2302

2303
        qemuCaps->arch = virQEMUCapsArchFromString(tmp);
2304
    } else {
2305
        qemuCaps->arch = virArchFromHost();
2306 2307
    }

2308
    cmd = virQEMUCapsProbeCommand(qemuCaps->binary, NULL, runUid, runGid);
2309 2310 2311 2312
    virCommandAddArgList(cmd, "-help", NULL);
    virCommandSetOutputBuffer(cmd, &help);

    if (virCommandRun(cmd, NULL) < 0)
2313
        goto cleanup;
2314

2315 2316 2317 2318 2319 2320
    if (virQEMUCapsParseHelpStr(qemuCaps->binary,
                                help, qemuCaps,
                                &qemuCaps->version,
                                &is_kvm,
                                &qemuCaps->kvmVersion,
                                false) < 0)
2321
        goto cleanup;
2322 2323

    /* Currently only x86_64 and i686 support PCI-multibus. */
2324 2325 2326
    if (qemuCaps->arch == VIR_ARCH_X86_64 ||
        qemuCaps->arch == VIR_ARCH_I686) {
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_PCI_MULTIBUS);
2327 2328 2329
    } else {
        /* -no-acpi is not supported on other archs
         * even if qemu reports it in -help */
2330
        virQEMUCapsClear(qemuCaps, QEMU_CAPS_NO_ACPI);
2331
    }
2332

2333
    /* virQEMUCapsExtractDeviceStr will only set additional caps if qemu
2334
     * understands the 0.13.0+ notion of "-device driver,".  */
2335
    if (virQEMUCapsGet(qemuCaps, QEMU_CAPS_DEVICE) &&
2336
        strstr(help, "-device driver,?") &&
2337 2338
        virQEMUCapsExtractDeviceStr(qemuCaps->binary,
                                    qemuCaps, runUid, runGid) < 0) {
2339
        goto cleanup;
2340
    }
2341

2342
    if (virQEMUCapsProbeCPUModels(qemuCaps, runUid, runGid) < 0)
2343
        goto cleanup;
2344

2345
    if (virQEMUCapsProbeMachineTypes(qemuCaps, runUid, runGid) < 0)
2346
        goto cleanup;
2347

2348
    ret = 0;
2349
cleanup:
2350
    virCommandFree(cmd);
2351
    VIR_FREE(help);
2352 2353 2354 2355
    return ret;
}


2356 2357
/* Monitor notification handler that deliberately does nothing; both
 * parameters are unused. */
static void
virQEMUCapsMonitorNotify(qemuMonitorPtr mon ATTRIBUTE_UNUSED,
                         virDomainObjPtr vm ATTRIBUTE_UNUSED)
{
    /* nothing to do */
}

static qemuMonitorCallbacks callbacks = {
2362 2363
    .eofNotify = virQEMUCapsMonitorNotify,
    .errorNotify = virQEMUCapsMonitorNotify,
2364 2365 2366 2367 2368 2369 2370
};


/* Capabilities that we assume are always enabled
 * for QEMU >= 1.2.0
 */
static void
2371
virQEMUCapsInitQMPBasic(virQEMUCapsPtr qemuCaps)
2372
{
2373 2374 2375 2376 2377 2378 2379 2380 2381 2382 2383 2384 2385 2386 2387 2388 2389 2390 2391 2392 2393 2394 2395 2396 2397 2398 2399 2400 2401 2402 2403 2404 2405 2406 2407 2408 2409 2410 2411 2412 2413 2414 2415 2416 2417 2418 2419 2420 2421
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_VNC_COLON);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_NO_REBOOT);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_DRIVE);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_NAME);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_UUID);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_VNET_HDR);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_MIGRATE_QEMU_TCP);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_MIGRATE_QEMU_EXEC);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_DRIVE_CACHE_V2);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_DRIVE_FORMAT);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_VGA);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_0_10);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_MEM_PATH);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_DRIVE_SERIAL);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_MIGRATE_QEMU_UNIX);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_CHARDEV);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_MONITOR_JSON);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_BALLOON);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_DEVICE);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_SDL);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_SMP_TOPOLOGY);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_NETDEV);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_RTC);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_VHOST_NET);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_NO_HPET);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_NODEFCONFIG);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_BOOT_MENU);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_FSDEV);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_NAME_PROCESS);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_DRIVE_READONLY);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_SMBIOS_TYPE);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_VGA_NONE);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_MIGRATE_QEMU_FD);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_DRIVE_AIO);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_CHARDEV_SPICEVMC);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_DEVICE_QXL_VGA);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_DRIVE_CACHE_DIRECTSYNC);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_NO_SHUTDOWN);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_DRIVE_CACHE_UNSAFE);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_FSDEV_READONLY);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_VIRTIO_BLK_SG_IO);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_DRIVE_COPY_ON_READ);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_CPU_HOST);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_FSDEV_WRITEOUT);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_DRIVE_IOTUNE);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_WAKEUP);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_NO_USER_CONFIG);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_NETDEV_BRIDGE);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_SECCOMP_SANDBOX);
O
Olivia Yin 已提交
2422
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_DTB);
J
Ján Tomko 已提交
2423
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_IPV6_MIGRATION);
2424 2425
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_MACHINE_OPT);
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_DUMP_GUEST_CORE);
2426
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_VNC_SHARE_POLICY);
2427
    virQEMUCapsSet(qemuCaps, QEMU_CAPS_DEVICE_VIDEO_PRIMARY);
2428 2429
}

2430 2431 2432 2433 2434 2435 2436 2437 2438 2439 2440 2441 2442 2443 2444 2445 2446 2447 2448 2449 2450 2451 2452 2453 2454 2455 2456 2457 2458 2459 2460 2461 2462 2463 2464 2465
/* Architecture dependent capabilities initialized for QEMU.
 *
 * Asks the monitor for the target architecture, stores it in @qemuCaps
 * and sets the flags that only apply to x86_64 and i686.
 *
 * Returns 0 on success, -1 if the architecture cannot be queried or is
 * not recognized.
 */
static int
virQEMUCapsInitArchQMPBasic(virQEMUCapsPtr qemuCaps,
                            qemuMonitorPtr mon)
{
    char *targetArch = qemuMonitorGetTargetArch(mon);
    bool isX86;
    int ret = -1;

    if (targetArch == NULL)
        return -1;

    qemuCaps->arch = virQEMUCapsArchFromString(targetArch);
    if (qemuCaps->arch == VIR_ARCH_NONE) {
        virReportError(VIR_ERR_INTERNAL_ERROR,
                       _("Unknown QEMU arch %s"), targetArch);
        goto cleanup;
    }

    /*
     * Currently only x86_64 and i686 support PCI-multibus,
     * -no-acpi and -no-kvm-pit-reinjection.
     */
    isX86 = (qemuCaps->arch == VIR_ARCH_X86_64 ||
             qemuCaps->arch == VIR_ARCH_I686);
    if (isX86) {
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_PCI_MULTIBUS);
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_NO_ACPI);
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_NO_KVM_PIT);
    }

    ret = 0;

cleanup:
    VIR_FREE(targetArch);
    return ret;
}
2466 2467

static int
2468 2469 2470 2471
virQEMUCapsInitQMP(virQEMUCapsPtr qemuCaps,
                   const char *libDir,
                   uid_t runUid,
                   gid_t runGid)
2472 2473 2474 2475 2476
{
    int ret = -1;
    virCommandPtr cmd = NULL;
    qemuMonitorPtr mon = NULL;
    int major, minor, micro;
2477
    char *package = NULL;
2478 2479 2480 2481
    int status = 0;
    virDomainChrSourceDef config;
    char *monarg = NULL;
    char *monpath = NULL;
2482
    char *pidfile = NULL;
2483 2484
    pid_t pid = 0;
    virDomainObj vm;
2485

2486 2487 2488
    /* the ".sock" sufix is important to avoid a possible clash with a qemu
     * domain called "capabilities"
     */
2489
    if (virAsprintf(&monpath, "%s/%s", libDir, "capabilities.monitor.sock") < 0)
2490
        goto cleanup;
2491
    if (virAsprintf(&monarg, "unix:%s,server,nowait", monpath) < 0)
2492 2493
        goto cleanup;

2494 2495
    /* ".pidfile" suffix is used rather than ".pid" to avoid a possible clash
     * with a qemu domain called "capabilities"
2496 2497 2498
     * Normally we'd use runDir for pid files, but because we're using
     * -daemonize we need QEMU to be allowed to create them, rather
     * than libvirtd. So we're using libDir which QEMU can write to
2499
     */
2500
    if (virAsprintf(&pidfile, "%s/%s", libDir, "capabilities.pidfile") < 0)
2501 2502
        goto cleanup;

2503 2504 2505 2506 2507
    memset(&config, 0, sizeof(config));
    config.type = VIR_DOMAIN_CHR_TYPE_UNIX;
    config.data.nix.path = monpath;
    config.data.nix.listen = false;

2508
    VIR_DEBUG("Try to get caps via QMP qemuCaps=%p", qemuCaps);
2509

2510 2511 2512 2513 2514 2515 2516
    /*
     * We explicitly need to use -daemonize here, rather than
     * virCommandDaemonize, because we need to synchronize
     * with QEMU creating its monitor socket API. Using
     * daemonize guarantees control won't return to libvirt
     * until the socket is present.
     */
2517
    cmd = virCommandNewArgList(qemuCaps->binary,
2518 2519 2520 2521 2522 2523
                               "-S",
                               "-no-user-config",
                               "-nodefaults",
                               "-nographic",
                               "-M", "none",
                               "-qmp", monarg,
2524 2525
                               "-pidfile", pidfile,
                               "-daemonize",
2526 2527 2528
                               NULL);
    virCommandAddEnvPassCommon(cmd);
    virCommandClearCaps(cmd);
2529 2530
    virCommandSetGID(cmd, runGid);
    virCommandSetUID(cmd, runUid);
2531 2532 2533 2534 2535 2536

    if (virCommandRun(cmd, &status) < 0)
        goto cleanup;

    if (status != 0) {
        ret = 0;
2537
        VIR_DEBUG("QEMU %s exited with status %d", qemuCaps->binary, status);
2538 2539 2540
        goto cleanup;
    }

2541 2542 2543 2544 2545 2546 2547 2548 2549 2550
    if (virPidFileReadPath(pidfile, &pid) < 0) {
        VIR_DEBUG("Failed to read pidfile %s", pidfile);
        ret = 0;
        goto cleanup;
    }

    memset(&vm, 0, sizeof(vm));
    vm.pid = pid;

    if (!(mon = qemuMonitorOpen(&vm, &config, true, &callbacks))) {
2551
        ret = 0;
2552
        goto cleanup;
2553
    }
2554

2555
    virObjectLock(mon);
2556 2557 2558 2559 2560 2561 2562 2563 2564 2565 2566 2567 2568 2569 2570 2571 2572 2573 2574 2575 2576 2577

    if (qemuMonitorSetCapabilities(mon) < 0) {
        virErrorPtr err = virGetLastError();
        VIR_DEBUG("Failed to set monitor capabilities %s",
                  err ? err->message : "<unknown problem>");
        ret = 0;
        goto cleanup;
    }

    if (qemuMonitorGetVersion(mon,
                              &major, &minor, &micro,
                              &package) < 0) {
        virErrorPtr err = virGetLastError();
        VIR_DEBUG("Failed to query monitor version %s",
                  err ? err->message : "<unknown problem>");
        ret = 0;
        goto cleanup;
    }

    VIR_DEBUG("Got version %d.%d.%d (%s)",
              major, minor, micro, NULLSTR(package));

2578
    if (major < 1 || (major == 1 && minor < 2)) {
2579 2580 2581 2582 2583
        VIR_DEBUG("Not new enough for QMP capabilities detection");
        ret = 0;
        goto cleanup;
    }

2584 2585
    qemuCaps->version = major * 1000000 + minor * 1000 + micro;
    qemuCaps->usedQMP = true;
2586

2587
    virQEMUCapsInitQMPBasic(qemuCaps);
2588

2589 2590 2591
    if (virQEMUCapsInitArchQMPBasic(qemuCaps, mon) < 0)
        goto cleanup;

L
Li Zhang 已提交
2592 2593 2594 2595
    /* USB option is supported v1.3.0 onwards */
    if (qemuCaps->version >= 1003000)
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_MACHINE_USB_OPT);

2596 2597 2598 2599
    /* WebSockets were introduced between 1.3.0 and 1.3.1 */
    if (qemuCaps->version >= 1003001)
        virQEMUCapsSet(qemuCaps, QEMU_CAPS_VNC_WEBSOCKET);

2600
    if (virQEMUCapsProbeQMPCommands(qemuCaps, mon) < 0)
2601
        goto cleanup;
2602
    if (virQEMUCapsProbeQMPEvents(qemuCaps, mon) < 0)
2603
        goto cleanup;
2604
    if (virQEMUCapsProbeQMPObjects(qemuCaps, mon) < 0)
2605
        goto cleanup;
2606
    if (virQEMUCapsProbeQMPMachineTypes(qemuCaps, mon) < 0)
2607
        goto cleanup;
2608
    if (virQEMUCapsProbeQMPCPUDefinitions(qemuCaps, mon) < 0)
2609
        goto cleanup;
2610
    if (virQEMUCapsProbeQMPKVMState(qemuCaps, mon) < 0)
2611
        goto cleanup;
2612 2613
    if (virQEMUCapsProbeQMPTPM(qemuCaps, mon) < 0)
        goto cleanup;
2614 2615
    if (virQEMUCapsProbeQMPCommandLine(qemuCaps, mon) < 0)
        goto cleanup;
2616 2617 2618 2619 2620

    ret = 0;

cleanup:
    if (mon)
2621
        virObjectUnlock(mon);
2622 2623
    qemuMonitorClose(mon);
    virCommandAbort(cmd);
2624
    virCommandFree(cmd);
2625 2626
    VIR_FREE(monarg);
    VIR_FREE(monpath);
2627
    VIR_FREE(package);
2628

2629
    if (pid != 0) {
2630 2631
        char ebuf[1024];

2632 2633 2634 2635 2636 2637 2638
        VIR_DEBUG("Killing QMP caps process %lld", (long long) pid);
        if (virProcessKill(pid, SIGKILL) < 0 && errno != ESRCH)
            VIR_ERROR(_("Failed to kill process %lld: %s"),
                      (long long) pid,
                      virStrerror(errno, ebuf, sizeof(ebuf)));
    }
    if (pidfile) {
2639 2640 2641
        unlink(pidfile);
        VIR_FREE(pidfile);
    }
2642 2643 2644 2645
    return ret;
}


2646 2647 2648 2649
virQEMUCapsPtr virQEMUCapsNewForBinary(const char *binary,
                                       const char *libDir,
                                       uid_t runUid,
                                       gid_t runGid)
2650
{
2651
    virQEMUCapsPtr qemuCaps = virQEMUCapsNew();
2652 2653 2654
    struct stat sb;
    int rv;

2655 2656
    if (VIR_STRDUP(qemuCaps->binary, binary) < 0)
        goto error;
2657 2658 2659 2660 2661 2662 2663 2664

    /* We would also want to check faccessat if we cared about ACLs,
     * but we don't.  */
    if (stat(binary, &sb) < 0) {
        virReportSystemError(errno, _("Cannot check QEMU binary %s"),
                             binary);
        goto error;
    }
2665
    qemuCaps->mtime = sb.st_mtime;
2666 2667 2668 2669 2670 2671 2672 2673 2674 2675 2676

    /* Make sure the binary we are about to try exec'ing exists.
     * Technically we could catch the exec() failure, but that's
     * in a sub-process so it's hard to feed back a useful error.
     */
    if (!virFileIsExecutable(binary)) {
        virReportSystemError(errno, _("QEMU binary %s is not executable"),
                             binary);
        goto error;
    }

2677
    if ((rv = virQEMUCapsInitQMP(qemuCaps, libDir, runUid, runGid)) < 0)
2678 2679
        goto error;

2680 2681
    if (!qemuCaps->usedQMP &&
        virQEMUCapsInitHelp(qemuCaps, runUid, runGid) < 0)
2682 2683
        goto error;

2684
    return qemuCaps;
2685 2686

error:
2687 2688
    virObjectUnref(qemuCaps);
    qemuCaps = NULL;
2689
    return NULL;
2690 2691 2692
}


2693
/**
 * virQEMUCapsIsValid:
 * @qemuCaps: capabilities object to check
 *
 * Compares the modification time stored in @qemuCaps with the current
 * modification time of its binary.
 *
 * Returns true if no binary is recorded or the modification times
 * match, false if the binary cannot be stat()ed or the times differ.
 */
bool virQEMUCapsIsValid(virQEMUCapsPtr qemuCaps)
{
    struct stat st;
    bool valid = false;

    /* Nothing to compare against when no binary path is recorded. */
    if (qemuCaps->binary == NULL)
        return true;

    if (stat(qemuCaps->binary, &st) >= 0)
        valid = (st.st_mtime == qemuCaps->mtime);

    return valid;
}
2705 2706 2707


static void
2708
virQEMUCapsHashDataFree(void *payload, const void *key ATTRIBUTE_UNUSED)
2709 2710 2711 2712 2713
{
    virObjectUnref(payload);
}


2714 2715 2716 2717
virQEMUCapsCachePtr
virQEMUCapsCacheNew(const char *libDir,
                    uid_t runUid,
                    gid_t runGid)
2718
{
2719
    virQEMUCapsCachePtr cache;
2720

2721
    if (VIR_ALLOC(cache) < 0)
2722 2723 2724 2725 2726 2727 2728 2729 2730
        return NULL;

    if (virMutexInit(&cache->lock) < 0) {
        virReportError(VIR_ERR_INTERNAL_ERROR, "%s",
                       _("Unable to initialize mutex"));
        VIR_FREE(cache);
        return NULL;
    }

2731
    if (!(cache->binaries = virHashCreate(10, virQEMUCapsHashDataFree)))
2732
        goto error;
2733
    if (VIR_STRDUP(cache->libDir, libDir) < 0)
2734
        goto error;
2735

2736 2737 2738
    cache->runUid = runUid;
    cache->runGid = runGid;

2739 2740 2741
    return cache;

error:
2742
    virQEMUCapsCacheFree(cache);
2743 2744 2745 2746
    return NULL;
}


2747 2748
/**
 * virQEMUCapsCacheLookup:
 * @cache: capabilities cache to search
 * @binary: path of the QEMU binary, used as the hash key
 *
 * Looks up the capabilities for @binary while holding the cache lock.
 * An entry that virQEMUCapsIsValid() rejects is removed from the
 * table. When no usable entry remains, capabilities are created with
 * virQEMUCapsNewForBinary() and added to the table.
 *
 * Returns the capabilities after taking an additional reference on
 * them via virObjectRef(), or NULL if they could not be created or
 * cached.
 */
virQEMUCapsPtr
virQEMUCapsCacheLookup(virQEMUCapsCachePtr cache, const char *binary)
{
    virQEMUCapsPtr caps;

    virMutexLock(&cache->lock);

    caps = virHashLookup(cache->binaries, binary);

    /* Discard a cached entry that is no longer valid. */
    if (caps != NULL && !virQEMUCapsIsValid(caps)) {
        VIR_DEBUG("Cached capabilities %p no longer valid for %s",
                  caps, binary);
        virHashRemoveEntry(cache->binaries, binary);
        caps = NULL;
    }

    if (caps == NULL) {
        VIR_DEBUG("Creating capabilities for %s", binary);
        caps = virQEMUCapsNewForBinary(binary, cache->libDir,
                                       cache->runUid, cache->runGid);
        if (caps != NULL) {
            VIR_DEBUG("Caching capabilities %p for %s", caps, binary);
            if (virHashAddEntry(cache->binaries, binary, caps) < 0) {
                /* Could not be stored: drop the new object. */
                virObjectUnref(caps);
                caps = NULL;
            }
        }
    }

    VIR_DEBUG("Returning caps %p for %s", caps, binary);
    /* NOTE(review): this is reached with caps == NULL on failure, so
     * virObjectRef() is presumably NULL-safe -- confirm. */
    virObjectRef(caps);

    virMutexUnlock(&cache->lock);
    return caps;
}


2781 2782
/**
 * virQEMUCapsCacheLookupCopy:
 * @cache: capabilities cache to search
 * @binary: path of the QEMU binary
 *
 * Looks up the capabilities for @binary with virQEMUCapsCacheLookup()
 * and duplicates them with virQEMUCapsNewCopy(). The reference
 * obtained from the lookup is released before returning.
 *
 * Returns the result of virQEMUCapsNewCopy(), or NULL if the lookup
 * failed.
 */
virQEMUCapsPtr
virQEMUCapsCacheLookupCopy(virQEMUCapsCachePtr cache, const char *binary)
{
    virQEMUCapsPtr cached;
    virQEMUCapsPtr copy = NULL;

    cached = virQEMUCapsCacheLookup(cache, binary);
    if (cached) {
        copy = virQEMUCapsNewCopy(cached);
        virObjectUnref(cached);
    }

    return copy;
}


void
2797
virQEMUCapsCacheFree(virQEMUCapsCachePtr cache)
2798 2799 2800 2801
{
    if (!cache)
        return;

2802
    VIR_FREE(cache->libDir);
2803 2804 2805 2806
    virHashFree(cache->binaries);
    virMutexDestroy(&cache->lock);
    VIR_FREE(cache);
}
2807 2808

bool
2809
virQEMUCapsUsedQMP(virQEMUCapsPtr qemuCaps)
2810
{
2811
    return qemuCaps->usedQMP;
2812
}