/*
 * storage_backend.c: internal storage driver backend contract
 *
 * Copyright (C) 2007-2013 Red Hat, Inc.
 * Copyright (C) 2007-2008 Daniel P. Berrange
 *
 * This library is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * This library is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with this library.  If not, see
 * <http://www.gnu.org/licenses/>.
 *
 * Author: Daniel P. Berrange <berrange@redhat.com>
 */

#include <config.h>

#include <string.h>
27
#include <stdio.h>
28
#include <regex.h>
29
#include <sys/types.h>
E
Eric Blake 已提交
30
#include <sys/wait.h>
31
#include <unistd.h>
32 33
#include <fcntl.h>
#include <sys/stat.h>
34
#include <sys/param.h>
35
#include <dirent.h>
36
#include "dirname.h"
37 38 39 40
#ifdef __linux__
# include <sys/ioctl.h>
# include <linux/fs.h>
#endif
41

42
#if WITH_SELINUX
43
# include <selinux/selinux.h>
44
#endif
45

46
#include "datatypes.h"
47
#include "virerror.h"
48
#include "viralloc.h"
49
#include "internal.h"
50
#include "secret_conf.h"
51
#include "viruuid.h"
52
#include "virstoragefile.h"
D
Daniel P. Berrange 已提交
53
#include "storage_backend.h"
54
#include "virlog.h"
E
Eric Blake 已提交
55
#include "virfile.h"
56
#include "stat-time.h"
57
#include "virstring.h"
58

59
#if WITH_STORAGE_LVM
60
# include "storage_backend_logical.h"
61 62
#endif
#if WITH_STORAGE_ISCSI
63
# include "storage_backend_iscsi.h"
64
#endif
65
#if WITH_STORAGE_SCSI
66
# include "storage_backend_scsi.h"
67
#endif
D
Dave Allan 已提交
68
#if WITH_STORAGE_MPATH
69
# include "storage_backend_mpath.h"
D
Dave Allan 已提交
70
#endif
71
#if WITH_STORAGE_DISK
72
# include "storage_backend_disk.h"
73 74
#endif
#if WITH_STORAGE_DIR
75
# include "storage_backend_fs.h"
76
#endif
77 78 79
#if WITH_STORAGE_RBD
# include "storage_backend_rbd.h"
#endif
80 81 82
#if WITH_STORAGE_SHEEPDOG
# include "storage_backend_sheepdog.h"
#endif
83

84 85
#define VIR_FROM_THIS VIR_FROM_STORAGE

86 87 88 89 90 91 92 93 94 95 96 97 98 99
/* Table of the storage backend drivers compiled into this build, closed by
 * a NULL sentinel.  Each entry is present only when the matching
 * WITH_STORAGE_* build option is enabled. */
static virStorageBackendPtr backends[] = {
#if WITH_STORAGE_DIR
    &virStorageBackendDirectory,
#endif /* WITH_STORAGE_DIR */
#if WITH_STORAGE_FS
    &virStorageBackendFileSystem,
    &virStorageBackendNetFileSystem,
#endif /* WITH_STORAGE_FS */
#if WITH_STORAGE_LVM
    &virStorageBackendLogical,
#endif /* WITH_STORAGE_LVM */
#if WITH_STORAGE_ISCSI
    &virStorageBackendISCSI,
#endif /* WITH_STORAGE_ISCSI */
#if WITH_STORAGE_SCSI
    &virStorageBackendSCSI,
#endif /* WITH_STORAGE_SCSI */
#if WITH_STORAGE_MPATH
    &virStorageBackendMpath,
#endif /* WITH_STORAGE_MPATH */
#if WITH_STORAGE_DISK
    &virStorageBackendDisk,
#endif /* WITH_STORAGE_DISK */
#if WITH_STORAGE_RBD
    &virStorageBackendRBD,
#endif /* WITH_STORAGE_RBD */
#if WITH_STORAGE_SHEEPDOG
    &virStorageBackendSheepdog,
#endif /* WITH_STORAGE_SHEEPDOG */
    NULL
};
117

118 119 120 121 122 123
/* Identifiers for the external image-creation tools.
 * NOTE(review): judging by the names these stand for qemu-img, kvm-img and
 * qcow-create; no user of these constants is visible in this part of the
 * file -- confirm before relying on them. */
enum {
    TOOL_QEMU_IMG,
    TOOL_KVM_IMG,
    TOOL_QCOW_CREATE,
};

124 125 126
/* Size in bytes (1 MiB) of the read buffer used by
 * virStorageBackendCopyToFD(). */
#define READ_BLOCK_SIZE_DEFAULT  (1024 * 1024)
/* Lower bound in bytes (4 KiB) for the chunk size in which
 * virStorageBackendCopyToFD() writes data and looks for zero blocks. */
#define WRITE_BLOCK_SIZE_DEFAULT (4 * 1024)

127
/*
 * virStorageBackendCopyToFD:
 * @vol: destination volume; only its target path is used, in error messages
 * @inputvol: source volume; its target path is opened read-only and read
 * @fd: already-open descriptor of the destination
 * @total: in: maximum number of bytes to copy; out: decremented by the
 *         number of bytes actually read from @inputvol
 * @want_sparse: when true, chunks that are entirely zero are skipped with
 *               lseek() instead of being written
 *
 * Copies up to *@total bytes from @inputvol into @fd and then calls
 * fdatasync() on @fd.  @fd is not closed.
 *
 * Returns 0 on success, or a negative errno-style value after an error.
 */
static int ATTRIBUTE_NONNULL(2)
virStorageBackendCopyToFD(virStorageVolDefPtr vol,
                          virStorageVolDefPtr inputvol,
                          int fd,
                          unsigned long long *total,
                          bool want_sparse)
{
    int inputfd = -1;
    int amtread = -1;
    int ret = 0;
    size_t rbytes = READ_BLOCK_SIZE_DEFAULT;
    size_t wbytes = 0;
    int interval;
    char *zerobuf = NULL;
    char *buf = NULL;
    struct stat st;

    if ((inputfd = open(inputvol->target.path, O_RDONLY)) < 0) {
        ret = -errno;
        virReportSystemError(errno,
                             _("could not open input path '%s'"),
                             inputvol->target.path);
        goto cleanup;
    }

#ifdef __linux__
    {
        /* BLKBSZGET stores an int.  Reading it straight into a size_t
         * only fills part of the variable, which yields a bogus value on
         * big-endian 64-bit hosts, so go through a correctly typed
         * temporary. */
        int blksz = 0;

        if (ioctl(fd, BLKBSZGET, &blksz) == 0 && blksz > 0)
            wbytes = blksz;
    }
#endif
    /* Not a block device (or ioctl unavailable): use the preferred I/O
     * size reported by fstat(), but never go below the default. */
    if ((wbytes == 0) && fstat(fd, &st) == 0)
        wbytes = st.st_blksize;
    if (wbytes < WRITE_BLOCK_SIZE_DEFAULT)
        wbytes = WRITE_BLOCK_SIZE_DEFAULT;

    /* zerobuf is the reference block for the memcmp() below; this relies
     * on VIR_ALLOC_N returning zero-filled memory -- TODO confirm.
     * Use an explicit -ENOMEM: if errno happened to be 0 here, "-errno"
     * would turn the failure into a successful return value. */
    if (VIR_ALLOC_N(zerobuf, wbytes) < 0) {
        ret = -ENOMEM;
        goto cleanup;
    }

    if (VIR_ALLOC_N(buf, rbytes) < 0) {
        ret = -ENOMEM;
        goto cleanup;
    }

    while (amtread != 0) {
        int amtleft;

        /* Never read past the requested total. */
        if (*total < rbytes)
            rbytes = *total;

        if ((amtread = saferead(inputfd, buf, rbytes)) < 0) {
            ret = -errno;
            virReportSystemError(errno,
                                 _("failed reading from file '%s'"),
                                 inputvol->target.path);
            goto cleanup;
        }
        /* End of input (or nothing left to copy): avoid a pointless
         * zero-length write/seek on the destination. */
        if (amtread == 0)
            break;
        *total -= amtread;

        /* Walk the data just read in wbytes-sized chunks, looking for
         * chunks that are entirely zero. */
        amtleft = amtread;
        do {
            interval = ((wbytes > amtleft) ? amtleft : wbytes);
            int offset = amtread - amtleft;

            if (want_sparse && memcmp(buf+offset, zerobuf, interval) == 0) {
                /* All zeroes: advance the file offset instead of writing. */
                if (lseek(fd, interval, SEEK_CUR) < 0) {
                    ret = -errno;
                    virReportSystemError(errno,
                                         _("cannot extend file '%s'"),
                                         vol->target.path);
                    goto cleanup;
                }
            } else if (safewrite(fd, buf+offset, interval) < 0) {
                ret = -errno;
                virReportSystemError(errno,
                                     _("failed writing to file '%s'"),
                                     vol->target.path);
                goto cleanup;

            }
        } while ((amtleft -= interval) > 0);
    }

    if (fdatasync(fd) < 0) {
        ret = -errno;
        virReportSystemError(errno, _("cannot sync data to file '%s'"),
                             vol->target.path);
        goto cleanup;
    }


    if (VIR_CLOSE(inputfd) < 0) {
        ret = -errno;
        virReportSystemError(errno,
                             _("cannot close file '%s'"),
                             inputvol->target.path);
        goto cleanup;
    }
    inputfd = -1;

cleanup:
    VIR_FORCE_CLOSE(inputfd);

    VIR_FREE(zerobuf);
    VIR_FREE(buf);

    return ret;
}

239
static int
240
virStorageBackendCreateBlockFrom(virConnectPtr conn ATTRIBUTE_UNUSED,
241
                                 virStoragePoolObjPtr pool ATTRIBUTE_UNUSED,
242 243
                                 virStorageVolDefPtr vol,
                                 virStorageVolDefPtr inputvol,
E
Eric Blake 已提交
244
                                 unsigned int flags)
245 246 247 248
{
    int fd = -1;
    int ret = -1;
    unsigned long long remain;
249 250 251
    struct stat st;
    gid_t gid;
    uid_t uid;
252

253 254 255 256 257 258 259 260
    virCheckFlags(VIR_STORAGE_VOL_CREATE_PREALLOC_METADATA, -1);

    if (flags & VIR_STORAGE_VOL_CREATE_PREALLOC_METADATA) {
        virReportError(VIR_ERR_CONFIG_UNSUPPORTED, "%s",
                       _("metadata preallocation is not supported for block "
                         "volumes"));
        goto cleanup;
    }
E
Eric Blake 已提交
261

262
    if ((fd = open(vol->target.path, O_RDWR)) < 0) {
263
        virReportSystemError(errno,
264 265 266 267 268 269 270 271
                             _("cannot create path '%s'"),
                             vol->target.path);
        goto cleanup;
    }

    remain = vol->allocation;

    if (inputvol) {
272
        int res = virStorageBackendCopyToFD(vol, inputvol,
J
Ján Tomko 已提交
273
                                            fd, &remain, false);
274 275 276 277
        if (res < 0)
            goto cleanup;
    }

278
    if (fstat(fd, &st) == -1) {
279
        virReportSystemError(errno, _("stat of '%s' failed"),
280 281 282
                             vol->target.path);
        goto cleanup;
    }
P
Philipp Hahn 已提交
283 284 285
    uid = (vol->target.perms.uid != st.st_uid) ? vol->target.perms.uid : (uid_t) -1;
    gid = (vol->target.perms.gid != st.st_gid) ? vol->target.perms.gid : (gid_t) -1;
    if (((uid != (uid_t) -1) || (gid != (gid_t) -1))
286
        && (fchown(fd, uid, gid) < 0)) {
287
        virReportSystemError(errno,
288
                             _("cannot chown '%s' to (%u, %u)"),
289 290
                             vol->target.path, (unsigned int) uid,
                             (unsigned int) gid);
291 292 293
        goto cleanup;
    }
    if (fchmod(fd, vol->target.perms.mode) < 0) {
294
        virReportSystemError(errno,
295 296 297 298
                             _("cannot set mode of '%s' to %04o"),
                             vol->target.path, vol->target.perms.mode);
        goto cleanup;
    }
299
    if (VIR_CLOSE(fd) < 0) {
300
        virReportSystemError(errno,
301 302 303 304 305 306 307 308
                             _("cannot close file '%s'"),
                             vol->target.path);
        goto cleanup;
    }
    fd = -1;

    ret = 0;
cleanup:
309
    VIR_FORCE_CLOSE(fd);
310 311 312 313

    return ret;
}

E
Eric Blake 已提交
314 315 316 317
/*
 * createRawFile:
 * @fd: open descriptor of the file being created
 * @vol: definition of the new volume (capacity, allocation, target path)
 * @inputvol: optional volume to copy the contents from (may be NULL)
 *
 * Sizes the file to vol->capacity, tries to reserve vol->allocation bytes
 * with fallocate() where available, copies data from @inputvol if given,
 * zero-fills whatever part of the allocation is still missing and finally
 * fsync()s the file.
 *
 * Returns a negative errno-style value on failure; otherwise 0 (or the
 * non-negative result of virStorageBackendCopyToFD() when @inputvol is set).
 */
static int
createRawFile(int fd, virStorageVolDefPtr vol,
              virStorageVolDefPtr inputvol)
{
    bool preallocated = false;
    unsigned long long remain;
    int rc = 0;

    /* Grow to the final size first, so the capacity is visible upfront
     * for progress reporting. */
    if (ftruncate(fd, vol->capacity) < 0) {
        rc = -errno;
        virReportSystemError(errno,
                             _("cannot extend file '%s'"),
                             vol->target.path);
        return rc;
    }

/* Avoid issues with older kernel's <linux/fs.h> namespace pollution. */
#if HAVE_FALLOCATE - 0
    /* Reserve the requested space in one go when possible; ENOSYS and
     * EOPNOTSUPP just mean we fall back to the slower paths below.
     * posix_fallocate is deliberately not used: its fallback writes
     * zeroes block by block, and since data may be copied in right
     * afterwards the file would be written twice. */
    if (fallocate(fd, 0, 0, vol->allocation) == 0) {
        preallocated = true;
    } else if (errno != ENOSYS && errno != EOPNOTSUPP) {
        rc = -errno;
        virReportSystemError(errno,
                             _("cannot allocate %llu bytes in file '%s'"),
                             vol->allocation, vol->target.path);
        return rc;
    }
#endif

    remain = vol->allocation;

    if (inputvol) {
        /* Zero blocks may be skipped when the space is already reserved,
         * or when the allocation is smaller than the input capacity. */
        bool want_sparse = preallocated ||
                           (vol->allocation < inputvol->capacity);

        rc = virStorageBackendCopyToFD(vol, inputvol, fd, &remain, want_sparse);
        if (rc < 0)
            return rc;
    }

    /* Fill the uncopied tail of the allocation unless fallocate() has
     * already taken care of it. */
    if (remain && !preallocated &&
        safezero(fd, vol->allocation - remain, remain) < 0) {
        rc = -errno;
        virReportSystemError(errno, _("cannot fill file '%s'"),
                             vol->target.path);
        return rc;
    }

    if (fsync(fd) < 0) {
        rc = -errno;
        virReportSystemError(errno, _("cannot sync data to file '%s'"),
                             vol->target.path);
        return rc;
    }

    return rc;
}

/*
 * virStorageBackendCreateRaw:
 * @conn: unused
 * @pool: pool the volume belongs to; its type decides whether the file is
 *        opened with VIR_FILE_OPEN_FORK
 * @vol: definition of the raw volume to create
 * @inputvol: optional volume to copy the contents from (may be NULL)
 * @flags: VIR_STORAGE_VOL_CREATE_PREALLOC_METADATA passes the flag check
 *         but is then rejected as unsupported for raw volumes
 *
 * Creates the file at vol->target.path (it must not exist yet, O_EXCL)
 * with the requested mode and ownership and lets createRawFile() populate
 * it.  Encrypted volumes are refused.
 *
 * Returns -1 on failure, otherwise the non-negative result of
 * createRawFile().
 */
int
virStorageBackendCreateRaw(virConnectPtr conn ATTRIBUTE_UNUSED,
                           virStoragePoolObjPtr pool,
                           virStorageVolDefPtr vol,
                           virStorageVolDefPtr inputvol,
                           unsigned int flags)
{
    int rv = -1;
    int rawfd = -1;
    int open_flags = VIR_FILE_OPEN_FORCE_MODE | VIR_FILE_OPEN_FORCE_OWNER;

    virCheckFlags(VIR_STORAGE_VOL_CREATE_PREALLOC_METADATA, -1);

    if (flags & VIR_STORAGE_VOL_CREATE_PREALLOC_METADATA) {
        virReportError(VIR_ERR_CONFIG_UNSUPPORTED, "%s",
                       _("metadata preallocation is not supported for raw "
                         "volumes"));
        goto cleanup;
    }

    if (vol->target.encryption != NULL) {
        virReportError(VIR_ERR_CONFIG_UNSUPPORTED, "%s",
                       _("storage pool does not support encrypted volumes"));
        goto cleanup;
    }

    /* Network filesystem pools additionally request VIR_FILE_OPEN_FORK. */
    if (pool->def->type == VIR_STORAGE_POOL_NETFS)
        open_flags |= VIR_FILE_OPEN_FORK;

    rawfd = virFileOpenAs(vol->target.path,
                          O_RDWR | O_CREAT | O_EXCL,
                          vol->target.perms.mode,
                          vol->target.perms.uid,
                          vol->target.perms.gid,
                          open_flags);
    if (rawfd < 0) {
        /* The negative return value carries the errno. */
        virReportSystemError(-rawfd,
                             _("Failed to create file '%s'"),
                             vol->target.path);
        goto cleanup;
    }

    rv = createRawFile(rawfd, vol, inputvol);
    if (rv < 0) {
        /* createRawFile already reported the exact error. */
        rv = -1;
    }

cleanup:
    VIR_FORCE_CLOSE(rawfd);
    return rv;
}

437 438 439 440 441 442 443 444 445
/*
 * virStorageGenerateSecretUUID:
 * @conn: connection whose secret driver is queried for collisions
 * @uuid: output buffer that receives the generated UUID
 *
 * Generates UUIDs until one is found for which the secret driver's lookup
 * returns nothing, giving up after 65536 attempts.
 *
 * Returns 0 with @uuid filled in on success, -1 on failure.
 */
static int
virStorageGenerateSecretUUID(virConnectPtr conn,
                             unsigned char *uuid)
{
    unsigned tries_left = 65536;

    while (tries_left-- > 0) {
        virSecretPtr existing;

        if (virUUIDGenerate(uuid) < 0) {
            virReportError(VIR_ERR_INTERNAL_ERROR, "%s",
                           _("unable to generate uuid"));
            return -1;
        }

        existing = conn->secretDriver->secretLookupByUUID(conn, uuid);
        if (!existing)
            return 0;

        /* UUID already taken: drop the reference and try another one. */
        virSecretFree(existing);
    }

    virReportError(VIR_ERR_INTERNAL_ERROR, "%s",
                   _("too many conflicts when generating an uuid"));

    return -1;
}

463 464 465 466 467 468 469 470 471
/*
 * virStorageGenerateQcowEncryption:
 * @conn: connection providing the secret driver
 * @vol: volume whose target.encryption must be set and must not have any
 *       secrets yet
 *
 * Defines a new volume-usage secret for vol->target.path through the
 * secret driver, stores a freshly generated passphrase in it and records
 * the secret as the single qcow passphrase secret of the volume's
 * encryption definition.
 *
 * If anything fails after the secret was defined, it is undefined again
 * (when the driver implements secretUndefine).
 *
 * Returns 0 on success, -1 on failure.
 */
static int
virStorageGenerateQcowEncryption(virConnectPtr conn,
                                 virStorageVolDefPtr vol)
{
    virSecretDefPtr def = NULL;
    virStorageEncryptionPtr enc;
    virStorageEncryptionSecretPtr enc_secret = NULL;
    virSecretPtr secret = NULL;
    char *xml = NULL;
    unsigned char value[VIR_STORAGE_QCOW_PASSPHRASE_SIZE];
    int ret = -1;

    /* All of lookup, define and set-value are needed below. */
    if (conn->secretDriver == NULL ||
        conn->secretDriver->secretLookupByUUID == NULL ||
        conn->secretDriver->secretDefineXML == NULL ||
        conn->secretDriver->secretSetValue == NULL) {
        virReportError(VIR_ERR_CONFIG_UNSUPPORTED, "%s",
                       _("secret storage not supported"));
        goto cleanup;
    }

    enc = vol->target.encryption;
    if (enc->nsecrets != 0) {
        virReportError(VIR_ERR_INTERNAL_ERROR, "%s",
                       _("secrets already defined"));
        goto cleanup;
    }

    if (VIR_ALLOC(enc_secret) < 0 || VIR_REALLOC_N(enc->secrets, 1) < 0 ||
        VIR_ALLOC(def) < 0)
        goto cleanup;

    def->ephemeral = false;
    def->private = false;
    if (virStorageGenerateSecretUUID(conn, def->uuid) < 0)
        goto cleanup;

    def->usage_type = VIR_SECRET_USAGE_TYPE_VOLUME;
    if (VIR_STRDUP(def->usage.volume, vol->target.path) < 0)
        goto cleanup;

    /* The definition is only needed to produce the XML document. */
    xml = virSecretDefFormat(def);
    virSecretDefFree(def);
    def = NULL;
    if (xml == NULL)
        goto cleanup;

    secret = conn->secretDriver->secretDefineXML(conn, xml, 0);
    VIR_FREE(xml);
    if (secret == NULL)
        goto cleanup;

    if (virStorageGenerateQcowPassphrase(value) < 0)
        goto cleanup;

    if (conn->secretDriver->secretSetValue(secret, value, sizeof(value), 0) < 0)
        goto cleanup;

    enc_secret->type = VIR_STORAGE_ENCRYPTION_SECRET_TYPE_PASSPHRASE;
    memcpy(enc_secret->uuid, secret->uuid, VIR_UUID_BUFLEN);
    enc->format = VIR_STORAGE_ENCRYPTION_FORMAT_QCOW;
    enc->secrets[0] = enc_secret; /* Space for secrets[0] allocated above */
    enc_secret = NULL;            /* ownership moved into enc->secrets */
    enc->nsecrets = 1;

    ret = 0;

cleanup:
    if (secret != NULL) {
        /* Do not leave a half-configured secret behind on failure. */
        if (ret != 0 &&
            conn->secretDriver->secretUndefine != NULL)
            conn->secretDriver->secretUndefine(secret);
        virSecretFree(secret);
    }
    virSecretDefFree(def);
    VIR_FREE(enc_secret);
    return ret;
}

545 546 547 548 549
/*
 * virStorageBackendCreateExecCommand:
 * @pool: pool the volume lives in
 * @vol: volume being created; target path and perms are used
 * @cmd: fully prepared creation command
 *
 * Runs @cmd to create vol->target.path.  On a NETFS pool the command is
 * first tried under the uid/gid requested for the volume when those differ
 * from the current identity; if that attempt does not produce the file the
 * command is run again without changing identity.  Afterwards ownership
 * and mode of the file are adjusted to vol->target.perms.
 *
 * Returns 0 on success, -1 on failure.
 */
static int
virStorageBackendCreateExecCommand(virStoragePoolObjPtr pool,
                                   virStorageVolDefPtr vol,
                                   virCommandPtr cmd)
{
    struct stat sb;
    uid_t chown_uid = (uid_t) -1;
    gid_t chown_gid = (gid_t) -1;
    bool created = false;
    bool run_as_owner = false;

    if (pool->def->type == VIR_STORAGE_POOL_NETFS) {
        /* Running as root while a specific non-root owner is requested. */
        bool root_wants_other_uid = getuid() == 0 &&
                                    vol->target.perms.uid != (uid_t) -1 &&
                                    vol->target.perms.uid != 0;

        /* ...or a specific group other than our own is requested. */
        run_as_owner = root_wants_other_uid ||
                       (vol->target.perms.gid != (gid_t) -1 &&
                        vol->target.perms.gid != getgid());
    }

    if (run_as_owner) {
        virCommandSetUID(cmd, vol->target.perms.uid);
        virCommandSetGID(cmd, vol->target.perms.gid);

        /* The attempt only counts if the command succeeded and the file
         * is really there. */
        if (virCommandRun(cmd, NULL) == 0 &&
            stat(vol->target.path, &sb) >= 0)
            created = true;
    }

    /* don't change uid/gid if we retry */
    virCommandSetUID(cmd, -1);
    virCommandSetGID(cmd, -1);

    if (!created) {
        if (virCommandRun(cmd, NULL) < 0)
            return -1;

        if (stat(vol->target.path, &sb) < 0) {
            virReportSystemError(errno,
                                 _("failed to create %s"), vol->target.path);
            return -1;
        }
    }

    /* Only touch the ids that differ from what is on disk. */
    if (vol->target.perms.uid != sb.st_uid)
        chown_uid = vol->target.perms.uid;
    if (vol->target.perms.gid != sb.st_gid)
        chown_gid = vol->target.perms.gid;

    if (chown_uid != (uid_t) -1 || chown_gid != (gid_t) -1) {
        if (chown(vol->target.path, chown_uid, chown_gid) < 0) {
            virReportSystemError(errno,
                                 _("cannot chown %s to (%u, %u)"),
                                 vol->target.path, (unsigned int) chown_uid,
                                 (unsigned int) chown_gid);
            return -1;
        }
    }

    if (chmod(vol->target.path, vol->target.perms.mode) < 0) {
        virReportSystemError(errno,
                             _("cannot set mode of '%s' to %04o"),
                             vol->target.path, vol->target.perms.mode);
        return -1;
    }

    return 0;
}

606 607 608 609
/* How a given qemu-img binary accepts the backing store format, as
 * detected by virStorageBackendQEMUImgBackingFormat().  The values are
 * ordered: callers compare with ">= QEMU_IMG_BACKING_FORMAT_OPTIONS". */
enum {
    QEMU_IMG_BACKING_FORMAT_NONE = 0,           /* no known way to pass it */
    QEMU_IMG_BACKING_FORMAT_FLAG = 1,           /* "-F" command line flag */
    QEMU_IMG_BACKING_FORMAT_OPTIONS = 2,        /* "-o" option string */
    QEMU_IMG_BACKING_FORMAT_OPTIONS_COMPAT = 3, /* "-o", and "compat" is listed */
};

613 614 615 616 617 618 619 620 621 622 623 624 625 626 627 628 629 630 631 632 633 634 635 636 637
/*
 * virStorageBackendQemuImgSupportsCompat:
 * @qemuimg: path of the qemu-img binary to probe
 *
 * Runs "@qemuimg create -o ? -f qcow2 /dev/null" with LC_ALL=C and looks
 * for a line starting with "compat " in the captured output.
 *
 * Returns true if such a line is present, false otherwise (including when
 * the command could not be run).
 */
static bool
virStorageBackendQemuImgSupportsCompat(const char *qemuimg)
{
    bool ret = false;
    /* Start from NULL so the cleanup path and the strstr() below never see
     * an indeterminate pointer, whatever the command helpers do with it. */
    char *output = NULL;
    virCommandPtr cmd = NULL;

    cmd = virCommandNewArgList(qemuimg, "create", "-o", "?", "-f", "qcow2",
                               "/dev/null", NULL);

    virCommandAddEnvString(cmd, "LC_ALL=C");
    virCommandSetOutputBuffer(cmd, &output);

    if (virCommandRun(cmd, NULL) < 0)
        goto cleanup;

    if (output && strstr(output, "\ncompat "))
        ret = true;

cleanup:
    virCommandFree(cmd);
    VIR_FREE(output);
    return ret;
}

638 639
static int
virStorageBackendQEMUImgBackingFormat(const char *qemuimg)
640 641 642 643 644 645
{
    char *help = NULL;
    char *start;
    char *end;
    char *tmp;
    int ret = -1;
646
    int exitstatus;
647
    virCommandPtr cmd = virCommandNewArgList(qemuimg, "-h", NULL);
648

649 650 651
    virCommandAddEnvString(cmd, "LC_ALL=C");
    virCommandSetOutputBuffer(cmd, &help);
    virCommandClearCaps(cmd);
652

653 654 655
    /* qemuimg doesn't return zero exit status on -h,
     * therefore we need to provide pointer for storing
     * exit status, although we don't parse it any later */
656
    if (virCommandRun(cmd, &exitstatus) < 0)
657 658
        goto cleanup;

659 660
    if ((start = strstr(help, " create ")) == NULL ||
        (end = strstr(start, "\n")) == NULL) {
661 662 663
        virReportError(VIR_ERR_INTERNAL_ERROR,
                       _("unable to parse qemu-img output '%s'"),
                       help);
664 665
        goto cleanup;
    }
666
    if (((tmp = strstr(start, "-F fmt")) && tmp < end) ||
667
        ((tmp = strstr(start, "-F backing_fmt")) && tmp < end)) {
668
        ret = QEMU_IMG_BACKING_FORMAT_FLAG;
669 670 671 672 673 674
    } else if ((tmp = strstr(start, "[-o options]")) && tmp < end) {
        if (virStorageBackendQemuImgSupportsCompat(qemuimg))
            ret = QEMU_IMG_BACKING_FORMAT_OPTIONS_COMPAT;
        else
            ret = QEMU_IMG_BACKING_FORMAT_OPTIONS;
    } else {
675
        ret = QEMU_IMG_BACKING_FORMAT_NONE;
676
    }
677 678

cleanup:
679
    virCommandFree(cmd);
680 681 682 683
    VIR_FREE(help);
    return ret;
}

684 685 686 687
/*
 * virStorageBackendCreateQemuImgOpts:
 * @opts: on success receives the comma-separated option string built here
 * @backingType: backing store format name, or NULL to omit "backing_fmt"
 * @encryption: add "encryption=on"
 * @preallocate: add "preallocation=metadata"
 * @format: volume format; feature names are only added for
 *          VIR_STORAGE_FILE_QCOW2
 * @compat: compat level string, or NULL to omit "compat"
 * @features: bitmap of enabled format features, or NULL
 *
 * Builds the value for qemu-img's "-o" argument.  The lazy refcounts
 * feature is refused when @compat is "0.10".
 *
 * Returns 0 on success, -1 on error (with *@opts left untouched).
 */
static int
virStorageBackendCreateQemuImgOpts(char **opts,
                                   const char *backingType,
                                   bool encryption,
                                   bool preallocate,
                                   int format,
                                   const char *compat,
                                   virBitmapPtr features)
{
    virBuffer buf = VIR_BUFFER_INITIALIZER;
    size_t i;

    if (backingType)
        virBufferAsprintf(&buf, "backing_fmt=%s,", backingType);
    if (encryption)
        virBufferAddLit(&buf, "encryption=on,");
    if (preallocate)
        virBufferAddLit(&buf, "preallocation=metadata,");

    if (compat)
        virBufferAsprintf(&buf, "compat=%s,", compat);
    if (features && format == VIR_STORAGE_FILE_QCOW2) {
        for (i = 0; i < VIR_STORAGE_FILE_FEATURE_LAST; i++) {
            /* Reset for every bit: the lookup result is ignored, so a
             * failed lookup must read as "feature not set" rather than
             * as an indeterminate or stale value. */
            bool b = false;

            ignore_value(virBitmapGetBit(features, i, &b));
            if (b) {
                switch ((enum virStorageFileFeature) i) {
                case VIR_STORAGE_FILE_FEATURE_LAZY_REFCOUNTS:
                    if (STREQ_NULLABLE(compat, "0.10")) {
                        virReportError(VIR_ERR_CONFIG_UNSUPPORTED,
                                       _("Feature %s not supported with compat"
                                         " level %s"),
                                       virStorageFileFeatureTypeToString(i),
                                       compat);
                        goto error;
                    }
                    break;

                /* coverity[dead_error_begin] */
                case VIR_STORAGE_FILE_FEATURE_LAST:
                    ;
                }
                virBufferAsprintf(&buf, "%s,",
                                  virStorageFileFeatureTypeToString(i));
            }
        }
    }

    /* Every item above was appended with a trailing comma; drop the
     * last one. */
    virBufferTrim(&buf, ",", -1);

    if (virBufferError(&buf))
        goto no_memory;

    *opts = virBufferContentAndReset(&buf);
    return 0;

no_memory:
    virReportOOMError();
error:
    virBufferFreeAndReset(&buf);
    return -1;
}

747 748 749 750 751 752 753 754
/*
 * virStorageBackendCreateQemuImgCmd:
 * @conn: connection, used when an encryption secret has to be generated
 * @pool: pool of the volume; its target path is the base for relative
 *        backing store paths
 * @vol: definition of the volume to create
 * @inputvol: optional volume to convert from (may be NULL)
 * @flags: 0 or VIR_STORAGE_VOL_CREATE_PREALLOC_METADATA
 * @create_tool: path of the qemu-img compatible binary
 * @imgformat: one of the QEMU_IMG_BACKING_FORMAT_* values describing what
 *             @create_tool supports
 *
 * Validates the request and builds the command line that creates @vol:
 * "convert" when @inputvol is given, "create" otherwise.
 *
 * Returns the new command (to be released with virCommandFree() by the
 * caller), or NULL on error.
 */
virCommandPtr
virStorageBackendCreateQemuImgCmd(virConnectPtr conn,
                                  virStoragePoolObjPtr pool,
                                  virStorageVolDefPtr vol,
                                  virStorageVolDefPtr inputvol,
                                  unsigned int flags,
                                  const char *create_tool,
                                  int imgformat)
{
    virCommandPtr cmd = NULL;
    bool do_encryption = (vol->target.encryption != NULL);
    unsigned long long int size_arg;
    bool preallocate = !!(flags & VIR_STORAGE_VOL_CREATE_PREALLOC_METADATA);
    const char *type;
    const char *backingType = NULL;
    const char *inputPath = NULL;
    const char *inputType = NULL;
    const char *compat = vol->target.compat;
    char *opts = NULL;
    bool convert = false;
    bool backing = false;

    virCheckFlags(VIR_STORAGE_VOL_CREATE_PREALLOC_METADATA, NULL);

    /* Treat output block devices as 'raw' format */
    type = virStorageFileFormatTypeToString(vol->type == VIR_STORAGE_VOL_BLOCK ?
                                            VIR_STORAGE_FILE_RAW :
                                            vol->target.format);

    if (!type) {
        virReportError(VIR_ERR_INTERNAL_ERROR,
                       _("unknown storage vol type %d"),
                       vol->target.format);
        return NULL;
    }

    /* Preallocation, compat level and feature bits are qcow2-only. */
    if (preallocate && vol->target.format != VIR_STORAGE_FILE_QCOW2) {
        virReportError(VIR_ERR_CONFIG_UNSUPPORTED, "%s",
                       _("metadata preallocation only available with qcow2"));
        return NULL;
    }
    if (vol->target.compat && vol->target.format != VIR_STORAGE_FILE_QCOW2) {
        virReportError(VIR_ERR_CONFIG_UNSUPPORTED, "%s",
                       _("compatibility option only available with qcow2"));
        return NULL;
    }
    if (vol->target.features && vol->target.format != VIR_STORAGE_FILE_QCOW2) {
        virReportError(VIR_ERR_CONFIG_UNSUPPORTED, "%s",
                       _("format features only available with qcow2"));
        return NULL;
    }

    if (inputvol) {
        if (!(inputPath = inputvol->target.path)) {
            virReportError(VIR_ERR_INVALID_ARG, "%s",
                           _("missing input volume target path"));
            return NULL;
        }

        /* Input block devices are read as 'raw' as well. */
        inputType = virStorageFileFormatTypeToString(inputvol->type == VIR_STORAGE_VOL_BLOCK ?
                                                     VIR_STORAGE_FILE_RAW :
                                                     inputvol->target.format);

        if (!inputType) {
            virReportError(VIR_ERR_INTERNAL_ERROR,
                           _("unknown storage vol type %d"),
                           inputvol->target.format);
            return NULL;
        }

    }

    if (vol->backingStore.path) {
        int accessRetCode = -1;
        int accessErrno;
        char *absolutePath = NULL;

        backingType = virStorageFileFormatTypeToString(vol->backingStore.format);

        if (preallocate) {
            virReportError(VIR_ERR_CONFIG_UNSUPPORTED, "%s",
                           _("metadata preallocation conflicts with backing"
                             " store"));
            return NULL;
        }

        /* XXX: Not strictly required: qemu-img has an option to specify a
         * different backing store, not really sure what use it serves
         * though, and it may cause issues with lvm. Untested essentially.
         */
        if (inputvol &&
            STRNEQ_NULLABLE(inputvol->backingStore.path, vol->backingStore.path)) {
            virReportError(VIR_ERR_INTERNAL_ERROR, "%s",
                           _("a different backing store cannot be specified."));
            return NULL;
        }

        if (backingType == NULL) {
            virReportError(VIR_ERR_INTERNAL_ERROR,
                           _("unknown storage vol backing store type %d"),
                           vol->backingStore.format);
            return NULL;
        }

        /* Convert relative backing store paths to absolute paths for access
         * validation.
         */
        if ('/' != *(vol->backingStore.path) &&
            virAsprintf(&absolutePath, "%s/%s", pool->def->target.path,
                        vol->backingStore.path) < 0)
            return NULL;
        accessRetCode = access(absolutePath ? absolutePath
                               : vol->backingStore.path, R_OK);
        /* Save errno right away: releasing absolutePath below may
         * overwrite it before the error gets reported. */
        accessErrno = errno;
        VIR_FREE(absolutePath);
        if (accessRetCode != 0) {
            virReportSystemError(accessErrno,
                                 _("inaccessible backing store volume %s"),
                                 vol->backingStore.path);
            return NULL;
        }
    }

    if (do_encryption) {
        virStorageEncryptionPtr enc;

        if (vol->target.format != VIR_STORAGE_FILE_QCOW &&
            vol->target.format != VIR_STORAGE_FILE_QCOW2) {
            virReportError(VIR_ERR_CONFIG_UNSUPPORTED,
                           _("qcow volume encryption unsupported with "
                             "volume format %s"), type);
            return NULL;
        }
        enc = vol->target.encryption;
        if (enc->format != VIR_STORAGE_ENCRYPTION_FORMAT_QCOW &&
            enc->format != VIR_STORAGE_ENCRYPTION_FORMAT_DEFAULT) {
            virReportError(VIR_ERR_CONFIG_UNSUPPORTED,
                           _("unsupported volume encryption format %d"),
                           vol->target.encryption->format);
            return NULL;
        }
        if (enc->nsecrets > 1) {
            virReportError(VIR_ERR_XML_ERROR, "%s",
                           _("too many secrets for qcow encryption"));
            return NULL;
        }
        /* No usable secret supplied: generate one. */
        if (enc->format == VIR_STORAGE_ENCRYPTION_FORMAT_DEFAULT ||
            enc->nsecrets == 0) {
            if (virStorageGenerateQcowEncryption(conn, vol) < 0)
                return NULL;
        }
    }

    /* Size in KB */
    size_arg = VIR_DIV_UP(vol->capacity, 1024);

    cmd = virCommandNew(create_tool);

    /* An input volume means "convert"; a backing store is only passed
     * when creating from scratch. */
    convert = !!inputvol;
    backing = !inputvol && vol->backingStore.path;

    if (convert)
        virCommandAddArgList(cmd, "convert", "-f", inputType, "-O", type, NULL);
    else
        virCommandAddArgList(cmd, "create", "-f", type, NULL);

    if (backing)
        virCommandAddArgList(cmd, "-b", vol->backingStore.path, NULL);

    if (imgformat >= QEMU_IMG_BACKING_FORMAT_OPTIONS) {
        /* When the tool knows "compat" and none was requested, pin qcow2
         * images to compat level 0.10. */
        if (vol->target.format == VIR_STORAGE_FILE_QCOW2 && !compat &&
            imgformat == QEMU_IMG_BACKING_FORMAT_OPTIONS_COMPAT)
            compat = "0.10";

        if (virStorageBackendCreateQemuImgOpts(&opts,
                                               backing ? backingType : NULL,
                                               do_encryption, preallocate,
                                               vol->target.format,
                                               compat,
                                               vol->target.features) < 0) {
            virCommandFree(cmd);
            return NULL;
        }
        if (opts)
            virCommandAddArgList(cmd, "-o", opts, NULL);
        VIR_FREE(opts);
    } else {
        if (backing) {
            if (imgformat == QEMU_IMG_BACKING_FORMAT_FLAG)
                virCommandAddArgList(cmd, "-F", backingType, NULL);
            else
                VIR_DEBUG("Unable to set backing store format for %s with %s",
                          vol->target.path, create_tool);
        }
        if (do_encryption)
            virCommandAddArg(cmd, "-e");
    }

    /* Positional arguments: [input] output [size]. */
    if (convert)
        virCommandAddArg(cmd, inputPath);
    virCommandAddArg(cmd, vol->target.path);
    if (!convert)
        virCommandAddArgFormat(cmd, "%lluK", size_arg);

    return cmd;
}

/*
 * Create (or convert into) volume @vol by running kvm-img or qemu-img.
 *
 * The tool is looked up in $PATH, its backing-format capabilities are
 * probed, the command line is built and finally executed.
 *
 * Returns the result of executing the command, or -1 if no tool was
 * found, probing failed or the command could not be built.
 */
static int
virStorageBackendCreateQemuImg(virConnectPtr conn,
                               virStoragePoolObjPtr pool,
                               virStorageVolDefPtr vol,
                               virStorageVolDefPtr inputvol,
                               unsigned int flags)
{
    char *tool_path = NULL;
    virCommandPtr img_cmd = NULL;
    int backing_fmt;
    int rc = -1;

    virCheckFlags(VIR_STORAGE_VOL_CREATE_PREALLOC_METADATA, -1);

    /* KVM is usually ahead of qemu on features, so try that first */
    if (!(tool_path = virFindFileInPath("kvm-img")) &&
        !(tool_path = virFindFileInPath("qemu-img"))) {
        virReportError(VIR_ERR_INTERNAL_ERROR,
                       "%s", _("unable to find kvm-img or qemu-img"));
        return -1;
    }

    backing_fmt = virStorageBackendQEMUImgBackingFormat(tool_path);
    if (backing_fmt >= 0) {
        img_cmd = virStorageBackendCreateQemuImgCmd(conn, pool, vol, inputvol,
                                                    flags, tool_path,
                                                    backing_fmt);
        if (img_cmd) {
            rc = virStorageBackendCreateExecCommand(pool, vol, img_cmd);
            virCommandFree(img_cmd);
        }
    }

    VIR_FREE(tool_path);
    return rc;
}

/*
 * Xen removed the fully-functional qemu-img, and replaced it
 * with a partially functional qcow-create. Go figure ??!?
 */
static int
999
virStorageBackendCreateQcowCreate(virConnectPtr conn ATTRIBUTE_UNUSED,
1000
                                  virStoragePoolObjPtr pool,
1001
                                  virStorageVolDefPtr vol,
1002
                                  virStorageVolDefPtr inputvol,
E
Eric Blake 已提交
1003
                                  unsigned int flags)
1004
{
1005
    int ret;
E
Eric Blake 已提交
1006
    char *size;
1007
    virCommandPtr cmd;
1008

1009 1010 1011 1012 1013 1014 1015 1016
    virCheckFlags(VIR_STORAGE_VOL_CREATE_PREALLOC_METADATA, -1);

    if (flags & VIR_STORAGE_VOL_CREATE_PREALLOC_METADATA) {
        virReportError(VIR_ERR_CONFIG_UNSUPPORTED, "%s",
                       _("metadata preallocation is not supported with "
                         "qcow-create"));
        return -1;
    }
E
Eric Blake 已提交
1017

1018
    if (inputvol) {
1019 1020
        virReportError(VIR_ERR_INTERNAL_ERROR, "%s",
                       _("cannot copy from volume with qcow-create"));
1021 1022 1023
        return -1;
    }

1024
    if (vol->target.format != VIR_STORAGE_FILE_QCOW2) {
1025 1026 1027
        virReportError(VIR_ERR_INTERNAL_ERROR,
                       _("unsupported storage vol type %d"),
                       vol->target.format);
1028 1029 1030
        return -1;
    }
    if (vol->backingStore.path != NULL) {
1031 1032 1033
        virReportError(VIR_ERR_CONFIG_UNSUPPORTED, "%s",
                       _("copy-on-write image not supported with "
                         "qcow-create"));
1034 1035
        return -1;
    }
1036
    if (vol->target.encryption != NULL) {
1037 1038 1039
        virReportError(VIR_ERR_CONFIG_UNSUPPORTED,
                       "%s", _("encrypted volumes not supported with "
                               "qcow-create"));
1040 1041
        return -1;
    }
1042 1043

    /* Size in MB - yes different units to qemu-img :-( */
1044
    if (virAsprintf(&size, "%llu",
1045
                    VIR_DIV_UP(vol->capacity, (1024 * 1024))) < 0)
E
Eric Blake 已提交
1046
        return -1;
1047

1048
    cmd = virCommandNewArgList("qcow-create", size, vol->target.path, NULL);
1049

1050 1051
    ret = virStorageBackendCreateExecCommand(pool, vol, cmd);
    virCommandFree(cmd);
E
Eric Blake 已提交
1052
    VIR_FREE(size);
1053

1054
    return ret;
1055 1056
}

1057
virStorageBackendBuildVolFrom
1058
virStorageBackendFSImageToolTypeToFunc(int tool_type)
1059 1060 1061 1062 1063 1064 1065 1066
{
    switch (tool_type) {
    case TOOL_KVM_IMG:
    case TOOL_QEMU_IMG:
        return virStorageBackendCreateQemuImg;
    case TOOL_QCOW_CREATE:
        return virStorageBackendCreateQcowCreate;
    default:
1067 1068 1069
        virReportError(VIR_ERR_INTERNAL_ERROR,
                       _("Unknown file create tool type '%d'."),
                       tool_type);
1070 1071 1072 1073 1074 1075 1076 1077 1078 1079 1080 1081 1082 1083 1084 1085 1086 1087 1088 1089 1090 1091 1092 1093 1094 1095 1096
    }

    return NULL;
}

/*
 * Look for an image creation tool in $PATH, trying kvm-img, then
 * qemu-img, then qcow-create.
 *
 * If @tool is non-NULL it receives the path of the tool that was found
 * (NULL when none was found); otherwise the path is freed here.
 *
 * Returns the matching TOOL_* value, or -1 if no tool was found.
 */
int
virStorageBackendFindFSImageTool(char **tool)
{
    /* Candidates in order of preference; the two arrays are parallel */
    const char *names[] = { "kvm-img", "qemu-img", "qcow-create" };
    const int types[] = { TOOL_KVM_IMG, TOOL_QEMU_IMG, TOOL_QCOW_CREATE };
    char *found = NULL;
    int found_type = -1;
    size_t idx;

    for (idx = 0; idx < sizeof(names) / sizeof(names[0]); idx++) {
        found = virFindFileInPath(names[idx]);
        if (found != NULL) {
            found_type = types[idx];
            break;
        }
    }

    if (!tool)
        VIR_FREE(found);
    else
        *tool = found;

    return found_type;
}

1097
virStorageBackendBuildVolFrom
1098
virStorageBackendGetBuildVolFromFunction(virStorageVolDefPtr vol,
1099 1100 1101 1102 1103 1104 1105 1106 1107 1108 1109
                                         virStorageVolDefPtr inputvol)
{
    int tool_type;

    if (!inputvol)
        return NULL;

    /* If either volume is a non-raw file vol, we need to use an external
     * tool for converting
     */
    if ((vol->type == VIR_STORAGE_VOL_FILE &&
1110
         vol->target.format != VIR_STORAGE_FILE_RAW) ||
1111
        (inputvol->type == VIR_STORAGE_VOL_FILE &&
1112
         inputvol->target.format != VIR_STORAGE_FILE_RAW)) {
1113

D
Daniel P. Berrange 已提交
1114
        if ((tool_type = virStorageBackendFindFSImageTool(NULL)) < 0) {
1115 1116 1117
            virReportError(VIR_ERR_INTERNAL_ERROR, "%s",
                           _("creation of non-raw file images is "
                             "not supported without qemu-img."));
1118 1119 1120
            return NULL;
        }

1121
        return virStorageBackendFSImageToolTypeToFunc(tool_type);
1122 1123
    }

1124 1125 1126 1127
    if (vol->type == VIR_STORAGE_VOL_BLOCK)
        return virStorageBackendCreateBlockFrom;
    else
        return virStorageBackendCreateRaw;
1128
}
1129

1130

1131
virStorageBackendPtr
1132 1133
virStorageBackendForType(int type)
{
1134
    size_t i;
1135
    for (i = 0; backends[i]; i++)
1136 1137 1138
        if (backends[i]->type == type)
            return backends[i];

1139 1140
    virReportError(VIR_ERR_INTERNAL_ERROR,
                   _("missing backend for pool type %d"), type);
1141 1142 1143 1144
    return NULL;
}


1145 1146 1147
/*
 * Allows caller to silently ignore files with improper mode
 *
1148 1149
 * Returns -1 on error, -2 if file mode is unexpected or the
 * volume is a dangling symbolic link.
1150
 */
1151
int
1152
virStorageBackendVolOpenCheckMode(const char *path, unsigned int flags)
1153
{
1154 1155
    int fd, mode = 0;
    struct stat sb;
1156
    char *base = last_component(path);
1157

1158 1159 1160 1161 1162 1163 1164 1165 1166 1167 1168 1169 1170 1171 1172
    if (lstat(path, &sb) < 0) {
        virReportSystemError(errno,
                             _("cannot stat file '%s'"),
                             path);
        return -1;
    }

    if (S_ISFIFO(sb.st_mode)) {
        VIR_WARN("ignoring FIFO '%s'", path);
        return -2;
    } else if (S_ISSOCK(sb.st_mode)) {
        VIR_WARN("ignoring socket '%s'", path);
        return -2;
    }

1173
    if ((fd = open(path, O_RDONLY|O_NONBLOCK|O_NOCTTY)) < 0) {
1174
        if ((errno == ENOENT || errno == ELOOP) &&
1175
            S_ISLNK(sb.st_mode)) {
1176 1177 1178 1179
            VIR_WARN("ignoring dangling symlink '%s'", path);
            return -2;
        }

1180
        virReportSystemError(errno,
1181
                             _("cannot open volume '%s'"),
1182
                             path);
1183 1184 1185
        return -1;
    }

1186 1187 1188 1189 1190 1191 1192 1193
    if (fstat(fd, &sb) < 0) {
        virReportSystemError(errno,
                             _("cannot stat file '%s'"),
                             path);
        VIR_FORCE_CLOSE(fd);
        return -1;
    }

1194 1195 1196 1197 1198 1199
    if (S_ISREG(sb.st_mode))
        mode = VIR_STORAGE_VOL_OPEN_REG;
    else if (S_ISCHR(sb.st_mode))
        mode = VIR_STORAGE_VOL_OPEN_CHAR;
    else if (S_ISBLK(sb.st_mode))
        mode = VIR_STORAGE_VOL_OPEN_BLOCK;
1200 1201 1202 1203 1204 1205 1206 1207 1208 1209
    else if (S_ISDIR(sb.st_mode)) {
        mode = VIR_STORAGE_VOL_OPEN_DIR;

        if (STREQ(base, ".") ||
            STREQ(base, "..")) {
            VIR_FORCE_CLOSE(fd);
            VIR_INFO("Skipping special dir '%s'", base);
            return -2;
        }
    }
1210 1211

    if (!(mode & flags)) {
1212
        VIR_FORCE_CLOSE(fd);
1213
        VIR_INFO("Skipping volume '%s'", path);
1214 1215

        if (mode & VIR_STORAGE_VOL_OPEN_ERROR) {
1216 1217
            virReportError(VIR_ERR_INTERNAL_ERROR,
                           _("unexpected storage mode for '%s'"), path);
1218 1219 1220 1221 1222 1223 1224 1225 1226 1227 1228 1229 1230 1231 1232 1233 1234 1235
            return -1;
        }

        return -2;
    }

    return fd;
}

/*
 * Open the volume at @path with the default set of accepted file types.
 *
 * Return values are those of virStorageBackendVolOpenCheckMode().
 */
int
virStorageBackendVolOpen(const char *path)
{
    const unsigned int default_flags = VIR_STORAGE_VOL_OPEN_DEFAULT;

    return virStorageBackendVolOpenCheckMode(path, default_flags);
}

/*
 * Open target->path with @openflags, refresh @target (and optionally
 * @allocation / @capacity) from the open file, then close it again.
 *
 * Returns the negative value from the open step if it fails, otherwise
 * the result of virStorageBackendUpdateVolTargetInfoFD().
 */
int
virStorageBackendUpdateVolTargetInfo(virStorageVolTargetPtr target,
                                     unsigned long long *allocation,
                                     unsigned long long *capacity,
                                     unsigned int openflags)
{
    int rc;
    int volfd = virStorageBackendVolOpenCheckMode(target->path, openflags);

    if (volfd < 0)
        return volfd;

    rc = virStorageBackendUpdateVolTargetInfoFD(target, volfd,
                                                allocation, capacity);
    VIR_FORCE_CLOSE(volfd);

    return rc;
}

1256
int
1257 1258 1259
virStorageBackendUpdateVolInfoFlags(virStorageVolDefPtr vol,
                                    int withCapacity,
                                    unsigned int openflags)
1260 1261 1262
{
    int ret;

1263
    if ((ret = virStorageBackendUpdateVolTargetInfo(&vol->target,
1264 1265 1266
                                    &vol->allocation,
                                    withCapacity ? &vol->capacity : NULL,
                                    openflags)) < 0)
1267 1268 1269
        return ret;

    if (vol->backingStore.path &&
1270
        (ret = virStorageBackendUpdateVolTargetInfo(&vol->backingStore,
1271 1272
                                            NULL, NULL,
                                            VIR_STORAGE_VOL_OPEN_DEFAULT)) < 0)
1273 1274 1275 1276 1277
        return ret;

    return 0;
}

1278 1279 1280 1281 1282 1283 1284
/*
 * Same as virStorageBackendUpdateVolInfoFlags(), opening the volume
 * with the default open flags.
 */
int
virStorageBackendUpdateVolInfo(virStorageVolDefPtr vol,
                               int withCapacity)
{
    const unsigned int default_flags = VIR_STORAGE_VOL_OPEN_DEFAULT;

    return virStorageBackendUpdateVolInfoFlags(vol, withCapacity,
                                               default_flags);
}

1285 1286 1287 1288
/*
 * virStorageBackendUpdateVolTargetInfoFD:
 * @conn: connection to report errors on
 * @target: target definition ptr of volume to update
1289
 * @fd: fd of storage volume to update, via virStorageBackendOpenVol*
1290 1291 1292
 * @allocation: If not NULL, updated allocation information will be stored
 * @capacity: If not NULL, updated capacity info will be stored
 *
1293
 * Returns 0 for success, -1 on a legitimate error condition.
1294
 */
1295
int
1296
virStorageBackendUpdateVolTargetInfoFD(virStorageVolTargetPtr target,
1297 1298 1299
                                       int fd,
                                       unsigned long long *allocation,
                                       unsigned long long *capacity)
1300 1301
{
    struct stat sb;
1302
#if WITH_SELINUX
1303 1304 1305 1306
    security_context_t filecon = NULL;
#endif

    if (fstat(fd, &sb) < 0) {
1307
        virReportSystemError(errno,
1308
                             _("cannot stat file '%s'"),
1309
                             target->path);
1310 1311 1312
        return -1;
    }

1313 1314
    if (allocation) {
        if (S_ISREG(sb.st_mode)) {
1315
#ifndef WIN32
1316
            *allocation = (unsigned long long)sb.st_blocks *
1317
                          (unsigned long long)DEV_BSIZE;
D
Daniel P. Berrange 已提交
1318
#else
1319
            *allocation = sb.st_size;
D
Daniel P. Berrange 已提交
1320
#endif
1321 1322 1323 1324 1325
            /* Regular files may be sparse, so logical size (capacity) is not same
             * as actual allocation above
             */
            if (capacity)
                *capacity = sb.st_size;
1326 1327 1328 1329 1330
        } else if (S_ISDIR(sb.st_mode)) {
            *allocation = 0;
            if (capacity)
                *capacity = 0;

1331 1332
        } else {
            off_t end;
E
Eric Blake 已提交
1333
            /* XXX this is POSIX compliant, but doesn't work for CHAR files,
1334 1335 1336 1337 1338 1339
             * only BLOCK. There is a Linux specific ioctl() for getting
             * size of both CHAR / BLOCK devices we should check for in
             * configure
             */
            end = lseek(fd, 0, SEEK_END);
            if (end == (off_t)-1) {
1340
                virReportSystemError(errno,
1341 1342 1343 1344 1345 1346 1347
                                     _("cannot seek to end of file '%s'"),
                                     target->path);
                return -1;
            }
            *allocation = end;
            if (capacity)
                *capacity = end;
1348 1349 1350
        }
    }

1351 1352 1353
    target->perms.mode = sb.st_mode & S_IRWXUGO;
    target->perms.uid = sb.st_uid;
    target->perms.gid = sb.st_gid;
1354

1355
    if (!target->timestamps && VIR_ALLOC(target->timestamps) < 0)
1356 1357 1358 1359 1360 1361
        return -1;
    target->timestamps->atime = get_stat_atime(&sb);
    target->timestamps->btime = get_stat_birthtime(&sb);
    target->timestamps->ctime = get_stat_ctime(&sb);
    target->timestamps->mtime = get_stat_mtime(&sb);

1362
    VIR_FREE(target->perms.label);
1363

1364
#if WITH_SELINUX
1365
    /* XXX: make this a security driver call */
M
Martin Kletzander 已提交
1366
    if (fgetfilecon_raw(fd, &filecon) == -1) {
1367
        if (errno != ENODATA && errno != ENOTSUP) {
1368
            virReportSystemError(errno,
1369
                                 _("cannot get file context of '%s'"),
1370
                                 target->path);
1371 1372
            return -1;
        } else {
1373
            target->perms.label = NULL;
1374 1375
        }
    } else {
1376 1377
        if (VIR_STRDUP(target->perms.label, filecon) < 0) {
            freecon(filecon);
1378 1379
            return -1;
        }
1380
        freecon(filecon);
1381 1382
    }
#else
1383
    target->perms.label = NULL;
1384 1385 1386 1387 1388
#endif

    return 0;
}

D
Dave Allan 已提交
1389 1390 1391 1392 1393 1394 1395 1396 1397 1398 1399 1400 1401 1402 1403 1404 1405 1406 1407 1408 1409 1410 1411 1412 1413 1414 1415 1416 1417 1418 1419 1420 1421 1422 1423

/* Location and value of one partition-table signature */
struct diskType {
    int part_table_type;        /* format reported when the signature matches */
    unsigned short offset;      /* byte offset of the signature in the device */
    unsigned short length;      /* number of signature bytes to compare */
    unsigned long long magic;   /* signature value */
};


/* Known signatures, probed in order; the table ends at part_table_type -1 */
static const struct diskType disk_types[] = {
    { .part_table_type = VIR_STORAGE_POOL_DISK_LVM2,
      .offset = 0x218, .length = 8, .magic = 0x31303020324D564CULL },
    { .part_table_type = VIR_STORAGE_POOL_DISK_GPT,
      .offset = 0x200, .length = 8, .magic = 0x5452415020494645ULL },
    { .part_table_type = VIR_STORAGE_POOL_DISK_DVH,
      .offset = 0x0,   .length = 4, .magic = 0x41A9E50BULL },
    { .part_table_type = VIR_STORAGE_POOL_DISK_MAC,
      .offset = 0x0,   .length = 2, .magic = 0x5245ULL },
    { .part_table_type = VIR_STORAGE_POOL_DISK_BSD,
      .offset = 0x40,  .length = 4, .magic = 0x82564557ULL },
    { .part_table_type = VIR_STORAGE_POOL_DISK_SUN,
      .offset = 0x1fc, .length = 2, .magic = 0xBEDAULL },
    /*
     * NOTE: pc98 is funky; the actual signature is 0x55AA (just like dos),
     * i.e. 0xAA55 read at offset 0x1fe with length 2, so we can't use that.
     * At the moment I'm relying on the "dummy" IPL bootloader data that
     * comes from parted.  Luckily, the chances of running into a pc98
     * machine running libvirt are approximately nil.
     */
    { .part_table_type = VIR_STORAGE_POOL_DISK_PC98,
      .offset = 0x0,   .length = 8, .magic = 0x314C5049000000CBULL },
    /*
     * NOTE: the order is important here; some other disk types (like GPT
     * and PC98) also have 0x55AA at this offset.  For that reason, the DOS
     * one must be the last one.
     */
    { .part_table_type = VIR_STORAGE_POOL_DISK_DOS,
      .offset = 0x1fe, .length = 2, .magic = 0xAA55ULL },
    { .part_table_type = -1,
      .offset = 0x0,   .length = 0, .magic = 0x0ULL },
};


int
1424 1425
virStorageBackendDetectBlockVolFormatFD(virStorageVolTargetPtr target,
                                        int fd)
D
Dave Allan 已提交
1426
{
1427
    size_t i;
D
Dave Allan 已提交
1428 1429 1430 1431 1432 1433 1434 1435 1436
    off_t start;
    unsigned char buffer[1024];
    ssize_t bytes;

    /* make sure to set the target format "unknown" to begin with */
    target->format = VIR_STORAGE_POOL_DISK_UNKNOWN;

    start = lseek(fd, 0, SEEK_SET);
    if (start < 0) {
1437
        virReportSystemError(errno,
D
Dave Allan 已提交
1438 1439 1440 1441 1442 1443
                             _("cannot seek to beginning of file '%s'"),
                             target->path);
        return -1;
    }
    bytes = saferead(fd, buffer, sizeof(buffer));
    if (bytes < 0) {
1444
        virReportSystemError(errno,
D
Dave Allan 已提交
1445 1446 1447 1448 1449 1450 1451 1452 1453 1454 1455 1456 1457 1458 1459 1460 1461 1462 1463
                             _("cannot read beginning of file '%s'"),
                             target->path);
        return -1;
    }

    for (i = 0; disk_types[i].part_table_type != -1; i++) {
        if (disk_types[i].offset + disk_types[i].length > bytes)
            continue;
        if (memcmp(buffer+disk_types[i].offset, &disk_types[i].magic,
            disk_types[i].length) == 0) {
            target->format = disk_types[i].part_table_type;
            break;
        }
    }

    return 0;
}


1464 1465 1466 1467 1468 1469 1470 1471 1472 1473 1474 1475
/*
 * Given a volume path directly in /dev/XXX, iterate over the
 * entries in the directory pool->def->target.path and find the
 * first symlink pointing to the volume path.
 *
 * If, the target.path is /dev/, then return the original volume
 * path.
 *
 * If no symlink is found, then return the original volume path
 *
 * Typically target.path is one of the /dev/disk/by-XXX dirs
 * with stable paths.
1476
 *
1477
 * If 'loop' is true, we use a timeout loop to give dynamic paths
1478
 * a change to appear.
1479 1480
 */
char *
1481
virStorageBackendStablePath(virStoragePoolObjPtr pool,
1482
                            const char *devpath,
1483
                            bool loop)
1484 1485 1486
{
    DIR *dh;
    struct dirent *dent;
1487
    char *stablepath;
1488
    int opentries = 0;
1489
    int retry = 0;
1490 1491 1492 1493 1494

    /* Short circuit if pool has no target, or if its /dev */
    if (pool->def->target.path == NULL ||
        STREQ(pool->def->target.path, "/dev") ||
        STREQ(pool->def->target.path, "/dev/"))
1495
        goto ret_strdup;
1496

1497
    /* Skip whole thing for a pool which isn't in /dev
1498
     * so we don't mess filesystem/dir based pools
1499 1500 1501 1502
     */
    if (!STRPREFIX(pool->def->target.path, "/dev"))
        goto ret_strdup;

1503 1504 1505 1506
    /* Logical pools are under /dev but already have stable paths */
    if (pool->def->type == VIR_STORAGE_POOL_LOGICAL)
        goto ret_strdup;

1507 1508 1509
    /* We loop here because /dev/disk/by-{id,path} may not have existed
     * before we started this operation, so we have to give it some time to
     * get created.
1510
     */
1511
 reopen:
1512
    if ((dh = opendir(pool->def->target.path)) == NULL) {
1513
        opentries++;
1514
        if (loop && errno == ENOENT && opentries < 50) {
1515 1516 1517
            usleep(100 * 1000);
            goto reopen;
        }
1518
        virReportSystemError(errno,
1519 1520
                             _("cannot read dir '%s'"),
                             pool->def->target.path);
1521 1522 1523
        return NULL;
    }

1524 1525 1526
    /* The pool is pointing somewhere like /dev/disk/by-path
     * or /dev/disk/by-id, so we need to check all symlinks in
     * the target directory and figure out which one points
1527 1528
     * to this device node.
     *
1529
     * And it might need some time till the stable path shows
1530
     * up, so add timeout to retry here.
1531
     */
1532
 retry:
1533 1534 1535 1536
    while ((dent = readdir(dh)) != NULL) {
        if (dent->d_name[0] == '.')
            continue;

1537 1538 1539
        if (virAsprintf(&stablepath, "%s/%s",
                        pool->def->target.path,
                        dent->d_name) == -1) {
1540 1541 1542 1543 1544 1545 1546 1547 1548
            closedir(dh);
            return NULL;
        }

        if (virFileLinkPointsTo(stablepath, devpath)) {
            closedir(dh);
            return stablepath;
        }

1549
        VIR_FREE(stablepath);
1550 1551
    }

1552
    if (loop && ++retry < 100) {
1553 1554 1555 1556
        usleep(100 * 1000);
        goto retry;
    }

1557 1558
    closedir(dh);

1559
 ret_strdup:
1560 1561 1562
    /* Couldn't find any matching stable link so give back
     * the original non-stable dev path
     */
1563

1564
    ignore_value(VIR_STRDUP(stablepath, devpath));
1565 1566

    return stablepath;
1567 1568
}

D
Daniel P. Berrange 已提交
1569

1570
#ifndef WIN32
1571 1572 1573 1574
/*
 * Run an external program.
 *
 * Read its output and apply a series of regexes to each line
R
Richard W.M. Jones 已提交
1575
 * When the entire set of regexes has matched consecutively
1576 1577 1578
 * then run a callback passing in all the matches
 */
int
1579
virStorageBackendRunProgRegex(virStoragePoolObjPtr pool,
1580
                              virCommandPtr cmd,
1581 1582 1583 1584
                              int nregex,
                              const char **regex,
                              int *nvars,
                              virStorageBackendListVolRegexFunc func,
1585
                              void *data, const char *prefix)
1586
{
1587
    int fd = -1, err, ret = -1;
1588 1589 1590 1591
    FILE *list = NULL;
    regex_t *reg;
    regmatch_t *vars = NULL;
    char line[1024];
1592 1593
    int maxReg = 0;
    size_t i, j;
1594 1595 1596 1597
    int totgroups = 0, ngroup = 0, maxvars = 0;
    char **groups;

    /* Compile all regular expressions */
1598
    if (VIR_ALLOC_N(reg, nregex) < 0)
1599 1600
        return -1;

1601
    for (i = 0; i < nregex; i++) {
1602 1603 1604 1605
        err = regcomp(&reg[i], regex[i], REG_EXTENDED);
        if (err != 0) {
            char error[100];
            regerror(err, &reg[i], error, sizeof(error));
1606 1607
            virReportError(VIR_ERR_INTERNAL_ERROR,
                           _("Failed to compile regex %s"), error);
1608
            for (j = 0; j < i; j++)
1609
                regfree(&reg[j]);
1610
            VIR_FREE(reg);
1611 1612 1613 1614 1615 1616 1617 1618 1619 1620
            return -1;
        }

        totgroups += nvars[i];
        if (nvars[i] > maxvars)
            maxvars = nvars[i];

    }

    /* Storage for matched variables */
1621
    if (VIR_ALLOC_N(groups, totgroups) < 0)
1622
        goto cleanup;
1623
    if (VIR_ALLOC_N(vars, maxvars+1) < 0)
1624 1625
        goto cleanup;

1626 1627
    virCommandSetOutputFD(cmd, &fd);
    if (virCommandRunAsync(cmd, NULL) < 0) {
1628 1629 1630
        goto cleanup;
    }

1631
    if ((list = VIR_FDOPEN(fd, "r")) == NULL) {
1632 1633
        virReportError(VIR_ERR_INTERNAL_ERROR,
                       "%s", _("cannot read fd"));
1634 1635 1636 1637
        goto cleanup;
    }

    while (fgets(line, sizeof(line), list) != NULL) {
1638
        char *p = NULL;
1639 1640 1641 1642 1643
        /* Strip trailing newline */
        int len = strlen(line);
        if (len && line[len-1] == '\n')
            line[len-1] = '\0';

1644 1645 1646 1647 1648 1649
        /* ignore any command prefix */
        if (prefix)
            p = STRSKIP(line, prefix);
        if (!p)
            p = line;

1650
        for (i = 0; i <= maxReg && i < nregex; i++) {
1651
            if (regexec(&reg[i], p, nvars[i]+1, vars, 0) == 0) {
1652 1653 1654 1655 1656 1657
                maxReg++;

                if (i == 0)
                    ngroup = 0;

                /* NULL terminate each captured group in the line */
1658
                for (j = 0; j < nvars[i]; j++) {
1659
                    /* NB vars[0] is the full pattern, so we offset j by 1 */
1660
                    p[vars[j+1].rm_eo] = '\0';
1661
                    if (VIR_STRDUP(groups[ngroup++], p + vars[j+1].rm_so) < 0)
1662 1663 1664 1665 1666
                        goto cleanup;
                }

                /* We're matching on the last regex, so callback time */
                if (i == (nregex-1)) {
1667
                    if (((*func)(pool, groups, data)) < 0)
1668 1669 1670
                        goto cleanup;

                    /* Release matches & restart to matching the first regex */
1671
                    for (j = 0; j < totgroups; j++)
1672
                        VIR_FREE(groups[j]);
1673 1674 1675 1676 1677 1678 1679
                    maxReg = 0;
                    ngroup = 0;
                }
            }
        }
    }

1680
    ret = virCommandWait(cmd, NULL);
1681
cleanup:
1682
    if (groups) {
1683
        for (j = 0; j < totgroups; j++)
1684 1685
            VIR_FREE(groups[j]);
        VIR_FREE(groups);
1686
    }
1687
    VIR_FREE(vars);
1688

1689
    for (i = 0; i < nregex; i++)
1690 1691
        regfree(&reg[i]);

1692
    VIR_FREE(reg);
1693

1694 1695
    VIR_FORCE_FCLOSE(list);
    VIR_FORCE_CLOSE(fd);
1696

1697
    return ret;
1698 1699 1700 1701 1702 1703 1704 1705 1706 1707 1708 1709 1710 1711
}

/*
 * Run an external program and read from its standard output
 * a stream of tokens from IN_STREAM, applying FUNC to
 * each successive sequence of N_COLUMNS tokens.
 * If FUNC returns < 0, stop processing input and return -1.
 * Return -1 if N_COLUMNS == 0.
 * Return -1 upon memory allocation error.
 * If the number of input tokens is not a multiple of N_COLUMNS,
 * then the final FUNC call will specify a number smaller than N_COLUMNS.
 * If there are no input tokens (empty input), call FUNC with N_COLUMNS == 0.
 */
int
1712
virStorageBackendRunProgNul(virStoragePoolObjPtr pool,
1713
                            virCommandPtr cmd,
1714 1715 1716 1717 1718
                            size_t n_columns,
                            virStorageBackendListVolNulFunc func,
                            void *data)
{
    size_t n_tok = 0;
1719
    int fd = -1;
1720 1721
    FILE *fp = NULL;
    char **v;
1722
    int ret = -1;
1723
    size_t i;
1724 1725 1726 1727

    if (n_columns == 0)
        return -1;

1728
    if (VIR_ALLOC_N(v, n_columns) < 0)
1729 1730 1731 1732
        return -1;
    for (i = 0; i < n_columns; i++)
        v[i] = NULL;

1733 1734
    virCommandSetOutputFD(cmd, &fd);
    if (virCommandRunAsync(cmd, NULL) < 0) {
1735 1736 1737
        goto cleanup;
    }

1738
    if ((fp = VIR_FDOPEN(fd, "r")) == NULL) {
1739 1740
        virReportError(VIR_ERR_INTERNAL_ERROR,
                       "%s", _("cannot open file using fd"));
1741 1742 1743 1744 1745 1746 1747 1748
        goto cleanup;
    }

    while (1) {
        char *buf = NULL;
        size_t buf_len = 0;
        /* Be careful: even when it returns -1,
           this use of getdelim allocates memory.  */
1749
        ssize_t tok_len = getdelim(&buf, &buf_len, 0, fp);
1750 1751 1752 1753
        v[n_tok] = buf;
        if (tok_len < 0) {
            /* Maybe EOF, maybe an error.
               If n_tok > 0, then we know it's an error.  */
1754
            if (n_tok && func(pool, n_tok, v, data) < 0)
1755 1756 1757 1758 1759
                goto cleanup;
            break;
        }
        ++n_tok;
        if (n_tok == n_columns) {
1760
            if (func(pool, n_tok, v, data) < 0)
1761 1762 1763
                goto cleanup;
            n_tok = 0;
            for (i = 0; i < n_columns; i++) {
1764
                VIR_FREE(v[i]);
1765 1766 1767 1768
            }
        }
    }

1769 1770 1771
    if (feof(fp) < 0) {
        virReportSystemError(errno, "%s",
                             _("read error on pipe"));
1772 1773
        goto cleanup;
    }
1774

1775
    ret = virCommandWait(cmd, NULL);
1776 1777
 cleanup:
    for (i = 0; i < n_columns; i++)
1778 1779
        VIR_FREE(v[i]);
    VIR_FREE(v);
1780

1781 1782
    VIR_FORCE_FCLOSE(fp);
    VIR_FORCE_CLOSE(fd);
1783

1784
    return ret;
1785
}
D
Daniel P. Berrange 已提交
1786

1787
#else /* WIN32 */
D
Daniel P. Berrange 已提交
1788 1789 1790 1791 1792 1793 1794 1795 1796

int
virStorageBackendRunProgRegex(virConnectPtr conn,
                              virStoragePoolObjPtr pool ATTRIBUTE_UNUSED,
                              const char *const*prog ATTRIBUTE_UNUSED,
                              int nregex ATTRIBUTE_UNUSED,
                              const char **regex ATTRIBUTE_UNUSED,
                              int *nvars ATTRIBUTE_UNUSED,
                              virStorageBackendListVolRegexFunc func ATTRIBUTE_UNUSED,
1797
                              void *data ATTRIBUTE_UNUSED)
D
Daniel P. Berrange 已提交
1798
{
1799 1800
    virReportError(VIR_ERR_INTERNAL_ERROR,
                   _("%s not implemented on Win32"), __FUNCTION__);
D
Daniel P. Berrange 已提交
1801 1802 1803 1804 1805 1806 1807 1808 1809 1810 1811
    return -1;
}

int
virStorageBackendRunProgNul(virConnectPtr conn,
                            virStoragePoolObjPtr pool ATTRIBUTE_UNUSED,
                            const char **prog ATTRIBUTE_UNUSED,
                            size_t n_columns ATTRIBUTE_UNUSED,
                            virStorageBackendListVolNulFunc func ATTRIBUTE_UNUSED,
                            void *data ATTRIBUTE_UNUSED)
{
1812 1813
    virReportError(VIR_ERR_INTERNAL_ERROR,
                   _("%s not implemented on Win32"), __FUNCTION__);
D
Daniel P. Berrange 已提交
1814 1815
    return -1;
}
1816
#endif /* WIN32 */