storage_backend_disk.c 34.3 KB
Newer Older
1 2 3
/*
 * storage_backend_disk.c: storage backend for disk handling
 *
4
 * Copyright (C) 2007-2016 Red Hat, Inc.
5 6 7 8 9 10 11 12 13 14 15 16 17
 * Copyright (C) 2007-2008 Daniel P. Berrange
 *
 * This library is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * This library is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
18
 * License along with this library.  If not, see
O
Osier Yang 已提交
19
 * <http://www.gnu.org/licenses/>.
20 21 22
 */

#include <config.h>
23
#include <unistd.h>
24

25
#include "dirname.h"
26
#include "virerror.h"
27
#include "virlog.h"
28
#include "storage_backend_disk.h"
29
#include "storage_util.h"
30
#include "viralloc.h"
31
#include "vircommand.h"
32
#include "virfile.h"
33
#include "configmake.h"
34
#include "virstring.h"
35

36 37
#define VIR_FROM_THIS VIR_FROM_STORAGE

38 39
VIR_LOG_INIT("storage.storage_backend_disk");

40 41
#define SECTOR_SIZE 512

42 43 44 45 46 47 48 49 50 51 52
static bool
virStorageVolPartFindExtended(virStorageVolDefPtr def,
                              const void *opaque ATTRIBUTE_UNUSED)
{
    if (def->source.partType == VIR_STORAGE_VOL_DISK_TYPE_EXTENDED)
        return true;

    return false;
}


53
static int
54
virStorageBackendDiskMakeDataVol(virStoragePoolObjPtr pool,
55 56 57
                                 char **const groups,
                                 virStorageVolDefPtr vol)
{
58
    virStoragePoolDefPtr def = virStoragePoolObjGetDef(pool);
59
    char *tmp, *partname;
60
    bool addVol = false;
61
    VIR_AUTOFREE(char *) devpath = NULL;
62 63 64 65 66 67 68 69

    /* Prepended path will be same for all partitions, so we can
     * strip the path to form a reasonable pool-unique name
     */
    if ((tmp = strrchr(groups[0], '/')))
        partname = tmp + 1;
    else
        partname = groups[0];
70 71

    if (vol == NULL) {
72 73 74
        /* This is typically a reload/restart/refresh path where
         * we're discovering the existing partitions for the pool
         */
75
        addVol = true;
76
        if (VIR_ALLOC(vol) < 0)
77
            return -1;
78 79
        if (VIR_STRDUP(vol->name, partname) < 0)
            goto error;
80 81 82
    }

    if (vol->target.path == NULL) {
83
        if (VIR_STRDUP(devpath, groups[0]) < 0)
84
            goto error;
85 86 87 88 89 90 91

        /* Now figure out the stable path
         *
         * XXX this method is O(N) because it scans the pool target
         * dir every time its run. Should figure out a more efficient
         * way of doing this...
         */
92
        vol->target.path = virStorageBackendStablePath(pool, devpath, true);
93
        if (vol->target.path == NULL)
94
            goto error;
95 96
    }

97 98 99 100 101 102 103 104
    /* Enforce provided vol->name is the same as what parted created.
     * We do this after filling target.path so that we have a chance at
     * deleting the partition with this failure from CreateVol path
     */
    if (STRNEQ(vol->name, partname)) {
        virReportError(VIR_ERR_INVALID_ARG,
                       _("invalid partition name '%s', expected '%s'"),
                       vol->name, partname);
105 106 107 108 109 110 111 112

        /* Let's see if by chance parthelper created a name that won't be
         * found later when we try to delete. We tell parthelper to add a 'p'
         * to the output via the part_separator flag, but if devmapper has
         * user_friendly_names set, the creation won't happen that way, thus
         * our deletion will fail because the name we generated is wrong.
         * Check for our conditions and see if the generated name is the
         * same as StablePath returns and has the 'p' in it */
113
        if (def->source.devices[0].part_separator == VIR_TRISTATE_BOOL_YES &&
114 115 116 117 118 119 120 121 122 123 124 125 126
            !virIsDevMapperDevice(vol->target.path) &&
            STREQ(groups[0], vol->target.path) &&
            (tmp = strrchr(groups[0], 'p'))) {

            /* If we remove the 'p' from groups[0] and the resulting
             * device is a devmapper device, then we know parthelper
             * was told to create the wrong name based on the results.
             * So just remove the 'p' from the vol->target.path too. */
            memmove(tmp, tmp + 1, strlen(tmp));
            if (virIsDevMapperDevice(groups[0]) &&
                (tmp = strrchr(vol->target.path, 'p')))
                memmove(tmp, tmp + 1, strlen(tmp));
        }
127
        goto error;
128 129
    }

130 131
    if (vol->key == NULL) {
        /* XXX base off a unique key of the underlying disk */
132
        if (VIR_STRDUP(vol->key, vol->target.path) < 0)
133
            goto error;
134 135 136
    }

    if (vol->source.extents == NULL) {
137
        if (VIR_ALLOC(vol->source.extents) < 0)
138
            goto error;
139 140 141 142
        vol->source.nextent = 1;

        if (virStrToLong_ull(groups[3], NULL, 10,
                             &vol->source.extents[0].start) < 0) {
143 144
            virReportError(VIR_ERR_INTERNAL_ERROR,
                           "%s", _("cannot parse device start location"));
145
            goto error;
146 147 148 149
        }

        if (virStrToLong_ull(groups[4], NULL, 10,
                             &vol->source.extents[0].end) < 0) {
150 151
            virReportError(VIR_ERR_INTERNAL_ERROR,
                           "%s", _("cannot parse device end location"));
152
            goto error;
153 154
        }

155
        if (VIR_STRDUP(vol->source.extents[0].path,
156
                       def->source.devices[0].path) < 0)
157
            goto error;
158 159
    }

160
    /* set partition type */
E
Eric Blake 已提交
161
    if (STREQ(groups[1], "normal"))
162
       vol->source.partType = VIR_STORAGE_VOL_DISK_TYPE_PRIMARY;
E
Eric Blake 已提交
163
    else if (STREQ(groups[1], "logical"))
164
       vol->source.partType = VIR_STORAGE_VOL_DISK_TYPE_LOGICAL;
E
Eric Blake 已提交
165
    else if (STREQ(groups[1], "extended"))
166
       vol->source.partType = VIR_STORAGE_VOL_DISK_TYPE_EXTENDED;
167
    else
168
       vol->source.partType = VIR_STORAGE_VOL_DISK_TYPE_NONE;
169

170 171
    vol->type = VIR_STORAGE_VOL_BLOCK;

172 173 174 175 176 177 178 179 180 181
    /* Refresh allocation/capacity/perms
     *
     * For an extended partition, virStorageBackendUpdateVolInfo will
     * return incorrect values for allocation and capacity, so use the
     * extent information captured above instead.
     *
     * Also once a logical partition exists or another primary partition
     * after an extended partition is created an open on the extended
     * partition will fail, so pass the NOERROR flag and only error if a
     * -1 was returned indicating some other error than an open error.
182 183 184 185 186 187 188 189
     *
     * NB: A small window exists in some cases where the just created
     * partition disappears, but then reappears. Since we were given
     * vol->target.path from parthelper, let's just be sure that any
     * kernel magic that occurs as a result of parthelper doesn't cause
     * us to fail with some sort of ENOENT failure since that would be
     * quite "unexpected". So rather than just fail, let's use the
     * virWaitForDevices to ensure everything has settled properly.
190
     */
191
    virWaitForDevices();
192
    if (vol->source.partType == VIR_STORAGE_VOL_DISK_TYPE_EXTENDED) {
193
        if (virStorageBackendUpdateVolInfo(vol, false,
194
                                           VIR_STORAGE_VOL_OPEN_DEFAULT |
195 196
                                           VIR_STORAGE_VOL_OPEN_NOERROR,
                                           0) == -1)
197
            goto error;
198 199
        vol->target.allocation = 0;
        vol->target.capacity =
200 201
            (vol->source.extents[0].end - vol->source.extents[0].start);
    } else {
202
        if (virStorageBackendUpdateVolInfo(vol, false,
203
                                           VIR_STORAGE_VOL_OPEN_DEFAULT, 0) < 0)
204
            goto error;
205
    }
206

207 208 209 210 211 212
    /* Now that we've updated @vol enough, let's add it to the pool
     * if it's not already there so that the subsequent pool search
     * pool def adjustments will work properly */
    if (addVol && virStoragePoolObjAddVol(pool, vol) < 0)
        goto error;

213 214
    /* Find the extended partition and increase the allocation value */
    if (vol->source.partType == VIR_STORAGE_VOL_DISK_TYPE_LOGICAL) {
215
        virStorageVolDefPtr voldef;
216

217 218 219 220 221
        voldef = virStoragePoolObjSearchVolume(pool,
                                               virStorageVolPartFindExtended,
                                               NULL);
        if (voldef)
            voldef->target.allocation += vol->target.allocation;
222 223
    }

224
    if (STRNEQ(groups[2], "metadata"))
225 226 227
        def->allocation += vol->target.allocation;
    if (vol->source.extents[0].end > def->capacity)
        def->capacity = vol->source.extents[0].end;
228 229

    return 0;
230 231 232 233 234

 error:
    if (addVol)
        virStorageVolDefFree(vol);
    return -1;
235 236 237
}

static int
238
virStorageBackendDiskMakeFreeExtent(virStoragePoolObjPtr pool,
239 240
                                    char **const groups)
{
241 242
    virStoragePoolDefPtr def = virStoragePoolObjGetDef(pool);
    virStoragePoolSourceDevicePtr dev = &def->source.devices[0];
243

244 245
    if (VIR_REALLOC_N(dev->freeExtents,
                      dev->nfreeExtent + 1) < 0)
246 247 248
        return -1;

    memset(dev->freeExtents +
249 250
           dev->nfreeExtent, 0,
           sizeof(dev->freeExtents[0]));
251

252
    /* set type of free area */
E
Eric Blake 已提交
253
    if (STREQ(groups[1], "logical")) {
254 255 256 257 258 259
        dev->freeExtents[dev->nfreeExtent].type = VIR_STORAGE_FREE_LOGICAL;
    } else {
        dev->freeExtents[dev->nfreeExtent].type = VIR_STORAGE_FREE_NORMAL;
    }


260 261 262 263 264 265 266 267
    if (virStrToLong_ull(groups[3], NULL, 10,
                         &dev->freeExtents[dev->nfreeExtent].start) < 0)
        return -1; /* Don't bother to re-alloc freeExtents - it'll be free'd shortly */

    if (virStrToLong_ull(groups[4], NULL, 10,
                         &dev->freeExtents[dev->nfreeExtent].end) < 0)
        return -1; /* Don't bother to re-alloc freeExtents - it'll be free'd shortly */

268
    /* first block reported as free, even if it is not */
269
    if (dev->freeExtents[dev->nfreeExtent].start == 0)
270 271
        dev->freeExtents[dev->nfreeExtent].start = SECTOR_SIZE;

272 273 274 275
    def->available += (dev->freeExtents[dev->nfreeExtent].end -
                       dev->freeExtents[dev->nfreeExtent].start);
    if (dev->freeExtents[dev->nfreeExtent].end > def->capacity)
        def->capacity = dev->freeExtents[dev->nfreeExtent].end;
276 277 278 279 280 281 282

    dev->nfreeExtent++;

    return 0;
}


283 284 285 286 287
struct virStorageBackendDiskPoolVolData {
    virStoragePoolObjPtr pool;
    virStorageVolDefPtr vol;
};

288
static int
289
virStorageBackendDiskMakeVol(size_t ntok ATTRIBUTE_UNUSED,
290
                             char **const groups,
291
                             void *opaque)
292
{
293 294
    struct virStorageBackendDiskPoolVolData *data = opaque;
    virStoragePoolObjPtr pool = data->pool;
295 296 297 298 299 300 301 302 303 304 305 306
    /*
     * Ignore normal+metadata, and logical+metadata partitions
     * since they're basically internal book-keeping regions
     * we have no control over. Do keep extended+metadata though
     * because that's the MS-DOS extended partition region we
     * need to be able to view/create/delete
     */
    if ((STREQ(groups[1], "normal") ||
         STREQ(groups[1], "logical")) &&
        STREQ(groups[2], "metadata"))
        return 0;

R
Richard W.M. Jones 已提交
307
    /* Remaining data / metadata parts get turn into volumes... */
308 309
    if (STREQ(groups[2], "metadata") ||
        STREQ(groups[2], "data")) {
310
        virStorageVolDefPtr vol = data->vol;
311 312 313 314 315 316 317 318 319 320 321 322

        if (vol) {
            /* We're searching for a specific vol only */
            if (vol->key) {
                if (STRNEQ(vol->key, groups[0]))
                    return 0;
            } else if (virStorageVolDefFindByKey(pool, groups[0]) != NULL) {
                /* If no key, the volume must be newly created. If groups[0]
                 * isn't already a volume, assume it's the path we want */
                return 0;
            }
        }
323

324
        return virStorageBackendDiskMakeDataVol(pool, groups, vol);
325 326
    } else if (STREQ(groups[2], "free")) {
        /* ....or free space extents */
327
        return virStorageBackendDiskMakeFreeExtent(pool, groups);
328
    } else {
R
Richard W.M. Jones 已提交
329
        /* This code path should never happen unless someone changed
330 331 332 333 334 335 336 337 338 339 340 341 342 343 344 345
         * libvirt_parthelper forgot to change this code */
        return -1;
    }
}

/* To get a list of partitions we run an external helper
 * tool which then uses parted APIs. This is because
 * parted's API is not compatible with libvirt's license
 * but we really really want to use parted because the
 * other options all suck :-)
 *
 * All the other storage backends run an external tool for
 * listing volumes so this really isn't too much of a pain,
 * and we can even ensure the output is friendly.
 */
static int
346
virStorageBackendDiskReadPartitions(virStoragePoolObjPtr pool,
347 348 349 350 351 352 353 354 355
                                    virStorageVolDefPtr vol)
{
    /*
     *  # libvirt_parthelper DEVICE
     * /dev/sda1      normal       data        32256    106928128    106896384
     * /dev/sda2      normal       data    106928640 100027629568  99920701440
     * -              normal   metadata 100027630080 100030242304      2612736
     *
     */
356

357
    virStoragePoolDefPtr def = virStoragePoolObjGetDef(pool);
358 359 360 361
    struct virStorageBackendDiskPoolVolData cbdata = {
        .pool = pool,
        .vol = vol,
    };
362
    VIR_AUTOFREE(char *) parthelper_path = NULL;
363
    VIR_AUTOPTR(virCommand) cmd = NULL;
364

365
    if (!(parthelper_path = virFileFindResource("libvirt_parthelper",
366
                                                abs_top_builddir "/src",
367 368 369 370
                                                LIBEXECDIR)))
        return -1;

    cmd = virCommandNewArgList(parthelper_path,
371
                               def->source.devices[0].path,
372 373
                               NULL);

374
    /* Check for the presence of the part_separator='yes'. Pass this
375
     * along to the libvirt_parthelper as option '-p'. This will cause
376 377 378
     * libvirt_parthelper to append the "p" partition separator to
     * the generated device name for a source device which ends with
     * a non-numeric value (e.g. mpatha would generate mpathap#).
379
     */
380
    if (def->source.devices[0].part_separator == VIR_TRISTATE_BOOL_YES)
381 382
        virCommandAddArg(cmd, "-p");

383 384 385 386
    /* If a volume is passed, virStorageBackendDiskMakeVol only updates the
     * pool allocation for that single volume.
     */
    if (!vol)
387 388
        def->allocation = 0;
    def->capacity = def->available = 0;
389

390
    return virCommandRunNul(cmd, 6, virStorageBackendDiskMakeVol, &cbdata);
391 392
}

393
static int
394
virStorageBackendDiskMakePoolGeometry(size_t ntok ATTRIBUTE_UNUSED,
395
                                      char **const groups,
396
                                      void *data)
397
{
398
    virStoragePoolObjPtr pool = data;
399 400
    virStoragePoolDefPtr def = virStoragePoolObjGetDef(pool);
    virStoragePoolSourceDevicePtr device = &(def->source.devices[0]);
P
Peter Krempa 已提交
401 402 403 404 405 406 407
    if (virStrToLong_i(groups[0], NULL, 0, &device->geometry.cylinders) < 0 ||
        virStrToLong_i(groups[1], NULL, 0, &device->geometry.heads) < 0 ||
        virStrToLong_i(groups[2], NULL, 0, &device->geometry.sectors) < 0) {
        virReportError(VIR_ERR_INTERNAL_ERROR, "%s",
                       _("Failed to create disk pool geometry"));
        return -1;
    }
408

P
Peter Krempa 已提交
409
    return 0;
410 411 412
}

static int
413
virStorageBackendDiskReadGeometry(virStoragePoolObjPtr pool)
414
{
415
    virStoragePoolDefPtr def = virStoragePoolObjGetDef(pool);
416
    VIR_AUTOFREE(char *) parthelper_path = NULL;
417
    VIR_AUTOPTR(virCommand) cmd = NULL;
418 419

    if (!(parthelper_path = virFileFindResource("libvirt_parthelper",
420
                                                abs_top_builddir "/src",
421 422 423 424
                                                LIBEXECDIR)))
        return -1;

    cmd = virCommandNewArgList(parthelper_path,
425 426 427
                               def->source.devices[0].path,
                               "-g",
                               NULL);
428

429 430
    return virCommandRunNul(cmd, 3, virStorageBackendDiskMakePoolGeometry,
                            pool);
431
}
432 433

static int
434
virStorageBackendDiskRefreshPool(virStoragePoolObjPtr pool)
435
{
436 437 438 439
    virStoragePoolDefPtr def = virStoragePoolObjGetDef(pool);

    VIR_FREE(def->source.devices[0].freeExtents);
    def->source.devices[0].nfreeExtent = 0;
440

J
John Ferlan 已提交
441
    virWaitForDevices();
442

443
    if (!virFileExists(def->source.devices[0].path)) {
444 445
        virReportError(VIR_ERR_INVALID_ARG,
                       _("device path '%s' doesn't exist"),
446
                       def->source.devices[0].path);
447 448 449
        return -1;
    }

450
    if (virStorageBackendDiskReadGeometry(pool) != 0)
451 452
        return -1;

453
    return virStorageBackendDiskReadPartitions(pool, NULL);
454 455 456
}


457
static int
458
virStorageBackendDiskStartPool(virStoragePoolObjPtr pool)
459
{
460
    virStoragePoolDefPtr def = virStoragePoolObjGetDef(pool);
461
    const char *format;
462
    const char *path = def->source.devices[0].path;
463

J
John Ferlan 已提交
464
    virWaitForDevices();
465

466
    if (!virFileExists(path)) {
467
        virReportError(VIR_ERR_INVALID_ARG,
468
                       _("device path '%s' doesn't exist"), path);
469 470 471
        return -1;
    }

472 473 474
    if (def->source.format == VIR_STORAGE_POOL_DISK_UNKNOWN)
        def->source.format = VIR_STORAGE_POOL_DISK_DOS;
    format = virStoragePoolFormatDiskTypeToString(def->source.format);
475
    if (!virStorageBackendDeviceIsEmpty(path, format, false))
476 477 478 479 480 481
        return -1;

    return 0;
}


482 483 484 485
/**
 * Write a new partition table header
 */
static int
486
virStorageBackendDiskBuildPool(virStoragePoolObjPtr pool,
E
Eric Blake 已提交
487
                               unsigned int flags)
488
{
489 490
    virStoragePoolDefPtr def = virStoragePoolObjGetDef(pool);
    int format = def->source.format;
491
    const char *fmt;
492
    VIR_AUTOPTR(virCommand) cmd = NULL;
493

494
    virCheckFlags(VIR_STORAGE_POOL_BUILD_OVERWRITE |
495
                  VIR_STORAGE_POOL_BUILD_NO_OVERWRITE, -1);
E
Eric Blake 已提交
496

497 498 499
    VIR_EXCLUSIVE_FLAGS_RET(VIR_STORAGE_POOL_BUILD_OVERWRITE,
                            VIR_STORAGE_POOL_BUILD_NO_OVERWRITE,
                            -1);
500

501
    fmt = virStoragePoolFormatDiskTypeToString(format);
502

503 504 505
    if (!(flags & VIR_STORAGE_POOL_BUILD_OVERWRITE) &&
        !(virStorageBackendDeviceIsEmpty(def->source.devices[0].path,
                                         fmt, true)))
506
        return -1;
507

508 509
    if (virStorageBackendZeroPartitionTable(def->source.devices[0].path,
                                            1024 * 1024) < 0)
510
        return -1;
511 512 513 514 515 516 517 518 519 520 521 522 523 524 525

    /* eg parted /dev/sda mklabel --script msdos */
    if (format == VIR_STORAGE_POOL_DISK_UNKNOWN)
        format = def->source.format = VIR_STORAGE_POOL_DISK_DOS;
    if (format == VIR_STORAGE_POOL_DISK_DOS)
        fmt = "msdos";
    else
        fmt = virStoragePoolFormatDiskTypeToString(format);

    cmd = virCommandNewArgList(PARTED,
                               def->source.devices[0].path,
                               "mklabel",
                               "--script",
                               fmt,
                               NULL);
526
    return virCommandRun(cmd, NULL);
527 528
}

529 530 531 532 533 534 535 536 537 538 539 540 541 542 543 544 545 546 547

struct virStorageVolNumData {
    int count;
};

static int
virStorageVolNumOfPartTypes(virStorageVolDefPtr def,
                            const void *opaque)
{
    struct virStorageVolNumData *data = (struct virStorageVolNumData *)opaque;

    if (def->source.partType == VIR_STORAGE_VOL_DISK_TYPE_PRIMARY ||
        def->source.partType == VIR_STORAGE_VOL_DISK_TYPE_EXTENDED)
        data->count++;

    return 0;
}


548 549 550 551
/**
 * Decides what kind of partition type that should be created.
 * Important when the partition table is of msdos type
 */
552
static int
553 554
virStorageBackendDiskPartTypeToCreate(virStoragePoolObjPtr pool)
{
555
    virStoragePoolDefPtr def = virStoragePoolObjGetDef(pool);
556 557
    struct virStorageVolNumData data = { .count = 0 };

558
    if (def->source.format == VIR_STORAGE_POOL_DISK_DOS) {
559
        /* count primary and extended partitions,
560
           can't be more than 3 to create a new primary partition */
561 562 563 564
        if (virStoragePoolObjForEachVolume(pool, virStorageVolNumOfPartTypes,
                                           &data) == 0) {
            if (data.count >= 4)
                return VIR_STORAGE_VOL_DISK_TYPE_LOGICAL;
565 566 567 568 569 570 571 572
        }
    }

    /* for all other cases, all partitions are primary */
    return VIR_STORAGE_VOL_DISK_TYPE_PRIMARY;
}

static int
573
virStorageBackendDiskPartFormat(virStoragePoolObjPtr pool,
574
                                virStorageVolDefPtr vol,
E
Eric Blake 已提交
575
                                char** partFormat)
576
{
577 578 579
    virStoragePoolDefPtr def = virStoragePoolObjGetDef(pool);

    if (def->source.format == VIR_STORAGE_POOL_DISK_DOS) {
E
Eric Blake 已提交
580
        const char *partedFormat;
581
        partedFormat = virStoragePartedFsTypeToString(vol->target.format);
E
Eric Blake 已提交
582
        if (partedFormat == NULL) {
583 584
            virReportError(VIR_ERR_INTERNAL_ERROR,
                           "%s", _("Invalid partition type"));
E
Eric Blake 已提交
585
            return -1;
586 587
        }
        if (vol->target.format == VIR_STORAGE_VOL_DISK_EXTENDED) {
Y
Yuri Chornoivan 已提交
588
            /* make sure we don't have an extended partition already */
589 590 591
            if (virStoragePoolObjSearchVolume(pool,
                                              virStorageVolPartFindExtended,
                                              NULL)) {
592 593
                    virReportError(VIR_ERR_INTERNAL_ERROR, "%s",
                                   _("extended partition already exists"));
E
Eric Blake 已提交
594
                    return -1;
595
            }
596
            if (VIR_STRDUP(*partFormat, partedFormat) < 0)
E
Eric Blake 已提交
597
                return -1;
598 599 600 601 602 603
        } else {
            /* create primary partition as long as it is possible
               and after that check if an extended partition exists
               to create logical partitions. */
            /* XXX Only support one extended partition */
            switch (virStorageBackendDiskPartTypeToCreate(pool)) {
E
Eric Blake 已提交
604
            case VIR_STORAGE_VOL_DISK_TYPE_PRIMARY:
605
                if (virAsprintf(partFormat, "primary %s", partedFormat) < 0)
E
Eric Blake 已提交
606
                    return -1;
E
Eric Blake 已提交
607 608
                break;
            case VIR_STORAGE_VOL_DISK_TYPE_LOGICAL:
Y
Yuri Chornoivan 已提交
609
                /* make sure we have an extended partition */
610 611 612 613 614 615 616 617 618 619
                if (virStoragePoolObjSearchVolume(pool,
                                                  virStorageVolPartFindExtended,
                                                  NULL)) {
                    if (virAsprintf(partFormat, "logical %s",
                                    partedFormat) < 0)
                        return -1;
                } else {
                    virReportError(VIR_ERR_INTERNAL_ERROR, "%s",
                                   _("no extended partition found and no "
                                     "primary partition available"));
E
Eric Blake 已提交
620 621 622 623
                    return -1;
                }
                break;
            default:
624 625
                virReportError(VIR_ERR_INTERNAL_ERROR,
                               "%s", _("unknown partition type"));
E
Eric Blake 已提交
626
                return -1;
627 628 629
            }
        }
    } else {
630
        if (VIR_STRDUP(*partFormat, "primary") < 0)
E
Eric Blake 已提交
631
            return -1;
632 633 634 635 636
    }
    return 0;
}

/**
J
Ján Tomko 已提交
637
 * Aligns a new partition to nearest cylinder boundary
E
Eric Blake 已提交
638
 * when having a msdos partition table type
J
Ján Tomko 已提交
639
 * to avoid any problem with already existing
640 641 642
 * partitions
 */
static int
643 644 645 646
virStorageBackendDiskPartBoundaries(virStoragePoolObjPtr pool,
                                    unsigned long long *start,
                                    unsigned long long *end,
                                    unsigned long long allocation)
647
{
648
    size_t i;
649
    int smallestExtent = -1;
650 651 652
    unsigned long long smallestSize = 0;
    unsigned long long extraBytes = 0;
    unsigned long long alignedAllocation = allocation;
653 654
    virStoragePoolDefPtr def = virStoragePoolObjGetDef(pool);
    virStoragePoolSourceDevicePtr dev = &def->source.devices[0];
655
    unsigned long long cylinderSize = (unsigned long long)dev->geometry.heads *
656 657
                                      dev->geometry.sectors * SECTOR_SIZE;

658
    VIR_DEBUG("find free area: allocation %llu, cyl size %llu", allocation,
E
Eric Blake 已提交
659
          cylinderSize);
660 661 662
    int partType = virStorageBackendDiskPartTypeToCreate(pool);

    /* how many extra bytes we have since we allocate
J
Ján Tomko 已提交
663
       aligned to the cylinder boundary */
664 665
    extraBytes = cylinderSize - (allocation % cylinderSize);

666
    for (i = 0; i < dev->nfreeExtent; i++) {
667 668 669 670 671
         unsigned long long size =
             dev->freeExtents[i].end -
             dev->freeExtents[i].start;
         unsigned long long neededSize = allocation;

672
         if (def->source.format == VIR_STORAGE_POOL_DISK_DOS) {
J
Ján Tomko 已提交
673
             /* align to cylinder boundary */
674 675 676 677 678 679
             neededSize += extraBytes;
             if ((*start % cylinderSize) > extraBytes) {
                 /* add an extra cylinder if the offset can't fit within
                    the extra bytes we have */
                 neededSize += cylinderSize;
             }
680
             /* if we are creating a logical partition, we need one extra
681
                block between partitions (or actually move start one block) */
682
             if (partType == VIR_STORAGE_VOL_DISK_TYPE_LOGICAL)
683 684 685 686 687 688 689 690 691 692 693 694
                 size -= SECTOR_SIZE;
         }
         if (size > neededSize &&
             (smallestSize == 0 ||
             size < smallestSize)) {
             /* for logical partition, the free extent
                must be within a logical free area */
             if (partType == VIR_STORAGE_VOL_DISK_TYPE_LOGICAL &&
                 dev->freeExtents[i].type != VIR_STORAGE_FREE_LOGICAL) {
                 continue;
                 /* for primary partition, the free extent
                    must not be within a logical free area */
E
Eric Blake 已提交
695 696 697
             } else if (partType == VIR_STORAGE_VOL_DISK_TYPE_PRIMARY &&
                        dev->freeExtents[i].type != VIR_STORAGE_FREE_NORMAL) {
                 continue;
698 699 700 701 702 703 704 705
             }
             smallestSize = size;
             smallestExtent = i;
             alignedAllocation = neededSize;
         }
    }

    if (smallestExtent == -1) {
706 707
        virReportError(VIR_ERR_INTERNAL_ERROR,
                       "%s", _("no large enough free extent"));
708 709 710
        return -1;
    }

711
    VIR_DEBUG("aligned alloc %llu", alignedAllocation);
712 713 714 715 716 717 718 719
    *start = dev->freeExtents[smallestExtent].start;

    if (partType == VIR_STORAGE_VOL_DISK_TYPE_LOGICAL) {
        /* for logical partition, skip one block */
        *start += SECTOR_SIZE;
    }

    *end = *start + alignedAllocation;
720
    if (def->source.format == VIR_STORAGE_POOL_DISK_DOS) {
J
Ján Tomko 已提交
721
        /* adjust our allocation if start is not at a cylinder boundary */
722 723 724
        *end -= (*start % cylinderSize);
    }

725
    /* counting in bytes, we want the last byte of the current sector */
726
    *end -= 1;
727
    VIR_DEBUG("final aligned start %llu, end %llu", *start, *end);
728 729 730 731
    return 0;
}


732 733 734 735 736 737 738 739 740 741
/* virStorageBackendDiskDeleteVol
 * @pool: Pointer to the storage pool
 * @vol: Pointer to the volume definition
 * @flags: flags (unused for now)
 *
 * This API will remove the disk volume partition either from direct
 * API call or as an error path during creation when the partition
 * name provided during create doesn't match the name read from
 * virStorageBackendDiskReadPartitions.
 *
742
 * For a device mapper device, device representation is dependent upon
743 744 745 746 747 748 749 750 751 752 753 754 755
 * device mapper configuration, but the general rule of thumb is that at
 * creation if a device name ends with a number, then a partition separator
 * "p" is added to the created name; otherwise, if the device name doesn't
 * end with a number, then there is no partition separator. This name is
 * what ends up in the vol->target.path. This ends up being a link to a
 * /dev/mapper/dm-# device which cannot be used in the algorithm to determine
 * which partition to remove, but a properly handled target.path can be.
 *
 * For non device mapper devices, just need to resolve the link of the
 * vol->target.path in order to get the path.
 *
 * Returns 0 on success, -1 on failure with error message set.
 */
756
static int
757
virStorageBackendDiskDeleteVol(virStoragePoolObjPtr pool,
758 759 760 761
                               virStorageVolDefPtr vol,
                               unsigned int flags)
{
    char *part_num = NULL;
762
    char *dev_name;
763 764
    virStoragePoolDefPtr def = virStoragePoolObjGetDef(pool);
    char *src_path = def->source.devices[0].path;
765
    char *srcname = last_component(src_path);
766
    bool isDevMapperDevice;
767
    VIR_AUTOFREE(char *) devpath = NULL;
768
    VIR_AUTOPTR(virCommand) cmd = NULL;
769 770 771

    virCheckFlags(0, -1);

772 773 774
    if (!vol->target.path) {
        virReportError(VIR_ERR_INVALID_ARG,
                       _("volume target path empty for source path '%s'"),
775
                      src_path);
776 777 778
        return -1;
    }

779 780 781 782 783 784 785 786 787 788 789 790
    /* NB: This is the corollary to the algorithm in libvirt_parthelper
     *     (parthelper.c) that is used to generate the target.path name
     *     for use by libvirt. Changes to either, need to be reflected
     *     in both places */
    isDevMapperDevice = virIsDevMapperDevice(vol->target.path);
    if (isDevMapperDevice) {
        dev_name = last_component(vol->target.path);
    } else {
        if (virFileResolveLink(vol->target.path, &devpath) < 0) {
            virReportSystemError(errno,
                                 _("Couldn't read volume target path '%s'"),
                                 vol->target.path);
791
            return -1;
792 793
        }
        dev_name = last_component(devpath);
794 795 796 797
    }

    VIR_DEBUG("dev_name=%s, srcname=%s", dev_name, srcname);

798
    if (!STRPREFIX(dev_name, srcname)) {
799 800 801
        virReportError(VIR_ERR_INTERNAL_ERROR,
                       _("Volume path '%s' did not start with parent "
                         "pool source device name."), dev_name);
802
        return -1;
803 804
    }

805
    part_num = dev_name + strlen(srcname);
806

807 808 809 810
    /* For device mapper and we have a partition character 'p' as the
     * current character, let's move beyond that before checking part_num */
    if (isDevMapperDevice && *part_num == 'p')
        part_num++;
811

812 813 814 815
    if (*part_num == 0) {
        virReportError(VIR_ERR_INTERNAL_ERROR,
                       _("cannot parse partition number from target "
                         "'%s'"), dev_name);
816
        return -1;
817 818
    }

819 820 821 822 823 824 825 826
    /* eg parted /dev/sda rm 2 or /dev/mapper/mpathc rm 2 */
    cmd = virCommandNewArgList(PARTED,
                               src_path,
                               "rm",
                               "--script",
                               part_num,
                               NULL);
    if (virCommandRun(cmd, NULL) < 0)
827
        return -1;
828

829 830 831 832
    /* Refreshing the pool is the easiest option as LOGICAL and EXTENDED
     * partition allocation/capacity management is handled within
     * virStorageBackendDiskMakeDataVol and trying to redo that logic
     * here is pointless
833
     */
834
    virStoragePoolObjClearVols(pool);
835
    if (virStorageBackendDiskRefreshPool(pool) < 0)
836
        return -1;
837

838
    return 0;
839 840 841
}


842
static int
843
virStorageBackendDiskCreateVol(virStoragePoolObjPtr pool,
844 845 846
                               virStorageVolDefPtr vol)
{
    unsigned long long startOffset = 0, endOffset = 0;
847
    virStoragePoolDefPtr def = virStoragePoolObjGetDef(pool);
848
    virErrorPtr save_err;
849
    VIR_AUTOFREE(char *)partFormat = NULL;
850 851 852 853 854 855 856
    VIR_AUTOPTR(virCommand) cmd = NULL;

    cmd = virCommandNewArgList(PARTED,
                               def->source.devices[0].path,
                               "mkpart",
                               "--script",
                               NULL);
857

858 859 860 861
    if (vol->target.encryption &&
        vol->target.encryption->format != VIR_STORAGE_ENCRYPTION_FORMAT_LUKS) {
        virReportError(VIR_ERR_CONFIG_UNSUPPORTED, "%s",
                       _("storage pool only supports LUKS encrypted volumes"));
862
        return -1;
863
    }
864

865
    if (virStorageBackendDiskPartFormat(pool, vol, &partFormat) != 0)
866
        return -1;
867
    virCommandAddArg(cmd, partFormat);
868

869 870 871 872 873 874 875
    /* If we're going to encrypt using LUKS, then we could need up to
     * an extra 2MB for the LUKS header - so account for that now */
    if (vol->target.encryption)
        vol->target.capacity += 2 * 1024 * 1024;

    if (virStorageBackendDiskPartBoundaries(pool, &startOffset, &endOffset,
                                            vol->target.capacity) < 0)
876
        return -1;
877

878 879
    virCommandAddArgFormat(cmd, "%lluB", startOffset);
    virCommandAddArgFormat(cmd, "%lluB", endOffset);
880

881
    if (virCommandRun(cmd, NULL) < 0)
882
        return -1;
883

884
    /* wait for device node to show up */
J
John Ferlan 已提交
885
    virWaitForDevices();
886

887
    /* Blow away free extent info, as we're about to re-populate it */
888 889
    VIR_FREE(def->source.devices[0].freeExtents);
    def->source.devices[0].nfreeExtent = 0;
890

891 892 893 894
    /* Specifying a target path is meaningless */
    VIR_FREE(vol->target.path);

    /* Fetch actual extent info, generate key */
895 896 897 898 899 900 901 902 903
    if (virStorageBackendDiskReadPartitions(pool, vol) < 0)
        goto error;

    if (vol->target.encryption) {
        /* Adjust the sizes to account for the LUKS header */
        vol->target.capacity -= 2 * 1024 * 1024;
        vol->target.allocation -= 2 * 1024 * 1024;
        if (virStorageBackendCreateVolUsingQemuImg(pool, vol, NULL, 0) < 0)
            goto error;
904
    }
905

906
    return 0;
907 908 909 910 911 912 913 914 915

 error:
    /* Best effort to remove the partition. Ignore any errors
     * since we could be calling this with vol->target.path == NULL
     */
    save_err = virSaveLastError();
    ignore_value(virStorageBackendDiskDeleteVol(pool, vol, 0));
    virSetError(save_err);
    virFreeError(save_err);
916
    return -1;
917 918
}

919

920
static int
921
virStorageBackendDiskBuildVolFrom(virStoragePoolObjPtr pool,
922 923 924 925 926 927
                                  virStorageVolDefPtr vol,
                                  virStorageVolDefPtr inputvol,
                                  unsigned int flags)
{
    virStorageBackendBuildVolFrom build_func;

928
    build_func = virStorageBackendGetBuildVolFromFunction(vol, inputvol);
929 930 931
    if (!build_func)
        return -1;

932
    return build_func(pool, vol, inputvol, flags);
933
}
934 935


936
static int
937
virStorageBackendDiskVolWipe(virStoragePoolObjPtr pool,
938 939 940 941 942
                             virStorageVolDefPtr vol,
                             unsigned int algorithm,
                             unsigned int flags)
{
    if (vol->source.partType != VIR_STORAGE_VOL_DISK_TYPE_EXTENDED)
943
        return virStorageBackendVolWipeLocal(pool, vol, algorithm, flags);
944 945 946 947 948 949 950 951 952

    /* Wiping an extended partition is not support */
    virReportError(VIR_ERR_NO_SUPPORT,
                   _("cannot wipe extended partition '%s'"),
                   vol->target.path);
    return -1;
}


953 954 955
virStorageBackend virStorageBackendDisk = {
    .type = VIR_STORAGE_POOL_DISK,

956
    .startPool = virStorageBackendDiskStartPool,
957 958 959 960 961
    .buildPool = virStorageBackendDiskBuildPool,
    .refreshPool = virStorageBackendDiskRefreshPool,

    .createVol = virStorageBackendDiskCreateVol,
    .deleteVol = virStorageBackendDiskDeleteVol,
962
    .buildVolFrom = virStorageBackendDiskBuildVolFrom,
963 964
    .uploadVol = virStorageBackendVolUploadLocal,
    .downloadVol = virStorageBackendVolDownloadLocal,
965
    .wipeVol = virStorageBackendDiskVolWipe,
966
};
967 968 969 970 971 972 973


int
virStorageBackendDiskRegister(void)
{
    return virStorageBackendRegister(&virStorageBackendDisk);
}