/*
 *  Copyright (C) 2005  Anthony Liguori <anthony@codemonkey.ws>
 *
 *  Network Block Device
 *
 *  This program is free software; you can redistribute it and/or modify
 *  it under the terms of the GNU General Public License as published by
 *  the Free Software Foundation; under version 2 of the License.
 *
 *  This program is distributed in the hope that it will be useful,
 *  but WITHOUT ANY WARRANTY; without even the implied warranty of
 *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 *  GNU General Public License for more details.
 *
 *  You should have received a copy of the GNU General Public License
 *  along with this program; if not, see <http://www.gnu.org/licenses/>.
 */

19
#include "qemu-common.h"
20 21
#include "block/block.h"
#include "block/nbd.h"
22
#include "qemu/main-loop.h"
23 24
#include "qemu/sockets.h"
#include "qemu/error-report.h"
25
#include "block/snapshot.h"
B
bellard 已提交
26 27 28 29 30

#include <stdarg.h>
#include <stdio.h>
#include <getopt.h>
#include <err.h>
31
#include <sys/types.h>
B
bellard 已提交
32 33 34 35
#include <sys/socket.h>
#include <netinet/in.h>
#include <netinet/tcp.h>
#include <arpa/inet.h>
36
#include <signal.h>
37
#include <libgen.h>
P
Paolo Bonzini 已提交
38
#include <pthread.h>
39

P
Paolo Bonzini 已提交
40 41 42 43
/*
 * printf-style template for the default unix socket path.  It has to stay
 * a macro because usage() pastes it into a larger string literal.
 */
#define SOCKET_PATH          "/var/lock/qemu-nbd-%s"

/* getopt_long() return values for the options that have no short form. */
enum {
    QEMU_NBD_OPT_CACHE   = 1,
    QEMU_NBD_OPT_AIO     = 2,
    QEMU_NBD_OPT_DISCARD = 3
};
B
bellard 已提交
44

P
Paolo Bonzini 已提交
45
/* The export being served; created in main() and handed to new clients. */
static NBDExport *exp;
/* Non-zero when -v/--verbose was given. */
static int verbose;
/* Path of the image being exported (the FILE argument). */
static char *srcpath;
/* Unix socket path (-k), or the path generated from SOCKET_PATH for -c. */
static char *sockpath;
/* Non-zero when -t/--persistent was given: keep serving after the last
 * client disconnects.
 */
static int persistent = 0;

/*
 * Server life cycle.  RUNNING -> TERMINATE is requested by the SIGTERM
 * handler or by the last client going away; main() then moves to
 * TERMINATING while the export is being closed and nbd_export_closed()
 * finally sets TERMINATED.
 *
 * The variable is written from a signal handler, so it is declared as
 * volatile sig_atomic_t rather than as a plain enum object.
 */
enum { RUNNING, TERMINATE, TERMINATING, TERMINATED };
static volatile sig_atomic_t state;

/* Maximum number of simultaneous clients (-e/--shared). */
static int shared = 1;
/* Number of currently connected clients. */
static int nb_fds;
B
bellard 已提交
53 54 55

static void usage(const char *name)
{
56
    (printf) (
B
bellard 已提交
57 58 59
"Usage: %s [OPTIONS] FILE\n"
"QEMU Disk Network Block Device Server\n"
"\n"
60 61 62 63
"  -h, --help           display this help and exit\n"
"  -V, --version        output version information and exit\n"
"\n"
"Connection properties:\n"
64
"  -p, --port=PORT      port to listen on (default `%d')\n"
B
bellard 已提交
65
"  -b, --bind=IFACE     interface to bind to (default `0.0.0.0')\n"
66 67
"  -k, --socket=PATH    path to the unix socket\n"
"                       (default '"SOCKET_PATH"')\n"
68
"  -e, --shared=NUM     device can be shared by NUM clients (default '1')\n"
69
"  -t, --persistent     don't exit on the last connection\n"
B
bellard 已提交
70 71
"  -v, --verbose        display extra debugging information\n"
"\n"
72 73 74 75 76 77 78 79 80 81 82 83
"Exposing part of the image:\n"
"  -o, --offset=OFFSET  offset into the image\n"
"  -P, --partition=NUM  only expose partition NUM\n"
"\n"
#ifdef __linux__
"Kernel NBD client support:\n"
"  -c, --connect=DEV    connect FILE to the local NBD device DEV\n"
"  -d, --disconnect     disconnect the specified device\n"
"\n"
#endif
"\n"
"Block device options:\n"
W
Wenchao Xia 已提交
84
"  -f, --format=FORMAT  set image format (raw, qcow2, ...)\n"
85
"  -r, --read-only      export read-only\n"
86 87 88 89 90 91 92 93
"  -s, --snapshot       use FILE as an external snapshot, create a temporary\n"
"                       file with backing_file=FILE, redirect the write to\n"
"                       the temporary one\n"
"  -l, --load-snapshot=SNAPSHOT_PARAM\n"
"                       load an internal snapshot inside FILE and export it\n"
"                       as an read-only device, SNAPSHOT_PARAM format is\n"
"                       'snapshot.id=[ID],snapshot.name=[NAME]', or\n"
"                       '[ID_OR_NAME]'\n"
94
"  -n, --nocache        disable host cache\n"
95 96 97 98
"      --cache=MODE     set cache mode (none, writeback, ...)\n"
#ifdef CONFIG_LINUX_AIO
"      --aio=MODE       set AIO mode (native or threads)\n"
#endif
99 100
"\n"
"Report bugs to <qemu-devel@nongnu.org>\n"
101
    , name, NBD_DEFAULT_PORT, "DEVICE");
B
bellard 已提交
102 103 104 105 106
}

/*
 * Print the version and copyright banner to stdout.
 *
 * name: program name printed in front of the version number.
 */
static void version(const char *name)
{
    printf(
"%s version 0.0.1\n"
"Written by Anthony Liguori.\n"
"\n"
"Copyright (C) 2006 Anthony Liguori <anthony@codemonkey.ws>.\n"
"This is free software; see the source for copying conditions.  There is NO\n"
"warranty; not even for MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.\n"
    , name);
}

/*
 * Decoded form of one 16-byte partition table entry.
 *
 * Both cylinder fields are 10-bit values (8 bits from one byte plus 2 bits
 * taken from the sector byte), so they must be wider than uint8_t.
 */
struct partition_record
{
    uint8_t bootable;
    uint8_t start_head;
    uint32_t start_cylinder;
    uint8_t start_sector;
    uint8_t system;
    uint8_t end_head;
    uint32_t end_cylinder;
    uint8_t end_sector;
    uint32_t start_sector_abs;
    uint32_t nb_sectors_abs;
};

/*
 * Decode the 16 bytes at p into *r.
 *
 * p: raw partition table entry; bytes p[0]..p[15] are read.
 * r: destination record; every field is overwritten.
 *
 * The two 32-bit fields are stored least-significant byte first.  Each byte
 * is converted to uint32_t before shifting: a plain "p[11] << 24" promotes
 * the byte to (signed) int and overflows it when the top bit is set.
 */
static void read_partition(uint8_t *p, struct partition_record *r)
{
    r->bootable = p[0];
    r->start_head = p[1];
    /* The upper two bits of the sector byte are cylinder bits 8 and 9. */
    r->start_cylinder = p[3] | ((p[2] << 2) & 0x0300);
    r->start_sector = p[2] & 0x3f;
    r->system = p[4];
    r->end_head = p[5];
    r->end_cylinder = p[7] | ((p[6] << 2) & 0x300);
    r->end_sector = p[6] & 0x3f;
    r->start_sector_abs = (uint32_t)p[8] | (uint32_t)p[9] << 8 |
                          (uint32_t)p[10] << 16 | (uint32_t)p[11] << 24;
    r->nb_sectors_abs = (uint32_t)p[12] | (uint32_t)p[13] << 8 |
                        (uint32_t)p[14] << 16 | (uint32_t)p[15] << 24;
}

/*
 * Locate partition number `partition` in the partition table stored in the
 * first sector of bs.
 *
 * bs:        image to inspect.
 * partition: 1-based partition number; 1..4 select the primary entries,
 *            higher numbers select entries found inside an extended
 *            partition (system id 0x05 or 0x0F).
 * offset:    on success, receives the partition start in bytes.
 * size:      on success, receives the partition length in bytes.
 *
 * Returns 0 on success, -EINVAL if sector 0 does not end with the 0x55 0xAA
 * signature, and -ENOENT if no matching entry exists.  A failed sector read
 * does not return: the process exits through err().
 *
 * NOTE(review): entries read from the extended partition's first sector are
 * used as absolute sector numbers and that sector's signature is not
 * checked; confirm against the on-disk layout before relying on logical
 * partitions.
 */
static int find_partition(BlockDriverState *bs, int partition,
                          off_t *offset, off_t *size)
{
    struct partition_record mbr[4];
    uint8_t data[512];
    int i;
    int ext_partnum = 4;
    int ret;

    if ((ret = bdrv_read(bs, 0, data, 1)) < 0) {
        errno = -ret;
        err(EXIT_FAILURE, "error while reading");
    }

    if (data[510] != 0x55 || data[511] != 0xaa) {
        return -EINVAL;
    }

    /* The four primary entries start at byte 446, 16 bytes each. */
    for (i = 0; i < 4; i++) {
        read_partition(&data[446 + 16 * i], &mbr[i]);

        /* Skip unused slots. */
        if (!mbr[i].nb_sectors_abs)
            continue;

        if (mbr[i].system == 0xF || mbr[i].system == 0x5) {
            struct partition_record ext[4];
            uint8_t data1[512];
            int j;

            if ((ret = bdrv_read(bs, mbr[i].start_sector_abs, data1, 1)) < 0) {
                errno = -ret;
                err(EXIT_FAILURE, "error while reading");
            }

            for (j = 0; j < 4; j++) {
                read_partition(&data1[446 + 16 * j], &ext[j]);
                if (!ext[j].nb_sectors_abs)
                    continue;

                if ((ext_partnum + j + 1) == partition) {
                    /* Sectors are 512 bytes, hence the shift by 9. */
                    *offset = (uint64_t)ext[j].start_sector_abs << 9;
                    *size = (uint64_t)ext[j].nb_sectors_abs << 9;
                    return 0;
                }
            }
            ext_partnum += 4;
        } else if ((i + 1) == partition) {
            *offset = (uint64_t)mbr[i].start_sector_abs << 9;
            *size = (uint64_t)mbr[i].nb_sectors_abs << 9;
            return 0;
        }
    }

    return -ENOENT;
}

P
Paolo Bonzini 已提交
200 201
static void termsig_handler(int signum)
{
202
    state = TERMINATE;
P
Paolo Bonzini 已提交
203
    qemu_notify_event();
P
Paolo Bonzini 已提交
204 205
}

206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225
/*
 * Format "address:port" into buf (at most len bytes, always terminated by
 * snprintf).  An address that contains a colon is taken to be an IPv6
 * literal and is wrapped in square brackets.
 */
static void combine_addr(char *buf, size_t len, const char* address,
                         uint16_t port)
{
    const char *layout = "%s:%u";

    if (strchr(address, ':') != NULL) {
        layout = "[%s]:%u";
    }
    snprintf(buf, len, layout, address, port);
}

/*
 * Create a listening TCP socket on address:port.
 *
 * Returns the value of inet_listen(); if that call reported an error
 * through its Error argument, the message is printed with error_report()
 * and the Error is freed before returning.
 */
static int tcp_socket_incoming(const char *address, uint16_t port)
{
    char address_and_port[128];
    Error *local_err = NULL;
    int fd;

    combine_addr(address_and_port, sizeof(address_and_port), address, port);
    fd = inet_listen(address_and_port, NULL, 0, SOCK_STREAM, 0, &local_err);

    if (local_err != NULL) {
        error_report("%s", error_get_pretty(local_err));
        error_free(local_err);
    }
    return fd;
}

/*
 * Create a listening unix socket at path.
 *
 * Returns the value of unix_listen(); an error reported through the Error
 * argument is printed with error_report() and freed.
 */
static int unix_socket_incoming(const char *path)
{
    Error *local_err = NULL;
    int fd = unix_listen(path, NULL, 0, &local_err);

    if (local_err != NULL) {
        error_report("%s", error_get_pretty(local_err));
        error_free(local_err);
    }
    return fd;
}

/*
 * Connect to the unix socket at path.
 *
 * Returns the value of unix_connect(); an error reported through the Error
 * argument is printed with error_report() and freed.
 */
static int unix_socket_outgoing(const char *path)
{
    Error *local_err = NULL;
    int fd = unix_connect(path, &local_err);

    if (local_err != NULL) {
        error_report("%s", error_get_pretty(local_err));
        error_free(local_err);
    }
    return fd;
}

P
Paolo Bonzini 已提交
256
/*
 * Thread body: open and immediately close the NBD device node.
 *
 * arg: path of the device node (char *).
 * Always returns NULL; a failed open() is silently ignored.
 */
static void *show_parts(void *arg)
{
    char *device = arg;
    int nbd;

    /* linux just needs an open() to trigger
     * the partition table update
     * but remember to load the module with max_part != 0 :
     *     modprobe nbd max_part=63
     */
    nbd = open(device, O_RDWR);
    if (nbd >= 0) {
        close(nbd);
    }
    return NULL;
}
272

P
Paolo Bonzini 已提交
273 274
static void *nbd_client_thread(void *arg)
{
275
    char *device = arg;
P
Paolo Bonzini 已提交
276 277 278
    off_t size;
    size_t blocksize;
    uint32_t nbdflags;
279
    int fd, sock;
P
Paolo Bonzini 已提交
280 281 282
    int ret;
    pthread_t show_parts_thread;

283
    sock = unix_socket_outgoing(sockpath);
284
    if (sock < 0) {
285 286
        goto out;
    }
P
Paolo Bonzini 已提交
287 288 289

    ret = nbd_receive_negotiate(sock, NULL, &nbdflags,
                                &size, &blocksize);
290
    if (ret < 0) {
P
Paolo Bonzini 已提交
291
        goto out_socket;
P
Paolo Bonzini 已提交
292 293
    }

294
    fd = open(device, O_RDWR);
295
    if (fd < 0) {
296
        /* Linux-only, we can use %m in printf.  */
H
Hani Benhabiles 已提交
297
        fprintf(stderr, "Failed to open %s: %m\n", device);
P
Paolo Bonzini 已提交
298
        goto out_socket;
299 300
    }

P
Paolo Bonzini 已提交
301
    ret = nbd_init(fd, sock, nbdflags, size, blocksize);
302
    if (ret < 0) {
P
Paolo Bonzini 已提交
303
        goto out_fd;
P
Paolo Bonzini 已提交
304 305 306
    }

    /* update partition table */
307
    pthread_create(&show_parts_thread, NULL, show_parts, device);
P
Paolo Bonzini 已提交
308

309 310 311 312 313 314 315
    if (verbose) {
        fprintf(stderr, "NBD device %s is now connected to %s\n",
                device, srcpath);
    } else {
        /* Close stderr so that the qemu-nbd process exits.  */
        dup2(STDOUT_FILENO, STDERR_FILENO);
    }
P
Paolo Bonzini 已提交
316 317 318

    ret = nbd_client(fd);
    if (ret) {
P
Paolo Bonzini 已提交
319
        goto out_fd;
320
    }
P
Paolo Bonzini 已提交
321 322 323 324
    close(fd);
    kill(getpid(), SIGTERM);
    return (void *) EXIT_SUCCESS;

P
Paolo Bonzini 已提交
325 326 327 328
out_fd:
    close(fd);
out_socket:
    closesocket(sock);
P
Paolo Bonzini 已提交
329 330 331
out:
    kill(getpid(), SIGTERM);
    return (void *) EXIT_FAILURE;
332 333
}

P
Paolo Bonzini 已提交
334 335 336 337 338
/*
 * Read-poll gate registered together with nbd_accept(): non-zero while the
 * number of connected clients is still below the --shared limit.
 */
static int nbd_can_accept(void *opaque)
{
    (void)opaque;

    return shared > nb_fds;
}

339 340 341 342 343 344
/*
 * Close notification passed to nbd_export_new(): the export has finished
 * closing, so the main loop may leave.  It is only expected while main() is
 * in the TERMINATING state.
 */
static void nbd_export_closed(NBDExport *exp)
{
    (void)exp;

    assert(TERMINATING == state);
    state = TERMINATED;
}

345
/*
 * Close notification passed to nbd_client_new(): one client has gone away.
 *
 * Decrements the client count and, when that was the last client and the
 * server is neither persistent nor already shutting down, requests
 * termination.  The main loop is woken up and the client reference is
 * dropped with nbd_client_put().
 */
static void nbd_client_closed(NBDClient *client)
{
    nb_fds--;
    if (nb_fds == 0 && !persistent && state == RUNNING) {
        state = TERMINATE;
    }
    qemu_notify_event();
    nbd_client_put(client);
}

static void nbd_accept(void *opaque)
{
    int server_fd = (uintptr_t) opaque;
    struct sockaddr_in addr;
    socklen_t addr_len = sizeof(addr);

    int fd = accept(server_fd, (struct sockaddr *)&addr, &addr_len);
P
Paolo Bonzini 已提交
362 363 364 365 366
    if (fd < 0) {
        perror("accept");
        return;
    }

367 368 369 370 371
    if (state >= TERMINATE) {
        close(fd);
        return;
    }

372
    if (nbd_client_new(exp, fd, nbd_client_closed)) {
P
Paolo Bonzini 已提交
373
        nb_fds++;
374
    } else {
375
        shutdown(fd, 2);
376
        close(fd);
P
Paolo Bonzini 已提交
377 378 379
    }
}

B
bellard 已提交
380 381 382
int main(int argc, char **argv)
{
    BlockDriverState *bs;
383
    BlockDriver *drv;
B
bellard 已提交
384
    off_t dev_offset = 0;
P
Paolo Bonzini 已提交
385
    uint32_t nbdflags = 0;
386
    bool disconnect = false;
B
bellard 已提交
387
    const char *bindto = "0.0.0.0";
388
    char *device = NULL;
389
    int port = NBD_DEFAULT_PORT;
B
bellard 已提交
390
    off_t fd_size;
391 392 393
    QemuOpts *sn_opts = NULL;
    const char *sn_id_or_name = NULL;
    const char *sopt = "hVb:o:p:rsnP:c:dvk:e:f:tl:";
B
bellard 已提交
394
    struct option lopt[] = {
395 396 397 398 399 400 401 402 403 404 405
        { "help", 0, NULL, 'h' },
        { "version", 0, NULL, 'V' },
        { "bind", 1, NULL, 'b' },
        { "port", 1, NULL, 'p' },
        { "socket", 1, NULL, 'k' },
        { "offset", 1, NULL, 'o' },
        { "read-only", 0, NULL, 'r' },
        { "partition", 1, NULL, 'P' },
        { "connect", 1, NULL, 'c' },
        { "disconnect", 0, NULL, 'd' },
        { "snapshot", 0, NULL, 's' },
406
        { "load-snapshot", 1, NULL, 'l' },
407
        { "nocache", 0, NULL, 'n' },
408 409 410 411
        { "cache", 1, NULL, QEMU_NBD_OPT_CACHE },
#ifdef CONFIG_LINUX_AIO
        { "aio", 1, NULL, QEMU_NBD_OPT_AIO },
#endif
P
Paolo Bonzini 已提交
412
        { "discard", 1, NULL, QEMU_NBD_OPT_DISCARD },
413
        { "shared", 1, NULL, 'e' },
414
        { "format", 1, NULL, 'f' },
415 416 417
        { "persistent", 0, NULL, 't' },
        { "verbose", 0, NULL, 'v' },
        { NULL, 0, NULL, 0 }
B
bellard 已提交
418 419 420 421 422
    };
    int ch;
    int opt_ind = 0;
    int li;
    char *end;
423
    int flags = BDRV_O_RDWR;
B
bellard 已提交
424
    int partition = -1;
425
    int ret;
426
    int fd;
427
    bool seen_cache = false;
P
Paolo Bonzini 已提交
428
    bool seen_discard = false;
429 430 431
#ifdef CONFIG_LINUX_AIO
    bool seen_aio = false;
#endif
P
Paolo Bonzini 已提交
432
    pthread_t client_thread;
433
    const char *fmt = NULL;
434
    Error *local_err = NULL;
B
bellard 已提交
435

P
Paolo Bonzini 已提交
436 437 438
    /* The client thread uses SIGTERM to interrupt the server.  A signal
     * handler ensures that "qemu-nbd -v -c" exits with a nice status code.
     */
P
Paolo Bonzini 已提交
439 440 441 442
    struct sigaction sa_sigterm;
    memset(&sa_sigterm, 0, sizeof(sa_sigterm));
    sa_sigterm.sa_handler = termsig_handler;
    sigaction(SIGTERM, &sa_sigterm, NULL);
443
    qemu_init_exec_dir(argv[0]);
P
Paolo Bonzini 已提交
444

B
bellard 已提交
445 446 447
    while ((ch = getopt_long(argc, argv, sopt, lopt, &opt_ind)) != -1) {
        switch (ch) {
        case 's':
448 449 450
            flags |= BDRV_O_SNAPSHOT;
            break;
        case 'n':
451 452 453 454 455 456 457 458 459 460
            optarg = (char *) "none";
            /* fallthrough */
        case QEMU_NBD_OPT_CACHE:
            if (seen_cache) {
                errx(EXIT_FAILURE, "-n and --cache can only be specified once");
            }
            seen_cache = true;
            if (bdrv_parse_cache_flags(optarg, &flags) == -1) {
                errx(EXIT_FAILURE, "Invalid cache mode `%s'", optarg);
            }
B
bellard 已提交
461
            break;
462 463 464 465 466 467 468 469 470 471 472 473 474 475 476
#ifdef CONFIG_LINUX_AIO
        case QEMU_NBD_OPT_AIO:
            if (seen_aio) {
                errx(EXIT_FAILURE, "--aio can only be specified once");
            }
            seen_aio = true;
            if (!strcmp(optarg, "native")) {
                flags |= BDRV_O_NATIVE_AIO;
            } else if (!strcmp(optarg, "threads")) {
                /* this is the default */
            } else {
               errx(EXIT_FAILURE, "invalid aio mode `%s'", optarg);
            }
            break;
#endif
P
Paolo Bonzini 已提交
477 478 479 480 481 482 483 484 485
        case QEMU_NBD_OPT_DISCARD:
            if (seen_discard) {
                errx(EXIT_FAILURE, "--discard can only be specified once");
            }
            seen_discard = true;
            if (bdrv_parse_discard_flags(optarg, &flags) == -1) {
                errx(EXIT_FAILURE, "Invalid discard mode `%s'", optarg);
            }
            break;
B
bellard 已提交
486 487 488 489 490 491
        case 'b':
            bindto = optarg;
            break;
        case 'p':
            li = strtol(optarg, &end, 0);
            if (*end) {
492
                errx(EXIT_FAILURE, "Invalid port `%s'", optarg);
B
bellard 已提交
493 494
            }
            if (li < 1 || li > 65535) {
495
                errx(EXIT_FAILURE, "Port out of range `%s'", optarg);
B
bellard 已提交
496 497 498 499 500 501
            }
            port = (uint16_t)li;
            break;
        case 'o':
                dev_offset = strtoll (optarg, &end, 0);
            if (*end) {
502
                errx(EXIT_FAILURE, "Invalid offset `%s'", optarg);
B
bellard 已提交
503 504
            }
            if (dev_offset < 0) {
505
                errx(EXIT_FAILURE, "Offset must be positive `%s'", optarg);
B
bellard 已提交
506 507
            }
            break;
508 509 510 511 512 513 514 515 516 517 518
        case 'l':
            if (strstart(optarg, SNAPSHOT_OPT_BASE, NULL)) {
                sn_opts = qemu_opts_parse(&internal_snapshot_opts, optarg, 0);
                if (!sn_opts) {
                    errx(EXIT_FAILURE, "Failed in parsing snapshot param `%s'",
                         optarg);
                }
            } else {
                sn_id_or_name = optarg;
            }
            /* fall through */
B
bellard 已提交
519
        case 'r':
P
Paolo Bonzini 已提交
520
            nbdflags |= NBD_FLAG_READ_ONLY;
N
Naphtali Sprei 已提交
521
            flags &= ~BDRV_O_RDWR;
B
bellard 已提交
522 523 524 525
            break;
        case 'P':
            partition = strtol(optarg, &end, 0);
            if (*end)
526
                errx(EXIT_FAILURE, "Invalid partition `%s'", optarg);
B
bellard 已提交
527
            if (partition < 1 || partition > 8)
528
                errx(EXIT_FAILURE, "Invalid partition %d", partition);
B
bellard 已提交
529
            break;
530
        case 'k':
P
Paolo Bonzini 已提交
531 532
            sockpath = optarg;
            if (sockpath[0] != '/')
533
                errx(EXIT_FAILURE, "socket path must be absolute\n");
534 535 536 537 538 539 540
            break;
        case 'd':
            disconnect = true;
            break;
        case 'c':
            device = optarg;
            break;
541 542 543
        case 'e':
            shared = strtol(optarg, &end, 0);
            if (*end) {
544
                errx(EXIT_FAILURE, "Invalid shared device number '%s'", optarg);
545 546
            }
            if (shared < 1) {
547
                errx(EXIT_FAILURE, "Shared device number must be greater than 0\n");
548 549
            }
            break;
550 551 552
        case 'f':
            fmt = optarg;
            break;
553 554 555
	case 't':
	    persistent = 1;
	    break;
B
bellard 已提交
556 557 558 559 560 561 562 563 564 565 566 567
        case 'v':
            verbose = 1;
            break;
        case 'V':
            version(argv[0]);
            exit(0);
            break;
        case 'h':
            usage(argv[0]);
            exit(0);
            break;
        case '?':
568
            errx(EXIT_FAILURE, "Try `%s --help' for more information.",
B
bellard 已提交
569 570 571 572 573
                 argv[0]);
        }
    }

    if ((argc - optind) != 1) {
574
        errx(EXIT_FAILURE, "Invalid number of argument.\n"
B
bellard 已提交
575 576 577 578
             "Try `%s --help' for more information.",
             argv[0]);
    }

579 580
    if (disconnect) {
        fd = open(argv[optind], O_RDWR);
581
        if (fd < 0) {
R
Ryota Ozaki 已提交
582
            err(EXIT_FAILURE, "Cannot open %s", argv[optind]);
583
        }
584 585 586 587 588 589 590 591 592
        nbd_disconnect(fd);

        close(fd);

        printf("%s disconnected\n", argv[optind]);

	return 0;
    }

593 594 595 596 597
    if (device && !verbose) {
        int stderr_fd[2];
        pid_t pid;
        int ret;

598
        if (qemu_pipe(stderr_fd) < 0) {
599 600 601 602 603 604 605 606 607
            err(EXIT_FAILURE, "Error setting up communication pipe");
        }

        /* Now daemonize, but keep a communication channel open to
         * print errors and exit with the proper status code.
         */
        pid = fork();
        if (pid == 0) {
            close(stderr_fd[0]);
608
            ret = qemu_daemon(1, 0);
609 610 611

            /* Temporarily redirect stderr to the parent's pipe...  */
            dup2(stderr_fd[1], STDERR_FILENO);
612
            if (ret < 0) {
613 614 615 616 617 618 619 620 621 622 623 624 625 626 627 628 629
                err(EXIT_FAILURE, "Failed to daemonize");
            }

            /* ... close the descriptor we inherited and go on.  */
            close(stderr_fd[1]);
        } else {
            bool errors = false;
            char *buf;

            /* In the parent.  Print error messages from the child until
             * it closes the pipe.
             */
            close(stderr_fd[1]);
            buf = g_malloc(1024);
            while ((ret = read(stderr_fd[0], buf, 1024)) > 0) {
                errors = true;
                ret = qemu_write_full(STDERR_FILENO, buf, ret);
630
                if (ret < 0) {
631 632 633
                    exit(EXIT_FAILURE);
                }
            }
634
            if (ret < 0) {
635 636 637 638 639 640 641 642 643 644
                err(EXIT_FAILURE, "Cannot read from daemon");
            }

            /* Usually the daemon should not print any message.
             * Exit with zero status in that case.
             */
            exit(errors);
        }
    }

645 646 647
    if (device != NULL && sockpath == NULL) {
        sockpath = g_malloc(128);
        snprintf(sockpath, 128, SOCKET_PATH, basename(device));
648 649
    }

650
    qemu_init_main_loop();
651 652 653
    bdrv_init();
    atexit(bdrv_close_all);

654 655 656 657 658 659 660 661 662
    if (fmt) {
        drv = bdrv_find_format(fmt);
        if (!drv) {
            errx(EXIT_FAILURE, "Unknown file format '%s'", fmt);
        }
    } else {
        drv = NULL;
    }

K
Kevin Wolf 已提交
663 664
    bs = bdrv_new("hda", &error_abort);

665
    srcpath = argv[optind];
666
    ret = bdrv_open(&bs, srcpath, NULL, NULL, flags, drv, &local_err);
667
    if (ret < 0) {
668
        errno = -ret;
669 670
        err(EXIT_FAILURE, "Failed to bdrv_open '%s': %s", argv[optind],
            error_get_pretty(local_err));
671 672
    }

673 674 675 676 677 678 679 680 681 682 683 684 685 686 687 688
    if (sn_opts) {
        ret = bdrv_snapshot_load_tmp(bs,
                                     qemu_opt_get(sn_opts, SNAPSHOT_OPT_ID),
                                     qemu_opt_get(sn_opts, SNAPSHOT_OPT_NAME),
                                     &local_err);
    } else if (sn_id_or_name) {
        ret = bdrv_snapshot_load_tmp_by_id_or_name(bs, sn_id_or_name,
                                                   &local_err);
    }
    if (ret < 0) {
        errno = -ret;
        err(EXIT_FAILURE,
            "Failed to load snapshot: %s",
            error_get_pretty(local_err));
    }

P
Paolo Bonzini 已提交
689
    fd_size = bdrv_getlength(bs);
690

691 692 693 694 695 696
    if (partition != -1) {
        ret = find_partition(bs, partition, &dev_offset, &fd_size);
        if (ret < 0) {
            errno = -ret;
            err(EXIT_FAILURE, "Could not find partition %d", partition);
        }
697 698
    }

699
    exp = nbd_export_new(bs, dev_offset, fd_size, nbdflags, nbd_export_closed);
700

P
Paolo Bonzini 已提交
701
    if (sockpath) {
P
Paolo Bonzini 已提交
702
        fd = unix_socket_incoming(sockpath);
703
    } else {
P
Paolo Bonzini 已提交
704
        fd = tcp_socket_incoming(bindto, port);
705 706
    }

707
    if (fd < 0) {
B
bellard 已提交
708
        return 1;
P
Paolo Bonzini 已提交
709
    }
P
Paolo Bonzini 已提交
710 711 712 713

    if (device) {
        int ret;

714
        ret = pthread_create(&client_thread, NULL, nbd_client_thread, device);
P
Paolo Bonzini 已提交
715 716 717 718 719 720 721 722 723
        if (ret != 0) {
            errx(EXIT_FAILURE, "Failed to create client thread: %s",
                 strerror(ret));
        }
    } else {
        /* Shut up GCC warnings.  */
        memset(&client_thread, 0, sizeof(client_thread));
    }

P
Paolo Bonzini 已提交
724 725
    qemu_set_fd_handler2(fd, nbd_can_accept, nbd_accept, NULL,
                         (void *)(uintptr_t)fd);
B
bellard 已提交
726

727 728 729 730 731 732
    /* now when the initialization is (almost) complete, chdir("/")
     * to free any busy filesystems */
    if (chdir("/") < 0) {
        err(EXIT_FAILURE, "Could not chdir to root directory");
    }

733
    state = RUNNING;
734
    do {
P
Paolo Bonzini 已提交
735
        main_loop_wait(false);
736 737 738 739 740 741 742
        if (state == TERMINATE) {
            state = TERMINATING;
            nbd_export_close(exp);
            nbd_export_put(exp);
            exp = NULL;
        }
    } while (state != TERMINATED);
B
bellard 已提交
743

744
    bdrv_close(bs);
P
Paolo Bonzini 已提交
745 746 747
    if (sockpath) {
        unlink(sockpath);
    }
B
bellard 已提交
748

749 750 751 752
    if (sn_opts) {
        qemu_opts_del(sn_opts);
    }

P
Paolo Bonzini 已提交
753 754 755 756 757 758 759
    if (device) {
        void *ret;
        pthread_join(client_thread, &ret);
        exit(ret != NULL);
    } else {
        exit(EXIT_SUCCESS);
    }
B
bellard 已提交
760
}