/*
 *  Copyright (C) 2005  Anthony Liguori <anthony@codemonkey.ws>
 *
 *  Network Block Device
 *
 *  This program is free software; you can redistribute it and/or modify
 *  it under the terms of the GNU General Public License as published by
 *  the Free Software Foundation; under version 2 of the License.
 *
 *  This program is distributed in the hope that it will be useful,
 *  but WITHOUT ANY WARRANTY; without even the implied warranty of
 *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 *  GNU General Public License for more details.
 *
 *  You should have received a copy of the GNU General Public License
 *  along with this program; if not, see <http://www.gnu.org/licenses/>.
 */

#include "qemu-common.h"
#include "block/block.h"
#include "block/nbd.h"
#include "qemu/main-loop.h"
#include "qemu/sockets.h"
#include "qemu/error-report.h"
#include "block/snapshot.h"

#include <stdarg.h>
#include <stdio.h>
#include <limits.h>
#include <getopt.h>
#include <err.h>
#include <sys/types.h>
#include <sys/socket.h>
#include <netinet/in.h>
#include <netinet/tcp.h>
#include <arpa/inet.h>
#include <signal.h>
#include <libgen.h>
#include <pthread.h>

#define SOCKET_PATH          "/var/lock/qemu-nbd-%s"
#define QEMU_NBD_OPT_CACHE   1
#define QEMU_NBD_OPT_AIO     2
#define QEMU_NBD_OPT_DISCARD 3
B
bellard 已提交
44

P
Paolo Bonzini 已提交
45
static NBDExport *exp;
46
static int verbose;
P
Paolo Bonzini 已提交
47 48
static char *srcpath;
static char *sockpath;
49 50
static int persistent = 0;
static enum { RUNNING, TERMINATE, TERMINATING, TERMINATED } state;
P
Paolo Bonzini 已提交
51 52
static int shared = 1;
static int nb_fds;

static void usage(const char *name)
{
56
    (printf) (
B
bellard 已提交
57 58 59
"Usage: %s [OPTIONS] FILE\n"
"QEMU Disk Network Block Device Server\n"
"\n"
60 61 62 63
"  -h, --help           display this help and exit\n"
"  -V, --version        output version information and exit\n"
"\n"
"Connection properties:\n"
64
"  -p, --port=PORT      port to listen on (default `%d')\n"
B
bellard 已提交
65
"  -b, --bind=IFACE     interface to bind to (default `0.0.0.0')\n"
66 67
"  -k, --socket=PATH    path to the unix socket\n"
"                       (default '"SOCKET_PATH"')\n"
68
"  -e, --shared=NUM     device can be shared by NUM clients (default '1')\n"
69
"  -t, --persistent     don't exit on the last connection\n"
B
bellard 已提交
70 71
"  -v, --verbose        display extra debugging information\n"
"\n"
72 73 74 75 76 77 78 79 80 81 82 83
"Exposing part of the image:\n"
"  -o, --offset=OFFSET  offset into the image\n"
"  -P, --partition=NUM  only expose partition NUM\n"
"\n"
#ifdef __linux__
"Kernel NBD client support:\n"
"  -c, --connect=DEV    connect FILE to the local NBD device DEV\n"
"  -d, --disconnect     disconnect the specified device\n"
"\n"
#endif
"\n"
"Block device options:\n"
W
Wenchao Xia 已提交
84
"  -f, --format=FORMAT  set image format (raw, qcow2, ...)\n"
85
"  -r, --read-only      export read-only\n"
86 87 88 89 90 91 92 93
"  -s, --snapshot       use FILE as an external snapshot, create a temporary\n"
"                       file with backing_file=FILE, redirect the write to\n"
"                       the temporary one\n"
"  -l, --load-snapshot=SNAPSHOT_PARAM\n"
"                       load an internal snapshot inside FILE and export it\n"
"                       as an read-only device, SNAPSHOT_PARAM format is\n"
"                       'snapshot.id=[ID],snapshot.name=[NAME]', or\n"
"                       '[ID_OR_NAME]'\n"
94
"  -n, --nocache        disable host cache\n"
95 96 97 98
"      --cache=MODE     set cache mode (none, writeback, ...)\n"
#ifdef CONFIG_LINUX_AIO
"      --aio=MODE       set AIO mode (native or threads)\n"
#endif
99 100
"\n"
"Report bugs to <qemu-devel@nongnu.org>\n"
101
    , name, NBD_DEFAULT_PORT, "DEVICE");
B
bellard 已提交
102 103 104 105 106
}

/*
 * Print the version and copyright banner to stdout.
 *
 * @name: program name printed in front of the version number.
 */
static void version(const char *name)
{
    printf(
"%s version 0.0.1\n"
"Written by Anthony Liguori.\n"
"\n"
"Copyright (C) 2006 Anthony Liguori <anthony@codemonkey.ws>.\n"
"This is free software; see the source for copying conditions.  There is NO\n"
"warranty; not even for MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.\n"
    , name);
}

/*
 * Decoded form of one 16-byte partition table entry, as filled in by
 * read_partition().
 *
 * Both cylinder fields hold 10-bit values (8 bits from one byte plus 2 bits
 * borrowed from the sector byte), so they must be wider than uint8_t.
 */
struct partition_record
{
    uint8_t bootable;
    uint8_t start_head;
    uint32_t start_cylinder;
    uint8_t start_sector;
    uint8_t system;
    uint8_t end_head;
    uint32_t end_cylinder;
    uint8_t end_sector;
    uint32_t start_sector_abs;
    uint32_t nb_sectors_abs;
};

/*
 * Assemble a 32-bit value from four bytes stored least significant first.
 * Each byte is widened to uint32_t before shifting so that a top byte of
 * 0x80 or more is never shifted into the sign bit of an int.
 */
static uint32_t partition_le32(const uint8_t *p)
{
    return (uint32_t)p[0]
         | ((uint32_t)p[1] << 8)
         | ((uint32_t)p[2] << 16)
         | ((uint32_t)p[3] << 24);
}

/*
 * Decode the 16-byte partition table entry at @p into @r.
 *
 * @p: points at (at least) 16 readable bytes.
 * @r: receives the decoded fields; every member is written.
 */
static void read_partition(const uint8_t *p, struct partition_record *r)
{
    r->bootable = p[0];
    r->start_head = p[1];
    /* Bits 6-7 of the sector byte are bits 8-9 of the cylinder number. */
    r->start_cylinder = p[3] | (((uint32_t)p[2] << 2) & 0x0300);
    r->start_sector = p[2] & 0x3f;
    r->system = p[4];
    r->end_head = p[5];
    r->end_cylinder = p[7] | (((uint32_t)p[6] << 2) & 0x0300);
    r->end_sector = p[6] & 0x3f;
    r->start_sector_abs = partition_le32(&p[8]);
    r->nb_sectors_abs = partition_le32(&p[12]);
}

/*
 * Look up partition number @partition in the partition table stored in
 * sector 0 of @bs.
 *
 * Numbering as implemented here: the four primary entries are partitions
 * 1..4.  Entries of type 0x05/0x0F are treated as extended containers; the
 * four entries read from a container's first sector are numbered from
 * ext_partnum + 1, where ext_partnum starts at 4 and grows by 4 for each
 * container encountered.
 *
 * @offset, @size: on success receive the partition start and length in
 *                 bytes (sector counts shifted left by 9); untouched
 *                 otherwise.
 *
 * Returns 0 on success, -EINVAL if sector 0 does not end in the 0x55 0xAA
 * signature, -ENOENT if no entry matches.  A failed read terminates the
 * process through err().
 */
static int find_partition(BlockDriverState *bs, int partition,
                          off_t *offset, off_t *size)
{
    struct partition_record mbr[4];
    uint8_t data[512];
    int i;
    int ext_partnum = 4;
    int ret;

    ret = bdrv_read(bs, 0, data, 1);
    if (ret < 0) {
        errno = -ret;
        err(EXIT_FAILURE, "error while reading");
    }

    if (data[510] != 0x55 || data[511] != 0xaa) {
        return -EINVAL;
    }

    for (i = 0; i < 4; i++) {
        /* The table starts at byte 446; entries are 16 bytes each. */
        read_partition(&data[446 + 16 * i], &mbr[i]);

        if (!mbr[i].nb_sectors_abs) {
            continue;
        }

        if (mbr[i].system == 0xF || mbr[i].system == 0x5) {
            struct partition_record ext[4];
            uint8_t data1[512];
            int j;

            ret = bdrv_read(bs, mbr[i].start_sector_abs, data1, 1);
            if (ret < 0) {
                errno = -ret;
                err(EXIT_FAILURE, "error while reading");
            }

            for (j = 0; j < 4; j++) {
                read_partition(&data1[446 + 16 * j], &ext[j]);
                if (!ext[j].nb_sectors_abs) {
                    continue;
                }

                if ((ext_partnum + j + 1) == partition) {
                    *offset = (uint64_t)ext[j].start_sector_abs << 9;
                    *size = (uint64_t)ext[j].nb_sectors_abs << 9;
                    return 0;
                }
            }
            ext_partnum += 4;
        } else if ((i + 1) == partition) {
            *offset = (uint64_t)mbr[i].start_sector_abs << 9;
            *size = (uint64_t)mbr[i].nb_sectors_abs << 9;
            return 0;
        }
    }

    return -ENOENT;
}

static void termsig_handler(int signum)
{
202
    state = TERMINATE;
P
Paolo Bonzini 已提交
203
    qemu_notify_event();
P
Paolo Bonzini 已提交
204 205
}

/*
 * Format @address and @port as "address:port" into @buf (at most @len
 * bytes, as bounded by snprintf).  An address containing a colon is taken
 * to be an IPv6 literal and is wrapped in square brackets.
 */
static void combine_addr(char *buf, size_t len, const char* address,
                         uint16_t port)
{
    const int has_colon = strchr(address, ':') != NULL;

    if (!has_colon) {
        snprintf(buf, len, "%s:%u", address, port);
        return;
    }

    /* IPv6 literal: brackets keep its colons apart from the port separator */
    snprintf(buf, len, "[%s]:%u", address, port);
}

static int tcp_socket_incoming(const char *address, uint16_t port)
{
    char address_and_port[128];
    Error *local_err = NULL;

    combine_addr(address_and_port, 128, address, port);
    int fd = inet_listen(address_and_port, NULL, 0, SOCK_STREAM, 0, &local_err);

    if (local_err != NULL) {
        qerror_report_err(local_err);
        error_free(local_err);
    }
    return fd;
}

static int unix_socket_incoming(const char *path)
{
    Error *local_err = NULL;
    int fd = unix_listen(path, NULL, 0, &local_err);

    if (local_err != NULL) {
        qerror_report_err(local_err);
        error_free(local_err);
    }
    return fd;
}

static int unix_socket_outgoing(const char *path)
{
    Error *local_err = NULL;
    int fd = unix_connect(path, &local_err);

    if (local_err != NULL) {
        qerror_report_err(local_err);
        error_free(local_err);
    }
    return fd;
}

/*
 * Thread entry point: open and immediately close the device node.
 *
 * @arg: path of the device node (char *).
 *
 * Always returns NULL; a failed open() is silently ignored.
 */
static void *show_parts(void *arg)
{
    char *device = arg;
    int nbd;

    /* linux just needs an open() to trigger
     * the partition table update
     * but remember to load the module with max_part != 0 :
     *     modprobe nbd max_part=63
     */
    nbd = open(device, O_RDWR);
    if (nbd >= 0) {
        close(nbd);
    }
    return NULL;
}
static void *nbd_client_thread(void *arg)
{
275
    char *device = arg;
P
Paolo Bonzini 已提交
276 277 278
    off_t size;
    size_t blocksize;
    uint32_t nbdflags;
279
    int fd, sock;
P
Paolo Bonzini 已提交
280 281 282
    int ret;
    pthread_t show_parts_thread;

283
    sock = unix_socket_outgoing(sockpath);
284
    if (sock < 0) {
285 286
        goto out;
    }
P
Paolo Bonzini 已提交
287 288 289

    ret = nbd_receive_negotiate(sock, NULL, &nbdflags,
                                &size, &blocksize);
290
    if (ret < 0) {
P
Paolo Bonzini 已提交
291
        goto out_socket;
P
Paolo Bonzini 已提交
292 293
    }

294
    fd = open(device, O_RDWR);
295
    if (fd < 0) {
296 297
        /* Linux-only, we can use %m in printf.  */
        fprintf(stderr, "Failed to open %s: %m", device);
P
Paolo Bonzini 已提交
298
        goto out_socket;
299 300
    }

P
Paolo Bonzini 已提交
301
    ret = nbd_init(fd, sock, nbdflags, size, blocksize);
302
    if (ret < 0) {
P
Paolo Bonzini 已提交
303
        goto out_fd;
P
Paolo Bonzini 已提交
304 305 306
    }

    /* update partition table */
307
    pthread_create(&show_parts_thread, NULL, show_parts, device);
P
Paolo Bonzini 已提交
308

309 310 311 312 313 314 315
    if (verbose) {
        fprintf(stderr, "NBD device %s is now connected to %s\n",
                device, srcpath);
    } else {
        /* Close stderr so that the qemu-nbd process exits.  */
        dup2(STDOUT_FILENO, STDERR_FILENO);
    }
P
Paolo Bonzini 已提交
316 317 318

    ret = nbd_client(fd);
    if (ret) {
P
Paolo Bonzini 已提交
319
        goto out_fd;
320
    }
P
Paolo Bonzini 已提交
321 322 323 324
    close(fd);
    kill(getpid(), SIGTERM);
    return (void *) EXIT_SUCCESS;

P
Paolo Bonzini 已提交
325 326 327 328
out_fd:
    close(fd);
out_socket:
    closesocket(sock);
P
Paolo Bonzini 已提交
329 330 331
out:
    kill(getpid(), SIGTERM);
    return (void *) EXIT_FAILURE;
332 333
}

/*
 * Tell the caller whether another client may be accepted: non-zero while
 * the number of connected clients (nb_fds) is below the limit (shared).
 *
 * @opaque: unused.
 */
static int nbd_can_accept(void *opaque)
{
    const int has_free_slot = shared > nb_fds;

    return has_free_slot;
}

/*
 * Close callback registered with nbd_export_new(): record that shutdown is
 * complete.  It must only fire after main() has moved the server to
 * TERMINATING.
 *
 * @exp: unused (shadows the file-scope variable of the same name).
 */
static void nbd_export_closed(NBDExport *exp)
{
    /* TERMINATING -> TERMINATED is the only transition made here */
    assert(state == TERMINATING);

    state = TERMINATED;
}

/*
 * Close callback registered with nbd_client_new(): account for a client
 * that has gone away.
 *
 * When the last client leaves a running, non-persistent server, shutdown is
 * requested by moving to TERMINATE.  The main loop is notified in every
 * case, and the reference to @client is dropped last.
 */
static void nbd_client_closed(NBDClient *client)
{
    nb_fds--;
    if (nb_fds == 0 && !persistent && state == RUNNING) {
        state = TERMINATE;
    }
    qemu_notify_event();
    nbd_client_put(client);
}

static void nbd_accept(void *opaque)
{
    int server_fd = (uintptr_t) opaque;
    struct sockaddr_in addr;
    socklen_t addr_len = sizeof(addr);

    int fd = accept(server_fd, (struct sockaddr *)&addr, &addr_len);
P
Paolo Bonzini 已提交
362 363 364 365 366
    if (fd < 0) {
        perror("accept");
        return;
    }

367 368 369 370 371
    if (state >= TERMINATE) {
        close(fd);
        return;
    }

372
    if (fd >= 0 && nbd_client_new(exp, fd, nbd_client_closed)) {
P
Paolo Bonzini 已提交
373 374 375 376
        nb_fds++;
    }
}

int main(int argc, char **argv)
{
    BlockDriverState *bs;
380
    BlockDriver *drv;
B
bellard 已提交
381
    off_t dev_offset = 0;
P
Paolo Bonzini 已提交
382
    uint32_t nbdflags = 0;
383
    bool disconnect = false;
B
bellard 已提交
384
    const char *bindto = "0.0.0.0";
385
    char *device = NULL;
386
    int port = NBD_DEFAULT_PORT;
B
bellard 已提交
387
    off_t fd_size;
388 389 390
    QemuOpts *sn_opts = NULL;
    const char *sn_id_or_name = NULL;
    const char *sopt = "hVb:o:p:rsnP:c:dvk:e:f:tl:";
B
bellard 已提交
391
    struct option lopt[] = {
392 393 394 395 396 397 398 399 400 401 402
        { "help", 0, NULL, 'h' },
        { "version", 0, NULL, 'V' },
        { "bind", 1, NULL, 'b' },
        { "port", 1, NULL, 'p' },
        { "socket", 1, NULL, 'k' },
        { "offset", 1, NULL, 'o' },
        { "read-only", 0, NULL, 'r' },
        { "partition", 1, NULL, 'P' },
        { "connect", 1, NULL, 'c' },
        { "disconnect", 0, NULL, 'd' },
        { "snapshot", 0, NULL, 's' },
403
        { "load-snapshot", 1, NULL, 'l' },
404
        { "nocache", 0, NULL, 'n' },
405 406 407 408
        { "cache", 1, NULL, QEMU_NBD_OPT_CACHE },
#ifdef CONFIG_LINUX_AIO
        { "aio", 1, NULL, QEMU_NBD_OPT_AIO },
#endif
P
Paolo Bonzini 已提交
409
        { "discard", 1, NULL, QEMU_NBD_OPT_DISCARD },
410
        { "shared", 1, NULL, 'e' },
411
        { "format", 1, NULL, 'f' },
412 413 414
        { "persistent", 0, NULL, 't' },
        { "verbose", 0, NULL, 'v' },
        { NULL, 0, NULL, 0 }
B
bellard 已提交
415 416 417 418 419
    };
    int ch;
    int opt_ind = 0;
    int li;
    char *end;
420
    int flags = BDRV_O_RDWR;
B
bellard 已提交
421
    int partition = -1;
422
    int ret;
423
    int fd;
424
    bool seen_cache = false;
P
Paolo Bonzini 已提交
425
    bool seen_discard = false;
426 427 428
#ifdef CONFIG_LINUX_AIO
    bool seen_aio = false;
#endif
P
Paolo Bonzini 已提交
429
    pthread_t client_thread;
430
    const char *fmt = NULL;
431
    Error *local_err = NULL;
B
bellard 已提交
432

P
Paolo Bonzini 已提交
433 434 435
    /* The client thread uses SIGTERM to interrupt the server.  A signal
     * handler ensures that "qemu-nbd -v -c" exits with a nice status code.
     */
P
Paolo Bonzini 已提交
436 437 438 439
    struct sigaction sa_sigterm;
    memset(&sa_sigterm, 0, sizeof(sa_sigterm));
    sa_sigterm.sa_handler = termsig_handler;
    sigaction(SIGTERM, &sa_sigterm, NULL);
440
    qemu_init_exec_dir(argv[0]);
P
Paolo Bonzini 已提交
441

B
bellard 已提交
442 443 444
    while ((ch = getopt_long(argc, argv, sopt, lopt, &opt_ind)) != -1) {
        switch (ch) {
        case 's':
445 446 447
            flags |= BDRV_O_SNAPSHOT;
            break;
        case 'n':
448 449 450 451 452 453 454 455 456 457
            optarg = (char *) "none";
            /* fallthrough */
        case QEMU_NBD_OPT_CACHE:
            if (seen_cache) {
                errx(EXIT_FAILURE, "-n and --cache can only be specified once");
            }
            seen_cache = true;
            if (bdrv_parse_cache_flags(optarg, &flags) == -1) {
                errx(EXIT_FAILURE, "Invalid cache mode `%s'", optarg);
            }
B
bellard 已提交
458
            break;
459 460 461 462 463 464 465 466 467 468 469 470 471 472 473
#ifdef CONFIG_LINUX_AIO
        case QEMU_NBD_OPT_AIO:
            if (seen_aio) {
                errx(EXIT_FAILURE, "--aio can only be specified once");
            }
            seen_aio = true;
            if (!strcmp(optarg, "native")) {
                flags |= BDRV_O_NATIVE_AIO;
            } else if (!strcmp(optarg, "threads")) {
                /* this is the default */
            } else {
               errx(EXIT_FAILURE, "invalid aio mode `%s'", optarg);
            }
            break;
#endif
P
Paolo Bonzini 已提交
474 475 476 477 478 479 480 481 482
        case QEMU_NBD_OPT_DISCARD:
            if (seen_discard) {
                errx(EXIT_FAILURE, "--discard can only be specified once");
            }
            seen_discard = true;
            if (bdrv_parse_discard_flags(optarg, &flags) == -1) {
                errx(EXIT_FAILURE, "Invalid discard mode `%s'", optarg);
            }
            break;
B
bellard 已提交
483 484 485 486 487 488
        case 'b':
            bindto = optarg;
            break;
        case 'p':
            li = strtol(optarg, &end, 0);
            if (*end) {
489
                errx(EXIT_FAILURE, "Invalid port `%s'", optarg);
B
bellard 已提交
490 491
            }
            if (li < 1 || li > 65535) {
492
                errx(EXIT_FAILURE, "Port out of range `%s'", optarg);
B
bellard 已提交
493 494 495 496 497 498
            }
            port = (uint16_t)li;
            break;
        case 'o':
                dev_offset = strtoll (optarg, &end, 0);
            if (*end) {
499
                errx(EXIT_FAILURE, "Invalid offset `%s'", optarg);
B
bellard 已提交
500 501
            }
            if (dev_offset < 0) {
502
                errx(EXIT_FAILURE, "Offset must be positive `%s'", optarg);
B
bellard 已提交
503 504
            }
            break;
505 506 507 508 509 510 511 512 513 514 515
        case 'l':
            if (strstart(optarg, SNAPSHOT_OPT_BASE, NULL)) {
                sn_opts = qemu_opts_parse(&internal_snapshot_opts, optarg, 0);
                if (!sn_opts) {
                    errx(EXIT_FAILURE, "Failed in parsing snapshot param `%s'",
                         optarg);
                }
            } else {
                sn_id_or_name = optarg;
            }
            /* fall through */
B
bellard 已提交
516
        case 'r':
P
Paolo Bonzini 已提交
517
            nbdflags |= NBD_FLAG_READ_ONLY;
N
Naphtali Sprei 已提交
518
            flags &= ~BDRV_O_RDWR;
B
bellard 已提交
519 520 521 522
            break;
        case 'P':
            partition = strtol(optarg, &end, 0);
            if (*end)
523
                errx(EXIT_FAILURE, "Invalid partition `%s'", optarg);
B
bellard 已提交
524
            if (partition < 1 || partition > 8)
525
                errx(EXIT_FAILURE, "Invalid partition %d", partition);
B
bellard 已提交
526
            break;
527
        case 'k':
P
Paolo Bonzini 已提交
528 529
            sockpath = optarg;
            if (sockpath[0] != '/')
530
                errx(EXIT_FAILURE, "socket path must be absolute\n");
531 532 533 534 535 536 537
            break;
        case 'd':
            disconnect = true;
            break;
        case 'c':
            device = optarg;
            break;
538 539 540
        case 'e':
            shared = strtol(optarg, &end, 0);
            if (*end) {
541
                errx(EXIT_FAILURE, "Invalid shared device number '%s'", optarg);
542 543
            }
            if (shared < 1) {
544
                errx(EXIT_FAILURE, "Shared device number must be greater than 0\n");
545 546
            }
            break;
547 548 549
        case 'f':
            fmt = optarg;
            break;
550 551 552
	case 't':
	    persistent = 1;
	    break;
B
bellard 已提交
553 554 555 556 557 558 559 560 561 562 563 564
        case 'v':
            verbose = 1;
            break;
        case 'V':
            version(argv[0]);
            exit(0);
            break;
        case 'h':
            usage(argv[0]);
            exit(0);
            break;
        case '?':
565
            errx(EXIT_FAILURE, "Try `%s --help' for more information.",
B
bellard 已提交
566 567 568 569 570
                 argv[0]);
        }
    }

    if ((argc - optind) != 1) {
571
        errx(EXIT_FAILURE, "Invalid number of argument.\n"
B
bellard 已提交
572 573 574 575
             "Try `%s --help' for more information.",
             argv[0]);
    }

576 577
    if (disconnect) {
        fd = open(argv[optind], O_RDWR);
578
        if (fd < 0) {
R
Ryota Ozaki 已提交
579
            err(EXIT_FAILURE, "Cannot open %s", argv[optind]);
580
        }
581 582 583 584 585 586 587 588 589
        nbd_disconnect(fd);

        close(fd);

        printf("%s disconnected\n", argv[optind]);

	return 0;
    }

590 591 592 593 594
    if (device && !verbose) {
        int stderr_fd[2];
        pid_t pid;
        int ret;

595
        if (qemu_pipe(stderr_fd) < 0) {
596 597 598 599 600 601 602 603 604
            err(EXIT_FAILURE, "Error setting up communication pipe");
        }

        /* Now daemonize, but keep a communication channel open to
         * print errors and exit with the proper status code.
         */
        pid = fork();
        if (pid == 0) {
            close(stderr_fd[0]);
605
            ret = qemu_daemon(1, 0);
606 607 608

            /* Temporarily redirect stderr to the parent's pipe...  */
            dup2(stderr_fd[1], STDERR_FILENO);
609
            if (ret < 0) {
610 611 612 613 614 615 616 617 618 619 620 621 622 623 624 625 626
                err(EXIT_FAILURE, "Failed to daemonize");
            }

            /* ... close the descriptor we inherited and go on.  */
            close(stderr_fd[1]);
        } else {
            bool errors = false;
            char *buf;

            /* In the parent.  Print error messages from the child until
             * it closes the pipe.
             */
            close(stderr_fd[1]);
            buf = g_malloc(1024);
            while ((ret = read(stderr_fd[0], buf, 1024)) > 0) {
                errors = true;
                ret = qemu_write_full(STDERR_FILENO, buf, ret);
627
                if (ret < 0) {
628 629 630
                    exit(EXIT_FAILURE);
                }
            }
631
            if (ret < 0) {
632 633 634 635 636 637 638 639 640 641
                err(EXIT_FAILURE, "Cannot read from daemon");
            }

            /* Usually the daemon should not print any message.
             * Exit with zero status in that case.
             */
            exit(errors);
        }
    }

642 643 644
    if (device != NULL && sockpath == NULL) {
        sockpath = g_malloc(128);
        snprintf(sockpath, 128, SOCKET_PATH, basename(device));
645 646
    }

647
    qemu_init_main_loop();
648 649 650
    bdrv_init();
    atexit(bdrv_close_all);

651 652 653 654 655 656 657 658 659
    if (fmt) {
        drv = bdrv_find_format(fmt);
        if (!drv) {
            errx(EXIT_FAILURE, "Unknown file format '%s'", fmt);
        }
    } else {
        drv = NULL;
    }

660 661
    bs = bdrv_new("hda");
    srcpath = argv[optind];
662
    ret = bdrv_open(&bs, srcpath, NULL, NULL, flags, drv, &local_err);
663
    if (ret < 0) {
664
        errno = -ret;
665 666
        err(EXIT_FAILURE, "Failed to bdrv_open '%s': %s", argv[optind],
            error_get_pretty(local_err));
667 668
    }

669 670 671 672 673 674 675 676 677 678 679 680 681 682 683 684
    if (sn_opts) {
        ret = bdrv_snapshot_load_tmp(bs,
                                     qemu_opt_get(sn_opts, SNAPSHOT_OPT_ID),
                                     qemu_opt_get(sn_opts, SNAPSHOT_OPT_NAME),
                                     &local_err);
    } else if (sn_id_or_name) {
        ret = bdrv_snapshot_load_tmp_by_id_or_name(bs, sn_id_or_name,
                                                   &local_err);
    }
    if (ret < 0) {
        errno = -ret;
        err(EXIT_FAILURE,
            "Failed to load snapshot: %s",
            error_get_pretty(local_err));
    }

P
Paolo Bonzini 已提交
685
    fd_size = bdrv_getlength(bs);
686

687 688 689 690 691 692
    if (partition != -1) {
        ret = find_partition(bs, partition, &dev_offset, &fd_size);
        if (ret < 0) {
            errno = -ret;
            err(EXIT_FAILURE, "Could not find partition %d", partition);
        }
693 694
    }

695
    exp = nbd_export_new(bs, dev_offset, fd_size, nbdflags, nbd_export_closed);
696

P
Paolo Bonzini 已提交
697
    if (sockpath) {
P
Paolo Bonzini 已提交
698
        fd = unix_socket_incoming(sockpath);
699
    } else {
P
Paolo Bonzini 已提交
700
        fd = tcp_socket_incoming(bindto, port);
701 702
    }

703
    if (fd < 0) {
B
bellard 已提交
704
        return 1;
P
Paolo Bonzini 已提交
705
    }
P
Paolo Bonzini 已提交
706 707 708 709

    if (device) {
        int ret;

710
        ret = pthread_create(&client_thread, NULL, nbd_client_thread, device);
P
Paolo Bonzini 已提交
711 712 713 714 715 716 717 718 719
        if (ret != 0) {
            errx(EXIT_FAILURE, "Failed to create client thread: %s",
                 strerror(ret));
        }
    } else {
        /* Shut up GCC warnings.  */
        memset(&client_thread, 0, sizeof(client_thread));
    }

P
Paolo Bonzini 已提交
720 721
    qemu_set_fd_handler2(fd, nbd_can_accept, nbd_accept, NULL,
                         (void *)(uintptr_t)fd);
B
bellard 已提交
722

723 724 725 726 727 728
    /* now when the initialization is (almost) complete, chdir("/")
     * to free any busy filesystems */
    if (chdir("/") < 0) {
        err(EXIT_FAILURE, "Could not chdir to root directory");
    }

729
    state = RUNNING;
730
    do {
P
Paolo Bonzini 已提交
731
        main_loop_wait(false);
732 733 734 735 736 737 738
        if (state == TERMINATE) {
            state = TERMINATING;
            nbd_export_close(exp);
            nbd_export_put(exp);
            exp = NULL;
        }
    } while (state != TERMINATED);
B
bellard 已提交
739

740
    bdrv_close(bs);
P
Paolo Bonzini 已提交
741 742 743
    if (sockpath) {
        unlink(sockpath);
    }
B
bellard 已提交
744

745 746 747 748
    if (sn_opts) {
        qemu_opts_del(sn_opts);
    }

P
Paolo Bonzini 已提交
749 750 751 752 753 754 755
    if (device) {
        void *ret;
        pthread_join(client_thread, &ret);
        exit(ret != NULL);
    } else {
        exit(EXIT_SUCCESS);
    }
B
bellard 已提交
756
}