qemu-nbd.c 20.7 KB
Newer Older
1
/*
 *  Copyright (C) 2005  Anthony Liguori <anthony@codemonkey.ws>
 *
 *  Network Block Device
 *
 *  This program is free software; you can redistribute it and/or modify
 *  it under the terms of the GNU General Public License as published by
 *  the Free Software Foundation; under version 2 of the License.
 *
 *  This program is distributed in the hope that it will be useful,
 *  but WITHOUT ANY WARRANTY; without even the implied warranty of
 *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 *  GNU General Public License for more details.
 *
 *  You should have received a copy of the GNU General Public License
 *  along with this program; if not, see <http://www.gnu.org/licenses/>.
 */

19
#include "qemu-common.h"
20 21
#include "block/block.h"
#include "block/nbd.h"
22
#include "qemu/main-loop.h"
23 24
#include "qemu/sockets.h"
#include "qemu/error-report.h"
25
#include "block/snapshot.h"
B
bellard 已提交
26 27 28 29 30

#include <stdarg.h>
#include <stdio.h>
#include <getopt.h>
#include <err.h>
31
#include <sys/types.h>
B
bellard 已提交
32 33 34 35
#include <sys/socket.h>
#include <netinet/in.h>
#include <netinet/tcp.h>
#include <arpa/inet.h>
36
#include <signal.h>
37
#include <libgen.h>
P
Paolo Bonzini 已提交
38
#include <pthread.h>
39

P
Paolo Bonzini 已提交
40 41 42 43
/* printf-style template for the default unix socket path; the single %s is
 * filled with basename() of the NBD device given to -c/--connect. */
#define SOCKET_PATH          "/var/lock/qemu-nbd-%s"
/* getopt_long() return values for the options that only have a long form. */
#define QEMU_NBD_OPT_CACHE   1
#define QEMU_NBD_OPT_AIO     2
#define QEMU_NBD_OPT_DISCARD 3
B
bellard 已提交
44

P
Paolo Bonzini 已提交
45
/* The export created by main() and handed to every accepted client. */
static NBDExport *exp;
/* Set to 1 by -v/--verbose. */
static int verbose;
/* Image file name taken from the command line (argv[optind]). */
static char *srcpath;
/* Unix socket path: either -k/--socket or generated from SOCKET_PATH. */
static char *sockpath;
/* Set to 1 by -t/--persistent: keep serving after the last client leaves. */
static int persistent;
/* Server life cycle, advanced by the signal handler, the client/export
 * close callbacks and the main loop:
 * RUNNING -> TERMINATE -> TERMINATING -> TERMINATED. */
static enum { RUNNING, TERMINATE, TERMINATING, TERMINATED } state;
/* Maximum number of simultaneous clients (-e/--shared). */
static int shared = 1;
/* Number of clients currently connected. */
static int nb_fds;
B
bellard 已提交
53 54 55

static void usage(const char *name)
{
56
    (printf) (
B
bellard 已提交
57 58 59
"Usage: %s [OPTIONS] FILE\n"
"QEMU Disk Network Block Device Server\n"
"\n"
60 61 62 63
"  -h, --help           display this help and exit\n"
"  -V, --version        output version information and exit\n"
"\n"
"Connection properties:\n"
64
"  -p, --port=PORT      port to listen on (default `%d')\n"
B
bellard 已提交
65
"  -b, --bind=IFACE     interface to bind to (default `0.0.0.0')\n"
66 67
"  -k, --socket=PATH    path to the unix socket\n"
"                       (default '"SOCKET_PATH"')\n"
68
"  -e, --shared=NUM     device can be shared by NUM clients (default '1')\n"
69
"  -t, --persistent     don't exit on the last connection\n"
B
bellard 已提交
70 71
"  -v, --verbose        display extra debugging information\n"
"\n"
72 73 74 75 76 77 78 79 80 81 82 83
"Exposing part of the image:\n"
"  -o, --offset=OFFSET  offset into the image\n"
"  -P, --partition=NUM  only expose partition NUM\n"
"\n"
#ifdef __linux__
"Kernel NBD client support:\n"
"  -c, --connect=DEV    connect FILE to the local NBD device DEV\n"
"  -d, --disconnect     disconnect the specified device\n"
"\n"
#endif
"\n"
"Block device options:\n"
W
Wenchao Xia 已提交
84
"  -f, --format=FORMAT  set image format (raw, qcow2, ...)\n"
85
"  -r, --read-only      export read-only\n"
86 87 88 89 90 91 92 93
"  -s, --snapshot       use FILE as an external snapshot, create a temporary\n"
"                       file with backing_file=FILE, redirect the write to\n"
"                       the temporary one\n"
"  -l, --load-snapshot=SNAPSHOT_PARAM\n"
"                       load an internal snapshot inside FILE and export it\n"
"                       as an read-only device, SNAPSHOT_PARAM format is\n"
"                       'snapshot.id=[ID],snapshot.name=[NAME]', or\n"
"                       '[ID_OR_NAME]'\n"
94
"  -n, --nocache        disable host cache\n"
95 96 97 98
"      --cache=MODE     set cache mode (none, writeback, ...)\n"
#ifdef CONFIG_LINUX_AIO
"      --aio=MODE       set AIO mode (native or threads)\n"
#endif
99 100
"\n"
"Report bugs to <qemu-devel@nongnu.org>\n"
101
    , name, NBD_DEFAULT_PORT, "DEVICE");
B
bellard 已提交
102 103 104 105 106
}

/*
 * Print the version banner and copyright notice to stdout.
 *
 * @name: program name placed at the start of the banner line.
 */
static void version(const char *name)
{
    /* Only the first line depends on the program name. */
    printf("%s version 0.0.1\n", name);

    /* The remainder is fixed text without any conversion specifier. */
    printf(
"Written by Anthony Liguori.\n"
"\n"
"Copyright (C) 2006 Anthony Liguori <anthony@codemonkey.ws>.\n"
"This is free software; see the source for copying conditions.  There is NO\n"
"warranty; not even for MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.\n"
    );
}

/*
 * Decoded form of one 16-byte partition table entry, as filled in by
 * read_partition().
 *
 * Both cylinder fields receive a 10-bit value (8 low bits plus 2 bits taken
 * from the sector byte), so they must be wider than 8 bits.
 */
struct partition_record
{
    uint8_t bootable;
    uint8_t start_head;
    uint32_t start_cylinder;
    uint8_t start_sector;
    uint8_t system;
    uint8_t end_head;
    uint32_t end_cylinder;      /* was uint8_t, which dropped bits 8-9 */
    uint8_t end_sector;
    uint32_t start_sector_abs;
    uint32_t nb_sectors_abs;
};

/*
 * Decode one 16-byte partition table entry.
 *
 * @p: the 16 raw bytes of the entry (read only).
 * @r: record that receives the decoded fields.
 *
 * The cylinder numbers are 10 bits wide: the low 8 bits come from their own
 * byte and the top 2 bits from bits 6-7 of the matching sector byte.  The
 * absolute start sector and sector count are stored little-endian.
 */
static void read_partition(const uint8_t *p, struct partition_record *r)
{
    r->bootable = p[0];
    r->start_head = p[1];
    r->start_cylinder = p[3] | ((p[2] << 2) & 0x0300);
    r->start_sector = p[2] & 0x3f;
    r->system = p[4];
    r->end_head = p[5];
    r->end_cylinder = p[7] | ((p[6] << 2) & 0x300);
    r->end_sector = p[6] & 0x3f;
    /* Widen each byte to uint32_t before shifting: uint8_t promotes to int,
     * and shifting a value >= 0x80 left by 24 overflows a signed int. */
    r->start_sector_abs = (uint32_t)p[8]
                        | (uint32_t)p[9] << 8
                        | (uint32_t)p[10] << 16
                        | (uint32_t)p[11] << 24;
    r->nb_sectors_abs = (uint32_t)p[12]
                      | (uint32_t)p[13] << 8
                      | (uint32_t)p[14] << 16
                      | (uint32_t)p[15] << 24;
}

/*
 * Look up partition number @partition in the partition table stored in
 * sector 0 of @bs.
 *
 * Entries 1-4 are the four slots of the first table.  A slot whose system
 * byte is 0xF or 0x5 is not matched itself; instead the sector it points to
 * is read as a second four-entry table whose slots are numbered from the
 * running base (5-8 for the first such slot).
 *
 * @bs:        block device to read from.
 * @partition: 1-based partition number to find.
 * @offset:    receives the partition start in bytes (sectors << 9).
 * @size:      receives the partition length in bytes (sectors << 9).
 *
 * Returns 0 on success, -EINVAL when sector 0 lacks the 0x55 0xaa
 * signature, and -ENOENT when no matching non-empty entry exists.  A read
 * error terminates the process through err().
 */
static int find_partition(BlockDriverState *bs, int partition,
                          off_t *offset, off_t *size)
{
    struct partition_record primary[4];
    uint8_t boot_sector[512];
    int logical_base = 4;
    int slot;
    int rc;

    rc = bdrv_read(bs, 0, boot_sector, 1);
    if (rc < 0) {
        errno = -rc;
        err(EXIT_FAILURE, "error while reading");
    }

    /* The table is only trusted when the sector carries the signature. */
    if (!(boot_sector[510] == 0x55 && boot_sector[511] == 0xaa)) {
        return -EINVAL;
    }

    for (slot = 0; slot < 4; slot++) {
        struct partition_record *entry = &primary[slot];
        struct partition_record logical[4];
        uint8_t ext_sector[512];
        int sub;

        read_partition(&boot_sector[446 + 16 * slot], entry);

        /* Empty slots are skipped without consuming a number. */
        if (entry->nb_sectors_abs == 0) {
            continue;
        }

        if (entry->system != 0xF && entry->system != 0x5) {
            /* Ordinary entry: match on its 1-based slot number. */
            if (slot + 1 != partition) {
                continue;
            }
            *offset = (uint64_t)entry->start_sector_abs << 9;
            *size = (uint64_t)entry->nb_sectors_abs << 9;
            return 0;
        }

        /* Container entry: scan the table stored at its first sector. */
        rc = bdrv_read(bs, entry->start_sector_abs, ext_sector, 1);
        if (rc < 0) {
            errno = -rc;
            err(EXIT_FAILURE, "error while reading");
        }

        for (sub = 0; sub < 4; sub++) {
            read_partition(&ext_sector[446 + 16 * sub], &logical[sub]);

            if (logical[sub].nb_sectors_abs == 0) {
                continue;
            }
            if (logical_base + sub + 1 != partition) {
                continue;
            }
            *offset = (uint64_t)logical[sub].start_sector_abs << 9;
            *size = (uint64_t)logical[sub].nb_sectors_abs << 9;
            return 0;
        }

        /* Each container reserves four partition numbers. */
        logical_base += 4;
    }

    return -ENOENT;
}

P
Paolo Bonzini 已提交
200 201
static void termsig_handler(int signum)
{
202
    state = TERMINATE;
P
Paolo Bonzini 已提交
203
    qemu_notify_event();
P
Paolo Bonzini 已提交
204 205
}

206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255
/*
 * Format "address:port" into @buf, wrapping the address in square brackets
 * when it contains a colon (i.e. when it is an IPv6 literal).
 *
 * @buf:     destination buffer.
 * @len:     size of @buf in bytes; longer output is truncated by snprintf().
 * @address: host part of the listen address.
 * @port:    port number appended after the colon.
 */
static void combine_addr(char *buf, size_t len, const char* address,
                         uint16_t port)
{
    /* No colon in the address part: plain host or IPv4, no brackets. */
    if (strstr(address, ":") == NULL) {
        snprintf(buf, len, "%s:%u", address, port);
        return;
    }

    /* IPv6 literal: brackets keep its colons apart from the port separator. */
    snprintf(buf, len, "[%s]:%u", address, port);
}

static int tcp_socket_incoming(const char *address, uint16_t port)
{
    char address_and_port[128];
    Error *local_err = NULL;

    combine_addr(address_and_port, 128, address, port);
    int fd = inet_listen(address_and_port, NULL, 0, SOCK_STREAM, 0, &local_err);

    if (local_err != NULL) {
        qerror_report_err(local_err);
        error_free(local_err);
    }
    return fd;
}

static int unix_socket_incoming(const char *path)
{
    Error *local_err = NULL;
    int fd = unix_listen(path, NULL, 0, &local_err);

    if (local_err != NULL) {
        qerror_report_err(local_err);
        error_free(local_err);
    }
    return fd;
}

static int unix_socket_outgoing(const char *path)
{
    Error *local_err = NULL;
    int fd = unix_connect(path, &local_err);

    if (local_err != NULL) {
        qerror_report_err(local_err);
        error_free(local_err);
    }
    return fd;
}

P
Paolo Bonzini 已提交
256
/*
 * Thread entry point: open and immediately close the NBD device node.
 *
 * @arg: path of the device node (a C string).
 *
 * Always returns NULL; a failed open() is ignored.
 */
static void *show_parts(void *arg)
{
    const char *device = arg;
    int nbd;

    /* linux just needs an open() to trigger
     * the partition table update
     * but remember to load the module with max_part != 0 :
     *     modprobe nbd max_part=63
     */
    nbd = open(device, O_RDWR);
    if (nbd < 0) {
        return NULL;
    }

    close(nbd);
    return NULL;
}
272

P
Paolo Bonzini 已提交
273 274
static void *nbd_client_thread(void *arg)
{
275
    char *device = arg;
P
Paolo Bonzini 已提交
276 277 278
    off_t size;
    size_t blocksize;
    uint32_t nbdflags;
279
    int fd, sock;
P
Paolo Bonzini 已提交
280 281 282
    int ret;
    pthread_t show_parts_thread;

283
    sock = unix_socket_outgoing(sockpath);
284
    if (sock < 0) {
285 286
        goto out;
    }
P
Paolo Bonzini 已提交
287 288 289

    ret = nbd_receive_negotiate(sock, NULL, &nbdflags,
                                &size, &blocksize);
290
    if (ret < 0) {
P
Paolo Bonzini 已提交
291 292 293
        goto out;
    }

294
    fd = open(device, O_RDWR);
295
    if (fd < 0) {
296 297 298 299 300
        /* Linux-only, we can use %m in printf.  */
        fprintf(stderr, "Failed to open %s: %m", device);
        goto out;
    }

P
Paolo Bonzini 已提交
301
    ret = nbd_init(fd, sock, nbdflags, size, blocksize);
302
    if (ret < 0) {
P
Paolo Bonzini 已提交
303 304 305 306
        goto out;
    }

    /* update partition table */
307
    pthread_create(&show_parts_thread, NULL, show_parts, device);
P
Paolo Bonzini 已提交
308

309 310 311 312 313 314 315
    if (verbose) {
        fprintf(stderr, "NBD device %s is now connected to %s\n",
                device, srcpath);
    } else {
        /* Close stderr so that the qemu-nbd process exits.  */
        dup2(STDOUT_FILENO, STDERR_FILENO);
    }
P
Paolo Bonzini 已提交
316 317 318 319

    ret = nbd_client(fd);
    if (ret) {
        goto out;
320
    }
P
Paolo Bonzini 已提交
321 322 323 324 325 326 327
    close(fd);
    kill(getpid(), SIGTERM);
    return (void *) EXIT_SUCCESS;

out:
    kill(getpid(), SIGTERM);
    return (void *) EXIT_FAILURE;
328 329
}

P
Paolo Bonzini 已提交
330 331 332 333 334
/*
 * Poll callback registered with the listening socket in main(): returns
 * non-zero while fewer than `shared` clients are connected.
 *
 * @opaque: handler cookie (not used).
 */
static int nbd_can_accept(void *opaque)
{
    (void)opaque;

    return shared > nb_fds;
}

335 336 337 338 339 340
/*
 * Close callback passed to nbd_export_new() in main(): records that the
 * shutdown started by the main loop has finished.
 *
 * @exp: the export being closed (not used; it shadows the file-scope
 *       variable of the same name).
 */
static void nbd_export_closed(NBDExport *exp)
{
    (void)exp;

    /* Only the main loop's TERMINATING step is expected to lead here. */
    assert(state == TERMINATING);
    state = TERMINATED;
}

341
/*
 * Close callback passed to nbd_client_new(): account for the departed
 * client and, unless -t/--persistent was given, request termination once
 * the last client is gone.
 *
 * @client: the client that was closed; its reference is dropped here.
 */
static void nbd_client_closed(NBDClient *client)
{
    bool last_client_gone;

    nb_fds--;
    last_client_gone = (nb_fds == 0);

    /* Do not overwrite a shutdown that is already in progress. */
    if (last_client_gone && state == RUNNING && !persistent) {
        state = TERMINATE;
    }

    /* Wake the main loop so it re-evaluates state and nbd_can_accept(). */
    qemu_notify_event();
    nbd_client_put(client);
}

static void nbd_accept(void *opaque)
{
    int server_fd = (uintptr_t) opaque;
    struct sockaddr_in addr;
    socklen_t addr_len = sizeof(addr);

    int fd = accept(server_fd, (struct sockaddr *)&addr, &addr_len);
358 359 360 361 362
    if (state >= TERMINATE) {
        close(fd);
        return;
    }

363
    if (fd >= 0 && nbd_client_new(exp, fd, nbd_client_closed)) {
P
Paolo Bonzini 已提交
364 365 366 367
        nb_fds++;
    }
}

B
bellard 已提交
368 369 370
int main(int argc, char **argv)
{
    BlockDriverState *bs;
371
    BlockDriver *drv;
B
bellard 已提交
372
    off_t dev_offset = 0;
P
Paolo Bonzini 已提交
373
    uint32_t nbdflags = 0;
374
    bool disconnect = false;
B
bellard 已提交
375
    const char *bindto = "0.0.0.0";
376
    char *device = NULL;
377
    int port = NBD_DEFAULT_PORT;
B
bellard 已提交
378
    off_t fd_size;
379 380 381
    QemuOpts *sn_opts = NULL;
    const char *sn_id_or_name = NULL;
    const char *sopt = "hVb:o:p:rsnP:c:dvk:e:f:tl:";
B
bellard 已提交
382
    struct option lopt[] = {
383 384 385 386 387 388 389 390 391 392 393
        { "help", 0, NULL, 'h' },
        { "version", 0, NULL, 'V' },
        { "bind", 1, NULL, 'b' },
        { "port", 1, NULL, 'p' },
        { "socket", 1, NULL, 'k' },
        { "offset", 1, NULL, 'o' },
        { "read-only", 0, NULL, 'r' },
        { "partition", 1, NULL, 'P' },
        { "connect", 1, NULL, 'c' },
        { "disconnect", 0, NULL, 'd' },
        { "snapshot", 0, NULL, 's' },
394
        { "load-snapshot", 1, NULL, 'l' },
395
        { "nocache", 0, NULL, 'n' },
396 397 398 399
        { "cache", 1, NULL, QEMU_NBD_OPT_CACHE },
#ifdef CONFIG_LINUX_AIO
        { "aio", 1, NULL, QEMU_NBD_OPT_AIO },
#endif
P
Paolo Bonzini 已提交
400
        { "discard", 1, NULL, QEMU_NBD_OPT_DISCARD },
401
        { "shared", 1, NULL, 'e' },
402
        { "format", 1, NULL, 'f' },
403 404 405
        { "persistent", 0, NULL, 't' },
        { "verbose", 0, NULL, 'v' },
        { NULL, 0, NULL, 0 }
B
bellard 已提交
406 407 408 409 410
    };
    int ch;
    int opt_ind = 0;
    int li;
    char *end;
411
    int flags = BDRV_O_RDWR;
B
bellard 已提交
412
    int partition = -1;
413
    int ret;
414
    int fd;
415
    bool seen_cache = false;
P
Paolo Bonzini 已提交
416
    bool seen_discard = false;
417 418 419
#ifdef CONFIG_LINUX_AIO
    bool seen_aio = false;
#endif
P
Paolo Bonzini 已提交
420
    pthread_t client_thread;
421
    const char *fmt = NULL;
422
    Error *local_err = NULL;
B
bellard 已提交
423

P
Paolo Bonzini 已提交
424 425 426
    /* The client thread uses SIGTERM to interrupt the server.  A signal
     * handler ensures that "qemu-nbd -v -c" exits with a nice status code.
     */
P
Paolo Bonzini 已提交
427 428 429 430
    struct sigaction sa_sigterm;
    memset(&sa_sigterm, 0, sizeof(sa_sigterm));
    sa_sigterm.sa_handler = termsig_handler;
    sigaction(SIGTERM, &sa_sigterm, NULL);
431
    qemu_init_exec_dir(argv[0]);
P
Paolo Bonzini 已提交
432

B
bellard 已提交
433 434 435
    while ((ch = getopt_long(argc, argv, sopt, lopt, &opt_ind)) != -1) {
        switch (ch) {
        case 's':
436 437 438
            flags |= BDRV_O_SNAPSHOT;
            break;
        case 'n':
439 440 441 442 443 444 445 446 447 448
            optarg = (char *) "none";
            /* fallthrough */
        case QEMU_NBD_OPT_CACHE:
            if (seen_cache) {
                errx(EXIT_FAILURE, "-n and --cache can only be specified once");
            }
            seen_cache = true;
            if (bdrv_parse_cache_flags(optarg, &flags) == -1) {
                errx(EXIT_FAILURE, "Invalid cache mode `%s'", optarg);
            }
B
bellard 已提交
449
            break;
450 451 452 453 454 455 456 457 458 459 460 461 462 463 464
#ifdef CONFIG_LINUX_AIO
        case QEMU_NBD_OPT_AIO:
            if (seen_aio) {
                errx(EXIT_FAILURE, "--aio can only be specified once");
            }
            seen_aio = true;
            if (!strcmp(optarg, "native")) {
                flags |= BDRV_O_NATIVE_AIO;
            } else if (!strcmp(optarg, "threads")) {
                /* this is the default */
            } else {
               errx(EXIT_FAILURE, "invalid aio mode `%s'", optarg);
            }
            break;
#endif
P
Paolo Bonzini 已提交
465 466 467 468 469 470 471 472 473
        case QEMU_NBD_OPT_DISCARD:
            if (seen_discard) {
                errx(EXIT_FAILURE, "--discard can only be specified once");
            }
            seen_discard = true;
            if (bdrv_parse_discard_flags(optarg, &flags) == -1) {
                errx(EXIT_FAILURE, "Invalid discard mode `%s'", optarg);
            }
            break;
B
bellard 已提交
474 475 476 477 478 479
        case 'b':
            bindto = optarg;
            break;
        case 'p':
            li = strtol(optarg, &end, 0);
            if (*end) {
480
                errx(EXIT_FAILURE, "Invalid port `%s'", optarg);
B
bellard 已提交
481 482
            }
            if (li < 1 || li > 65535) {
483
                errx(EXIT_FAILURE, "Port out of range `%s'", optarg);
B
bellard 已提交
484 485 486 487 488 489
            }
            port = (uint16_t)li;
            break;
        case 'o':
                dev_offset = strtoll (optarg, &end, 0);
            if (*end) {
490
                errx(EXIT_FAILURE, "Invalid offset `%s'", optarg);
B
bellard 已提交
491 492
            }
            if (dev_offset < 0) {
493
                errx(EXIT_FAILURE, "Offset must be positive `%s'", optarg);
B
bellard 已提交
494 495
            }
            break;
496 497 498 499 500 501 502 503 504 505 506
        case 'l':
            if (strstart(optarg, SNAPSHOT_OPT_BASE, NULL)) {
                sn_opts = qemu_opts_parse(&internal_snapshot_opts, optarg, 0);
                if (!sn_opts) {
                    errx(EXIT_FAILURE, "Failed in parsing snapshot param `%s'",
                         optarg);
                }
            } else {
                sn_id_or_name = optarg;
            }
            /* fall through */
B
bellard 已提交
507
        case 'r':
P
Paolo Bonzini 已提交
508
            nbdflags |= NBD_FLAG_READ_ONLY;
N
Naphtali Sprei 已提交
509
            flags &= ~BDRV_O_RDWR;
B
bellard 已提交
510 511 512 513
            break;
        case 'P':
            partition = strtol(optarg, &end, 0);
            if (*end)
514
                errx(EXIT_FAILURE, "Invalid partition `%s'", optarg);
B
bellard 已提交
515
            if (partition < 1 || partition > 8)
516
                errx(EXIT_FAILURE, "Invalid partition %d", partition);
B
bellard 已提交
517
            break;
518
        case 'k':
P
Paolo Bonzini 已提交
519 520
            sockpath = optarg;
            if (sockpath[0] != '/')
521
                errx(EXIT_FAILURE, "socket path must be absolute\n");
522 523 524 525 526 527 528
            break;
        case 'd':
            disconnect = true;
            break;
        case 'c':
            device = optarg;
            break;
529 530 531
        case 'e':
            shared = strtol(optarg, &end, 0);
            if (*end) {
532
                errx(EXIT_FAILURE, "Invalid shared device number '%s'", optarg);
533 534
            }
            if (shared < 1) {
535
                errx(EXIT_FAILURE, "Shared device number must be greater than 0\n");
536 537
            }
            break;
538 539 540
        case 'f':
            fmt = optarg;
            break;
541 542 543
	case 't':
	    persistent = 1;
	    break;
B
bellard 已提交
544 545 546 547 548 549 550 551 552 553 554 555
        case 'v':
            verbose = 1;
            break;
        case 'V':
            version(argv[0]);
            exit(0);
            break;
        case 'h':
            usage(argv[0]);
            exit(0);
            break;
        case '?':
556
            errx(EXIT_FAILURE, "Try `%s --help' for more information.",
B
bellard 已提交
557 558 559 560 561
                 argv[0]);
        }
    }

    if ((argc - optind) != 1) {
562
        errx(EXIT_FAILURE, "Invalid number of argument.\n"
B
bellard 已提交
563 564 565 566
             "Try `%s --help' for more information.",
             argv[0]);
    }

567 568
    if (disconnect) {
        fd = open(argv[optind], O_RDWR);
569
        if (fd < 0) {
R
Ryota Ozaki 已提交
570
            err(EXIT_FAILURE, "Cannot open %s", argv[optind]);
571
        }
572 573 574 575 576 577 578 579 580
        nbd_disconnect(fd);

        close(fd);

        printf("%s disconnected\n", argv[optind]);

	return 0;
    }

581 582 583 584 585
    if (device && !verbose) {
        int stderr_fd[2];
        pid_t pid;
        int ret;

586
        if (qemu_pipe(stderr_fd) < 0) {
587 588 589 590 591 592 593 594 595
            err(EXIT_FAILURE, "Error setting up communication pipe");
        }

        /* Now daemonize, but keep a communication channel open to
         * print errors and exit with the proper status code.
         */
        pid = fork();
        if (pid == 0) {
            close(stderr_fd[0]);
596
            ret = qemu_daemon(1, 0);
597 598 599

            /* Temporarily redirect stderr to the parent's pipe...  */
            dup2(stderr_fd[1], STDERR_FILENO);
600
            if (ret < 0) {
601 602 603 604 605 606 607 608 609 610 611 612 613 614 615 616 617
                err(EXIT_FAILURE, "Failed to daemonize");
            }

            /* ... close the descriptor we inherited and go on.  */
            close(stderr_fd[1]);
        } else {
            bool errors = false;
            char *buf;

            /* In the parent.  Print error messages from the child until
             * it closes the pipe.
             */
            close(stderr_fd[1]);
            buf = g_malloc(1024);
            while ((ret = read(stderr_fd[0], buf, 1024)) > 0) {
                errors = true;
                ret = qemu_write_full(STDERR_FILENO, buf, ret);
618
                if (ret < 0) {
619 620 621
                    exit(EXIT_FAILURE);
                }
            }
622
            if (ret < 0) {
623 624 625 626 627 628 629 630 631 632
                err(EXIT_FAILURE, "Cannot read from daemon");
            }

            /* Usually the daemon should not print any message.
             * Exit with zero status in that case.
             */
            exit(errors);
        }
    }

633 634 635
    if (device != NULL && sockpath == NULL) {
        sockpath = g_malloc(128);
        snprintf(sockpath, 128, SOCKET_PATH, basename(device));
636 637
    }

638
    qemu_init_main_loop();
639 640 641
    bdrv_init();
    atexit(bdrv_close_all);

642 643 644 645 646 647 648 649 650
    if (fmt) {
        drv = bdrv_find_format(fmt);
        if (!drv) {
            errx(EXIT_FAILURE, "Unknown file format '%s'", fmt);
        }
    } else {
        drv = NULL;
    }

651 652
    bs = bdrv_new("hda");
    srcpath = argv[optind];
653
    ret = bdrv_open(&bs, srcpath, NULL, NULL, flags, drv, &local_err);
654
    if (ret < 0) {
655
        errno = -ret;
656 657
        err(EXIT_FAILURE, "Failed to bdrv_open '%s': %s", argv[optind],
            error_get_pretty(local_err));
658 659
    }

660 661 662 663 664 665 666 667 668 669 670 671 672 673 674 675
    if (sn_opts) {
        ret = bdrv_snapshot_load_tmp(bs,
                                     qemu_opt_get(sn_opts, SNAPSHOT_OPT_ID),
                                     qemu_opt_get(sn_opts, SNAPSHOT_OPT_NAME),
                                     &local_err);
    } else if (sn_id_or_name) {
        ret = bdrv_snapshot_load_tmp_by_id_or_name(bs, sn_id_or_name,
                                                   &local_err);
    }
    if (ret < 0) {
        errno = -ret;
        err(EXIT_FAILURE,
            "Failed to load snapshot: %s",
            error_get_pretty(local_err));
    }

P
Paolo Bonzini 已提交
676
    fd_size = bdrv_getlength(bs);
677

678 679 680 681 682 683
    if (partition != -1) {
        ret = find_partition(bs, partition, &dev_offset, &fd_size);
        if (ret < 0) {
            errno = -ret;
            err(EXIT_FAILURE, "Could not find partition %d", partition);
        }
684 685
    }

686
    exp = nbd_export_new(bs, dev_offset, fd_size, nbdflags, nbd_export_closed);
687

P
Paolo Bonzini 已提交
688
    if (sockpath) {
P
Paolo Bonzini 已提交
689
        fd = unix_socket_incoming(sockpath);
690
    } else {
P
Paolo Bonzini 已提交
691
        fd = tcp_socket_incoming(bindto, port);
692 693
    }

694
    if (fd < 0) {
B
bellard 已提交
695
        return 1;
P
Paolo Bonzini 已提交
696
    }
P
Paolo Bonzini 已提交
697 698 699 700

    if (device) {
        int ret;

701
        ret = pthread_create(&client_thread, NULL, nbd_client_thread, device);
P
Paolo Bonzini 已提交
702 703 704 705 706 707 708 709 710
        if (ret != 0) {
            errx(EXIT_FAILURE, "Failed to create client thread: %s",
                 strerror(ret));
        }
    } else {
        /* Shut up GCC warnings.  */
        memset(&client_thread, 0, sizeof(client_thread));
    }

P
Paolo Bonzini 已提交
711 712
    qemu_set_fd_handler2(fd, nbd_can_accept, nbd_accept, NULL,
                         (void *)(uintptr_t)fd);
B
bellard 已提交
713

714 715 716 717 718 719
    /* now when the initialization is (almost) complete, chdir("/")
     * to free any busy filesystems */
    if (chdir("/") < 0) {
        err(EXIT_FAILURE, "Could not chdir to root directory");
    }

720
    state = RUNNING;
721
    do {
P
Paolo Bonzini 已提交
722
        main_loop_wait(false);
723 724 725 726 727 728 729
        if (state == TERMINATE) {
            state = TERMINATING;
            nbd_export_close(exp);
            nbd_export_put(exp);
            exp = NULL;
        }
    } while (state != TERMINATED);
B
bellard 已提交
730

731
    bdrv_close(bs);
P
Paolo Bonzini 已提交
732 733 734
    if (sockpath) {
        unlink(sockpath);
    }
B
bellard 已提交
735

736 737 738 739
    if (sn_opts) {
        qemu_opts_del(sn_opts);
    }

P
Paolo Bonzini 已提交
740 741 742 743 744 745 746
    if (device) {
        void *ret;
        pthread_join(client_thread, &ret);
        exit(ret != NULL);
    } else {
        exit(EXIT_SUCCESS);
    }
B
bellard 已提交
747
}