nbd.c 31.0 KB
Newer Older
1
/*
B
bellard 已提交
2 3 4 5 6 7 8 9 10 11 12 13 14 15
 *  Copyright (C) 2005  Anthony Liguori <anthony@codemonkey.ws>
 *
 *  Network Block Device
 *
 *  This program is free software; you can redistribute it and/or modify
 *  it under the terms of the GNU General Public License as published by
 *  the Free Software Foundation; under version 2 of the License.
 *
 *  This program is distributed in the hope that it will be useful,
 *  but WITHOUT ANY WARRANTY; without even the implied warranty of
 *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 *  GNU General Public License for more details.
 *
 *  You should have received a copy of the GNU General Public License
16
 *  along with this program; if not, see <http://www.gnu.org/licenses/>.
17
 */
B
bellard 已提交
18

19 20
#include "block/nbd.h"
#include "block/block.h"
B
bellard 已提交
21

22
#include "block/coroutine.h"
P
Paolo Bonzini 已提交
23

B
bellard 已提交
24 25
#include <errno.h>
#include <string.h>
26
#ifndef _WIN32
B
bellard 已提交
27
#include <sys/ioctl.h>
28
#endif
29
#if defined(__sun__) || defined(__HAIKU__)
30 31
#include <sys/ioccom.h>
#endif
B
bellard 已提交
32 33
#include <ctype.h>
#include <inttypes.h>
34

P
Paolo Bonzini 已提交
35 36 37 38
#ifdef __linux__
#include <linux/fs.h>
#endif

39
#include "qemu_socket.h"
P
Paolo Bonzini 已提交
40
#include "qemu-queue.h"
41 42 43 44

//#define DEBUG_NBD

#ifdef DEBUG_NBD
45
#define TRACE(msg, ...) do { \
46
    LOG(msg, ## __VA_ARGS__); \
47
} while(0)
48 49 50 51
#else
#define TRACE(msg, ...) \
    do { } while (0)
#endif
B
bellard 已提交
52 53 54 55 56 57 58 59

#define LOG(msg, ...) do { \
    fprintf(stderr, "%s:%s():L%d: " msg "\n", \
            __FILE__, __FUNCTION__, __LINE__, ## __VA_ARGS__); \
} while(0)

/* This is all part of the "official" NBD API */

P
Paolo Bonzini 已提交
60
#define NBD_REQUEST_SIZE        (4 + 4 + 8 + 8 + 4)
N
Nick Thomas 已提交
61
#define NBD_REPLY_SIZE          (4 + 4 + 8)
B
bellard 已提交
62 63
#define NBD_REQUEST_MAGIC       0x25609513
#define NBD_REPLY_MAGIC         0x67446698
P
Paolo Bonzini 已提交
64 65
#define NBD_OPTS_MAGIC          0x49484156454F5054LL
#define NBD_CLIENT_MAGIC        0x0000420281861253LL
B
bellard 已提交
66 67 68 69 70 71 72

#define NBD_SET_SOCK            _IO(0xab, 0)
#define NBD_SET_BLKSIZE         _IO(0xab, 1)
#define NBD_SET_SIZE            _IO(0xab, 2)
#define NBD_DO_IT               _IO(0xab, 3)
#define NBD_CLEAR_SOCK          _IO(0xab, 4)
#define NBD_CLEAR_QUE           _IO(0xab, 5)
N
Nick Thomas 已提交
73 74
#define NBD_PRINT_DEBUG         _IO(0xab, 6)
#define NBD_SET_SIZE_BLOCKS     _IO(0xab, 7)
B
bellard 已提交
75
#define NBD_DISCONNECT          _IO(0xab, 8)
76 77
#define NBD_SET_TIMEOUT         _IO(0xab, 9)
#define NBD_SET_FLAGS           _IO(0xab, 10)
B
bellard 已提交
78

N
Nick Thomas 已提交
79
#define NBD_OPT_EXPORT_NAME     (1 << 0)
80

81 82 83 84 85 86 87 88 89 90 91
/* Definitions for opaque data types */

typedef struct NBDRequest NBDRequest;

struct NBDRequest {
    QSIMPLEQ_ENTRY(NBDRequest) entry;
    NBDClient *client;
    uint8_t *data;
};

struct NBDExport {
92
    int refcount;
93 94
    void (*close)(NBDExport *exp);

95
    BlockDriverState *bs;
P
Paolo Bonzini 已提交
96
    char *name;
97 98 99
    off_t dev_offset;
    off_t size;
    uint32_t nbdflags;
100
    QTAILQ_HEAD(, NBDClient) clients;
101
    QSIMPLEQ_HEAD(, NBDRequest) requests;
P
Paolo Bonzini 已提交
102
    QTAILQ_ENTRY(NBDExport) next;
103 104
};

P
Paolo Bonzini 已提交
105 106
static QTAILQ_HEAD(, NBDExport) exports = QTAILQ_HEAD_INITIALIZER(exports);

107 108 109 110 111 112 113 114 115 116 117 118
struct NBDClient {
    int refcount;
    void (*close)(NBDClient *client);

    NBDExport *exp;
    int sock;

    Coroutine *recv_coroutine;

    CoMutex send_lock;
    Coroutine *send_coroutine;

119
    QTAILQ_ENTRY(NBDClient) next;
120
    int nb_requests;
121
    bool closing;
122 123
};

B
bellard 已提交
124 125
/* That's all folks */

126
ssize_t nbd_wr_sync(int fd, void *buffer, size_t size, bool do_read)
B
bellard 已提交
127 128
{
    size_t offset = 0;
129
    int err;
B
bellard 已提交
130

131 132 133 134 135 136 137 138
    if (qemu_in_coroutine()) {
        if (do_read) {
            return qemu_co_recv(fd, buffer, size);
        } else {
            return qemu_co_send(fd, buffer, size);
        }
    }

B
bellard 已提交
139 140 141 142
    while (offset < size) {
        ssize_t len;

        if (do_read) {
B
Blue Swirl 已提交
143
            len = qemu_recv(fd, buffer + offset, size - offset, 0);
B
bellard 已提交
144
        } else {
145
            len = send(fd, buffer + offset, size - offset, 0);
B
bellard 已提交
146 147
        }

148
        if (len < 0) {
149
            err = socket_error();
150

151
            /* recoverable error */
152
            if (err == EINTR || (offset > 0 && err == EAGAIN)) {
153 154 155 156
                continue;
            }

            /* unrecoverable error */
157
            return -err;
B
bellard 已提交
158 159 160 161 162 163 164 165 166 167 168 169 170
        }

        /* eof */
        if (len == 0) {
            break;
        }

        offset += len;
    }

    return offset;
}

171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190
static ssize_t read_sync(int fd, void *buffer, size_t size)
{
    /* Sockets are kept in blocking mode in the negotiation phase.  After
     * that, a non-readable socket simply means that another thread stole
     * our request/reply.  Synchronization is done with recv_coroutine, so
     * that this is coroutine-safe.
     */
    return nbd_wr_sync(fd, buffer, size, true);
}

static ssize_t write_sync(int fd, void *buffer, size_t size)
{
    int ret;
    do {
        /* For writes, we do expect the socket to be writable.  */
        ret = nbd_wr_sync(fd, buffer, size, false);
    } while (ret == -EAGAIN);
    return ret;
}

191 192
static void combine_addr(char *buf, size_t len, const char* address,
                         uint16_t port)
B
bellard 已提交
193
{
194 195 196 197 198
    /* If the address-part contains a colon, it's an IPv6 IP so needs [] */
    if (strstr(address, ":")) {
        snprintf(buf, len, "[%s]:%u", address, port);
    } else {
        snprintf(buf, len, "%s:%u", address, port);
B
bellard 已提交
199 200 201
    }
}

202
int tcp_socket_outgoing(const char *address, uint16_t port)
B
bellard 已提交
203
{
204 205 206
    char address_and_port[128];
    combine_addr(address_and_port, 128, address, port);
    return tcp_socket_outgoing_spec(address_and_port);
B
bellard 已提交
207 208
}

209
int tcp_socket_outgoing_spec(const char *address_and_port)
210
{
211 212 213 214 215 216 217 218
    Error *local_err = NULL;
    int fd = inet_connect(address_and_port, &local_err);

    if (local_err != NULL) {
        qerror_report_err(local_err);
        error_free(local_err);
    }
    return fd;
219 220
}

221
int tcp_socket_incoming(const char *address, uint16_t port)
222
{
223 224 225 226
    char address_and_port[128];
    combine_addr(address_and_port, 128, address, port);
    return tcp_socket_incoming_spec(address_and_port);
}
227

228 229
int tcp_socket_incoming_spec(const char *address_and_port)
{
230 231 232 233 234 235 236 237
    Error *local_err = NULL;
    int fd = inet_listen(address_and_port, NULL, 0, SOCK_STREAM, 0, &local_err);

    if (local_err != NULL) {
        qerror_report_err(local_err);
        error_free(local_err);
    }
    return fd;
238
}
239

240 241
int unix_socket_incoming(const char *path)
{
242 243
    Error *local_err = NULL;
    int fd = unix_listen(path, NULL, 0, &local_err);
244

245 246 247 248 249
    if (local_err != NULL) {
        qerror_report_err(local_err);
        error_free(local_err);
    }
    return fd;
250 251
}

252 253
int unix_socket_outgoing(const char *path)
{
254 255 256 257 258 259 260 261
    Error *local_err = NULL;
    int fd = unix_connect(path, &local_err);

    if (local_err != NULL) {
        qerror_report_err(local_err);
        error_free(local_err);
    }
    return fd;
262
}
263

264
/* Basic flow for negotiation
B
bellard 已提交
265 266 267

   Server         Client
   Negotiate
268 269 270 271 272 273 274 275 276 277 278 279 280

   or

   Server         Client
   Negotiate #1
                  Option
   Negotiate #2

   ----

   followed by

   Server         Client
B
bellard 已提交
281 282 283 284 285 286 287
                  Request
   Response
                  Request
   Response
                  ...
   ...
                  Request (type == 2)
288

B
bellard 已提交
289 290
*/

291 292 293 294 295 296 297 298 299 300 301 302 303 304 305 306 307 308 309 310 311 312 313 314 315 316 317 318 319 320 321 322 323 324 325 326 327 328 329 330 331 332 333 334 335 336 337 338 339 340 341 342 343 344 345 346 347 348 349 350 351 352 353 354 355 356 357 358 359 360 361 362 363 364 365 366 367 368
static int nbd_receive_options(NBDClient *client)
{
    int csock = client->sock;
    char name[256];
    uint32_t tmp, length;
    uint64_t magic;
    int rc;

    /* Client sends:
        [ 0 ..   3]   reserved (0)
        [ 4 ..  11]   NBD_OPTS_MAGIC
        [12 ..  15]   NBD_OPT_EXPORT_NAME
        [16 ..  19]   length
        [20 ..  xx]   export name (length bytes)
     */

    rc = -EINVAL;
    if (read_sync(csock, &tmp, sizeof(tmp)) != sizeof(tmp)) {
        LOG("read failed");
        goto fail;
    }
    TRACE("Checking reserved");
    if (tmp != 0) {
        LOG("Bad reserved received");
        goto fail;
    }

    if (read_sync(csock, &magic, sizeof(magic)) != sizeof(magic)) {
        LOG("read failed");
        goto fail;
    }
    TRACE("Checking reserved");
    if (magic != be64_to_cpu(NBD_OPTS_MAGIC)) {
        LOG("Bad magic received");
        goto fail;
    }

    if (read_sync(csock, &tmp, sizeof(tmp)) != sizeof(tmp)) {
        LOG("read failed");
        goto fail;
    }
    TRACE("Checking option");
    if (tmp != be32_to_cpu(NBD_OPT_EXPORT_NAME)) {
        LOG("Bad option received");
        goto fail;
    }

    if (read_sync(csock, &length, sizeof(length)) != sizeof(length)) {
        LOG("read failed");
        goto fail;
    }
    TRACE("Checking length");
    length = be32_to_cpu(length);
    if (length > 255) {
        LOG("Bad length received");
        goto fail;
    }
    if (read_sync(csock, name, length) != length) {
        LOG("read failed");
        goto fail;
    }
    name[length] = '\0';

    client->exp = nbd_export_find(name);
    if (!client->exp) {
        LOG("export not found");
        goto fail;
    }

    QTAILQ_INSERT_TAIL(&client->exp->clients, client, next);
    nbd_export_get(client->exp);

    TRACE("Option negotiation succeeded.");
    rc = 0;
fail:
    return rc;
}

369
static int nbd_send_negotiate(NBDClient *client)
B
bellard 已提交
370
{
371
    int csock = client->sock;
N
Nick Thomas 已提交
372
    char buf[8 + 8 + 8 + 128];
373
    int rc;
374 375
    const int myflags = (NBD_FLAG_HAS_FLAGS | NBD_FLAG_SEND_TRIM |
                         NBD_FLAG_SEND_FLUSH | NBD_FLAG_SEND_FUA);
N
Nick Thomas 已提交
376

377 378 379
    /* Negotiation header without options:
        [ 0 ..   7]   passwd       ("NBDMAGIC")
        [ 8 ..  15]   magic        (NBD_CLIENT_MAGIC)
N
Nick Thomas 已提交
380
        [16 ..  23]   size
381 382 383 384 385 386 387 388 389 390 391 392 393
        [24 ..  25]   server flags (0)
        [24 ..  27]   export flags
        [28 .. 151]   reserved     (0)

       Negotiation header with options, part 1:
        [ 0 ..   7]   passwd       ("NBDMAGIC")
        [ 8 ..  15]   magic        (NBD_OPTS_MAGIC)
        [16 ..  17]   server flags (0)

       part 2 (after options are sent):
        [18 ..  25]   size
        [26 ..  27]   export flags
        [28 .. 151]   reserved     (0)
N
Nick Thomas 已提交
394 395
     */

396
    socket_set_block(csock);
397 398
    rc = -EINVAL;

N
Nick Thomas 已提交
399
    TRACE("Beginning negotiation.");
400
    memset(buf, 0, sizeof(buf));
N
Nick Thomas 已提交
401
    memcpy(buf, "NBDMAGIC", 8);
402 403 404 405 406 407 408 409
    if (client->exp) {
        assert ((client->exp->nbdflags & ~65535) == 0);
        cpu_to_be64w((uint64_t*)(buf + 8), NBD_CLIENT_MAGIC);
        cpu_to_be64w((uint64_t*)(buf + 16), client->exp->size);
        cpu_to_be16w((uint16_t*)(buf + 26), client->exp->nbdflags | myflags);
    } else {
        cpu_to_be64w((uint64_t*)(buf + 8), NBD_OPTS_MAGIC);
    }
N
Nick Thomas 已提交
410

411 412 413 414 415 416 417 418 419 420 421 422 423 424 425 426 427 428 429 430 431 432 433
    if (client->exp) {
        if (write_sync(csock, buf, sizeof(buf)) != sizeof(buf)) {
            LOG("write failed");
            goto fail;
        }
    } else {
        if (write_sync(csock, buf, 18) != 18) {
            LOG("write failed");
            goto fail;
        }
        rc = nbd_receive_options(client);
        if (rc < 0) {
            LOG("option negotiation failed");
            goto fail;
        }

        assert ((client->exp->nbdflags & ~65535) == 0);
        cpu_to_be64w((uint64_t*)(buf + 18), client->exp->size);
        cpu_to_be16w((uint16_t*)(buf + 26), client->exp->nbdflags | myflags);
        if (write_sync(csock, buf + 18, sizeof(buf) - 18) != sizeof(buf) - 18) {
            LOG("write failed");
            goto fail;
        }
N
Nick Thomas 已提交
434 435
    }

D
Dong Xu Wang 已提交
436
    TRACE("Negotiation succeeded.");
437 438
    rc = 0;
fail:
439
    socket_set_nonblock(csock);
440
    return rc;
B
bellard 已提交
441 442
}

443 444
int nbd_receive_negotiate(int csock, const char *name, uint32_t *flags,
                          off_t *size, size_t *blocksize)
B
bellard 已提交
445
{
N
Nick Thomas 已提交
446 447 448
    char buf[256];
    uint64_t magic, s;
    uint16_t tmp;
449
    int rc;
N
Nick Thomas 已提交
450

D
Dong Xu Wang 已提交
451
    TRACE("Receiving negotiation.");
N
Nick Thomas 已提交
452

453
    socket_set_block(csock);
454 455
    rc = -EINVAL;

N
Nick Thomas 已提交
456 457
    if (read_sync(csock, buf, 8) != 8) {
        LOG("read failed");
458
        goto fail;
N
Nick Thomas 已提交
459 460 461 462 463
    }

    buf[8] = '\0';
    if (strlen(buf) == 0) {
        LOG("server connection closed");
464
        goto fail;
N
Nick Thomas 已提交
465 466 467 468 469 470 471 472 473 474 475 476 477 478
    }

    TRACE("Magic is %c%c%c%c%c%c%c%c",
          qemu_isprint(buf[0]) ? buf[0] : '.',
          qemu_isprint(buf[1]) ? buf[1] : '.',
          qemu_isprint(buf[2]) ? buf[2] : '.',
          qemu_isprint(buf[3]) ? buf[3] : '.',
          qemu_isprint(buf[4]) ? buf[4] : '.',
          qemu_isprint(buf[5]) ? buf[5] : '.',
          qemu_isprint(buf[6]) ? buf[6] : '.',
          qemu_isprint(buf[7]) ? buf[7] : '.');

    if (memcmp(buf, "NBDMAGIC", 8) != 0) {
        LOG("Invalid magic received");
479
        goto fail;
N
Nick Thomas 已提交
480 481 482 483
    }

    if (read_sync(csock, &magic, sizeof(magic)) != sizeof(magic)) {
        LOG("read failed");
484
        goto fail;
N
Nick Thomas 已提交
485 486 487 488 489 490 491 492 493 494
    }
    magic = be64_to_cpu(magic);
    TRACE("Magic is 0x%" PRIx64, magic);

    if (name) {
        uint32_t reserved = 0;
        uint32_t opt;
        uint32_t namesize;

        TRACE("Checking magic (opts_magic)");
P
Paolo Bonzini 已提交
495
        if (magic != NBD_OPTS_MAGIC) {
N
Nick Thomas 已提交
496
            LOG("Bad magic received");
497
            goto fail;
N
Nick Thomas 已提交
498 499 500
        }
        if (read_sync(csock, &tmp, sizeof(tmp)) != sizeof(tmp)) {
            LOG("flags read failed");
501
            goto fail;
N
Nick Thomas 已提交
502 503 504 505 506 507
        }
        *flags = be16_to_cpu(tmp) << 16;
        /* reserved for future use */
        if (write_sync(csock, &reserved, sizeof(reserved)) !=
            sizeof(reserved)) {
            LOG("write failed (reserved)");
508
            goto fail;
N
Nick Thomas 已提交
509 510 511 512 513
        }
        /* write the export name */
        magic = cpu_to_be64(magic);
        if (write_sync(csock, &magic, sizeof(magic)) != sizeof(magic)) {
            LOG("write failed (magic)");
514
            goto fail;
N
Nick Thomas 已提交
515 516 517 518
        }
        opt = cpu_to_be32(NBD_OPT_EXPORT_NAME);
        if (write_sync(csock, &opt, sizeof(opt)) != sizeof(opt)) {
            LOG("write failed (opt)");
519
            goto fail;
N
Nick Thomas 已提交
520 521 522 523 524
        }
        namesize = cpu_to_be32(strlen(name));
        if (write_sync(csock, &namesize, sizeof(namesize)) !=
            sizeof(namesize)) {
            LOG("write failed (namesize)");
525
            goto fail;
N
Nick Thomas 已提交
526 527 528
        }
        if (write_sync(csock, (char*)name, strlen(name)) != strlen(name)) {
            LOG("write failed (name)");
529
            goto fail;
N
Nick Thomas 已提交
530 531 532 533
        }
    } else {
        TRACE("Checking magic (cli_magic)");

P
Paolo Bonzini 已提交
534
        if (magic != NBD_CLIENT_MAGIC) {
N
Nick Thomas 已提交
535
            LOG("Bad magic received");
536
            goto fail;
N
Nick Thomas 已提交
537 538 539 540 541
        }
    }

    if (read_sync(csock, &s, sizeof(s)) != sizeof(s)) {
        LOG("read failed");
542
        goto fail;
N
Nick Thomas 已提交
543 544 545 546 547 548 549 550
    }
    *size = be64_to_cpu(s);
    *blocksize = 1024;
    TRACE("Size is %" PRIu64, *size);

    if (!name) {
        if (read_sync(csock, flags, sizeof(*flags)) != sizeof(*flags)) {
            LOG("read failed (flags)");
551
            goto fail;
N
Nick Thomas 已提交
552 553 554 555 556
        }
        *flags = be32_to_cpup(flags);
    } else {
        if (read_sync(csock, &tmp, sizeof(tmp)) != sizeof(tmp)) {
            LOG("read failed (tmp)");
557
            goto fail;
N
Nick Thomas 已提交
558 559 560 561 562
        }
        *flags |= be32_to_cpu(tmp);
    }
    if (read_sync(csock, &buf, 124) != 124) {
        LOG("read failed (buf)");
563
        goto fail;
N
Nick Thomas 已提交
564
    }
565 566 567
    rc = 0;

fail:
568
    socket_set_nonblock(csock);
569
    return rc;
570
}
B
bellard 已提交
571

P
Paolo Bonzini 已提交
572 573
#ifdef __linux__
int nbd_init(int fd, int csock, uint32_t flags, off_t size, size_t blocksize)
574
{
575 576
    TRACE("Setting NBD socket");

577
    if (ioctl(fd, NBD_SET_SOCK, csock) < 0) {
578 579
        int serrno = errno;
        LOG("Failed to set NBD socket");
580
        return -serrno;
581 582
    }

N
Nick Thomas 已提交
583
    TRACE("Setting block size to %lu", (unsigned long)blocksize);
B
bellard 已提交
584

585
    if (ioctl(fd, NBD_SET_BLKSIZE, blocksize) < 0) {
N
Nick Thomas 已提交
586 587
        int serrno = errno;
        LOG("Failed setting NBD block size");
588
        return -serrno;
N
Nick Thomas 已提交
589
    }
B
bellard 已提交
590

B
Blue Swirl 已提交
591
        TRACE("Setting size to %zd block(s)", (size_t)(size / blocksize));
B
bellard 已提交
592

593
    if (ioctl(fd, NBD_SET_SIZE_BLOCKS, size / blocksize) < 0) {
N
Nick Thomas 已提交
594 595
        int serrno = errno;
        LOG("Failed setting size (in blocks)");
596
        return -serrno;
N
Nick Thomas 已提交
597
    }
B
bellard 已提交
598

P
Paolo Bonzini 已提交
599 600 601 602 603 604 605 606 607 608 609
    if (ioctl(fd, NBD_SET_FLAGS, flags) < 0) {
        if (errno == ENOTTY) {
            int read_only = (flags & NBD_FLAG_READ_ONLY) != 0;
            TRACE("Setting readonly attribute");

            if (ioctl(fd, BLKROSET, (unsigned long) &read_only) < 0) {
                int serrno = errno;
                LOG("Failed setting read-only attribute");
                return -serrno;
            }
        } else {
P
Paolo Bonzini 已提交
610
            int serrno = errno;
P
Paolo Bonzini 已提交
611
            LOG("Failed setting flags");
612
            return -serrno;
P
Paolo Bonzini 已提交
613 614 615
        }
    }

N
Nick Thomas 已提交
616
    TRACE("Negotiation ended");
B
bellard 已提交
617

N
Nick Thomas 已提交
618
    return 0;
B
bellard 已提交
619 620 621 622
}

int nbd_disconnect(int fd)
{
N
Nick Thomas 已提交
623 624 625 626
    ioctl(fd, NBD_CLEAR_QUE);
    ioctl(fd, NBD_DISCONNECT);
    ioctl(fd, NBD_CLEAR_SOCK);
    return 0;
B
bellard 已提交
627 628
}

629
int nbd_client(int fd)
B
bellard 已提交
630
{
N
Nick Thomas 已提交
631 632
    int ret;
    int serrno;
B
bellard 已提交
633

N
Nick Thomas 已提交
634
    TRACE("Doing NBD loop");
B
bellard 已提交
635

N
Nick Thomas 已提交
636
    ret = ioctl(fd, NBD_DO_IT);
637
    if (ret < 0 && errno == EPIPE) {
638 639 640 641 642 643
        /* NBD_DO_IT normally returns EPIPE when someone has disconnected
         * the socket via NBD_DISCONNECT.  We do not want to return 1 in
         * that case.
         */
        ret = 0;
    }
N
Nick Thomas 已提交
644
    serrno = errno;
B
bellard 已提交
645

N
Nick Thomas 已提交
646
    TRACE("NBD loop returned %d: %s", ret, strerror(serrno));
B
bellard 已提交
647

N
Nick Thomas 已提交
648 649
    TRACE("Clearing NBD queue");
    ioctl(fd, NBD_CLEAR_QUE);
B
bellard 已提交
650

N
Nick Thomas 已提交
651 652
    TRACE("Clearing NBD socket");
    ioctl(fd, NBD_CLEAR_SOCK);
B
bellard 已提交
653

N
Nick Thomas 已提交
654 655
    errno = serrno;
    return ret;
B
bellard 已提交
656
}
657
#else
P
Paolo Bonzini 已提交
658
int nbd_init(int fd, int csock, uint32_t flags, off_t size, size_t blocksize)
659
{
660
    return -ENOTSUP;
661 662 663 664
}

int nbd_disconnect(int fd)
{
665
    return -ENOTSUP;
666 667
}

668
int nbd_client(int fd)
669
{
670
    return -ENOTSUP;
671 672
}
#endif
B
bellard 已提交
673

P
Paolo Bonzini 已提交
674
ssize_t nbd_send_request(int csock, struct nbd_request *request)
B
bellard 已提交
675
{
P
Paolo Bonzini 已提交
676
    uint8_t buf[NBD_REQUEST_SIZE];
677
    ssize_t ret;
N
Nick Thomas 已提交
678 679 680 681 682 683

    cpu_to_be32w((uint32_t*)buf, NBD_REQUEST_MAGIC);
    cpu_to_be32w((uint32_t*)(buf + 4), request->type);
    cpu_to_be64w((uint64_t*)(buf + 8), request->handle);
    cpu_to_be64w((uint64_t*)(buf + 16), request->from);
    cpu_to_be32w((uint32_t*)(buf + 24), request->len);
684

N
Nick Thomas 已提交
685 686 687 688
    TRACE("Sending request to client: "
          "{ .from = %" PRIu64", .len = %u, .handle = %" PRIu64", .type=%i}",
          request->from, request->len, request->handle, request->type);

689 690 691 692 693 694
    ret = write_sync(csock, buf, sizeof(buf));
    if (ret < 0) {
        return ret;
    }

    if (ret != sizeof(buf)) {
N
Nick Thomas 已提交
695
        LOG("writing to socket failed");
696
        return -EINVAL;
N
Nick Thomas 已提交
697 698 699
    }
    return 0;
}
700

P
Paolo Bonzini 已提交
701
static ssize_t nbd_receive_request(int csock, struct nbd_request *request)
702
{
P
Paolo Bonzini 已提交
703
    uint8_t buf[NBD_REQUEST_SIZE];
N
Nick Thomas 已提交
704
    uint32_t magic;
705
    ssize_t ret;
N
Nick Thomas 已提交
706

707 708 709 710 711 712
    ret = read_sync(csock, buf, sizeof(buf));
    if (ret < 0) {
        return ret;
    }

    if (ret != sizeof(buf)) {
N
Nick Thomas 已提交
713
        LOG("read failed");
714
        return -EINVAL;
N
Nick Thomas 已提交
715 716 717 718 719 720 721 722 723 724 725 726 727 728 729 730 731 732 733 734 735 736
    }

    /* Request
       [ 0 ..  3]   magic   (NBD_REQUEST_MAGIC)
       [ 4 ..  7]   type    (0 == READ, 1 == WRITE)
       [ 8 .. 15]   handle
       [16 .. 23]   from
       [24 .. 27]   len
     */

    magic = be32_to_cpup((uint32_t*)buf);
    request->type  = be32_to_cpup((uint32_t*)(buf + 4));
    request->handle = be64_to_cpup((uint64_t*)(buf + 8));
    request->from  = be64_to_cpup((uint64_t*)(buf + 16));
    request->len   = be32_to_cpup((uint32_t*)(buf + 24));

    TRACE("Got request: "
          "{ magic = 0x%x, .type = %d, from = %" PRIu64" , len = %u }",
          magic, request->type, request->from, request->len);

    if (magic != NBD_REQUEST_MAGIC) {
        LOG("invalid magic (got 0x%x)", magic);
737
        return -EINVAL;
N
Nick Thomas 已提交
738 739
    }
    return 0;
740 741
}

P
Paolo Bonzini 已提交
742
ssize_t nbd_receive_reply(int csock, struct nbd_reply *reply)
743
{
N
Nick Thomas 已提交
744 745
    uint8_t buf[NBD_REPLY_SIZE];
    uint32_t magic;
746
    ssize_t ret;
N
Nick Thomas 已提交
747

748 749 750 751 752 753
    ret = read_sync(csock, buf, sizeof(buf));
    if (ret < 0) {
        return ret;
    }

    if (ret != sizeof(buf)) {
N
Nick Thomas 已提交
754
        LOG("read failed");
755
        return -EINVAL;
N
Nick Thomas 已提交
756 757 758 759 760 761 762 763 764 765 766 767 768 769 770 771 772 773
    }

    /* Reply
       [ 0 ..  3]    magic   (NBD_REPLY_MAGIC)
       [ 4 ..  7]    error   (0 == no error)
       [ 7 .. 15]    handle
     */

    magic = be32_to_cpup((uint32_t*)buf);
    reply->error  = be32_to_cpup((uint32_t*)(buf + 4));
    reply->handle = be64_to_cpup((uint64_t*)(buf + 8));

    TRACE("Got reply: "
          "{ magic = 0x%x, .error = %d, handle = %" PRIu64" }",
          magic, reply->error, reply->handle);

    if (magic != NBD_REPLY_MAGIC) {
        LOG("invalid magic (got 0x%x)", magic);
774
        return -EINVAL;
N
Nick Thomas 已提交
775 776
    }
    return 0;
777 778
}

P
Paolo Bonzini 已提交
779
static ssize_t nbd_send_reply(int csock, struct nbd_reply *reply)
780
{
P
Paolo Bonzini 已提交
781
    uint8_t buf[NBD_REPLY_SIZE];
782
    ssize_t ret;
N
Nick Thomas 已提交
783 784 785 786 787 788 789 790 791 792 793 794

    /* Reply
       [ 0 ..  3]    magic   (NBD_REPLY_MAGIC)
       [ 4 ..  7]    error   (0 == no error)
       [ 7 .. 15]    handle
     */
    cpu_to_be32w((uint32_t*)buf, NBD_REPLY_MAGIC);
    cpu_to_be32w((uint32_t*)(buf + 4), reply->error);
    cpu_to_be64w((uint64_t*)(buf + 8), reply->handle);

    TRACE("Sending response to client");

795 796 797 798 799 800
    ret = write_sync(csock, buf, sizeof(buf));
    if (ret < 0) {
        return ret;
    }

    if (ret != sizeof(buf)) {
N
Nick Thomas 已提交
801
        LOG("writing to socket failed");
802
        return -EINVAL;
N
Nick Thomas 已提交
803 804
    }
    return 0;
805
}
B
bellard 已提交
806

P
Paolo Bonzini 已提交
807 808
#define MAX_NBD_REQUESTS 16

809
void nbd_client_get(NBDClient *client)
810 811 812 813
{
    client->refcount++;
}

814
void nbd_client_put(NBDClient *client)
815 816
{
    if (--client->refcount == 0) {
817 818 819 820 821 822 823 824
        /* The last reference should be dropped by client->close,
         * which is called by nbd_client_close.
         */
        assert(client->closing);

        qemu_set_fd_handler2(client->sock, NULL, NULL, NULL, NULL);
        close(client->sock);
        client->sock = -1;
825 826 827 828
        if (client->exp) {
            QTAILQ_REMOVE(&client->exp->clients, client, next);
            nbd_export_put(client->exp);
        }
829 830 831 832
        g_free(client);
    }
}

833
void nbd_client_close(NBDClient *client)
834
{
835 836 837 838 839 840 841 842 843 844 845 846
    if (client->closing) {
        return;
    }

    client->closing = true;

    /* Force requests to finish.  They will drop their own references,
     * then we'll close the socket and free the NBDClient.
     */
    shutdown(client->sock, 2);

    /* Also tell the client, so that they release their reference.  */
847 848 849 850 851
    if (client->close) {
        client->close(client);
    }
}

852
static NBDRequest *nbd_request_get(NBDClient *client)
P
Paolo Bonzini 已提交
853 854
{
    NBDRequest *req;
855 856
    NBDExport *exp = client->exp;

P
Paolo Bonzini 已提交
857 858 859
    assert(client->nb_requests <= MAX_NBD_REQUESTS - 1);
    client->nb_requests++;

P
Paolo Bonzini 已提交
860 861 862 863 864 865 866
    if (QSIMPLEQ_EMPTY(&exp->requests)) {
        req = g_malloc0(sizeof(NBDRequest));
        req->data = qemu_blockalign(exp->bs, NBD_BUFFER_SIZE);
    } else {
        req = QSIMPLEQ_FIRST(&exp->requests);
        QSIMPLEQ_REMOVE_HEAD(&exp->requests, entry);
    }
867 868
    nbd_client_get(client);
    req->client = client;
P
Paolo Bonzini 已提交
869 870 871
    return req;
}

872
static void nbd_request_put(NBDRequest *req)
P
Paolo Bonzini 已提交
873
{
874 875
    NBDClient *client = req->client;
    QSIMPLEQ_INSERT_HEAD(&client->exp->requests, req, entry);
P
Paolo Bonzini 已提交
876 877 878
    if (client->nb_requests-- == MAX_NBD_REQUESTS) {
        qemu_notify_event();
    }
879
    nbd_client_put(client);
P
Paolo Bonzini 已提交
880 881
}

P
Paolo Bonzini 已提交
882
NBDExport *nbd_export_new(BlockDriverState *bs, off_t dev_offset,
883 884
                          off_t size, uint32_t nbdflags,
                          void (*close)(NBDExport *))
P
Paolo Bonzini 已提交
885 886
{
    NBDExport *exp = g_malloc0(sizeof(NBDExport));
P
Paolo Bonzini 已提交
887
    QSIMPLEQ_INIT(&exp->requests);
888
    exp->refcount = 1;
889
    QTAILQ_INIT(&exp->clients);
P
Paolo Bonzini 已提交
890 891 892
    exp->bs = bs;
    exp->dev_offset = dev_offset;
    exp->nbdflags = nbdflags;
P
Paolo Bonzini 已提交
893
    exp->size = size == -1 ? bdrv_getlength(bs) : size;
894
    exp->close = close;
P
Paolo Bonzini 已提交
895 896 897
    return exp;
}

P
Paolo Bonzini 已提交
898 899 900 901 902 903 904 905 906 907 908 909 910 911 912 913 914 915 916 917 918 919 920 921 922 923 924 925 926 927 928 929 930
NBDExport *nbd_export_find(const char *name)
{
    NBDExport *exp;
    QTAILQ_FOREACH(exp, &exports, next) {
        if (strcmp(name, exp->name) == 0) {
            return exp;
        }
    }

    return NULL;
}

void nbd_export_set_name(NBDExport *exp, const char *name)
{
    if (exp->name == name) {
        return;
    }

    nbd_export_get(exp);
    if (exp->name != NULL) {
        g_free(exp->name);
        exp->name = NULL;
        QTAILQ_REMOVE(&exports, exp, next);
        nbd_export_put(exp);
    }
    if (name != NULL) {
        nbd_export_get(exp);
        exp->name = g_strdup(name);
        QTAILQ_INSERT_TAIL(&exports, exp, next);
    }
    nbd_export_put(exp);
}

P
Paolo Bonzini 已提交
931 932
void nbd_export_close(NBDExport *exp)
{
933
    NBDClient *client, *next;
934

935 936 937 938
    nbd_export_get(exp);
    QTAILQ_FOREACH_SAFE(client, &exp->clients, next, next) {
        nbd_client_close(client);
    }
P
Paolo Bonzini 已提交
939
    nbd_export_set_name(exp, NULL);
940
    nbd_export_put(exp);
941 942 943 944 945 946 947 948 949 950 951 952 953
}

void nbd_export_get(NBDExport *exp)
{
    assert(exp->refcount > 0);
    exp->refcount++;
}

void nbd_export_put(NBDExport *exp)
{
    assert(exp->refcount > 0);
    if (exp->refcount == 1) {
        nbd_export_close(exp);
P
Paolo Bonzini 已提交
954 955
    }

956
    if (--exp->refcount == 0) {
P
Paolo Bonzini 已提交
957 958
        assert(exp->name == NULL);

959 960 961 962
        if (exp->close) {
            exp->close(exp);
        }

963 964 965 966 967 968 969 970 971
        while (!QSIMPLEQ_EMPTY(&exp->requests)) {
            NBDRequest *first = QSIMPLEQ_FIRST(&exp->requests);
            QSIMPLEQ_REMOVE_HEAD(&exp->requests, entry);
            qemu_vfree(first->data);
            g_free(first);
        }

        g_free(exp);
    }
P
Paolo Bonzini 已提交
972 973
}

P
Paolo Bonzini 已提交
974 975 976 977 978
BlockDriverState *nbd_export_get_blockdev(NBDExport *exp)
{
    return exp->bs;
}

P
Paolo Bonzini 已提交
979 980 981 982 983 984 985 986 987
void nbd_export_close_all(void)
{
    NBDExport *exp, *next;

    QTAILQ_FOREACH_SAFE(exp, &exports, next, next) {
        nbd_export_close(exp);
    }
}

P
Paolo Bonzini 已提交
988
static int nbd_can_read(void *opaque);
P
Paolo Bonzini 已提交
989 990 991
static void nbd_read(void *opaque);
static void nbd_restart_write(void *opaque);

P
Paolo Bonzini 已提交
992 993
static ssize_t nbd_co_send_reply(NBDRequest *req, struct nbd_reply *reply,
                                 int len)
994
{
995 996
    NBDClient *client = req->client;
    int csock = client->sock;
P
Paolo Bonzini 已提交
997
    ssize_t rc, ret;
998

P
Paolo Bonzini 已提交
999
    qemu_co_mutex_lock(&client->send_lock);
P
Paolo Bonzini 已提交
1000 1001
    qemu_set_fd_handler2(csock, nbd_can_read, nbd_read,
                         nbd_restart_write, client);
P
Paolo Bonzini 已提交
1002 1003
    client->send_coroutine = qemu_coroutine_self();

1004 1005 1006 1007 1008
    if (!len) {
        rc = nbd_send_reply(csock, reply);
    } else {
        socket_set_cork(csock, 1);
        rc = nbd_send_reply(csock, reply);
1009
        if (rc >= 0) {
P
Paolo Bonzini 已提交
1010
            ret = qemu_co_send(csock, req->data, len);
1011
            if (ret != len) {
1012
                rc = -EIO;
1013 1014 1015 1016
            }
        }
        socket_set_cork(csock, 0);
    }
P
Paolo Bonzini 已提交
1017 1018

    client->send_coroutine = NULL;
P
Paolo Bonzini 已提交
1019
    qemu_set_fd_handler2(csock, nbd_can_read, nbd_read, NULL, client);
P
Paolo Bonzini 已提交
1020
    qemu_co_mutex_unlock(&client->send_lock);
1021 1022 1023
    return rc;
}

P
Paolo Bonzini 已提交
1024
static ssize_t nbd_co_receive_request(NBDRequest *req, struct nbd_request *request)
1025
{
1026 1027
    NBDClient *client = req->client;
    int csock = client->sock;
P
Paolo Bonzini 已提交
1028
    ssize_t rc;
1029

P
Paolo Bonzini 已提交
1030
    client->recv_coroutine = qemu_coroutine_self();
1031 1032 1033 1034 1035
    rc = nbd_receive_request(csock, request);
    if (rc < 0) {
        if (rc != -EAGAIN) {
            rc = -EIO;
        }
1036 1037 1038 1039 1040 1041 1042 1043 1044 1045 1046 1047 1048 1049 1050 1051 1052 1053 1054 1055 1056 1057
        goto out;
    }

    if (request->len > NBD_BUFFER_SIZE) {
        LOG("len (%u) is larger than max len (%u)",
            request->len, NBD_BUFFER_SIZE);
        rc = -EINVAL;
        goto out;
    }

    if ((request->from + request->len) < request->from) {
        LOG("integer overflow detected! "
            "you're probably being attacked");
        rc = -EINVAL;
        goto out;
    }

    TRACE("Decoding type");

    if ((request->type & NBD_CMD_MASK_COMMAND) == NBD_CMD_WRITE) {
        TRACE("Reading %u byte(s)", request->len);

P
Paolo Bonzini 已提交
1058
        if (qemu_co_recv(csock, req->data, request->len) != request->len) {
1059 1060 1061 1062 1063 1064 1065 1066
            LOG("reading from socket failed");
            rc = -EIO;
            goto out;
        }
    }
    rc = 0;

out:
P
Paolo Bonzini 已提交
1067
    client->recv_coroutine = NULL;
1068 1069 1070
    return rc;
}

P
Paolo Bonzini 已提交
1071
static void nbd_trip(void *opaque)
1072
{
P
Paolo Bonzini 已提交
1073
    NBDClient *client = opaque;
1074
    NBDExport *exp = client->exp;
1075
    NBDRequest *req;
N
Nick Thomas 已提交
1076 1077
    struct nbd_request request;
    struct nbd_reply reply;
P
Paolo Bonzini 已提交
1078
    ssize_t ret;
N
Nick Thomas 已提交
1079 1080

    TRACE("Reading request.");
1081 1082 1083
    if (client->closing) {
        return;
    }
N
Nick Thomas 已提交
1084

1085
    req = nbd_request_get(client);
P
Paolo Bonzini 已提交
1086
    ret = nbd_co_receive_request(req, &request);
1087 1088 1089
    if (ret == -EAGAIN) {
        goto done;
    }
1090
    if (ret == -EIO) {
P
Paolo Bonzini 已提交
1091
        goto out;
1092
    }
N
Nick Thomas 已提交
1093

1094 1095 1096
    reply.handle = request.handle;
    reply.error = 0;

1097 1098 1099
    if (ret < 0) {
        reply.error = -ret;
        goto error_reply;
N
Nick Thomas 已提交
1100 1101
    }

P
Paolo Bonzini 已提交
1102
    if ((request.from + request.len) > exp->size) {
N
Nick Thomas 已提交
1103 1104
            LOG("From: %" PRIu64 ", Len: %u, Size: %" PRIu64
            ", Offset: %" PRIu64 "\n",
P
Paolo Bonzini 已提交
1105
                    request.from, request.len,
S
Stefan Weil 已提交
1106
                    (uint64_t)exp->size, (uint64_t)exp->dev_offset);
N
Nick Thomas 已提交
1107
        LOG("requested operation past EOF--bad client?");
1108
        goto invalid_request;
N
Nick Thomas 已提交
1109 1110
    }

1111
    switch (request.type & NBD_CMD_MASK_COMMAND) {
N
Nick Thomas 已提交
1112 1113 1114
    case NBD_CMD_READ:
        TRACE("Request type is READ");

P
Paolo Bonzini 已提交
1115 1116 1117 1118 1119 1120 1121 1122 1123
        if (request.type & NBD_CMD_FLAG_FUA) {
            ret = bdrv_co_flush(exp->bs);
            if (ret < 0) {
                LOG("flush failed");
                reply.error = -ret;
                goto error_reply;
            }
        }

P
Paolo Bonzini 已提交
1124
        ret = bdrv_read(exp->bs, (request.from + exp->dev_offset) / 512,
P
Paolo Bonzini 已提交
1125
                        req->data, request.len / 512);
1126
        if (ret < 0) {
N
Nick Thomas 已提交
1127
            LOG("reading from file failed");
1128
            reply.error = -ret;
1129
            goto error_reply;
N
Nick Thomas 已提交
1130 1131 1132
        }

        TRACE("Read %u byte(s)", request.len);
P
Paolo Bonzini 已提交
1133
        if (nbd_co_send_reply(req, &reply, request.len) < 0)
P
Paolo Bonzini 已提交
1134
            goto out;
N
Nick Thomas 已提交
1135 1136 1137 1138
        break;
    case NBD_CMD_WRITE:
        TRACE("Request type is WRITE");

P
Paolo Bonzini 已提交
1139
        if (exp->nbdflags & NBD_FLAG_READ_ONLY) {
N
Nick Thomas 已提交
1140
            TRACE("Server is read-only, return error");
1141 1142 1143 1144 1145 1146
            reply.error = EROFS;
            goto error_reply;
        }

        TRACE("Writing to device");

P
Paolo Bonzini 已提交
1147
        ret = bdrv_write(exp->bs, (request.from + exp->dev_offset) / 512,
P
Paolo Bonzini 已提交
1148
                         req->data, request.len / 512);
1149 1150 1151 1152 1153
        if (ret < 0) {
            LOG("writing to file failed");
            reply.error = -ret;
            goto error_reply;
        }
N
Nick Thomas 已提交
1154

1155
        if (request.type & NBD_CMD_FLAG_FUA) {
P
Paolo Bonzini 已提交
1156
            ret = bdrv_co_flush(exp->bs);
1157
            if (ret < 0) {
1158
                LOG("flush failed");
1159
                reply.error = -ret;
1160
                goto error_reply;
1161
            }
N
Nick Thomas 已提交
1162 1163
        }

1164
        if (nbd_co_send_reply(req, &reply, 0) < 0) {
P
Paolo Bonzini 已提交
1165
            goto out;
1166
        }
N
Nick Thomas 已提交
1167 1168 1169 1170
        break;
    case NBD_CMD_DISC:
        TRACE("Request type is DISCONNECT");
        errno = 0;
P
Paolo Bonzini 已提交
1171
        goto out;
P
Paolo Bonzini 已提交
1172 1173 1174
    case NBD_CMD_FLUSH:
        TRACE("Request type is FLUSH");

P
Paolo Bonzini 已提交
1175
        ret = bdrv_co_flush(exp->bs);
P
Paolo Bonzini 已提交
1176 1177 1178 1179
        if (ret < 0) {
            LOG("flush failed");
            reply.error = -ret;
        }
1180
        if (nbd_co_send_reply(req, &reply, 0) < 0) {
P
Paolo Bonzini 已提交
1181
            goto out;
1182
        }
P
Paolo Bonzini 已提交
1183 1184 1185
        break;
    case NBD_CMD_TRIM:
        TRACE("Request type is TRIM");
P
Paolo Bonzini 已提交
1186 1187
        ret = bdrv_co_discard(exp->bs, (request.from + exp->dev_offset) / 512,
                              request.len / 512);
P
Paolo Bonzini 已提交
1188 1189 1190 1191
        if (ret < 0) {
            LOG("discard failed");
            reply.error = -ret;
        }
1192
        if (nbd_co_send_reply(req, &reply, 0) < 0) {
P
Paolo Bonzini 已提交
1193
            goto out;
1194
        }
P
Paolo Bonzini 已提交
1195
        break;
N
Nick Thomas 已提交
1196 1197
    default:
        LOG("invalid request type (%u) received", request.type);
1198 1199 1200
    invalid_request:
        reply.error = -EINVAL;
    error_reply:
1201
        if (nbd_co_send_reply(req, &reply, 0) < 0) {
P
Paolo Bonzini 已提交
1202
            goto out;
1203
        }
1204
        break;
N
Nick Thomas 已提交
1205 1206 1207 1208
    }

    TRACE("Request/Reply complete");

1209
done:
P
Paolo Bonzini 已提交
1210 1211 1212
    nbd_request_put(req);
    return;

P
Paolo Bonzini 已提交
1213
out:
1214
    nbd_request_put(req);
P
Paolo Bonzini 已提交
1215
    nbd_client_close(client);
B
bellard 已提交
1216
}
P
Paolo Bonzini 已提交
1217

P
Paolo Bonzini 已提交
1218 1219 1220 1221 1222 1223 1224
static int nbd_can_read(void *opaque)
{
    NBDClient *client = opaque;

    return client->recv_coroutine || client->nb_requests < MAX_NBD_REQUESTS;
}

1225 1226 1227 1228
static void nbd_read(void *opaque)
{
    NBDClient *client = opaque;

P
Paolo Bonzini 已提交
1229 1230 1231 1232
    if (client->recv_coroutine) {
        qemu_coroutine_enter(client->recv_coroutine, NULL);
    } else {
        qemu_coroutine_enter(qemu_coroutine_create(nbd_trip), client);
1233 1234 1235
    }
}

P
Paolo Bonzini 已提交
1236 1237 1238 1239 1240 1241 1242
static void nbd_restart_write(void *opaque)
{
    NBDClient *client = opaque;

    qemu_coroutine_enter(client->send_coroutine, NULL);
}

1243 1244
NBDClient *nbd_client_new(NBDExport *exp, int csock,
                          void (*close)(NBDClient *))
P
Paolo Bonzini 已提交
1245
{
1246 1247 1248 1249 1250
    NBDClient *client;
    client = g_malloc0(sizeof(NBDClient));
    client->refcount = 1;
    client->exp = exp;
    client->sock = csock;
1251 1252 1253 1254
    if (nbd_send_negotiate(client) < 0) {
        g_free(client);
        return NULL;
    }
1255
    client->close = close;
P
Paolo Bonzini 已提交
1256
    qemu_co_mutex_init(&client->send_lock);
P
Paolo Bonzini 已提交
1257
    qemu_set_fd_handler2(csock, nbd_can_read, nbd_read, NULL, client);
1258

1259 1260 1261 1262
    if (exp) {
        QTAILQ_INSERT_TAIL(&exp->clients, client, next);
        nbd_export_get(exp);
    }
1263
    return client;
P
Paolo Bonzini 已提交
1264
}