net.c 45.1 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23
/*
 * QEMU System Emulator
 *
 * Copyright (c) 2003-2008 Fabrice Bellard
 *
 * Permission is hereby granted, free of charge, to any person obtaining a copy
 * of this software and associated documentation files (the "Software"), to deal
 * in the Software without restriction, including without limitation the rights
 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
 * copies of the Software, and to permit persons to whom the Software is
 * furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
 * THE SOFTWARE.
 */
24

P
Peter Maydell 已提交
25
#include "qemu/osdep.h"
B
blueswir1 已提交
26

P
Paolo Bonzini 已提交
27
#include "net/net.h"
P
Paolo Bonzini 已提交
28 29
#include "clients.h"
#include "hub.h"
P
Paolo Bonzini 已提交
30
#include "net/slirp.h"
31
#include "net/eth.h"
P
Paolo Bonzini 已提交
32
#include "util.h"
33

34
#include "monitor/monitor.h"
35
#include "qemu/help_option.h"
36
#include "qapi/qmp/qdict.h"
37
#include "qapi/qmp/qerror.h"
38
#include "qemu/error-report.h"
39
#include "qemu/sockets.h"
40
#include "qemu/cutils.h"
41
#include "qemu/config-file.h"
L
Luiz Capitulino 已提交
42
#include "qmp-commands.h"
43
#include "hw/qdev.h"
44
#include "qemu/iov.h"
45
#include "qemu/main-loop.h"
46
#include "qemu/option.h"
47
#include "qapi-visit.h"
48
#include "qapi/error.h"
49
#include "qapi/opts-visitor.h"
50
#include "sysemu/sysemu.h"
51
#include "sysemu/qtest.h"
Y
Yang Hongyang 已提交
52
#include "net/filter.h"
53
#include "qapi/string-output-visitor.h"
54

55 56 57 58 59
/* Net bridge is currently not supported for W32. */
#if !defined(_WIN32)
# define CONFIG_NET_BRIDGE
#endif

60
static VMChangeStateEntry *net_change_state_entry;
61
static QTAILQ_HEAD(, NetClientState) net_clients;
62

63 64 65 66 67 68 69
/*
 * NULL-terminated list of host network backend names.  The entries for
 * optional backends are compiled in only when the matching CONFIG_* symbol
 * is defined.
 */
const char *host_net_devices[] = {
    "tap",
    "socket",
    "dump",
#ifdef CONFIG_NET_BRIDGE
    "bridge",
#endif
#ifdef CONFIG_NETMAP
    "netmap",
#endif
#ifdef CONFIG_SLIRP
    "user",
#endif
#ifdef CONFIG_VDE
    "vde",
#endif
    "vhost-user",
    NULL,
};

83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105
/***********************************************************/
/* network device redirectors */

/*
 * Split off the text in front of the first @sep character found in *@pp.
 *
 * The text is copied into @buf as a NUL-terminated string, truncated to
 * @buf_size - 1 bytes if it does not fit.  Nothing is copied when
 * @buf_size is not positive.  On success *@pp is advanced to the character
 * following the separator.
 *
 * Returns 0 on success, or -1 (leaving *@pp untouched) when @sep does not
 * occur in the string.
 */
static int get_str_sep(char *buf, int buf_size, const char **pp, int sep)
{
    const char *start = *pp;
    const char *delim = strchr(start, sep);
    int count;

    if (delim == NULL) {
        return -1;
    }

    if (buf_size > 0) {
        count = delim - start;
        if (count >= buf_size) {
            count = buf_size - 1;
        }
        memcpy(buf, start, count);
        buf[count] = '\0';
    }

    *pp = delim + 1;
    return 0;
}

106 107
/*
 * Parse a "host:port" string into an IPv4 socket address.
 *
 * @saddr: filled in with family AF_INET, the resolved address and the port
 *         in network byte order
 * @str:   text of the form "host:port"; an empty host selects address 0
 * @errp:  receives a description of the failure
 *
 * A host part starting with a digit must be a literal accepted by
 * inet_aton(); anything else is looked up with gethostbyname().  The port
 * is read with strtol() base 0 and must lie in 0..65535; previously a value
 * outside that range was silently truncated by htons().
 *
 * Returns 0 on success, -1 on error.
 */
int parse_host_port(struct sockaddr_in *saddr, const char *str,
                    Error **errp)
{
    char buf[512];
    struct hostent *he;
    const char *p;
    char *end;
    long port;

    p = str;
    if (get_str_sep(buf, sizeof(buf), &p, ':') < 0) {
        error_setg(errp, "host address '%s' doesn't contain ':' "
                   "separating host from port", str);
        return -1;
    }
    saddr->sin_family = AF_INET;
    if (buf[0] == '\0') {
        saddr->sin_addr.s_addr = 0;
    } else {
        if (qemu_isdigit(buf[0])) {
            if (!inet_aton(buf, &saddr->sin_addr)) {
                error_setg(errp, "host address '%s' is not a valid "
                           "IPv4 address", buf);
                return -1;
            }
        } else {
            he = gethostbyname(buf);
            if (he == NULL) {
                error_setg(errp, "can't resolve host address '%s'", buf);
                return -1;
            }
            saddr->sin_addr = *(struct in_addr *)he->h_addr;
        }
    }
    port = strtol(p, &end, 0);
    if (end == p) {
        error_setg(errp, "port number '%s' is invalid", p);
        return -1;
    }
    /* Also catches strtol() overflow, which saturates to LONG_MIN/LONG_MAX */
    if (port < 0 || port > 65535) {
        error_setg(errp, "port number '%s' is out of range", p);
        return -1;
    }
    saddr->sin_port = htons(port);
    return 0;
}

148 149 150 151 152 153 154
/*
 * Format the six bytes at @macaddr as "xx:xx:xx:xx:xx:xx" (two lowercase
 * hex digits per byte) and return the string produced by
 * g_strdup_printf().
 */
char *qemu_mac_strdup_printf(const uint8_t *macaddr)
{
    char *text;

    text = g_strdup_printf("%.2x:%.2x:%.2x:%.2x:%.2x:%.2x",
                           macaddr[0], macaddr[1], macaddr[2],
                           macaddr[3], macaddr[4], macaddr[5]);
    return text;
}

155
/*
 * Write "model=<model>,macaddr=<xx:xx:xx:xx:xx:xx>" into @nc->info_str,
 * using @nc->model and the six bytes of @macaddr.  snprintf() bounds the
 * output to the size of the info_str buffer.
 */
void qemu_format_nic_info_str(NetClientState *nc, uint8_t macaddr[6])
{
    snprintf(nc->info_str, sizeof(nc->info_str),
             "model=%s,macaddr=%02x:%02x:%02x:%02x:%02x:%02x",
             nc->model,
             macaddr[0], macaddr[1], macaddr[2],
             macaddr[3], macaddr[4], macaddr[5]);
}

164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204
/* Usage counters indexed by the last byte of a MAC address. */
static int mac_table[256] = {0};

/*
 * Increment the mac_table counter for the last byte of @macaddr.  Only
 * values in the range 0x56..0xFE are tracked; any other last byte leaves
 * the table unchanged.
 */
static void qemu_macaddr_set_used(MACAddr *macaddr)
{
    const int last = macaddr->a[5];

    if (last >= 0x56 && last < 0xFF) {
        mac_table[last]++;
    }
}

/*
 * Decrement the mac_table counter for the last byte of @macaddr.
 *
 * Nothing happens unless the first five bytes equal 52:54:00:12:34 and the
 * last byte lies in the tracked range 0x56..0xFE.
 */
static void qemu_macaddr_set_free(MACAddr *macaddr)
{
    static const MACAddr base = { .a = { 0x52, 0x54, 0x00, 0x12, 0x34, 0 } };
    int last;

    /* Compare everything except the final byte against the prefix */
    if (memcmp(macaddr->a, &base.a, (sizeof(base.a) - 1)) != 0) {
        return;
    }

    last = macaddr->a[5];
    if (last >= 0x56 && last < 0xFF) {
        mac_table[last]--;
    }
}

/*
 * Return the lowest value in 0x56..0xFE whose mac_table counter is zero,
 * or -1 when every counter in that range is non-zero.
 */
static int qemu_macaddr_get_free(void)
{
    int candidate = 0x56;

    while (candidate < 0xFF) {
        if (mac_table[candidate] == 0) {
            return candidate;
        }
        candidate++;
    }

    return -1;
}

G
Gerd Hoffmann 已提交
205 206 207
/*
 * Give @macaddr a default value if it is all zeroes.
 *
 * A non-zero address is left untouched; if its first five bytes are
 * 52:54:00:12:34 its last byte is additionally recorded through
 * qemu_macaddr_set_used().  An all-zero address is replaced by
 * 52:54:00:12:34:XX, where XX comes from qemu_macaddr_get_free(), and is
 * then recorded as used.
 */
void qemu_macaddr_default_if_unset(MACAddr *macaddr)
{
    static const MACAddr zero = { .a = { 0,0,0,0,0,0 } };
    static const MACAddr base = { .a = { 0x52, 0x54, 0x00, 0x12, 0x34, 0 } };

    if (memcmp(macaddr, &zero, sizeof(zero)) != 0) {
        /* Caller supplied an address: only track it if it uses our prefix */
        if (memcmp(macaddr->a, &base.a, (sizeof(base.a) - 1)) == 0) {
            qemu_macaddr_set_used(macaddr);
        }
        return;
    }

    macaddr->a[0] = 0x52;
    macaddr->a[1] = 0x54;
    macaddr->a[2] = 0x00;
    macaddr->a[3] = 0x12;
    macaddr->a[4] = 0x34;
    /*
     * NOTE(review): qemu_macaddr_get_free() returns -1 when no value is
     * free; that result is stored here unchecked.
     */
    macaddr->a[5] = qemu_macaddr_get_free();
    qemu_macaddr_set_used(macaddr);
}

228 229 230
/**
 * Generate a name for net client
 *
A
Amos Kong 已提交
231
 * Only net clients created with the legacy -net option and NICs need this.
232
 */
233
static char *assign_name(NetClientState *nc1, const char *model)
234
{
235
    NetClientState *nc;
236 237
    int id = 0;

238 239
    QTAILQ_FOREACH(nc, &net_clients, next) {
        if (nc == nc1) {
240
            continue;
241
        }
A
Amos Kong 已提交
242
        if (strcmp(nc->model, model) == 0) {
243 244 245 246
            id++;
        }
    }

247
    return g_strdup_printf("%s.%d", model, id);
248 249
}

250 251 252 253 254
/*
 * Destructor installed by qemu_new_net_client(): releases the client
 * structure itself with g_free().
 */
static void qemu_net_client_destructor(NetClientState *nc)
{
    g_free(nc);
}

255 256 257 258
/*
 * Initialise an already allocated NetClientState and link it into the
 * global net_clients list.
 *
 * @nc:         client to initialise
 * @info:       driver description stored in @nc->info
 * @peer:       optional peer; it must not have a peer yet and is linked to
 *              @nc in both directions
 * @model:      model string, duplicated into @nc->model
 * @name:       client name, duplicated; when NULL a name is generated by
 *              assign_name()
 * @destructor: stored in @nc->destructor; may be NULL
 */
static void qemu_net_client_setup(NetClientState *nc,
                                  NetClientInfo *info,
                                  NetClientState *peer,
                                  const char *model,
                                  const char *name,
                                  NetClientDestructor *destructor)
{
    nc->info = info;
    nc->model = g_strdup(model);
    if (name) {
        nc->name = g_strdup(name);
    } else {
        nc->name = assign_name(nc, model);
    }

    if (peer) {
        assert(!peer->peer);
        nc->peer = peer;
        peer->peer = nc;
    }
    QTAILQ_INSERT_TAIL(&net_clients, nc, next);

    nc->incoming_queue = qemu_new_net_queue(qemu_deliver_packet_iov, nc);
    nc->destructor = destructor;
    QTAILQ_INIT(&nc->filters);
}

/*
 * Allocate and set up a new net client.
 *
 * @info->size bytes are allocated zero-filled (the size must be at least
 * sizeof(NetClientState)), then initialised by qemu_net_client_setup() with
 * qemu_net_client_destructor as the destructor.
 *
 * Returns the new client.
 */
NetClientState *qemu_new_net_client(NetClientInfo *info,
                                    NetClientState *peer,
                                    const char *model,
                                    const char *name)
{
    NetClientState *nc;

    assert(info->size >= sizeof(NetClientState));

    nc = g_malloc0(info->size);
    qemu_net_client_setup(nc, info, peer, model, name,
                          qemu_net_client_destructor);

    return nc;
}

298 299 300 301 302 303
/*
 * Allocate a NIC together with one NetClientState per queue.
 *
 * A single zero-filled allocation holds @info->size bytes for the NICState
 * followed by an array of MAX(1, @conf->peers.queues) NetClientState
 * entries; nic->ncs points at that array.  Each entry is set up with the
 * peer from @conf->peers.ncs at the same index and no destructor, and gets
 * its queue_index set.
 *
 * @info must describe a NET_CLIENT_DRIVER_NIC with size at least
 * sizeof(NICState).  @conf and @opaque are stored in the returned NICState.
 */
NICState *qemu_new_nic(NetClientInfo *info,
                       NICConf *conf,
                       const char *model,
                       const char *name,
                       void *opaque)
{
    NetClientState **peers = conf->peers.ncs;
    NICState *nic;
    int i, queues = MAX(1, conf->peers.queues);

    assert(info->type == NET_CLIENT_DRIVER_NIC);
    assert(info->size >= sizeof(NICState));

    nic = g_malloc0(info->size + sizeof(NetClientState) * queues);
    /* The per-queue client array lives directly behind the NIC state */
    nic->ncs = (void *)nic + info->size;
    nic->conf = conf;
    nic->opaque = opaque;

    for (i = 0; i < queues; i++) {
        qemu_net_client_setup(&nic->ncs[i], info, peers[i], model, name,
                              NULL);
        nic->ncs[i].queue_index = i;
    }

    return nic;
}

J
Jason Wang 已提交
325 326
/*
 * Return the NetClientState for queue @queue_index of @nic.  The index is
 * not range-checked.
 */
NetClientState *qemu_get_subqueue(NICState *nic, int queue_index)
{
    return nic->ncs + queue_index;
}

J
Jason Wang 已提交
330 331
/* Return the NetClientState of the first queue (index 0) of @nic. */
NetClientState *qemu_get_queue(NICState *nic)
{
    return qemu_get_subqueue(nic, 0);
}

J
Jason Wang 已提交
335 336
/*
 * Recover the NICState that owns the NIC queue client @nc.
 *
 * Stepping back by @nc->queue_index yields queue 0; the NICState starts
 * @nc->info->size bytes before that, matching the layout produced by
 * qemu_new_nic().
 */
NICState *qemu_get_nic(NetClientState *nc)
{
    NetClientState *nc0 = nc - nc->queue_index;

    return (NICState *)((void *)nc0 - nc->info->size);
}

/* Return the opaque pointer stored in the NICState that owns @nc. */
void *qemu_get_nic_opaque(NetClientState *nc)
{
    return qemu_get_nic(nc)->opaque;
}

349
/*
 * Unlink @nc from the net_clients list and run the driver's cleanup
 * callback if it has one.  The structure itself is not freed.
 */
static void qemu_cleanup_net_client(NetClientState *nc)
{
    QTAILQ_REMOVE(&net_clients, nc, next);

    if (nc->info->cleanup) {
        nc->info->cleanup(nc);
    }
}
357

358
/*
 * Release everything owned by @nc: its incoming queue, the back-pointer
 * held by its peer, its name and model strings and, through the
 * destructor if one is set, the structure itself.
 */
static void qemu_free_net_client(NetClientState *nc)
{
    if (nc->incoming_queue) {
        qemu_del_net_queue(nc->incoming_queue);
    }
    if (nc->peer) {
        /* Make sure the peer does not keep pointing at us */
        nc->peer->peer = NULL;
    }
    g_free(nc->name);
    g_free(nc->model);
    if (nc->destructor) {
        nc->destructor(nc);
    }
}

373
/*
 * Delete a non-NIC net client together with all other non-NIC clients that
 * share its name.
 *
 * All filters attached to @nc are unparented first.  If the peer is a NIC,
 * the NIC's queues are marked link-down, the NIC is notified through
 * link_status_changed, and the clients are only cleaned up; they are freed
 * later by qemu_del_nic().  Otherwise each client is cleaned up and freed
 * here.
 */
void qemu_del_net_client(NetClientState *nc)
{
    NetClientState *ncs[MAX_QUEUE_NUM];
    int queues, i;
    NetFilterState *nf, *next;

    assert(nc->info->type != NET_CLIENT_DRIVER_NIC);

    /* If the NetClientState belongs to a multiqueue backend, we will change all
     * other NetClientStates also.
     */
    queues = qemu_find_net_clients_except(nc->name, ncs,
                                          NET_CLIENT_DRIVER_NIC,
                                          MAX_QUEUE_NUM);
    assert(queues != 0);

    QTAILQ_FOREACH_SAFE(nf, &nc->filters, next, next) {
        object_unparent(OBJECT(nf));
    }

    /* If there is a peer NIC, delete and cleanup client, but do not free. */
    if (nc->peer && nc->peer->info->type == NET_CLIENT_DRIVER_NIC) {
        NICState *nic = qemu_get_nic(nc->peer);
        if (nic->peer_deleted) {
            return;
        }
        nic->peer_deleted = true;

        for (i = 0; i < queues; i++) {
            ncs[i]->peer->link_down = true;
        }

        if (nc->peer->info->link_status_changed) {
            nc->peer->info->link_status_changed(nc->peer);
        }

        for (i = 0; i < queues; i++) {
            qemu_cleanup_net_client(ncs[i]);
        }

        return;
    }

    for (i = 0; i < queues; i++) {
        qemu_cleanup_net_client(ncs[i]);
        qemu_free_net_client(ncs[i]);
    }
}

/*
 * Tear down a NIC created by qemu_new_nic().
 *
 * The NIC's MAC address is handed to qemu_macaddr_set_free().  If the peer
 * was already deleted (peer_deleted set by qemu_del_net_client()), the
 * peers of all queues are freed now.  The queues are then cleaned up and
 * freed from the highest index down, and finally the NIC allocation is
 * released.
 */
void qemu_del_nic(NICState *nic)
{
    int i, queues = MAX(nic->conf->peers.queues, 1);

    qemu_macaddr_set_free(&nic->conf->macaddr);

    /* If this is a peer NIC and peer has already been deleted, free it now. */
    if (nic->peer_deleted) {
        for (i = 0; i < queues; i++) {
            qemu_free_net_client(qemu_get_subqueue(nic, i)->peer);
        }
    }

    for (i = queues - 1; i >= 0; i--) {
        NetClientState *nc = qemu_get_subqueue(nic, i);

        qemu_cleanup_net_client(nc);
        qemu_free_net_client(nc);
    }

    g_free(nic);
}

M
Mark McLoughlin 已提交
445 446
/*
 * Call @func(nic, @opaque) once for every NIC on the net_clients list.
 * Only the queue with index 0 triggers the callback, so a multiqueue NIC
 * is visited a single time.
 */
void qemu_foreach_nic(qemu_nic_foreach func, void *opaque)
{
    NetClientState *nc;

    QTAILQ_FOREACH(nc, &net_clients, next) {
        if (nc->info->type != NET_CLIENT_DRIVER_NIC) {
            continue;
        }
        if (nc->queue_index == 0) {
            func(qemu_get_nic(nc), opaque);
        }
    }
}

458
/*
 * Forward to the driver's has_ufo callback.  Returns false when @nc is
 * NULL or the driver does not implement the callback.
 */
bool qemu_has_ufo(NetClientState *nc)
{
    if (!nc || !nc->info->has_ufo) {
        return false;
    }

    return nc->info->has_ufo(nc);
}

467
/*
 * Forward to the driver's has_vnet_hdr callback.  Returns false when @nc
 * is NULL or the driver does not implement the callback.
 */
bool qemu_has_vnet_hdr(NetClientState *nc)
{
    if (!nc || !nc->info->has_vnet_hdr) {
        return false;
    }

    return nc->info->has_vnet_hdr(nc);
}

476
/*
 * Forward @len to the driver's has_vnet_hdr_len callback.  Returns false
 * when @nc is NULL or the driver does not implement the callback.
 */
bool qemu_has_vnet_hdr_len(NetClientState *nc, int len)
{
    if (!nc || !nc->info->has_vnet_hdr_len) {
        return false;
    }

    return nc->info->has_vnet_hdr_len(nc, len);
}

485
/*
 * Forward @enable to the driver's using_vnet_hdr callback.  Does nothing
 * when @nc is NULL or the driver does not implement the callback.
 */
void qemu_using_vnet_hdr(NetClientState *nc, bool enable)
{
    if (!nc || !nc->info->using_vnet_hdr) {
        return;
    }

    nc->info->using_vnet_hdr(nc, enable);
}

494
/*
 * Forward the offload settings to the driver's set_offload callback.  Does
 * nothing when @nc is NULL or the driver does not implement the callback.
 */
void qemu_set_offload(NetClientState *nc, int csum, int tso4, int tso6,
                      int ecn, int ufo)
{
    if (!nc || !nc->info->set_offload) {
        return;
    }

    nc->info->set_offload(nc, csum, tso4, tso6, ecn, ufo);
}

504
/*
 * Record @len in @nc->vnet_hdr_len and pass it to the driver's
 * set_vnet_hdr_len callback.  Does nothing, not even the recording, when
 * @nc is NULL or the driver does not implement the callback.
 */
void qemu_set_vnet_hdr_len(NetClientState *nc, int len)
{
    if (!nc || !nc->info->set_vnet_hdr_len) {
        return;
    }

    nc->vnet_hdr_len = len;
    nc->info->set_vnet_hdr_len(nc, len);
}

G
Greg Kurz 已提交
514 515
/*
 * When HOST_WORDS_BIGENDIAN is defined, forward @is_le to the driver's
 * set_vnet_le callback, returning -ENOSYS if @nc is NULL or the callback is
 * missing.  Otherwise nothing is done and 0 is returned.
 */
int qemu_set_vnet_le(NetClientState *nc, bool is_le)
{
#ifdef HOST_WORDS_BIGENDIAN
    if (!nc || !nc->info->set_vnet_le) {
        return -ENOSYS;
    }

    return nc->info->set_vnet_le(nc, is_le);
#else
    return 0;
#endif
}

/*
 * When HOST_WORDS_BIGENDIAN is defined nothing is done and 0 is returned.
 * Otherwise forward @is_be to the driver's set_vnet_be callback, returning
 * -ENOSYS if @nc is NULL or the callback is missing.
 */
int qemu_set_vnet_be(NetClientState *nc, bool is_be)
{
#ifdef HOST_WORDS_BIGENDIAN
    return 0;
#else
    if (!nc || !nc->info->set_vnet_be) {
        return -ENOSYS;
    }

    return nc->info->set_vnet_be(nc, is_be);
#endif
}

540
/*
 * Tell whether @sender may send a packet right now.
 *
 * Returns 0 while the VM is not running, when the peer has receive_disabled
 * set, or when the peer's can_receive callback exists and returns false.
 * Returns 1 otherwise, including when @sender has no peer.
 */
int qemu_can_send_packet(NetClientState *sender)
{
    int vm_running = runstate_is_running();

    if (!vm_running) {
        return 0;
    }

    if (!sender->peer) {
        return 1;
    }

    if (sender->peer->receive_disabled) {
        return 0;
    } else if (sender->peer->info->can_receive &&
               !sender->peer->info->can_receive(sender->peer)) {
        return 0;
    }
    return 1;
}

561 562 563 564 565 566 567 568 569 570 571
/*
 * Run a packet through the filters attached to @nc.
 *
 * For NET_FILTER_DIRECTION_TX the filter list is walked front to back, for
 * any other direction back to front.  The walk stops at the first filter
 * for which qemu_netfilter_receive() returns non-zero and that value is
 * returned; 0 is returned when every filter returned 0 or there are none.
 */
static ssize_t filter_receive_iov(NetClientState *nc,
                                  NetFilterDirection direction,
                                  NetClientState *sender,
                                  unsigned flags,
                                  const struct iovec *iov,
                                  int iovcnt,
                                  NetPacketSent *sent_cb)
{
    ssize_t ret = 0;
    NetFilterState *nf = NULL;

    if (direction == NET_FILTER_DIRECTION_TX) {
        QTAILQ_FOREACH(nf, &nc->filters, next) {
            ret = qemu_netfilter_receive(nf, direction, sender, flags, iov,
                                         iovcnt, sent_cb);
            if (ret) {
                return ret;
            }
        }
    } else {
        QTAILQ_FOREACH_REVERSE(nf, &nc->filters, NetFilterHead, next) {
            ret = qemu_netfilter_receive(nf, direction, sender, flags, iov,
                                         iovcnt, sent_cb);
            if (ret) {
                return ret;
            }
        }
    }

    return ret;
}

/*
 * Flat-buffer front end for filter_receive_iov(): wraps @data / @size in a
 * single-element iovec and passes everything else through unchanged.
 */
static ssize_t filter_receive(NetClientState *nc,
                              NetFilterDirection direction,
                              NetClientState *sender,
                              unsigned flags,
                              const uint8_t *data,
                              size_t size,
                              NetPacketSent *sent_cb)
{
    struct iovec vec;

    vec.iov_base = (void *)data;
    vec.iov_len = size;

    return filter_receive_iov(nc, direction, sender, flags, &vec, 1, sent_cb);
}

609
/*
 * Purge from the peer's incoming queue, via qemu_net_queue_purge(), the
 * packets associated with @nc.  Does nothing when @nc has no peer.
 */
void qemu_purge_queued_packets(NetClientState *nc)
{
    if (!nc->peer) {
        return;
    }

    qemu_net_queue_purge(nc->peer->incoming_queue, nc);
}

618 619
/*
 * Re-enable reception on @nc and flush its incoming queue.
 *
 * If the peer is a hub port, the hub is flushed first.  When the incoming
 * queue could not be flushed and @purge is true, what remains is purged.
 * qemu_notify_event() is called after a successful hub or queue flush.
 */
static
void qemu_flush_or_purge_queued_packets(NetClientState *nc, bool purge)
{
    nc->receive_disabled = 0;

    if (nc->peer && nc->peer->info->type == NET_CLIENT_DRIVER_HUBPORT) {
        if (net_hub_flush(nc->peer)) {
            qemu_notify_event();
        }
    }
    if (qemu_net_queue_flush(nc->incoming_queue)) {
        /* We emptied the queue successfully, signal to the IO thread to repoll
         * the file descriptor (for tap, for example).
         */
        qemu_notify_event();
    } else if (purge) {
        /* Unable to empty the queue, purge remaining packets */
        qemu_net_queue_purge(nc->incoming_queue, nc);
    }
}

639 640 641 642 643
/*
 * Flush the incoming queue of @nc without purging packets that could not
 * be delivered (purge argument false).
 */
void qemu_flush_queued_packets(NetClientState *nc)
{
    qemu_flush_or_purge_queued_packets(nc, false);
}

644
/*
 * Send a flat buffer from @sender to its peer.
 *
 * If the sender's link is down or it has no peer, @size is returned and
 * nothing else happens.  Otherwise the packet goes through the sender's
 * filters (TX direction) and then the peer's filters (RX direction); the
 * first non-zero filter result is returned.  If no filter returns
 * non-zero, the packet is handed to the peer's incoming queue and the
 * result of qemu_net_queue_send() is returned.
 *
 * The filter result is kept in a ssize_t to match filter_receive(); it was
 * previously narrowed to int.
 */
static ssize_t qemu_send_packet_async_with_flags(NetClientState *sender,
                                                 unsigned flags,
                                                 const uint8_t *buf, int size,
                                                 NetPacketSent *sent_cb)
{
    NetQueue *queue;
    ssize_t ret;

#ifdef DEBUG_NET
    printf("qemu_send_packet_async:\n");
    qemu_hexdump((const char *)buf, stdout, "net", size);
#endif

    if (sender->link_down || !sender->peer) {
        return size;
    }

    /* Let filters handle the packet first */
    ret = filter_receive(sender, NET_FILTER_DIRECTION_TX,
                         sender, flags, buf, size, sent_cb);
    if (ret) {
        return ret;
    }

    ret = filter_receive(sender->peer, NET_FILTER_DIRECTION_RX,
                         sender, flags, buf, size, sent_cb);
    if (ret) {
        return ret;
    }

    queue = sender->peer->incoming_queue;

    return qemu_net_queue_send(queue, sender, flags, buf, size, sent_cb);
}

679
/*
 * Send a flat buffer from @sender with QEMU_NET_PACKET_FLAG_NONE; @sent_cb
 * is passed on unchanged.
 */
ssize_t qemu_send_packet_async(NetClientState *sender,
                               const uint8_t *buf, int size,
                               NetPacketSent *sent_cb)
{
    return qemu_send_packet_async_with_flags(sender, QEMU_NET_PACKET_FLAG_NONE,
                                             buf, size, sent_cb);
}

687
/*
 * Send a flat buffer from @nc with no completion callback; the result of
 * the send is discarded.
 */
void qemu_send_packet(NetClientState *nc, const uint8_t *buf, int size)
{
    qemu_send_packet_async(nc, buf, size, NULL);
}

692
/*
 * Send a flat buffer from @nc with QEMU_NET_PACKET_FLAG_RAW set and no
 * completion callback.
 */
ssize_t qemu_send_packet_raw(NetClientState *nc, const uint8_t *buf, int size)
{
    return qemu_send_packet_async_with_flags(nc, QEMU_NET_PACKET_FLAG_RAW,
                                             buf, size, NULL);
}

698
/*
 * Deliver an iovec to a client through its flat-buffer receive callbacks.
 *
 * A single-element iovec is passed through directly.  Otherwise the
 * elements are copied into a temporary buffer; -1 is returned without
 * delivering anything if the total size exceeds NET_BUFSIZE.  The
 * receive_raw callback is used when QEMU_NET_PACKET_FLAG_RAW is set and the
 * driver provides it, otherwise receive is used.
 *
 * Returns the callback's result.
 */
static ssize_t nc_sendv_compat(NetClientState *nc, const struct iovec *iov,
                               int iovcnt, unsigned flags)
{
    uint8_t *buf = NULL;
    uint8_t *buffer;
    size_t offset;
    ssize_t ret;

    if (iovcnt == 1) {
        buffer = iov[0].iov_base;
        offset = iov[0].iov_len;
    } else {
        offset = iov_size(iov, iovcnt);
        if (offset > NET_BUFSIZE) {
            return -1;
        }
        buf = g_malloc(offset);
        buffer = buf;
        offset = iov_to_buf(iov, iovcnt, 0, buf, offset);
    }

    if ((flags & QEMU_NET_PACKET_FLAG_RAW) && nc->info->receive_raw) {
        ret = nc->info->receive_raw(nc, buffer, offset);
    } else {
        ret = nc->info->receive(nc, buffer, offset);
    }

    /* buf is NULL in the single-element case, so this is then a no-op */
    g_free(buf);
    return ret;
}

729 730 731 732 733
/*
 * Deliver a packet to the client passed as @opaque; this is the callback
 * given to qemu_new_net_queue() by qemu_net_client_setup().
 *
 * If the client's link is down, the total iovec size is returned without
 * delivering.  If reception is disabled, 0 is returned.  Otherwise the
 * driver's receive_iov callback is used when it exists and
 * QEMU_NET_PACKET_FLAG_RAW is not set, else nc_sendv_compat().  A result
 * of 0 sets receive_disabled on the client.
 *
 * The result is kept in a ssize_t to match the callbacks' return type; it
 * was previously narrowed to int.
 */
ssize_t qemu_deliver_packet_iov(NetClientState *sender,
                                unsigned flags,
                                const struct iovec *iov,
                                int iovcnt,
                                void *opaque)
{
    NetClientState *nc = opaque;
    ssize_t ret;

    if (nc->link_down) {
        return iov_size(iov, iovcnt);
    }

    if (nc->receive_disabled) {
        return 0;
    }

    if (nc->info->receive_iov && !(flags & QEMU_NET_PACKET_FLAG_RAW)) {
        ret = nc->info->receive_iov(nc, iov, iovcnt);
    } else {
        ret = nc_sendv_compat(nc, iov, iovcnt, flags);
    }

    if (ret == 0) {
        nc->receive_disabled = 1;
    }

    return ret;
}

759
/*
 * Send an iovec from @sender to its peer with QEMU_NET_PACKET_FLAG_NONE.
 *
 * If the sender's link is down or it has no peer, the total iovec size is
 * returned and nothing else happens.  Otherwise the packet goes through
 * the sender's filters (TX direction) and then the peer's filters (RX
 * direction); the first non-zero filter result is returned.  If no filter
 * returns non-zero, the packet is handed to the peer's incoming queue and
 * the result of qemu_net_queue_send_iov() is returned.
 *
 * The filter result is kept in a ssize_t to match filter_receive_iov(); it
 * was previously narrowed to int.
 */
ssize_t qemu_sendv_packet_async(NetClientState *sender,
                                const struct iovec *iov, int iovcnt,
                                NetPacketSent *sent_cb)
{
    NetQueue *queue;
    ssize_t ret;

    if (sender->link_down || !sender->peer) {
        return iov_size(iov, iovcnt);
    }

    /* Let filters handle the packet first */
    ret = filter_receive_iov(sender, NET_FILTER_DIRECTION_TX, sender,
                             QEMU_NET_PACKET_FLAG_NONE, iov, iovcnt, sent_cb);
    if (ret) {
        return ret;
    }

    ret = filter_receive_iov(sender->peer, NET_FILTER_DIRECTION_RX, sender,
                             QEMU_NET_PACKET_FLAG_NONE, iov, iovcnt, sent_cb);
    if (ret) {
        return ret;
    }

    queue = sender->peer->incoming_queue;

    return qemu_net_queue_send_iov(queue, sender,
                                   QEMU_NET_PACKET_FLAG_NONE,
                                   iov, iovcnt, sent_cb);
}

790
ssize_t
791
qemu_sendv_packet(NetClientState *nc, const struct iovec *iov, int iovcnt)
792
{
793
    return qemu_sendv_packet_async(nc, iov, iovcnt, NULL);
794 795
}

796
NetClientState *qemu_find_netdev(const char *id)
M
Mark McLoughlin 已提交
797
{
798
    NetClientState *nc;
M
Mark McLoughlin 已提交
799

800
    QTAILQ_FOREACH(nc, &net_clients, next) {
801
        if (nc->info->type == NET_CLIENT_DRIVER_NIC)
802
            continue;
803 804
        if (!strcmp(nc->name, id)) {
            return nc;
M
Mark McLoughlin 已提交
805 806 807 808 809 810
        }
    }

    return NULL;
}

811
int qemu_find_net_clients_except(const char *id, NetClientState **ncs,
812
                                 NetClientDriver type, int max)
813 814 815 816 817 818 819 820
{
    NetClientState *nc;
    int ret = 0;

    QTAILQ_FOREACH(nc, &net_clients, next) {
        if (nc->info->type == type) {
            continue;
        }
821
        if (!id || !strcmp(nc->name, id)) {
822 823 824 825 826 827 828 829 830 831
            if (ret < max) {
                ncs[ret] = nc;
            }
            ret++;
        }
    }

    return ret;
}

832 833 834 835 836 837 838 839 840 841
/*
 * Return the index of the first nd_table entry whose "used" field is not
 * set, or -1 when all MAX_NICS entries are in use.
 */
static int nic_get_free_idx(void)
{
    int slot = 0;

    while (slot < MAX_NICS) {
        if (!nd_table[slot].used) {
            return slot;
        }
        slot++;
    }

    return -1;
}

842 843 844 845
/*
 * If @arg is a help option, print the NULL-terminated @models list to
 * stderr as a comma-separated line and return 1.  Return 0 without
 * printing when @arg is NULL or not a help option.
 */
int qemu_show_nic_models(const char *arg, const char *const *models)
{
    int i;

    if (!arg || !is_help_option(arg)) {
        return 0;
    }

    fprintf(stderr, "qemu: Supported NIC models: ");
    for (i = 0 ; models[i]; i++) {
        /* A comma follows every entry but the last, which ends the line */
        fprintf(stderr, "%s%c", models[i], models[i+1] ? ',' : '\n');
    }
    return 1;
}

856 857 858 859 860 861 862
/*
 * Check @nd against a single supported model.
 *
 * Exits with status 0 after printing the model list if @nd->model is a
 * help option, and with status 1 if qemu_find_nic_model() rejects the
 * model.  Returns normally otherwise.
 */
void qemu_check_nic_model(NICInfo *nd, const char *model)
{
    const char *models[2];

    models[0] = model;
    models[1] = NULL;

    if (qemu_show_nic_models(nd->model, models)) {
        exit(0);
    }
    if (qemu_find_nic_model(nd, models, model) < 0) {
        exit(1);
    }
}

869 870
/*
 * Look up @nd->model in the NULL-terminated @models list.
 *
 * When @nd->model is NULL it is first set to a copy of @default_model.
 * Returns the index of the matching entry, or -1 after reporting an error
 * when the model is not in the list.
 */
int qemu_find_nic_model(NICInfo *nd, const char * const *models,
                        const char *default_model)
{
    int i;

    if (!nd->model) {
        nd->model = g_strdup(default_model);
    }

    for (i = 0 ; models[i]; i++) {
        if (strcmp(nd->model, models[i]) == 0) {
            return i;
        }
    }

    error_report("Unsupported NIC model: %s", nd->model);
    return -1;
}

886
static int net_init_nic(const Netdev *netdev, const char *name,
887
                        NetClientState *peer, Error **errp)
888 889 890
{
    int idx;
    NICInfo *nd;
891 892
    const NetLegacyNicOptions *nic;

893 894
    assert(netdev->type == NET_CLIENT_DRIVER_NIC);
    nic = &netdev->u.nic;
895 896 897

    idx = nic_get_free_idx();
    if (idx == -1 || nb_nics >= MAX_NICS) {
898
        error_setg(errp, "too many NICs");
899 900 901 902 903 904 905
        return -1;
    }

    nd = &nd_table[idx];

    memset(nd, 0, sizeof(*nd));

906 907
    if (nic->has_netdev) {
        nd->netdev = qemu_find_netdev(nic->netdev);
M
Mark McLoughlin 已提交
908
        if (!nd->netdev) {
909
            error_setg(errp, "netdev '%s' not found", nic->netdev);
M
Mark McLoughlin 已提交
910 911 912
            return -1;
        }
    } else {
913 914
        assert(peer);
        nd->netdev = peer;
M
Mark McLoughlin 已提交
915
    }
916
    nd->name = g_strdup(name);
917 918
    if (nic->has_model) {
        nd->model = g_strdup(nic->model);
919
    }
920 921
    if (nic->has_addr) {
        nd->devaddr = g_strdup(nic->addr);
922 923
    }

924 925
    if (nic->has_macaddr &&
        net_parse_macaddr(nd->macaddr.a, nic->macaddr) < 0) {
926
        error_setg(errp, "invalid syntax for ethernet address");
927 928
        return -1;
    }
929 930
    if (nic->has_macaddr &&
        is_multicast_ether_addr(nd->macaddr.a)) {
931 932
        error_setg(errp,
                   "NIC cannot have multicast MAC address (odd 1st byte)");
933 934
        return -1;
    }
935
    qemu_macaddr_default_if_unset(&nd->macaddr);
936

937 938
    if (nic->has_vectors) {
        if (nic->vectors > 0x7ffffff) {
939
            error_setg(errp, "invalid # of vectors: %"PRIu32, nic->vectors);
940 941 942 943 944
            return -1;
        }
        nd->nvectors = nic->vectors;
    } else {
        nd->nvectors = DEV_NVECTORS_UNSPECIFIED;
945 946 947 948 949 950 951 952
    }

    nd->used = 1;
    nb_nics++;

    return idx;
}

953

954
static int (* const net_client_init_fun[NET_CLIENT_DRIVER__MAX])(
955
    const Netdev *netdev,
956
    const char *name,
957
    NetClientState *peer, Error **errp) = {
958
        [NET_CLIENT_DRIVER_NIC]       = net_init_nic,
M
Mark McLoughlin 已提交
959
#ifdef CONFIG_SLIRP
960
        [NET_CLIENT_DRIVER_USER]      = net_init_slirp,
961
#endif
962 963
        [NET_CLIENT_DRIVER_TAP]       = net_init_tap,
        [NET_CLIENT_DRIVER_SOCKET]    = net_init_socket,
M
Mark McLoughlin 已提交
964
#ifdef CONFIG_VDE
965
        [NET_CLIENT_DRIVER_VDE]       = net_init_vde,
966 967
#endif
#ifdef CONFIG_NETMAP
968
        [NET_CLIENT_DRIVER_NETMAP]    = net_init_netmap,
M
Mark McLoughlin 已提交
969
#endif
970
        [NET_CLIENT_DRIVER_DUMP]      = net_init_dump,
971
#ifdef CONFIG_NET_BRIDGE
972
        [NET_CLIENT_DRIVER_BRIDGE]    = net_init_bridge,
973
#endif
974
        [NET_CLIENT_DRIVER_HUBPORT]   = net_init_hubport,
975
#ifdef CONFIG_VHOST_NET_USED
976
        [NET_CLIENT_DRIVER_VHOST_USER] = net_init_vhost_user,
977
#endif
978
#ifdef CONFIG_L2TPV3
979
        [NET_CLIENT_DRIVER_L2TPV3]    = net_init_l2tpv3,
A
Anton Ivanov 已提交
980
#endif
981 982
};

983

E
Eric Blake 已提交
984
static int net_client_init1(const void *object, bool is_netdev, Error **errp)
985
{
986 987
    Netdev legacy = {0};
    const Netdev *netdev;
988
    const char *name;
989
    NetClientState *peer = NULL;
990
    static bool vlan_warned;
991

992
    if (is_netdev) {
993
        netdev = object;
994
        name = netdev->id;
995

996 997 998
        if (netdev->type == NET_CLIENT_DRIVER_DUMP ||
            netdev->type == NET_CLIENT_DRIVER_NIC ||
            !net_client_init_fun[netdev->type]) {
999 1000
            error_setg(errp, QERR_INVALID_PARAMETER_VALUE, "type",
                       "a netdev backend type");
M
Mark McLoughlin 已提交
1001 1002
            return -1;
        }
1003
    } else {
1004
        const NetLegacy *net = object;
1005
        const NetLegacyOptions *opts = net->opts;
1006 1007
        legacy.id = net->id;
        netdev = &legacy;
1008
        /* missing optional values have been initialized to "all bits zero" */
1009
        name = net->has_id ? net->id : net->name;
1010

1011 1012
        /* Map the old options to the new flat type */
        switch (opts->type) {
1013
        case NET_LEGACY_OPTIONS_TYPE_NONE:
1014
            return 0; /* nothing to do */
1015
        case NET_LEGACY_OPTIONS_TYPE_NIC:
1016
            legacy.type = NET_CLIENT_DRIVER_NIC;
1017
            legacy.u.nic = opts->u.nic;
1018
            break;
1019
        case NET_LEGACY_OPTIONS_TYPE_USER:
1020
            legacy.type = NET_CLIENT_DRIVER_USER;
1021
            legacy.u.user = opts->u.user;
1022
            break;
1023
        case NET_LEGACY_OPTIONS_TYPE_TAP:
1024
            legacy.type = NET_CLIENT_DRIVER_TAP;
1025
            legacy.u.tap = opts->u.tap;
1026
            break;
1027
        case NET_LEGACY_OPTIONS_TYPE_L2TPV3:
1028
            legacy.type = NET_CLIENT_DRIVER_L2TPV3;
1029
            legacy.u.l2tpv3 = opts->u.l2tpv3;
1030
            break;
1031
        case NET_LEGACY_OPTIONS_TYPE_SOCKET:
1032
            legacy.type = NET_CLIENT_DRIVER_SOCKET;
1033
            legacy.u.socket = opts->u.socket;
1034
            break;
1035
        case NET_LEGACY_OPTIONS_TYPE_VDE:
1036
            legacy.type = NET_CLIENT_DRIVER_VDE;
1037
            legacy.u.vde = opts->u.vde;
1038
            break;
1039
        case NET_LEGACY_OPTIONS_TYPE_DUMP:
1040
            legacy.type = NET_CLIENT_DRIVER_DUMP;
1041
            legacy.u.dump = opts->u.dump;
1042
            break;
1043
        case NET_LEGACY_OPTIONS_TYPE_BRIDGE:
1044
            legacy.type = NET_CLIENT_DRIVER_BRIDGE;
1045
            legacy.u.bridge = opts->u.bridge;
1046
            break;
1047
        case NET_LEGACY_OPTIONS_TYPE_NETMAP:
1048
            legacy.type = NET_CLIENT_DRIVER_NETMAP;
1049
            legacy.u.netmap = opts->u.netmap;
1050
            break;
1051
        case NET_LEGACY_OPTIONS_TYPE_VHOST_USER:
1052
            legacy.type = NET_CLIENT_DRIVER_VHOST_USER;
1053
            legacy.u.vhost_user = opts->u.vhost_user;
1054 1055 1056
            break;
        default:
            abort();
1057
        }
1058

1059
        if (!net_client_init_fun[netdev->type]) {
1060 1061 1062 1063 1064
            error_setg(errp, QERR_INVALID_PARAMETER_VALUE, "type",
                       "a net backend type (maybe it is not compiled "
                       "into this binary)");
            return -1;
        }
M
Mark McLoughlin 已提交
1065

1066
        /* Do not add to a vlan if it's a nic with a netdev= parameter. */
1067
        if (netdev->type != NET_CLIENT_DRIVER_NIC ||
1068
            !opts->u.nic.has_netdev) {
1069
            peer = net_hub_add_port(net->has_vlan ? net->vlan : 0, NULL, NULL);
1070
        }
1071 1072 1073 1074 1075

        if (net->has_vlan && !vlan_warned) {
            error_report("'vlan' is deprecated. Please use 'netdev' instead.");
            vlan_warned = true;
        }
1076
    }
1077

1078
    if (net_client_init_fun[netdev->type](netdev, name, peer, errp) < 0) {
1079 1080 1081
        /* FIXME drop when all init functions store an Error */
        if (errp && !*errp) {
            error_setg(errp, QERR_DEVICE_INIT_FAILED,
1082
                       NetClientDriver_str(netdev->type));
M
Mark McLoughlin 已提交
1083
        }
1084
        return -1;
M
Mark McLoughlin 已提交
1085
    }
1086 1087 1088
    return 0;
}

M
Mark McLoughlin 已提交
1089

E
Eric Blake 已提交
1090
/*
 * Build a net client from a QemuOpts set.
 *
 * @opts:      the option set; the convenience option "ipv6-net" is
 *             rewritten in place into "ipv6-prefix"/"ipv6-prefixlen"
 * @is_netdev: true for "-netdev" style options, false for legacy "-net"
 * @errp:      receives the failure reason
 *
 * Returns the result of net_client_init1() on success and -1 on failure.
 * A malformed prefix length in "ipv6-net" is a hard failure: nothing is
 * visited or created after it has been detected.
 */
int net_client_init(QemuOpts *opts, bool is_netdev, Error **errp)
{
    void *object = NULL;
    Error *err = NULL;
    int ret = -1;
    Visitor *v = opts_visitor_new(opts);

    {
        /* Parse convenience option format ipv6-net=fec0::0[/64] */
        const char *ip6_net = qemu_opt_get(opts, "ipv6-net");

        if (ip6_net) {
            char buf[strlen(ip6_net) + 1];

            if (get_str_sep(buf, sizeof(buf), &ip6_net, '/') < 0) {
                /* Default 64bit prefix length.  */
                qemu_opt_set(opts, "ipv6-prefix", ip6_net, &error_abort);
                qemu_opt_set_number(opts, "ipv6-prefixlen", 64, &error_abort);
            } else {
                /* User-specified prefix length.  */
                unsigned long len;

                qemu_opt_set(opts, "ipv6-prefix", buf, &error_abort);

                if (qemu_strtoul(ip6_net, NULL, 10, &len)) {
                    /*
                     * Record the error locally and bail out, so that no
                     * client is created from half-converted options.
                     */
                    error_setg(&err, QERR_INVALID_PARAMETER_VALUE,
                               "ipv6-prefix", "a number");
                    goto out;
                }
                qemu_opt_set_number(opts, "ipv6-prefixlen", len,
                                    &error_abort);
            }
            qemu_opt_unset(opts, "ipv6-net");
        }
    }

    if (is_netdev) {
        visit_type_Netdev(v, NULL, (Netdev **)&object, &err);
    } else {
        visit_type_NetLegacy(v, NULL, (NetLegacy **)&object, &err);
    }

    if (!err) {
        ret = net_client_init1(object, is_netdev, &err);
    }

    if (is_netdev) {
        qapi_free_Netdev(object);
    } else {
        qapi_free_NetLegacy(object);
    }

out:
    error_propagate(errp, err);
    visit_free(v);
    return ret;
}

1149

1150 1151 1152
static int net_host_check_device(const char *device)
{
    int i;
1153 1154 1155
    for (i = 0; host_net_devices[i]; i++) {
        if (!strncmp(host_net_devices[i], device,
                     strlen(host_net_devices[i]))) {
1156
            return 1;
1157
        }
1158 1159 1160 1161 1162
    }

    return 0;
}

1163
/*
 * HMP handler for the deprecated "host_net_add" command.
 *
 * Reads "device" (required) and "opts" (optional) from @qdict, parses
 * the options into the "net" option group, forces "type" to the device
 * name and creates the client through the legacy path.
 *
 * If creation fails, the freshly parsed option set is deleted again so
 * that it does not linger in the "net" group (same policy as
 * qmp_netdev_add()).
 */
void hmp_host_net_add(Monitor *mon, const QDict *qdict)
{
    const char *device = qdict_get_str(qdict, "device");
    const char *opts_str = qdict_get_try_str(qdict, "opts");
    Error *local_err = NULL;
    QemuOpts *opts;
    static bool warned;

    /* The deprecation notice is printed once, and never under qtest. */
    if (!warned && !qtest_enabled()) {
        error_report("host_net_add is deprecated, use netdev_add instead");
        warned = true;
    }

    if (!net_host_check_device(device)) {
        monitor_printf(mon, "invalid host network device %s\n", device);
        return;
    }

    opts = qemu_opts_parse_noisily(qemu_find_opts("net"),
                                   opts_str ? opts_str : "", false);
    if (!opts) {
        return;
    }

    qemu_opt_set(opts, "type", device, &error_abort);

    net_client_init(opts, false, &local_err);
    if (local_err) {
        error_report_err(local_err);
        monitor_printf(mon, "adding host network device %s failed\n", device);
        /* Drop the options of the client that was never created. */
        qemu_opts_del(opts);
    }
}

1196
/*
 * HMP handler for the deprecated "host_net_remove" command.
 *
 * Looks up the client called "device" on hub "vlan_id" (both taken from
 * @qdict).  NICs are refused.  Otherwise the client and its peer are
 * deleted, followed by the matching entry of the "net" option group.
 */
void hmp_host_net_remove(Monitor *mon, const QDict *qdict)
{
    static bool warned;
    NetClientState *nc;
    int vlan_id = qdict_get_int(qdict, "vlan_id");
    const char *device = qdict_get_str(qdict, "device");

    /* One-time deprecation notice, suppressed under qtest. */
    if (!(warned || qtest_enabled())) {
        error_report("host_net_remove is deprecated, use netdev_del instead");
        warned = true;
    }

    nc = net_hub_find_client_by_name(vlan_id, device);
    if (nc == NULL) {
        error_report("Host network device '%s' on hub '%d' not found",
                     device, vlan_id);
        return;
    }

    if (nc->info->type == NET_CLIENT_DRIVER_NIC) {
        error_report("invalid host network device '%s'", device);
        return;
    }

    /* The peer goes first, then the client itself. */
    qemu_del_net_client(nc->peer);
    qemu_del_net_client(nc);

    qemu_opts_del(qemu_opts_find(qemu_find_opts("net"), device));
}

L
Luiz Capitulino 已提交
1224 1225
/*
 * Create a "-netdev" style backend from @opts.
 *
 * Thin wrapper around net_client_init() with is_netdev set; the return
 * value is dropped, failures are reported through @errp only.
 */
void netdev_add(QemuOpts *opts, Error **errp)
{
    net_client_init(opts, true, errp);
}

1229
/*
 * QMP handler for "netdev_add".
 *
 * Converts @qdict into an option set of the "netdev" group and creates
 * the backend from it.  If creation fails the option set is deleted
 * again.  @ret is not written by this function.
 */
void qmp_netdev_add(QDict *qdict, QObject **ret, Error **errp)
{
    Error *local_err = NULL;
    QemuOptsList *opts_list;
    QemuOpts *opts;

    opts_list = qemu_find_opts_err("netdev", &local_err);
    if (!local_err) {
        opts = qemu_opts_from_qdict(opts_list, qdict, &local_err);
        if (!local_err) {
            netdev_add(opts, &local_err);
            if (local_err) {
                /* Creation failed: do not keep the options around. */
                qemu_opts_del(opts);
            }
        }
    }

    /* error_propagate() is a no-op when nothing went wrong. */
    error_propagate(errp, local_err);
}

L
Luiz Capitulino 已提交
1255
/*
 * QMP handler for "netdev_del".
 *
 * Fails with DeviceNotFound when no client is called @id, and with a
 * generic error when the client has no entry in the "netdev" option
 * group.  Otherwise the client and then its option set are deleted.
 */
void qmp_netdev_del(const char *id, Error **errp)
{
    QemuOpts *opts;
    NetClientState *nc = qemu_find_netdev(id);

    if (nc == NULL) {
        error_set(errp, ERROR_CLASS_DEVICE_NOT_FOUND,
                  "Device '%s' not found", id);
        return;
    }

    opts = qemu_opts_find(qemu_find_opts_err("netdev", NULL), id);
    if (opts == NULL) {
        error_setg(errp, "Device '%s' is not a netdev", id);
        return;
    }

    qemu_del_net_client(nc);
    qemu_opts_del(opts);
}

1277 1278 1279 1280 1281
/*
 * Print every property of @nf except "type" to @mon as ",name=value",
 * followed by a newline.
 *
 * Each value is rendered through a fresh string output visitor; the
 * resulting string is freed after printing.
 */
static void netfilter_print_info(Monitor *mon, NetFilterState *nf)
{
    ObjectPropertyIterator iter;
    ObjectProperty *prop;
    Visitor *v;
    char *str;

    /* generate info str */
    object_property_iter_init(&iter, OBJECT(nf));
    for (;;) {
        prop = object_property_iter_next(&iter);
        if (!prop) {
            break;
        }
        if (strcmp(prop->name, "type") == 0) {
            continue;
        }

        v = string_output_visitor_new(false, &str);
        object_property_get(OBJECT(nf), v, prop->name, NULL);
        visit_complete(v, &str);
        visit_free(v);

        monitor_printf(mon, ",%s=%s", prop->name, str);
        g_free(str);
    }
    monitor_printf(mon, "\n");
}

1300
/*
 * Print a one-line summary of @nc (name, queue index, driver type and
 * info string) to @mon, followed by one line per attached filter.
 */
void print_net_client(Monitor *mon, NetClientState *nc)
{
    NetFilterState *nf;

    monitor_printf(mon, "%s: index=%d,type=%s,%s\n",
                   nc->name, nc->queue_index,
                   NetClientDriver_str(nc->info->type), nc->info_str);

    /* Without filters there is nothing more to print. */
    if (QTAILQ_EMPTY(&nc->filters)) {
        return;
    }

    monitor_printf(mon, "filters:\n");
    QTAILQ_FOREACH(nf, &nc->filters, next) {
        char *path = object_get_canonical_path_component(OBJECT(nf));

        monitor_printf(mon, "  - %s: type=%s", path,
                       object_get_typename(OBJECT(nf)));
        /* Appends the filter properties and the closing newline. */
        netfilter_print_info(mon, nf);
        g_free(path);
    }
}

1321 1322 1323 1324 1325 1326 1327 1328 1329 1330 1331 1332 1333 1334 1335
/*
 * QMP handler for "query-rx-filter".
 *
 * @has_name/@name: when set, only the client called @name is queried
 *                  and every reason for skipping it becomes an error
 * @errp:           receives the failure reason
 *
 * Walks net_clients and collects the rx-filter description of every NIC
 * that provides a query_rx_filter callback.  Only queue 0 is queried.
 *
 * Returns the list of collected entries, or NULL when nothing was
 * collected or an error was raised.
 */
RxFilterInfoList *qmp_query_rx_filter(bool has_name, const char *name,
                                      Error **errp)
{
    RxFilterInfoList *filter_list = NULL;
    RxFilterInfoList **tail = &filter_list;
    NetClientState *nc;

    QTAILQ_FOREACH(nc, &net_clients, next) {
        if (has_name && strcmp(nc->name, name) != 0) {
            continue;
        }

        /* only query rx-filter information of NIC */
        if (nc->info->type != NET_CLIENT_DRIVER_NIC) {
            if (!has_name) {
                continue;
            }
            error_setg(errp, "net client(%s) isn't a NIC", name);
            return NULL;
        }

        /* only query information on queue 0 since the info is per nic,
         * not per queue
         */
        if (nc->queue_index != 0) {
            continue;
        }

        if (!nc->info->query_rx_filter) {
            if (has_name) {
                error_setg(errp, "net client(%s) doesn't support"
                           " rx-filter querying", name);
                return NULL;
            }
        } else {
            RxFilterInfo *info = nc->info->query_rx_filter(nc);
            RxFilterInfoList *entry = g_malloc0(sizeof(*entry));

            entry->value = info;
            /* Append at the tail so the list keeps iteration order. */
            *tail = entry;
            tail = &entry->next;
        }

        /* A named query stops at the first client it processed. */
        if (has_name) {
            break;
        }
    }

    if (has_name && filter_list == NULL) {
        error_setg(errp, "invalid net client name: %s", name);
    }

    return filter_list;
}

1379
/*
 * HMP handler for "info network".
 *
 * Prints the hub overview first, then every client of net_clients for
 * which net_hub_id_for_client() does not return 0.  A NIC is followed
 * by its peer on a " \ " continuation line; a non-NIC client is printed
 * only when it has no peer.
 */
void hmp_info_network(Monitor *mon, const QDict *qdict)
{
    NetClientState *nc;

    net_hub_info(mon);

    QTAILQ_FOREACH(nc, &net_clients, next) {
        NetClientState *peer = nc->peer;
        NetClientDriver type = nc->info->type;

        /* Skip if already printed in hub info */
        if (net_hub_id_for_client(nc, NULL) == 0) {
            continue;
        }

        if (type == NET_CLIENT_DRIVER_NIC) {
            print_net_client(mon, nc);
            if (peer) {
                monitor_printf(mon, " \\ ");
                print_net_client(mon, peer);
            }
        } else if (!peer) {
            print_net_client(mon, nc);
        } /* else it's a netdev connected to a NIC, printed with the NIC */
    }
}

L
Luiz Capitulino 已提交
1405
/*
 * QMP handler for "set_link".
 *
 * Sets the link state of every queue of the client called @name, then
 * calls the link_status_changed callback of the first queue and of its
 * peer, where present.  The peer's own link state is only changed when
 * the peer is a NIC.
 *
 * Fails with DeviceNotFound when no client matches @name.
 */
void qmp_set_link(const char *name, bool up, Error **errp)
{
    NetClientState *ncs[MAX_QUEUE_NUM];
    NetClientState *first;
    NetClientState *peer;
    int nqueues;
    int q;

    nqueues = qemu_find_net_clients_except(name, ncs,
                                           NET_CLIENT_DRIVER__MAX,
                                           MAX_QUEUE_NUM);
    if (nqueues == 0) {
        error_set(errp, ERROR_CLASS_DEVICE_NOT_FOUND,
                  "Device '%s' not found", name);
        return;
    }
    first = ncs[0];

    for (q = 0; q < nqueues; q++) {
        ncs[q]->link_down = !up;
    }

    if (first->info->link_status_changed) {
        first->info->link_status_changed(first);
    }

    peer = first->peer;
    if (!peer) {
        return;
    }

    /* Change peer link only if the peer is NIC and then notify peer.
     * If the peer is a HUBPORT or a backend, we do not change the
     * link status.
     *
     * This behavior is compatible with qemu vlans where there could be
     * multiple clients that can still communicate with each other in
     * disconnected mode. For now maintain this compatibility.
     */
    if (peer->info->type == NET_CLIENT_DRIVER_NIC) {
        for (q = 0; q < nqueues; q++) {
            ncs[q]->peer->link_down = !up;
        }
    }
    if (peer->info->link_status_changed) {
        peer->info->link_status_changed(peer);
    }
}

1450 1451 1452
/*
 * VM run-state change callback (registered in net_init_clients()).
 *
 * When the VM starts running, queued packets of each peer are flushed
 * for every client that can currently send.  When it stops, the queued
 * packets of every client are flushed or purged.
 */
static void net_vm_change_state_handler(void *opaque, int running,
                                        RunState state)
{
    NetClientState *nc;
    NetClientState *next_nc;

    if (!running) {
        /* Complete all queued packets, to guarantee we don't modify
         * state later when VM is not running.
         */
        QTAILQ_FOREACH_SAFE(nc, &net_clients, next, next_nc) {
            qemu_flush_or_purge_queued_packets(nc, true);
        }
        return;
    }

    /* Flush queued packets and wake up backends. */
    QTAILQ_FOREACH_SAFE(nc, &net_clients, next, next_nc) {
        if (nc->peer && qemu_can_send_packet(nc)) {
            qemu_flush_queued_packets(nc->peer);
        }
    }
}

1471 1472
void net_cleanup(void)
{
J
Jason Wang 已提交
1473
    NetClientState *nc;
1474

J
Jason Wang 已提交
1475 1476 1477 1478 1479
    /* We may del multiple entries during qemu_del_net_client(),
     * so QTAILQ_FOREACH_SAFE() is also not safe here.
     */
    while (!QTAILQ_EMPTY(&net_clients)) {
        nc = QTAILQ_FIRST(&net_clients);
1480
        if (nc->info->type == NET_CLIENT_DRIVER_NIC) {
J
Jason Wang 已提交
1481 1482 1483 1484
            qemu_del_nic(qemu_get_nic(nc));
        } else {
            qemu_del_net_client(nc);
        }
1485
    }
1486 1487

    qemu_del_vm_change_state_handler(net_change_state_entry);
1488 1489
}

1490
void net_check_clients(void)
1491
{
1492
    NetClientState *nc;
1493
    int i;
1494

1495
    net_hub_check_clients();
1496

1497 1498
    QTAILQ_FOREACH(nc, &net_clients, next) {
        if (!nc->peer) {
1499
            warn_report("%s %s has no peer",
A
Alistair Francis 已提交
1500 1501 1502
                        nc->info->type == NET_CLIENT_DRIVER_NIC
                        ? "nic" : "netdev",
                        nc->name);
1503 1504
        }
    }
1505 1506 1507 1508 1509 1510 1511 1512

    /* Check that all NICs requested via -net nic actually got created.
     * NICs created via -device don't need to be checked here because
     * they are always instantiated.
     */
    for (i = 0; i < MAX_NICS; i++) {
        NICInfo *nd = &nd_table[i];
        if (nd->used && !nd->instantiated) {
1513 1514 1515 1516
            warn_report("requested NIC (%s, model %s) "
                        "was not created (not supported by this machine?)",
                        nd->name ? nd->name : "anonymous",
                        nd->model ? nd->model : "unspecified");
1517 1518
        }
    }
1519
}
1520

1521
/*
 * qemu_opts_foreach() callback for the legacy "net" option group.
 *
 * Errors are reported right here; @errp is not used.
 * Returns 0 on success and -1 when client creation reported an error.
 */
static int net_init_client(void *dummy, QemuOpts *opts, Error **errp)
{
    Error *local_err = NULL;

    net_client_init(opts, false, &local_err);
    if (!local_err) {
        return 0;
    }

    error_report_err(local_err);
    return -1;
}

1534
/*
 * qemu_opts_foreach() callback for the "netdev" option group.
 *
 * Errors are reported right here; @errp is not used.
 * Returns -1 when client creation reported an error, otherwise the
 * value returned by net_client_init().
 */
static int net_init_netdev(void *dummy, QemuOpts *opts, Error **errp)
{
    Error *local_err = NULL;
    int rc = net_client_init(opts, true, &local_err);

    if (local_err) {
        error_report_err(local_err);
        rc = -1;
    }

    return rc;
}

int net_init_clients(void)
{
1550 1551
    QemuOptsList *net = qemu_find_opts("net");

1552 1553 1554
    net_change_state_entry =
        qemu_add_vm_change_state_handler(net_vm_change_state_handler, NULL);

1555
    QTAILQ_INIT(&net_clients);
1556

1557 1558
    if (qemu_opts_foreach(qemu_find_opts("netdev"),
                          net_init_netdev, NULL, NULL)) {
M
Mark McLoughlin 已提交
1559
        return -1;
1560
    }
M
Mark McLoughlin 已提交
1561

1562
    if (qemu_opts_foreach(net, net_init_client, NULL, NULL)) {
1563 1564 1565 1566 1567 1568
        return -1;
    }

    return 0;
}

1569
/*
 * Parse the command line argument @optarg into @opts_list.
 *
 * Returns 0 on success and -1 when parsing failed; the parser reports
 * the problem itself.
 */
int net_client_parse(QemuOptsList *opts_list, const char *optarg)
{
    QemuOpts *parsed = qemu_opts_parse_noisily(opts_list, optarg, true);

    return parsed ? 0 : -1;
}
1577 1578 1579

/* From FreeBSD */
/* XXX: optimize */
1580
uint32_t net_crc32(const uint8_t *p, int len)
1581 1582 1583 1584 1585 1586
{
    uint32_t crc;
    int carry, i, j;
    uint8_t b;

    crc = 0xffffffff;
1587 1588
    for (i = 0; i < len; i++) {
        b = *p++;
1589 1590 1591 1592 1593
        for (j = 0; j < 8; j++) {
            carry = ((crc & 0x80000000L) ? 1 : 0) ^ (b & 0x01);
            crc <<= 1;
            b >>= 1;
            if (carry) {
1594
                crc = ((crc ^ POLYNOMIAL_BE) | carry);
1595 1596 1597
            }
        }
    }
1598 1599 1600 1601

    return crc;
}

1602 1603 1604 1605 1606 1607 1608 1609 1610 1611 1612 1613 1614 1615 1616 1617 1618 1619 1620 1621 1622 1623
/*
 * Bitwise CRC over @len bytes at @p: the register starts at 0xffffffff
 * and is shifted right, each input byte is consumed least significant
 * bit first, and POLYNOMIAL_LE is applied on feedback.  No final
 * inversion is performed.
 *
 * Returns the raw register value; a @len of 0 or less yields 0xffffffff.
 */
uint32_t net_crc32_le(const uint8_t *p, int len)
{
    uint32_t crc = 0xffffffff;
    int pos;

    for (pos = 0; pos < len; pos++) {
        uint8_t cur = p[pos];
        int bit;

        for (bit = 0; bit < 8; bit++) {
            int feedback = (crc & 0x1) ^ (cur & 0x01);

            crc >>= 1;
            cur >>= 1;
            if (feedback) {
                crc ^= POLYNOMIAL_LE;
            }
        }
    }

    return crc;
}

1624 1625 1626 1627 1628 1629 1630 1631 1632 1633 1634 1635 1636 1637 1638 1639 1640 1641 1642 1643 1644 1645 1646 1647 1648
/*
 * Option group "netdev".  A bare first argument is taken as the value
 * of "type".
 */
QemuOptsList qemu_netdev_opts = {
    .name = "netdev",
    .implied_opt_name = "type",
    .head = QTAILQ_HEAD_INITIALIZER(qemu_netdev_opts.head),
    .desc = {
        /*
         * An empty descriptor table accepts any parameter here;
         * validation will happen later.
         */
        { /* end of list */ }
    },
};

/*
 * Option group "net" (legacy syntax).  A bare first argument is taken
 * as the value of "type".
 */
QemuOptsList qemu_net_opts = {
    .name = "net",
    .implied_opt_name = "type",
    .head = QTAILQ_HEAD_INITIALIZER(qemu_net_opts.head),
    .desc = {
        /*
         * An empty descriptor table accepts any parameter here;
         * validation will happen later.
         */
        { /* end of list */ }
    },
};
1649 1650

void net_socket_rs_init(SocketReadState *rs,
1651 1652
                        SocketReadStateFinalize *finalize,
                        bool vnet_hdr)
1653 1654
{
    rs->state = 0;
1655
    rs->vnet_hdr = vnet_hdr;
1656 1657
    rs->index = 0;
    rs->packet_len = 0;
1658
    rs->vnet_hdr_len = 0;
1659 1660 1661 1662 1663 1664
    memset(rs->buf, 0, sizeof(rs->buf));
    rs->finalize = finalize;
}

/*
 * Feed @size bytes at @buf into the packet reassembler @rs.
 *
 * The stream is a sequence of records: a 4-byte big-endian packet
 * length, then (only when rs->vnet_hdr is set) a 4-byte big-endian vnet
 * header length, then the packet data.  rs->finalize is called once for
 * every completed packet.  A packet that does not fit into rs->buf
 * resets the reassembler and is reported as an error.
 *
 * Returns
 * 0: success
 * -1: error occurs
 */
int net_fill_rstate(SocketReadState *rs, const uint8_t *buf, int size)
{
    unsigned int l;

    while (size > 0) {
        /* Reassemble a packet from the network.
         * 0 = getting length.
         * 1 = getting vnet header length.
         * 2 = getting data.
         */
        switch (rs->state) {
        case 0:
            l = 4 - rs->index;
            if (l > size) {
                l = size;
            }
            memcpy(rs->buf + rs->index, buf, l);
            buf += l;
            size -= l;
            rs->index += l;
            if (rs->index == 4) {
                uint32_t be_len;

                /* got length; copy it out instead of casting rs->buf, so
                 * the load is neither misaligned nor type-punned
                 */
                memcpy(&be_len, rs->buf, sizeof(be_len));
                rs->packet_len = ntohl(be_len);
                rs->index = 0;
                if (rs->vnet_hdr) {
                    rs->state = 1;
                } else {
                    rs->state = 2;
                    rs->vnet_hdr_len = 0;
                }
            }
            break;
        case 1:
            l = 4 - rs->index;
            if (l > size) {
                l = size;
            }
            memcpy(rs->buf + rs->index, buf, l);
            buf += l;
            size -= l;
            rs->index += l;
            if (rs->index == 4) {
                uint32_t be_len;

                /* got vnet header length */
                memcpy(&be_len, rs->buf, sizeof(be_len));
                rs->vnet_hdr_len = ntohl(be_len);
                rs->index = 0;
                rs->state = 2;
            }
            break;
        case 2:
            l = rs->packet_len - rs->index;
            if (l > size) {
                l = size;
            }
            if (rs->index + l <= sizeof(rs->buf)) {
                memcpy(rs->buf + rs->index, buf, l);
            } else {
                fprintf(stderr, "serious error: oversized packet received, "
                    "connection terminated.\n");
                rs->index = rs->state = 0;
                return -1;
            }

            rs->index += l;
            buf += l;
            size -= l;
            if (rs->index >= rs->packet_len) {
                /* Packet complete: rearm for the next length field
                 * before handing the buffer to the callback.
                 */
                rs->index = 0;
                rs->state = 0;
                assert(rs->finalize);
                rs->finalize(rs);
            }
            break;
        }
    }

    assert(size == 0);
    return 0;
}