net.c 45.0 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23
/*
 * QEMU System Emulator
 *
 * Copyright (c) 2003-2008 Fabrice Bellard
 *
 * Permission is hereby granted, free of charge, to any person obtaining a copy
 * of this software and associated documentation files (the "Software"), to deal
 * in the Software without restriction, including without limitation the rights
 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
 * copies of the Software, and to permit persons to whom the Software is
 * furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
 * THE SOFTWARE.
 */
24

P
Peter Maydell 已提交
25
#include "qemu/osdep.h"
B
blueswir1 已提交
26

P
Paolo Bonzini 已提交
27
#include "net/net.h"
P
Paolo Bonzini 已提交
28 29
#include "clients.h"
#include "hub.h"
P
Paolo Bonzini 已提交
30
#include "net/slirp.h"
31
#include "net/eth.h"
P
Paolo Bonzini 已提交
32
#include "util.h"
33

34
#include "monitor/monitor.h"
M
Mark McLoughlin 已提交
35
#include "qemu-common.h"
36
#include "qemu/help_option.h"
37
#include "qapi/qmp/qerror.h"
38
#include "qemu/error-report.h"
39
#include "qemu/sockets.h"
40
#include "qemu/cutils.h"
41
#include "qemu/config-file.h"
L
Luiz Capitulino 已提交
42
#include "qmp-commands.h"
43
#include "hw/qdev.h"
44
#include "qemu/iov.h"
45
#include "qemu/main-loop.h"
46
#include "qapi-visit.h"
47
#include "qapi/error.h"
48
#include "qapi/opts-visitor.h"
49
#include "sysemu/sysemu.h"
50
#include "sysemu/qtest.h"
Y
Yang Hongyang 已提交
51
#include "net/filter.h"
52
#include "qapi/string-output-visitor.h"
53

54 55 56 57 58
/*
 * Net bridge is currently not supported for W32, so CONFIG_NET_BRIDGE
 * (which gates the "bridge" backend entries further down in this file)
 * is only defined on non-Windows hosts.
 */
#if !defined(_WIN32)
# define CONFIG_NET_BRIDGE
#endif

59
/*
 * NOTE(review): presumably the handle of a registered VM run-state change
 * handler; it is not assigned in the visible part of this file -- confirm.
 */
static VMChangeStateEntry *net_change_state_entry;
60
/*
 * List of all net clients.  qemu_net_client_setup() appends to it and
 * qemu_cleanup_net_client() removes from it.
 */
static QTAILQ_HEAD(, NetClientState) net_clients;
61

62 63 64 65 66 67 68
/*
 * NULL-terminated list of backend type names.  Entries for optional
 * backends are present only when the matching CONFIG_* macro is defined.
 */
const char *host_net_devices[] = {
    "tap",
    "socket",
    "dump",
#if defined(CONFIG_NET_BRIDGE)
    "bridge",
#endif
#if defined(CONFIG_NETMAP)
    "netmap",
#endif
#if defined(CONFIG_SLIRP)
    "user",
#endif
#if defined(CONFIG_VDE)
    "vde",
#endif
    "vhost-user",
    NULL,
};

82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104
/***********************************************************/
/* network device redirectors */

/*
 * Split off the part of *pp that precedes the first occurrence of @sep.
 *
 * When buf_size > 0 the part is copied into @buf, truncated to
 * buf_size - 1 bytes and always NUL-terminated.  On success *pp is
 * advanced to the character after the separator and 0 is returned.
 * If @sep does not occur, -1 is returned and neither @buf nor *pp is
 * modified.
 */
static int get_str_sep(char *buf, int buf_size, const char **pp, int sep)
{
    const char *start = *pp;
    const char *sep_pos = strchr(start, sep);

    if (sep_pos == NULL) {
        return -1;
    }

    if (buf_size > 0) {
        int copy_len = sep_pos - start;

        if (copy_len >= buf_size) {
            copy_len = buf_size - 1;
        }
        memcpy(buf, start, copy_len);
        buf[copy_len] = '\0';
    }

    *pp = sep_pos + 1;
    return 0;
}

105 106
/*
 * Parse a "host:port" string into an IPv4 socket address.
 *
 * @saddr: filled in with family, address and port on success
 * @str:   text of the form "[host]:port"
 * @errp:  receives a description of the failure
 *
 * An empty host selects address 0.  A host starting with a digit is
 * parsed with inet_aton(); anything else is resolved with
 * gethostbyname().  The port is parsed with strtol() in base 0 and must
 * lie in 0..65535; characters following the number are ignored, as
 * before.
 *
 * Returns 0 on success, -1 (with @errp set) on failure.
 */
int parse_host_port(struct sockaddr_in *saddr, const char *str,
                    Error **errp)
{
    char buf[512];
    struct hostent *he;
    const char *p = str;
    char *end;
    long port;

    if (get_str_sep(buf, sizeof(buf), &p, ':') < 0) {
        error_setg(errp, "host address '%s' doesn't contain ':' "
                   "separating host from port", str);
        return -1;
    }

    saddr->sin_family = AF_INET;
    if (buf[0] == '\0') {
        saddr->sin_addr.s_addr = 0;
    } else if (qemu_isdigit(buf[0])) {
        if (!inet_aton(buf, &saddr->sin_addr)) {
            error_setg(errp, "host address '%s' is not a valid "
                       "IPv4 address", buf);
            return -1;
        }
    } else {
        he = gethostbyname(buf);
        if (he == NULL) {
            error_setg(errp, "can't resolve host address '%s'", buf);
            return -1;
        }
        saddr->sin_addr = *(struct in_addr *)he->h_addr;
    }

    /*
     * strtol() saturates to LONG_MIN/LONG_MAX on overflow, so the range
     * check below also rejects overflowing input.  Without it htons()
     * would silently truncate the value to 16 bits.
     */
    port = strtol(p, &end, 0);
    if (end == p || port < 0 || port > 65535) {
        error_setg(errp, "port number '%s' is invalid", p);
        return -1;
    }
    saddr->sin_port = htons(port);
    return 0;
}

147 148 149 150 151 152 153
/*
 * Format the six bytes at @macaddr as lower-case hex "xx:xx:xx:xx:xx:xx".
 * The string is allocated by g_strdup_printf() and returned to the caller.
 */
char *qemu_mac_strdup_printf(const uint8_t *macaddr)
{
    const uint8_t *m = macaddr;
    char *text;

    text = g_strdup_printf("%.2x:%.2x:%.2x:%.2x:%.2x:%.2x",
                           m[0], m[1], m[2], m[3], m[4], m[5]);
    return text;
}

154
/*
 * Write "model=<model>,macaddr=<mac>" into nc->info_str, truncating to
 * the size of that buffer.
 */
void qemu_format_nic_info_str(NetClientState *nc, uint8_t macaddr[6])
{
    const uint8_t *m = macaddr;

    snprintf(nc->info_str, sizeof(nc->info_str),
             "model=%s,macaddr=%02x:%02x:%02x:%02x:%02x:%02x",
             nc->model, m[0], m[1], m[2], m[3], m[4], m[5]);
}

163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203
/*
 * Usage counters indexed by the last byte of a MAC address.  The helpers
 * in this file only ever touch indexes 0x56..0xFE.
 */
static int mac_table[256] = {0};

/*
 * Bump the usage counter for the last byte of @macaddr, provided that
 * byte lies in the managed range 0x56..0xFE.
 */
static void qemu_macaddr_set_used(MACAddr *macaddr)
{
    int last = macaddr->a[5];

    if (last >= 0x56 && last < 0xFF) {
        mac_table[last]++;
    }
}

/*
 * Drop one usage count for @macaddr.  Only addresses whose first five
 * bytes equal 52:54:00:12:34 and whose last byte lies in 0x56..0xFE are
 * tracked; anything else is ignored.
 */
static void qemu_macaddr_set_free(MACAddr *macaddr)
{
    static const MACAddr base = { .a = { 0x52, 0x54, 0x00, 0x12, 0x34, 0 } };
    int last;

    if (memcmp(macaddr->a, &base.a, (sizeof(base.a) - 1)) != 0) {
        return;
    }

    last = macaddr->a[5];
    if (last >= 0x56 && last < 0xFF) {
        mac_table[last]--;
    }
}

/*
 * Return the lowest value in 0x56..0xFE whose usage counter is zero,
 * or -1 when every value in that range is in use.
 */
static int qemu_macaddr_get_free(void)
{
    int candidate = 0x56;

    while (candidate < 0xFF) {
        if (mac_table[candidate] == 0) {
            return candidate;
        }
        candidate++;
    }

    return -1;
}

G
Gerd Hoffmann 已提交
204 205 206
/*
 * Give @macaddr a default value if it is all zeroes.
 *
 * A non-zero address is left untouched; if its first five bytes are
 * 52:54:00:12:34 it is additionally recorded as used.  An all-zero
 * address becomes 52:54:00:12:34:xx, where xx is whatever
 * qemu_macaddr_get_free() returns, and is then recorded as used.
 */
void qemu_macaddr_default_if_unset(MACAddr *macaddr)
{
    static const MACAddr zero = { .a = { 0,0,0,0,0,0 } };
    static const MACAddr base = { .a = { 0x52, 0x54, 0x00, 0x12, 0x34, 0 } };
    const size_t prefix_len = sizeof(base.a) - 1;

    if (memcmp(macaddr, &zero, sizeof(zero)) != 0) {
        /* Caller supplied an address: only track it if it uses our prefix. */
        if (memcmp(macaddr->a, &base.a, prefix_len) == 0) {
            qemu_macaddr_set_used(macaddr);
        }
        return;
    }

    memcpy(macaddr->a, base.a, prefix_len);
    macaddr->a[5] = qemu_macaddr_get_free();
    qemu_macaddr_set_used(macaddr);
}

227 228 229
/**
 * Generate a name for net client
 *
A
Amos Kong 已提交
230
 * Only net clients created with the legacy -net option and NICs need this.
231
 */
232
static char *assign_name(NetClientState *nc1, const char *model)
233
{
234
    NetClientState *nc;
235 236
    int id = 0;

237 238
    QTAILQ_FOREACH(nc, &net_clients, next) {
        if (nc == nc1) {
239
            continue;
240
        }
A
Amos Kong 已提交
241
        if (strcmp(nc->model, model) == 0) {
242 243 244 245
            id++;
        }
    }

246
    return g_strdup_printf("%s.%d", model, id);
247 248
}

249 250 251 252 253
/*
 * Destructor that qemu_new_net_client() installs: releases the
 * NetClientState allocation itself with g_free().
 */
static void qemu_net_client_destructor(NetClientState *nc)
{
    g_free(nc);
}

254 255 256 257
/*
 * Initialise an already allocated (zeroed) NetClientState.
 *
 * Copies @model, copies @name or generates one when @name is NULL,
 * links @nc with @peer (which must not have a peer yet), appends @nc to
 * net_clients, creates its incoming queue and records @destructor.
 */
static void qemu_net_client_setup(NetClientState *nc,
                                  NetClientInfo *info,
                                  NetClientState *peer,
                                  const char *model,
                                  const char *name,
                                  NetClientDestructor *destructor)
{
    nc->info = info;
    nc->model = g_strdup(model);
    nc->name = name ? g_strdup(name) : assign_name(nc, model);

    if (peer) {
        assert(!peer->peer);
        nc->peer = peer;
        peer->peer = nc;
    }
    QTAILQ_INSERT_TAIL(&net_clients, nc, next);

    nc->incoming_queue = qemu_new_net_queue(qemu_deliver_packet_iov, nc);
    nc->destructor = destructor;
    QTAILQ_INIT(&nc->filters);
}

/*
 * Allocate a zeroed client of info->size bytes (which must be at least
 * sizeof(NetClientState)), set it up, and return it.  The client is
 * freed through qemu_net_client_destructor().
 */
NetClientState *qemu_new_net_client(NetClientInfo *info,
                                    NetClientState *peer,
                                    const char *model,
                                    const char *name)
{
    NetClientState *client;

    assert(info->size >= sizeof(NetClientState));

    client = g_malloc0(info->size);
    qemu_net_client_setup(client, info, peer, model, name,
                          qemu_net_client_destructor);
    return client;
}

297 298 299 300 301 302
/*
 * Allocate a NIC with one NetClientState per queue.
 *
 * A single allocation holds info->size bytes of NIC state followed by
 * the array of per-queue NetClientStates (nic->ncs).  At least one queue
 * is always created.  Each queue is set up with the matching entry of
 * conf->peers.ncs as its peer and with no destructor.
 */
NICState *qemu_new_nic(NetClientInfo *info,
                       NICConf *conf,
                       const char *model,
                       const char *name,
                       void *opaque)
{
    NetClientState **peers = conf->peers.ncs;
    int queues = MAX(1, conf->peers.queues);
    NICState *nic;
    int q;

    assert(info->type == NET_CLIENT_DRIVER_NIC);
    assert(info->size >= sizeof(NICState));

    nic = g_malloc0(info->size + sizeof(NetClientState) * queues);
    nic->ncs = (void *)((char *)nic + info->size);
    nic->conf = conf;
    nic->opaque = opaque;

    for (q = 0; q < queues; q++) {
        NetClientState *sub = &nic->ncs[q];

        qemu_net_client_setup(sub, info, peers[q], model, name, NULL);
        sub->queue_index = q;
    }

    return nic;
}

J
Jason Wang 已提交
324 325
/* Return the NetClientState of queue @queue_index of @nic (no bounds check). */
NetClientState *qemu_get_subqueue(NICState *nic, int queue_index)
{
    return &nic->ncs[queue_index];
}

J
Jason Wang 已提交
329 330
/* Return the NetClientState of the first queue (index 0) of @nic. */
NetClientState *qemu_get_queue(NICState *nic)
{
    NetClientState *first = qemu_get_subqueue(nic, 0);

    return first;
}

J
Jason Wang 已提交
334 335
/*
 * Recover the owning NICState from one of its queue NetClientStates.
 *
 * Steps back nc->queue_index entries to the first queue, then back
 * nc->info->size bytes, mirroring the layout qemu_new_nic() creates.
 */
NICState *qemu_get_nic(NetClientState *nc)
{
    NetClientState *first_queue = nc - nc->queue_index;
    char *nic_base = (char *)first_queue - nc->info->size;

    return (NICState *)(void *)nic_base;
}

/* Return the opaque pointer stored in the NIC that owns queue @nc. */
void *qemu_get_nic_opaque(NetClientState *nc)
{
    return qemu_get_nic(nc)->opaque;
}

348
/*
 * Unlink @nc from net_clients, then run its info->cleanup callback if
 * one is set.  Nothing is freed here.
 */
static void qemu_cleanup_net_client(NetClientState *nc)
{
    QTAILQ_REMOVE(&net_clients, nc, next);

    if (!nc->info->cleanup) {
        return;
    }
    nc->info->cleanup(nc);
}
356

357
/*
 * Release what @nc owns: its incoming queue, the back-pointer held by
 * its peer, its name and model strings, and finally @nc itself through
 * its destructor (when one is set).
 */
static void qemu_free_net_client(NetClientState *nc)
{
    NetClientState *peer = nc->peer;

    if (nc->incoming_queue) {
        qemu_del_net_queue(nc->incoming_queue);
    }
    if (peer) {
        peer->peer = NULL;
    }

    g_free(nc->name);
    g_free(nc->model);

    /* Must be last: the destructor may free nc. */
    if (nc->destructor) {
        nc->destructor(nc);
    }
}

372
/*
 * Delete a non-NIC net client together with every other non-NIC client
 * that shares its name (the queues of a multiqueue backend).
 *
 * All filters attached to @nc are unparented first.  If the peer is a
 * NIC, the clients are only cleaned up, not freed: the NIC is flagged
 * peer_deleted, its queues are marked link-down and its
 * link_status_changed callback is invoked; qemu_del_nic() frees them
 * later.  Otherwise the clients are cleaned up and freed immediately.
 */
void qemu_del_net_client(NetClientState *nc)
{
    NetClientState *ncs[MAX_QUEUE_NUM];
    NetFilterState *nf, *nf_next;
    NICState *nic;
    int queues, i;

    assert(nc->info->type != NET_CLIENT_DRIVER_NIC);

    /* If the NetClientState belongs to a multiqueue backend, we will change all
     * other NetClientStates also.
     */
    queues = qemu_find_net_clients_except(nc->name, ncs,
                                          NET_CLIENT_DRIVER_NIC,
                                          MAX_QUEUE_NUM);
    assert(queues != 0);

    QTAILQ_FOREACH_SAFE(nf, &nc->filters, next, nf_next) {
        object_unparent(OBJECT(nf));
    }

    if (!nc->peer || nc->peer->info->type != NET_CLIENT_DRIVER_NIC) {
        /* No NIC on the other side: tear everything down now. */
        for (i = 0; i < queues; i++) {
            qemu_cleanup_net_client(ncs[i]);
            qemu_free_net_client(ncs[i]);
        }
        return;
    }

    /* If there is a peer NIC, delete and cleanup client, but do not free. */
    nic = qemu_get_nic(nc->peer);
    if (nic->peer_deleted) {
        return;
    }
    nic->peer_deleted = true;

    for (i = 0; i < queues; i++) {
        ncs[i]->peer->link_down = true;
    }

    if (nc->peer->info->link_status_changed) {
        nc->peer->info->link_status_changed(nc->peer);
    }

    for (i = 0; i < queues; i++) {
        qemu_cleanup_net_client(ncs[i]);
    }
}

/*
 * Destroy a NIC: release its MAC address slot, free the peers that
 * qemu_del_net_client() left behind (when peer_deleted is set), then
 * clean up and free each queue from last to first and free the NIC.
 */
void qemu_del_nic(NICState *nic)
{
    int queues = MAX(nic->conf->peers.queues, 1);
    int i;

    qemu_macaddr_set_free(&nic->conf->macaddr);

    /* If this is a peer NIC and peer has already been deleted, free it now. */
    if (nic->peer_deleted) {
        for (i = 0; i < queues; i++) {
            qemu_free_net_client(qemu_get_subqueue(nic, i)->peer);
        }
    }

    i = queues;
    while (i-- > 0) {
        NetClientState *queue = qemu_get_subqueue(nic, i);

        qemu_cleanup_net_client(queue);
        qemu_free_net_client(queue);
    }

    g_free(nic);
}

M
Mark McLoughlin 已提交
444 445
/*
 * Call @func(nic, @opaque) once per NIC, i.e. for every NIC-type client
 * on net_clients whose queue_index is 0.
 */
void qemu_foreach_nic(qemu_nic_foreach func, void *opaque)
{
    NetClientState *nc;

    QTAILQ_FOREACH(nc, &net_clients, next) {
        if (nc->info->type != NET_CLIENT_DRIVER_NIC) {
            continue;
        }
        if (nc->queue_index != 0) {
            continue;
        }
        func(qemu_get_nic(nc), opaque);
    }
}

457
/*
 * Forward to nc->info->has_ufo(); false when @nc is NULL or the
 * callback is not provided.
 */
bool qemu_has_ufo(NetClientState *nc)
{
    if (nc && nc->info->has_ufo) {
        return nc->info->has_ufo(nc);
    }

    return false;
}

466
/*
 * Forward to nc->info->has_vnet_hdr(); false when @nc is NULL or the
 * callback is not provided.
 */
bool qemu_has_vnet_hdr(NetClientState *nc)
{
    if (nc && nc->info->has_vnet_hdr) {
        return nc->info->has_vnet_hdr(nc);
    }

    return false;
}

475
/*
 * Forward to nc->info->has_vnet_hdr_len() with @len; false when @nc is
 * NULL or the callback is not provided.
 */
bool qemu_has_vnet_hdr_len(NetClientState *nc, int len)
{
    if (nc && nc->info->has_vnet_hdr_len) {
        return nc->info->has_vnet_hdr_len(nc, len);
    }

    return false;
}

484
/*
 * Forward to nc->info->using_vnet_hdr() with @enable; does nothing when
 * @nc is NULL or the callback is not provided.
 */
void qemu_using_vnet_hdr(NetClientState *nc, bool enable)
{
    if (nc && nc->info->using_vnet_hdr) {
        nc->info->using_vnet_hdr(nc, enable);
    }
}

493
/*
 * Forward the offload settings to nc->info->set_offload(); does nothing
 * when @nc is NULL or the callback is not provided.
 */
void qemu_set_offload(NetClientState *nc, int csum, int tso4, int tso6,
                      int ecn, int ufo)
{
    if (nc && nc->info->set_offload) {
        nc->info->set_offload(nc, csum, tso4, tso6, ecn, ufo);
    }
}

503
/*
 * Record @len in nc->vnet_hdr_len and pass it to
 * nc->info->set_vnet_hdr_len().  Nothing is recorded or called when @nc
 * is NULL or the callback is not provided.
 */
void qemu_set_vnet_hdr_len(NetClientState *nc, int len)
{
    if (nc && nc->info->set_vnet_hdr_len) {
        nc->vnet_hdr_len = len;
        nc->info->set_vnet_hdr_len(nc, len);
    }
}

G
Greg Kurz 已提交
513 514
/*
 * Without HOST_WORDS_BIGENDIAN this is a no-op returning 0.  With it,
 * the request is forwarded to nc->info->set_vnet_le(), or -ENOSYS is
 * returned when @nc is NULL or the callback is not provided.
 */
int qemu_set_vnet_le(NetClientState *nc, bool is_le)
{
#ifndef HOST_WORDS_BIGENDIAN
    return 0;
#else
    if (nc && nc->info->set_vnet_le) {
        return nc->info->set_vnet_le(nc, is_le);
    }

    return -ENOSYS;
#endif
}

/*
 * With HOST_WORDS_BIGENDIAN this is a no-op returning 0.  Without it,
 * the request is forwarded to nc->info->set_vnet_be(), or -ENOSYS is
 * returned when @nc is NULL or the callback is not provided.
 */
int qemu_set_vnet_be(NetClientState *nc, bool is_be)
{
#ifndef HOST_WORDS_BIGENDIAN
    if (nc && nc->info->set_vnet_be) {
        return nc->info->set_vnet_be(nc, is_be);
    }

    return -ENOSYS;
#else
    return 0;
#endif
}

539
/*
 * Tell whether @sender may send a packet right now.
 *
 * Returns 0 when the VM is not running, when the peer has receiving
 * disabled, or when the peer's can_receive callback says no.  Returns 1
 * otherwise, including when @sender has no peer.
 */
int qemu_can_send_packet(NetClientState *sender)
{
    NetClientState *peer;

    if (!runstate_is_running()) {
        return 0;
    }

    peer = sender->peer;
    if (!peer) {
        return 1;
    }

    if (peer->receive_disabled) {
        return 0;
    }
    if (peer->info->can_receive && !peer->info->can_receive(peer)) {
        return 0;
    }

    return 1;
}

560 561 562 563 564 565 566 567 568 569 570
/*
 * Run a packet through the filters attached to @nc.
 *
 * Filters are visited front to back for NET_FILTER_DIRECTION_TX and
 * back to front for any other direction.  The first non-zero result of
 * qemu_netfilter_receive() stops the walk and is returned; 0 is
 * returned when every filter returned 0 or there are no filters.
 */
static ssize_t filter_receive_iov(NetClientState *nc,
                                  NetFilterDirection direction,
                                  NetClientState *sender,
                                  unsigned flags,
                                  const struct iovec *iov,
                                  int iovcnt,
                                  NetPacketSent *sent_cb)
{
    NetFilterState *filter = NULL;
    ssize_t rc = 0;

    if (direction != NET_FILTER_DIRECTION_TX) {
        QTAILQ_FOREACH_REVERSE(filter, &nc->filters, NetFilterHead, next) {
            rc = qemu_netfilter_receive(filter, direction, sender, flags,
                                        iov, iovcnt, sent_cb);
            if (rc) {
                return rc;
            }
        }
        return rc;
    }

    QTAILQ_FOREACH(filter, &nc->filters, next) {
        rc = qemu_netfilter_receive(filter, direction, sender, flags,
                                    iov, iovcnt, sent_cb);
        if (rc) {
            return rc;
        }
    }

    return rc;
}

/*
 * Flat-buffer convenience wrapper: wraps @data/@size in a one-element
 * iovec and hands it to filter_receive_iov().
 */
static ssize_t filter_receive(NetClientState *nc,
                              NetFilterDirection direction,
                              NetClientState *sender,
                              unsigned flags,
                              const uint8_t *data,
                              size_t size,
                              NetPacketSent *sent_cb)
{
    struct iovec single;

    single.iov_base = (void *)data;
    single.iov_len = size;

    return filter_receive_iov(nc, direction, sender, flags, &single, 1,
                              sent_cb);
}

608
/*
 * Purge @nc's packets from its peer's incoming queue.  Does nothing
 * when @nc has no peer.
 */
void qemu_purge_queued_packets(NetClientState *nc)
{
    if (nc->peer) {
        qemu_net_queue_purge(nc->peer->incoming_queue, nc);
    }
}

617 618
/*
 * Re-enable receiving on @nc and try to flush its incoming queue.
 *
 * If the peer is a hub port the hub is flushed first.  When the queue
 * flush succeeds the main loop is notified; when it does not and
 * @purge is set, the remaining packets are purged.
 */
static
void qemu_flush_or_purge_queued_packets(NetClientState *nc, bool purge)
{
    nc->receive_disabled = 0;

    if (nc->peer && nc->peer->info->type == NET_CLIENT_DRIVER_HUBPORT &&
        net_hub_flush(nc->peer)) {
        qemu_notify_event();
    }

    if (qemu_net_queue_flush(nc->incoming_queue)) {
        /* We emptied the queue successfully, signal to the IO thread to repoll
         * the file descriptor (for tap, for example).
         */
        qemu_notify_event();
        return;
    }

    if (purge) {
        /* Unable to empty the queue, purge remaining packets */
        qemu_net_queue_purge(nc->incoming_queue, nc);
    }
}

638 639 640 641 642
/*
 * Flush the packets queued for @nc without purging those that cannot be
 * delivered (qemu_flush_or_purge_queued_packets() with purge == false).
 */
void qemu_flush_queued_packets(NetClientState *nc)
{
    qemu_flush_or_purge_queued_packets(nc, false);
}

643
/*
 * Send a flat buffer from @sender to its peer.
 *
 * If the sender's link is down or it has no peer, @size is returned
 * without sending anything.  Otherwise the packet goes through the
 * sender's filters (TX) and then the peer's filters (RX); the first
 * non-zero filter result is returned as is.  If no filter returns
 * non-zero, the packet is queued on the peer's incoming queue and the
 * result of qemu_net_queue_send() is returned.
 *
 * The filter result is kept in an ssize_t, matching the return type of
 * filter_receive() and of this function.
 */
static ssize_t qemu_send_packet_async_with_flags(NetClientState *sender,
                                                 unsigned flags,
                                                 const uint8_t *buf, int size,
                                                 NetPacketSent *sent_cb)
{
    NetQueue *queue;
    ssize_t ret;

#ifdef DEBUG_NET
    printf("qemu_send_packet_async:\n");
    qemu_hexdump((const char *)buf, stdout, "net", size);
#endif

    if (sender->link_down || !sender->peer) {
        return size;
    }

    /* Let filters handle the packet first */
    ret = filter_receive(sender, NET_FILTER_DIRECTION_TX,
                         sender, flags, buf, size, sent_cb);
    if (ret) {
        return ret;
    }

    ret = filter_receive(sender->peer, NET_FILTER_DIRECTION_RX,
                         sender, flags, buf, size, sent_cb);
    if (ret) {
        return ret;
    }

    queue = sender->peer->incoming_queue;

    return qemu_net_queue_send(queue, sender, flags, buf, size, sent_cb);
}

678
/*
 * Send @buf from @sender with no packet flags; see
 * qemu_send_packet_async_with_flags() for the return value.
 */
ssize_t qemu_send_packet_async(NetClientState *sender,
                               const uint8_t *buf, int size,
                               NetPacketSent *sent_cb)
{
    const unsigned flags = QEMU_NET_PACKET_FLAG_NONE;

    return qemu_send_packet_async_with_flags(sender, flags, buf, size,
                                             sent_cb);
}

686
/*
 * Send @buf from @nc with no completion callback; the result of the
 * send is discarded.
 */
void qemu_send_packet(NetClientState *nc, const uint8_t *buf, int size)
{
    (void)qemu_send_packet_async(nc, buf, size, NULL);
}

691
/*
 * Send @buf from @nc with QEMU_NET_PACKET_FLAG_RAW set and no
 * completion callback.
 */
ssize_t qemu_send_packet_raw(NetClientState *nc, const uint8_t *buf, int size)
{
    const unsigned flags = QEMU_NET_PACKET_FLAG_RAW;

    return qemu_send_packet_async_with_flags(nc, flags, buf, size, NULL);
}

697
/*
 * Deliver an iovec to a client through its flat-buffer callbacks.
 *
 * A single-element iovec is passed through directly.  Otherwise the
 * data is linearised into a temporary buffer; vectors larger than
 * NET_BUFSIZE in total are rejected with -1.  The receive_raw callback
 * is used when the RAW flag is set and the callback exists, the receive
 * callback otherwise.
 */
static ssize_t nc_sendv_compat(NetClientState *nc, const struct iovec *iov,
                               int iovcnt, unsigned flags)
{
    uint8_t *bounce = NULL;
    uint8_t *data;
    size_t len;
    ssize_t ret;

    if (iovcnt == 1) {
        data = iov[0].iov_base;
        len = iov[0].iov_len;
    } else {
        len = iov_size(iov, iovcnt);
        if (len > NET_BUFSIZE) {
            return -1;
        }
        bounce = g_malloc(len);
        data = bounce;
        len = iov_to_buf(iov, iovcnt, 0, bounce, len);
    }

    if ((flags & QEMU_NET_PACKET_FLAG_RAW) && nc->info->receive_raw) {
        ret = nc->info->receive_raw(nc, data, len);
    } else {
        ret = nc->info->receive(nc, data, len);
    }

    /* bounce is NULL on the single-element path. */
    g_free(bounce);
    return ret;
}

728 729 730 731 732
/*
 * Deliver a packet to the client passed as @opaque.  This is the
 * callback qemu_net_client_setup() gives to qemu_new_net_queue().
 *
 * If the client's link is down, the total iovec size is returned and
 * nothing is delivered.  If receiving is disabled, 0 is returned.
 * Otherwise the packet goes to receive_iov (when present and the RAW
 * flag is not set) or through nc_sendv_compat().  A result of 0
 * disables further receiving on the client until it is flushed.
 *
 * The result is kept in an ssize_t so it matches the callee's and this
 * function's return type.
 */
ssize_t qemu_deliver_packet_iov(NetClientState *sender,
                                unsigned flags,
                                const struct iovec *iov,
                                int iovcnt,
                                void *opaque)
{
    NetClientState *nc = opaque;
    ssize_t ret;

    if (nc->link_down) {
        return iov_size(iov, iovcnt);
    }

    if (nc->receive_disabled) {
        return 0;
    }

    if (nc->info->receive_iov && !(flags & QEMU_NET_PACKET_FLAG_RAW)) {
        ret = nc->info->receive_iov(nc, iov, iovcnt);
    } else {
        ret = nc_sendv_compat(nc, iov, iovcnt, flags);
    }

    if (ret == 0) {
        nc->receive_disabled = 1;
    }

    return ret;
}

758
/*
 * Send an iovec from @sender to its peer.
 *
 * If the sender's link is down or it has no peer, the total iovec size
 * is returned without sending anything.  Otherwise the packet goes
 * through the sender's filters (TX) and then the peer's filters (RX);
 * the first non-zero filter result is returned as is.  If no filter
 * returns non-zero, the packet is queued on the peer's incoming queue.
 *
 * The filter result is kept in an ssize_t, matching the return type of
 * filter_receive_iov() and of this function.
 */
ssize_t qemu_sendv_packet_async(NetClientState *sender,
                                const struct iovec *iov, int iovcnt,
                                NetPacketSent *sent_cb)
{
    NetQueue *queue;
    ssize_t ret;

    if (sender->link_down || !sender->peer) {
        return iov_size(iov, iovcnt);
    }

    /* Let filters handle the packet first */
    ret = filter_receive_iov(sender, NET_FILTER_DIRECTION_TX, sender,
                             QEMU_NET_PACKET_FLAG_NONE, iov, iovcnt, sent_cb);
    if (ret) {
        return ret;
    }

    ret = filter_receive_iov(sender->peer, NET_FILTER_DIRECTION_RX, sender,
                             QEMU_NET_PACKET_FLAG_NONE, iov, iovcnt, sent_cb);
    if (ret) {
        return ret;
    }

    queue = sender->peer->incoming_queue;

    return qemu_net_queue_send_iov(queue, sender,
                                   QEMU_NET_PACKET_FLAG_NONE,
                                   iov, iovcnt, sent_cb);
}

789
ssize_t
790
qemu_sendv_packet(NetClientState *nc, const struct iovec *iov, int iovcnt)
791
{
792
    return qemu_sendv_packet_async(nc, iov, iovcnt, NULL);
793 794
}

795
NetClientState *qemu_find_netdev(const char *id)
M
Mark McLoughlin 已提交
796
{
797
    NetClientState *nc;
M
Mark McLoughlin 已提交
798

799
    QTAILQ_FOREACH(nc, &net_clients, next) {
800
        if (nc->info->type == NET_CLIENT_DRIVER_NIC)
801
            continue;
802 803
        if (!strcmp(nc->name, id)) {
            return nc;
M
Mark McLoughlin 已提交
804 805 806 807 808 809
        }
    }

    return NULL;
}

810
int qemu_find_net_clients_except(const char *id, NetClientState **ncs,
811
                                 NetClientDriver type, int max)
812 813 814 815 816 817 818 819
{
    NetClientState *nc;
    int ret = 0;

    QTAILQ_FOREACH(nc, &net_clients, next) {
        if (nc->info->type == type) {
            continue;
        }
820
        if (!id || !strcmp(nc->name, id)) {
821 822 823 824 825 826 827 828 829 830
            if (ret < max) {
                ncs[ret] = nc;
            }
            ret++;
        }
    }

    return ret;
}

831 832 833 834 835 836 837 838 839 840
/* Return the index of the first unused nd_table entry, or -1 if all are used. */
static int nic_get_free_idx(void)
{
    int slot = 0;

    while (slot < MAX_NICS) {
        if (!nd_table[slot].used) {
            return slot;
        }
        slot++;
    }

    return -1;
}

841 842 843 844
/*
 * If @arg is a help option, print the NULL-terminated @models list to
 * stderr as a comma-separated line and return 1.  Otherwise (including
 * when @arg is NULL) print nothing and return 0.
 */
int qemu_show_nic_models(const char *arg, const char *const *models)
{
    const char *const *entry;

    if (!arg || !is_help_option(arg)) {
        return 0;
    }

    fprintf(stderr, "qemu: Supported NIC models: ");
    for (entry = models; *entry; entry++) {
        /* Comma between entries, newline after the last one. */
        fprintf(stderr, "%s%c", *entry, entry[1] ? ',' : '\n');
    }

    return 1;
}

855 856 857 858 859 860 861
/*
 * Check @nd against the single supported @model.  Exits with status 0
 * after printing the list when nd->model is a help option, and with
 * status 1 when the model is not supported.
 */
void qemu_check_nic_model(NICInfo *nd, const char *model)
{
    const char *models[2] = { model, NULL };

    if (qemu_show_nic_models(nd->model, models)) {
        exit(0);
    }
    if (qemu_find_nic_model(nd, models, model) < 0) {
        exit(1);
    }
}

868 869
/*
 * Look up nd->model in the NULL-terminated @models list.
 *
 * When nd->model is unset it is first set to a copy of @default_model.
 * Returns the index of the matching entry, or -1 after reporting an
 * error when there is no match.
 */
int qemu_find_nic_model(NICInfo *nd, const char * const *models,
                        const char *default_model)
{
    int idx = 0;

    if (!nd->model) {
        nd->model = g_strdup(default_model);
    }

    while (models[idx]) {
        if (strcmp(nd->model, models[idx]) == 0) {
            return idx;
        }
        idx++;
    }

    error_report("Unsupported NIC model: %s", nd->model);
    return -1;
}

885
static int net_init_nic(const Netdev *netdev, const char *name,
886
                        NetClientState *peer, Error **errp)
887 888 889
{
    int idx;
    NICInfo *nd;
890 891
    const NetLegacyNicOptions *nic;

892 893
    assert(netdev->type == NET_CLIENT_DRIVER_NIC);
    nic = &netdev->u.nic;
894 895 896

    idx = nic_get_free_idx();
    if (idx == -1 || nb_nics >= MAX_NICS) {
897
        error_setg(errp, "too many NICs");
898 899 900 901 902 903 904
        return -1;
    }

    nd = &nd_table[idx];

    memset(nd, 0, sizeof(*nd));

905 906
    if (nic->has_netdev) {
        nd->netdev = qemu_find_netdev(nic->netdev);
M
Mark McLoughlin 已提交
907
        if (!nd->netdev) {
908
            error_setg(errp, "netdev '%s' not found", nic->netdev);
M
Mark McLoughlin 已提交
909 910 911
            return -1;
        }
    } else {
912 913
        assert(peer);
        nd->netdev = peer;
M
Mark McLoughlin 已提交
914
    }
915
    nd->name = g_strdup(name);
916 917
    if (nic->has_model) {
        nd->model = g_strdup(nic->model);
918
    }
919 920
    if (nic->has_addr) {
        nd->devaddr = g_strdup(nic->addr);
921 922
    }

923 924
    if (nic->has_macaddr &&
        net_parse_macaddr(nd->macaddr.a, nic->macaddr) < 0) {
925
        error_setg(errp, "invalid syntax for ethernet address");
926 927
        return -1;
    }
928 929
    if (nic->has_macaddr &&
        is_multicast_ether_addr(nd->macaddr.a)) {
930 931
        error_setg(errp,
                   "NIC cannot have multicast MAC address (odd 1st byte)");
932 933
        return -1;
    }
934
    qemu_macaddr_default_if_unset(&nd->macaddr);
935

936 937
    if (nic->has_vectors) {
        if (nic->vectors > 0x7ffffff) {
938
            error_setg(errp, "invalid # of vectors: %"PRIu32, nic->vectors);
939 940 941 942 943
            return -1;
        }
        nd->nvectors = nic->vectors;
    } else {
        nd->nvectors = DEV_NVECTORS_UNSPECIFIED;
944 945 946 947 948 949 950 951
    }

    nd->used = 1;
    nb_nics++;

    return idx;
}

952

953
static int (* const net_client_init_fun[NET_CLIENT_DRIVER__MAX])(
954
    const Netdev *netdev,
955
    const char *name,
956
    NetClientState *peer, Error **errp) = {
957
        [NET_CLIENT_DRIVER_NIC]       = net_init_nic,
M
Mark McLoughlin 已提交
958
#ifdef CONFIG_SLIRP
959
        [NET_CLIENT_DRIVER_USER]      = net_init_slirp,
960
#endif
961 962
        [NET_CLIENT_DRIVER_TAP]       = net_init_tap,
        [NET_CLIENT_DRIVER_SOCKET]    = net_init_socket,
M
Mark McLoughlin 已提交
963
#ifdef CONFIG_VDE
964
        [NET_CLIENT_DRIVER_VDE]       = net_init_vde,
965 966
#endif
#ifdef CONFIG_NETMAP
967
        [NET_CLIENT_DRIVER_NETMAP]    = net_init_netmap,
M
Mark McLoughlin 已提交
968
#endif
969
        [NET_CLIENT_DRIVER_DUMP]      = net_init_dump,
970
#ifdef CONFIG_NET_BRIDGE
971
        [NET_CLIENT_DRIVER_BRIDGE]    = net_init_bridge,
972
#endif
973
        [NET_CLIENT_DRIVER_HUBPORT]   = net_init_hubport,
974
#ifdef CONFIG_VHOST_NET_USED
975
        [NET_CLIENT_DRIVER_VHOST_USER] = net_init_vhost_user,
976
#endif
977
#ifdef CONFIG_L2TPV3
978
        [NET_CLIENT_DRIVER_L2TPV3]    = net_init_l2tpv3,
A
Anton Ivanov 已提交
979
#endif
980 981
};

982

E
Eric Blake 已提交
983
/*
 * Create one network client from an already-parsed QAPI object.
 *
 * @object points to a Netdev when @is_netdev is true, to a NetLegacy
 * otherwise.  A legacy object is first flattened into a temporary Netdev
 * and, unless it is a NIC carrying netdev=, gets a hub port as its peer.
 *
 * Returns 0 on success (legacy type "none" is a successful no-op) and -1
 * on failure, in which case an error is stored through @errp.
 */
static int net_client_init1(const void *object, bool is_netdev, Error **errp)
{
    static bool vlan_warned;
    Netdev legacy = {0};
    const Netdev *netdev;
    const char *name;
    NetClientState *peer = NULL;
    int rc;

    if (is_netdev) {
        bool usable;

        netdev = object;
        name = netdev->id;

        /* dump and nic are rejected here, as is any absent backend */
        usable = netdev->type != NET_CLIENT_DRIVER_DUMP &&
                 netdev->type != NET_CLIENT_DRIVER_NIC &&
                 net_client_init_fun[netdev->type];
        if (!usable) {
            error_setg(errp, QERR_INVALID_PARAMETER_VALUE, "type",
                       "a netdev backend type");
            return -1;
        }
    } else {
        const NetLegacy *net = object;
        const NetLegacyOptions *opts = net->opts;

        legacy.id = net->id;
        netdev = &legacy;
        /* missing optional values have been initialized to "all bits zero" */
        if (net->has_id) {
            name = net->id;
        } else {
            name = net->name;
        }

        /* Map the old options to the new flat type */
        switch (opts->type) {
        case NET_LEGACY_OPTIONS_TYPE_NONE:
            return 0; /* nothing to do */
        case NET_LEGACY_OPTIONS_TYPE_NIC:
            legacy.type = NET_CLIENT_DRIVER_NIC;
            legacy.u.nic = opts->u.nic;
            break;
        case NET_LEGACY_OPTIONS_TYPE_USER:
            legacy.type = NET_CLIENT_DRIVER_USER;
            legacy.u.user = opts->u.user;
            break;
        case NET_LEGACY_OPTIONS_TYPE_TAP:
            legacy.type = NET_CLIENT_DRIVER_TAP;
            legacy.u.tap = opts->u.tap;
            break;
        case NET_LEGACY_OPTIONS_TYPE_L2TPV3:
            legacy.type = NET_CLIENT_DRIVER_L2TPV3;
            legacy.u.l2tpv3 = opts->u.l2tpv3;
            break;
        case NET_LEGACY_OPTIONS_TYPE_SOCKET:
            legacy.type = NET_CLIENT_DRIVER_SOCKET;
            legacy.u.socket = opts->u.socket;
            break;
        case NET_LEGACY_OPTIONS_TYPE_VDE:
            legacy.type = NET_CLIENT_DRIVER_VDE;
            legacy.u.vde = opts->u.vde;
            break;
        case NET_LEGACY_OPTIONS_TYPE_DUMP:
            legacy.type = NET_CLIENT_DRIVER_DUMP;
            legacy.u.dump = opts->u.dump;
            break;
        case NET_LEGACY_OPTIONS_TYPE_BRIDGE:
            legacy.type = NET_CLIENT_DRIVER_BRIDGE;
            legacy.u.bridge = opts->u.bridge;
            break;
        case NET_LEGACY_OPTIONS_TYPE_NETMAP:
            legacy.type = NET_CLIENT_DRIVER_NETMAP;
            legacy.u.netmap = opts->u.netmap;
            break;
        case NET_LEGACY_OPTIONS_TYPE_VHOST_USER:
            legacy.type = NET_CLIENT_DRIVER_VHOST_USER;
            legacy.u.vhost_user = opts->u.vhost_user;
            break;
        default:
            abort();
        }

        if (net_client_init_fun[netdev->type] == NULL) {
            error_setg(errp, QERR_INVALID_PARAMETER_VALUE, "type",
                       "a net backend type (maybe it is not compiled "
                       "into this binary)");
            return -1;
        }

        /* Do not add to a vlan if it's a nic with a netdev= parameter. */
        if (!(netdev->type == NET_CLIENT_DRIVER_NIC &&
              opts->u.nic.has_netdev)) {
            peer = net_hub_add_port(net->has_vlan ? net->vlan : 0, NULL, NULL);
        }

        /* The deprecation notice is printed once per process. */
        if (net->has_vlan && !vlan_warned) {
            error_report("'vlan' is deprecated. Please use 'netdev' instead.");
            vlan_warned = true;
        }
    }

    rc = net_client_init_fun[netdev->type](netdev, name, peer, errp);
    if (rc >= 0) {
        return 0;
    }

    /* FIXME drop when all init functions store an Error */
    if (errp && !*errp) {
        error_setg(errp, QERR_DEVICE_INIT_FAILED,
                   NetClientDriver_str(netdev->type));
    }
    return -1;
}

M
Mark McLoughlin 已提交
1088

E
Eric Blake 已提交
1089
/*
 * Build a network client from @opts.
 *
 * The convenience option "ipv6-net=ADDR[/LEN]" is first split into
 * "ipv6-prefix" and "ipv6-prefixlen" (LEN defaults to 64).  The options are
 * then visited into a Netdev (@is_netdev true) or NetLegacy (@is_netdev
 * false) object, which is handed to net_client_init1() and freed afterwards.
 *
 * Returns the result of net_client_init1(), or -1 if option parsing or
 * visiting failed; in the failure case the error is propagated to @errp.
 */
int net_client_init(QemuOpts *opts, bool is_netdev, Error **errp)
{
    void *object = NULL;
    Error *err = NULL;
    int ret = -1;
    Visitor *v = opts_visitor_new(opts);
    /* Parse convenience option format ipv6-net=fec0::0[/64] */
    const char *ip6_net = qemu_opt_get(opts, "ipv6-net");

    if (ip6_net) {
        char buf[strlen(ip6_net) + 1];

        if (get_str_sep(buf, sizeof(buf), &ip6_net, '/') < 0) {
            /* Default 64bit prefix length.  */
            qemu_opt_set(opts, "ipv6-prefix", ip6_net, &error_abort);
            qemu_opt_set_number(opts, "ipv6-prefixlen", 64, &error_abort);
        } else {
            /* User-specified prefix length.  */
            unsigned long len;

            qemu_opt_set(opts, "ipv6-prefix", buf, &error_abort);
            if (qemu_strtoul(ip6_net, NULL, 10, &len)) {
                /*
                 * Record the failure in the local error and stop: going on
                 * would create the client anyway and could return success
                 * while an error is pending.
                 */
                error_setg(&err, QERR_INVALID_PARAMETER_VALUE,
                           "ipv6-prefixlen", "a number");
                goto out;
            }
            qemu_opt_set_number(opts, "ipv6-prefixlen", len, &error_abort);
        }
        qemu_opt_unset(opts, "ipv6-net");
    }

    if (is_netdev) {
        visit_type_Netdev(v, NULL, (Netdev **)&object, &err);
    } else {
        visit_type_NetLegacy(v, NULL, (NetLegacy **)&object, &err);
    }

    if (!err) {
        ret = net_client_init1(object, is_netdev, &err);
    }

    if (is_netdev) {
        qapi_free_Netdev(object);
    } else {
        qapi_free_NetLegacy(object);
    }

out:
    error_propagate(errp, err);
    visit_free(v);
    return ret;
}

1148

1149 1150 1151
static int net_host_check_device(const char *device)
{
    int i;
1152 1153 1154
    for (i = 0; host_net_devices[i]; i++) {
        if (!strncmp(host_net_devices[i], device,
                     strlen(host_net_devices[i]))) {
1155
            return 1;
1156
        }
1157 1158 1159 1160 1161
    }

    return 0;
}

1162
/*
 * HMP handler for "host_net_add": creates a legacy ("net" option group)
 * client whose type is the "device" argument, configured by the optional
 * "opts" argument.  Failures are reported, nothing is returned.
 */
void hmp_host_net_add(Monitor *mon, const QDict *qdict)
{
    static bool warned;
    const char *device = qdict_get_str(qdict, "device");
    const char *opts_str = qdict_get_try_str(qdict, "opts");
    Error *local_err = NULL;
    QemuOpts *opts;

    /* Print the deprecation notice once, and not at all under qtest. */
    if (!(warned || qtest_enabled())) {
        error_report("host_net_add is deprecated, use netdev_add instead");
        warned = true;
    }

    if (!net_host_check_device(device)) {
        monitor_printf(mon, "invalid host network device %s\n", device);
        return;
    }

    /* A missing "opts" argument is parsed as an empty option string. */
    if (!opts_str) {
        opts_str = "";
    }
    opts = qemu_opts_parse_noisily(qemu_find_opts("net"), opts_str, false);
    if (opts == NULL) {
        return;
    }

    qemu_opt_set(opts, "type", device, &error_abort);

    net_client_init(opts, false, &local_err);
    if (local_err) {
        error_report_err(local_err);
        monitor_printf(mon, "adding host network device %s failed\n", device);
    }
}

1195
/*
 * HMP handler for "host_net_remove": looks up the client named "device" on
 * hub "vlan_id", refuses NICs, and deletes the client, its peer and the
 * matching "net" options entry.
 */
void hmp_host_net_remove(Monitor *mon, const QDict *qdict)
{
    static bool warned;
    int vlan_id = qdict_get_int(qdict, "vlan_id");
    const char *device = qdict_get_str(qdict, "device");
    NetClientState *nc;

    /* Print the deprecation notice once, and not at all under qtest. */
    if (!(warned || qtest_enabled())) {
        error_report("host_net_remove is deprecated, use netdev_del instead");
        warned = true;
    }

    nc = net_hub_find_client_by_name(vlan_id, device);
    if (nc == NULL) {
        error_report("Host network device '%s' on hub '%d' not found",
                     device, vlan_id);
        return;
    }

    if (nc->info->type == NET_CLIENT_DRIVER_NIC) {
        error_report("invalid host network device '%s'", device);
        return;
    }

    /* The peer is removed first, then the client itself. */
    qemu_del_net_client(nc->peer);
    qemu_del_net_client(nc);
    qemu_opts_del(qemu_opts_find(qemu_find_opts("net"), device));
}

L
Luiz Capitulino 已提交
1223 1224
/*
 * Create a netdev backend from @opts.  The integer result of
 * net_client_init() is discarded; failure is visible only through @errp.
 */
void netdev_add(QemuOpts *opts, Error **errp)
{
    (void)net_client_init(opts, true, errp);
}

1228
/*
 * QMP handler for "netdev_add": converts @qdict into an entry of the
 * "netdev" option group and creates the backend from it.  The options
 * entry is deleted again if creation fails.  @ret is not written.
 */
void qmp_netdev_add(QDict *qdict, QObject **ret, Error **errp)
{
    Error *local_err = NULL;
    QemuOptsList *opts_list;
    QemuOpts *opts = NULL;

    opts_list = qemu_find_opts_err("netdev", &local_err);

    if (!local_err) {
        opts = qemu_opts_from_qdict(opts_list, qdict, &local_err);
    }

    if (!local_err) {
        netdev_add(opts, &local_err);
        if (local_err) {
            qemu_opts_del(opts);
        }
    }

    error_propagate(errp, local_err);
}

L
Luiz Capitulino 已提交
1254
/*
 * QMP handler for "netdev_del": removes the netdev called @id together
 * with its "netdev" options entry.  Sets @errp when no such client exists
 * or when it has no entry in the "netdev" option group.
 */
void qmp_netdev_del(const char *id, Error **errp)
{
    NetClientState *nc = qemu_find_netdev(id);
    QemuOpts *opts;

    if (nc == NULL) {
        error_set(errp, ERROR_CLASS_DEVICE_NOT_FOUND,
                  "Device '%s' not found", id);
        return;
    }

    opts = qemu_opts_find(qemu_find_opts_err("netdev", NULL), id);
    if (opts == NULL) {
        error_setg(errp, "Device '%s' is not a netdev", id);
        return;
    }

    qemu_del_net_client(nc);
    qemu_opts_del(opts);
}

1276 1277 1278 1279 1280
/*
 * Print every property of filter @nf except "type" to @mon as a
 * ",name=value" sequence, followed by a newline.
 */
static void netfilter_print_info(Monitor *mon, NetFilterState *nf)
{
    ObjectPropertyIterator iter;
    ObjectProperty *prop;
    Visitor *v;
    char *str;

    /* generate info str */
    object_property_iter_init(&iter, OBJECT(nf));
    for (prop = object_property_iter_next(&iter);
         prop;
         prop = object_property_iter_next(&iter)) {
        if (strcmp(prop->name, "type") == 0) {
            continue;
        }

        /* Render the property value as a string; errors are ignored. */
        v = string_output_visitor_new(false, &str);
        object_property_get(OBJECT(nf), v, prop->name, NULL);
        visit_complete(v, &str);
        visit_free(v);

        monitor_printf(mon, ",%s=%s", prop->name, str);
        g_free(str);
    }
    monitor_printf(mon, "\n");
}

1299
/*
 * Print a one-line summary of @nc to @mon, followed by one line per
 * attached filter when the client has any.
 */
void print_net_client(Monitor *mon, NetClientState *nc)
{
    NetFilterState *nf;

    monitor_printf(mon, "%s: index=%d,type=%s,%s\n",
                   nc->name,
                   nc->queue_index,
                   NetClientDriver_str(nc->info->type),
                   nc->info_str);

    if (QTAILQ_EMPTY(&nc->filters)) {
        return;
    }

    monitor_printf(mon, "filters:\n");
    QTAILQ_FOREACH(nf, &nc->filters, next) {
        char *path = object_get_canonical_path_component(OBJECT(nf));
        const char *type_name = object_get_typename(OBJECT(nf));

        monitor_printf(mon, "  - %s: type=%s", path, type_name);
        netfilter_print_info(mon, nf);
        g_free(path);
    }
}

1320 1321 1322 1323 1324 1325 1326 1327 1328 1329 1330 1331 1332 1333 1334
/*
 * QMP handler for "query-rx-filter".
 *
 * Without @has_name, collects the rx-filter info of every NIC that
 * implements query_rx_filter.  With @has_name, only the client called
 * @name is considered, and it is an error if that client is missing, is
 * not a NIC, or cannot be queried.
 *
 * Returns the list of results in net_clients order; NULL when there are
 * none or an error was set.
 */
RxFilterInfoList *qmp_query_rx_filter(bool has_name, const char *name,
                                      Error **errp)
{
    RxFilterInfoList *filter_list = NULL;
    RxFilterInfoList **tail = &filter_list;
    NetClientState *nc;

    QTAILQ_FOREACH(nc, &net_clients, next) {
        if (has_name && strcmp(nc->name, name) != 0) {
            continue;
        }

        /* only query rx-filter information of NIC */
        if (nc->info->type != NET_CLIENT_DRIVER_NIC) {
            if (!has_name) {
                continue;
            }
            error_setg(errp, "net client(%s) isn't a NIC", name);
            return NULL;
        }

        /* only query information on queue 0 since the info is per nic,
         * not per queue
         */
        if (nc->queue_index != 0) {
            continue;
        }

        if (nc->info->query_rx_filter) {
            RxFilterInfoList *entry;
            RxFilterInfo *info;

            info = nc->info->query_rx_filter(nc);
            entry = g_malloc0(sizeof(*entry));
            entry->value = info;

            /* Append at the tail so results keep iteration order. */
            *tail = entry;
            tail = &entry->next;
        } else if (has_name) {
            error_setg(errp, "net client(%s) doesn't support"
                       " rx-filter querying", name);
            return NULL;
        }

        if (has_name) {
            break;
        }
    }

    if (has_name && filter_list == NULL) {
        error_setg(errp, "invalid net client name: %s", name);
    }

    return filter_list;
}

1378
/*
 * HMP handler for "info network": prints the hub information, then every
 * client for which net_hub_id_for_client() does not return 0.  A NIC is
 * followed by its peer; a non-NIC client that has a peer is not printed
 * on its own.  @qdict is unused.
 */
void hmp_info_network(Monitor *mon, const QDict *qdict)
{
    NetClientState *nc;

    net_hub_info(mon);

    QTAILQ_FOREACH(nc, &net_clients, next) {
        NetClientState *peer = nc->peer;
        NetClientDriver type = nc->info->type;

        /* Skip if already printed in hub info */
        if (net_hub_id_for_client(nc, NULL) == 0) {
            continue;
        }

        /* a netdev connected to a NIC is printed with the NIC */
        if (peer && type != NET_CLIENT_DRIVER_NIC) {
            continue;
        }

        print_net_client(mon, nc);
        if (peer) {
            /* Reaching here with a peer implies nc is a NIC. */
            monitor_printf(mon, " \\ ");
            print_net_client(mon, peer);
        }
    }
}

L
Luiz Capitulino 已提交
1404
/*
 * QMP handler for "set_link": marks every queue of the client called
 * @name as up or down and invokes its link_status_changed callback.  The
 * peer's link flag follows only when the peer is a NIC; the peer's
 * callback is invoked in either case.  Sets @errp if no client matches.
 */
void qmp_set_link(const char *name, bool up, Error **errp)
{
    NetClientState *ncs[MAX_QUEUE_NUM];
    NetClientState *nc, *peer;
    int queues, q;

    queues = qemu_find_net_clients_except(name, ncs,
                                          NET_CLIENT_DRIVER__MAX,
                                          MAX_QUEUE_NUM);
    if (queues == 0) {
        error_set(errp, ERROR_CLASS_DEVICE_NOT_FOUND,
                  "Device '%s' not found", name);
        return;
    }

    for (q = 0; q < queues; q++) {
        ncs[q]->link_down = !up;
    }

    /* The callback runs once, on the first queue. */
    nc = ncs[0];
    if (nc->info->link_status_changed) {
        nc->info->link_status_changed(nc);
    }

    peer = nc->peer;
    if (!peer) {
        return;
    }

    /* Change peer link only if the peer is NIC and then notify peer.
     * If the peer is a HUBPORT or a backend, we do not change the
     * link status.
     *
     * This behavior is compatible with qemu vlans where there could be
     * multiple clients that can still communicate with each other in
     * disconnected mode. For now maintain this compatibility.
     */
    if (peer->info->type == NET_CLIENT_DRIVER_NIC) {
        for (q = 0; q < queues; q++) {
            ncs[q]->peer->link_down = !up;
        }
    }
    if (peer->info->link_status_changed) {
        peer->info->link_status_changed(peer);
    }
}

1449 1450 1451
/*
 * VM run-state callback: when the VM starts running, flush packets queued
 * for peers that can be sent to; when it stops, flush or purge each
 * client's queue.  @opaque and @state are unused.
 */
static void net_vm_change_state_handler(void *opaque, int running,
                                        RunState state)
{
    NetClientState *nc, *next_nc;

    QTAILQ_FOREACH_SAFE(nc, &net_clients, next, next_nc) {
        if (!running) {
            /* Complete all queued packets, to guarantee we don't modify
             * state later when VM is not running.
             */
            qemu_flush_or_purge_queued_packets(nc, true);
            continue;
        }

        /* Flush queued packets and wake up backends. */
        if (nc->peer && qemu_can_send_packet(nc)) {
            qemu_flush_queued_packets(nc->peer);
        }
    }
}

1470 1471
void net_cleanup(void)
{
J
Jason Wang 已提交
1472
    NetClientState *nc;
1473

J
Jason Wang 已提交
1474 1475 1476 1477 1478
    /* We may del multiple entries during qemu_del_net_client(),
     * so QTAILQ_FOREACH_SAFE() is also not safe here.
     */
    while (!QTAILQ_EMPTY(&net_clients)) {
        nc = QTAILQ_FIRST(&net_clients);
1479
        if (nc->info->type == NET_CLIENT_DRIVER_NIC) {
J
Jason Wang 已提交
1480 1481 1482 1483
            qemu_del_nic(qemu_get_nic(nc));
        } else {
            qemu_del_net_client(nc);
        }
1484
    }
1485 1486

    qemu_del_vm_change_state_handler(net_change_state_entry);
1487 1488
}

1489
void net_check_clients(void)
1490
{
1491
    NetClientState *nc;
1492
    int i;
1493

1494
    net_hub_check_clients();
1495

1496 1497
    QTAILQ_FOREACH(nc, &net_clients, next) {
        if (!nc->peer) {
1498
            warn_report("%s %s has no peer",
A
Alistair Francis 已提交
1499 1500 1501
                        nc->info->type == NET_CLIENT_DRIVER_NIC
                        ? "nic" : "netdev",
                        nc->name);
1502 1503
        }
    }
1504 1505 1506 1507 1508 1509 1510 1511

    /* Check that all NICs requested via -net nic actually got created.
     * NICs created via -device don't need to be checked here because
     * they are always instantiated.
     */
    for (i = 0; i < MAX_NICS; i++) {
        NICInfo *nd = &nd_table[i];
        if (nd->used && !nd->instantiated) {
1512 1513 1514 1515
            warn_report("requested NIC (%s, model %s) "
                        "was not created (not supported by this machine?)",
                        nd->name ? nd->name : "anonymous",
                        nd->model ? nd->model : "unspecified");
1516 1517
        }
    }
1518
}
1519

1520
/*
 * qemu_opts_foreach() callback creating one legacy ("net" group) client.
 * Reports any error itself; @dummy and @errp are unused.
 * Returns 0 when no error was raised, -1 otherwise.
 */
static int net_init_client(void *dummy, QemuOpts *opts, Error **errp)
{
    Error *local_err = NULL;

    net_client_init(opts, false, &local_err);
    if (!local_err) {
        return 0;
    }

    error_report_err(local_err);
    return -1;
}

1533
/*
 * qemu_opts_foreach() callback creating one "netdev" group backend.
 * Reports any error itself; @dummy and @errp are unused.
 * Returns -1 when an error was raised, else net_client_init()'s result.
 */
static int net_init_netdev(void *dummy, QemuOpts *opts, Error **errp)
{
    Error *local_err = NULL;
    int ret = net_client_init(opts, true, &local_err);

    if (!local_err) {
        return ret;
    }

    error_report_err(local_err);
    return -1;
}

int net_init_clients(void)
{
1549 1550
    QemuOptsList *net = qemu_find_opts("net");

1551 1552 1553
    net_change_state_entry =
        qemu_add_vm_change_state_handler(net_vm_change_state_handler, NULL);

1554
    QTAILQ_INIT(&net_clients);
1555

1556 1557
    if (qemu_opts_foreach(qemu_find_opts("netdev"),
                          net_init_netdev, NULL, NULL)) {
M
Mark McLoughlin 已提交
1558
        return -1;
1559
    }
M
Mark McLoughlin 已提交
1560

1561
    if (qemu_opts_foreach(net, net_init_client, NULL, NULL)) {
1562 1563 1564 1565 1566 1567
        return -1;
    }

    return 0;
}

1568
/*
 * Parse @optarg into @opts_list.
 * Returns 0 if qemu_opts_parse_noisily() produced an entry, -1 otherwise.
 */
int net_client_parse(QemuOptsList *opts_list, const char *optarg)
{
    return qemu_opts_parse_noisily(opts_list, optarg, true) ? 0 : -1;
}
1576 1577 1578

/* From FreeBSD */
/* XXX: optimize */
1579
uint32_t net_crc32(const uint8_t *p, int len)
1580 1581 1582 1583 1584 1585
{
    uint32_t crc;
    int carry, i, j;
    uint8_t b;

    crc = 0xffffffff;
1586 1587
    for (i = 0; i < len; i++) {
        b = *p++;
1588 1589 1590 1591 1592
        for (j = 0; j < 8; j++) {
            carry = ((crc & 0x80000000L) ? 1 : 0) ^ (b & 0x01);
            crc <<= 1;
            b >>= 1;
            if (carry) {
1593
                crc = ((crc ^ POLYNOMIAL_BE) | carry);
1594 1595 1596
            }
        }
    }
1597 1598 1599 1600

    return crc;
}

1601 1602 1603 1604 1605 1606 1607 1608 1609 1610 1611 1612 1613 1614 1615 1616 1617 1618 1619 1620 1621 1622
/*
 * Bitwise CRC-32 over @len bytes at @p: the register shifts right, each
 * input byte is consumed least-significant bit first, and POLYNOMIAL_LE
 * is folded in on carry.  The register starts at 0xffffffff and is
 * returned without a final inversion.
 */
uint32_t net_crc32_le(const uint8_t *p, int len)
{
    uint32_t crc = 0xffffffff;
    int byte_idx;

    for (byte_idx = 0; byte_idx < len; byte_idx++) {
        uint8_t b = p[byte_idx];
        int bit;

        for (bit = 0; bit < 8; bit++) {
            /* carry = low bit of the register XOR low bit of the data */
            int carry = (int)(crc & 0x1) ^ (b & 0x01);

            crc >>= 1;
            b >>= 1;
            if (carry) {
                crc ^= POLYNOMIAL_LE;
            }
        }
    }

    return crc;
}

1623 1624 1625 1626 1627 1628 1629 1630 1631 1632 1633 1634 1635 1636 1637 1638 1639 1640 1641 1642 1643 1644 1645 1646 1647
/*
 * Option group named "netdev".  This file looks the group up by that name
 * (qemu_find_opts("netdev")) to create, add and delete netdev backends.
 * The descriptor list is left empty on purpose, see below.
 */
QemuOptsList qemu_netdev_opts = {
    .name = "netdev",
    .implied_opt_name = "type",
    .head = QTAILQ_HEAD_INITIALIZER(qemu_netdev_opts.head),
    .desc = {
        /*
         * no elements => accept any params
         * validation will happen later
         */
        { /* end of list */ }
    },
};

/*
 * Option group named "net".  This file looks the group up by that name
 * (qemu_find_opts("net")) for the legacy client paths such as
 * host_net_add/host_net_remove and net_init_clients().
 * The descriptor list is left empty on purpose, see below.
 */
QemuOptsList qemu_net_opts = {
    .name = "net",
    .implied_opt_name = "type",
    .head = QTAILQ_HEAD_INITIALIZER(qemu_net_opts.head),
    .desc = {
        /*
         * no elements => accept any params
         * validation will happen later
         */
        { /* end of list */ }
    },
};
1648 1649

void net_socket_rs_init(SocketReadState *rs,
1650 1651
                        SocketReadStateFinalize *finalize,
                        bool vnet_hdr)
1652 1653
{
    rs->state = 0;
1654
    rs->vnet_hdr = vnet_hdr;
1655 1656
    rs->index = 0;
    rs->packet_len = 0;
1657
    rs->vnet_hdr_len = 0;
1658 1659 1660 1661 1662 1663
    memset(rs->buf, 0, sizeof(rs->buf));
    rs->finalize = finalize;
}

/*
 * Collect a 4-byte network-order word at the start of rs->buf, consuming
 * as many bytes from *@buf / *@size as are available and still needed.
 *
 * Returns true once all four bytes are present; the decoded host-order
 * value is then stored in *@value and rs->index is reset to 0.  Returns
 * false when more input is required.
 */
static bool net_rs_fill_be32(SocketReadState *rs, const uint8_t **buf,
                             int *size, uint32_t *value)
{
    unsigned int l = 4 - rs->index;
    uint32_t raw;

    if (l > *size) {
        l = *size;
    }
    memcpy(rs->buf + rs->index, *buf, l);
    *buf += l;
    *size -= l;
    rs->index += l;
    if (rs->index != 4) {
        return false;
    }

    /* Copy out instead of casting rs->buf to uint32_t *, which would be
     * a type-punned (and possibly misaligned) access.
     */
    memcpy(&raw, rs->buf, sizeof(raw));
    *value = ntohl(raw);
    rs->index = 0;
    return true;
}

/*
 * Feed @size bytes at @buf into the packet reassembly state @rs.
 * rs->finalize is called each time a complete packet has been gathered
 * in rs->buf.
 *
 * Returns
 * 0: success
 * -1: error occurs (the packet does not fit into rs->buf; the state
 *     machine is reset to state 0)
 */
int net_fill_rstate(SocketReadState *rs, const uint8_t *buf, int size)
{
    unsigned int l;
    uint32_t word;

    while (size > 0) {
        /* Reassemble a packet from the network.
         * 0 = getting length.
         * 1 = getting vnet header length.
         * 2 = getting data.
         */
        switch (rs->state) {
        case 0:
            if (net_rs_fill_be32(rs, &buf, &size, &word)) {
                /* got length */
                rs->packet_len = word;
                if (rs->vnet_hdr) {
                    rs->state = 1;
                } else {
                    rs->state = 2;
                    rs->vnet_hdr_len = 0;
                }
            }
            break;
        case 1:
            if (net_rs_fill_be32(rs, &buf, &size, &word)) {
                /* got vnet header length */
                rs->vnet_hdr_len = word;
                rs->state = 2;
            }
            break;
        case 2:
            l = rs->packet_len - rs->index;
            if (l > size) {
                l = size;
            }
            if (rs->index + l <= sizeof(rs->buf)) {
                memcpy(rs->buf + rs->index, buf, l);
            } else {
                fprintf(stderr, "serious error: oversized packet received,"
                    "connection terminated.\n");
                rs->index = rs->state = 0;
                return -1;
            }

            rs->index += l;
            buf += l;
            size -= l;
            if (rs->index >= rs->packet_len) {
                rs->index = 0;
                rs->state = 0;
                assert(rs->finalize);
                rs->finalize(rs);
            }
            break;
        default:
            /* Only states 0..2 are ever assigned; without this the loop
             * would spin forever because no input would be consumed.
             */
            abort();
        }
    }

    assert(size == 0);
    return 0;
}