virtio_net.c 43.9 KB
Newer Older
1
/* A network driver using virtio.
R
Rusty Russell 已提交
2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21
 *
 * Copyright 2007 Rusty Russell <rusty@rustcorp.com.au> IBM Corporation
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation; either version 2 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program; if not, write to the Free Software
 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
 */
//#define DEBUG
#include <linux/netdevice.h>
#include <linux/etherdevice.h>
22
#include <linux/ethtool.h>
R
Rusty Russell 已提交
23 24 25 26
#include <linux/module.h>
#include <linux/virtio.h>
#include <linux/virtio_net.h>
#include <linux/scatterlist.h>
27
#include <linux/if_vlan.h>
28
#include <linux/slab.h>
29
#include <linux/cpu.h>
R
Rusty Russell 已提交
30

31
static int napi_weight = NAPI_POLL_WEIGHT;
32 33
module_param(napi_weight, int, 0444);

34
static bool csum = true, gso = true;
R
Rusty Russell 已提交
35 36 37
module_param(csum, bool, 0444);
module_param(gso, bool, 0444);

R
Rusty Russell 已提交
38
/* FIXME: MTU in config. */
39
#define MAX_PACKET_LEN (ETH_HLEN + VLAN_HLEN + ETH_DATA_LEN)
40
#define GOOD_COPY_LEN	128
R
Rusty Russell 已提交
41

42
#define VIRTNET_DRIVER_VERSION "1.0.0"
43

44
struct virtnet_stats {
45 46
	struct u64_stats_sync tx_syncp;
	struct u64_stats_sync rx_syncp;
47 48 49 50 51 52 53
	u64 tx_bytes;
	u64 tx_packets;

	u64 rx_bytes;
	u64 rx_packets;
};

54 55 56 57 58 59 60
/* Internal representation of a send virtqueue */
struct send_queue {
	/* Virtqueue associated with this send_queue */
	struct virtqueue *vq;

	/* TX: fragments + linear part + virtio header */
	struct scatterlist sg[MAX_SKB_FRAGS + 2];

	/* Name of the send queue: output.$index */
	char name[40];
};

/* Internal representation of a receive virtqueue */
struct receive_queue {
	/* Virtqueue associated with this receive_queue */
	struct virtqueue *vq;

R
Rusty Russell 已提交
71 72 73 74 75
	struct napi_struct napi;

	/* Number of input buffers, and max we've ever had. */
	unsigned int num, max;

76 77 78 79 80
	/* Chain pages by the private ptr. */
	struct page *pages;

	/* RX: fragments + linear part + virtio header */
	struct scatterlist sg[MAX_SKB_FRAGS + 2];
J
Jason Wang 已提交
81 82 83

	/* Name of this receive queue: input.$index */
	char name[40];
84 85 86 87 88 89
};

struct virtnet_info {
	struct virtio_device *vdev;
	struct virtqueue *cvq;
	struct net_device *dev;
J
Jason Wang 已提交
90 91
	struct send_queue *sq;
	struct receive_queue *rq;
92 93
	unsigned int status;

J
Jason Wang 已提交
94 95 96 97 98 99
	/* Max # of queue pairs supported by the device */
	u16 max_queue_pairs;

	/* # of queue pairs currently used by the driver */
	u16 curr_queue_pairs;

100 101 102
	/* I like... big packets and I cannot lie! */
	bool big_packets;

103 104 105
	/* Host will merge rx buffers for big packets (shake it! shake it!) */
	bool mergeable_rx_bufs;

J
Jason Wang 已提交
106 107 108
	/* Has control virtqueue */
	bool has_cvq;

109 110 111
	/* Host can handle any s/g split between our header and packet data */
	bool any_header_sg;

112 113 114
	/* enable config space updates */
	bool config_enable;

115 116 117
	/* Active statistics */
	struct virtnet_stats __percpu *stats;

118 119 120
	/* Work struct for refilling if we run low on memory. */
	struct delayed_work refill;

121 122 123 124 125
	/* Work struct for config space updates */
	struct work_struct config_work;

	/* Lock for config space updates */
	struct mutex config_lock;
J
Jason Wang 已提交
126 127 128

	/* Does the affinity hint is set for virtqueues? */
	bool affinity_hint_set;
129 130 131

	/* Per-cpu variable to show the mapping from CPU to virtqueue */
	int __percpu *vq_index;
132 133 134

	/* CPU hot plug notifier */
	struct notifier_block nb;
R
Rusty Russell 已提交
135 136
};

137 138 139 140 141 142 143
/*
 * virtio-net header as kept in skb->cb (see skb_vnet_hdr()).  The union
 * overlays the plain header with the mergeable-rx-buffer variant; which
 * one is in use follows virtnet_info.mergeable_rx_bufs.
 */
struct skb_vnet_hdr {
	union {
		struct virtio_net_hdr hdr;
		struct virtio_net_hdr_mrg_rxbuf mhdr;
	};
};

144 145 146 147 148 149 150 151 152 153
/*
 * Layout at the start of the first page of a big-packet receive buffer:
 * add_recvbuf_big() and page_to_skb() place the packet data at offset
 * sizeof(struct padded_vnet_hdr) within that page.
 */
struct padded_vnet_hdr {
	struct virtio_net_hdr hdr;
	/*
	 * virtio_net_hdr should be in a separated sg buffer because of a
	 * QEMU bug, and data sg buffer shares same page with this header sg.
	 * This padding makes next sg 16 byte aligned after virtio_net_hdr.
	 */
	char padding[6];
};

J
Jason Wang 已提交
154 155 156 157 158
/* Converting between virtqueue no. and kernel tx/rx queue no.
 * 0:rx0 1:tx0 2:rx1 3:tx1 ... 2N:rxN 2N+1:txN 2N+2:cvq
 */
static int vq2txq(struct virtqueue *vq)
{
159
	return (vq->index - 1) / 2;
J
Jason Wang 已提交
160 161 162 163 164 165 166 167 168
}

/* Map kernel tx queue number to its virtqueue index (the odd slots). */
static int txq2vq(int txq)
{
	int pair_base = 2 * txq;

	return pair_base + 1;
}

static int vq2rxq(struct virtqueue *vq)
{
169
	return vq->index / 2;
J
Jason Wang 已提交
170 171 172 173 174 175 176
}

/* Map kernel rx queue number to its virtqueue index (the even slots). */
static int rxq2vq(int rxq)
{
	int vq_index = 2 * rxq;

	return vq_index;
}

177
static inline struct skb_vnet_hdr *skb_vnet_hdr(struct sk_buff *skb)
R
Rusty Russell 已提交
178
{
179
	return (struct skb_vnet_hdr *)skb->cb;
R
Rusty Russell 已提交
180 181
}

182 183 184 185
/*
 * page->private is used to chain pages; a returned chain is spliced onto
 * the front of the queue's page pool so that the most recently used pages
 * are reused first.
 */
186
static void give_pages(struct receive_queue *rq, struct page *page)
187
{
188
	struct page *end;
189

190
	/* Find end of list, sew whole thing into vi->rq.pages. */
191
	for (end = page; end->private; end = (struct page *)end->private);
192 193
	end->private = (unsigned long)rq->pages;
	rq->pages = page;
194 195
}

196
/*
 * Take one page from the queue's pool, or allocate a fresh one with
 * @gfp_mask when the pool is empty.  Returns NULL only if that
 * allocation fails.
 */
static struct page *get_a_page(struct receive_queue *rq, gfp_t gfp_mask)
{
	struct page *head = rq->pages;

	if (!head)
		return alloc_page(gfp_mask);

	rq->pages = (struct page *)head->private;
	/* private is the chain link; clear it before handing the page out */
	head->private = 0;
	return head;
}

209
static void skb_xmit_done(struct virtqueue *vq)
R
Rusty Russell 已提交
210
{
211
	struct virtnet_info *vi = vq->vdev->priv;
R
Rusty Russell 已提交
212

213
	/* Suppress further interrupts. */
214
	virtqueue_disable_cb(vq);
215

216
	/* We were probably waiting for more output buffers. */
J
Jason Wang 已提交
217
	netif_wake_subqueue(vi->dev, vq2txq(vq));
R
Rusty Russell 已提交
218 219
}

220 221
static void set_skb_frag(struct sk_buff *skb, struct page *page,
			 unsigned int offset, unsigned int *len)
R
Rusty Russell 已提交
222
{
223
	int size = min((unsigned)PAGE_SIZE - offset, *len);
224 225
	int i = skb_shinfo(skb)->nr_frags;

226
	__skb_fill_page_desc(skb, i, page, offset, size);
227

228 229
	skb->data_len += size;
	skb->len += size;
230
	skb->truesize += PAGE_SIZE;
231
	skb_shinfo(skb)->nr_frags++;
232
	skb_shinfo(skb)->tx_flags |= SKBTX_SHARED_FRAG;
233
	*len -= size;
234
}
235

236
/* Called from bottom half context */
237
static struct sk_buff *page_to_skb(struct receive_queue *rq,
238 239
				   struct page *page, unsigned int len)
{
240
	struct virtnet_info *vi = rq->vq->vdev->priv;
241 242 243 244
	struct sk_buff *skb;
	struct skb_vnet_hdr *hdr;
	unsigned int copy, hdr_len, offset;
	char *p;
245

246
	p = page_address(page);
247

248 249 250 251
	/* copy small packet so we can reuse these pages for small data */
	skb = netdev_alloc_skb_ip_align(vi->dev, GOOD_COPY_LEN);
	if (unlikely(!skb))
		return NULL;
252

253
	hdr = skb_vnet_hdr(skb);
254

255 256 257 258 259 260 261
	if (vi->mergeable_rx_bufs) {
		hdr_len = sizeof hdr->mhdr;
		offset = hdr_len;
	} else {
		hdr_len = sizeof hdr->hdr;
		offset = sizeof(struct padded_vnet_hdr);
	}
262

263
	memcpy(hdr, p, hdr_len);
264

265 266
	len -= hdr_len;
	p += offset;
267

268 269 270 271
	copy = len;
	if (copy > skb_tailroom(skb))
		copy = skb_tailroom(skb);
	memcpy(skb_put(skb, copy), p, copy);
272

273 274
	len -= copy;
	offset += copy;
275

276 277 278 279 280 281 282
	/*
	 * Verify that we can indeed put this data into a skb.
	 * This is here to handle cases when the device erroneously
	 * tries to receive more than is possible. This is usually
	 * the case of a broken device.
	 */
	if (unlikely(len > MAX_SKB_FRAGS * PAGE_SIZE)) {
283
		net_dbg_ratelimited("%s: too much data\n", skb->dev->name);
284 285 286 287
		dev_kfree_skb(skb);
		return NULL;
	}

288 289 290 291 292
	while (len) {
		set_skb_frag(skb, page, offset, &len);
		page = (struct page *)page->private;
		offset = 0;
	}
293

294
	if (page)
295
		give_pages(rq, page);
296

297 298
	return skb;
}
299

300
static int receive_mergeable(struct receive_queue *rq, struct sk_buff *skb)
301 302 303 304 305 306 307 308 309 310 311 312 313
{
	struct skb_vnet_hdr *hdr = skb_vnet_hdr(skb);
	struct page *page;
	int num_buf, i, len;

	num_buf = hdr->mhdr.num_buffers;
	while (--num_buf) {
		i = skb_shinfo(skb)->nr_frags;
		if (i >= MAX_SKB_FRAGS) {
			pr_debug("%s: packet too long\n", skb->dev->name);
			skb->dev->stats.rx_length_errors++;
			return -EINVAL;
		}
314
		page = virtqueue_get_buf(rq->vq, &len);
315 316 317 318 319
		if (!page) {
			pr_debug("%s: rx error: %d buffers missing\n",
				 skb->dev->name, hdr->mhdr.num_buffers);
			skb->dev->stats.rx_length_errors++;
			return -EINVAL;
320
		}
321

322 323 324 325 326
		if (len > PAGE_SIZE)
			len = PAGE_SIZE;

		set_skb_frag(skb, page, 0, &len);

327
		--rq->num;
328 329 330 331
	}
	return 0;
}

332
static void receive_buf(struct receive_queue *rq, void *buf, unsigned int len)
333
{
334 335
	struct virtnet_info *vi = rq->vq->vdev->priv;
	struct net_device *dev = vi->dev;
E
Eric Dumazet 已提交
336
	struct virtnet_stats *stats = this_cpu_ptr(vi->stats);
337 338 339
	struct sk_buff *skb;
	struct page *page;
	struct skb_vnet_hdr *hdr;
340

341 342 343 344
	if (unlikely(len < sizeof(struct virtio_net_hdr) + ETH_HLEN)) {
		pr_debug("%s: short packet %i\n", dev->name, len);
		dev->stats.rx_length_errors++;
		if (vi->mergeable_rx_bufs || vi->big_packets)
345
			give_pages(rq, buf);
346 347 348 349
		else
			dev_kfree_skb(buf);
		return;
	}
350

351 352 353 354 355 356
	if (!vi->mergeable_rx_bufs && !vi->big_packets) {
		skb = buf;
		len -= sizeof(struct virtio_net_hdr);
		skb_trim(skb, len);
	} else {
		page = buf;
357
		skb = page_to_skb(rq, page, len);
358
		if (unlikely(!skb)) {
359
			dev->stats.rx_dropped++;
360
			give_pages(rq, page);
361
			return;
362
		}
363
		if (vi->mergeable_rx_bufs)
364
			if (receive_mergeable(rq, skb)) {
365 366 367
				dev_kfree_skb(skb);
				return;
			}
368
	}
369

370
	hdr = skb_vnet_hdr(skb);
371

372
	u64_stats_update_begin(&stats->rx_syncp);
373 374
	stats->rx_bytes += skb->len;
	stats->rx_packets++;
375
	u64_stats_update_end(&stats->rx_syncp);
R
Rusty Russell 已提交
376

377
	if (hdr->hdr.flags & VIRTIO_NET_HDR_F_NEEDS_CSUM) {
R
Rusty Russell 已提交
378
		pr_debug("Needs csum!\n");
379 380 381
		if (!skb_partial_csum_set(skb,
					  hdr->hdr.csum_start,
					  hdr->hdr.csum_offset))
R
Rusty Russell 已提交
382
			goto frame_err;
383 384
	} else if (hdr->hdr.flags & VIRTIO_NET_HDR_F_DATA_VALID) {
		skb->ip_summed = CHECKSUM_UNNECESSARY;
R
Rusty Russell 已提交
385 386
	}

387 388 389 390
	skb->protocol = eth_type_trans(skb, dev);
	pr_debug("Receiving skb proto 0x%04x len %i type %i\n",
		 ntohs(skb->protocol), skb->len, skb->pkt_type);

391
	if (hdr->hdr.gso_type != VIRTIO_NET_HDR_GSO_NONE) {
R
Rusty Russell 已提交
392
		pr_debug("GSO!\n");
393
		switch (hdr->hdr.gso_type & ~VIRTIO_NET_HDR_GSO_ECN) {
R
Rusty Russell 已提交
394
		case VIRTIO_NET_HDR_GSO_TCPV4:
395
			skb_shinfo(skb)->gso_type = SKB_GSO_TCPV4;
R
Rusty Russell 已提交
396 397
			break;
		case VIRTIO_NET_HDR_GSO_UDP:
398
			skb_shinfo(skb)->gso_type = SKB_GSO_UDP;
R
Rusty Russell 已提交
399 400
			break;
		case VIRTIO_NET_HDR_GSO_TCPV6:
401
			skb_shinfo(skb)->gso_type = SKB_GSO_TCPV6;
R
Rusty Russell 已提交
402 403
			break;
		default:
404 405
			net_warn_ratelimited("%s: bad gso type %u.\n",
					     dev->name, hdr->hdr.gso_type);
R
Rusty Russell 已提交
406 407 408
			goto frame_err;
		}

409
		if (hdr->hdr.gso_type & VIRTIO_NET_HDR_GSO_ECN)
410
			skb_shinfo(skb)->gso_type |= SKB_GSO_TCP_ECN;
R
Rusty Russell 已提交
411

412
		skb_shinfo(skb)->gso_size = hdr->hdr.gso_size;
R
Rusty Russell 已提交
413
		if (skb_shinfo(skb)->gso_size == 0) {
414
			net_warn_ratelimited("%s: zero gso size.\n", dev->name);
R
Rusty Russell 已提交
415 416 417 418 419 420 421 422 423 424 425 426 427 428 429 430
			goto frame_err;
		}

		/* Header must be checked, and gso_segs computed. */
		skb_shinfo(skb)->gso_type |= SKB_GSO_DODGY;
		skb_shinfo(skb)->gso_segs = 0;
	}

	netif_receive_skb(skb);
	return;

frame_err:
	dev->stats.rx_frame_errors++;
	dev_kfree_skb(skb);
}

431
/*
 * Post one small receive buffer: an skb with MAX_PACKET_LEN bytes of
 * data, exposed to the device as two sg entries (the header kept in
 * skb->cb, then the skb data).  Returns -ENOMEM if the skb cannot be
 * allocated, otherwise the result of virtqueue_add_inbuf(); the skb is
 * freed again when queuing fails.
 */
static int add_recvbuf_small(struct receive_queue *rq, gfp_t gfp)
{
	struct virtnet_info *vi = rq->vq->vdev->priv;
	struct skb_vnet_hdr *hdr;
	struct sk_buff *skb;
	int ret;

	skb = __netdev_alloc_skb_ip_align(vi->dev, MAX_PACKET_LEN, gfp);
	if (unlikely(!skb))
		return -ENOMEM;

	skb_put(skb, MAX_PACKET_LEN);

	hdr = skb_vnet_hdr(skb);
	sg_set_buf(&rq->sg[0], &hdr->hdr, sizeof hdr->hdr);
	skb_to_sgvec(skb, &rq->sg[1], 0, skb->len);

	ret = virtqueue_add_inbuf(rq->vq, rq->sg, 2, skb, gfp);
	if (ret >= 0)
		return ret;

	dev_kfree_skb(skb);
	return ret;
}
455

456
/*
 * Post one big-packet receive buffer made of MAX_SKB_FRAGS + 1 pages
 * chained through page->private.
 *
 * sg[0] and sg[1] share the first page (header, then data starting at
 * sizeof(struct padded_vnet_hdr)); sg[2..MAX_SKB_FRAGS + 1] each cover one
 * full page.  Returns -ENOMEM when a page cannot be obtained, otherwise
 * the result of virtqueue_add_inbuf().  On any failure the pages gathered
 * so far go back to the queue's pool.
 */
static int add_recvbuf_big(struct receive_queue *rq, gfp_t gfp)
{
	const int hdr_room = sizeof(struct padded_vnet_hdr);
	struct page *chain = NULL;
	struct page *pg;
	char *base;
	int slot, ret;

	/* page in rq->sg[MAX_SKB_FRAGS + 1] is list tail */
	for (slot = MAX_SKB_FRAGS + 1; slot > 1; slot--) {
		pg = get_a_page(rq, gfp);
		if (!pg) {
			if (chain)
				give_pages(rq, chain);
			return -ENOMEM;
		}
		sg_set_buf(&rq->sg[slot], page_address(pg), PAGE_SIZE);

		/* chain new page in list head to match sg */
		pg->private = (unsigned long)chain;
		chain = pg;
	}

	pg = get_a_page(rq, gfp);
	if (!pg) {
		give_pages(rq, chain);
		return -ENOMEM;
	}
	base = page_address(pg);

	/* rq->sg[0], rq->sg[1] share the same page */
	/* a separated rq->sg[0] for virtio_net_hdr only due to QEMU bug */
	sg_set_buf(&rq->sg[0], base, sizeof(struct virtio_net_hdr));

	/* rq->sg[1] for data packet, from offset */
	sg_set_buf(&rq->sg[1], base + hdr_room, PAGE_SIZE - hdr_room);

	/* chain first in list head */
	pg->private = (unsigned long)chain;

	ret = virtqueue_add_inbuf(rq->vq, rq->sg, MAX_SKB_FRAGS + 2,
				  pg, gfp);
	if (ret < 0)
		give_pages(rq, pg);

	return ret;
}

502
/*
 * Post a single full page as a mergeable receive buffer.  Returns -ENOMEM
 * when no page is available, otherwise the result of
 * virtqueue_add_inbuf(); the page returns to the pool if queuing fails.
 */
static int add_recvbuf_mergeable(struct receive_queue *rq, gfp_t gfp)
{
	struct page *pg = get_a_page(rq, gfp);
	int ret;

	if (!pg)
		return -ENOMEM;

	sg_init_one(rq->sg, page_address(pg), PAGE_SIZE);

	ret = virtqueue_add_inbuf(rq->vq, rq->sg, 1, pg, gfp);
	if (ret >= 0)
		return ret;

	give_pages(rq, pg);
	return ret;
}
519

520 521 522 523 524 525 526
/*
 * Returns false if we couldn't fill entirely (OOM).
 *
 * Normally run in the receive path, but can also be run from ndo_open
 * before we're receiving packets, or from refill_work which is
 * careful to disable receiving (using napi_disable).
 */
527
static bool try_fill_recv(struct receive_queue *rq, gfp_t gfp)
{
	struct virtnet_info *vi = rq->vq->vdev->priv;
	int err;

	/* Keep posting buffers until one fails or the ring has no room. */
	for (;;) {
		if (vi->mergeable_rx_bufs)
			err = add_recvbuf_mergeable(rq, gfp);
		else if (vi->big_packets)
			err = add_recvbuf_big(rq, gfp);
		else
			err = add_recvbuf_small(rq, gfp);

		if (err)
			break;

		++rq->num;
		if (!rq->vq->num_free)
			break;
	}

	/* Track the high-water mark of posted buffers. */
	if (unlikely(rq->num > rq->max))
		rq->max = rq->num;

	if (unlikely(!virtqueue_kick(rq->vq)))
		return false;

	/* Only running out of memory counts as "could not fill". */
	return err != -ENOMEM;
}

553
static void skb_recv_done(struct virtqueue *rvq)
R
Rusty Russell 已提交
554 555
{
	struct virtnet_info *vi = rvq->vdev->priv;
J
Jason Wang 已提交
556
	struct receive_queue *rq = &vi->rq[vq2rxq(rvq)];
557

558
	/* Schedule NAPI, Suppress further interrupts if successful. */
559
	if (napi_schedule_prep(&rq->napi)) {
560
		virtqueue_disable_cb(rvq);
561
		__napi_schedule(&rq->napi);
562
	}
R
Rusty Russell 已提交
563 564
}

565
static void virtnet_napi_enable(struct receive_queue *rq)
566
{
567
	napi_enable(&rq->napi);
568 569 570 571 572

	/* If all buffers were filled by other side before we napi_enabled, we
	 * won't get another interrupt, so process any outstanding packets
	 * now.  virtnet_poll wants re-enable the queue, so we disable here.
	 * We synchronize against interrupts via NAPI_STATE_SCHED */
573 574
	if (napi_schedule_prep(&rq->napi)) {
		virtqueue_disable_cb(rq->vq);
575
		local_bh_disable();
576
		__napi_schedule(&rq->napi);
577
		local_bh_enable();
578 579 580
	}
}

581 582
static void refill_work(struct work_struct *work)
{
583 584
	struct virtnet_info *vi =
		container_of(work, struct virtnet_info, refill.work);
585
	bool still_empty;
J
Jason Wang 已提交
586 587
	int i;

588
	for (i = 0; i < vi->curr_queue_pairs; i++) {
J
Jason Wang 已提交
589
		struct receive_queue *rq = &vi->rq[i];
590

J
Jason Wang 已提交
591 592 593
		napi_disable(&rq->napi);
		still_empty = !try_fill_recv(rq, GFP_KERNEL);
		virtnet_napi_enable(rq);
594

J
Jason Wang 已提交
595 596 597 598 599 600
		/* In theory, this can happen: if we don't get any buffers in
		 * we will *never* try to fill again.
		 */
		if (still_empty)
			schedule_delayed_work(&vi->refill, HZ/2);
	}
601 602
}

R
Rusty Russell 已提交
603 604
static int virtnet_poll(struct napi_struct *napi, int budget)
{
605 606 607
	struct receive_queue *rq =
		container_of(napi, struct receive_queue, napi);
	struct virtnet_info *vi = rq->vq->vdev->priv;
608
	void *buf;
609
	unsigned int r, len, received = 0;
R
Rusty Russell 已提交
610 611 612

again:
	while (received < budget &&
613 614 615
	       (buf = virtqueue_get_buf(rq->vq, &len)) != NULL) {
		receive_buf(rq, buf, len);
		--rq->num;
R
Rusty Russell 已提交
616 617 618
		received++;
	}

619 620
	if (rq->num < rq->max / 2) {
		if (!try_fill_recv(rq, GFP_ATOMIC))
621
			schedule_delayed_work(&vi->refill, 0);
622
	}
R
Rusty Russell 已提交
623

624 625
	/* Out of packets? */
	if (received < budget) {
626
		r = virtqueue_enable_cb_prepare(rq->vq);
627
		napi_complete(napi);
628
		if (unlikely(virtqueue_poll(rq->vq, r)) &&
629
		    napi_schedule_prep(napi)) {
630
			virtqueue_disable_cb(rq->vq);
631
			__napi_schedule(napi);
R
Rusty Russell 已提交
632
			goto again;
633
		}
R
Rusty Russell 已提交
634 635 636 637 638
	}

	return received;
}

J
Jason Wang 已提交
639 640 641 642 643
static int virtnet_open(struct net_device *dev)
{
	struct virtnet_info *vi = netdev_priv(dev);
	int i;

644 645 646 647 648
	for (i = 0; i < vi->max_queue_pairs; i++) {
		if (i < vi->curr_queue_pairs)
			/* Make sure we have some buffers: if oom use wq. */
			if (!try_fill_recv(&vi->rq[i], GFP_KERNEL))
				schedule_delayed_work(&vi->refill, 0);
J
Jason Wang 已提交
649 650 651 652 653 654
		virtnet_napi_enable(&vi->rq[i]);
	}

	return 0;
}

655
static void free_old_xmit_skbs(struct send_queue *sq)
R
Rusty Russell 已提交
656 657
{
	struct sk_buff *skb;
658
	unsigned int len;
659
	struct virtnet_info *vi = sq->vq->vdev->priv;
E
Eric Dumazet 已提交
660
	struct virtnet_stats *stats = this_cpu_ptr(vi->stats);
R
Rusty Russell 已提交
661

662
	while ((skb = virtqueue_get_buf(sq->vq, &len)) != NULL) {
R
Rusty Russell 已提交
663
		pr_debug("Sent skb %p\n", skb);
664

665
		u64_stats_update_begin(&stats->tx_syncp);
666 667
		stats->tx_bytes += skb->len;
		stats->tx_packets++;
668
		u64_stats_update_end(&stats->tx_syncp);
669

670
		dev_kfree_skb_any(skb);
R
Rusty Russell 已提交
671 672 673
	}
}

674
static int xmit_skb(struct send_queue *sq, struct sk_buff *skb)
R
Rusty Russell 已提交
675
{
676
	struct skb_vnet_hdr *hdr;
R
Rusty Russell 已提交
677
	const unsigned char *dest = ((struct ethhdr *)skb->data)->h_dest;
678
	struct virtnet_info *vi = sq->vq->vdev->priv;
679
	unsigned num_sg;
680 681
	unsigned hdr_len;
	bool can_push;
R
Rusty Russell 已提交
682

J
Johannes Berg 已提交
683
	pr_debug("%s: xmit %p %pM\n", vi->dev->name, skb, dest);
684 685 686 687 688 689 690 691 692 693 694 695 696 697
	if (vi->mergeable_rx_bufs)
		hdr_len = sizeof hdr->mhdr;
	else
		hdr_len = sizeof hdr->hdr;

	can_push = vi->any_header_sg &&
		!((unsigned long)skb->data & (__alignof__(*hdr) - 1)) &&
		!skb_header_cloned(skb) && skb_headroom(skb) >= hdr_len;
	/* Even if we can, don't push here yet as this would skew
	 * csum_start offset below. */
	if (can_push)
		hdr = (struct skb_vnet_hdr *)(skb->data - hdr_len);
	else
		hdr = skb_vnet_hdr(skb);
R
Rusty Russell 已提交
698 699

	if (skb->ip_summed == CHECKSUM_PARTIAL) {
700
		hdr->hdr.flags = VIRTIO_NET_HDR_F_NEEDS_CSUM;
701
		hdr->hdr.csum_start = skb_checksum_start_offset(skb);
702
		hdr->hdr.csum_offset = skb->csum_offset;
R
Rusty Russell 已提交
703
	} else {
704 705
		hdr->hdr.flags = 0;
		hdr->hdr.csum_offset = hdr->hdr.csum_start = 0;
R
Rusty Russell 已提交
706 707 708
	}

	if (skb_is_gso(skb)) {
709 710
		hdr->hdr.hdr_len = skb_headlen(skb);
		hdr->hdr.gso_size = skb_shinfo(skb)->gso_size;
R
Rusty Russell 已提交
711
		if (skb_shinfo(skb)->gso_type & SKB_GSO_TCPV4)
712
			hdr->hdr.gso_type = VIRTIO_NET_HDR_GSO_TCPV4;
R
Rusty Russell 已提交
713
		else if (skb_shinfo(skb)->gso_type & SKB_GSO_TCPV6)
714
			hdr->hdr.gso_type = VIRTIO_NET_HDR_GSO_TCPV6;
R
Rusty Russell 已提交
715
		else if (skb_shinfo(skb)->gso_type & SKB_GSO_UDP)
716
			hdr->hdr.gso_type = VIRTIO_NET_HDR_GSO_UDP;
R
Rusty Russell 已提交
717 718
		else
			BUG();
R
Rusty Russell 已提交
719
		if (skb_shinfo(skb)->gso_type & SKB_GSO_TCP_ECN)
720
			hdr->hdr.gso_type |= VIRTIO_NET_HDR_GSO_ECN;
R
Rusty Russell 已提交
721
	} else {
722 723
		hdr->hdr.gso_type = VIRTIO_NET_HDR_GSO_NONE;
		hdr->hdr.gso_size = hdr->hdr.hdr_len = 0;
R
Rusty Russell 已提交
724 725
	}

726
	if (vi->mergeable_rx_bufs)
727
		hdr->mhdr.num_buffers = 0;
728

729 730 731 732 733 734 735 736 737
	if (can_push) {
		__skb_push(skb, hdr_len);
		num_sg = skb_to_sgvec(skb, sq->sg, 0, skb->len);
		/* Pull header back to avoid skew in tx bytes calculations. */
		__skb_pull(skb, hdr_len);
	} else {
		sg_set_buf(sq->sg, hdr, hdr_len);
		num_sg = skb_to_sgvec(skb, sq->sg + 1, 0, skb->len) + 1;
	}
738
	return virtqueue_add_outbuf(sq->vq, sq->sg, num_sg, skb, GFP_ATOMIC);
739 740
}

741
static netdev_tx_t start_xmit(struct sk_buff *skb, struct net_device *dev)
742 743
{
	struct virtnet_info *vi = netdev_priv(dev);
J
Jason Wang 已提交
744 745
	int qnum = skb_get_queue_mapping(skb);
	struct send_queue *sq = &vi->sq[qnum];
746
	int err;
747 748

	/* Free up any pending old buffers before queueing new ones. */
749
	free_old_xmit_skbs(sq);
750

751
	/* Try to transmit */
752
	err = xmit_skb(sq, skb);
753

754
	/* This should not happen! */
755
	if (unlikely(err) || unlikely(!virtqueue_kick(sq->vq))) {
756 757 758
		dev->stats.tx_fifo_errors++;
		if (net_ratelimit())
			dev_warn(&dev->dev,
759
				 "Unexpected TXQ (%d) queue failure: %d\n", qnum, err);
760 761 762
		dev->stats.tx_dropped++;
		kfree_skb(skb);
		return NETDEV_TX_OK;
R
Rusty Russell 已提交
763
	}
764

765 766 767 768 769 770
	/* Don't wait up for transmitted skbs to be freed. */
	skb_orphan(skb);
	nf_reset(skb);

	/* Apparently nice girls don't return TX_BUSY; stop the queue
	 * before it gets out of hand.  Naturally, this wastes entries. */
771
	if (sq->vq->num_free < 2+MAX_SKB_FRAGS) {
J
Jason Wang 已提交
772
		netif_stop_subqueue(dev, qnum);
773
		if (unlikely(!virtqueue_enable_cb_delayed(sq->vq))) {
774
			/* More just got used, free them then recheck. */
775 776
			free_old_xmit_skbs(sq);
			if (sq->vq->num_free >= 2+MAX_SKB_FRAGS) {
J
Jason Wang 已提交
777
				netif_start_subqueue(dev, qnum);
778
				virtqueue_disable_cb(sq->vq);
779 780
			}
		}
781
	}
782 783

	return NETDEV_TX_OK;
R
Rusty Russell 已提交
784 785
}

786 787 788 789 790 791
/*
 * Send command via the control virtqueue and check status.  Commands
 * supported by the hypervisor, as indicated by feature bits, should
 * never fail unless improperly formatted.
 *
 * @out and @in are optional extra scatterlists (device-readable and
 * device-writable respectively); the command header and the status byte
 * are added around them.  Returns true only if the device acknowledged
 * the command with VIRTIO_NET_OK.
 */
static bool virtnet_send_command(struct virtnet_info *vi, u8 class, u8 cmd,
				 struct scatterlist *out,
				 struct scatterlist *in)
{
	struct scatterlist *sgs[4], hdr, stat;
	struct virtio_net_ctrl_hdr ctrl;
	/* Preset to a non-OK value so an unanswered command reads as failure. */
	virtio_net_ctrl_ack status = ~0;
	unsigned out_num = 0, in_num = 0, tmp;

	/* Caller should know better */
	BUG_ON(!virtio_has_feature(vi->vdev, VIRTIO_NET_F_CTRL_VQ));

	ctrl.class = class;
	ctrl.cmd = cmd;
	/* Add header */
	sg_init_one(&hdr, &ctrl, sizeof(ctrl));
	sgs[out_num++] = &hdr;

	if (out)
		sgs[out_num++] = out;
	if (in)
		sgs[out_num + in_num++] = in;

	/* Add return status. */
	sg_init_one(&stat, &status, sizeof(status));
	sgs[out_num + in_num++] = &stat;

	BUG_ON(out_num + in_num > ARRAY_SIZE(sgs));
	BUG_ON(virtqueue_add_sgs(vi->cvq, sgs, out_num, in_num, vi, GFP_ATOMIC)
	       < 0);

	if (unlikely(!virtqueue_kick(vi->cvq)))
		return status == VIRTIO_NET_OK;

	/* Spin for a response, the kick causes an ioport write, trapping
	 * into the hypervisor, so the request should be handled immediately.
	 * Give up if the virtqueue is marked broken, otherwise a dead
	 * device would keep this CPU spinning forever.
	 */
	while (!virtqueue_get_buf(vi->cvq, &tmp) &&
	       !virtqueue_is_broken(vi->cvq))
		cpu_relax();

	return status == VIRTIO_NET_OK;
}

834 835 836 837
static int virtnet_set_mac_address(struct net_device *dev, void *p)
{
	struct virtnet_info *vi = netdev_priv(dev);
	struct virtio_device *vdev = vi->vdev;
838
	int ret;
839 840
	struct sockaddr *addr = p;
	struct scatterlist sg;
841

842
	ret = eth_prepare_mac_addr_change(dev, p);
843 844
	if (ret)
		return ret;
845

846 847 848 849
	if (virtio_has_feature(vdev, VIRTIO_NET_F_CTRL_MAC_ADDR)) {
		sg_init_one(&sg, addr->sa_data, dev->addr_len);
		if (!virtnet_send_command(vi, VIRTIO_NET_CTRL_MAC,
					  VIRTIO_NET_CTRL_MAC_ADDR_SET,
850
					  &sg, NULL)) {
851 852 853 854 855
			dev_warn(&vdev->dev,
				 "Failed to set mac address by vq command.\n");
			return -EINVAL;
		}
	} else if (virtio_has_feature(vdev, VIRTIO_NET_F_MAC)) {
856 857 858 859 860 861 862
		unsigned int i;

		/* Naturally, this has an atomicity problem. */
		for (i = 0; i < dev->addr_len; i++)
			virtio_cwrite8(vdev,
				       offsetof(struct virtio_net_config, mac) +
				       i, addr->sa_data[i]);
863 864 865
	}

	eth_commit_mac_addr_change(dev, p);
866 867 868 869

	return 0;
}

870 871 872 873 874 875 876 877
/*
 * Fill @tot with device statistics: packet and byte counters are summed
 * over the per-CPU virtnet_stats of every possible CPU, and the error and
 * drop counters are copied from dev->stats.  Returns @tot.
 */
static struct rtnl_link_stats64 *virtnet_stats(struct net_device *dev,
					       struct rtnl_link_stats64 *tot)
{
	struct virtnet_info *vi = netdev_priv(dev);
	unsigned int seq;
	int cpu;

	for_each_possible_cpu(cpu) {
		struct virtnet_stats *pcpu = per_cpu_ptr(vi->stats, cpu);
		u64 tx_pkts, tx_octets, rx_pkts, rx_octets;

		/* Take a consistent snapshot of the tx pair. */
		do {
			seq = u64_stats_fetch_begin_bh(&pcpu->tx_syncp);
			tx_pkts = pcpu->tx_packets;
			tx_octets = pcpu->tx_bytes;
		} while (u64_stats_fetch_retry_bh(&pcpu->tx_syncp, seq));

		/* And likewise of the rx pair. */
		do {
			seq = u64_stats_fetch_begin_bh(&pcpu->rx_syncp);
			rx_pkts = pcpu->rx_packets;
			rx_octets = pcpu->rx_bytes;
		} while (u64_stats_fetch_retry_bh(&pcpu->rx_syncp, seq));

		tot->tx_packets += tx_pkts;
		tot->tx_bytes   += tx_octets;
		tot->rx_packets += rx_pkts;
		tot->rx_bytes   += rx_octets;
	}

	tot->tx_dropped = dev->stats.tx_dropped;
	tot->tx_fifo_errors = dev->stats.tx_fifo_errors;
	tot->rx_dropped = dev->stats.rx_dropped;
	tot->rx_length_errors = dev->stats.rx_length_errors;
	tot->rx_frame_errors = dev->stats.rx_frame_errors;

	return tot;
}

908 909 910 911
#ifdef CONFIG_NET_POLL_CONTROLLER
static void virtnet_netpoll(struct net_device *dev)
{
	struct virtnet_info *vi = netdev_priv(dev);
J
Jason Wang 已提交
912
	int i;
913

J
Jason Wang 已提交
914 915
	for (i = 0; i < vi->curr_queue_pairs; i++)
		napi_schedule(&vi->rq[i].napi);
916 917 918
}
#endif

919 920 921 922
static void virtnet_ack_link_announce(struct virtnet_info *vi)
{
	rtnl_lock();
	if (!virtnet_send_command(vi, VIRTIO_NET_CTRL_ANNOUNCE,
923
				  VIRTIO_NET_CTRL_ANNOUNCE_ACK, NULL, NULL))
924 925 926 927
		dev_warn(&vi->dev->dev, "Failed to ack link announce.\n");
	rtnl_unlock();
}

J
Jason Wang 已提交
928 929 930 931 932 933 934 935 936 937 938 939 940
/*
 * Tell the device how many queue pairs the driver will use.
 *
 * Does nothing (returns 0) without a control virtqueue or without
 * VIRTIO_NET_F_MQ.  On success records the new count and schedules a
 * refill; returns -EINVAL if the device rejects the command.
 */
static int virtnet_set_queues(struct virtnet_info *vi, u16 queue_pairs)
{
	struct net_device *dev = vi->dev;
	struct virtio_net_ctrl_mq mq;
	struct scatterlist sg;

	if (!(vi->has_cvq && virtio_has_feature(vi->vdev, VIRTIO_NET_F_MQ)))
		return 0;

	mq.virtqueue_pairs = queue_pairs;
	sg_init_one(&sg, &mq, sizeof(mq));

	if (!virtnet_send_command(vi, VIRTIO_NET_CTRL_MQ,
				  VIRTIO_NET_CTRL_MQ_VQ_PAIRS_SET, &sg, NULL)) {
		dev_warn(&dev->dev, "Fail to set num of queue pairs to %d\n",
			 queue_pairs);
		return -EINVAL;
	}

	vi->curr_queue_pairs = queue_pairs;
	/* Let the refill work post buffers for the queues now in use. */
	schedule_delayed_work(&vi->refill, 0);

	return 0;
}

R
Rusty Russell 已提交
953 954 955
static int virtnet_close(struct net_device *dev)
{
	struct virtnet_info *vi = netdev_priv(dev);
J
Jason Wang 已提交
956
	int i;
R
Rusty Russell 已提交
957

958 959
	/* Make sure refill_work doesn't re-enable napi! */
	cancel_delayed_work_sync(&vi->refill);
J
Jason Wang 已提交
960 961 962

	for (i = 0; i < vi->max_queue_pairs; i++)
		napi_disable(&vi->rq[i].napi);
R
Rusty Russell 已提交
963 964 965 966

	return 0;
}

967 968 969
static void virtnet_set_rx_mode(struct net_device *dev)
{
	struct virtnet_info *vi = netdev_priv(dev);
970
	struct scatterlist sg[2];
971
	u8 promisc, allmulti;
972
	struct virtio_net_ctrl_mac *mac_data;
J
Jiri Pirko 已提交
973
	struct netdev_hw_addr *ha;
974
	int uc_count;
975
	int mc_count;
976 977
	void *buf;
	int i;
978 979 980 981 982

	/* We can't dynamicaly set ndo_set_rx_mode, so return gracefully */
	if (!virtio_has_feature(vi->vdev, VIRTIO_NET_F_CTRL_RX))
		return;

983 984
	promisc = ((dev->flags & IFF_PROMISC) != 0);
	allmulti = ((dev->flags & IFF_ALLMULTI) != 0);
985

986
	sg_init_one(sg, &promisc, sizeof(promisc));
987 988 989

	if (!virtnet_send_command(vi, VIRTIO_NET_CTRL_RX,
				  VIRTIO_NET_CTRL_RX_PROMISC,
990
				  sg, NULL))
991 992 993
		dev_warn(&dev->dev, "Failed to %sable promisc mode.\n",
			 promisc ? "en" : "dis");

994
	sg_init_one(sg, &allmulti, sizeof(allmulti));
995 996 997

	if (!virtnet_send_command(vi, VIRTIO_NET_CTRL_RX,
				  VIRTIO_NET_CTRL_RX_ALLMULTI,
998
				  sg, NULL))
999 1000
		dev_warn(&dev->dev, "Failed to %sable allmulti mode.\n",
			 allmulti ? "en" : "dis");
1001

1002
	uc_count = netdev_uc_count(dev);
1003
	mc_count = netdev_mc_count(dev);
1004
	/* MAC filter - use one buffer for both lists */
1005 1006 1007
	buf = kzalloc(((uc_count + mc_count) * ETH_ALEN) +
		      (2 * sizeof(mac_data->entries)), GFP_ATOMIC);
	mac_data = buf;
1008
	if (!buf)
1009 1010
		return;

1011 1012
	sg_init_table(sg, 2);

1013
	/* Store the unicast list and count in the front of the buffer */
1014
	mac_data->entries = uc_count;
J
Jiri Pirko 已提交
1015
	i = 0;
1016
	netdev_for_each_uc_addr(ha, dev)
J
Jiri Pirko 已提交
1017
		memcpy(&mac_data->macs[i++][0], ha->addr, ETH_ALEN);
1018 1019

	sg_set_buf(&sg[0], mac_data,
1020
		   sizeof(mac_data->entries) + (uc_count * ETH_ALEN));
1021 1022

	/* multicast list and count fill the end */
1023
	mac_data = (void *)&mac_data->macs[uc_count][0];
1024

1025
	mac_data->entries = mc_count;
1026
	i = 0;
1027 1028
	netdev_for_each_mc_addr(ha, dev)
		memcpy(&mac_data->macs[i++][0], ha->addr, ETH_ALEN);
1029 1030

	sg_set_buf(&sg[1], mac_data,
1031
		   sizeof(mac_data->entries) + (mc_count * ETH_ALEN));
1032 1033 1034

	if (!virtnet_send_command(vi, VIRTIO_NET_CTRL_MAC,
				  VIRTIO_NET_CTRL_MAC_TABLE_SET,
1035
				  sg, NULL))
1036 1037 1038
		dev_warn(&dev->dev, "Failed to set MAC fitler table.\n");

	kfree(buf);
1039 1040
}

1041 1042
/*
 * .ndo_vlan_rx_add_vid hook: send a VIRTIO_NET_CTRL_VLAN_ADD control
 * command carrying @vid.
 *
 * A failed command is only logged; the function returns 0 either way.
 * @proto is not used.
 */
static int virtnet_vlan_rx_add_vid(struct net_device *dev,
				   __be16 proto, u16 vid)
{
	struct virtnet_info *vi = netdev_priv(dev);
	struct scatterlist vid_sg;
	bool sent;

	/* The command payload is just the VLAN id itself. */
	sg_init_one(&vid_sg, &vid, sizeof(vid));

	sent = virtnet_send_command(vi, VIRTIO_NET_CTRL_VLAN,
				    VIRTIO_NET_CTRL_VLAN_ADD, &vid_sg, NULL);
	if (!sent)
		dev_warn(&dev->dev, "Failed to add VLAN ID %d.\n", vid);

	return 0;
}

1055 1056
/*
 * .ndo_vlan_rx_kill_vid hook: send a VIRTIO_NET_CTRL_VLAN_DEL control
 * command carrying @vid.
 *
 * A failed command is only logged; the function returns 0 either way.
 * @proto is not used.
 */
static int virtnet_vlan_rx_kill_vid(struct net_device *dev,
				    __be16 proto, u16 vid)
{
	struct virtnet_info *vi = netdev_priv(dev);
	struct scatterlist vid_sg;
	bool sent;

	/* The command payload is just the VLAN id itself. */
	sg_init_one(&vid_sg, &vid, sizeof(vid));

	sent = virtnet_send_command(vi, VIRTIO_NET_CTRL_VLAN,
				    VIRTIO_NET_CTRL_VLAN_DEL, &vid_sg, NULL);
	if (!sent)
		dev_warn(&dev->dev, "Failed to kill VLAN ID %d.\n", vid);

	return 0;
}

1069
static void virtnet_clean_affinity(struct virtnet_info *vi, long hcpu)
J
Jason Wang 已提交
1070 1071
{
	int i;
1072
	int cpu;
J
Jason Wang 已提交
1073

1074 1075
	if (vi->affinity_hint_set) {
		for (i = 0; i < vi->max_queue_pairs; i++) {
1076 1077 1078 1079
			virtqueue_set_affinity(vi->rq[i].vq, -1);
			virtqueue_set_affinity(vi->sq[i].vq, -1);
		}

1080 1081 1082 1083 1084 1085 1086 1087
		vi->affinity_hint_set = false;
	}

	i = 0;
	for_each_online_cpu(cpu) {
		if (cpu == hcpu) {
			*per_cpu_ptr(vi->vq_index, cpu) = -1;
		} else {
1088 1089
			*per_cpu_ptr(vi->vq_index, cpu) =
				++i % vi->curr_queue_pairs;
1090 1091 1092
		}
	}
}
1093

1094 1095 1096 1097
static void virtnet_set_affinity(struct virtnet_info *vi)
{
	int i;
	int cpu;
J
Jason Wang 已提交
1098 1099 1100 1101 1102

	/* In multiqueue mode, when the number of cpu is equal to the number of
	 * queue pairs, we let the queue pairs to be private to one cpu by
	 * setting the affinity hint to eliminate the contention.
	 */
1103 1104 1105 1106
	if (vi->curr_queue_pairs == 1 ||
	    vi->max_queue_pairs != num_online_cpus()) {
		virtnet_clean_affinity(vi, -1);
		return;
J
Jason Wang 已提交
1107 1108
	}

1109 1110
	i = 0;
	for_each_online_cpu(cpu) {
J
Jason Wang 已提交
1111 1112
		virtqueue_set_affinity(vi->rq[i].vq, cpu);
		virtqueue_set_affinity(vi->sq[i].vq, cpu);
1113 1114
		*per_cpu_ptr(vi->vq_index, cpu) = i;
		i++;
J
Jason Wang 已提交
1115 1116
	}

1117
	vi->affinity_hint_set = true;
J
Jason Wang 已提交
1118 1119
}

1120 1121 1122 1123 1124 1125 1126 1127 1128 1129 1130 1131 1132 1133 1134 1135 1136 1137
/*
 * CPU hotplug notifier (installed by virtnet_probe()).
 *
 * The CPU_TASKS_FROZEN bit is masked off before the event is examined.
 * CPU_DOWN_PREPARE clears the affinity with @hcpu excluded; CPU_ONLINE,
 * CPU_DOWN_FAILED and CPU_DEAD recompute it.  Other events are ignored.
 * Always returns NOTIFY_OK.
 */
static int virtnet_cpu_callback(struct notifier_block *nfb,
			        unsigned long action, void *hcpu)
{
	struct virtnet_info *vi = container_of(nfb, struct virtnet_info, nb);
	unsigned long event = action & ~CPU_TASKS_FROZEN;

	if (event == CPU_DOWN_PREPARE)
		virtnet_clean_affinity(vi, (long)hcpu);
	else if (event == CPU_ONLINE || event == CPU_DOWN_FAILED ||
		 event == CPU_DEAD)
		virtnet_set_affinity(vi);

	return NOTIFY_OK;
}

R
Rick Jones 已提交
1140 1141 1142 1143 1144
/*
 * ethtool get_ringparam hook: report the vring size of the first rx and
 * tx queue as both the maximum and the current number of pending entries.
 */
static void virtnet_get_ringparam(struct net_device *dev,
				struct ethtool_ringparam *ring)
{
	struct virtnet_info *vi = netdev_priv(dev);

	ring->rx_max_pending = virtqueue_get_vring_size(vi->rq[0].vq);
	ring->rx_pending = ring->rx_max_pending;

	ring->tx_max_pending = virtqueue_get_vring_size(vi->sq[0].vq);
	ring->tx_pending = ring->tx_max_pending;
}

1151 1152 1153 1154 1155 1156 1157 1158 1159 1160 1161 1162 1163

/*
 * ethtool get_drvinfo hook: fill in the driver name, the driver version
 * and the virtio bus name of the underlying device.
 */
static void virtnet_get_drvinfo(struct net_device *dev,
				struct ethtool_drvinfo *info)
{
	struct virtnet_info *vi = netdev_priv(dev);

	strlcpy(info->driver, KBUILD_MODNAME, sizeof(info->driver));
	strlcpy(info->version, VIRTNET_DRIVER_VERSION, sizeof(info->version));
	strlcpy(info->bus_info, virtio_bus_name(vi->vdev),
		sizeof(info->bus_info));
}

1164 1165 1166 1167 1168 1169 1170 1171 1172 1173 1174 1175 1176 1177 1178 1179 1180
/* TODO: Eliminate OOO packets during switching */
/*
 * ethtool set_channels hook: change the number of active queue pairs.
 *
 * Only "combined" channels are supported.  The requested count must be in
 * the range 1..vi->max_queue_pairs.
 *
 * Returns 0 on success, -EINVAL for an unsupported request, or the error
 * returned by virtnet_set_queues().
 */
static int virtnet_set_channels(struct net_device *dev,
				struct ethtool_channels *channels)
{
	struct virtnet_info *vi = netdev_priv(dev);
	u16 queue_pairs;
	int err;

	/* We don't support separate rx/tx channels.
	 * We don't allow setting 'other' channels.
	 */
	if (channels->rx_count || channels->tx_count || channels->other_count)
		return -EINVAL;

	/* Validate the caller's value before narrowing it to u16, so that an
	 * oversized count cannot wrap around into the valid range.  Zero is
	 * rejected as well: a queue pair count of 0 would later be used as a
	 * divisor in virtnet_clean_affinity().
	 */
	if (channels->combined_count == 0 ||
	    channels->combined_count > vi->max_queue_pairs)
		return -EINVAL;

	queue_pairs = channels->combined_count;

	/* Keep the set of online cpus stable while affinity is recomputed. */
	get_online_cpus();
	err = virtnet_set_queues(vi, queue_pairs);
	if (!err) {
		netif_set_real_num_tx_queues(dev, queue_pairs);
		netif_set_real_num_rx_queues(dev, queue_pairs);

		virtnet_set_affinity(vi);
	}
	put_online_cpus();

	return err;
}

/*
 * ethtool get_channels hook: only combined channels are reported; the
 * separate rx, tx and "other" counts are always zero.
 */
static void virtnet_get_channels(struct net_device *dev,
				 struct ethtool_channels *channels)
{
	struct virtnet_info *vi = netdev_priv(dev);

	/* Limits */
	channels->max_combined = vi->max_queue_pairs;
	channels->max_other = 0;

	/* Current configuration */
	channels->combined_count = vi->curr_queue_pairs;
	channels->rx_count = 0;
	channels->tx_count = 0;
	channels->other_count = 0;
}

1207
static const struct ethtool_ops virtnet_ethtool_ops = {
1208
	.get_drvinfo = virtnet_get_drvinfo,
1209
	.get_link = ethtool_op_get_link,
R
Rick Jones 已提交
1210
	.get_ringparam = virtnet_get_ringparam,
1211 1212
	.set_channels = virtnet_set_channels,
	.get_channels = virtnet_get_channels,
1213 1214
};

M
Mark McLoughlin 已提交
1215 1216 1217 1218 1219 1220 1221 1222 1223 1224 1225
#define MIN_MTU 68
#define MAX_MTU 65535

static int virtnet_change_mtu(struct net_device *dev, int new_mtu)
{
	if (new_mtu < MIN_MTU || new_mtu > MAX_MTU)
		return -EINVAL;
	dev->mtu = new_mtu;
	return 0;
}

J
Jason Wang 已提交
1226 1227 1228 1229 1230
/* To avoid contending a lock hold by a vcpu who would exit to host, select the
 * txq based on the processor id.
 */
static u16 virtnet_select_queue(struct net_device *dev, struct sk_buff *skb)
{
1231 1232 1233 1234 1235 1236 1237 1238 1239 1240
	int txq;
	struct virtnet_info *vi = netdev_priv(dev);

	if (skb_rx_queue_recorded(skb)) {
		txq = skb_get_rx_queue(skb);
	} else {
		txq = *__this_cpu_ptr(vi->vq_index);
		if (txq == -1)
			txq = 0;
	}
J
Jason Wang 已提交
1241 1242 1243 1244 1245 1246 1247

	while (unlikely(txq >= dev->real_num_tx_queues))
		txq -= dev->real_num_tx_queues;

	return txq;
}

1248 1249 1250 1251 1252
static const struct net_device_ops virtnet_netdev = {
	.ndo_open            = virtnet_open,
	.ndo_stop   	     = virtnet_close,
	.ndo_start_xmit      = start_xmit,
	.ndo_validate_addr   = eth_validate_addr,
1253
	.ndo_set_mac_address = virtnet_set_mac_address,
1254
	.ndo_set_rx_mode     = virtnet_set_rx_mode,
1255
	.ndo_change_mtu	     = virtnet_change_mtu,
1256
	.ndo_get_stats64     = virtnet_stats,
1257 1258
	.ndo_vlan_rx_add_vid = virtnet_vlan_rx_add_vid,
	.ndo_vlan_rx_kill_vid = virtnet_vlan_rx_kill_vid,
J
Jason Wang 已提交
1259
	.ndo_select_queue     = virtnet_select_queue,
1260 1261 1262 1263 1264
#ifdef CONFIG_NET_POLL_CONTROLLER
	.ndo_poll_controller = virtnet_netpoll,
#endif
};

1265
static void virtnet_config_changed_work(struct work_struct *work)
1266
{
1267 1268
	struct virtnet_info *vi =
		container_of(work, struct virtnet_info, config_work);
1269 1270
	u16 v;

1271 1272 1273 1274
	mutex_lock(&vi->config_lock);
	if (!vi->config_enable)
		goto done;

1275 1276
	if (virtio_cread_feature(vi->vdev, VIRTIO_NET_F_STATUS,
				 struct virtio_net_config, status, &v) < 0)
1277 1278 1279
		goto done;

	if (v & VIRTIO_NET_S_ANNOUNCE) {
1280
		netdev_notify_peers(vi->dev);
1281 1282
		virtnet_ack_link_announce(vi);
	}
1283 1284 1285 1286 1287

	/* Ignore unknown (future) status bits */
	v &= VIRTIO_NET_S_LINK_UP;

	if (vi->status == v)
1288
		goto done;
1289 1290 1291 1292 1293

	vi->status = v;

	if (vi->status & VIRTIO_NET_S_LINK_UP) {
		netif_carrier_on(vi->dev);
J
Jason Wang 已提交
1294
		netif_tx_wake_all_queues(vi->dev);
1295 1296
	} else {
		netif_carrier_off(vi->dev);
J
Jason Wang 已提交
1297
		netif_tx_stop_all_queues(vi->dev);
1298
	}
1299 1300
done:
	mutex_unlock(&vi->config_lock);
1301 1302 1303 1304 1305 1306
}

static void virtnet_config_changed(struct virtio_device *vdev)
{
	struct virtnet_info *vi = vdev->priv;

1307
	schedule_work(&vi->config_work);
1308 1309
}

J
Jason Wang 已提交
1310 1311 1312 1313 1314 1315 1316 1317 1318 1319 1320 1321 1322 1323 1324 1325 1326 1327 1328 1329 1330 1331 1332 1333 1334 1335 1336 1337 1338 1339 1340 1341 1342 1343 1344 1345 1346 1347 1348 1349 1350
/*
 * Release the send/receive queue arrays allocated by
 * virtnet_alloc_queues().
 *
 * Each receive queue embeds a NAPI context that virtnet_alloc_queues()
 * registered on vi->dev with netif_napi_add().  Those contexts must be
 * removed from the net device before the memory holding them is freed,
 * otherwise the device keeps references into freed memory.
 *
 * NOTE(review): virtnet_freeze() may already have called
 * netif_napi_del() on these contexts; a repeated call is expected to be
 * harmless - confirm against netif_napi_del() in the target tree.
 */
static void virtnet_free_queues(struct virtnet_info *vi)
{
	int i;

	for (i = 0; i < vi->max_queue_pairs; i++)
		netif_napi_del(&vi->rq[i].napi);

	kfree(vi->rq);
	kfree(vi->sq);
}

/*
 * Free every page still held on the rq->pages list of each receive
 * queue, taking them off one at a time with get_a_page().
 */
static void free_receive_bufs(struct virtnet_info *vi)
{
	int q = 0;

	while (q < vi->max_queue_pairs) {
		while (vi->rq[q].pages)
			__free_pages(get_a_page(&vi->rq[q], GFP_KERNEL), 0);
		q++;
	}
}

/*
 * Detach and release every buffer that is still queued on the send and
 * receive virtqueues.
 *
 * Send buffers are skbs.  Receive buffers are handed to give_pages() in
 * mergeable or big-packet mode and are skbs otherwise.  Each receive
 * queue's buffer count must be zero once its queue has been drained.
 */
static void free_unused_bufs(struct virtnet_info *vi)
{
	struct virtqueue *vq;
	void *buf;
	int q;

	/* Transmit side first. */
	for (q = 0; q < vi->max_queue_pairs; q++) {
		vq = vi->sq[q].vq;
		for (buf = virtqueue_detach_unused_buf(vq); buf != NULL;
		     buf = virtqueue_detach_unused_buf(vq))
			dev_kfree_skb(buf);
	}

	/* Then the receive side, keeping rq->num in step. */
	for (q = 0; q < vi->max_queue_pairs; q++) {
		vq = vi->rq[q].vq;
		for (buf = virtqueue_detach_unused_buf(vq); buf != NULL;
		     buf = virtqueue_detach_unused_buf(vq)) {
			if (!vi->mergeable_rx_bufs && !vi->big_packets)
				dev_kfree_skb(buf);
			else
				give_pages(&vi->rq[q], buf);
			vi->rq[q].num--;
		}
		BUG_ON(vi->rq[q].num != 0);
	}
}

1351 1352 1353 1354
/*
 * Tear down the virtqueues: clear the affinity state, delete the vqs
 * through the transport's del_vqs() operation, then free the queue
 * arrays.
 */
static void virtnet_del_vqs(struct virtnet_info *vi)
{
	virtnet_clean_affinity(vi, -1);

	vi->vdev->config->del_vqs(vi->vdev);

	virtnet_free_queues(vi);
}

J
Jason Wang 已提交
1362
static int virtnet_find_vqs(struct virtnet_info *vi)
1363
{
J
Jason Wang 已提交
1364 1365 1366 1367 1368 1369 1370 1371 1372 1373 1374 1375 1376 1377 1378 1379 1380 1381 1382 1383 1384 1385 1386 1387 1388 1389 1390 1391 1392
	vq_callback_t **callbacks;
	struct virtqueue **vqs;
	int ret = -ENOMEM;
	int i, total_vqs;
	const char **names;

	/* We expect 1 RX virtqueue followed by 1 TX virtqueue, followed by
	 * possible N-1 RX/TX queue pairs used in multiqueue mode, followed by
	 * possible control vq.
	 */
	total_vqs = vi->max_queue_pairs * 2 +
		    virtio_has_feature(vi->vdev, VIRTIO_NET_F_CTRL_VQ);

	/* Allocate space for find_vqs parameters */
	vqs = kzalloc(total_vqs * sizeof(*vqs), GFP_KERNEL);
	if (!vqs)
		goto err_vq;
	callbacks = kmalloc(total_vqs * sizeof(*callbacks), GFP_KERNEL);
	if (!callbacks)
		goto err_callback;
	names = kmalloc(total_vqs * sizeof(*names), GFP_KERNEL);
	if (!names)
		goto err_names;

	/* Parameters for control virtqueue, if any */
	if (vi->has_cvq) {
		callbacks[total_vqs - 1] = NULL;
		names[total_vqs - 1] = "control";
	}
1393

J
Jason Wang 已提交
1394 1395 1396 1397 1398 1399 1400 1401 1402
	/* Allocate/initialize parameters for send/receive virtqueues */
	for (i = 0; i < vi->max_queue_pairs; i++) {
		callbacks[rxq2vq(i)] = skb_recv_done;
		callbacks[txq2vq(i)] = skb_xmit_done;
		sprintf(vi->rq[i].name, "input.%d", i);
		sprintf(vi->sq[i].name, "output.%d", i);
		names[rxq2vq(i)] = vi->rq[i].name;
		names[txq2vq(i)] = vi->sq[i].name;
	}
1403

J
Jason Wang 已提交
1404 1405 1406 1407
	ret = vi->vdev->config->find_vqs(vi->vdev, total_vqs, vqs, callbacks,
					 names);
	if (ret)
		goto err_find;
1408

J
Jason Wang 已提交
1409 1410
	if (vi->has_cvq) {
		vi->cvq = vqs[total_vqs - 1];
1411
		if (virtio_has_feature(vi->vdev, VIRTIO_NET_F_CTRL_VLAN))
1412
			vi->dev->features |= NETIF_F_HW_VLAN_CTAG_FILTER;
1413
	}
J
Jason Wang 已提交
1414 1415 1416 1417 1418 1419 1420 1421 1422 1423

	for (i = 0; i < vi->max_queue_pairs; i++) {
		vi->rq[i].vq = vqs[rxq2vq(i)];
		vi->sq[i].vq = vqs[txq2vq(i)];
	}

	kfree(names);
	kfree(callbacks);
	kfree(vqs);

1424
	return 0;
J
Jason Wang 已提交
1425 1426 1427 1428 1429 1430 1431 1432 1433 1434 1435 1436 1437 1438 1439 1440 1441 1442 1443

err_find:
	kfree(names);
err_names:
	kfree(callbacks);
err_callback:
	kfree(vqs);
err_vq:
	return ret;
}

/*
 * Allocate the zeroed send/receive queue arrays (max_queue_pairs entries
 * each) and initialise the per-queue state: the refill work, one NAPI
 * context per receive queue, and the scatterlists.
 *
 * Returns 0 on success or -ENOMEM, in which case nothing stays allocated.
 */
static int virtnet_alloc_queues(struct virtnet_info *vi)
{
	int q;

	vi->sq = kzalloc(sizeof(*vi->sq) * vi->max_queue_pairs, GFP_KERNEL);
	if (!vi->sq)
		return -ENOMEM;

	vi->rq = kzalloc(sizeof(*vi->rq) * vi->max_queue_pairs, GFP_KERNEL);
	if (!vi->rq) {
		kfree(vi->sq);
		return -ENOMEM;
	}

	INIT_DELAYED_WORK(&vi->refill, refill_work);

	for (q = 0; q < vi->max_queue_pairs; q++) {
		vi->rq[q].pages = NULL;
		netif_napi_add(vi->dev, &vi->rq[q].napi, virtnet_poll,
			       napi_weight);

		sg_init_table(vi->rq[q].sg, ARRAY_SIZE(vi->rq[q].sg));
		sg_init_table(vi->sq[q].sg, ARRAY_SIZE(vi->sq[q].sg));
	}

	return 0;
}

/*
 * Allocate the queue structures, obtain the virtqueues from the
 * transport and set up the queue/cpu affinity.
 *
 * Returns 0 on success or the error from the failing step; the queue
 * arrays are freed again when finding the virtqueues fails.
 */
static int init_vqs(struct virtnet_info *vi)
{
	int ret;

	/* Allocate send & receive queues */
	ret = virtnet_alloc_queues(vi);
	if (ret)
		return ret;

	ret = virtnet_find_vqs(vi);
	if (ret) {
		virtnet_free_queues(vi);
		return ret;
	}

	/* Hold the online cpu set steady while affinity is computed. */
	get_online_cpus();
	virtnet_set_affinity(vi);
	put_online_cpus();

	return 0;
}

R
Rusty Russell 已提交
1490 1491
static int virtnet_probe(struct virtio_device *vdev)
{
J
Jason Wang 已提交
1492
	int i, err;
R
Rusty Russell 已提交
1493 1494
	struct net_device *dev;
	struct virtnet_info *vi;
J
Jason Wang 已提交
1495 1496 1497
	u16 max_queue_pairs;

	/* Find if host supports multiqueue virtio_net device */
1498 1499 1500
	err = virtio_cread_feature(vdev, VIRTIO_NET_F_MQ,
				   struct virtio_net_config,
				   max_virtqueue_pairs, &max_queue_pairs);
J
Jason Wang 已提交
1501 1502 1503 1504 1505 1506

	/* We need at least 2 queue's */
	if (err || max_queue_pairs < VIRTIO_NET_CTRL_MQ_VQ_PAIRS_MIN ||
	    max_queue_pairs > VIRTIO_NET_CTRL_MQ_VQ_PAIRS_MAX ||
	    !virtio_has_feature(vdev, VIRTIO_NET_F_CTRL_VQ))
		max_queue_pairs = 1;
R
Rusty Russell 已提交
1507 1508

	/* Allocate ourselves a network device with room for our info */
J
Jason Wang 已提交
1509
	dev = alloc_etherdev_mq(sizeof(struct virtnet_info), max_queue_pairs);
R
Rusty Russell 已提交
1510 1511 1512 1513
	if (!dev)
		return -ENOMEM;

	/* Set up network device as normal. */
1514
	dev->priv_flags |= IFF_UNICAST_FLT | IFF_LIVE_ADDR_CHANGE;
1515
	dev->netdev_ops = &virtnet_netdev;
R
Rusty Russell 已提交
1516
	dev->features = NETIF_F_HIGHDMA;
1517

1518
	SET_ETHTOOL_OPS(dev, &virtnet_ethtool_ops);
R
Rusty Russell 已提交
1519 1520 1521
	SET_NETDEV_DEV(dev, &vdev->dev);

	/* Do we support "hardware" checksums? */
1522
	if (virtio_has_feature(vdev, VIRTIO_NET_F_CSUM)) {
R
Rusty Russell 已提交
1523
		/* This opens up the world of extra features. */
1524 1525 1526 1527 1528 1529
		dev->hw_features |= NETIF_F_HW_CSUM|NETIF_F_SG|NETIF_F_FRAGLIST;
		if (csum)
			dev->features |= NETIF_F_HW_CSUM|NETIF_F_SG|NETIF_F_FRAGLIST;

		if (virtio_has_feature(vdev, VIRTIO_NET_F_GSO)) {
			dev->hw_features |= NETIF_F_TSO | NETIF_F_UFO
R
Rusty Russell 已提交
1530 1531
				| NETIF_F_TSO_ECN | NETIF_F_TSO6;
		}
1532
		/* Individual feature bits: what can host handle? */
1533 1534 1535 1536 1537 1538 1539 1540 1541 1542 1543 1544
		if (virtio_has_feature(vdev, VIRTIO_NET_F_HOST_TSO4))
			dev->hw_features |= NETIF_F_TSO;
		if (virtio_has_feature(vdev, VIRTIO_NET_F_HOST_TSO6))
			dev->hw_features |= NETIF_F_TSO6;
		if (virtio_has_feature(vdev, VIRTIO_NET_F_HOST_ECN))
			dev->hw_features |= NETIF_F_TSO_ECN;
		if (virtio_has_feature(vdev, VIRTIO_NET_F_HOST_UFO))
			dev->hw_features |= NETIF_F_UFO;

		if (gso)
			dev->features |= dev->hw_features & (NETIF_F_ALL_TSO|NETIF_F_UFO);
		/* (!csum && gso) case will be fixed by register_netdev() */
R
Rusty Russell 已提交
1545
	}
1546 1547
	if (virtio_has_feature(vdev, VIRTIO_NET_F_GUEST_CSUM))
		dev->features |= NETIF_F_RXCSUM;
R
Rusty Russell 已提交
1548

1549 1550
	dev->vlan_features = dev->features;

R
Rusty Russell 已提交
1551
	/* Configuration may specify what MAC to use.  Otherwise random. */
1552 1553 1554 1555 1556
	if (virtio_has_feature(vdev, VIRTIO_NET_F_MAC))
		virtio_cread_bytes(vdev,
				   offsetof(struct virtio_net_config, mac),
				   dev->dev_addr, dev->addr_len);
	else
1557
		eth_hw_addr_random(dev);
R
Rusty Russell 已提交
1558 1559 1560 1561 1562

	/* Set up our device-specific information */
	vi = netdev_priv(dev);
	vi->dev = dev;
	vi->vdev = vdev;
1563
	vdev->priv = vi;
1564 1565 1566 1567 1568
	vi->stats = alloc_percpu(struct virtnet_stats);
	err = -ENOMEM;
	if (vi->stats == NULL)
		goto free;

1569 1570 1571 1572
	vi->vq_index = alloc_percpu(int);
	if (vi->vq_index == NULL)
		goto free_stats;

1573 1574 1575
	mutex_init(&vi->config_lock);
	vi->config_enable = true;
	INIT_WORK(&vi->config_work, virtnet_config_changed_work);
R
Rusty Russell 已提交
1576

1577
	/* If we can receive ANY GSO packets, we must allocate large ones. */
1578 1579 1580
	if (virtio_has_feature(vdev, VIRTIO_NET_F_GUEST_TSO4) ||
	    virtio_has_feature(vdev, VIRTIO_NET_F_GUEST_TSO6) ||
	    virtio_has_feature(vdev, VIRTIO_NET_F_GUEST_ECN))
1581 1582
		vi->big_packets = true;

1583 1584 1585
	if (virtio_has_feature(vdev, VIRTIO_NET_F_MRG_RXBUF))
		vi->mergeable_rx_bufs = true;

1586 1587 1588
	if (virtio_has_feature(vdev, VIRTIO_F_ANY_LAYOUT))
		vi->any_header_sg = true;

J
Jason Wang 已提交
1589 1590 1591 1592 1593 1594 1595 1596
	if (virtio_has_feature(vdev, VIRTIO_NET_F_CTRL_VQ))
		vi->has_cvq = true;

	/* Use single tx/rx queue pair as default */
	vi->curr_queue_pairs = 1;
	vi->max_queue_pairs = max_queue_pairs;

	/* Allocate/initialize the rx/tx queues, and invoke find_vqs */
1597
	err = init_vqs(vi);
1598
	if (err)
1599
		goto free_index;
R
Rusty Russell 已提交
1600

J
Jason Wang 已提交
1601 1602 1603
	netif_set_real_num_tx_queues(dev, 1);
	netif_set_real_num_rx_queues(dev, 1);

R
Rusty Russell 已提交
1604 1605 1606
	err = register_netdev(dev);
	if (err) {
		pr_debug("virtio_net: registering device failed\n");
1607
		goto free_vqs;
R
Rusty Russell 已提交
1608
	}
1609 1610

	/* Last of all, set up some receive buffers. */
1611
	for (i = 0; i < vi->curr_queue_pairs; i++) {
J
Jason Wang 已提交
1612 1613 1614 1615 1616 1617 1618 1619
		try_fill_recv(&vi->rq[i], GFP_KERNEL);

		/* If we didn't even get one input buffer, we're useless. */
		if (vi->rq[i].num == 0) {
			free_unused_bufs(vi);
			err = -ENOMEM;
			goto free_recv_bufs;
		}
1620 1621
	}

1622 1623 1624 1625 1626 1627 1628
	vi->nb.notifier_call = &virtnet_cpu_callback;
	err = register_hotcpu_notifier(&vi->nb);
	if (err) {
		pr_debug("virtio_net: registering cpu notifier failed\n");
		goto free_recv_bufs;
	}

J
Jason Wang 已提交
1629 1630 1631 1632
	/* Assume link up if device can't report link status,
	   otherwise get link status from config. */
	if (virtio_has_feature(vi->vdev, VIRTIO_NET_F_STATUS)) {
		netif_carrier_off(dev);
1633
		schedule_work(&vi->config_work);
J
Jason Wang 已提交
1634 1635 1636 1637
	} else {
		vi->status = VIRTIO_NET_S_LINK_UP;
		netif_carrier_on(dev);
	}
1638

J
Jason Wang 已提交
1639 1640 1641
	pr_debug("virtnet: registered device %s with %d RX and TX vq's\n",
		 dev->name, max_queue_pairs);

R
Rusty Russell 已提交
1642 1643
	return 0;

J
Jason Wang 已提交
1644 1645
free_recv_bufs:
	free_receive_bufs(vi);
1646
	unregister_netdev(dev);
1647
free_vqs:
J
Jason Wang 已提交
1648
	cancel_delayed_work_sync(&vi->refill);
1649
	virtnet_del_vqs(vi);
1650 1651
free_index:
	free_percpu(vi->vq_index);
1652 1653
free_stats:
	free_percpu(vi->stats);
R
Rusty Russell 已提交
1654 1655 1656 1657 1658
free:
	free_netdev(dev);
	return err;
}

1659
static void remove_vq_common(struct virtnet_info *vi)
R
Rusty Russell 已提交
1660
{
1661
	vi->vdev->config->reset(vi->vdev);
S
Shirley Ma 已提交
1662 1663

	/* Free unused buffers in both send and recv, if any. */
1664
	free_unused_bufs(vi);
1665

J
Jason Wang 已提交
1666
	free_receive_bufs(vi);
1667

J
Jason Wang 已提交
1668
	virtnet_del_vqs(vi);
1669 1670
}

1671
static void virtnet_remove(struct virtio_device *vdev)
1672 1673 1674
{
	struct virtnet_info *vi = vdev->priv;

1675 1676
	unregister_hotcpu_notifier(&vi->nb);

1677 1678 1679 1680 1681
	/* Prevent config work handler from accessing the device. */
	mutex_lock(&vi->config_lock);
	vi->config_enable = false;
	mutex_unlock(&vi->config_lock);

1682 1683 1684
	unregister_netdev(vi->dev);

	remove_vq_common(vi);
1685

1686 1687
	flush_work(&vi->config_work);

1688
	free_percpu(vi->vq_index);
1689
	free_percpu(vi->stats);
1690
	free_netdev(vi->dev);
R
Rusty Russell 已提交
1691 1692
}

1693
#ifdef CONFIG_PM_SLEEP
1694 1695 1696
/*
 * virtio freeze callback: quiesce the interface and tear down the
 * virtqueues.  Always returns 0.
 */
static int virtnet_freeze(struct virtio_device *vdev)
{
	struct virtnet_info *vi = vdev->priv;
	struct net_device *netdev = vi->dev;
	int q;

	/* Prevent config work handler from accessing the device */
	mutex_lock(&vi->config_lock);
	vi->config_enable = false;
	mutex_unlock(&vi->config_lock);

	netif_device_detach(netdev);
	cancel_delayed_work_sync(&vi->refill);

	/* NAPI is only disabled and removed when the interface is running. */
	if (netif_running(netdev)) {
		for (q = 0; q < vi->max_queue_pairs; q++) {
			napi_disable(&vi->rq[q].napi);
			netif_napi_del(&vi->rq[q].napi);
		}
	}

	remove_vq_common(vi);

	flush_work(&vi->config_work);

	return 0;
}

static int virtnet_restore(struct virtio_device *vdev)
{
	struct virtnet_info *vi = vdev->priv;
J
Jason Wang 已提交
1723
	int err, i;
1724 1725 1726 1727 1728 1729

	err = init_vqs(vi);
	if (err)
		return err;

	if (netif_running(vi->dev))
J
Jason Wang 已提交
1730 1731
		for (i = 0; i < vi->max_queue_pairs; i++)
			virtnet_napi_enable(&vi->rq[i]);
1732 1733 1734

	netif_device_attach(vi->dev);

1735
	for (i = 0; i < vi->curr_queue_pairs; i++)
J
Jason Wang 已提交
1736 1737
		if (!try_fill_recv(&vi->rq[i], GFP_KERNEL))
			schedule_delayed_work(&vi->refill, 0);
1738

1739 1740 1741 1742
	mutex_lock(&vi->config_lock);
	vi->config_enable = true;
	mutex_unlock(&vi->config_lock);

J
Jason Wang 已提交
1743 1744
	virtnet_set_queues(vi, vi->curr_queue_pairs);

1745 1746 1747 1748
	return 0;
}
#endif

R
Rusty Russell 已提交
1749 1750 1751 1752 1753
/* Devices handled by this driver: VIRTIO_ID_NET with any second id. */
static struct virtio_device_id id_table[] = {
	{
		VIRTIO_ID_NET,
		VIRTIO_DEV_ANY_ID
	},
	{ 0 },	/* terminating entry */
};

1754
static unsigned int features[] = {
1755 1756
	VIRTIO_NET_F_CSUM, VIRTIO_NET_F_GUEST_CSUM,
	VIRTIO_NET_F_GSO, VIRTIO_NET_F_MAC,
1757
	VIRTIO_NET_F_HOST_TSO4, VIRTIO_NET_F_HOST_UFO, VIRTIO_NET_F_HOST_TSO6,
1758
	VIRTIO_NET_F_HOST_ECN, VIRTIO_NET_F_GUEST_TSO4, VIRTIO_NET_F_GUEST_TSO6,
1759
	VIRTIO_NET_F_GUEST_ECN, VIRTIO_NET_F_GUEST_UFO,
1760
	VIRTIO_NET_F_MRG_RXBUF, VIRTIO_NET_F_STATUS, VIRTIO_NET_F_CTRL_VQ,
1761
	VIRTIO_NET_F_CTRL_RX, VIRTIO_NET_F_CTRL_VLAN,
J
Jason Wang 已提交
1762
	VIRTIO_NET_F_GUEST_ANNOUNCE, VIRTIO_NET_F_MQ,
1763
	VIRTIO_NET_F_CTRL_MAC_ADDR,
1764
	VIRTIO_F_ANY_LAYOUT,
1765 1766
};

1767
static struct virtio_driver virtio_net_driver = {
1768 1769
	.feature_table = features,
	.feature_table_size = ARRAY_SIZE(features),
R
Rusty Russell 已提交
1770 1771 1772 1773
	.driver.name =	KBUILD_MODNAME,
	.driver.owner =	THIS_MODULE,
	.id_table =	id_table,
	.probe =	virtnet_probe,
1774
	.remove =	virtnet_remove,
1775
	.config_changed = virtnet_config_changed,
1776
#ifdef CONFIG_PM_SLEEP
1777 1778 1779
	.freeze =	virtnet_freeze,
	.restore =	virtnet_restore,
#endif
R
Rusty Russell 已提交
1780 1781
};

1782
/* Hook virtio_net_driver up as this module's virtio driver. */
module_virtio_driver(virtio_net_driver);

/* Module metadata */
MODULE_LICENSE("GPL");
MODULE_DESCRIPTION("Virtio network driver");
MODULE_DEVICE_TABLE(virtio, id_table);