/* A network driver using virtio.
 *
 * Copyright 2007 Rusty Russell <rusty@rustcorp.com.au> IBM Corporation
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation; either version 2 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program; if not, write to the Free Software
 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
 */
//#define DEBUG
#include <linux/netdevice.h>
#include <linux/etherdevice.h>
22
#include <linux/ethtool.h>
R
Rusty Russell 已提交
23 24 25 26
#include <linux/module.h>
#include <linux/virtio.h>
#include <linux/virtio_net.h>
#include <linux/scatterlist.h>
27
#include <linux/if_vlan.h>
28
#include <linux/slab.h>
29
#include <linux/cpu.h>
R
Rusty Russell 已提交
30

31
static int napi_weight = NAPI_POLL_WEIGHT;
32 33
module_param(napi_weight, int, 0444);

34
static bool csum = true, gso = true;
R
Rusty Russell 已提交
35 36 37
module_param(csum, bool, 0444);
module_param(gso, bool, 0444);

R
Rusty Russell 已提交
38
/* FIXME: MTU in config. */
39
#define MAX_PACKET_LEN (ETH_HLEN + VLAN_HLEN + ETH_DATA_LEN)
40
#define GOOD_COPY_LEN	128
R
Rusty Russell 已提交
41

42
#define VIRTNET_DRIVER_VERSION "1.0.0"
43

44
struct virtnet_stats {
45 46
	struct u64_stats_sync tx_syncp;
	struct u64_stats_sync rx_syncp;
47 48 49 50 51 52 53
	u64 tx_bytes;
	u64 tx_packets;

	u64 rx_bytes;
	u64 rx_packets;
};

54 55 56 57 58 59 60
/* Driver-side state of one transmit virtqueue */
struct send_queue {
	/* The virtqueue this send_queue wraps */
	struct virtqueue *vq;

	/* TX scatterlist: virtio header + linear part + page fragments */
	struct scatterlist sg[MAX_SKB_FRAGS + 2];

	/* Queue name, of the form output.$index */
	char name[40];
};

/* Internal representation of a receive virtqueue */
struct receive_queue {
	/* Virtqueue associated with this receive_queue */
	struct virtqueue *vq;

R
Rusty Russell 已提交
71 72 73 74 75
	struct napi_struct napi;

	/* Number of input buffers, and max we've ever had. */
	unsigned int num, max;

76 77 78 79 80
	/* Chain pages by the private ptr. */
	struct page *pages;

	/* RX: fragments + linear part + virtio header */
	struct scatterlist sg[MAX_SKB_FRAGS + 2];
J
Jason Wang 已提交
81 82 83

	/* Name of this receive queue: input.$index */
	char name[40];
84 85 86 87 88 89
};

struct virtnet_info {
	struct virtio_device *vdev;
	struct virtqueue *cvq;
	struct net_device *dev;
J
Jason Wang 已提交
90 91
	struct send_queue *sq;
	struct receive_queue *rq;
92 93
	unsigned int status;

J
Jason Wang 已提交
94 95 96 97 98 99
	/* Max # of queue pairs supported by the device */
	u16 max_queue_pairs;

	/* # of queue pairs currently used by the driver */
	u16 curr_queue_pairs;

100 101 102
	/* I like... big packets and I cannot lie! */
	bool big_packets;

103 104 105
	/* Host will merge rx buffers for big packets (shake it! shake it!) */
	bool mergeable_rx_bufs;

J
Jason Wang 已提交
106 107 108
	/* Has control virtqueue */
	bool has_cvq;

109 110 111
	/* Host can handle any s/g split between our header and packet data */
	bool any_header_sg;

112 113 114
	/* enable config space updates */
	bool config_enable;

115 116 117
	/* Active statistics */
	struct virtnet_stats __percpu *stats;

118 119 120
	/* Work struct for refilling if we run low on memory. */
	struct delayed_work refill;

121 122 123 124 125
	/* Work struct for config space updates */
	struct work_struct config_work;

	/* Lock for config space updates */
	struct mutex config_lock;
J
Jason Wang 已提交
126 127 128

	/* Does the affinity hint is set for virtqueues? */
	bool affinity_hint_set;
129 130 131

	/* Per-cpu variable to show the mapping from CPU to virtqueue */
	int __percpu *vq_index;
132 133 134

	/* CPU hot plug notifier */
	struct notifier_block nb;
R
Rusty Russell 已提交
135 136
};

137 138 139 140 141 142 143
/*
 * virtio-net header as stored in skb->cb: either the plain header or the
 * mergeable-rx-buffer variant, overlaid in one anonymous union.
 */
struct skb_vnet_hdr {
	union {
		/* Plain header */
		struct virtio_net_hdr hdr;
		/* Header variant carrying num_buffers */
		struct virtio_net_hdr_mrg_rxbuf mhdr;
	};
};

144 145 146 147 148 149 150 151 152 153
/* Layout of the header area at the start of the first big-packet page. */
struct padded_vnet_hdr {
	struct virtio_net_hdr hdr;
	/*
	 * Because of a QEMU bug the virtio_net_hdr has to sit in its own sg
	 * entry, while the data sg entry shares the same page.  These pad
	 * bytes make the sg entry following the header 16-byte aligned.
	 */
	char padding[6];
};

J
Jason Wang 已提交
154 155 156 157 158
/* Converting between virtqueue no. and kernel tx/rx queue no.
 * 0:rx0 1:tx0 2:rx1 3:tx1 ... 2N:rxN 2N+1:txN 2N+2:cvq
 */
static int vq2txq(struct virtqueue *vq)
{
159
	return (vq->index - 1) / 2;
J
Jason Wang 已提交
160 161 162 163 164 165 166 167 168
}

/* Map kernel tx queue number @txq to its (odd) virtqueue index. */
static int txq2vq(int txq)
{
	int vq_index = 2 * txq + 1;

	return vq_index;
}

static int vq2rxq(struct virtqueue *vq)
{
169
	return vq->index / 2;
J
Jason Wang 已提交
170 171 172 173 174 175 176
}

/* Map kernel rx queue number @rxq to its (even) virtqueue index. */
static int rxq2vq(int rxq)
{
	int vq_index = 2 * rxq;

	return vq_index;
}

177
static inline struct skb_vnet_hdr *skb_vnet_hdr(struct sk_buff *skb)
R
Rusty Russell 已提交
178
{
179
	return (struct skb_vnet_hdr *)skb->cb;
R
Rusty Russell 已提交
180 181
}

182 183 184 185
/*
 * private is used to chain pages for big packets, put the whole
 * most recent used list in the beginning for reuse
 */
186
static void give_pages(struct receive_queue *rq, struct page *page)
187
{
188
	struct page *end;
189

190
	/* Find end of list, sew whole thing into vi->rq.pages. */
191
	for (end = page; end->private; end = (struct page *)end->private);
192 193
	end->private = (unsigned long)rq->pages;
	rq->pages = page;
194 195
}

196
/*
 * Take one page from the queue's pool, or allocate a fresh one with
 * @gfp_mask if the pool is empty.  May return NULL when allocation fails.
 */
static struct page *get_a_page(struct receive_queue *rq, gfp_t gfp_mask)
{
	struct page *p = rq->pages;

	if (!p)
		return alloc_page(gfp_mask);

	/* Unlink the head; ->private is the chain link, so reset it. */
	rq->pages = (struct page *)p->private;
	p->private = 0;
	return p;
}

209
static void skb_xmit_done(struct virtqueue *vq)
R
Rusty Russell 已提交
210
{
211
	struct virtnet_info *vi = vq->vdev->priv;
R
Rusty Russell 已提交
212

213
	/* Suppress further interrupts. */
214
	virtqueue_disable_cb(vq);
215

216
	/* We were probably waiting for more output buffers. */
J
Jason Wang 已提交
217
	netif_wake_subqueue(vi->dev, vq2txq(vq));
R
Rusty Russell 已提交
218 219
}

220 221
static void set_skb_frag(struct sk_buff *skb, struct page *page,
			 unsigned int offset, unsigned int *len)
R
Rusty Russell 已提交
222
{
223
	int size = min((unsigned)PAGE_SIZE - offset, *len);
224 225
	int i = skb_shinfo(skb)->nr_frags;

226
	__skb_fill_page_desc(skb, i, page, offset, size);
227

228 229
	skb->data_len += size;
	skb->len += size;
230
	skb->truesize += PAGE_SIZE;
231
	skb_shinfo(skb)->nr_frags++;
232
	skb_shinfo(skb)->tx_flags |= SKBTX_SHARED_FRAG;
233
	*len -= size;
234
}
235

236
/* Called from bottom half context */
237
static struct sk_buff *page_to_skb(struct receive_queue *rq,
238 239
				   struct page *page, unsigned int len)
{
240
	struct virtnet_info *vi = rq->vq->vdev->priv;
241 242 243 244
	struct sk_buff *skb;
	struct skb_vnet_hdr *hdr;
	unsigned int copy, hdr_len, offset;
	char *p;
245

246
	p = page_address(page);
247

248 249 250 251
	/* copy small packet so we can reuse these pages for small data */
	skb = netdev_alloc_skb_ip_align(vi->dev, GOOD_COPY_LEN);
	if (unlikely(!skb))
		return NULL;
252

253
	hdr = skb_vnet_hdr(skb);
254

255 256 257 258 259 260 261
	if (vi->mergeable_rx_bufs) {
		hdr_len = sizeof hdr->mhdr;
		offset = hdr_len;
	} else {
		hdr_len = sizeof hdr->hdr;
		offset = sizeof(struct padded_vnet_hdr);
	}
262

263
	memcpy(hdr, p, hdr_len);
264

265 266
	len -= hdr_len;
	p += offset;
267

268 269 270 271
	copy = len;
	if (copy > skb_tailroom(skb))
		copy = skb_tailroom(skb);
	memcpy(skb_put(skb, copy), p, copy);
272

273 274
	len -= copy;
	offset += copy;
275

276 277 278 279 280 281 282
	/*
	 * Verify that we can indeed put this data into a skb.
	 * This is here to handle cases when the device erroneously
	 * tries to receive more than is possible. This is usually
	 * the case of a broken device.
	 */
	if (unlikely(len > MAX_SKB_FRAGS * PAGE_SIZE)) {
283
		net_dbg_ratelimited("%s: too much data\n", skb->dev->name);
284 285 286 287
		dev_kfree_skb(skb);
		return NULL;
	}

288 289 290 291 292
	while (len) {
		set_skb_frag(skb, page, offset, &len);
		page = (struct page *)page->private;
		offset = 0;
	}
293

294
	if (page)
295
		give_pages(rq, page);
296

297 298
	return skb;
}
299

300
static int receive_mergeable(struct receive_queue *rq, struct sk_buff *skb)
301 302 303 304 305 306 307 308 309 310 311 312 313
{
	struct skb_vnet_hdr *hdr = skb_vnet_hdr(skb);
	struct page *page;
	int num_buf, i, len;

	num_buf = hdr->mhdr.num_buffers;
	while (--num_buf) {
		i = skb_shinfo(skb)->nr_frags;
		if (i >= MAX_SKB_FRAGS) {
			pr_debug("%s: packet too long\n", skb->dev->name);
			skb->dev->stats.rx_length_errors++;
			return -EINVAL;
		}
314
		page = virtqueue_get_buf(rq->vq, &len);
315 316 317 318 319
		if (!page) {
			pr_debug("%s: rx error: %d buffers missing\n",
				 skb->dev->name, hdr->mhdr.num_buffers);
			skb->dev->stats.rx_length_errors++;
			return -EINVAL;
320
		}
321

322 323 324 325 326
		if (len > PAGE_SIZE)
			len = PAGE_SIZE;

		set_skb_frag(skb, page, 0, &len);

327
		--rq->num;
328 329 330 331
	}
	return 0;
}

332
static void receive_buf(struct receive_queue *rq, void *buf, unsigned int len)
333
{
334 335
	struct virtnet_info *vi = rq->vq->vdev->priv;
	struct net_device *dev = vi->dev;
E
Eric Dumazet 已提交
336
	struct virtnet_stats *stats = this_cpu_ptr(vi->stats);
337 338 339
	struct sk_buff *skb;
	struct page *page;
	struct skb_vnet_hdr *hdr;
340

341 342 343 344
	if (unlikely(len < sizeof(struct virtio_net_hdr) + ETH_HLEN)) {
		pr_debug("%s: short packet %i\n", dev->name, len);
		dev->stats.rx_length_errors++;
		if (vi->mergeable_rx_bufs || vi->big_packets)
345
			give_pages(rq, buf);
346 347 348 349
		else
			dev_kfree_skb(buf);
		return;
	}
350

351 352 353 354 355 356
	if (!vi->mergeable_rx_bufs && !vi->big_packets) {
		skb = buf;
		len -= sizeof(struct virtio_net_hdr);
		skb_trim(skb, len);
	} else {
		page = buf;
357
		skb = page_to_skb(rq, page, len);
358
		if (unlikely(!skb)) {
359
			dev->stats.rx_dropped++;
360
			give_pages(rq, page);
361
			return;
362
		}
363
		if (vi->mergeable_rx_bufs)
364
			if (receive_mergeable(rq, skb)) {
365 366 367
				dev_kfree_skb(skb);
				return;
			}
368
	}
369

370
	hdr = skb_vnet_hdr(skb);
371

372
	u64_stats_update_begin(&stats->rx_syncp);
373 374
	stats->rx_bytes += skb->len;
	stats->rx_packets++;
375
	u64_stats_update_end(&stats->rx_syncp);
R
Rusty Russell 已提交
376

377
	if (hdr->hdr.flags & VIRTIO_NET_HDR_F_NEEDS_CSUM) {
R
Rusty Russell 已提交
378
		pr_debug("Needs csum!\n");
379 380 381
		if (!skb_partial_csum_set(skb,
					  hdr->hdr.csum_start,
					  hdr->hdr.csum_offset))
R
Rusty Russell 已提交
382
			goto frame_err;
383 384
	} else if (hdr->hdr.flags & VIRTIO_NET_HDR_F_DATA_VALID) {
		skb->ip_summed = CHECKSUM_UNNECESSARY;
R
Rusty Russell 已提交
385 386
	}

387 388 389 390
	skb->protocol = eth_type_trans(skb, dev);
	pr_debug("Receiving skb proto 0x%04x len %i type %i\n",
		 ntohs(skb->protocol), skb->len, skb->pkt_type);

391
	if (hdr->hdr.gso_type != VIRTIO_NET_HDR_GSO_NONE) {
R
Rusty Russell 已提交
392
		pr_debug("GSO!\n");
393
		switch (hdr->hdr.gso_type & ~VIRTIO_NET_HDR_GSO_ECN) {
R
Rusty Russell 已提交
394
		case VIRTIO_NET_HDR_GSO_TCPV4:
395
			skb_shinfo(skb)->gso_type = SKB_GSO_TCPV4;
R
Rusty Russell 已提交
396 397
			break;
		case VIRTIO_NET_HDR_GSO_UDP:
398
			skb_shinfo(skb)->gso_type = SKB_GSO_UDP;
R
Rusty Russell 已提交
399 400
			break;
		case VIRTIO_NET_HDR_GSO_TCPV6:
401
			skb_shinfo(skb)->gso_type = SKB_GSO_TCPV6;
R
Rusty Russell 已提交
402 403
			break;
		default:
404 405
			net_warn_ratelimited("%s: bad gso type %u.\n",
					     dev->name, hdr->hdr.gso_type);
R
Rusty Russell 已提交
406 407 408
			goto frame_err;
		}

409
		if (hdr->hdr.gso_type & VIRTIO_NET_HDR_GSO_ECN)
410
			skb_shinfo(skb)->gso_type |= SKB_GSO_TCP_ECN;
R
Rusty Russell 已提交
411

412
		skb_shinfo(skb)->gso_size = hdr->hdr.gso_size;
R
Rusty Russell 已提交
413
		if (skb_shinfo(skb)->gso_size == 0) {
414
			net_warn_ratelimited("%s: zero gso size.\n", dev->name);
R
Rusty Russell 已提交
415 416 417 418 419 420 421 422 423 424 425 426 427 428 429 430
			goto frame_err;
		}

		/* Header must be checked, and gso_segs computed. */
		skb_shinfo(skb)->gso_type |= SKB_GSO_DODGY;
		skb_shinfo(skb)->gso_segs = 0;
	}

	netif_receive_skb(skb);
	return;

frame_err:
	dev->stats.rx_frame_errors++;
	dev_kfree_skb(skb);
}

431
/*
 * Post one MAX_PACKET_LEN skb as a receive buffer.
 *
 * Returns -ENOMEM if no skb could be allocated, otherwise the result of
 * virtqueue_add_inbuf(); the skb is freed again if that fails.
 */
static int add_recvbuf_small(struct receive_queue *rq, gfp_t gfp)
{
	struct virtnet_info *vi = rq->vq->vdev->priv;
	struct skb_vnet_hdr *hdr;
	struct sk_buff *skb;
	int err;

	skb = __netdev_alloc_skb_ip_align(vi->dev, MAX_PACKET_LEN, gfp);
	if (unlikely(!skb))
		return -ENOMEM;

	skb_put(skb, MAX_PACKET_LEN);

	/* sg[0]: header kept in skb->cb; sg[1]: the skb's data area */
	hdr = skb_vnet_hdr(skb);
	sg_set_buf(&rq->sg[0], &hdr->hdr, sizeof hdr->hdr);
	skb_to_sgvec(skb, &rq->sg[1], 0, skb->len);

	err = virtqueue_add_inbuf(rq->vq, rq->sg, 2, skb, gfp);
	if (err < 0)
		dev_kfree_skb(skb);

	return err;
}
455

456
/*
 * Post one big-packet receive buffer: a chain of MAX_SKB_FRAGS + 1 pages
 * described by MAX_SKB_FRAGS + 2 sg entries.
 *
 * Returns -ENOMEM if a page could not be obtained, otherwise the result of
 * virtqueue_add_inbuf().  On any failure the pages gathered so far go back
 * to the queue's pool.
 */
static int add_recvbuf_big(struct receive_queue *rq, gfp_t gfp)
{
	struct page *pg, *chain = NULL;
	char *base;
	int i, err, offset;

	/*
	 * Fill sg[MAX_SKB_FRAGS + 1] down to sg[2], one whole page each.
	 * Each new page is pushed on the chain head, so the page behind the
	 * last sg entry ends up as the chain tail.
	 */
	for (i = MAX_SKB_FRAGS + 1; i > 1; --i) {
		pg = get_a_page(rq, gfp);
		if (!pg) {
			if (chain)
				give_pages(rq, chain);
			return -ENOMEM;
		}
		sg_set_buf(&rq->sg[i], page_address(pg), PAGE_SIZE);

		pg->private = (unsigned long)chain;
		chain = pg;
	}

	/* The first page carries both the header and the first data. */
	pg = get_a_page(rq, gfp);
	if (!pg) {
		give_pages(rq, chain);
		return -ENOMEM;
	}
	base = page_address(pg);

	/*
	 * sg[0] and sg[1] share this page: sg[0] covers only the
	 * virtio_net_hdr (kept separate because of a QEMU bug) ...
	 */
	sg_set_buf(&rq->sg[0], base, sizeof(struct virtio_net_hdr));

	/* ... and sg[1] covers the data following the padded header. */
	offset = sizeof(struct padded_vnet_hdr);
	sg_set_buf(&rq->sg[1], base + offset, PAGE_SIZE - offset);

	/* The first page becomes the head of the chain. */
	pg->private = (unsigned long)chain;

	err = virtqueue_add_inbuf(rq->vq, rq->sg, MAX_SKB_FRAGS + 2,
				  pg, gfp);
	if (err < 0)
		give_pages(rq, pg);

	return err;
}

502
/*
 * Post a single whole page as a mergeable receive buffer.
 *
 * Returns -ENOMEM if no page is available, otherwise the result of
 * virtqueue_add_inbuf(); the page returns to the pool if that fails.
 */
static int add_recvbuf_mergeable(struct receive_queue *rq, gfp_t gfp)
{
	struct page *pg = get_a_page(rq, gfp);
	int err;

	if (!pg)
		return -ENOMEM;

	sg_init_one(rq->sg, page_address(pg), PAGE_SIZE);

	err = virtqueue_add_inbuf(rq->vq, rq->sg, 1, pg, gfp);
	if (err < 0)
		give_pages(rq, pg);

	return err;
}
519

520 521 522 523 524 525 526
/*
 * Returns false if we couldn't fill entirely (OOM).
 *
 * Normally run in the receive path, but can also be run from ndo_open
 * before we're receiving packets, or from refill_work which is
 * careful to disable receiving (using napi_disable).
 */
527
static bool try_fill_recv(struct receive_queue *rq, gfp_t gfp)
528
{
529
	struct virtnet_info *vi = rq->vq->vdev->priv;
530
	int err;
531
	bool oom;
532

533 534
	do {
		if (vi->mergeable_rx_bufs)
535
			err = add_recvbuf_mergeable(rq, gfp);
536
		else if (vi->big_packets)
537
			err = add_recvbuf_big(rq, gfp);
538
		else
539
			err = add_recvbuf_small(rq, gfp);
540

541
		oom = err == -ENOMEM;
542
		if (err)
543
			break;
544
		++rq->num;
545
	} while (rq->vq->num_free);
546 547 548
	if (unlikely(rq->num > rq->max))
		rq->max = rq->num;
	virtqueue_kick(rq->vq);
549
	return !oom;
550 551
}

552
static void skb_recv_done(struct virtqueue *rvq)
R
Rusty Russell 已提交
553 554
{
	struct virtnet_info *vi = rvq->vdev->priv;
J
Jason Wang 已提交
555
	struct receive_queue *rq = &vi->rq[vq2rxq(rvq)];
556

557
	/* Schedule NAPI, Suppress further interrupts if successful. */
558
	if (napi_schedule_prep(&rq->napi)) {
559
		virtqueue_disable_cb(rvq);
560
		__napi_schedule(&rq->napi);
561
	}
R
Rusty Russell 已提交
562 563
}

564
static void virtnet_napi_enable(struct receive_queue *rq)
565
{
566
	napi_enable(&rq->napi);
567 568 569 570 571

	/* If all buffers were filled by other side before we napi_enabled, we
	 * won't get another interrupt, so process any outstanding packets
	 * now.  virtnet_poll wants re-enable the queue, so we disable here.
	 * We synchronize against interrupts via NAPI_STATE_SCHED */
572 573
	if (napi_schedule_prep(&rq->napi)) {
		virtqueue_disable_cb(rq->vq);
574
		local_bh_disable();
575
		__napi_schedule(&rq->napi);
576
		local_bh_enable();
577 578 579
	}
}

580 581
static void refill_work(struct work_struct *work)
{
582 583
	struct virtnet_info *vi =
		container_of(work, struct virtnet_info, refill.work);
584
	bool still_empty;
J
Jason Wang 已提交
585 586
	int i;

587
	for (i = 0; i < vi->curr_queue_pairs; i++) {
J
Jason Wang 已提交
588
		struct receive_queue *rq = &vi->rq[i];
589

J
Jason Wang 已提交
590 591 592
		napi_disable(&rq->napi);
		still_empty = !try_fill_recv(rq, GFP_KERNEL);
		virtnet_napi_enable(rq);
593

J
Jason Wang 已提交
594 595 596 597 598 599
		/* In theory, this can happen: if we don't get any buffers in
		 * we will *never* try to fill again.
		 */
		if (still_empty)
			schedule_delayed_work(&vi->refill, HZ/2);
	}
600 601
}

R
Rusty Russell 已提交
602 603
static int virtnet_poll(struct napi_struct *napi, int budget)
{
604 605 606
	struct receive_queue *rq =
		container_of(napi, struct receive_queue, napi);
	struct virtnet_info *vi = rq->vq->vdev->priv;
607
	void *buf;
608
	unsigned int r, len, received = 0;
R
Rusty Russell 已提交
609 610 611

again:
	while (received < budget &&
612 613 614
	       (buf = virtqueue_get_buf(rq->vq, &len)) != NULL) {
		receive_buf(rq, buf, len);
		--rq->num;
R
Rusty Russell 已提交
615 616 617
		received++;
	}

618 619
	if (rq->num < rq->max / 2) {
		if (!try_fill_recv(rq, GFP_ATOMIC))
620
			schedule_delayed_work(&vi->refill, 0);
621
	}
R
Rusty Russell 已提交
622

623 624
	/* Out of packets? */
	if (received < budget) {
625
		r = virtqueue_enable_cb_prepare(rq->vq);
626
		napi_complete(napi);
627
		if (unlikely(virtqueue_poll(rq->vq, r)) &&
628
		    napi_schedule_prep(napi)) {
629
			virtqueue_disable_cb(rq->vq);
630
			__napi_schedule(napi);
R
Rusty Russell 已提交
631
			goto again;
632
		}
R
Rusty Russell 已提交
633 634 635 636 637
	}

	return received;
}

J
Jason Wang 已提交
638 639 640 641 642
static int virtnet_open(struct net_device *dev)
{
	struct virtnet_info *vi = netdev_priv(dev);
	int i;

643 644 645 646 647
	for (i = 0; i < vi->max_queue_pairs; i++) {
		if (i < vi->curr_queue_pairs)
			/* Make sure we have some buffers: if oom use wq. */
			if (!try_fill_recv(&vi->rq[i], GFP_KERNEL))
				schedule_delayed_work(&vi->refill, 0);
J
Jason Wang 已提交
648 649 650 651 652 653
		virtnet_napi_enable(&vi->rq[i]);
	}

	return 0;
}

654
static void free_old_xmit_skbs(struct send_queue *sq)
R
Rusty Russell 已提交
655 656
{
	struct sk_buff *skb;
657
	unsigned int len;
658
	struct virtnet_info *vi = sq->vq->vdev->priv;
E
Eric Dumazet 已提交
659
	struct virtnet_stats *stats = this_cpu_ptr(vi->stats);
R
Rusty Russell 已提交
660

661
	while ((skb = virtqueue_get_buf(sq->vq, &len)) != NULL) {
R
Rusty Russell 已提交
662
		pr_debug("Sent skb %p\n", skb);
663

664
		u64_stats_update_begin(&stats->tx_syncp);
665 666
		stats->tx_bytes += skb->len;
		stats->tx_packets++;
667
		u64_stats_update_end(&stats->tx_syncp);
668

669
		dev_kfree_skb_any(skb);
R
Rusty Russell 已提交
670 671 672
	}
}

673
static int xmit_skb(struct send_queue *sq, struct sk_buff *skb)
R
Rusty Russell 已提交
674
{
675
	struct skb_vnet_hdr *hdr;
R
Rusty Russell 已提交
676
	const unsigned char *dest = ((struct ethhdr *)skb->data)->h_dest;
677
	struct virtnet_info *vi = sq->vq->vdev->priv;
678
	unsigned num_sg;
679 680
	unsigned hdr_len;
	bool can_push;
R
Rusty Russell 已提交
681

J
Johannes Berg 已提交
682
	pr_debug("%s: xmit %p %pM\n", vi->dev->name, skb, dest);
683 684 685 686 687 688 689 690 691 692 693 694 695 696
	if (vi->mergeable_rx_bufs)
		hdr_len = sizeof hdr->mhdr;
	else
		hdr_len = sizeof hdr->hdr;

	can_push = vi->any_header_sg &&
		!((unsigned long)skb->data & (__alignof__(*hdr) - 1)) &&
		!skb_header_cloned(skb) && skb_headroom(skb) >= hdr_len;
	/* Even if we can, don't push here yet as this would skew
	 * csum_start offset below. */
	if (can_push)
		hdr = (struct skb_vnet_hdr *)(skb->data - hdr_len);
	else
		hdr = skb_vnet_hdr(skb);
R
Rusty Russell 已提交
697 698

	if (skb->ip_summed == CHECKSUM_PARTIAL) {
699
		hdr->hdr.flags = VIRTIO_NET_HDR_F_NEEDS_CSUM;
700
		hdr->hdr.csum_start = skb_checksum_start_offset(skb);
701
		hdr->hdr.csum_offset = skb->csum_offset;
R
Rusty Russell 已提交
702
	} else {
703 704
		hdr->hdr.flags = 0;
		hdr->hdr.csum_offset = hdr->hdr.csum_start = 0;
R
Rusty Russell 已提交
705 706 707
	}

	if (skb_is_gso(skb)) {
708 709
		hdr->hdr.hdr_len = skb_headlen(skb);
		hdr->hdr.gso_size = skb_shinfo(skb)->gso_size;
R
Rusty Russell 已提交
710
		if (skb_shinfo(skb)->gso_type & SKB_GSO_TCPV4)
711
			hdr->hdr.gso_type = VIRTIO_NET_HDR_GSO_TCPV4;
R
Rusty Russell 已提交
712
		else if (skb_shinfo(skb)->gso_type & SKB_GSO_TCPV6)
713
			hdr->hdr.gso_type = VIRTIO_NET_HDR_GSO_TCPV6;
R
Rusty Russell 已提交
714
		else if (skb_shinfo(skb)->gso_type & SKB_GSO_UDP)
715
			hdr->hdr.gso_type = VIRTIO_NET_HDR_GSO_UDP;
R
Rusty Russell 已提交
716 717
		else
			BUG();
R
Rusty Russell 已提交
718
		if (skb_shinfo(skb)->gso_type & SKB_GSO_TCP_ECN)
719
			hdr->hdr.gso_type |= VIRTIO_NET_HDR_GSO_ECN;
R
Rusty Russell 已提交
720
	} else {
721 722
		hdr->hdr.gso_type = VIRTIO_NET_HDR_GSO_NONE;
		hdr->hdr.gso_size = hdr->hdr.hdr_len = 0;
R
Rusty Russell 已提交
723 724
	}

725
	if (vi->mergeable_rx_bufs)
726
		hdr->mhdr.num_buffers = 0;
727

728 729 730 731 732 733 734 735 736
	if (can_push) {
		__skb_push(skb, hdr_len);
		num_sg = skb_to_sgvec(skb, sq->sg, 0, skb->len);
		/* Pull header back to avoid skew in tx bytes calculations. */
		__skb_pull(skb, hdr_len);
	} else {
		sg_set_buf(sq->sg, hdr, hdr_len);
		num_sg = skb_to_sgvec(skb, sq->sg + 1, 0, skb->len) + 1;
	}
737
	return virtqueue_add_outbuf(sq->vq, sq->sg, num_sg, skb, GFP_ATOMIC);
738 739
}

740
static netdev_tx_t start_xmit(struct sk_buff *skb, struct net_device *dev)
741 742
{
	struct virtnet_info *vi = netdev_priv(dev);
J
Jason Wang 已提交
743 744
	int qnum = skb_get_queue_mapping(skb);
	struct send_queue *sq = &vi->sq[qnum];
745
	int err;
746 747

	/* Free up any pending old buffers before queueing new ones. */
748
	free_old_xmit_skbs(sq);
749

750
	/* Try to transmit */
751
	err = xmit_skb(sq, skb);
752

753
	/* This should not happen! */
754
	if (unlikely(err)) {
755 756 757
		dev->stats.tx_fifo_errors++;
		if (net_ratelimit())
			dev_warn(&dev->dev,
758
				 "Unexpected TXQ (%d) queue failure: %d\n", qnum, err);
759 760 761
		dev->stats.tx_dropped++;
		kfree_skb(skb);
		return NETDEV_TX_OK;
R
Rusty Russell 已提交
762
	}
763
	virtqueue_kick(sq->vq);
764

765 766 767 768 769 770
	/* Don't wait up for transmitted skbs to be freed. */
	skb_orphan(skb);
	nf_reset(skb);

	/* Apparently nice girls don't return TX_BUSY; stop the queue
	 * before it gets out of hand.  Naturally, this wastes entries. */
771
	if (sq->vq->num_free < 2+MAX_SKB_FRAGS) {
J
Jason Wang 已提交
772
		netif_stop_subqueue(dev, qnum);
773
		if (unlikely(!virtqueue_enable_cb_delayed(sq->vq))) {
774
			/* More just got used, free them then recheck. */
775 776
			free_old_xmit_skbs(sq);
			if (sq->vq->num_free >= 2+MAX_SKB_FRAGS) {
J
Jason Wang 已提交
777
				netif_start_subqueue(dev, qnum);
778
				virtqueue_disable_cb(sq->vq);
779 780
			}
		}
781
	}
782 783

	return NETDEV_TX_OK;
R
Rusty Russell 已提交
784 785
}

786 787 788 789 790 791
/*
 * Issue one command on the control virtqueue and wait for its status.
 *
 * @out and @in are optional scatterlists for command data sent to, and
 * returned by, the device.  Returns true if the device acknowledged the
 * command with VIRTIO_NET_OK.  Commands advertised through feature bits
 * should never fail unless they are malformed.
 */
static bool virtnet_send_command(struct virtnet_info *vi, u8 class, u8 cmd,
				 struct scatterlist *out,
				 struct scatterlist *in)
{
	struct scatterlist *sgs[4], hdr, stat;
	struct virtio_net_ctrl_hdr ctrl;
	virtio_net_ctrl_ack status = ~0;
	unsigned out_num = 0, in_num = 0, tmp;
	int err;

	/* Caller should know better */
	BUG_ON(!virtio_has_feature(vi->vdev, VIRTIO_NET_F_CTRL_VQ));

	/* Device-readable part: command header, then optional payload */
	ctrl.class = class;
	ctrl.cmd = cmd;
	sg_init_one(&hdr, &ctrl, sizeof(ctrl));
	sgs[out_num++] = &hdr;
	if (out)
		sgs[out_num++] = out;

	/* Device-writable part: optional reply data, then the status byte */
	if (in)
		sgs[out_num + in_num++] = in;
	sg_init_one(&stat, &status, sizeof(status));
	sgs[out_num + in_num++] = &stat;

	BUG_ON(out_num + in_num > ARRAY_SIZE(sgs));
	err = virtqueue_add_sgs(vi->cvq, sgs, out_num, in_num, vi, GFP_ATOMIC);
	BUG_ON(err < 0);

	virtqueue_kick(vi->cvq);

	/* Spin for a response, the kick causes an ioport write, trapping
	 * into the hypervisor, so the request should be handled immediately.
	 */
	while (!virtqueue_get_buf(vi->cvq, &tmp))
		cpu_relax();

	return status == VIRTIO_NET_OK;
}

833 834 835 836
static int virtnet_set_mac_address(struct net_device *dev, void *p)
{
	struct virtnet_info *vi = netdev_priv(dev);
	struct virtio_device *vdev = vi->vdev;
837
	int ret;
838 839
	struct sockaddr *addr = p;
	struct scatterlist sg;
840

841
	ret = eth_prepare_mac_addr_change(dev, p);
842 843
	if (ret)
		return ret;
844

845 846 847 848
	if (virtio_has_feature(vdev, VIRTIO_NET_F_CTRL_MAC_ADDR)) {
		sg_init_one(&sg, addr->sa_data, dev->addr_len);
		if (!virtnet_send_command(vi, VIRTIO_NET_CTRL_MAC,
					  VIRTIO_NET_CTRL_MAC_ADDR_SET,
849
					  &sg, NULL)) {
850 851 852 853 854
			dev_warn(&vdev->dev,
				 "Failed to set mac address by vq command.\n");
			return -EINVAL;
		}
	} else if (virtio_has_feature(vdev, VIRTIO_NET_F_MAC)) {
855
		vdev->config->set(vdev, offsetof(struct virtio_net_config, mac),
856 857 858 859
				  addr->sa_data, dev->addr_len);
	}

	eth_commit_mac_addr_change(dev, p);
860 861 862 863

	return 0;
}

864 865 866 867 868 869 870 871
/*
 * Fill @tot with the device statistics: the per-cpu packet/byte counters
 * summed over all possible CPUs, plus the error and drop counters kept in
 * dev->stats.  Returns @tot.
 */
static struct rtnl_link_stats64 *virtnet_stats(struct net_device *dev,
					       struct rtnl_link_stats64 *tot)
{
	struct virtnet_info *vi = netdev_priv(dev);
	unsigned int start;
	int cpu;

	for_each_possible_cpu(cpu) {
		struct virtnet_stats *stats = per_cpu_ptr(vi->stats, cpu);
		u64 tpackets, tbytes, rpackets, rbytes;

		/* Snapshot the tx pair; retry if an update raced with us. */
		do {
			start = u64_stats_fetch_begin_bh(&stats->tx_syncp);
			tpackets = stats->tx_packets;
			tbytes   = stats->tx_bytes;
		} while (u64_stats_fetch_retry_bh(&stats->tx_syncp, start));

		/* Same for the rx pair. */
		do {
			start = u64_stats_fetch_begin_bh(&stats->rx_syncp);
			rpackets = stats->rx_packets;
			rbytes   = stats->rx_bytes;
		} while (u64_stats_fetch_retry_bh(&stats->rx_syncp, start));

		tot->rx_packets += rpackets;
		tot->tx_packets += tpackets;
		tot->rx_bytes   += rbytes;
		tot->tx_bytes   += tbytes;
	}

	/* These counters live in the net_device itself. */
	tot->tx_dropped = dev->stats.tx_dropped;
	tot->tx_fifo_errors = dev->stats.tx_fifo_errors;
	tot->rx_dropped = dev->stats.rx_dropped;
	tot->rx_length_errors = dev->stats.rx_length_errors;
	tot->rx_frame_errors = dev->stats.rx_frame_errors;

	return tot;
}

902 903 904 905
#ifdef CONFIG_NET_POLL_CONTROLLER
/* Netpoll hook: schedule NAPI on every receive queue currently in use. */
static void virtnet_netpoll(struct net_device *dev)
{
	struct virtnet_info *vi = netdev_priv(dev);
	int i = 0;

	while (i < vi->curr_queue_pairs) {
		napi_schedule(&vi->rq[i].napi);
		i++;
	}
}
#endif

913 914 915 916
static void virtnet_ack_link_announce(struct virtnet_info *vi)
{
	rtnl_lock();
	if (!virtnet_send_command(vi, VIRTIO_NET_CTRL_ANNOUNCE,
917
				  VIRTIO_NET_CTRL_ANNOUNCE_ACK, NULL, NULL))
918 919 920 921
		dev_warn(&vi->dev->dev, "Failed to ack link announce.\n");
	rtnl_unlock();
}

J
Jason Wang 已提交
922 923 924 925 926 927 928 929 930 931 932 933 934
/*
 * Tell the device how many queue pairs the driver wants to use.
 *
 * Does nothing (and returns 0) when the device has no control virtqueue or
 * lacks VIRTIO_NET_F_MQ.  On success curr_queue_pairs is updated and, if the
 * interface is up, a refill is scheduled so newly activated receive queues
 * get buffers.  Returns -EINVAL if the device rejects the command.
 */
static int virtnet_set_queues(struct virtnet_info *vi, u16 queue_pairs)
{
	struct scatterlist sg;
	struct virtio_net_ctrl_mq s;
	struct net_device *dev = vi->dev;

	if (!vi->has_cvq || !virtio_has_feature(vi->vdev, VIRTIO_NET_F_MQ))
		return 0;

	s.virtqueue_pairs = queue_pairs;
	sg_init_one(&sg, &s, sizeof(s));

	if (!virtnet_send_command(vi, VIRTIO_NET_CTRL_MQ,
				  VIRTIO_NET_CTRL_MQ_VQ_PAIRS_SET, &sg, NULL)) {
		dev_warn(&dev->dev, "Fail to set num of queue pairs to %d\n",
			 queue_pairs);
		return -EINVAL;
	}

	vi->curr_queue_pairs = queue_pairs;

	/*
	 * refill_work() disables and re-enables NAPI on each queue, so it
	 * must not run while the interface is down: it would leave NAPI
	 * enabled behind virtnet_open()/virtnet_close()'s back.  When the
	 * interface is down, virtnet_open() does the fill on the way up.
	 */
	if (dev->flags & IFF_UP)
		schedule_delayed_work(&vi->refill, 0);

	return 0;
}

R
Rusty Russell 已提交
947 948 949
/*
 * Take the interface down: stop the refill work, then disable NAPI on
 * every queue the device supports.  Always returns 0.
 */
static int virtnet_close(struct net_device *dev)
{
	struct virtnet_info *vi = netdev_priv(dev);
	int i = 0;

	/* Make sure refill_work doesn't re-enable napi! */
	cancel_delayed_work_sync(&vi->refill);

	while (i < vi->max_queue_pairs) {
		napi_disable(&vi->rq[i].napi);
		i++;
	}

	return 0;
}

961 962 963
static void virtnet_set_rx_mode(struct net_device *dev)
{
	struct virtnet_info *vi = netdev_priv(dev);
964
	struct scatterlist sg[2];
965
	u8 promisc, allmulti;
966
	struct virtio_net_ctrl_mac *mac_data;
J
Jiri Pirko 已提交
967
	struct netdev_hw_addr *ha;
968
	int uc_count;
969
	int mc_count;
970 971
	void *buf;
	int i;
972 973 974 975 976

	/* We can't dynamicaly set ndo_set_rx_mode, so return gracefully */
	if (!virtio_has_feature(vi->vdev, VIRTIO_NET_F_CTRL_RX))
		return;

977 978
	promisc = ((dev->flags & IFF_PROMISC) != 0);
	allmulti = ((dev->flags & IFF_ALLMULTI) != 0);
979

980
	sg_init_one(sg, &promisc, sizeof(promisc));
981 982 983

	if (!virtnet_send_command(vi, VIRTIO_NET_CTRL_RX,
				  VIRTIO_NET_CTRL_RX_PROMISC,
984
				  sg, NULL))
985 986 987
		dev_warn(&dev->dev, "Failed to %sable promisc mode.\n",
			 promisc ? "en" : "dis");

988
	sg_init_one(sg, &allmulti, sizeof(allmulti));
989 990 991

	if (!virtnet_send_command(vi, VIRTIO_NET_CTRL_RX,
				  VIRTIO_NET_CTRL_RX_ALLMULTI,
992
				  sg, NULL))
993 994
		dev_warn(&dev->dev, "Failed to %sable allmulti mode.\n",
			 allmulti ? "en" : "dis");
995

996
	uc_count = netdev_uc_count(dev);
997
	mc_count = netdev_mc_count(dev);
998
	/* MAC filter - use one buffer for both lists */
999 1000 1001
	buf = kzalloc(((uc_count + mc_count) * ETH_ALEN) +
		      (2 * sizeof(mac_data->entries)), GFP_ATOMIC);
	mac_data = buf;
1002
	if (!buf)
1003 1004
		return;

1005 1006
	sg_init_table(sg, 2);

1007
	/* Store the unicast list and count in the front of the buffer */
1008
	mac_data->entries = uc_count;
J
Jiri Pirko 已提交
1009
	i = 0;
1010
	netdev_for_each_uc_addr(ha, dev)
J
Jiri Pirko 已提交
1011
		memcpy(&mac_data->macs[i++][0], ha->addr, ETH_ALEN);
1012 1013

	sg_set_buf(&sg[0], mac_data,
1014
		   sizeof(mac_data->entries) + (uc_count * ETH_ALEN));
1015 1016

	/* multicast list and count fill the end */
1017
	mac_data = (void *)&mac_data->macs[uc_count][0];
1018

1019
	mac_data->entries = mc_count;
1020
	i = 0;
1021 1022
	netdev_for_each_mc_addr(ha, dev)
		memcpy(&mac_data->macs[i++][0], ha->addr, ETH_ALEN);
1023 1024

	sg_set_buf(&sg[1], mac_data,
1025
		   sizeof(mac_data->entries) + (mc_count * ETH_ALEN));
1026 1027 1028

	if (!virtnet_send_command(vi, VIRTIO_NET_CTRL_MAC,
				  VIRTIO_NET_CTRL_MAC_TABLE_SET,
1029
				  sg, NULL))
1030 1031 1032
		dev_warn(&dev->dev, "Failed to set MAC fitler table.\n");

	kfree(buf);
1033 1034
}

1035 1036
/* Send a VIRTIO_NET_CTRL_VLAN_ADD control command carrying @vid.
 *
 * @proto is not used.  A failed command is only logged; the function
 * always returns 0.
 */
static int virtnet_vlan_rx_add_vid(struct net_device *dev,
				   __be16 proto, u16 vid)
{
	struct virtnet_info *vi = netdev_priv(dev);
	struct scatterlist vid_sg;
	bool sent;

	sg_init_one(&vid_sg, &vid, sizeof(vid));

	sent = virtnet_send_command(vi, VIRTIO_NET_CTRL_VLAN,
				    VIRTIO_NET_CTRL_VLAN_ADD, &vid_sg, NULL);
	if (!sent)
		dev_warn(&dev->dev, "Failed to add VLAN ID %d.\n", vid);

	return 0;
}

1049 1050
/* Send a VIRTIO_NET_CTRL_VLAN_DEL control command carrying @vid.
 *
 * @proto is not used.  A failed command is only logged; the function
 * always returns 0.
 */
static int virtnet_vlan_rx_kill_vid(struct net_device *dev,
				    __be16 proto, u16 vid)
{
	struct virtnet_info *vi = netdev_priv(dev);
	struct scatterlist vid_sg;
	bool sent;

	sg_init_one(&vid_sg, &vid, sizeof(vid));

	sent = virtnet_send_command(vi, VIRTIO_NET_CTRL_VLAN,
				    VIRTIO_NET_CTRL_VLAN_DEL, &vid_sg, NULL);
	if (!sent)
		dev_warn(&dev->dev, "Failed to kill VLAN ID %d.\n", vid);

	return 0;
}

1063
static void virtnet_clean_affinity(struct virtnet_info *vi, long hcpu)
J
Jason Wang 已提交
1064 1065
{
	int i;
1066
	int cpu;
J
Jason Wang 已提交
1067

1068 1069
	if (vi->affinity_hint_set) {
		for (i = 0; i < vi->max_queue_pairs; i++) {
1070 1071 1072 1073
			virtqueue_set_affinity(vi->rq[i].vq, -1);
			virtqueue_set_affinity(vi->sq[i].vq, -1);
		}

1074 1075 1076 1077 1078 1079 1080 1081
		vi->affinity_hint_set = false;
	}

	i = 0;
	for_each_online_cpu(cpu) {
		if (cpu == hcpu) {
			*per_cpu_ptr(vi->vq_index, cpu) = -1;
		} else {
1082 1083
			*per_cpu_ptr(vi->vq_index, cpu) =
				++i % vi->curr_queue_pairs;
1084 1085 1086
		}
	}
}
1087

1088 1089 1090 1091
static void virtnet_set_affinity(struct virtnet_info *vi)
{
	int i;
	int cpu;
J
Jason Wang 已提交
1092 1093 1094 1095 1096

	/* In multiqueue mode, when the number of cpu is equal to the number of
	 * queue pairs, we let the queue pairs to be private to one cpu by
	 * setting the affinity hint to eliminate the contention.
	 */
1097 1098 1099 1100
	if (vi->curr_queue_pairs == 1 ||
	    vi->max_queue_pairs != num_online_cpus()) {
		virtnet_clean_affinity(vi, -1);
		return;
J
Jason Wang 已提交
1101 1102
	}

1103 1104
	i = 0;
	for_each_online_cpu(cpu) {
J
Jason Wang 已提交
1105 1106
		virtqueue_set_affinity(vi->rq[i].vq, cpu);
		virtqueue_set_affinity(vi->sq[i].vq, cpu);
1107 1108
		*per_cpu_ptr(vi->vq_index, cpu) = i;
		i++;
J
Jason Wang 已提交
1109 1110
	}

1111
	vi->affinity_hint_set = true;
J
Jason Wang 已提交
1112 1113
}

1114 1115 1116 1117 1118
static int virtnet_cpu_callback(struct notifier_block *nfb,
			        unsigned long action, void *hcpu)
{
	struct virtnet_info *vi = container_of(nfb, struct virtnet_info, nb);

1119 1120 1121 1122 1123
	mutex_lock(&vi->config_lock);

	if (!vi->config_enable)
		goto done;

1124 1125 1126 1127 1128 1129 1130 1131 1132 1133 1134 1135
	switch(action & ~CPU_TASKS_FROZEN) {
	case CPU_ONLINE:
	case CPU_DOWN_FAILED:
	case CPU_DEAD:
		virtnet_set_affinity(vi);
		break;
	case CPU_DOWN_PREPARE:
		virtnet_clean_affinity(vi, (long)hcpu);
		break;
	default:
		break;
	}
1136 1137 1138

done:
	mutex_unlock(&vi->config_lock);
1139
	return NOTIFY_OK;
J
Jason Wang 已提交
1140 1141
}

R
Rick Jones 已提交
1142 1143 1144 1145 1146
/* ethtool hook: report ring sizes.
 *
 * The sizes of the first rx and tx virtqueues are reported both as the
 * maximum and as the current number of pending entries.
 */
static void virtnet_get_ringparam(struct net_device *dev,
				  struct ethtool_ringparam *ring)
{
	struct virtnet_info *vi = netdev_priv(dev);
	unsigned int rx_size = virtqueue_get_vring_size(vi->rq[0].vq);
	unsigned int tx_size = virtqueue_get_vring_size(vi->sq[0].vq);

	ring->rx_max_pending = rx_size;
	ring->tx_max_pending = tx_size;
	ring->rx_pending = ring->rx_max_pending;
	ring->tx_pending = ring->tx_max_pending;
}

1153 1154 1155 1156 1157 1158 1159 1160 1161 1162 1163 1164 1165

/* ethtool hook: fill in driver name, driver version and bus name. */
static void virtnet_get_drvinfo(struct net_device *dev,
				struct ethtool_drvinfo *info)
{
	struct virtnet_info *vi = netdev_priv(dev);

	strlcpy(info->driver, KBUILD_MODNAME, sizeof(info->driver));
	strlcpy(info->version, VIRTNET_DRIVER_VERSION, sizeof(info->version));
	strlcpy(info->bus_info, virtio_bus_name(vi->vdev),
		sizeof(info->bus_info));
}

1166 1167 1168 1169 1170 1171 1172 1173 1174 1175 1176 1177 1178 1179 1180 1181 1182
/* TODO: Eliminate OOO packets during switching */

/* ethtool hook: change the number of active combined rx/tx queue pairs.
 *
 * Only combined channels are supported.  A request is rejected with -EINVAL
 * when it asks for separate rx/tx or 'other' channels, for zero combined
 * channels, or for more than vi->max_queue_pairs.  Otherwise the result of
 * virtnet_set_queues() is returned; on success the stack's real queue counts
 * and the cpu affinity are updated to match.
 */
static int virtnet_set_channels(struct net_device *dev,
				struct ethtool_channels *channels)
{
	struct virtnet_info *vi = netdev_priv(dev);
	u16 queue_pairs;
	int err;

	/* We don't support separate rx/tx channels.
	 * We don't allow setting 'other' channels.
	 */
	if (channels->rx_count || channels->tx_count || channels->other_count)
		return -EINVAL;

	/* Validate the caller's value before it is narrowed to u16, so an
	 * oversized request cannot wrap around into the valid range, and
	 * insist on at least one queue pair: zero would leave the device
	 * with no queue to use.
	 */
	if (channels->combined_count == 0 ||
	    channels->combined_count > vi->max_queue_pairs)
		return -EINVAL;

	queue_pairs = channels->combined_count;

	/* The online cpu set is pinned while the queue count and the
	 * affinity derived from it are changed.
	 */
	get_online_cpus();
	err = virtnet_set_queues(vi, queue_pairs);
	if (!err) {
		netif_set_real_num_tx_queues(dev, queue_pairs);
		netif_set_real_num_rx_queues(dev, queue_pairs);

		virtnet_set_affinity(vi);
	}
	put_online_cpus();

	return err;
}

/* ethtool hook: report channel counts.
 *
 * Only combined channels are reported: the current and maximum number of
 * queue pairs.  The separate rx, tx and 'other' counts are set to zero.
 */
static void virtnet_get_channels(struct net_device *dev,
				 struct ethtool_channels *channels)
{
	struct virtnet_info *vi = netdev_priv(dev);

	/* Combined rx/tx pairs. */
	channels->max_combined = vi->max_queue_pairs;
	channels->combined_count = vi->curr_queue_pairs;

	/* Nothing else is supported. */
	channels->max_other = 0;
	channels->other_count = 0;
	channels->rx_count = 0;
	channels->tx_count = 0;
}

1209
static const struct ethtool_ops virtnet_ethtool_ops = {
1210
	.get_drvinfo = virtnet_get_drvinfo,
1211
	.get_link = ethtool_op_get_link,
R
Rick Jones 已提交
1212
	.get_ringparam = virtnet_get_ringparam,
1213 1214
	.set_channels = virtnet_set_channels,
	.get_channels = virtnet_get_channels,
1215 1216
};

M
Mark McLoughlin 已提交
1217 1218 1219 1220 1221 1222 1223 1224 1225 1226 1227
#define MIN_MTU 68
#define MAX_MTU 65535

static int virtnet_change_mtu(struct net_device *dev, int new_mtu)
{
	if (new_mtu < MIN_MTU || new_mtu > MAX_MTU)
		return -EINVAL;
	dev->mtu = new_mtu;
	return 0;
}

J
Jason Wang 已提交
1228 1229 1230 1231 1232
/* To avoid contending a lock hold by a vcpu who would exit to host, select the
 * txq based on the processor id.
 */
static u16 virtnet_select_queue(struct net_device *dev, struct sk_buff *skb)
{
1233 1234 1235 1236 1237 1238 1239 1240 1241 1242
	int txq;
	struct virtnet_info *vi = netdev_priv(dev);

	if (skb_rx_queue_recorded(skb)) {
		txq = skb_get_rx_queue(skb);
	} else {
		txq = *__this_cpu_ptr(vi->vq_index);
		if (txq == -1)
			txq = 0;
	}
J
Jason Wang 已提交
1243 1244 1245 1246 1247 1248 1249

	while (unlikely(txq >= dev->real_num_tx_queues))
		txq -= dev->real_num_tx_queues;

	return txq;
}

1250 1251 1252 1253 1254
static const struct net_device_ops virtnet_netdev = {
	.ndo_open            = virtnet_open,
	.ndo_stop   	     = virtnet_close,
	.ndo_start_xmit      = start_xmit,
	.ndo_validate_addr   = eth_validate_addr,
1255
	.ndo_set_mac_address = virtnet_set_mac_address,
1256
	.ndo_set_rx_mode     = virtnet_set_rx_mode,
1257
	.ndo_change_mtu	     = virtnet_change_mtu,
1258
	.ndo_get_stats64     = virtnet_stats,
1259 1260
	.ndo_vlan_rx_add_vid = virtnet_vlan_rx_add_vid,
	.ndo_vlan_rx_kill_vid = virtnet_vlan_rx_kill_vid,
J
Jason Wang 已提交
1261
	.ndo_select_queue     = virtnet_select_queue,
1262 1263 1264 1265 1266
#ifdef CONFIG_NET_POLL_CONTROLLER
	.ndo_poll_controller = virtnet_netpoll,
#endif
};

1267
static void virtnet_config_changed_work(struct work_struct *work)
1268
{
1269 1270
	struct virtnet_info *vi =
		container_of(work, struct virtnet_info, config_work);
1271 1272
	u16 v;

1273 1274 1275 1276
	mutex_lock(&vi->config_lock);
	if (!vi->config_enable)
		goto done;

1277
	if (virtio_config_val(vi->vdev, VIRTIO_NET_F_STATUS,
1278
			      offsetof(struct virtio_net_config, status),
1279
			      &v) < 0)
1280 1281 1282
		goto done;

	if (v & VIRTIO_NET_S_ANNOUNCE) {
1283
		netdev_notify_peers(vi->dev);
1284 1285
		virtnet_ack_link_announce(vi);
	}
1286 1287 1288 1289 1290

	/* Ignore unknown (future) status bits */
	v &= VIRTIO_NET_S_LINK_UP;

	if (vi->status == v)
1291
		goto done;
1292 1293 1294 1295 1296

	vi->status = v;

	if (vi->status & VIRTIO_NET_S_LINK_UP) {
		netif_carrier_on(vi->dev);
J
Jason Wang 已提交
1297
		netif_tx_wake_all_queues(vi->dev);
1298 1299
	} else {
		netif_carrier_off(vi->dev);
J
Jason Wang 已提交
1300
		netif_tx_stop_all_queues(vi->dev);
1301
	}
1302 1303
done:
	mutex_unlock(&vi->config_lock);
1304 1305 1306 1307 1308 1309
}

static void virtnet_config_changed(struct virtio_device *vdev)
{
	struct virtnet_info *vi = vdev->priv;

1310
	schedule_work(&vi->config_work);
1311 1312
}

J
Jason Wang 已提交
1313 1314 1315 1316 1317 1318 1319 1320 1321 1322 1323 1324 1325 1326 1327 1328 1329 1330 1331 1332 1333 1334 1335 1336 1337 1338 1339 1340 1341 1342 1343 1344 1345 1346 1347 1348 1349 1350 1351 1352 1353
/* Release the send and receive queue arrays.
 *
 * Each receive queue embeds a NAPI context that virtnet_alloc_queues()
 * registers with netif_napi_add().  These contexts are removed from the
 * net_device before the array that holds them is freed, so the device is
 * not left referring to freed memory.
 *
 * NOTE(review): virtnet_freeze() may already have called netif_napi_del()
 * on these contexts; a second call is expected to be harmless - confirm
 * against the netif_napi_del() implementation of the target kernel.
 */
static void virtnet_free_queues(struct virtnet_info *vi)
{
	int i;

	for (i = 0; i < vi->max_queue_pairs; i++)
		netif_napi_del(&vi->rq[i].napi);

	kfree(vi->rq);
	kfree(vi->sq);
}

/* Free every page still held on the page list of each receive queue. */
static void free_receive_bufs(struct virtnet_info *vi)
{
	int qp = 0;

	while (qp < vi->max_queue_pairs) {
		for (; vi->rq[qp].pages; )
			__free_pages(get_a_page(&vi->rq[qp], GFP_KERNEL), 0);
		qp++;
	}
}

static void free_unused_bufs(struct virtnet_info *vi)
{
	void *buf;
	int i;

	for (i = 0; i < vi->max_queue_pairs; i++) {
		struct virtqueue *vq = vi->sq[i].vq;
		while ((buf = virtqueue_detach_unused_buf(vq)) != NULL)
			dev_kfree_skb(buf);
	}

	for (i = 0; i < vi->max_queue_pairs; i++) {
		struct virtqueue *vq = vi->rq[i].vq;

		while ((buf = virtqueue_detach_unused_buf(vq)) != NULL) {
			if (vi->mergeable_rx_bufs || vi->big_packets)
				give_pages(&vi->rq[i], buf);
			else
				dev_kfree_skb(buf);
			--vi->rq[i].num;
		}
		BUG_ON(vi->rq[i].num != 0);
	}
}

1354 1355 1356 1357
static void virtnet_del_vqs(struct virtnet_info *vi)
{
	struct virtio_device *vdev = vi->vdev;

1358
	virtnet_clean_affinity(vi, -1);
J
Jason Wang 已提交
1359

1360
	vdev->config->del_vqs(vdev);
J
Jason Wang 已提交
1361 1362

	virtnet_free_queues(vi);
1363 1364
}

J
Jason Wang 已提交
1365
static int virtnet_find_vqs(struct virtnet_info *vi)
1366
{
J
Jason Wang 已提交
1367 1368 1369 1370 1371 1372 1373 1374 1375 1376 1377 1378 1379 1380 1381 1382 1383 1384 1385 1386 1387 1388 1389 1390 1391 1392 1393 1394 1395
	vq_callback_t **callbacks;
	struct virtqueue **vqs;
	int ret = -ENOMEM;
	int i, total_vqs;
	const char **names;

	/* We expect 1 RX virtqueue followed by 1 TX virtqueue, followed by
	 * possible N-1 RX/TX queue pairs used in multiqueue mode, followed by
	 * possible control vq.
	 */
	total_vqs = vi->max_queue_pairs * 2 +
		    virtio_has_feature(vi->vdev, VIRTIO_NET_F_CTRL_VQ);

	/* Allocate space for find_vqs parameters */
	vqs = kzalloc(total_vqs * sizeof(*vqs), GFP_KERNEL);
	if (!vqs)
		goto err_vq;
	callbacks = kmalloc(total_vqs * sizeof(*callbacks), GFP_KERNEL);
	if (!callbacks)
		goto err_callback;
	names = kmalloc(total_vqs * sizeof(*names), GFP_KERNEL);
	if (!names)
		goto err_names;

	/* Parameters for control virtqueue, if any */
	if (vi->has_cvq) {
		callbacks[total_vqs - 1] = NULL;
		names[total_vqs - 1] = "control";
	}
1396

J
Jason Wang 已提交
1397 1398 1399 1400 1401 1402 1403 1404 1405
	/* Allocate/initialize parameters for send/receive virtqueues */
	for (i = 0; i < vi->max_queue_pairs; i++) {
		callbacks[rxq2vq(i)] = skb_recv_done;
		callbacks[txq2vq(i)] = skb_xmit_done;
		sprintf(vi->rq[i].name, "input.%d", i);
		sprintf(vi->sq[i].name, "output.%d", i);
		names[rxq2vq(i)] = vi->rq[i].name;
		names[txq2vq(i)] = vi->sq[i].name;
	}
1406

J
Jason Wang 已提交
1407 1408 1409 1410
	ret = vi->vdev->config->find_vqs(vi->vdev, total_vqs, vqs, callbacks,
					 names);
	if (ret)
		goto err_find;
1411

J
Jason Wang 已提交
1412 1413
	if (vi->has_cvq) {
		vi->cvq = vqs[total_vqs - 1];
1414
		if (virtio_has_feature(vi->vdev, VIRTIO_NET_F_CTRL_VLAN))
1415
			vi->dev->features |= NETIF_F_HW_VLAN_CTAG_FILTER;
1416
	}
J
Jason Wang 已提交
1417 1418 1419 1420 1421 1422 1423 1424 1425 1426

	for (i = 0; i < vi->max_queue_pairs; i++) {
		vi->rq[i].vq = vqs[rxq2vq(i)];
		vi->sq[i].vq = vqs[txq2vq(i)];
	}

	kfree(names);
	kfree(callbacks);
	kfree(vqs);

1427
	return 0;
J
Jason Wang 已提交
1428 1429 1430 1431 1432 1433 1434 1435 1436 1437 1438 1439 1440 1441 1442 1443 1444 1445 1446

err_find:
	kfree(names);
err_names:
	kfree(callbacks);
err_callback:
	kfree(vqs);
err_vq:
	return ret;
}

/* Allocate and initialise the send and receive queue arrays, one entry per
 * possible queue pair, and register a NAPI context for each receive queue.
 *
 * Returns 0 on success or -ENOMEM, in which case nothing stays allocated.
 */
static int virtnet_alloc_queues(struct virtnet_info *vi)
{
	int qp;

	vi->sq = kzalloc(sizeof(*vi->sq) * vi->max_queue_pairs, GFP_KERNEL);
	if (!vi->sq)
		return -ENOMEM;

	vi->rq = kzalloc(sizeof(*vi->rq) * vi->max_queue_pairs, GFP_KERNEL);
	if (!vi->rq) {
		kfree(vi->sq);
		return -ENOMEM;
	}

	INIT_DELAYED_WORK(&vi->refill, refill_work);

	for (qp = 0; qp < vi->max_queue_pairs; qp++) {
		vi->rq[qp].pages = NULL;
		netif_napi_add(vi->dev, &vi->rq[qp].napi, virtnet_poll,
			       napi_weight);

		sg_init_table(vi->rq[qp].sg, ARRAY_SIZE(vi->rq[qp].sg));
		sg_init_table(vi->sq[qp].sg, ARRAY_SIZE(vi->sq[qp].sg));
	}

	return 0;
}

/* Allocate the queue arrays, find the virtqueues and set the cpu affinity.
 *
 * Returns 0 on success or the error of the step that failed; the queue
 * arrays are freed again when the virtqueue lookup fails.
 */
static int init_vqs(struct virtnet_info *vi)
{
	int ret;

	/* Send & receive queue bookkeeping. */
	ret = virtnet_alloc_queues(vi);
	if (ret)
		return ret;

	ret = virtnet_find_vqs(vi);
	if (ret) {
		virtnet_free_queues(vi);
		return ret;
	}

	get_online_cpus();
	virtnet_set_affinity(vi);
	put_online_cpus();

	return 0;
}

R
Rusty Russell 已提交
1493 1494
static int virtnet_probe(struct virtio_device *vdev)
{
J
Jason Wang 已提交
1495
	int i, err;
R
Rusty Russell 已提交
1496 1497
	struct net_device *dev;
	struct virtnet_info *vi;
J
Jason Wang 已提交
1498 1499 1500 1501 1502 1503 1504 1505 1506 1507 1508 1509
	u16 max_queue_pairs;

	/* Find if host supports multiqueue virtio_net device */
	err = virtio_config_val(vdev, VIRTIO_NET_F_MQ,
				offsetof(struct virtio_net_config,
				max_virtqueue_pairs), &max_queue_pairs);

	/* We need at least 2 queue's */
	if (err || max_queue_pairs < VIRTIO_NET_CTRL_MQ_VQ_PAIRS_MIN ||
	    max_queue_pairs > VIRTIO_NET_CTRL_MQ_VQ_PAIRS_MAX ||
	    !virtio_has_feature(vdev, VIRTIO_NET_F_CTRL_VQ))
		max_queue_pairs = 1;
R
Rusty Russell 已提交
1510 1511

	/* Allocate ourselves a network device with room for our info */
J
Jason Wang 已提交
1512
	dev = alloc_etherdev_mq(sizeof(struct virtnet_info), max_queue_pairs);
R
Rusty Russell 已提交
1513 1514 1515 1516
	if (!dev)
		return -ENOMEM;

	/* Set up network device as normal. */
1517
	dev->priv_flags |= IFF_UNICAST_FLT | IFF_LIVE_ADDR_CHANGE;
1518
	dev->netdev_ops = &virtnet_netdev;
R
Rusty Russell 已提交
1519
	dev->features = NETIF_F_HIGHDMA;
1520

1521
	SET_ETHTOOL_OPS(dev, &virtnet_ethtool_ops);
R
Rusty Russell 已提交
1522 1523 1524
	SET_NETDEV_DEV(dev, &vdev->dev);

	/* Do we support "hardware" checksums? */
1525
	if (virtio_has_feature(vdev, VIRTIO_NET_F_CSUM)) {
R
Rusty Russell 已提交
1526
		/* This opens up the world of extra features. */
1527 1528 1529 1530 1531 1532
		dev->hw_features |= NETIF_F_HW_CSUM|NETIF_F_SG|NETIF_F_FRAGLIST;
		if (csum)
			dev->features |= NETIF_F_HW_CSUM|NETIF_F_SG|NETIF_F_FRAGLIST;

		if (virtio_has_feature(vdev, VIRTIO_NET_F_GSO)) {
			dev->hw_features |= NETIF_F_TSO | NETIF_F_UFO
R
Rusty Russell 已提交
1533 1534
				| NETIF_F_TSO_ECN | NETIF_F_TSO6;
		}
1535
		/* Individual feature bits: what can host handle? */
1536 1537 1538 1539 1540 1541 1542 1543 1544 1545 1546 1547
		if (virtio_has_feature(vdev, VIRTIO_NET_F_HOST_TSO4))
			dev->hw_features |= NETIF_F_TSO;
		if (virtio_has_feature(vdev, VIRTIO_NET_F_HOST_TSO6))
			dev->hw_features |= NETIF_F_TSO6;
		if (virtio_has_feature(vdev, VIRTIO_NET_F_HOST_ECN))
			dev->hw_features |= NETIF_F_TSO_ECN;
		if (virtio_has_feature(vdev, VIRTIO_NET_F_HOST_UFO))
			dev->hw_features |= NETIF_F_UFO;

		if (gso)
			dev->features |= dev->hw_features & (NETIF_F_ALL_TSO|NETIF_F_UFO);
		/* (!csum && gso) case will be fixed by register_netdev() */
R
Rusty Russell 已提交
1548
	}
1549 1550
	if (virtio_has_feature(vdev, VIRTIO_NET_F_GUEST_CSUM))
		dev->features |= NETIF_F_RXCSUM;
R
Rusty Russell 已提交
1551

1552 1553
	dev->vlan_features = dev->features;

R
Rusty Russell 已提交
1554
	/* Configuration may specify what MAC to use.  Otherwise random. */
1555
	if (virtio_config_val_len(vdev, VIRTIO_NET_F_MAC,
1556
				  offsetof(struct virtio_net_config, mac),
1557
				  dev->dev_addr, dev->addr_len) < 0)
1558
		eth_hw_addr_random(dev);
R
Rusty Russell 已提交
1559 1560 1561 1562 1563

	/* Set up our device-specific information */
	vi = netdev_priv(dev);
	vi->dev = dev;
	vi->vdev = vdev;
1564
	vdev->priv = vi;
1565 1566 1567 1568 1569
	vi->stats = alloc_percpu(struct virtnet_stats);
	err = -ENOMEM;
	if (vi->stats == NULL)
		goto free;

1570 1571 1572 1573
	vi->vq_index = alloc_percpu(int);
	if (vi->vq_index == NULL)
		goto free_stats;

1574 1575 1576
	mutex_init(&vi->config_lock);
	vi->config_enable = true;
	INIT_WORK(&vi->config_work, virtnet_config_changed_work);
R
Rusty Russell 已提交
1577

1578
	/* If we can receive ANY GSO packets, we must allocate large ones. */
1579 1580 1581
	if (virtio_has_feature(vdev, VIRTIO_NET_F_GUEST_TSO4) ||
	    virtio_has_feature(vdev, VIRTIO_NET_F_GUEST_TSO6) ||
	    virtio_has_feature(vdev, VIRTIO_NET_F_GUEST_ECN))
1582 1583
		vi->big_packets = true;

1584 1585 1586
	if (virtio_has_feature(vdev, VIRTIO_NET_F_MRG_RXBUF))
		vi->mergeable_rx_bufs = true;

1587 1588 1589
	if (virtio_has_feature(vdev, VIRTIO_F_ANY_LAYOUT))
		vi->any_header_sg = true;

J
Jason Wang 已提交
1590 1591 1592 1593 1594 1595 1596 1597
	if (virtio_has_feature(vdev, VIRTIO_NET_F_CTRL_VQ))
		vi->has_cvq = true;

	/* Use single tx/rx queue pair as default */
	vi->curr_queue_pairs = 1;
	vi->max_queue_pairs = max_queue_pairs;

	/* Allocate/initialize the rx/tx queues, and invoke find_vqs */
1598
	err = init_vqs(vi);
1599
	if (err)
1600
		goto free_index;
R
Rusty Russell 已提交
1601

J
Jason Wang 已提交
1602 1603 1604
	netif_set_real_num_tx_queues(dev, 1);
	netif_set_real_num_rx_queues(dev, 1);

R
Rusty Russell 已提交
1605 1606 1607
	err = register_netdev(dev);
	if (err) {
		pr_debug("virtio_net: registering device failed\n");
1608
		goto free_vqs;
R
Rusty Russell 已提交
1609
	}
1610 1611

	/* Last of all, set up some receive buffers. */
1612
	for (i = 0; i < vi->curr_queue_pairs; i++) {
J
Jason Wang 已提交
1613 1614 1615 1616 1617 1618 1619 1620
		try_fill_recv(&vi->rq[i], GFP_KERNEL);

		/* If we didn't even get one input buffer, we're useless. */
		if (vi->rq[i].num == 0) {
			free_unused_bufs(vi);
			err = -ENOMEM;
			goto free_recv_bufs;
		}
1621 1622
	}

1623 1624 1625 1626 1627 1628 1629
	vi->nb.notifier_call = &virtnet_cpu_callback;
	err = register_hotcpu_notifier(&vi->nb);
	if (err) {
		pr_debug("virtio_net: registering cpu notifier failed\n");
		goto free_recv_bufs;
	}

J
Jason Wang 已提交
1630 1631 1632 1633
	/* Assume link up if device can't report link status,
	   otherwise get link status from config. */
	if (virtio_has_feature(vi->vdev, VIRTIO_NET_F_STATUS)) {
		netif_carrier_off(dev);
1634
		schedule_work(&vi->config_work);
J
Jason Wang 已提交
1635 1636 1637 1638
	} else {
		vi->status = VIRTIO_NET_S_LINK_UP;
		netif_carrier_on(dev);
	}
1639

J
Jason Wang 已提交
1640 1641 1642
	pr_debug("virtnet: registered device %s with %d RX and TX vq's\n",
		 dev->name, max_queue_pairs);

R
Rusty Russell 已提交
1643 1644
	return 0;

J
Jason Wang 已提交
1645 1646
free_recv_bufs:
	free_receive_bufs(vi);
1647
	unregister_netdev(dev);
1648
free_vqs:
J
Jason Wang 已提交
1649
	cancel_delayed_work_sync(&vi->refill);
1650
	virtnet_del_vqs(vi);
1651 1652
free_index:
	free_percpu(vi->vq_index);
1653 1654
free_stats:
	free_percpu(vi->stats);
R
Rusty Russell 已提交
1655 1656 1657 1658 1659
free:
	free_netdev(dev);
	return err;
}

1660
static void remove_vq_common(struct virtnet_info *vi)
R
Rusty Russell 已提交
1661
{
1662
	vi->vdev->config->reset(vi->vdev);
S
Shirley Ma 已提交
1663 1664

	/* Free unused buffers in both send and recv, if any. */
1665
	free_unused_bufs(vi);
1666

J
Jason Wang 已提交
1667
	free_receive_bufs(vi);
1668

J
Jason Wang 已提交
1669
	virtnet_del_vqs(vi);
1670 1671
}

1672
static void virtnet_remove(struct virtio_device *vdev)
1673 1674 1675
{
	struct virtnet_info *vi = vdev->priv;

1676 1677
	unregister_hotcpu_notifier(&vi->nb);

1678 1679 1680 1681 1682
	/* Prevent config work handler from accessing the device. */
	mutex_lock(&vi->config_lock);
	vi->config_enable = false;
	mutex_unlock(&vi->config_lock);

1683 1684 1685
	unregister_netdev(vi->dev);

	remove_vq_common(vi);
1686

1687 1688
	flush_work(&vi->config_work);

1689
	free_percpu(vi->vq_index);
1690
	free_percpu(vi->stats);
1691
	free_netdev(vi->dev);
R
Rusty Russell 已提交
1692 1693
}

1694 1695 1696 1697
#ifdef CONFIG_PM
/* Freeze callback: detach the net_device, stop NAPI on a running
 * interface and tear down the virtqueues.  Always returns 0.
 */
static int virtnet_freeze(struct virtio_device *vdev)
{
	struct virtnet_info *vi = vdev->priv;
	int qp;

	/* Keep the config work handler away from the device from now on. */
	mutex_lock(&vi->config_lock);
	vi->config_enable = false;
	mutex_unlock(&vi->config_lock);

	netif_device_detach(vi->dev);
	cancel_delayed_work_sync(&vi->refill);

	if (netif_running(vi->dev)) {
		for (qp = 0; qp < vi->max_queue_pairs; qp++) {
			napi_disable(&vi->rq[qp].napi);
			netif_napi_del(&vi->rq[qp].napi);
		}
	}

	remove_vq_common(vi);

	flush_work(&vi->config_work);

	return 0;
}

static int virtnet_restore(struct virtio_device *vdev)
{
	struct virtnet_info *vi = vdev->priv;
J
Jason Wang 已提交
1724
	int err, i;
1725 1726 1727 1728 1729 1730

	err = init_vqs(vi);
	if (err)
		return err;

	if (netif_running(vi->dev))
J
Jason Wang 已提交
1731 1732
		for (i = 0; i < vi->max_queue_pairs; i++)
			virtnet_napi_enable(&vi->rq[i]);
1733 1734 1735

	netif_device_attach(vi->dev);

1736
	for (i = 0; i < vi->curr_queue_pairs; i++)
J
Jason Wang 已提交
1737 1738
		if (!try_fill_recv(&vi->rq[i], GFP_KERNEL))
			schedule_delayed_work(&vi->refill, 0);
1739

1740 1741 1742 1743
	mutex_lock(&vi->config_lock);
	vi->config_enable = true;
	mutex_unlock(&vi->config_lock);

J
Jason Wang 已提交
1744 1745
	virtnet_set_queues(vi, vi->curr_queue_pairs);

1746 1747 1748 1749
	return 0;
}
#endif

R
Rusty Russell 已提交
1750 1751 1752 1753 1754
/* Devices handled by this driver: virtio network devices, any vendor. */
static struct virtio_device_id id_table[] = {
	{
		.device = VIRTIO_ID_NET,
		.vendor = VIRTIO_DEV_ANY_ID,
	},
	{ 0 },	/* terminator */
};

1755
static unsigned int features[] = {
1756 1757
	VIRTIO_NET_F_CSUM, VIRTIO_NET_F_GUEST_CSUM,
	VIRTIO_NET_F_GSO, VIRTIO_NET_F_MAC,
1758
	VIRTIO_NET_F_HOST_TSO4, VIRTIO_NET_F_HOST_UFO, VIRTIO_NET_F_HOST_TSO6,
1759
	VIRTIO_NET_F_HOST_ECN, VIRTIO_NET_F_GUEST_TSO4, VIRTIO_NET_F_GUEST_TSO6,
1760
	VIRTIO_NET_F_GUEST_ECN, VIRTIO_NET_F_GUEST_UFO,
1761
	VIRTIO_NET_F_MRG_RXBUF, VIRTIO_NET_F_STATUS, VIRTIO_NET_F_CTRL_VQ,
1762
	VIRTIO_NET_F_CTRL_RX, VIRTIO_NET_F_CTRL_VLAN,
J
Jason Wang 已提交
1763
	VIRTIO_NET_F_GUEST_ANNOUNCE, VIRTIO_NET_F_MQ,
1764
	VIRTIO_NET_F_CTRL_MAC_ADDR,
1765
	VIRTIO_F_ANY_LAYOUT,
1766 1767
};

1768
static struct virtio_driver virtio_net_driver = {
1769 1770
	.feature_table = features,
	.feature_table_size = ARRAY_SIZE(features),
R
Rusty Russell 已提交
1771 1772 1773 1774
	.driver.name =	KBUILD_MODNAME,
	.driver.owner =	THIS_MODULE,
	.id_table =	id_table,
	.probe =	virtnet_probe,
1775
	.remove =	virtnet_remove,
1776
	.config_changed = virtnet_config_changed,
1777 1778 1779 1780
#ifdef CONFIG_PM
	.freeze =	virtnet_freeze,
	.restore =	virtnet_restore,
#endif
R
Rusty Russell 已提交
1781 1782
};

1783
/* Module registration and metadata. */
module_virtio_driver(virtio_net_driver);

MODULE_DEVICE_TABLE(virtio, id_table);
MODULE_DESCRIPTION("Virtio network driver");
MODULE_LICENSE("GPL");