virtio_net.c 43.9 KB
Newer Older
1
/* A network driver using virtio.
 *
 * Copyright 2007 Rusty Russell <rusty@rustcorp.com.au> IBM Corporation
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation; either version 2 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program; if not, write to the Free Software
 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
 */
//#define DEBUG
#include <linux/netdevice.h>
#include <linux/etherdevice.h>
22
#include <linux/ethtool.h>
R
Rusty Russell 已提交
23 24 25 26
#include <linux/module.h>
#include <linux/virtio.h>
#include <linux/virtio_net.h>
#include <linux/scatterlist.h>
27
#include <linux/if_vlan.h>
28
#include <linux/slab.h>
29
#include <linux/cpu.h>
R
Rusty Russell 已提交
30

31
static int napi_weight = NAPI_POLL_WEIGHT;
32 33
module_param(napi_weight, int, 0444);

34
static bool csum = true, gso = true;
R
Rusty Russell 已提交
35 36 37
module_param(csum, bool, 0444);
module_param(gso, bool, 0444);

R
Rusty Russell 已提交
38
/*
 * Size of the skb allocated per receive buffer in the "small buffer"
 * path: Ethernet header + VLAN tag + standard payload.
 * FIXME: MTU in config.
 */
#define MAX_PACKET_LEN (ETH_HLEN + VLAN_HLEN + ETH_DATA_LEN)

/* Linear area of the skb built by page_to_skb(); up to this much is copied. */
#define GOOD_COPY_LEN	128

#define VIRTNET_DRIVER_VERSION "1.0.0"
43

44
struct virtnet_stats {
45 46
	struct u64_stats_sync tx_syncp;
	struct u64_stats_sync rx_syncp;
47 48 49 50 51 52 53
	u64 tx_bytes;
	u64 tx_packets;

	u64 rx_bytes;
	u64 rx_packets;
};

54 55 56 57 58 59 60
/* Driver-side state for one send (transmit) virtqueue. */
struct send_queue {
	/* The virtqueue backing this send queue. */
	struct virtqueue *vq;

	/* Scatterlist for one TX packet: virtio header + linear part + frags. */
	struct scatterlist sg[MAX_SKB_FRAGS + 2];

	/* Queue name, of the form output.$index. */
	char name[40];
};

/* Internal representation of a receive virtqueue */
struct receive_queue {
	/* Virtqueue associated with this receive_queue */
	struct virtqueue *vq;

R
Rusty Russell 已提交
71 72 73 74 75
	struct napi_struct napi;

	/* Number of input buffers, and max we've ever had. */
	unsigned int num, max;

76 77 78 79 80
	/* Chain pages by the private ptr. */
	struct page *pages;

	/* RX: fragments + linear part + virtio header */
	struct scatterlist sg[MAX_SKB_FRAGS + 2];
J
Jason Wang 已提交
81 82 83

	/* Name of this receive queue: input.$index */
	char name[40];
84 85 86 87 88 89
};

struct virtnet_info {
	struct virtio_device *vdev;
	struct virtqueue *cvq;
	struct net_device *dev;
J
Jason Wang 已提交
90 91
	struct send_queue *sq;
	struct receive_queue *rq;
92 93
	unsigned int status;

J
Jason Wang 已提交
94 95 96 97 98 99
	/* Max # of queue pairs supported by the device */
	u16 max_queue_pairs;

	/* # of queue pairs currently used by the driver */
	u16 curr_queue_pairs;

100 101 102
	/* I like... big packets and I cannot lie! */
	bool big_packets;

103 104 105
	/* Host will merge rx buffers for big packets (shake it! shake it!) */
	bool mergeable_rx_bufs;

J
Jason Wang 已提交
106 107 108
	/* Has control virtqueue */
	bool has_cvq;

109 110 111
	/* Host can handle any s/g split between our header and packet data */
	bool any_header_sg;

112 113 114
	/* enable config space updates */
	bool config_enable;

115 116 117
	/* Active statistics */
	struct virtnet_stats __percpu *stats;

118 119 120
	/* Work struct for refilling if we run low on memory. */
	struct delayed_work refill;

121 122 123 124 125
	/* Work struct for config space updates */
	struct work_struct config_work;

	/* Lock for config space updates */
	struct mutex config_lock;
J
Jason Wang 已提交
126 127 128

	/* Does the affinity hint is set for virtqueues? */
	bool affinity_hint_set;
129 130 131

	/* Per-cpu variable to show the mapping from CPU to virtqueue */
	int __percpu *vq_index;
132 133 134

	/* CPU hot plug notifier */
	struct notifier_block nb;
R
Rusty Russell 已提交
135 136
};

137 138 139 140 141 142 143
/*
 * Virtio-net header as stored by the driver: either the plain header or
 * the mergeable-rx-buffer variant, overlaid in one anonymous union.
 */
struct skb_vnet_hdr {
	union {
		struct virtio_net_hdr hdr;		/* plain header */
		struct virtio_net_hdr_mrg_rxbuf mhdr;	/* mergeable rx variant */
	};
};

144 145 146 147 148 149 150 151 152 153
/* Header layout at the start of the first page of a big receive buffer. */
struct padded_vnet_hdr {
	struct virtio_net_hdr hdr;
	/*
	 * Because of a QEMU bug the virtio_net_hdr must live in its own sg
	 * entry, yet the data sg entry shares the page with it.  The padding
	 * makes the sg entry following the header start 16-byte aligned.
	 */
	char padding[6];
};

J
Jason Wang 已提交
154 155 156 157 158
/* Converting between virtqueue no. and kernel tx/rx queue no.
 * 0:rx0 1:tx0 2:rx1 3:tx1 ... 2N:rxN 2N+1:txN 2N+2:cvq
 */
static int vq2txq(struct virtqueue *vq)
{
159
	return (vq->index - 1) / 2;
J
Jason Wang 已提交
160 161 162 163 164 165 166 167 168
}

/* Return the virtqueue index of tx queue @txq (tx queues use odd indices). */
static int txq2vq(int txq)
{
	int vq_index = 2 * txq + 1;

	return vq_index;
}

static int vq2rxq(struct virtqueue *vq)
{
169
	return vq->index / 2;
J
Jason Wang 已提交
170 171 172 173 174 175 176
}

/* Return the virtqueue index of rx queue @rxq (rx queues use even indices). */
static int rxq2vq(int rxq)
{
	int vq_index = 2 * rxq;

	return vq_index;
}

177
static inline struct skb_vnet_hdr *skb_vnet_hdr(struct sk_buff *skb)
R
Rusty Russell 已提交
178
{
179
	return (struct skb_vnet_hdr *)skb->cb;
R
Rusty Russell 已提交
180 181
}

182 183 184 185
/*
 * private is used to chain pages for big packets, put the whole
 * most recent used list in the beginning for reuse
 */
186
static void give_pages(struct receive_queue *rq, struct page *page)
187
{
188
	struct page *end;
189

190
	/* Find end of list, sew whole thing into vi->rq.pages. */
191
	for (end = page; end->private; end = (struct page *)end->private);
192 193
	end->private = (unsigned long)rq->pages;
	rq->pages = page;
194 195
}

196
/*
 * Get one page for a receive buffer: take the head of the queue's
 * spare-page pool if there is one, otherwise allocate with @gfp_mask.
 * Returns whatever alloc_page() returns when the pool is empty.
 */
static struct page *get_a_page(struct receive_queue *rq, gfp_t gfp_mask)
{
	struct page *p = rq->pages;

	if (!p)
		return alloc_page(gfp_mask);

	rq->pages = (struct page *)p->private;
	/* private is the chain link; clear it now the page is detached. */
	p->private = 0;
	return p;
}

209
static void skb_xmit_done(struct virtqueue *vq)
R
Rusty Russell 已提交
210
{
211
	struct virtnet_info *vi = vq->vdev->priv;
R
Rusty Russell 已提交
212

213
	/* Suppress further interrupts. */
214
	virtqueue_disable_cb(vq);
215

216
	/* We were probably waiting for more output buffers. */
J
Jason Wang 已提交
217
	netif_wake_subqueue(vi->dev, vq2txq(vq));
R
Rusty Russell 已提交
218 219
}

220 221
static void set_skb_frag(struct sk_buff *skb, struct page *page,
			 unsigned int offset, unsigned int *len)
R
Rusty Russell 已提交
222
{
223
	int size = min((unsigned)PAGE_SIZE - offset, *len);
224 225
	int i = skb_shinfo(skb)->nr_frags;

226
	__skb_fill_page_desc(skb, i, page, offset, size);
227

228 229
	skb->data_len += size;
	skb->len += size;
230
	skb->truesize += PAGE_SIZE;
231
	skb_shinfo(skb)->nr_frags++;
232
	skb_shinfo(skb)->tx_flags |= SKBTX_SHARED_FRAG;
233
	*len -= size;
234
}
235

236
/* Called from bottom half context */
237
static struct sk_buff *page_to_skb(struct receive_queue *rq,
238 239
				   struct page *page, unsigned int len)
{
240
	struct virtnet_info *vi = rq->vq->vdev->priv;
241 242 243 244
	struct sk_buff *skb;
	struct skb_vnet_hdr *hdr;
	unsigned int copy, hdr_len, offset;
	char *p;
245

246
	p = page_address(page);
247

248 249 250 251
	/* copy small packet so we can reuse these pages for small data */
	skb = netdev_alloc_skb_ip_align(vi->dev, GOOD_COPY_LEN);
	if (unlikely(!skb))
		return NULL;
252

253
	hdr = skb_vnet_hdr(skb);
254

255 256 257 258 259 260 261
	if (vi->mergeable_rx_bufs) {
		hdr_len = sizeof hdr->mhdr;
		offset = hdr_len;
	} else {
		hdr_len = sizeof hdr->hdr;
		offset = sizeof(struct padded_vnet_hdr);
	}
262

263
	memcpy(hdr, p, hdr_len);
264

265 266
	len -= hdr_len;
	p += offset;
267

268 269 270 271
	copy = len;
	if (copy > skb_tailroom(skb))
		copy = skb_tailroom(skb);
	memcpy(skb_put(skb, copy), p, copy);
272

273 274
	len -= copy;
	offset += copy;
275

276 277 278 279 280 281 282
	/*
	 * Verify that we can indeed put this data into a skb.
	 * This is here to handle cases when the device erroneously
	 * tries to receive more than is possible. This is usually
	 * the case of a broken device.
	 */
	if (unlikely(len > MAX_SKB_FRAGS * PAGE_SIZE)) {
283
		net_dbg_ratelimited("%s: too much data\n", skb->dev->name);
284 285 286 287
		dev_kfree_skb(skb);
		return NULL;
	}

288 289 290 291 292
	while (len) {
		set_skb_frag(skb, page, offset, &len);
		page = (struct page *)page->private;
		offset = 0;
	}
293

294
	if (page)
295
		give_pages(rq, page);
296

297 298
	return skb;
}
299

300
static int receive_mergeable(struct receive_queue *rq, struct sk_buff *skb)
301 302 303 304 305 306 307 308 309 310 311 312 313
{
	struct skb_vnet_hdr *hdr = skb_vnet_hdr(skb);
	struct page *page;
	int num_buf, i, len;

	num_buf = hdr->mhdr.num_buffers;
	while (--num_buf) {
		i = skb_shinfo(skb)->nr_frags;
		if (i >= MAX_SKB_FRAGS) {
			pr_debug("%s: packet too long\n", skb->dev->name);
			skb->dev->stats.rx_length_errors++;
			return -EINVAL;
		}
314
		page = virtqueue_get_buf(rq->vq, &len);
315 316 317 318 319
		if (!page) {
			pr_debug("%s: rx error: %d buffers missing\n",
				 skb->dev->name, hdr->mhdr.num_buffers);
			skb->dev->stats.rx_length_errors++;
			return -EINVAL;
320
		}
321

322 323 324 325 326
		if (len > PAGE_SIZE)
			len = PAGE_SIZE;

		set_skb_frag(skb, page, 0, &len);

327
		--rq->num;
328 329 330 331
	}
	return 0;
}

332
static void receive_buf(struct receive_queue *rq, void *buf, unsigned int len)
333
{
334 335
	struct virtnet_info *vi = rq->vq->vdev->priv;
	struct net_device *dev = vi->dev;
E
Eric Dumazet 已提交
336
	struct virtnet_stats *stats = this_cpu_ptr(vi->stats);
337 338 339
	struct sk_buff *skb;
	struct page *page;
	struct skb_vnet_hdr *hdr;
340

341 342 343 344
	if (unlikely(len < sizeof(struct virtio_net_hdr) + ETH_HLEN)) {
		pr_debug("%s: short packet %i\n", dev->name, len);
		dev->stats.rx_length_errors++;
		if (vi->mergeable_rx_bufs || vi->big_packets)
345
			give_pages(rq, buf);
346 347 348 349
		else
			dev_kfree_skb(buf);
		return;
	}
350

351 352 353 354 355 356
	if (!vi->mergeable_rx_bufs && !vi->big_packets) {
		skb = buf;
		len -= sizeof(struct virtio_net_hdr);
		skb_trim(skb, len);
	} else {
		page = buf;
357
		skb = page_to_skb(rq, page, len);
358
		if (unlikely(!skb)) {
359
			dev->stats.rx_dropped++;
360
			give_pages(rq, page);
361
			return;
362
		}
363
		if (vi->mergeable_rx_bufs)
364
			if (receive_mergeable(rq, skb)) {
365 366 367
				dev_kfree_skb(skb);
				return;
			}
368
	}
369

370
	hdr = skb_vnet_hdr(skb);
371

372
	u64_stats_update_begin(&stats->rx_syncp);
373 374
	stats->rx_bytes += skb->len;
	stats->rx_packets++;
375
	u64_stats_update_end(&stats->rx_syncp);
R
Rusty Russell 已提交
376

377
	if (hdr->hdr.flags & VIRTIO_NET_HDR_F_NEEDS_CSUM) {
R
Rusty Russell 已提交
378
		pr_debug("Needs csum!\n");
379 380 381
		if (!skb_partial_csum_set(skb,
					  hdr->hdr.csum_start,
					  hdr->hdr.csum_offset))
R
Rusty Russell 已提交
382
			goto frame_err;
383 384
	} else if (hdr->hdr.flags & VIRTIO_NET_HDR_F_DATA_VALID) {
		skb->ip_summed = CHECKSUM_UNNECESSARY;
R
Rusty Russell 已提交
385 386
	}

387 388 389 390
	skb->protocol = eth_type_trans(skb, dev);
	pr_debug("Receiving skb proto 0x%04x len %i type %i\n",
		 ntohs(skb->protocol), skb->len, skb->pkt_type);

391
	if (hdr->hdr.gso_type != VIRTIO_NET_HDR_GSO_NONE) {
R
Rusty Russell 已提交
392
		pr_debug("GSO!\n");
393
		switch (hdr->hdr.gso_type & ~VIRTIO_NET_HDR_GSO_ECN) {
R
Rusty Russell 已提交
394
		case VIRTIO_NET_HDR_GSO_TCPV4:
395
			skb_shinfo(skb)->gso_type = SKB_GSO_TCPV4;
R
Rusty Russell 已提交
396 397
			break;
		case VIRTIO_NET_HDR_GSO_UDP:
398
			skb_shinfo(skb)->gso_type = SKB_GSO_UDP;
R
Rusty Russell 已提交
399 400
			break;
		case VIRTIO_NET_HDR_GSO_TCPV6:
401
			skb_shinfo(skb)->gso_type = SKB_GSO_TCPV6;
R
Rusty Russell 已提交
402 403
			break;
		default:
404 405
			net_warn_ratelimited("%s: bad gso type %u.\n",
					     dev->name, hdr->hdr.gso_type);
R
Rusty Russell 已提交
406 407 408
			goto frame_err;
		}

409
		if (hdr->hdr.gso_type & VIRTIO_NET_HDR_GSO_ECN)
410
			skb_shinfo(skb)->gso_type |= SKB_GSO_TCP_ECN;
R
Rusty Russell 已提交
411

412
		skb_shinfo(skb)->gso_size = hdr->hdr.gso_size;
R
Rusty Russell 已提交
413
		if (skb_shinfo(skb)->gso_size == 0) {
414
			net_warn_ratelimited("%s: zero gso size.\n", dev->name);
R
Rusty Russell 已提交
415 416 417 418 419 420 421 422 423 424 425 426 427 428 429 430
			goto frame_err;
		}

		/* Header must be checked, and gso_segs computed. */
		skb_shinfo(skb)->gso_type |= SKB_GSO_DODGY;
		skb_shinfo(skb)->gso_segs = 0;
	}

	netif_receive_skb(skb);
	return;

frame_err:
	dev->stats.rx_frame_errors++;
	dev_kfree_skb(skb);
}

431
/*
 * Post one small receive buffer: an skb of MAX_PACKET_LEN bytes whose
 * virtio header lives in the skb control buffer.
 *
 * Returns -ENOMEM if the skb cannot be allocated, otherwise the result of
 * virtqueue_add_inbuf(); the skb is freed again if queuing fails.
 */
static int add_recvbuf_small(struct receive_queue *rq, gfp_t gfp)
{
	struct virtnet_info *vi = rq->vq->vdev->priv;
	struct skb_vnet_hdr *hdr;
	struct sk_buff *skb;
	int ret;

	skb = __netdev_alloc_skb_ip_align(vi->dev, MAX_PACKET_LEN, gfp);
	if (unlikely(!skb))
		return -ENOMEM;

	skb_put(skb, MAX_PACKET_LEN);

	/* sg[0] carries the header, the following entry/entries the data. */
	hdr = skb_vnet_hdr(skb);
	sg_set_buf(&rq->sg[0], &hdr->hdr, sizeof hdr->hdr);
	skb_to_sgvec(skb, &rq->sg[1], 0, skb->len);

	ret = virtqueue_add_inbuf(rq->vq, rq->sg, 2, skb, gfp);
	if (ret < 0)
		dev_kfree_skb(skb);

	return ret;
}
455

456
/*
 * Post one big receive buffer made of MAX_SKB_FRAGS + 1 pages chained
 * through page->private.
 *
 * sg[0] and sg[1] share the first page (header, then data after the padded
 * header); sg[2..MAX_SKB_FRAGS + 1] each cover one further full page.
 *
 * Returns -ENOMEM if a page cannot be obtained, otherwise the result of
 * virtqueue_add_inbuf().  On any failure the pages gathered so far are
 * returned to the queue's page pool.
 */
static int add_recvbuf_big(struct receive_queue *rq, gfp_t gfp)
{
	struct page *pg, *chain = NULL;
	int i, ret, offset;
	char *addr;

	/* Fill from the tail: the page in sg[MAX_SKB_FRAGS + 1] ends the chain. */
	i = MAX_SKB_FRAGS + 1;
	while (i > 1) {
		pg = get_a_page(rq, gfp);
		if (!pg) {
			if (chain)
				give_pages(rq, chain);
			return -ENOMEM;
		}
		sg_set_buf(&rq->sg[i], page_address(pg), PAGE_SIZE);

		/* New page becomes the chain head so the chain matches sg order. */
		pg->private = (unsigned long)chain;
		chain = pg;
		--i;
	}

	pg = get_a_page(rq, gfp);
	if (!pg) {
		give_pages(rq, chain);
		return -ENOMEM;
	}
	addr = page_address(pg);

	/* Header gets its own sg entry (QEMU bug), on the same page as sg[1]. */
	sg_set_buf(&rq->sg[0], addr, sizeof(struct virtio_net_hdr));

	/* Packet data starts after the padded header. */
	offset = sizeof(struct padded_vnet_hdr);
	sg_set_buf(&rq->sg[1], addr + offset, PAGE_SIZE - offset);

	/* The first page heads the whole chain. */
	pg->private = (unsigned long)chain;
	ret = virtqueue_add_inbuf(rq->vq, rq->sg, MAX_SKB_FRAGS + 2,
				  pg, gfp);
	if (ret < 0)
		give_pages(rq, pg);

	return ret;
}

502
/*
 * Post one mergeable receive buffer: a single whole page.
 *
 * Returns -ENOMEM if no page is available, otherwise the result of
 * virtqueue_add_inbuf(); the page returns to the pool if queuing fails.
 */
static int add_recvbuf_mergeable(struct receive_queue *rq, gfp_t gfp)
{
	struct page *pg = get_a_page(rq, gfp);
	int ret;

	if (!pg)
		return -ENOMEM;

	sg_init_one(rq->sg, page_address(pg), PAGE_SIZE);

	ret = virtqueue_add_inbuf(rq->vq, rq->sg, 1, pg, gfp);
	if (ret < 0)
		give_pages(rq, pg);

	return ret;
}
519

520 521 522 523 524 525 526
/*
 * Returns false if we couldn't fill entirely (OOM).
 *
 * Normally run in the receive path, but can also be run from ndo_open
 * before we're receiving packets, or from refill_work which is
 * careful to disable receiving (using napi_disable).
 */
527
static bool try_fill_recv(struct receive_queue *rq, gfp_t gfp)
528
{
529
	struct virtnet_info *vi = rq->vq->vdev->priv;
530
	int err;
531
	bool oom;
532

533 534
	do {
		if (vi->mergeable_rx_bufs)
535
			err = add_recvbuf_mergeable(rq, gfp);
536
		else if (vi->big_packets)
537
			err = add_recvbuf_big(rq, gfp);
538
		else
539
			err = add_recvbuf_small(rq, gfp);
540

541
		oom = err == -ENOMEM;
542
		if (err)
543
			break;
544
		++rq->num;
545
	} while (rq->vq->num_free);
546 547 548
	if (unlikely(rq->num > rq->max))
		rq->max = rq->num;
	virtqueue_kick(rq->vq);
549
	return !oom;
550 551
}

552
static void skb_recv_done(struct virtqueue *rvq)
R
Rusty Russell 已提交
553 554
{
	struct virtnet_info *vi = rvq->vdev->priv;
J
Jason Wang 已提交
555
	struct receive_queue *rq = &vi->rq[vq2rxq(rvq)];
556

557
	/* Schedule NAPI, Suppress further interrupts if successful. */
558
	if (napi_schedule_prep(&rq->napi)) {
559
		virtqueue_disable_cb(rvq);
560
		__napi_schedule(&rq->napi);
561
	}
R
Rusty Russell 已提交
562 563
}

564
static void virtnet_napi_enable(struct receive_queue *rq)
565
{
566
	napi_enable(&rq->napi);
567 568 569 570 571

	/* If all buffers were filled by other side before we napi_enabled, we
	 * won't get another interrupt, so process any outstanding packets
	 * now.  virtnet_poll wants re-enable the queue, so we disable here.
	 * We synchronize against interrupts via NAPI_STATE_SCHED */
572 573
	if (napi_schedule_prep(&rq->napi)) {
		virtqueue_disable_cb(rq->vq);
574
		local_bh_disable();
575
		__napi_schedule(&rq->napi);
576
		local_bh_enable();
577 578 579
	}
}

580 581
static void refill_work(struct work_struct *work)
{
582 583
	struct virtnet_info *vi =
		container_of(work, struct virtnet_info, refill.work);
584
	bool still_empty;
J
Jason Wang 已提交
585 586
	int i;

587
	for (i = 0; i < vi->curr_queue_pairs; i++) {
J
Jason Wang 已提交
588
		struct receive_queue *rq = &vi->rq[i];
589

J
Jason Wang 已提交
590 591 592
		napi_disable(&rq->napi);
		still_empty = !try_fill_recv(rq, GFP_KERNEL);
		virtnet_napi_enable(rq);
593

J
Jason Wang 已提交
594 595 596 597 598 599
		/* In theory, this can happen: if we don't get any buffers in
		 * we will *never* try to fill again.
		 */
		if (still_empty)
			schedule_delayed_work(&vi->refill, HZ/2);
	}
600 601
}

R
Rusty Russell 已提交
602 603
static int virtnet_poll(struct napi_struct *napi, int budget)
{
604 605 606
	struct receive_queue *rq =
		container_of(napi, struct receive_queue, napi);
	struct virtnet_info *vi = rq->vq->vdev->priv;
607
	void *buf;
608
	unsigned int r, len, received = 0;
R
Rusty Russell 已提交
609 610 611

again:
	while (received < budget &&
612 613 614
	       (buf = virtqueue_get_buf(rq->vq, &len)) != NULL) {
		receive_buf(rq, buf, len);
		--rq->num;
R
Rusty Russell 已提交
615 616 617
		received++;
	}

618 619
	if (rq->num < rq->max / 2) {
		if (!try_fill_recv(rq, GFP_ATOMIC))
620
			schedule_delayed_work(&vi->refill, 0);
621
	}
R
Rusty Russell 已提交
622

623 624
	/* Out of packets? */
	if (received < budget) {
625
		r = virtqueue_enable_cb_prepare(rq->vq);
626
		napi_complete(napi);
627
		if (unlikely(virtqueue_poll(rq->vq, r)) &&
628
		    napi_schedule_prep(napi)) {
629
			virtqueue_disable_cb(rq->vq);
630
			__napi_schedule(napi);
R
Rusty Russell 已提交
631
			goto again;
632
		}
R
Rusty Russell 已提交
633 634 635 636 637
	}

	return received;
}

J
Jason Wang 已提交
638 639 640 641 642
static int virtnet_open(struct net_device *dev)
{
	struct virtnet_info *vi = netdev_priv(dev);
	int i;

643 644 645 646 647
	for (i = 0; i < vi->max_queue_pairs; i++) {
		if (i < vi->curr_queue_pairs)
			/* Make sure we have some buffers: if oom use wq. */
			if (!try_fill_recv(&vi->rq[i], GFP_KERNEL))
				schedule_delayed_work(&vi->refill, 0);
J
Jason Wang 已提交
648 649 650 651 652 653
		virtnet_napi_enable(&vi->rq[i]);
	}

	return 0;
}

654
static void free_old_xmit_skbs(struct send_queue *sq)
R
Rusty Russell 已提交
655 656
{
	struct sk_buff *skb;
657
	unsigned int len;
658
	struct virtnet_info *vi = sq->vq->vdev->priv;
E
Eric Dumazet 已提交
659
	struct virtnet_stats *stats = this_cpu_ptr(vi->stats);
R
Rusty Russell 已提交
660

661
	while ((skb = virtqueue_get_buf(sq->vq, &len)) != NULL) {
R
Rusty Russell 已提交
662
		pr_debug("Sent skb %p\n", skb);
663

664
		u64_stats_update_begin(&stats->tx_syncp);
665 666
		stats->tx_bytes += skb->len;
		stats->tx_packets++;
667
		u64_stats_update_end(&stats->tx_syncp);
668

669
		dev_kfree_skb_any(skb);
R
Rusty Russell 已提交
670 671 672
	}
}

673
static int xmit_skb(struct send_queue *sq, struct sk_buff *skb)
R
Rusty Russell 已提交
674
{
675
	struct skb_vnet_hdr *hdr;
R
Rusty Russell 已提交
676
	const unsigned char *dest = ((struct ethhdr *)skb->data)->h_dest;
677
	struct virtnet_info *vi = sq->vq->vdev->priv;
678
	unsigned num_sg;
679 680
	unsigned hdr_len;
	bool can_push;
R
Rusty Russell 已提交
681

J
Johannes Berg 已提交
682
	pr_debug("%s: xmit %p %pM\n", vi->dev->name, skb, dest);
683 684 685 686 687 688 689 690 691 692 693 694 695 696
	if (vi->mergeable_rx_bufs)
		hdr_len = sizeof hdr->mhdr;
	else
		hdr_len = sizeof hdr->hdr;

	can_push = vi->any_header_sg &&
		!((unsigned long)skb->data & (__alignof__(*hdr) - 1)) &&
		!skb_header_cloned(skb) && skb_headroom(skb) >= hdr_len;
	/* Even if we can, don't push here yet as this would skew
	 * csum_start offset below. */
	if (can_push)
		hdr = (struct skb_vnet_hdr *)(skb->data - hdr_len);
	else
		hdr = skb_vnet_hdr(skb);
R
Rusty Russell 已提交
697 698

	if (skb->ip_summed == CHECKSUM_PARTIAL) {
699
		hdr->hdr.flags = VIRTIO_NET_HDR_F_NEEDS_CSUM;
700
		hdr->hdr.csum_start = skb_checksum_start_offset(skb);
701
		hdr->hdr.csum_offset = skb->csum_offset;
R
Rusty Russell 已提交
702
	} else {
703 704
		hdr->hdr.flags = 0;
		hdr->hdr.csum_offset = hdr->hdr.csum_start = 0;
R
Rusty Russell 已提交
705 706 707
	}

	if (skb_is_gso(skb)) {
708 709
		hdr->hdr.hdr_len = skb_headlen(skb);
		hdr->hdr.gso_size = skb_shinfo(skb)->gso_size;
R
Rusty Russell 已提交
710
		if (skb_shinfo(skb)->gso_type & SKB_GSO_TCPV4)
711
			hdr->hdr.gso_type = VIRTIO_NET_HDR_GSO_TCPV4;
R
Rusty Russell 已提交
712
		else if (skb_shinfo(skb)->gso_type & SKB_GSO_TCPV6)
713
			hdr->hdr.gso_type = VIRTIO_NET_HDR_GSO_TCPV6;
R
Rusty Russell 已提交
714
		else if (skb_shinfo(skb)->gso_type & SKB_GSO_UDP)
715
			hdr->hdr.gso_type = VIRTIO_NET_HDR_GSO_UDP;
R
Rusty Russell 已提交
716 717
		else
			BUG();
R
Rusty Russell 已提交
718
		if (skb_shinfo(skb)->gso_type & SKB_GSO_TCP_ECN)
719
			hdr->hdr.gso_type |= VIRTIO_NET_HDR_GSO_ECN;
R
Rusty Russell 已提交
720
	} else {
721 722
		hdr->hdr.gso_type = VIRTIO_NET_HDR_GSO_NONE;
		hdr->hdr.gso_size = hdr->hdr.hdr_len = 0;
R
Rusty Russell 已提交
723 724
	}

725
	if (vi->mergeable_rx_bufs)
726
		hdr->mhdr.num_buffers = 0;
727

728 729 730 731 732 733 734 735 736
	if (can_push) {
		__skb_push(skb, hdr_len);
		num_sg = skb_to_sgvec(skb, sq->sg, 0, skb->len);
		/* Pull header back to avoid skew in tx bytes calculations. */
		__skb_pull(skb, hdr_len);
	} else {
		sg_set_buf(sq->sg, hdr, hdr_len);
		num_sg = skb_to_sgvec(skb, sq->sg + 1, 0, skb->len) + 1;
	}
737
	return virtqueue_add_outbuf(sq->vq, sq->sg, num_sg, skb, GFP_ATOMIC);
738 739
}

740
static netdev_tx_t start_xmit(struct sk_buff *skb, struct net_device *dev)
741 742
{
	struct virtnet_info *vi = netdev_priv(dev);
J
Jason Wang 已提交
743 744
	int qnum = skb_get_queue_mapping(skb);
	struct send_queue *sq = &vi->sq[qnum];
745
	int err;
746 747

	/* Free up any pending old buffers before queueing new ones. */
748
	free_old_xmit_skbs(sq);
749

750
	/* Try to transmit */
751
	err = xmit_skb(sq, skb);
752

753
	/* This should not happen! */
754
	if (unlikely(err)) {
755 756 757
		dev->stats.tx_fifo_errors++;
		if (net_ratelimit())
			dev_warn(&dev->dev,
758
				 "Unexpected TXQ (%d) queue failure: %d\n", qnum, err);
759 760 761
		dev->stats.tx_dropped++;
		kfree_skb(skb);
		return NETDEV_TX_OK;
R
Rusty Russell 已提交
762
	}
763
	virtqueue_kick(sq->vq);
764

765 766 767 768 769 770
	/* Don't wait up for transmitted skbs to be freed. */
	skb_orphan(skb);
	nf_reset(skb);

	/* Apparently nice girls don't return TX_BUSY; stop the queue
	 * before it gets out of hand.  Naturally, this wastes entries. */
771
	if (sq->vq->num_free < 2+MAX_SKB_FRAGS) {
J
Jason Wang 已提交
772
		netif_stop_subqueue(dev, qnum);
773
		if (unlikely(!virtqueue_enable_cb_delayed(sq->vq))) {
774
			/* More just got used, free them then recheck. */
775 776
			free_old_xmit_skbs(sq);
			if (sq->vq->num_free >= 2+MAX_SKB_FRAGS) {
J
Jason Wang 已提交
777
				netif_start_subqueue(dev, qnum);
778
				virtqueue_disable_cb(sq->vq);
779 780
			}
		}
781
	}
782 783

	return NETDEV_TX_OK;
R
Rusty Russell 已提交
784 785
}

786 787 788 789 790 791
/*
 * Send a command over the control virtqueue and wait for its status.
 *
 * The request consists of a class/cmd header, the optional @out and @in
 * scatterlists, and a one-byte status written by the device.  The function
 * busy-waits until the device returns the buffer.
 *
 * Commands the hypervisor advertises through feature bits should never
 * fail unless improperly formatted.
 *
 * Returns true if the device reported VIRTIO_NET_OK.
 */
static bool virtnet_send_command(struct virtnet_info *vi, u8 class, u8 cmd,
				 struct scatterlist *out,
				 struct scatterlist *in)
{
	struct scatterlist *sgs[4], hdr, stat;
	struct virtio_net_ctrl_hdr ctrl;
	virtio_net_ctrl_ack status = ~0;
	unsigned out_num = 0, in_num = 0, tmp;

	/* Caller should know better */
	BUG_ON(!virtio_has_feature(vi->vdev, VIRTIO_NET_F_CTRL_VQ));

	/* Device-readable part: command header, then optional payload. */
	ctrl.class = class;
	ctrl.cmd = cmd;
	sg_init_one(&hdr, &ctrl, sizeof(ctrl));
	sgs[out_num++] = &hdr;

	if (out)
		sgs[out_num++] = out;

	/* Device-writable part: optional reply data, then the status byte. */
	if (in)
		sgs[out_num + in_num++] = in;

	sg_init_one(&stat, &status, sizeof(status));
	sgs[out_num + in_num++] = &stat;

	BUG_ON(out_num + in_num > ARRAY_SIZE(sgs));
	BUG_ON(virtqueue_add_sgs(vi->cvq, sgs, out_num, in_num, vi, GFP_ATOMIC)
	       < 0);

	virtqueue_kick(vi->cvq);

	/*
	 * Spin for a response: the kick causes an ioport write that traps
	 * into the hypervisor, so the request should be handled immediately.
	 */
	while (!virtqueue_get_buf(vi->cvq, &tmp))
		cpu_relax();

	return status == VIRTIO_NET_OK;
}

833 834 835 836
static int virtnet_set_mac_address(struct net_device *dev, void *p)
{
	struct virtnet_info *vi = netdev_priv(dev);
	struct virtio_device *vdev = vi->vdev;
837
	int ret;
838 839
	struct sockaddr *addr = p;
	struct scatterlist sg;
840

841
	ret = eth_prepare_mac_addr_change(dev, p);
842 843
	if (ret)
		return ret;
844

845 846 847 848
	if (virtio_has_feature(vdev, VIRTIO_NET_F_CTRL_MAC_ADDR)) {
		sg_init_one(&sg, addr->sa_data, dev->addr_len);
		if (!virtnet_send_command(vi, VIRTIO_NET_CTRL_MAC,
					  VIRTIO_NET_CTRL_MAC_ADDR_SET,
849
					  &sg, NULL)) {
850 851 852 853 854
			dev_warn(&vdev->dev,
				 "Failed to set mac address by vq command.\n");
			return -EINVAL;
		}
	} else if (virtio_has_feature(vdev, VIRTIO_NET_F_MAC)) {
855
		vdev->config->set(vdev, offsetof(struct virtio_net_config, mac),
856 857 858 859
				  addr->sa_data, dev->addr_len);
	}

	eth_commit_mac_addr_change(dev, p);
860 861 862 863

	return 0;
}

864 865 866 867 868 869 870 871
/*
 * Fill @tot with the device statistics: packet/byte counters are summed
 * over the per-cpu virtnet_stats of every possible CPU, the error and
 * drop counters are copied from dev->stats.  Returns @tot.
 */
static struct rtnl_link_stats64 *virtnet_stats(struct net_device *dev,
					       struct rtnl_link_stats64 *tot)
{
	struct virtnet_info *vi = netdev_priv(dev);
	unsigned int seq;
	int cpu;

	for_each_possible_cpu(cpu) {
		struct virtnet_stats *pcpu = per_cpu_ptr(vi->stats, cpu);
		u64 tx_pkts, tx_bytes, rx_pkts, rx_bytes;

		/* Retry until a consistent tx snapshot has been read. */
		do {
			seq = u64_stats_fetch_begin_bh(&pcpu->tx_syncp);
			tx_pkts  = pcpu->tx_packets;
			tx_bytes = pcpu->tx_bytes;
		} while (u64_stats_fetch_retry_bh(&pcpu->tx_syncp, seq));

		/* Same for the rx side. */
		do {
			seq = u64_stats_fetch_begin_bh(&pcpu->rx_syncp);
			rx_pkts  = pcpu->rx_packets;
			rx_bytes = pcpu->rx_bytes;
		} while (u64_stats_fetch_retry_bh(&pcpu->rx_syncp, seq));

		tot->rx_packets += rx_pkts;
		tot->tx_packets += tx_pkts;
		tot->rx_bytes   += rx_bytes;
		tot->tx_bytes   += tx_bytes;
	}

	tot->tx_dropped = dev->stats.tx_dropped;
	tot->tx_fifo_errors = dev->stats.tx_fifo_errors;
	tot->rx_dropped = dev->stats.rx_dropped;
	tot->rx_length_errors = dev->stats.rx_length_errors;
	tot->rx_frame_errors = dev->stats.rx_frame_errors;

	return tot;
}

902 903 904 905
#ifdef CONFIG_NET_POLL_CONTROLLER
/* Netpoll hook: schedule NAPI on every receive queue currently in use. */
static void virtnet_netpoll(struct net_device *dev)
{
	struct virtnet_info *vi = netdev_priv(dev);
	int qp = 0;

	while (qp < vi->curr_queue_pairs) {
		napi_schedule(&vi->rq[qp].napi);
		qp++;
	}
}
#endif

913 914 915 916
static void virtnet_ack_link_announce(struct virtnet_info *vi)
{
	rtnl_lock();
	if (!virtnet_send_command(vi, VIRTIO_NET_CTRL_ANNOUNCE,
917
				  VIRTIO_NET_CTRL_ANNOUNCE_ACK, NULL, NULL))
918 919 920 921
		dev_warn(&vi->dev->dev, "Failed to ack link announce.\n");
	rtnl_unlock();
}

J
Jason Wang 已提交
922 923 924 925 926 927 928 929 930 931 932 933 934
/*
 * Tell the device how many queue pairs the driver is going to use.
 *
 * Does nothing (and returns 0) without a control virtqueue or without
 * VIRTIO_NET_F_MQ.  On success curr_queue_pairs is updated and, if the
 * interface is up, the refill work is scheduled.
 *
 * Returns 0 on success, -EINVAL if the device rejected the command.
 */
static int virtnet_set_queues(struct virtnet_info *vi, u16 queue_pairs)
{
	struct net_device *dev = vi->dev;
	struct virtio_net_ctrl_mq mq;
	struct scatterlist sg;

	if (!vi->has_cvq || !virtio_has_feature(vi->vdev, VIRTIO_NET_F_MQ))
		return 0;

	mq.virtqueue_pairs = queue_pairs;
	sg_init_one(&sg, &mq, sizeof(mq));

	if (!virtnet_send_command(vi, VIRTIO_NET_CTRL_MQ,
				  VIRTIO_NET_CTRL_MQ_VQ_PAIRS_SET, &sg, NULL)) {
		dev_warn(&dev->dev, "Fail to set num of queue pairs to %d\n",
			 queue_pairs);
		return -EINVAL;
	}

	vi->curr_queue_pairs = queue_pairs;
	/* virtnet_open() will refill when device is going to up. */
	if (dev->flags & IFF_UP)
		schedule_delayed_work(&vi->refill, 0);

	return 0;
}

R
Rusty Russell 已提交
949 950 951
/*
 * Bring the interface down: stop the refill work, then disable NAPI on
 * every queue the device supports.  Always returns 0.
 */
static int virtnet_close(struct net_device *dev)
{
	struct virtnet_info *vi = netdev_priv(dev);
	int qp = 0;

	/* Must come first so refill_work cannot re-enable napi afterwards. */
	cancel_delayed_work_sync(&vi->refill);

	while (qp < vi->max_queue_pairs) {
		napi_disable(&vi->rq[qp].napi);
		qp++;
	}

	return 0;
}

963 964 965
static void virtnet_set_rx_mode(struct net_device *dev)
{
	struct virtnet_info *vi = netdev_priv(dev);
966
	struct scatterlist sg[2];
967
	u8 promisc, allmulti;
968
	struct virtio_net_ctrl_mac *mac_data;
J
Jiri Pirko 已提交
969
	struct netdev_hw_addr *ha;
970
	int uc_count;
971
	int mc_count;
972 973
	void *buf;
	int i;
974 975 976 977 978

	/* We can't dynamicaly set ndo_set_rx_mode, so return gracefully */
	if (!virtio_has_feature(vi->vdev, VIRTIO_NET_F_CTRL_RX))
		return;

979 980
	promisc = ((dev->flags & IFF_PROMISC) != 0);
	allmulti = ((dev->flags & IFF_ALLMULTI) != 0);
981

982
	sg_init_one(sg, &promisc, sizeof(promisc));
983 984 985

	if (!virtnet_send_command(vi, VIRTIO_NET_CTRL_RX,
				  VIRTIO_NET_CTRL_RX_PROMISC,
986
				  sg, NULL))
987 988 989
		dev_warn(&dev->dev, "Failed to %sable promisc mode.\n",
			 promisc ? "en" : "dis");

990
	sg_init_one(sg, &allmulti, sizeof(allmulti));
991 992 993

	if (!virtnet_send_command(vi, VIRTIO_NET_CTRL_RX,
				  VIRTIO_NET_CTRL_RX_ALLMULTI,
994
				  sg, NULL))
995 996
		dev_warn(&dev->dev, "Failed to %sable allmulti mode.\n",
			 allmulti ? "en" : "dis");
997

998
	uc_count = netdev_uc_count(dev);
999
	mc_count = netdev_mc_count(dev);
1000
	/* MAC filter - use one buffer for both lists */
1001 1002 1003
	buf = kzalloc(((uc_count + mc_count) * ETH_ALEN) +
		      (2 * sizeof(mac_data->entries)), GFP_ATOMIC);
	mac_data = buf;
1004
	if (!buf)
1005 1006
		return;

1007 1008
	sg_init_table(sg, 2);

1009
	/* Store the unicast list and count in the front of the buffer */
1010
	mac_data->entries = uc_count;
J
Jiri Pirko 已提交
1011
	i = 0;
1012
	netdev_for_each_uc_addr(ha, dev)
J
Jiri Pirko 已提交
1013
		memcpy(&mac_data->macs[i++][0], ha->addr, ETH_ALEN);
1014 1015

	sg_set_buf(&sg[0], mac_data,
1016
		   sizeof(mac_data->entries) + (uc_count * ETH_ALEN));
1017 1018

	/* multicast list and count fill the end */
1019
	mac_data = (void *)&mac_data->macs[uc_count][0];
1020

1021
	mac_data->entries = mc_count;
1022
	i = 0;
1023 1024
	netdev_for_each_mc_addr(ha, dev)
		memcpy(&mac_data->macs[i++][0], ha->addr, ETH_ALEN);
1025 1026

	sg_set_buf(&sg[1], mac_data,
1027
		   sizeof(mac_data->entries) + (mc_count * ETH_ALEN));
1028 1029 1030

	if (!virtnet_send_command(vi, VIRTIO_NET_CTRL_MAC,
				  VIRTIO_NET_CTRL_MAC_TABLE_SET,
1031
				  sg, NULL))
1032 1033 1034
		dev_warn(&dev->dev, "Failed to set MAC fitler table.\n");

	kfree(buf);
1035 1036
}

1037 1038
/* ndo_vlan_rx_add_vid hook: send a VIRTIO_NET_CTRL_VLAN_ADD command carrying
 * @vid to the device.  A failed command is only logged; 0 is returned to the
 * caller in every case.  @proto is not used.
 */
static int virtnet_vlan_rx_add_vid(struct net_device *dev,
				   __be16 proto, u16 vid)
{
	struct virtnet_info *vi = netdev_priv(dev);
	struct scatterlist sg;
	bool sent;

	/* The command payload is just the VLAN id itself. */
	sg_init_one(&sg, &vid, sizeof(vid));

	sent = virtnet_send_command(vi, VIRTIO_NET_CTRL_VLAN,
				    VIRTIO_NET_CTRL_VLAN_ADD, &sg, NULL);
	if (!sent)
		dev_warn(&dev->dev, "Failed to add VLAN ID %d.\n", vid);

	return 0;
}

1051 1052
/* ndo_vlan_rx_kill_vid hook: send a VIRTIO_NET_CTRL_VLAN_DEL command carrying
 * @vid to the device.  A failed command is only logged; 0 is returned to the
 * caller in every case.  @proto is not used.
 */
static int virtnet_vlan_rx_kill_vid(struct net_device *dev,
				    __be16 proto, u16 vid)
{
	struct virtnet_info *vi = netdev_priv(dev);
	struct scatterlist sg;
	bool sent;

	/* The command payload is just the VLAN id itself. */
	sg_init_one(&sg, &vid, sizeof(vid));

	sent = virtnet_send_command(vi, VIRTIO_NET_CTRL_VLAN,
				    VIRTIO_NET_CTRL_VLAN_DEL, &sg, NULL);
	if (!sent)
		dev_warn(&dev->dev, "Failed to kill VLAN ID %d.\n", vid);

	return 0;
}

1065
static void virtnet_clean_affinity(struct virtnet_info *vi, long hcpu)
J
Jason Wang 已提交
1066 1067
{
	int i;
1068
	int cpu;
J
Jason Wang 已提交
1069

1070 1071
	if (vi->affinity_hint_set) {
		for (i = 0; i < vi->max_queue_pairs; i++) {
1072 1073 1074 1075
			virtqueue_set_affinity(vi->rq[i].vq, -1);
			virtqueue_set_affinity(vi->sq[i].vq, -1);
		}

1076 1077 1078 1079 1080 1081 1082 1083
		vi->affinity_hint_set = false;
	}

	i = 0;
	for_each_online_cpu(cpu) {
		if (cpu == hcpu) {
			*per_cpu_ptr(vi->vq_index, cpu) = -1;
		} else {
1084 1085
			*per_cpu_ptr(vi->vq_index, cpu) =
				++i % vi->curr_queue_pairs;
1086 1087 1088
		}
	}
}
1089

1090 1091 1092 1093
static void virtnet_set_affinity(struct virtnet_info *vi)
{
	int i;
	int cpu;
J
Jason Wang 已提交
1094 1095 1096 1097 1098

	/* In multiqueue mode, when the number of cpu is equal to the number of
	 * queue pairs, we let the queue pairs to be private to one cpu by
	 * setting the affinity hint to eliminate the contention.
	 */
1099 1100 1101 1102
	if (vi->curr_queue_pairs == 1 ||
	    vi->max_queue_pairs != num_online_cpus()) {
		virtnet_clean_affinity(vi, -1);
		return;
J
Jason Wang 已提交
1103 1104
	}

1105 1106
	i = 0;
	for_each_online_cpu(cpu) {
J
Jason Wang 已提交
1107 1108
		virtqueue_set_affinity(vi->rq[i].vq, cpu);
		virtqueue_set_affinity(vi->sq[i].vq, cpu);
1109 1110
		*per_cpu_ptr(vi->vq_index, cpu) = i;
		i++;
J
Jason Wang 已提交
1111 1112
	}

1113
	vi->affinity_hint_set = true;
J
Jason Wang 已提交
1114 1115
}

1116 1117 1118 1119 1120
static int virtnet_cpu_callback(struct notifier_block *nfb,
			        unsigned long action, void *hcpu)
{
	struct virtnet_info *vi = container_of(nfb, struct virtnet_info, nb);

1121 1122 1123 1124 1125
	mutex_lock(&vi->config_lock);

	if (!vi->config_enable)
		goto done;

1126 1127 1128 1129 1130 1131 1132 1133 1134 1135 1136 1137
	switch(action & ~CPU_TASKS_FROZEN) {
	case CPU_ONLINE:
	case CPU_DOWN_FAILED:
	case CPU_DEAD:
		virtnet_set_affinity(vi);
		break;
	case CPU_DOWN_PREPARE:
		virtnet_clean_affinity(vi, (long)hcpu);
		break;
	default:
		break;
	}
1138 1139 1140

done:
	mutex_unlock(&vi->config_lock);
1141
	return NOTIFY_OK;
J
Jason Wang 已提交
1142 1143
}

R
Rick Jones 已提交
1144 1145 1146 1147 1148
/* ethtool get_ringparam hook: report the vring size of the first rx and tx
 * virtqueues as both the maximum and the current number of pending entries.
 */
static void virtnet_get_ringparam(struct net_device *dev,
				struct ethtool_ringparam *ring)
{
	struct virtnet_info *vi = netdev_priv(dev);

	ring->rx_max_pending = virtqueue_get_vring_size(vi->rq[0].vq);
	ring->rx_pending = ring->rx_max_pending;

	ring->tx_max_pending = virtqueue_get_vring_size(vi->sq[0].vq);
	ring->tx_pending = ring->tx_max_pending;
}

1155 1156 1157 1158 1159 1160 1161 1162 1163 1164 1165 1166 1167

/* ethtool get_drvinfo hook: fill in the driver name, the driver version and
 * the virtio bus name of the underlying device.
 */
static void virtnet_get_drvinfo(struct net_device *dev,
				struct ethtool_drvinfo *info)
{
	struct virtnet_info *vi = netdev_priv(dev);

	strlcpy(info->driver, KBUILD_MODNAME, sizeof(info->driver));
	strlcpy(info->version, VIRTNET_DRIVER_VERSION, sizeof(info->version));
	strlcpy(info->bus_info, virtio_bus_name(vi->vdev),
		sizeof(info->bus_info));
}

1168 1169 1170 1171 1172 1173 1174 1175 1176 1177 1178 1179 1180 1181 1182 1183 1184
/* ethtool set_channels hook: change the number of active rx/tx queue pairs.
 *
 * Only combined channels are supported.  Returns -EINVAL when separate
 * rx/tx/other channels are requested or when the combined count is zero or
 * above vi->max_queue_pairs; otherwise returns the result of
 * virtnet_set_queues().
 *
 * TODO: Eliminate OOO packets during switching
 */
static int virtnet_set_channels(struct net_device *dev,
				struct ethtool_channels *channels)
{
	struct virtnet_info *vi = netdev_priv(dev);
	u16 queue_pairs;
	int err;

	/* We don't support separate rx/tx channels.
	 * We don't allow setting 'other' channels.
	 */
	if (channels->rx_count || channels->tx_count || channels->other_count)
		return -EINVAL;

	/* Validate the caller's value before narrowing it to u16, so that an
	 * oversized count cannot wrap into the accepted range, and refuse a
	 * request for zero queue pairs.
	 */
	if (channels->combined_count == 0 ||
	    channels->combined_count > vi->max_queue_pairs)
		return -EINVAL;

	queue_pairs = channels->combined_count;

	/* Keep the online cpu set stable while queues and affinity change */
	get_online_cpus();
	err = virtnet_set_queues(vi, queue_pairs);
	if (!err) {
		netif_set_real_num_tx_queues(dev, queue_pairs);
		netif_set_real_num_rx_queues(dev, queue_pairs);

		virtnet_set_affinity(vi);
	}
	put_online_cpus();

	return err;
}

/* ethtool get_channels hook: report the current and maximum number of
 * combined queue pairs.  Separate rx, tx and 'other' channels are reported
 * as zero.
 */
static void virtnet_get_channels(struct net_device *dev,
				 struct ethtool_channels *channels)
{
	struct virtnet_info *vi = netdev_priv(dev);

	channels->max_combined = vi->max_queue_pairs;
	channels->combined_count = vi->curr_queue_pairs;

	channels->max_other = 0;
	channels->other_count = 0;
	channels->rx_count = 0;
	channels->tx_count = 0;
}

1211
static const struct ethtool_ops virtnet_ethtool_ops = {
1212
	.get_drvinfo = virtnet_get_drvinfo,
1213
	.get_link = ethtool_op_get_link,
R
Rick Jones 已提交
1214
	.get_ringparam = virtnet_get_ringparam,
1215 1216
	.set_channels = virtnet_set_channels,
	.get_channels = virtnet_get_channels,
1217 1218
};

M
Mark McLoughlin 已提交
1219 1220 1221 1222 1223 1224 1225 1226 1227 1228 1229
#define MIN_MTU 68
#define MAX_MTU 65535

static int virtnet_change_mtu(struct net_device *dev, int new_mtu)
{
	if (new_mtu < MIN_MTU || new_mtu > MAX_MTU)
		return -EINVAL;
	dev->mtu = new_mtu;
	return 0;
}

J
Jason Wang 已提交
1230 1231 1232 1233 1234
/* To avoid contending a lock hold by a vcpu who would exit to host, select the
 * txq based on the processor id.
 */
static u16 virtnet_select_queue(struct net_device *dev, struct sk_buff *skb)
{
1235 1236 1237 1238 1239 1240 1241 1242 1243 1244
	int txq;
	struct virtnet_info *vi = netdev_priv(dev);

	if (skb_rx_queue_recorded(skb)) {
		txq = skb_get_rx_queue(skb);
	} else {
		txq = *__this_cpu_ptr(vi->vq_index);
		if (txq == -1)
			txq = 0;
	}
J
Jason Wang 已提交
1245 1246 1247 1248 1249 1250 1251

	while (unlikely(txq >= dev->real_num_tx_queues))
		txq -= dev->real_num_tx_queues;

	return txq;
}

1252 1253 1254 1255 1256
static const struct net_device_ops virtnet_netdev = {
	.ndo_open            = virtnet_open,
	.ndo_stop   	     = virtnet_close,
	.ndo_start_xmit      = start_xmit,
	.ndo_validate_addr   = eth_validate_addr,
1257
	.ndo_set_mac_address = virtnet_set_mac_address,
1258
	.ndo_set_rx_mode     = virtnet_set_rx_mode,
1259
	.ndo_change_mtu	     = virtnet_change_mtu,
1260
	.ndo_get_stats64     = virtnet_stats,
1261 1262
	.ndo_vlan_rx_add_vid = virtnet_vlan_rx_add_vid,
	.ndo_vlan_rx_kill_vid = virtnet_vlan_rx_kill_vid,
J
Jason Wang 已提交
1263
	.ndo_select_queue     = virtnet_select_queue,
1264 1265 1266 1267 1268
#ifdef CONFIG_NET_POLL_CONTROLLER
	.ndo_poll_controller = virtnet_netpoll,
#endif
};

1269
static void virtnet_config_changed_work(struct work_struct *work)
1270
{
1271 1272
	struct virtnet_info *vi =
		container_of(work, struct virtnet_info, config_work);
1273 1274
	u16 v;

1275 1276 1277 1278
	mutex_lock(&vi->config_lock);
	if (!vi->config_enable)
		goto done;

1279
	if (virtio_config_val(vi->vdev, VIRTIO_NET_F_STATUS,
1280
			      offsetof(struct virtio_net_config, status),
1281
			      &v) < 0)
1282 1283 1284
		goto done;

	if (v & VIRTIO_NET_S_ANNOUNCE) {
1285
		netdev_notify_peers(vi->dev);
1286 1287
		virtnet_ack_link_announce(vi);
	}
1288 1289 1290 1291 1292

	/* Ignore unknown (future) status bits */
	v &= VIRTIO_NET_S_LINK_UP;

	if (vi->status == v)
1293
		goto done;
1294 1295 1296 1297 1298

	vi->status = v;

	if (vi->status & VIRTIO_NET_S_LINK_UP) {
		netif_carrier_on(vi->dev);
J
Jason Wang 已提交
1299
		netif_tx_wake_all_queues(vi->dev);
1300 1301
	} else {
		netif_carrier_off(vi->dev);
J
Jason Wang 已提交
1302
		netif_tx_stop_all_queues(vi->dev);
1303
	}
1304 1305
done:
	mutex_unlock(&vi->config_lock);
1306 1307 1308 1309 1310 1311
}

static void virtnet_config_changed(struct virtio_device *vdev)
{
	struct virtnet_info *vi = vdev->priv;

1312
	schedule_work(&vi->config_work);
1313 1314
}

J
Jason Wang 已提交
1315 1316 1317 1318 1319 1320 1321 1322 1323 1324 1325 1326 1327 1328 1329 1330 1331 1332 1333 1334 1335 1336 1337 1338 1339 1340 1341 1342 1343 1344 1345 1346 1347 1348 1349 1350 1351 1352 1353 1354 1355
/* Release the send and receive queue arrays of @vi */
static void virtnet_free_queues(struct virtnet_info *vi)
{
	kfree(vi->sq);
	kfree(vi->rq);
}

static void free_receive_bufs(struct virtnet_info *vi)
{
	int i;

	for (i = 0; i < vi->max_queue_pairs; i++) {
		while (vi->rq[i].pages)
			__free_pages(get_a_page(&vi->rq[i], GFP_KERNEL), 0);
	}
}

/* Detach and release every buffer still sitting unused in the send and
 * receive virtqueues.  After draining a receive queue its buffer count must
 * be zero; anything else triggers BUG_ON().
 */
static void free_unused_bufs(struct virtnet_info *vi)
{
	struct virtqueue *vq;
	void *buf;
	int qp;

	/* Send side: every unused buffer is an skb */
	for (qp = 0; qp < vi->max_queue_pairs; qp++) {
		vq = vi->sq[qp].vq;
		for (;;) {
			buf = virtqueue_detach_unused_buf(vq);
			if (buf == NULL)
				break;
			dev_kfree_skb(buf);
		}
	}

	/* Receive side: buffers go back to the queue's page list in
	 * mergeable / big-packet mode, and are freed as skbs otherwise.
	 */
	for (qp = 0; qp < vi->max_queue_pairs; qp++) {
		vq = vi->rq[qp].vq;
		for (;;) {
			buf = virtqueue_detach_unused_buf(vq);
			if (buf == NULL)
				break;

			if (vi->mergeable_rx_bufs || vi->big_packets)
				give_pages(&vi->rq[qp], buf);
			else
				dev_kfree_skb(buf);
			--vi->rq[qp].num;
		}
		BUG_ON(vi->rq[qp].num != 0);
	}
}

1356 1357 1358 1359
/* Tear down the virtqueues: clear the affinity hints, delete the vqs through
 * the transport's del_vqs() and free the queue arrays.
 */
static void virtnet_del_vqs(struct virtnet_info *vi)
{
	virtnet_clean_affinity(vi, -1);

	vi->vdev->config->del_vqs(vi->vdev);

	virtnet_free_queues(vi);
}

J
Jason Wang 已提交
1367
static int virtnet_find_vqs(struct virtnet_info *vi)
1368
{
J
Jason Wang 已提交
1369 1370 1371 1372 1373 1374 1375 1376 1377 1378 1379 1380 1381 1382 1383 1384 1385 1386 1387 1388 1389 1390 1391 1392 1393 1394 1395 1396 1397
	vq_callback_t **callbacks;
	struct virtqueue **vqs;
	int ret = -ENOMEM;
	int i, total_vqs;
	const char **names;

	/* We expect 1 RX virtqueue followed by 1 TX virtqueue, followed by
	 * possible N-1 RX/TX queue pairs used in multiqueue mode, followed by
	 * possible control vq.
	 */
	total_vqs = vi->max_queue_pairs * 2 +
		    virtio_has_feature(vi->vdev, VIRTIO_NET_F_CTRL_VQ);

	/* Allocate space for find_vqs parameters */
	vqs = kzalloc(total_vqs * sizeof(*vqs), GFP_KERNEL);
	if (!vqs)
		goto err_vq;
	callbacks = kmalloc(total_vqs * sizeof(*callbacks), GFP_KERNEL);
	if (!callbacks)
		goto err_callback;
	names = kmalloc(total_vqs * sizeof(*names), GFP_KERNEL);
	if (!names)
		goto err_names;

	/* Parameters for control virtqueue, if any */
	if (vi->has_cvq) {
		callbacks[total_vqs - 1] = NULL;
		names[total_vqs - 1] = "control";
	}
1398

J
Jason Wang 已提交
1399 1400 1401 1402 1403 1404 1405 1406 1407
	/* Allocate/initialize parameters for send/receive virtqueues */
	for (i = 0; i < vi->max_queue_pairs; i++) {
		callbacks[rxq2vq(i)] = skb_recv_done;
		callbacks[txq2vq(i)] = skb_xmit_done;
		sprintf(vi->rq[i].name, "input.%d", i);
		sprintf(vi->sq[i].name, "output.%d", i);
		names[rxq2vq(i)] = vi->rq[i].name;
		names[txq2vq(i)] = vi->sq[i].name;
	}
1408

J
Jason Wang 已提交
1409 1410 1411 1412
	ret = vi->vdev->config->find_vqs(vi->vdev, total_vqs, vqs, callbacks,
					 names);
	if (ret)
		goto err_find;
1413

J
Jason Wang 已提交
1414 1415
	if (vi->has_cvq) {
		vi->cvq = vqs[total_vqs - 1];
1416
		if (virtio_has_feature(vi->vdev, VIRTIO_NET_F_CTRL_VLAN))
1417
			vi->dev->features |= NETIF_F_HW_VLAN_CTAG_FILTER;
1418
	}
J
Jason Wang 已提交
1419 1420 1421 1422 1423 1424 1425 1426 1427 1428

	for (i = 0; i < vi->max_queue_pairs; i++) {
		vi->rq[i].vq = vqs[rxq2vq(i)];
		vi->sq[i].vq = vqs[txq2vq(i)];
	}

	kfree(names);
	kfree(callbacks);
	kfree(vqs);

1429
	return 0;
J
Jason Wang 已提交
1430 1431 1432 1433 1434 1435 1436 1437 1438 1439 1440 1441 1442 1443 1444 1445 1446 1447 1448

err_find:
	kfree(names);
err_names:
	kfree(callbacks);
err_callback:
	kfree(vqs);
err_vq:
	return ret;
}

/* Allocate and initialise the send and receive queue arrays, one entry per
 * possible queue pair (vi->max_queue_pairs), and set up the refill work.
 *
 * Returns 0 on success or -ENOMEM when an array cannot be allocated.
 */
static int virtnet_alloc_queues(struct virtnet_info *vi)
{
	int i;

	/* kcalloc() zeroes the arrays and rejects a count * size overflow */
	vi->sq = kcalloc(vi->max_queue_pairs, sizeof(*vi->sq), GFP_KERNEL);
	if (!vi->sq)
		goto err_sq;
	vi->rq = kcalloc(vi->max_queue_pairs, sizeof(*vi->rq), GFP_KERNEL);
	if (!vi->rq)
		goto err_rq;

	INIT_DELAYED_WORK(&vi->refill, refill_work);
	for (i = 0; i < vi->max_queue_pairs; i++) {
		vi->rq[i].pages = NULL;
		netif_napi_add(vi->dev, &vi->rq[i].napi, virtnet_poll,
			       napi_weight);

		sg_init_table(vi->rq[i].sg, ARRAY_SIZE(vi->rq[i].sg));
		sg_init_table(vi->sq[i].sg, ARRAY_SIZE(vi->sq[i].sg));
	}

	return 0;

err_rq:
	kfree(vi->sq);
err_sq:
	return -ENOMEM;
}

/* Allocate the queue arrays, find the device's virtqueues and set up the
 * queue affinity.  Returns 0 on success or the error code of the step that
 * failed; the queue arrays are freed again if the virtqueue lookup fails.
 */
static int init_vqs(struct virtnet_info *vi)
{
	int rc;

	/* Allocate send & receive queues */
	rc = virtnet_alloc_queues(vi);
	if (rc)
		return rc;

	rc = virtnet_find_vqs(vi);
	if (rc) {
		virtnet_free_queues(vi);
		return rc;
	}

	/* Hold the online cpu set steady while the affinity is computed */
	get_online_cpus();
	virtnet_set_affinity(vi);
	put_online_cpus();

	return 0;
}

R
Rusty Russell 已提交
1495 1496
static int virtnet_probe(struct virtio_device *vdev)
{
J
Jason Wang 已提交
1497
	int i, err;
R
Rusty Russell 已提交
1498 1499
	struct net_device *dev;
	struct virtnet_info *vi;
J
Jason Wang 已提交
1500 1501 1502 1503 1504 1505 1506 1507 1508 1509 1510 1511
	u16 max_queue_pairs;

	/* Find if host supports multiqueue virtio_net device */
	err = virtio_config_val(vdev, VIRTIO_NET_F_MQ,
				offsetof(struct virtio_net_config,
				max_virtqueue_pairs), &max_queue_pairs);

	/* We need at least 2 queue's */
	if (err || max_queue_pairs < VIRTIO_NET_CTRL_MQ_VQ_PAIRS_MIN ||
	    max_queue_pairs > VIRTIO_NET_CTRL_MQ_VQ_PAIRS_MAX ||
	    !virtio_has_feature(vdev, VIRTIO_NET_F_CTRL_VQ))
		max_queue_pairs = 1;
R
Rusty Russell 已提交
1512 1513

	/* Allocate ourselves a network device with room for our info */
J
Jason Wang 已提交
1514
	dev = alloc_etherdev_mq(sizeof(struct virtnet_info), max_queue_pairs);
R
Rusty Russell 已提交
1515 1516 1517 1518
	if (!dev)
		return -ENOMEM;

	/* Set up network device as normal. */
1519
	dev->priv_flags |= IFF_UNICAST_FLT | IFF_LIVE_ADDR_CHANGE;
1520
	dev->netdev_ops = &virtnet_netdev;
R
Rusty Russell 已提交
1521
	dev->features = NETIF_F_HIGHDMA;
1522

1523
	SET_ETHTOOL_OPS(dev, &virtnet_ethtool_ops);
R
Rusty Russell 已提交
1524 1525 1526
	SET_NETDEV_DEV(dev, &vdev->dev);

	/* Do we support "hardware" checksums? */
1527
	if (virtio_has_feature(vdev, VIRTIO_NET_F_CSUM)) {
R
Rusty Russell 已提交
1528
		/* This opens up the world of extra features. */
1529 1530 1531 1532 1533 1534
		dev->hw_features |= NETIF_F_HW_CSUM|NETIF_F_SG|NETIF_F_FRAGLIST;
		if (csum)
			dev->features |= NETIF_F_HW_CSUM|NETIF_F_SG|NETIF_F_FRAGLIST;

		if (virtio_has_feature(vdev, VIRTIO_NET_F_GSO)) {
			dev->hw_features |= NETIF_F_TSO | NETIF_F_UFO
R
Rusty Russell 已提交
1535 1536
				| NETIF_F_TSO_ECN | NETIF_F_TSO6;
		}
1537
		/* Individual feature bits: what can host handle? */
1538 1539 1540 1541 1542 1543 1544 1545 1546 1547 1548 1549
		if (virtio_has_feature(vdev, VIRTIO_NET_F_HOST_TSO4))
			dev->hw_features |= NETIF_F_TSO;
		if (virtio_has_feature(vdev, VIRTIO_NET_F_HOST_TSO6))
			dev->hw_features |= NETIF_F_TSO6;
		if (virtio_has_feature(vdev, VIRTIO_NET_F_HOST_ECN))
			dev->hw_features |= NETIF_F_TSO_ECN;
		if (virtio_has_feature(vdev, VIRTIO_NET_F_HOST_UFO))
			dev->hw_features |= NETIF_F_UFO;

		if (gso)
			dev->features |= dev->hw_features & (NETIF_F_ALL_TSO|NETIF_F_UFO);
		/* (!csum && gso) case will be fixed by register_netdev() */
R
Rusty Russell 已提交
1550
	}
1551 1552
	if (virtio_has_feature(vdev, VIRTIO_NET_F_GUEST_CSUM))
		dev->features |= NETIF_F_RXCSUM;
R
Rusty Russell 已提交
1553

1554 1555
	dev->vlan_features = dev->features;

R
Rusty Russell 已提交
1556
	/* Configuration may specify what MAC to use.  Otherwise random. */
1557
	if (virtio_config_val_len(vdev, VIRTIO_NET_F_MAC,
1558
				  offsetof(struct virtio_net_config, mac),
1559
				  dev->dev_addr, dev->addr_len) < 0)
1560
		eth_hw_addr_random(dev);
R
Rusty Russell 已提交
1561 1562 1563 1564 1565

	/* Set up our device-specific information */
	vi = netdev_priv(dev);
	vi->dev = dev;
	vi->vdev = vdev;
1566
	vdev->priv = vi;
1567 1568 1569 1570 1571
	vi->stats = alloc_percpu(struct virtnet_stats);
	err = -ENOMEM;
	if (vi->stats == NULL)
		goto free;

1572 1573 1574 1575
	vi->vq_index = alloc_percpu(int);
	if (vi->vq_index == NULL)
		goto free_stats;

1576 1577 1578
	mutex_init(&vi->config_lock);
	vi->config_enable = true;
	INIT_WORK(&vi->config_work, virtnet_config_changed_work);
R
Rusty Russell 已提交
1579

1580
	/* If we can receive ANY GSO packets, we must allocate large ones. */
1581 1582 1583
	if (virtio_has_feature(vdev, VIRTIO_NET_F_GUEST_TSO4) ||
	    virtio_has_feature(vdev, VIRTIO_NET_F_GUEST_TSO6) ||
	    virtio_has_feature(vdev, VIRTIO_NET_F_GUEST_ECN))
1584 1585
		vi->big_packets = true;

1586 1587 1588
	if (virtio_has_feature(vdev, VIRTIO_NET_F_MRG_RXBUF))
		vi->mergeable_rx_bufs = true;

1589 1590 1591
	if (virtio_has_feature(vdev, VIRTIO_F_ANY_LAYOUT))
		vi->any_header_sg = true;

J
Jason Wang 已提交
1592 1593 1594 1595 1596 1597 1598 1599
	if (virtio_has_feature(vdev, VIRTIO_NET_F_CTRL_VQ))
		vi->has_cvq = true;

	/* Use single tx/rx queue pair as default */
	vi->curr_queue_pairs = 1;
	vi->max_queue_pairs = max_queue_pairs;

	/* Allocate/initialize the rx/tx queues, and invoke find_vqs */
1600
	err = init_vqs(vi);
1601
	if (err)
1602
		goto free_index;
R
Rusty Russell 已提交
1603

J
Jason Wang 已提交
1604 1605 1606
	netif_set_real_num_tx_queues(dev, 1);
	netif_set_real_num_rx_queues(dev, 1);

R
Rusty Russell 已提交
1607 1608 1609
	err = register_netdev(dev);
	if (err) {
		pr_debug("virtio_net: registering device failed\n");
1610
		goto free_vqs;
R
Rusty Russell 已提交
1611
	}
1612 1613

	/* Last of all, set up some receive buffers. */
1614
	for (i = 0; i < vi->curr_queue_pairs; i++) {
J
Jason Wang 已提交
1615 1616 1617 1618 1619 1620 1621 1622
		try_fill_recv(&vi->rq[i], GFP_KERNEL);

		/* If we didn't even get one input buffer, we're useless. */
		if (vi->rq[i].num == 0) {
			free_unused_bufs(vi);
			err = -ENOMEM;
			goto free_recv_bufs;
		}
1623 1624
	}

1625 1626 1627 1628 1629 1630 1631
	vi->nb.notifier_call = &virtnet_cpu_callback;
	err = register_hotcpu_notifier(&vi->nb);
	if (err) {
		pr_debug("virtio_net: registering cpu notifier failed\n");
		goto free_recv_bufs;
	}

J
Jason Wang 已提交
1632 1633 1634 1635
	/* Assume link up if device can't report link status,
	   otherwise get link status from config. */
	if (virtio_has_feature(vi->vdev, VIRTIO_NET_F_STATUS)) {
		netif_carrier_off(dev);
1636
		schedule_work(&vi->config_work);
J
Jason Wang 已提交
1637 1638 1639 1640
	} else {
		vi->status = VIRTIO_NET_S_LINK_UP;
		netif_carrier_on(dev);
	}
1641

J
Jason Wang 已提交
1642 1643 1644
	pr_debug("virtnet: registered device %s with %d RX and TX vq's\n",
		 dev->name, max_queue_pairs);

R
Rusty Russell 已提交
1645 1646
	return 0;

J
Jason Wang 已提交
1647 1648
free_recv_bufs:
	free_receive_bufs(vi);
1649
	unregister_netdev(dev);
1650
free_vqs:
J
Jason Wang 已提交
1651
	cancel_delayed_work_sync(&vi->refill);
1652
	virtnet_del_vqs(vi);
1653 1654
free_index:
	free_percpu(vi->vq_index);
1655 1656
free_stats:
	free_percpu(vi->stats);
R
Rusty Russell 已提交
1657 1658 1659 1660 1661
free:
	free_netdev(dev);
	return err;
}

1662
static void remove_vq_common(struct virtnet_info *vi)
R
Rusty Russell 已提交
1663
{
1664
	vi->vdev->config->reset(vi->vdev);
S
Shirley Ma 已提交
1665 1666

	/* Free unused buffers in both send and recv, if any. */
1667
	free_unused_bufs(vi);
1668

J
Jason Wang 已提交
1669
	free_receive_bufs(vi);
1670

J
Jason Wang 已提交
1671
	virtnet_del_vqs(vi);
1672 1673
}

1674
static void virtnet_remove(struct virtio_device *vdev)
1675 1676 1677
{
	struct virtnet_info *vi = vdev->priv;

1678 1679
	unregister_hotcpu_notifier(&vi->nb);

1680 1681 1682 1683 1684
	/* Prevent config work handler from accessing the device. */
	mutex_lock(&vi->config_lock);
	vi->config_enable = false;
	mutex_unlock(&vi->config_lock);

1685 1686 1687
	unregister_netdev(vi->dev);

	remove_vq_common(vi);
1688

1689 1690
	flush_work(&vi->config_work);

1691
	free_percpu(vi->vq_index);
1692
	free_percpu(vi->stats);
1693
	free_netdev(vi->dev);
R
Rusty Russell 已提交
1694 1695
}

1696 1697 1698 1699
#ifdef CONFIG_PM
/* Freeze callback (CONFIG_PM): detach the net device, stop the refill work
 * and NAPI, and tear down the virtqueues.  Always returns 0.
 */
static int virtnet_freeze(struct virtio_device *vdev)
{
	struct virtnet_info *vi = vdev->priv;
	int qp;

	/* Prevent config work handler from accessing the device */
	mutex_lock(&vi->config_lock);
	vi->config_enable = false;
	mutex_unlock(&vi->config_lock);

	netif_device_detach(vi->dev);
	cancel_delayed_work_sync(&vi->refill);

	if (netif_running(vi->dev)) {
		for (qp = 0; qp < vi->max_queue_pairs; qp++) {
			napi_disable(&vi->rq[qp].napi);
			netif_napi_del(&vi->rq[qp].napi);
		}
	}

	remove_vq_common(vi);

	flush_work(&vi->config_work);

	return 0;
}

static int virtnet_restore(struct virtio_device *vdev)
{
	struct virtnet_info *vi = vdev->priv;
J
Jason Wang 已提交
1726
	int err, i;
1727 1728 1729 1730 1731 1732

	err = init_vqs(vi);
	if (err)
		return err;

	if (netif_running(vi->dev))
J
Jason Wang 已提交
1733 1734
		for (i = 0; i < vi->max_queue_pairs; i++)
			virtnet_napi_enable(&vi->rq[i]);
1735 1736 1737

	netif_device_attach(vi->dev);

1738
	for (i = 0; i < vi->curr_queue_pairs; i++)
J
Jason Wang 已提交
1739 1740
		if (!try_fill_recv(&vi->rq[i], GFP_KERNEL))
			schedule_delayed_work(&vi->refill, 0);
1741

1742 1743 1744 1745
	mutex_lock(&vi->config_lock);
	vi->config_enable = true;
	mutex_unlock(&vi->config_lock);

1746
	rtnl_lock();
J
Jason Wang 已提交
1747
	virtnet_set_queues(vi, vi->curr_queue_pairs);
1748
	rtnl_unlock();
J
Jason Wang 已提交
1749

1750 1751 1752 1753
	return 0;
}
#endif

R
Rusty Russell 已提交
1754 1755 1756 1757 1758
/* Device ids this driver binds to; the zero entry ends the table */
static struct virtio_device_id id_table[] = {
	{
		VIRTIO_ID_NET,
		VIRTIO_DEV_ANY_ID
	},
	{ 0 },
};

1759
static unsigned int features[] = {
1760 1761
	VIRTIO_NET_F_CSUM, VIRTIO_NET_F_GUEST_CSUM,
	VIRTIO_NET_F_GSO, VIRTIO_NET_F_MAC,
1762
	VIRTIO_NET_F_HOST_TSO4, VIRTIO_NET_F_HOST_UFO, VIRTIO_NET_F_HOST_TSO6,
1763
	VIRTIO_NET_F_HOST_ECN, VIRTIO_NET_F_GUEST_TSO4, VIRTIO_NET_F_GUEST_TSO6,
1764
	VIRTIO_NET_F_GUEST_ECN, VIRTIO_NET_F_GUEST_UFO,
1765
	VIRTIO_NET_F_MRG_RXBUF, VIRTIO_NET_F_STATUS, VIRTIO_NET_F_CTRL_VQ,
1766
	VIRTIO_NET_F_CTRL_RX, VIRTIO_NET_F_CTRL_VLAN,
J
Jason Wang 已提交
1767
	VIRTIO_NET_F_GUEST_ANNOUNCE, VIRTIO_NET_F_MQ,
1768
	VIRTIO_NET_F_CTRL_MAC_ADDR,
1769
	VIRTIO_F_ANY_LAYOUT,
1770 1771
};

1772
static struct virtio_driver virtio_net_driver = {
1773 1774
	.feature_table = features,
	.feature_table_size = ARRAY_SIZE(features),
R
Rusty Russell 已提交
1775 1776 1777 1778
	.driver.name =	KBUILD_MODNAME,
	.driver.owner =	THIS_MODULE,
	.id_table =	id_table,
	.probe =	virtnet_probe,
1779
	.remove =	virtnet_remove,
1780
	.config_changed = virtnet_config_changed,
1781 1782 1783 1784
#ifdef CONFIG_PM
	.freeze =	virtnet_freeze,
	.restore =	virtnet_restore,
#endif
R
Rusty Russell 已提交
1785 1786
};

1787
module_virtio_driver(virtio_net_driver);
R
Rusty Russell 已提交
1788 1789 1790 1791

MODULE_DEVICE_TABLE(virtio, id_table);
MODULE_DESCRIPTION("Virtio network driver");
MODULE_LICENSE("GPL");