/*
 * The Virtio 9p transport driver
 *
 * This is a block based transport driver based on the lguest block driver
 * code.
 *
 *  Copyright (C) 2007, 2008 Eric Van Hensbergen, IBM Corporation
 *
 *  Based on virtio console driver
 *  Copyright (C) 2006, 2007 Rusty Russell, IBM Corporation
 *
 *  This program is free software; you can redistribute it and/or modify
 *  it under the terms of the GNU General Public License version 2
 *  as published by the Free Software Foundation.
 *
 *  This program is distributed in the hope that it will be useful,
 *  but WITHOUT ANY WARRANTY; without even the implied warranty of
 *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 *  GNU General Public License for more details.
 *
 *  You should have received a copy of the GNU General Public License
 *  along with this program; if not, write to:
 *  Free Software Foundation
 *  51 Franklin Street, Fifth Floor
 *  Boston, MA  02111-1301  USA
 *
 */

#include <linux/in.h>
#include <linux/module.h>
#include <linux/net.h>
#include <linux/ipv6.h>
#include <linux/errno.h>
#include <linux/kernel.h>
#include <linux/un.h>
#include <linux/uaccess.h>
#include <linux/inet.h>
#include <linux/idr.h>
#include <linux/file.h>
40
#include <linux/slab.h>
E
Eric Van Hensbergen 已提交
41 42
#include <net/9p/9p.h>
#include <linux/parser.h>
43
#include <net/9p/client.h>
E
Eric Van Hensbergen 已提交
44 45 46 47
#include <net/9p/transport.h>
#include <linux/scatterlist.h>
#include <linux/virtio.h>
#include <linux/virtio_9p.h>
48
#include "trans_common.h"
E
Eric Van Hensbergen 已提交
49

50 51
/*
 * Number of entries in each channel's scatterlist array (virtio_chan.sg);
 * also passed as the packing limit to pack_sg_list()/pack_sg_list_p().
 */
#define VIRTQUEUE_NUM	128

E
Eric Van Hensbergen 已提交
52
/* a single mutex to manage channel initialization and attachment */
53
/* Held around updates to virtio_chan_list and to each channel's inuse flag. */
static DEFINE_MUTEX(virtio_9p_lock);
E
Eric Van Hensbergen 已提交
54

E
Eric Van Hensbergen 已提交
55 56 57 58 59
/**
 * struct virtio_chan - per-instance transport information
 * @initialized: whether the channel is initialized
 * @inuse: whether the channel is in use
 * @lock: protects multiple elements within this structure
A
Abhishek Kulkarni 已提交
60
 * @client: client instance
E
Eric Van Hensbergen 已提交
61 62 63 64 65
 * @vdev: virtio dev associated with this channel
 * @vq: virtio queue associated with this channel
 * @sg: scatter gather list which is used to pack a request (protected?)
 *
 * We keep all per-channel information in a structure.
E
Eric Van Hensbergen 已提交
66 67
 * This structure is allocated within the devices dev->mem space.
 * A pointer to the structure will get put in the transport private.
E
Eric Van Hensbergen 已提交
68
 *
E
Eric Van Hensbergen 已提交
69
 */
E
Eric Van Hensbergen 已提交
70

71
struct virtio_chan {
E
Eric Van Hensbergen 已提交
72
	bool inuse;
E
Eric Van Hensbergen 已提交
73

74 75
	spinlock_t lock;

76
	struct p9_client *client;
E
Eric Van Hensbergen 已提交
77
	struct virtio_device *vdev;
78
	struct virtqueue *vq;
79 80
	int ring_bufs_avail;
	wait_queue_head_t *vc_wq;
E
Eric Van Hensbergen 已提交
81

82 83
	/* Scatterlist: can be too big for stack. */
	struct scatterlist sg[VIRTQUEUE_NUM];
84

85 86 87 88 89 90
	int tag_len;
	/*
	 * tag name to identify a mount Non-null terminated
	 */
	char *tag;

91 92 93 94
	struct list_head chan_list;
};

/*
 * All probed channels.  Initialised in p9_virtio_init(); entries are added
 * by p9_virtio_probe() and removed by p9_virtio_remove() with
 * virtio_9p_lock held.
 */
static struct list_head virtio_chan_list;
E
Eric Van Hensbergen 已提交
95 96 97 98 99 100 101

/*
 * Number of bytes from @data up to the end of the page that contains it
 * (a full PAGE_SIZE when @data is page aligned).
 */
static unsigned int rest_of_page(void *data)
{
	unsigned long offset_in_pg = (unsigned long)data % PAGE_SIZE;

	return PAGE_SIZE - offset_in_pg;
}

E
Eric Van Hensbergen 已提交
102 103
/**
 * p9_virtio_close - reclaim resources of a channel
A
Abhishek Kulkarni 已提交
104
 * @client: client instance
E
Eric Van Hensbergen 已提交
105 106 107 108 109 110
 *
 * This reclaims a channel by freeing its resources and
 * reseting its inuse flag.
 *
 */

111
static void p9_virtio_close(struct p9_client *client)
112
{
113
	struct virtio_chan *chan = client->trans;
E
Eric Van Hensbergen 已提交
114

115
	mutex_lock(&virtio_9p_lock);
116 117
	if (chan)
		chan->inuse = false;
118
	mutex_unlock(&virtio_9p_lock);
E
Eric Van Hensbergen 已提交
119 120
}

E
Eric Van Hensbergen 已提交
121 122 123 124 125 126 127 128 129 130 131 132 133
/**
 * req_done - callback which signals activity from the server
 * @vq: virtio queue activity was received on
 *
 * This notifies us that the server has triggered some activity
 * on the virtio channel - most likely a response to request we
 * sent.  Figure out which requests now have responses and wake up
 * those threads.
 *
 * Bugs: could do with some additional sanity checking, but appears to work.
 *
 */

134
static void req_done(struct virtqueue *vq)
E
Eric Van Hensbergen 已提交
135
{
136 137 138 139
	struct virtio_chan *chan = vq->vdev->priv;
	struct p9_fcall *rc;
	unsigned int len;
	struct p9_req_t *req;
140
	unsigned long flags;
141

142 143
	P9_DPRINTK(P9_DEBUG_TRANS, ": request done\n");

144
	while (1) {
145 146 147
		spin_lock_irqsave(&chan->lock, flags);
		rc = virtqueue_get_buf(chan->vq, &len);

148
		if (rc == NULL) {
149
			spin_unlock_irqrestore(&chan->lock, flags);
150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166
			break;
		}

		chan->ring_bufs_avail = 1;
		spin_unlock_irqrestore(&chan->lock, flags);
		/* Wakeup if anyone waiting for VirtIO ring space. */
		wake_up(chan->vc_wq);
		P9_DPRINTK(P9_DEBUG_TRANS, ": rc %p\n", rc);
		P9_DPRINTK(P9_DEBUG_TRANS, ": lookup tag %d\n", rc->tag);
		req = p9_tag_lookup(chan->client, rc->tag);
		if (req->tc->private) {
			struct trans_rpage_info *rp = req->tc->private;
			/*Release pages */
			p9_release_req_pages(rp);
			if (rp->rp_alloc)
				kfree(rp);
			req->tc->private = NULL;
167
		}
168 169 170
		req->status = REQ_STATUS_RCVD;
		p9_client_cb(chan->client, req);
	}
171
}
E
Eric Van Hensbergen 已提交
172

E
Eric Van Hensbergen 已提交
173 174 175 176 177 178 179 180 181 182 183 184 185 186
/**
 * pack_sg_list - pack a scatter gather list from a linear buffer
 * @sg: scatter/gather list to pack into
 * @start: which segment of the sg_list to start at
 * @limit: maximum segment to pack data to
 * @data: data to pack into scatter/gather list
 * @count: amount of data to pack into the scatter/gather list
 *
 * sg_lists have multiple segments of various sizes.  This will pack
 * arbitrary data into an existing scatter gather list, segmenting the
 * data as necessary within constraints.
 *
 */

187 188 189 190 191 192 193 194 195 196 197 198 199 200
static int
pack_sg_list(struct scatterlist *sg, int start, int limit, char *data,
								int count)
{
	int s;
	int index = start;

	while (count) {
		s = rest_of_page(data);
		if (s > count)
			s = count;
		sg_set_buf(&sg[index++], data, s);
		count -= s;
		data += s;
J
Julia Lawall 已提交
201
		BUG_ON(index > limit);
202
	}
E
Eric Van Hensbergen 已提交
203

204
	return index-start;
E
Eric Van Hensbergen 已提交
205 206
}

207 208 209 210 211 212
/*
 * We don't currently allow canceling of virtio requests.
 * Both arguments are ignored and the function always returns 1.
 */
static int p9_virtio_cancel(struct p9_client *client, struct p9_req_t *req)
{
	return 1;
}

213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244
/**
 * pack_sg_list_p - Just like pack_sg_list. Instead of taking a buffer,
 * this takes a list of pages.
 * @sg: scatter/gather list to pack into
 * @start: which segment of the sg_list to start at
 * @limit: number of entries in @sg; valid indices are 0 .. @limit - 1
 * @pdata_off: Offset into the first page
 * @pdata: a list of pages to add into sg.
 * @count: amount of data to pack into the scatter/gather list
 *
 * Returns the number of segments used.  Running out of segments is
 * treated as a fatal bug.
 */
static int
pack_sg_list_p(struct scatterlist *sg, int start, int limit, size_t pdata_off,
		struct page **pdata, int count)
{
	int s;
	int i = 0;
	int index = start;

	/* A non-zero offset means the first page is only partially used. */
	if (pdata_off) {
		BUG_ON(index >= limit);
		s = min((int)(PAGE_SIZE - pdata_off), count);
		sg_set_page(&sg[index++], pdata[i++], s, pdata_off);
		count -= s;
	}

	while (count) {
		/* sg[limit] is past the end of the array: check before use. */
		BUG_ON(index >= limit);
		s = min((int)PAGE_SIZE, count);
		sg_set_page(&sg[index++], pdata[i++], s, 0);
		count -= s;
	}
	return index-start;
}

E
Eric Van Hensbergen 已提交
245
/**
246
 * p9_virtio_request - issue a request
A
Abhishek Kulkarni 已提交
247 248
 * @client: client instance issuing the request
 * @req: request to be issued
E
Eric Van Hensbergen 已提交
249 250 251
 *
 */

252
static int
253
p9_virtio_request(struct p9_client *client, struct p9_req_t *req)
E
Eric Van Hensbergen 已提交
254
{
255
	int in, out, inp, outp;
256 257
	struct virtio_chan *chan = client->trans;
	char *rdata = (char *)req->rc+sizeof(struct p9_fcall);
258
	unsigned long flags;
259 260 261
	size_t pdata_off = 0;
	struct trans_rpage_info *rpinfo = NULL;
	int err, pdata_len = 0;
E
Eric Van Hensbergen 已提交
262

263
	P9_DPRINTK(P9_DEBUG_TRANS, "9p debug: virtio request\n");
E
Eric Van Hensbergen 已提交
264

265
req_retry:
266 267
	req->status = REQ_STATUS_SENT;

268 269 270 271 272 273 274 275 276 277 278 279 280 281 282 283 284 285 286 287 288 289 290 291 292 293 294 295 296 297
	if (req->tc->pbuf_size && (req->tc->pubuf && P9_IS_USER_CONTEXT)) {
		int nr_pages = p9_nr_pages(req);
		int rpinfo_size = sizeof(struct trans_rpage_info) +
			sizeof(struct page *) * nr_pages;

		if (rpinfo_size <= (req->tc->capacity - req->tc->size)) {
			/* We can use sdata */
			req->tc->private = req->tc->sdata + req->tc->size;
			rpinfo = (struct trans_rpage_info *)req->tc->private;
			rpinfo->rp_alloc = 0;
		} else {
			req->tc->private = kmalloc(rpinfo_size, GFP_NOFS);
			if (!req->tc->private) {
				P9_DPRINTK(P9_DEBUG_TRANS, "9p debug: "
					"private kmalloc returned NULL");
				return -ENOMEM;
			}
			rpinfo = (struct trans_rpage_info *)req->tc->private;
			rpinfo->rp_alloc = 1;
		}

		err = p9_payload_gup(req, &pdata_off, &pdata_len, nr_pages,
				req->tc->id == P9_TREAD ? 1 : 0);
		if (err < 0) {
			if (rpinfo->rp_alloc)
				kfree(rpinfo);
			return err;
		}
	}

298
	spin_lock_irqsave(&chan->lock, flags);
299 300

	/* Handle out VirtIO ring buffers */
301
	out = pack_sg_list(chan->sg, 0, VIRTQUEUE_NUM, req->tc->sdata,
302 303 304 305 306 307 308 309 310 311 312 313 314 315 316 317 318 319 320 321 322 323 324 325 326 327 328 329 330 331 332 333 334 335 336 337 338 339 340 341 342 343 344 345
			req->tc->size);

	if (req->tc->pbuf_size && (req->tc->id == P9_TWRITE)) {
		/* We have additional write payload buffer to take care */
		if (req->tc->pubuf && P9_IS_USER_CONTEXT) {
			outp = pack_sg_list_p(chan->sg, out, VIRTQUEUE_NUM,
					pdata_off, rpinfo->rp_data, pdata_len);
		} else {
			char *pbuf = req->tc->pubuf ? req->tc->pubuf :
								req->tc->pkbuf;
			outp = pack_sg_list(chan->sg, out, VIRTQUEUE_NUM, pbuf,
					req->tc->pbuf_size);
		}
		out += outp;
	}

	/* Handle in VirtIO ring buffers */
	if (req->tc->pbuf_size &&
		((req->tc->id == P9_TREAD) || (req->tc->id == P9_TREADDIR))) {
		/*
		 * Take care of additional Read payload.
		 * 11 is the read/write header = PDU Header(7) + IO Size (4).
		 * Arrange in such a way that server places header in the
		 * alloced memory and payload onto the user buffer.
		 */
		inp = pack_sg_list(chan->sg, out, VIRTQUEUE_NUM, rdata, 11);
		/*
		 * Running executables in the filesystem may result in
		 * a read request with kernel buffer as opposed to user buffer.
		 */
		if (req->tc->pubuf && P9_IS_USER_CONTEXT) {
			in = pack_sg_list_p(chan->sg, out+inp, VIRTQUEUE_NUM,
					pdata_off, rpinfo->rp_data, pdata_len);
		} else {
			char *pbuf = req->tc->pubuf ? req->tc->pubuf :
								req->tc->pkbuf;
			in = pack_sg_list(chan->sg, out+inp, VIRTQUEUE_NUM,
					pbuf, req->tc->pbuf_size);
		}
		in += inp;
	} else {
		in = pack_sg_list(chan->sg, out, VIRTQUEUE_NUM, rdata,
				client->msize);
	}
E
Eric Van Hensbergen 已提交
346

347 348
	err = virtqueue_add_buf(chan->vq, chan->sg, out, in, req->tc);
	if (err < 0) {
349 350 351 352 353 354 355 356 357 358 359 360 361 362 363
		if (err == -ENOSPC) {
			chan->ring_bufs_avail = 0;
			spin_unlock_irqrestore(&chan->lock, flags);
			err = wait_event_interruptible(*chan->vc_wq,
							chan->ring_bufs_avail);
			if (err  == -ERESTARTSYS)
				return err;

			P9_DPRINTK(P9_DEBUG_TRANS, "9p:Retry virtio request\n");
			goto req_retry;
		} else {
			spin_unlock_irqrestore(&chan->lock, flags);
			P9_DPRINTK(P9_DEBUG_TRANS,
					"9p debug: "
					"virtio rpc add_buf returned failure");
364 365
			if (rpinfo && rpinfo->rp_alloc)
				kfree(rpinfo);
366 367
			return -EIO;
		}
368
	}
E
Eric Van Hensbergen 已提交
369

370
	virtqueue_kick(chan->vq);
371
	spin_unlock_irqrestore(&chan->lock, flags);
E
Eric Van Hensbergen 已提交
372

373
	P9_DPRINTK(P9_DEBUG_TRANS, "9p debug: virtio request kicked\n");
374
	return 0;
E
Eric Van Hensbergen 已提交
375 376
}

377 378 379 380 381 382 383 384 385 386 387 388 389 390
static ssize_t p9_mount_tag_show(struct device *dev,
				struct device_attribute *attr, char *buf)
{
	struct virtio_chan *chan;
	struct virtio_device *vdev;

	vdev = dev_to_virtio(dev);
	chan = vdev->priv;

	return snprintf(buf, chan->tag_len + 1, "%s", chan->tag);
}

static DEVICE_ATTR(mount_tag, 0444, p9_mount_tag_show, NULL);

E
Eric Van Hensbergen 已提交
391 392 393 394
/**
 * p9_virtio_probe - probe for existence of 9P virtio channels
 * @vdev: virtio device to probe
 *
395
 * This probes for existing virtio channels.
E
Eric Van Hensbergen 已提交
396 397 398
 *
 */

399
static int p9_virtio_probe(struct virtio_device *vdev)
E
Eric Van Hensbergen 已提交
400
{
401 402
	__u16 tag_len;
	char *tag;
E
Eric Van Hensbergen 已提交
403 404 405
	int err;
	struct virtio_chan *chan;

406 407 408
	chan = kmalloc(sizeof(struct virtio_chan), GFP_KERNEL);
	if (!chan) {
		printk(KERN_ERR "9p: Failed to allocate virtio 9P channel\n");
E
Eric Van Hensbergen 已提交
409 410 411 412
		err = -ENOMEM;
		goto fail;
	}

413
	chan->vdev = vdev;
E
Eric Van Hensbergen 已提交
414

415
	/* We expect one virtqueue, for requests. */
416
	chan->vq = virtio_find_single_vq(vdev, req_done, "requests");
417 418 419
	if (IS_ERR(chan->vq)) {
		err = PTR_ERR(chan->vq);
		goto out_free_vq;
E
Eric Van Hensbergen 已提交
420
	}
421 422
	chan->vq->vdev->priv = chan;
	spin_lock_init(&chan->lock);
E
Eric Van Hensbergen 已提交
423

424
	sg_init_table(chan->sg, VIRTQUEUE_NUM);
E
Eric Van Hensbergen 已提交
425 426

	chan->inuse = false;
427 428 429 430 431 432 433 434 435 436 437 438 439 440 441 442 443
	if (virtio_has_feature(vdev, VIRTIO_9P_MOUNT_TAG)) {
		vdev->config->get(vdev,
				offsetof(struct virtio_9p_config, tag_len),
				&tag_len, sizeof(tag_len));
	} else {
		err = -EINVAL;
		goto out_free_vq;
	}
	tag = kmalloc(tag_len, GFP_KERNEL);
	if (!tag) {
		err = -ENOMEM;
		goto out_free_vq;
	}
	vdev->config->get(vdev, offsetof(struct virtio_9p_config, tag),
			tag, tag_len);
	chan->tag = tag;
	chan->tag_len = tag_len;
444 445
	err = sysfs_create_file(&(vdev->dev.kobj), &dev_attr_mount_tag.attr);
	if (err) {
446
		goto out_free_tag;
447
	}
448 449 450 451 452 453 454 455
	chan->vc_wq = kmalloc(sizeof(wait_queue_head_t), GFP_KERNEL);
	if (!chan->vc_wq) {
		err = -ENOMEM;
		goto out_free_tag;
	}
	init_waitqueue_head(chan->vc_wq);
	chan->ring_bufs_avail = 1;

456 457 458
	mutex_lock(&virtio_9p_lock);
	list_add_tail(&chan->chan_list, &virtio_chan_list);
	mutex_unlock(&virtio_9p_lock);
E
Eric Van Hensbergen 已提交
459 460
	return 0;

461 462
out_free_tag:
	kfree(tag);
463
out_free_vq:
464
	vdev->config->del_vqs(vdev);
465
	kfree(chan);
E
Eric Van Hensbergen 已提交
466 467 468 469
fail:
	return err;
}

E
Eric Van Hensbergen 已提交
470 471 472

/**
 * p9_virtio_create - allocate a new virtio channel
473
 * @client: client instance invoking this transport
E
Eric Van Hensbergen 已提交
474 475 476 477
 * @devname: string identifying the channel to connect to (unused)
 * @args: args passed from sys_mount() for per-transport options (unused)
 *
 * This sets up a transport channel for 9p communication.  Right now
E
Eric Van Hensbergen 已提交
478 479 480
 * we only match the first available channel, but eventually we couldlook up
 * alternate channels by matching devname versus a virtio_config entry.
 * We use a simple reference count mechanism to ensure that only a single
E
Eric Van Hensbergen 已提交
481 482 483 484
 * mount has a channel open at a time.
 *
 */

485 486
static int
p9_virtio_create(struct p9_client *client, const char *devname, char *args)
E
Eric Van Hensbergen 已提交
487
{
488
	struct virtio_chan *chan;
489
	int ret = -ENOENT;
490
	int found = 0;
E
Eric Van Hensbergen 已提交
491

492
	mutex_lock(&virtio_9p_lock);
493
	list_for_each_entry(chan, &virtio_chan_list, chan_list) {
494 495
		if (!strncmp(devname, chan->tag, chan->tag_len) &&
		    strlen(devname) == chan->tag_len) {
496 497
			if (!chan->inuse) {
				chan->inuse = true;
498
				found = 1;
499 500
				break;
			}
501
			ret = -EBUSY;
E
Eric Van Hensbergen 已提交
502 503
		}
	}
504
	mutex_unlock(&virtio_9p_lock);
E
Eric Van Hensbergen 已提交
505

506
	if (!found) {
507
		printk(KERN_ERR "9p: no channels available\n");
508
		return ret;
509 510
	}

511
	client->trans = (void *)chan;
512
	client->status = Connected;
513
	chan->client = client;
E
Eric Van Hensbergen 已提交
514

515
	return 0;
E
Eric Van Hensbergen 已提交
516 517
}

E
Eric Van Hensbergen 已提交
518 519 520 521 522 523
/**
 * p9_virtio_remove - clean up resources associated with a virtio device
 * @vdev: virtio device to remove
 *
 */

524 525 526 527 528
static void p9_virtio_remove(struct virtio_device *vdev)
{
	struct virtio_chan *chan = vdev->priv;

	BUG_ON(chan->inuse);
529 530 531 532 533
	vdev->config->del_vqs(vdev);

	mutex_lock(&virtio_9p_lock);
	list_del(&chan->chan_list);
	mutex_unlock(&virtio_9p_lock);
534
	sysfs_remove_file(&(vdev->dev.kobj), &dev_attr_mount_tag.attr);
535
	kfree(chan->tag);
536
	kfree(chan->vc_wq);
537
	kfree(chan);
538 539 540

}

E
Eric Van Hensbergen 已提交
541 542 543 544 545
/*
 * Device ID table handed to the virtio core through p9_virtio_drv and
 * exported with MODULE_DEVICE_TABLE(): one entry built from VIRTIO_ID_9P and
 * VIRTIO_DEV_ANY_ID, followed by an all-zero entry (presumably the table
 * terminator - confirm against the virtio core).
 */
static struct virtio_device_id id_table[] = {
	{ VIRTIO_ID_9P, VIRTIO_DEV_ANY_ID },
	{ 0 },
};

546 547 548 549
/*
 * Feature table referenced by p9_virtio_drv.  p9_virtio_probe() refuses
 * devices that do not offer VIRTIO_9P_MOUNT_TAG.
 */
static unsigned int features[] = {
	VIRTIO_9P_MOUNT_TAG,
};

E
Eric Van Hensbergen 已提交
550 551
/* The standard "struct lguest_driver": */
static struct virtio_driver p9_virtio_drv = {
552 553 554 555 556 557 558
	.feature_table  = features,
	.feature_table_size = ARRAY_SIZE(features),
	.driver.name    = KBUILD_MODNAME,
	.driver.owner	= THIS_MODULE,
	.id_table	= id_table,
	.probe		= p9_virtio_probe,
	.remove		= p9_virtio_remove,
E
Eric Van Hensbergen 已提交
559 560 561 562 563
};

static struct p9_trans_module p9_virtio_trans = {
	.name = "virtio",
	.create = p9_virtio_create,
564
	.close = p9_virtio_close,
565 566
	.request = p9_virtio_request,
	.cancel = p9_virtio_cancel,
567
	.maxsize = PAGE_SIZE*16,
568
	.pref = P9_TRANS_PREF_PAYLOAD_SEP,
E
Eric Van Hensbergen 已提交
569
	.def = 0,
570
	.owner = THIS_MODULE,
E
Eric Van Hensbergen 已提交
571 572 573 574 575
};

/*
 * Module init: set up the channel list, register the 9p transport and then
 * the virtio driver.  If the driver cannot be registered the transport is
 * unregistered again so that a failed load leaves nothing behind.
 *
 * Returns 0 on success or the error from register_virtio_driver().
 */
static int __init p9_virtio_init(void)
{
	int rc;

	INIT_LIST_HEAD(&virtio_chan_list);

	v9fs_register_trans(&p9_virtio_trans);
	rc = register_virtio_driver(&p9_virtio_drv);
	if (rc)
		v9fs_unregister_trans(&p9_virtio_trans);

	return rc;
}

582 583 584
/*
 * Module exit: undo p9_virtio_init() in reverse order - the virtio driver
 * goes first, then the 9p transport.
 */
static void __exit p9_virtio_cleanup(void)
{
	unregister_virtio_driver(&p9_virtio_drv);

	v9fs_unregister_trans(&p9_virtio_trans);
}

E
Eric Van Hensbergen 已提交
588
/* p9_virtio_init() is the module's init entry point. */
module_init(p9_virtio_init);
589
/* p9_virtio_cleanup() is the module's exit entry point. */
module_exit(p9_virtio_cleanup);
E
Eric Van Hensbergen 已提交
590 591 592 593 594

/* Module metadata: exported virtio device table, author, description, license. */
MODULE_DEVICE_TABLE(virtio, id_table);
MODULE_AUTHOR("Eric Van Hensbergen <ericvh@gmail.com>");
MODULE_DESCRIPTION("Virtio 9p Transport");
MODULE_LICENSE("GPL");