/*
 * linux/drivers/char/raw.c
 *
 * Front-end raw character devices.  These can be bound to any block
 * devices to provide genuine Unix raw character device semantics.
 *
 * We reserve minor number 0 for a control interface.  ioctl()s on this
 * device are used to bind the other minor numbers to block devices.
 */

#include <linux/init.h>
#include <linux/fs.h>
#include <linux/major.h>
#include <linux/blkdev.h>
#include <linux/module.h>
#include <linux/raw.h>
#include <linux/capability.h>
#include <linux/uio.h>
#include <linux/cdev.h>
#include <linux/device.h>
#include <linux/mutex.h>
#include <linux/smp_lock.h>

#include <asm/uaccess.h>

/*
 * Per-minor state of one raw character device.
 */
struct raw_device_data {
	/* Block device this minor is bound to; NULL while unbound. */
	struct block_device *binding;
	/* Number of successful opens not yet released; rebinding is refused while non-zero. */
	int inuse;
};

31
static struct class *raw_class;
L
Linus Torvalds 已提交
32
static struct raw_device_data raw_devices[MAX_RAW_MINORS];
33
static DEFINE_MUTEX(raw_mutex);
34
static const struct file_operations raw_ctl_fops; /* forward declaration */
L
Linus Torvalds 已提交
35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56

/*
 * Open/close code for raw IO.
 *
 * We just rewrite the i_mapping for the /dev/raw/rawN file descriptor to
 * point at the blockdev's address_space and set the file handle to use
 * O_DIRECT.
 *
 * Set the device's soft blocksize to the minimum possible.  This gives the
 * finest possible alignment and has no adverse impact on performance.
 */
static int raw_open(struct inode *inode, struct file *filp)
{
	const int minor = iminor(inode);
	struct block_device *bdev;
	int err;

	if (minor == 0) {	/* It is the control device */
		filp->f_op = &raw_ctl_fops;
		return 0;
	}

J
Jonathan Corbet 已提交
57
	lock_kernel();
58
	mutex_lock(&raw_mutex);
L
Linus Torvalds 已提交
59 60 61 62 63 64 65 66 67

	/*
	 * All we need to do on open is check that the device is bound.
	 */
	bdev = raw_devices[minor].binding;
	err = -ENODEV;
	if (!bdev)
		goto out;
	igrab(bdev->bd_inode);
68
	err = blkdev_get(bdev, filp->f_mode);
L
Linus Torvalds 已提交
69 70 71 72 73
	if (err)
		goto out;
	err = bd_claim(bdev, raw_open);
	if (err)
		goto out1;
74
	err = set_blocksize(bdev, bdev_logical_block_size(bdev));
L
Linus Torvalds 已提交
75 76 77 78 79
	if (err)
		goto out2;
	filp->f_flags |= O_DIRECT;
	filp->f_mapping = bdev->bd_inode->i_mapping;
	if (++raw_devices[minor].inuse == 1)
80
		filp->f_path.dentry->d_inode->i_mapping =
L
Linus Torvalds 已提交
81 82
			bdev->bd_inode->i_mapping;
	filp->private_data = bdev;
83
	mutex_unlock(&raw_mutex);
J
Jonathan Corbet 已提交
84
	unlock_kernel();
L
Linus Torvalds 已提交
85 86 87 88 89
	return 0;

out2:
	bd_release(bdev);
out1:
A
Al Viro 已提交
90
	blkdev_put(bdev, filp->f_mode);
L
Linus Torvalds 已提交
91
out:
92
	mutex_unlock(&raw_mutex);
93
	unlock_kernel();
L
Linus Torvalds 已提交
94 95 96 97 98 99 100 101 102 103 104 105
	return err;
}

/*
 * When the final fd which refers to this character-special node is closed, we
 * make its ->mapping point back at its own i_data.
 */
static int raw_release(struct inode *inode, struct file *filp)
{
	const int minor= iminor(inode);
	struct block_device *bdev;

106
	mutex_lock(&raw_mutex);
L
Linus Torvalds 已提交
107 108 109 110 111 112
	bdev = raw_devices[minor].binding;
	if (--raw_devices[minor].inuse == 0) {
		/* Here  inode->i_mapping == bdev->bd_inode->i_mapping  */
		inode->i_mapping = &inode->i_data;
		inode->i_mapping->backing_dev_info = &default_backing_dev_info;
	}
113
	mutex_unlock(&raw_mutex);
L
Linus Torvalds 已提交
114 115

	bd_release(bdev);
A
Al Viro 已提交
116
	blkdev_put(bdev, filp->f_mode);
L
Linus Torvalds 已提交
117 118 119 120 121 122 123 124 125 126 127 128
	return 0;
}

/*
 * Forward ioctls to the underlying block device.
 *
 * The block device is the one stored in filp->private_data by raw_open().
 * The request is passed to blkdev_ioctl() with a mode argument of 0, and
 * its return value is returned unchanged.
 */
static int
raw_ioctl(struct inode *inode, struct file *filp,
		  unsigned int command, unsigned long arg)
{
	struct block_device *bdev = filp->private_data;

	return blkdev_ioctl(bdev, 0, command, arg);
}

static void bind_device(struct raw_config_request *rq)
{
134
	device_destroy(raw_class, MKDEV(RAW_MAJOR, rq->raw_minor));
135 136
	device_create(raw_class, NULL, MKDEV(RAW_MAJOR, rq->raw_minor), NULL,
		      "raw%d", rq->raw_minor);
L
Linus Torvalds 已提交
137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160
}

/*
 * Deal with ioctls against the raw-device control interface, to bind
 * and unbind other raw devices.
 */
static int raw_ctl_ioctl(struct inode *inode, struct file *filp,
			unsigned int command, unsigned long arg)
{
	struct raw_config_request rq;
	struct raw_device_data *rawdev;
	int err = 0;

	switch (command) {
	case RAW_SETBIND:
	case RAW_GETBIND:

		/* First, find out which raw minor we want */

		if (copy_from_user(&rq, (void __user *) arg, sizeof(rq))) {
			err = -EFAULT;
			goto out;
		}

161
		if (rq.raw_minor <= 0 || rq.raw_minor >= MAX_RAW_MINORS) {
L
Linus Torvalds 已提交
162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193
			err = -EINVAL;
			goto out;
		}
		rawdev = &raw_devices[rq.raw_minor];

		if (command == RAW_SETBIND) {
			dev_t dev;

			/*
			 * This is like making block devices, so demand the
			 * same capability
			 */
			if (!capable(CAP_SYS_ADMIN)) {
				err = -EPERM;
				goto out;
			}

			/*
			 * For now, we don't need to check that the underlying
			 * block device is present or not: we can do that when
			 * the raw device is opened.  Just check that the
			 * major/minor numbers make sense.
			 */

			dev = MKDEV(rq.block_major, rq.block_minor);
			if ((rq.block_major == 0 && rq.block_minor != 0) ||
					MAJOR(dev) != rq.block_major ||
					MINOR(dev) != rq.block_minor) {
				err = -EINVAL;
				goto out;
			}

194
			mutex_lock(&raw_mutex);
L
Linus Torvalds 已提交
195
			if (rawdev->inuse) {
196
				mutex_unlock(&raw_mutex);
L
Linus Torvalds 已提交
197 198 199 200 201 202 203 204 205 206
				err = -EBUSY;
				goto out;
			}
			if (rawdev->binding) {
				bdput(rawdev->binding);
				module_put(THIS_MODULE);
			}
			if (rq.block_major == 0 && rq.block_minor == 0) {
				/* unbind */
				rawdev->binding = NULL;
207
				device_destroy(raw_class,
208
						MKDEV(RAW_MAJOR, rq.raw_minor));
L
Linus Torvalds 已提交
209 210 211 212 213 214 215 216 217
			} else {
				rawdev->binding = bdget(dev);
				if (rawdev->binding == NULL)
					err = -ENOMEM;
				else {
					__module_get(THIS_MODULE);
					bind_device(&rq);
				}
			}
218
			mutex_unlock(&raw_mutex);
L
Linus Torvalds 已提交
219 220 221
		} else {
			struct block_device *bdev;

222
			mutex_lock(&raw_mutex);
L
Linus Torvalds 已提交
223 224 225 226 227 228 229
			bdev = rawdev->binding;
			if (bdev) {
				rq.block_major = MAJOR(bdev->bd_dev);
				rq.block_minor = MINOR(bdev->bd_dev);
			} else {
				rq.block_major = rq.block_minor = 0;
			}
230
			mutex_unlock(&raw_mutex);
L
Linus Torvalds 已提交
231 232 233 234 235 236 237 238 239 240 241 242 243 244
			if (copy_to_user((void __user *)arg, &rq, sizeof(rq))) {
				err = -EFAULT;
				goto out;
			}
		}
		break;
	default:
		err = -EINVAL;
		break;
	}
out:
	return err;
}

245
static const struct file_operations raw_fops = {
246
	.read	=	do_sync_read,
L
Linus Torvalds 已提交
247
	.aio_read = 	generic_file_aio_read,
248
	.write	=	do_sync_write,
249
	.aio_write =	blkdev_aio_write,
L
Linus Torvalds 已提交
250 251 252 253 254 255
	.open	=	raw_open,
	.release=	raw_release,
	.ioctl	=	raw_ioctl,
	.owner	=	THIS_MODULE,
};

256
static const struct file_operations raw_ctl_fops = {
L
Linus Torvalds 已提交
257 258 259 260 261
	.ioctl	=	raw_ctl_ioctl,
	.open	=	raw_open,
	.owner	=	THIS_MODULE,
};

262
static struct cdev raw_cdev;
L
Linus Torvalds 已提交
263

264 265 266 267 268
static char *raw_nodename(struct device *dev)
{
	return kasprintf(GFP_KERNEL, "raw/%s", dev_name(dev));
}

L
Linus Torvalds 已提交
269 270 271
static int __init raw_init(void)
{
	dev_t dev = MKDEV(RAW_MAJOR, 0);
272
	int ret;
L
Linus Torvalds 已提交
273

274 275
	ret = register_chrdev_region(dev, MAX_RAW_MINORS, "raw");
	if (ret)
L
Linus Torvalds 已提交
276 277 278
		goto error;

	cdev_init(&raw_cdev, &raw_fops);
279 280
	ret = cdev_add(&raw_cdev, dev, MAX_RAW_MINORS);
	if (ret) {
L
Linus Torvalds 已提交
281
		kobject_put(&raw_cdev.kobj);
282
		goto error_region;
L
Linus Torvalds 已提交
283 284
	}

285
	raw_class = class_create(THIS_MODULE, "raw");
L
Linus Torvalds 已提交
286 287 288
	if (IS_ERR(raw_class)) {
		printk(KERN_ERR "Error creating raw class.\n");
		cdev_del(&raw_cdev);
289 290
		ret = PTR_ERR(raw_class);
		goto error_region;
L
Linus Torvalds 已提交
291
	}
292
	raw_class->nodename = raw_nodename;
293
	device_create(raw_class, NULL, MKDEV(RAW_MAJOR, 0), NULL, "rawctl");
L
Linus Torvalds 已提交
294 295 296

	return 0;

297 298
error_region:
	unregister_chrdev_region(dev, MAX_RAW_MINORS);
L
Linus Torvalds 已提交
299
error:
300
	return ret;
L
Linus Torvalds 已提交
301 302 303 304
}

/*
 * Module unload: remove the control device, destroy the class, delete the
 * cdev and give the character device region back.
 */
static void __exit raw_exit(void)
{
	device_destroy(raw_class, MKDEV(RAW_MAJOR, 0));
	class_destroy(raw_class);
	cdev_del(&raw_cdev);
	unregister_chrdev_region(MKDEV(RAW_MAJOR, 0), MAX_RAW_MINORS);
}

/* Register raw_init/raw_exit as the module entry points and declare the license. */
module_init(raw_init);
module_exit(raw_exit);
MODULE_LICENSE("GPL");