core.c 26.5 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
/*
 * Copyright (C) 2015 IT University of Copenhagen. All rights reserved.
 * Initial release: Matias Bjorling <m@bjorling.me>
 *
 * This program is free software; you can redistribute it and/or
 * modify it under the terms of the GNU General Public License version
 * 2 as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful, but
 * WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program; see the file COPYING.  If not, write to
 * the Free Software Foundation, 675 Mass Ave, Cambridge, MA 02139,
 * USA.
 *
 */

#include <linux/list.h>
#include <linux/types.h>
#include <linux/sem.h>
#include <linux/bitmap.h>
25
#include <linux/module.h>
26
#include <linux/moduleparam.h>
27 28
#include <linux/miscdevice.h>
#include <linux/lightnvm.h>
29
#include <linux/sched/sysctl.h>
30

31
/* Registered target types; walked and modified under nvm_tgtt_lock. */
static LIST_HEAD(nvm_tgt_types);
static DECLARE_RWSEM(nvm_tgtt_lock);

/* Registered devices; the list is protected by nvm_lock. */
static LIST_HEAD(nvm_devices);
static DECLARE_RWSEM(nvm_lock);

36 37 38
/*
 * Map between virtual and physical channel and lun.
 *
 * One instance describes a single channel: the channel offset plus one
 * lun offset per lun of that channel.
 */
struct nvm_ch_map {
	int ch_off;	/* added to a target channel to get the device channel */
	int num_lun;	/* number of entries in lun_offs */
	int *lun_offs;	/* per-lun offset added to a target lun index */
};

/* Collection of per-channel maps describing a target or a whole device. */
struct nvm_dev_map {
	struct nvm_ch_map *chnls;	/* array of num_ch channel maps */
	int num_ch;			/* number of entries in chnls */
};

static struct nvm_target *nvm_find_target(struct nvm_dev *dev, const char *name)
{
	struct nvm_target *tgt;

	list_for_each_entry(tgt, &dev->targets, list)
		if (!strcmp(name, tgt->disk->disk_name))
			return tgt;

	return NULL;
}

59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82
/*
 * Tell whether any registered device already has a target named @name.
 *
 * Holds nvm_lock for the device walk and each device's mlock while its
 * target list is inspected.
 */
static bool nvm_target_exists(const char *name)
{
	struct nvm_dev *dev;
	struct nvm_target *tgt;
	bool found = false;

	down_write(&nvm_lock);
	list_for_each_entry(dev, &nvm_devices, devices) {
		mutex_lock(&dev->mlock);
		list_for_each_entry(tgt, &dev->targets, list) {
			if (strcmp(name, tgt->disk->disk_name) == 0) {
				found = true;
				break;
			}
		}
		mutex_unlock(&dev->mlock);

		if (found)
			break;
	}
	up_write(&nvm_lock);

	return found;
}

83 84 85 86 87 88 89 90 91 92 93 94 95
/*
 * Mark luns lun_begin..lun_end (inclusive) as allocated in dev->lun_map.
 *
 * Returns 0 on success. If a lun in the range is already set, the bits
 * taken by this call are cleared again and -EBUSY is returned.
 */
static int nvm_reserve_luns(struct nvm_dev *dev, int lun_begin, int lun_end)
{
	int lun;

	for (lun = lun_begin; lun <= lun_end; lun++) {
		if (!test_and_set_bit(lun, dev->lun_map))
			continue;

		pr_err("nvm: lun %d already allocated\n", lun);

		/* roll back only the bits set before the conflict */
		for (lun--; lun >= lun_begin; lun--)
			clear_bit(lun, dev->lun_map);

		return -EBUSY;
	}

	return 0;
}

/*
 * Clear the reservation bits of luns lun_begin..lun_end (inclusive) in
 * dev->lun_map, warning for every lun that was not marked as reserved.
 */
static void nvm_release_luns_err(struct nvm_dev *dev, int lun_begin,
				 int lun_end)
{
	int lun = lun_begin;

	while (lun <= lun_end) {
		WARN_ON(!test_and_clear_bit(lun, dev->lun_map));
		lun++;
	}
}

111
static void nvm_remove_tgt_dev(struct nvm_tgt_dev *tgt_dev, int clear)
112 113 114 115 116
{
	struct nvm_dev *dev = tgt_dev->parent;
	struct nvm_dev_map *dev_map = tgt_dev->map;
	int i, j;

117
	for (i = 0; i < dev_map->num_ch; i++) {
118 119 120 121
		struct nvm_ch_map *ch_map = &dev_map->chnls[i];
		int *lun_offs = ch_map->lun_offs;
		int ch = i + ch_map->ch_off;

122
		if (clear) {
123
			for (j = 0; j < ch_map->num_lun; j++) {
124
				int lun = j + lun_offs[j];
125
				int lunid = (ch * dev->geo.num_lun) + lun;
126

127 128 129
				WARN_ON(!test_and_clear_bit(lunid,
							dev->lun_map));
			}
130 131 132 133 134 135 136 137 138 139 140 141 142
		}

		kfree(ch_map->lun_offs);
	}

	kfree(dev_map->chnls);
	kfree(dev_map);

	kfree(tgt_dev->luns);
	kfree(tgt_dev);
}

/*
 * Build the target-side view of luns lun_begin..lun_end of @dev.
 *
 * Allocates the channel/lun offset map used to translate target addresses
 * into device addresses, records the same offsets in the device reverse
 * map (dev->rmap), and creates a struct nvm_tgt_dev whose geometry is
 * copied from the parent and then narrowed to the requested luns. @op is
 * stored in the target geometry.
 *
 * Returns the new target device, or NULL if an allocation fails; memory
 * allocated up to that point is released.
 */
static struct nvm_tgt_dev *nvm_create_tgt_dev(struct nvm_dev *dev,
					      u16 lun_begin, u16 lun_end,
					      u16 op)
{
	struct nvm_tgt_dev *tgt_dev = NULL;
	struct nvm_dev_map *dev_rmap = dev->rmap;
	struct nvm_dev_map *dev_map;
	struct ppa_addr *luns;
	int num_lun = lun_end - lun_begin + 1;
	int luns_left = num_lun;
	int num_ch = num_lun / dev->geo.num_lun;
	int num_ch_mod = num_lun % dev->geo.num_lun;
	int bch = lun_begin / dev->geo.num_lun;
	int blun = lun_begin % dev->geo.num_lun;
	int lunid = 0;
	int lun_balanced = 1;
	int sec_per_lun, prev_num_lun;
	int i, j;

	/* a partially used trailing channel still needs a map entry */
	if (num_ch_mod != 0)
		num_ch++;

	dev_map = kmalloc(sizeof(*dev_map), GFP_KERNEL);
	if (!dev_map)
		goto err_dev;

	dev_map->chnls = kcalloc(num_ch, sizeof(*dev_map->chnls), GFP_KERNEL);
	if (!dev_map->chnls)
		goto err_chnls;

	luns = kcalloc(num_lun, sizeof(*luns), GFP_KERNEL);
	if (!luns)
		goto err_luns;

	/* lun count of the first channel, used to detect unbalanced layouts */
	prev_num_lun = luns_left;
	if (luns_left > dev->geo.num_lun)
		prev_num_lun = dev->geo.num_lun;

	for (i = 0; i < num_ch; i++) {
		struct nvm_ch_map *ch_rmap = &dev_rmap->chnls[i + bch];
		struct nvm_ch_map *ch_map = &dev_map->chnls[i];
		int *lun_roffs = ch_rmap->lun_offs;
		int *lun_offs;
		int luns_in_chnl = luns_left;

		if (luns_left > dev->geo.num_lun)
			luns_in_chnl = dev->geo.num_lun;

		if (prev_num_lun != luns_in_chnl)
			lun_balanced = 0;

		ch_rmap->ch_off = bch;
		ch_map->ch_off = bch;
		ch_map->num_lun = luns_in_chnl;

		lun_offs = kcalloc(luns_in_chnl, sizeof(int), GFP_KERNEL);
		if (!lun_offs)
			goto err_ch;

		for (j = 0; j < luns_in_chnl; j++) {
			luns[lunid].ppa = 0;
			luns[lunid].a.ch = i;
			luns[lunid].a.lun = j;
			lunid++;

			lun_offs[j] = blun;
			lun_roffs[j + blun] = blun;
		}

		ch_map->lun_offs = lun_offs;

		/* when starting a new channel, lun offset is reset */
		blun = 0;
		luns_left -= luns_in_chnl;
	}

	dev_map->num_ch = num_ch;

	tgt_dev = kmalloc(sizeof(*tgt_dev), GFP_KERNEL);
	if (!tgt_dev)
		goto err_ch;

	/* Inherit device geometry from parent */
	memcpy(&tgt_dev->geo, &dev->geo, sizeof(struct nvm_geo));

	/* Target device only owns a portion of the physical device */
	tgt_dev->geo.num_ch = num_ch;
	tgt_dev->geo.num_lun = (lun_balanced) ? prev_num_lun : -1;
	tgt_dev->geo.all_luns = num_lun;
	tgt_dev->geo.all_chunks = num_lun * dev->geo.num_chk;

	tgt_dev->geo.op = op;

	sec_per_lun = dev->geo.clba * dev->geo.num_chk;
	tgt_dev->geo.total_secs = num_lun * sec_per_lun;

	tgt_dev->q = dev->q;
	tgt_dev->map = dev_map;
	tgt_dev->luns = luns;
	tgt_dev->parent = dev;

	return tgt_dev;

err_ch:
	/* i is the number of channels whose lun_offs were stored */
	while (--i >= 0)
		kfree(dev_map->chnls[i].lun_offs);
	kfree(luns);
err_luns:
	kfree(dev_map->chnls);
err_chnls:
	kfree(dev_map);
err_dev:
	return tgt_dev;
}

/*
 * Block device operations installed on every target gendisk created by
 * nvm_create_tgt(); only the owning module is set.
 */
static const struct block_device_operations nvm_fops = {
	.owner		= THIS_MODULE,
};

253
static struct nvm_tgt_type *__nvm_find_target_type(const char *name)
254
{
255
	struct nvm_tgt_type *tt;
256

257 258 259
	list_for_each_entry(tt, &nvm_tgt_types, list)
		if (!strcmp(name, tt->name))
			return tt;
260

261 262 263 264 265 266 267 268 269 270
	return NULL;
}

/*
 * Locked wrapper around __nvm_find_target_type(): performs the lookup
 * with nvm_tgtt_lock held and returns the match, or NULL.
 */
static struct nvm_tgt_type *nvm_find_target_type(const char *name)
{
	struct nvm_tgt_type *found;

	down_write(&nvm_tgtt_lock);
	found = __nvm_find_target_type(name);
	up_write(&nvm_tgtt_lock);

	return found;
}

275 276 277 278 279 280 281 282 283 284 285 286 287 288 289 290 291 292 293 294 295 296 297 298 299 300 301 302 303 304 305 306 307 308
/*
 * Validate a requested lun range against the device geometry.
 *
 * The range is inclusive and must satisfy
 * 0 <= lun_begin <= lun_end < geo->all_luns.
 *
 * Returns 0 when the range is valid, -EINVAL otherwise.
 */
static int nvm_config_check_luns(struct nvm_geo *geo, int lun_begin,
				 int lun_end)
{
	/*
	 * A negative lun_begin must be rejected explicitly: it would pass
	 * the two other comparisons and later be used as a bit index into
	 * the lun bitmap by nvm_reserve_luns().
	 */
	if (lun_begin < 0 || lun_begin > lun_end ||
	    lun_end >= geo->all_luns) {
		pr_err("nvm: lun out of bound (%u:%u > %u)\n",
			lun_begin, lun_end, geo->all_luns - 1);
		return -EINVAL;
	}

	return 0;
}

static int __nvm_config_simple(struct nvm_dev *dev,
			       struct nvm_ioctl_create_simple *s)
{
	struct nvm_geo *geo = &dev->geo;

	if (s->lun_begin == -1 && s->lun_end == -1) {
		s->lun_begin = 0;
		s->lun_end = geo->all_luns - 1;
	}

	return nvm_config_check_luns(geo, s->lun_begin, s->lun_end);
}

static int __nvm_config_extended(struct nvm_dev *dev,
				 struct nvm_ioctl_create_extended *e)
{
	if (e->lun_begin == 0xFFFF && e->lun_end == 0xFFFF) {
		e->lun_begin = 0;
		e->lun_end = dev->geo.all_luns - 1;
	}

	/* op not set falls into target's default */
309
	if (e->op == 0xFFFF) {
310
		e->op = NVM_TARGET_DEFAULT_OP;
311
	} else if (e->op < NVM_TARGET_MIN_OP || e->op > NVM_TARGET_MAX_OP) {
312 313 314 315
		pr_err("nvm: invalid over provisioning value\n");
		return -EINVAL;
	}

316
	return nvm_config_check_luns(&dev->geo, e->lun_begin, e->lun_end);
317 318
}

319 320
static int nvm_create_tgt(struct nvm_dev *dev, struct nvm_ioctl_create *create)
{
321
	struct nvm_ioctl_create_extended e;
322 323 324 325 326 327
	struct request_queue *tqueue;
	struct gendisk *tdisk;
	struct nvm_tgt_type *tt;
	struct nvm_target *t;
	struct nvm_tgt_dev *tgt_dev;
	void *targetdata;
328
	int ret;
329

330 331 332 333 334 335 336 337 338 339 340 341 342 343 344 345 346 347 348 349 350 351
	switch (create->conf.type) {
	case NVM_CONFIG_TYPE_SIMPLE:
		ret = __nvm_config_simple(dev, &create->conf.s);
		if (ret)
			return ret;

		e.lun_begin = create->conf.s.lun_begin;
		e.lun_end = create->conf.s.lun_end;
		e.op = NVM_TARGET_DEFAULT_OP;
		break;
	case NVM_CONFIG_TYPE_EXTENDED:
		ret = __nvm_config_extended(dev, &create->conf.e);
		if (ret)
			return ret;

		e = create->conf.e;
		break;
	default:
		pr_err("nvm: config type not valid\n");
		return -EINVAL;
	}

352
	tt = nvm_find_target_type(create->tgttype);
353 354 355 356 357
	if (!tt) {
		pr_err("nvm: target type %s not found\n", create->tgttype);
		return -EINVAL;
	}

358 359 360 361 362
	if ((tt->flags & NVM_TGT_F_HOST_L2P) != (dev->geo.dom & NVM_RSP_L2P)) {
		pr_err("nvm: device is incompatible with target L2P type.\n");
		return -EINVAL;
	}

363 364 365
	if (nvm_target_exists(create->tgtname)) {
		pr_err("nvm: target name already exists (%s)\n",
							create->tgtname);
366 367 368
		return -EINVAL;
	}

369
	ret = nvm_reserve_luns(dev, e.lun_begin, e.lun_end);
370 371
	if (ret)
		return ret;
372 373

	t = kmalloc(sizeof(struct nvm_target), GFP_KERNEL);
374 375
	if (!t) {
		ret = -ENOMEM;
376
		goto err_reserve;
377
	}
378

379
	tgt_dev = nvm_create_tgt_dev(dev, e.lun_begin, e.lun_end, e.op);
380 381
	if (!tgt_dev) {
		pr_err("nvm: could not create target device\n");
382
		ret = -ENOMEM;
383 384 385
		goto err_t;
	}

386
	tdisk = alloc_disk(0);
387 388
	if (!tdisk) {
		ret = -ENOMEM;
389
		goto err_dev;
390
	}
391

392
	tqueue = blk_alloc_queue_node(GFP_KERNEL, dev->q->node, NULL);
393 394
	if (!tqueue) {
		ret = -ENOMEM;
395
		goto err_disk;
396
	}
397 398
	blk_queue_make_request(tqueue, tt->make_rq);

399
	strlcpy(tdisk->disk_name, create->tgtname, sizeof(tdisk->disk_name));
400 401 402 403 404 405
	tdisk->flags = GENHD_FL_EXT_DEVT;
	tdisk->major = 0;
	tdisk->first_minor = 0;
	tdisk->fops = &nvm_fops;
	tdisk->queue = tqueue;

406
	targetdata = tt->init(tgt_dev, tdisk, create->flags);
407 408
	if (IS_ERR(targetdata)) {
		ret = PTR_ERR(targetdata);
409
		goto err_init;
410
	}
411 412 413 414

	tdisk->private_data = targetdata;
	tqueue->queuedata = targetdata;

415
	blk_queue_max_hw_sectors(tqueue,
416
			(dev->geo.csecs >> 9) * NVM_MAX_VLBA);
417 418 419 420

	set_capacity(tdisk, tt->capacity(targetdata));
	add_disk(tdisk);

421 422
	if (tt->sysfs_init && tt->sysfs_init(tdisk)) {
		ret = -ENOMEM;
423
		goto err_sysfs;
424
	}
425

426 427 428 429 430 431 432 433
	t->type = tt;
	t->disk = tdisk;
	t->dev = tgt_dev;

	mutex_lock(&dev->mlock);
	list_add_tail(&t->list, &dev->targets);
	mutex_unlock(&dev->mlock);

434 435
	__module_get(tt->owner);

436
	return 0;
437 438
err_sysfs:
	if (tt->exit)
439
		tt->exit(targetdata, true);
440 441
err_init:
	blk_cleanup_queue(tqueue);
442
	tdisk->queue = NULL;
443 444
err_disk:
	put_disk(tdisk);
445
err_dev:
446
	nvm_remove_tgt_dev(tgt_dev, 0);
447 448 449
err_t:
	kfree(t);
err_reserve:
450
	nvm_release_luns_err(dev, e.lun_begin, e.lun_end);
451
	return ret;
452 453
}

454
/*
 * Tear down target @t and free it.
 *
 * Removes the gendisk and its queue, runs the type's optional sysfs_exit
 * and exit hooks (@graceful is forwarded to exit), releases the target
 * device including its lun reservations, drops the disk and module
 * references, and unlinks @t from its list. Takes no lock itself; the
 * callers in this file hold the device's mlock.
 */
static void __nvm_remove_target(struct nvm_target *t, bool graceful)
{
	struct nvm_tgt_type *type = t->type;
	struct gendisk *disk = t->disk;
	struct request_queue *queue = disk->queue;

	del_gendisk(disk);
	blk_cleanup_queue(queue);

	if (type->sysfs_exit)
		type->sysfs_exit(disk);

	if (type->exit)
		type->exit(disk->private_data, graceful);

	nvm_remove_tgt_dev(t->dev, 1);
	put_disk(disk);
	module_put(type->owner);

	list_del(&t->list);
	kfree(t);
}

/**
 * nvm_remove_tgt - Removes a target from the media manager
 * @dev:	device
 * @remove:	ioctl structure with target name to remove.
 *
 * Returns:
 * 0: on success
 * 1: on not found
 * <0: on error
 */
static int nvm_remove_tgt(struct nvm_dev *dev, struct nvm_ioctl_remove *remove)
{
	struct nvm_target *t;

	mutex_lock(&dev->mlock);
	t = nvm_find_target(dev, remove->tgtname);
	if (!t) {
		mutex_unlock(&dev->mlock);
		return 1;
	}
497
	__nvm_remove_target(t, true);
498 499 500 501 502 503 504 505 506 507 508 509 510 511
	mutex_unlock(&dev->mlock);

	return 0;
}

static int nvm_register_map(struct nvm_dev *dev)
{
	struct nvm_dev_map *rmap;
	int i, j;

	rmap = kmalloc(sizeof(struct nvm_dev_map), GFP_KERNEL);
	if (!rmap)
		goto err_rmap;

512
	rmap->chnls = kcalloc(dev->geo.num_ch, sizeof(struct nvm_ch_map),
513 514 515 516
								GFP_KERNEL);
	if (!rmap->chnls)
		goto err_chnls;

517
	for (i = 0; i < dev->geo.num_ch; i++) {
518 519
		struct nvm_ch_map *ch_rmap;
		int *lun_roffs;
520
		int luns_in_chnl = dev->geo.num_lun;
521 522 523 524

		ch_rmap = &rmap->chnls[i];

		ch_rmap->ch_off = -1;
525
		ch_rmap->num_lun = luns_in_chnl;
526 527 528 529 530 531 532 533 534 535 536 537 538 539 540 541 542 543 544 545 546 547 548

		lun_roffs = kcalloc(luns_in_chnl, sizeof(int), GFP_KERNEL);
		if (!lun_roffs)
			goto err_ch;

		for (j = 0; j < luns_in_chnl; j++)
			lun_roffs[j] = -1;

		ch_rmap->lun_offs = lun_roffs;
	}

	dev->rmap = rmap;

	return 0;
err_ch:
	while (--i >= 0)
		kfree(rmap->chnls[i].lun_offs);
err_chnls:
	kfree(rmap);
err_rmap:
	return -ENOMEM;
}

549 550 551 552 553
/*
 * Free the device reverse map: the lun offset array of each of the
 * dev->geo.num_ch channels, the channel array, and the map itself.
 */
static void nvm_unregister_map(struct nvm_dev *dev)
{
	struct nvm_dev_map *rmap = dev->rmap;
	int ch = 0;

	while (ch < dev->geo.num_ch) {
		kfree(rmap->chnls[ch].lun_offs);
		ch++;
	}

	kfree(rmap->chnls);
	kfree(rmap);
}

561
static void nvm_map_to_dev(struct nvm_tgt_dev *tgt_dev, struct ppa_addr *p)
562 563
{
	struct nvm_dev_map *dev_map = tgt_dev->map;
564 565
	struct nvm_ch_map *ch_map = &dev_map->chnls[p->a.ch];
	int lun_off = ch_map->lun_offs[p->a.lun];
566

567 568
	p->a.ch += ch_map->ch_off;
	p->a.lun += lun_off;
569 570
}

571
static void nvm_map_to_tgt(struct nvm_tgt_dev *tgt_dev, struct ppa_addr *p)
572 573 574
{
	struct nvm_dev *dev = tgt_dev->parent;
	struct nvm_dev_map *dev_rmap = dev->rmap;
575 576
	struct nvm_ch_map *ch_rmap = &dev_rmap->chnls[p->a.ch];
	int lun_roff = ch_rmap->lun_offs[p->a.lun];
577

578 579
	p->a.ch -= ch_rmap->ch_off;
	p->a.lun -= lun_roff;
580 581
}

582 583
static void nvm_ppa_tgt_to_dev(struct nvm_tgt_dev *tgt_dev,
				struct ppa_addr *ppa_list, int nr_ppas)
584 585 586
{
	int i;

587 588
	for (i = 0; i < nr_ppas; i++) {
		nvm_map_to_dev(tgt_dev, &ppa_list[i]);
589
		ppa_list[i] = generic_to_dev_addr(tgt_dev->parent, ppa_list[i]);
590
	}
591
}
592

593 594 595 596 597 598
static void nvm_ppa_dev_to_tgt(struct nvm_tgt_dev *tgt_dev,
				struct ppa_addr *ppa_list, int nr_ppas)
{
	int i;

	for (i = 0; i < nr_ppas; i++) {
599
		ppa_list[i] = dev_to_generic_addr(tgt_dev->parent, ppa_list[i]);
600
		nvm_map_to_tgt(tgt_dev, &ppa_list[i]);
601 602 603
	}
}

604
static void nvm_rq_tgt_to_dev(struct nvm_tgt_dev *tgt_dev, struct nvm_rq *rqd)
605
{
606 607 608 609
	if (rqd->nr_ppas == 1) {
		nvm_ppa_tgt_to_dev(tgt_dev, &rqd->ppa_addr, 1);
		return;
	}
610

611 612 613 614 615 616 617 618 619
	nvm_ppa_tgt_to_dev(tgt_dev, rqd->ppa_list, rqd->nr_ppas);
}

/*
 * Convert every address of request @rqd from device back to target
 * format. A request with exactly one address keeps it in rqd->ppa_addr;
 * all other requests use rqd->ppa_list.
 */
static void nvm_rq_dev_to_tgt(struct nvm_tgt_dev *tgt_dev, struct nvm_rq *rqd)
{
	struct ppa_addr *ppas;

	if (rqd->nr_ppas == 1)
		ppas = &rqd->ppa_addr;
	else
		ppas = rqd->ppa_list;

	nvm_ppa_dev_to_tgt(tgt_dev, ppas, rqd->nr_ppas);
}

624
int nvm_register_tgt_type(struct nvm_tgt_type *tt)
625 626 627
{
	int ret = 0;

628
	down_write(&nvm_tgtt_lock);
629
	if (__nvm_find_target_type(tt->name))
630 631
		ret = -EEXIST;
	else
632
		list_add(&tt->list, &nvm_tgt_types);
633
	up_write(&nvm_tgtt_lock);
634 635 636

	return ret;
}
637
EXPORT_SYMBOL(nvm_register_tgt_type);
638

639
void nvm_unregister_tgt_type(struct nvm_tgt_type *tt)
640 641 642 643
{
	if (!tt)
		return;

644
	down_write(&nvm_tgtt_lock);
645
	list_del(&tt->list);
646
	up_write(&nvm_tgtt_lock);
647
}
648
EXPORT_SYMBOL(nvm_unregister_tgt_type);
649 650 651 652

/*
 * Allocate from the device's DMA pool through the driver's
 * dev_dma_alloc operation. Returns whatever that operation returns; the
 * DMA handle is passed through @dma_handler.
 */
void *nvm_dev_dma_alloc(struct nvm_dev *dev, gfp_t mem_flags,
							dma_addr_t *dma_handler)
{
	void *buf;

	buf = dev->ops->dev_dma_alloc(dev, dev->dma_pool, mem_flags,
								dma_handler);
	return buf;
}
EXPORT_SYMBOL(nvm_dev_dma_alloc);

658
/*
 * Hand @addr / @dma_handler back to the device's DMA pool through the
 * driver's dev_dma_free operation.
 */
void nvm_dev_dma_free(struct nvm_dev *dev, void *addr, dma_addr_t dma_handler)
{
	void *pool = dev->dma_pool;

	dev->ops->dev_dma_free(pool, addr, dma_handler);
}
EXPORT_SYMBOL(nvm_dev_dma_free);

static struct nvm_dev *nvm_find_nvm_dev(const char *name)
{
	struct nvm_dev *dev;

	list_for_each_entry(dev, &nvm_devices, devices)
		if (!strcmp(name, dev->name))
			return dev;

	return NULL;
}

675 676 677 678 679 680 681 682
static int nvm_set_rqd_ppalist(struct nvm_tgt_dev *tgt_dev, struct nvm_rq *rqd,
			const struct ppa_addr *ppas, int nr_ppas)
{
	struct nvm_dev *dev = tgt_dev->parent;
	struct nvm_geo *geo = &tgt_dev->geo;
	int i, plane_cnt, pl_idx;
	struct ppa_addr ppa;

683
	if (geo->pln_mode == NVM_PLANE_SINGLE && nr_ppas == 1) {
684 685 686 687 688 689 690 691 692 693 694 695 696
		rqd->nr_ppas = nr_ppas;
		rqd->ppa_addr = ppas[0];

		return 0;
	}

	rqd->nr_ppas = nr_ppas;
	rqd->ppa_list = nvm_dev_dma_alloc(dev, GFP_KERNEL, &rqd->dma_ppa_list);
	if (!rqd->ppa_list) {
		pr_err("nvm: failed to allocate dma memory\n");
		return -ENOMEM;
	}

697
	plane_cnt = geo->pln_mode;
698 699 700 701 702 703 704 705 706 707 708 709 710 711 712 713 714 715 716 717 718 719
	rqd->nr_ppas *= plane_cnt;

	for (i = 0; i < nr_ppas; i++) {
		for (pl_idx = 0; pl_idx < plane_cnt; pl_idx++) {
			ppa = ppas[i];
			ppa.g.pl = pl_idx;
			rqd->ppa_list[(pl_idx * nr_ppas) + i] = ppa;
		}
	}

	return 0;
}

/*
 * Return the address list of @rqd, if it has one, to the parent device's
 * DMA pool.
 */
static void nvm_free_rqd_ppalist(struct nvm_tgt_dev *tgt_dev,
			struct nvm_rq *rqd)
{
	if (rqd->ppa_list)
		nvm_dev_dma_free(tgt_dev->parent, rqd->ppa_list,
				 rqd->dma_ppa_list);
}

720 721 722 723 724 725 726 727 728 729 730
int nvm_get_chunk_meta(struct nvm_tgt_dev *tgt_dev, struct nvm_chk_meta *meta,
		struct ppa_addr ppa, int nchks)
{
	struct nvm_dev *dev = tgt_dev->parent;

	nvm_ppa_tgt_to_dev(tgt_dev, &ppa, 1);

	return dev->ops->get_chk_meta(tgt_dev->parent, meta,
						(sector_t)ppa.ppa, nchks);
}
EXPORT_SYMBOL(nvm_get_chunk_meta);
731

732 733 734 735 736 737 738
int nvm_set_tgt_bb_tbl(struct nvm_tgt_dev *tgt_dev, struct ppa_addr *ppas,
		       int nr_ppas, int type)
{
	struct nvm_dev *dev = tgt_dev->parent;
	struct nvm_rq rqd;
	int ret;

739
	if (nr_ppas > NVM_MAX_VLBA) {
740 741 742 743 744 745
		pr_err("nvm: unable to update all blocks atomically\n");
		return -EINVAL;
	}

	memset(&rqd, 0, sizeof(struct nvm_rq));

746
	nvm_set_rqd_ppalist(tgt_dev, &rqd, ppas, nr_ppas);
747
	nvm_rq_tgt_to_dev(tgt_dev, &rqd);
748 749

	ret = dev->ops->set_bb_tbl(dev, &rqd.ppa_addr, rqd.nr_ppas, type);
750
	nvm_free_rqd_ppalist(tgt_dev, &rqd);
751
	if (ret) {
752
		pr_err("nvm: failed bb mark\n");
753 754 755 756 757 758 759
		return -EINVAL;
	}

	return 0;
}
EXPORT_SYMBOL(nvm_set_tgt_bb_tbl);

760 761 762 763 764 765 766 767 768 769 770 771 772 773 774 775 776 777
/*
 * Compute the I/O flags for request @rqd.
 *
 * Geometries reporting NVM_OCSSD_SPEC_20 always get 0. Otherwise
 * sequential requests contribute pln_mode >> 1, reads add scrambling and
 * suspend, and writes add scrambling.
 */
static int nvm_set_flags(struct nvm_geo *geo, struct nvm_rq *rqd)
{
	int flags;

	if (geo->version == NVM_OCSSD_SPEC_20)
		return 0;

	flags = rqd->is_seq ? (geo->pln_mode >> 1) : 0;

	switch (rqd->opcode) {
	case NVM_OP_PREAD:
		flags |= (NVM_IO_SCRAMBLE_ENABLE | NVM_IO_SUSPEND);
		break;
	case NVM_OP_PWRITE:
		flags |= NVM_IO_SCRAMBLE_ENABLE;
		break;
	default:
		break;
	}

	return flags;
}

778
int nvm_submit_io(struct nvm_tgt_dev *tgt_dev, struct nvm_rq *rqd)
779
{
780
	struct nvm_dev *dev = tgt_dev->parent;
781
	int ret;
782

783 784 785
	if (!dev->ops->submit_io)
		return -ENODEV;

786
	nvm_rq_tgt_to_dev(tgt_dev, rqd);
787 788

	rqd->dev = tgt_dev;
789
	rqd->flags = nvm_set_flags(&tgt_dev->geo, rqd);
790 791 792 793 794 795

	/* In case of error, fail with right address format */
	ret = dev->ops->submit_io(dev, rqd);
	if (ret)
		nvm_rq_dev_to_tgt(tgt_dev, rqd);
	return ret;
796 797 798
}
EXPORT_SYMBOL(nvm_submit_io);

799
int nvm_submit_io_sync(struct nvm_tgt_dev *tgt_dev, struct nvm_rq *rqd)
800
{
801 802 803 804 805 806 807
	struct nvm_dev *dev = tgt_dev->parent;
	int ret;

	if (!dev->ops->submit_io_sync)
		return -ENODEV;

	nvm_rq_tgt_to_dev(tgt_dev, rqd);
808

809
	rqd->dev = tgt_dev;
810
	rqd->flags = nvm_set_flags(&tgt_dev->geo, rqd);
811 812 813 814 815 816

	/* In case of error, fail with right address format */
	ret = dev->ops->submit_io_sync(dev, rqd);
	nvm_rq_dev_to_tgt(tgt_dev, rqd);

	return ret;
817
}
818
EXPORT_SYMBOL(nvm_submit_io_sync);
819

820
void nvm_end_io(struct nvm_rq *rqd)
821
{
822 823 824 825
	struct nvm_tgt_dev *tgt_dev = rqd->dev;

	/* Convert address space */
	if (tgt_dev)
826
		nvm_rq_dev_to_tgt(tgt_dev, rqd);
827

828 829
	if (rqd->end_io)
		rqd->end_io(rqd);
830 831 832
}
EXPORT_SYMBOL(nvm_end_io);

833 834 835 836 837 838 839 840 841 842
/*
 * Fold a bad block list from its per-plane representation to its
 * virtual block representation. The fold is done in place.
 *
 * @blks holds geo->pln_mode consecutive entries per chunk. The state of
 * a virtual block is the first plane entry marked bad or grown bad, or
 * the first plane's entry when none is.
 *
 * Returns the folded length (geo->num_chk), or -EINVAL if @nr_blks is
 * not geo->num_chk * geo->pln_mode.
 */
int nvm_bb_tbl_fold(struct nvm_dev *dev, u8 *blks, int nr_blks)
{
	struct nvm_geo *geo = &dev->geo;
	int blk, pl;

	if (nr_blks != geo->num_chk * geo->pln_mode)
		return -EINVAL;

	for (blk = 0; blk < geo->num_chk; blk++) {
		u8 *planes = &blks[blk * geo->pln_mode];
		int state = planes[0];

		/* Bad blocks on any planes take precedence over other types */
		for (pl = 0; pl < geo->pln_mode; pl++) {
			if (!(planes[pl] & (NVM_BLK_T_BAD|NVM_BLK_T_GRWN_BAD)))
				continue;

			state = planes[pl];
			break;
		}

		blks[blk] = state;
	}

	return geo->num_chk;
}
EXPORT_SYMBOL(nvm_bb_tbl_fold);

869 870 871
/*
 * Read the bad block table for target address @ppa into @blks.
 *
 * @ppa is translated to the device format and passed to the driver's
 * get_bb_tbl operation, whose return value is handed back unchanged.
 */
int nvm_get_tgt_bb_tbl(struct nvm_tgt_dev *tgt_dev, struct ppa_addr ppa,
		       u8 *blks)
{
	struct nvm_dev *parent = tgt_dev->parent;
	int ret;

	nvm_ppa_tgt_to_dev(tgt_dev, &ppa, 1);
	ret = parent->ops->get_bb_tbl(parent, ppa, blks);

	return ret;
}
EXPORT_SYMBOL(nvm_get_tgt_bb_tbl);

880 881
static int nvm_core_init(struct nvm_dev *dev)
{
882
	struct nvm_geo *geo = &dev->geo;
883
	int ret;
884

885
	dev->lun_map = kcalloc(BITS_TO_LONGS(geo->all_luns),
W
Wenwei Tao 已提交
886 887 888
					sizeof(unsigned long), GFP_KERNEL);
	if (!dev->lun_map)
		return -ENOMEM;
889

890 891
	INIT_LIST_HEAD(&dev->area_list);
	INIT_LIST_HEAD(&dev->targets);
892
	mutex_init(&dev->mlock);
893
	spin_lock_init(&dev->lock);
894

895 896 897
	ret = nvm_register_map(dev);
	if (ret)
		goto err_fmtype;
898

899
	return 0;
900 901 902
err_fmtype:
	kfree(dev->lun_map);
	return ret;
903 904
}

905
static void nvm_free(struct nvm_dev *dev)
906 907 908 909
{
	if (!dev)
		return;

910 911 912
	if (dev->dma_pool)
		dev->ops->destroy_dma_pool(dev->dma_pool);

913
	nvm_unregister_map(dev);
914
	kfree(dev->lun_map);
915
	kfree(dev);
916 917 918 919
}

static int nvm_init(struct nvm_dev *dev)
{
920
	struct nvm_geo *geo = &dev->geo;
921
	int ret = -EINVAL;
922

923
	if (dev->ops->identity(dev)) {
924 925 926 927
		pr_err("nvm: device could not be identified\n");
		goto err;
	}

928 929
	pr_debug("nvm: ver:%u.%u nvm_vendor:%x\n",
				geo->major_ver_id, geo->minor_ver_id,
930
				geo->vmnt);
931 932 933 934 935 936 937

	ret = nvm_core_init(dev);
	if (ret) {
		pr_err("nvm: could not initialize core structures.\n");
		goto err;
	}

938
	pr_info("nvm: registered %s [%u/%u/%u/%u/%u]\n",
939 940 941
			dev->name, dev->geo.ws_min, dev->geo.ws_opt,
			dev->geo.num_chk, dev->geo.all_luns,
			dev->geo.num_ch);
942 943 944 945 946 947
	return 0;
err:
	pr_err("nvm: failed to initialize nvm\n");
	return ret;
}

948
struct nvm_dev *nvm_alloc_dev(int node)
949
{
950
	return kzalloc_node(sizeof(struct nvm_dev), GFP_KERNEL, node);
951
}
952
EXPORT_SYMBOL(nvm_alloc_dev);
953

954
int nvm_register(struct nvm_dev *dev)
955 956 957
{
	int ret;

958 959
	if (!dev->q || !dev->ops)
		return -EINVAL;
960

961 962 963 964
	dev->dma_pool = dev->ops->create_dma_pool(dev, "ppalist");
	if (!dev->dma_pool) {
		pr_err("nvm: could not create dma pool\n");
		return -ENOMEM;
965 966
	}

967 968 969
	ret = nvm_init(dev);
	if (ret)
		goto err_init;
970

971
	/* register device with a supported media manager */
972 973 974 975
	down_write(&nvm_lock);
	list_add(&dev->devices, &nvm_devices);
	up_write(&nvm_lock);

976 977
	return 0;
err_init:
978
	dev->ops->destroy_dma_pool(dev->dma_pool);
979 980 981 982
	return ret;
}
EXPORT_SYMBOL(nvm_register);

983
void nvm_unregister(struct nvm_dev *dev)
984
{
985 986 987 988 989 990
	struct nvm_target *t, *tmp;

	mutex_lock(&dev->mlock);
	list_for_each_entry_safe(t, tmp, &dev->targets, list) {
		if (t->dev->parent != dev)
			continue;
991
		__nvm_remove_target(t, false);
992 993 994
	}
	mutex_unlock(&dev->mlock);

W
Wenwei Tao 已提交
995
	down_write(&nvm_lock);
996 997
	list_del(&dev->devices);
	up_write(&nvm_lock);
998

999
	nvm_free(dev);
1000 1001 1002 1003 1004 1005 1006
}
EXPORT_SYMBOL(nvm_unregister);

static int __nvm_configure_create(struct nvm_ioctl_create *create)
{
	struct nvm_dev *dev;

W
Wenwei Tao 已提交
1007
	down_write(&nvm_lock);
1008
	dev = nvm_find_nvm_dev(create->dev);
W
Wenwei Tao 已提交
1009
	up_write(&nvm_lock);
1010

1011 1012 1013 1014 1015
	if (!dev) {
		pr_err("nvm: device not found\n");
		return -EINVAL;
	}

1016
	return nvm_create_tgt(dev, create);
1017 1018 1019 1020 1021 1022 1023 1024 1025 1026 1027 1028 1029 1030 1031 1032
}

/*
 * NVM_INFO ioctl: report the core version and the registered target
 * types.
 *
 * The user's struct nvm_ioctl_info is copied in, the version fields and
 * one entry per registered target type are filled in, and the structure
 * is copied back to @arg.
 *
 * Returns 0 on success, the error from memdup_user() if the request
 * cannot be copied in, or -EFAULT if the reply cannot be copied out.
 */
static long nvm_ioctl_info(struct file *file, void __user *arg)
{
	struct nvm_ioctl_info *info;
	struct nvm_tgt_type *tt;
	int tgt_iter = 0;

	info = memdup_user(arg, sizeof(struct nvm_ioctl_info));
	if (IS_ERR(info))
		return PTR_ERR(info);	/* keeps -ENOMEM distinct from -EFAULT */

	info->version[0] = NVM_VERSION_MAJOR;
	info->version[1] = NVM_VERSION_MINOR;
	info->version[2] = NVM_VERSION_PATCH;

	down_write(&nvm_tgtt_lock);
	/*
	 * NOTE(review): nothing limits tgt_iter to the capacity of
	 * info->tgts; confirm the number of registered target types can
	 * never exceed it.
	 */
	list_for_each_entry(tt, &nvm_tgt_types, list) {
		struct nvm_ioctl_info_tgt *tgt = &info->tgts[tgt_iter];

		tgt->version[0] = tt->version[0];
		tgt->version[1] = tt->version[1];
		tgt->version[2] = tt->version[2];
		strncpy(tgt->tgtname, tt->name, NVM_TTYPE_NAME_MAX);
		/* strncpy() does not terminate a name that fills the buffer */
		tgt->tgtname[NVM_TTYPE_NAME_MAX - 1] = '\0';

		tgt_iter++;
	}

	info->tgtsize = tgt_iter;
	up_write(&nvm_tgtt_lock);

	if (copy_to_user(arg, info, sizeof(struct nvm_ioctl_info))) {
		kfree(info);
		return -EFAULT;
	}

	kfree(info);
	return 0;
}

/*
 * NVM_GET_DEVICES ioctl: report the registered devices.
 *
 * Fills one info entry per device (name plus fixed compatibility
 * fields), up to 31 entries, and copies the result to @arg.
 *
 * Returns 0 on success, -ENOMEM if the reply buffer cannot be allocated,
 * or -EFAULT if it cannot be copied to user space.
 */
static long nvm_ioctl_get_devices(struct file *file, void __user *arg)
{
	struct nvm_ioctl_get_devices *devices;
	struct nvm_dev *dev;
	int i = 0;

	devices = kzalloc(sizeof(struct nvm_ioctl_get_devices), GFP_KERNEL);
	if (!devices)
		return -ENOMEM;

	down_write(&nvm_lock);
	list_for_each_entry(dev, &nvm_devices, devices) {
		struct nvm_ioctl_device_info *info;

		/*
		 * Check before writing: testing "i > 31" after the
		 * increment let a 32nd entry (info[31]) be filled in,
		 * one more than the reported maximum.
		 */
		if (i >= 31) {
			pr_err("nvm: max 31 devices can be reported.\n");
			break;
		}

		info = &devices->info[i];

		strlcpy(info->devname, dev->name, sizeof(info->devname));

		/* kept for compatibility */
		info->bmversion[0] = 1;
		info->bmversion[1] = 0;
		info->bmversion[2] = 0;
		strlcpy(info->bmname, "gennvm", sizeof(info->bmname));
		i++;
	}
	up_write(&nvm_lock);

	devices->nr_devices = i;

	if (copy_to_user(arg, devices,
			 sizeof(struct nvm_ioctl_get_devices))) {
		kfree(devices);
		return -EFAULT;
	}

	kfree(devices);
	return 0;
}

/*
 * NVM_DEV_CREATE ioctl: validate the request and create the target.
 *
 * Rejects extended configurations with a non-zero reserved field and
 * any flag other than NVM_TARGET_FACTORY, forces NUL termination of the
 * three name fields, and then hands over to __nvm_configure_create().
 *
 * Returns -EFAULT if the request cannot be copied in, -EINVAL for an
 * invalid request, otherwise the result of __nvm_configure_create().
 */
static long nvm_ioctl_dev_create(struct file *file, void __user *arg)
{
	struct nvm_ioctl_create create;

	if (copy_from_user(&create, arg, sizeof(struct nvm_ioctl_create)))
		return -EFAULT;

	if (create.conf.type == NVM_CONFIG_TYPE_EXTENDED &&
	    create.conf.e.rsv != 0) {
		pr_err("nvm: reserved config field in use\n");
		return -EINVAL;
	}

	create.dev[DISK_NAME_LEN - 1] = '\0';
	create.tgttype[NVM_TTYPE_NAME_MAX - 1] = '\0';
	create.tgtname[DISK_NAME_LEN - 1] = '\0';

	/* Check for valid flags: only NVM_TARGET_FACTORY may be set */
	if (create.flags & ~NVM_TARGET_FACTORY) {
		pr_err("nvm: flag not supported\n");
		return -EINVAL;
	}

	return __nvm_configure_create(&create);
}

/*
 * NVM_DEV_REMOVE ioctl: remove the target named in the request.
 *
 * Every registered device is asked in turn to remove the target; the
 * walk stops at the first device that does.
 *
 * Returns -EFAULT if the request cannot be copied in, -EINVAL if any
 * flag is set, otherwise the result of the last nvm_remove_tgt() call
 * (0 once a target was removed, 1 when no device had it), or 0 when no
 * device is registered.
 */
static long nvm_ioctl_dev_remove(struct file *file, void __user *arg)
{
	struct nvm_ioctl_remove remove;
	struct nvm_dev *dev;
	int ret = 0;

	if (copy_from_user(&remove, arg, sizeof(struct nvm_ioctl_remove)))
		return -EFAULT;

	remove.tgtname[DISK_NAME_LEN - 1] = '\0';

	if (remove.flags != 0) {
		pr_err("nvm: no flags supported\n");
		return -EINVAL;
	}

	/*
	 * Hold nvm_lock across the walk so a device cannot be unlinked
	 * from nvm_devices while it is being visited. The order nvm_lock
	 * then dev->mlock matches nvm_target_exists().
	 */
	down_write(&nvm_lock);
	list_for_each_entry(dev, &nvm_devices, devices) {
		ret = nvm_remove_tgt(dev, &remove);
		if (!ret)
			break;
	}
	up_write(&nvm_lock);

	return ret;
}

1157
/* kept for compatibility reasons */
1158 1159 1160 1161 1162 1163 1164 1165 1166 1167 1168 1169
static long nvm_ioctl_dev_init(struct file *file, void __user *arg)
{
	struct nvm_ioctl_dev_init init;

	if (copy_from_user(&init, arg, sizeof(struct nvm_ioctl_dev_init)))
		return -EFAULT;

	if (init.flags != 0) {
		pr_err("nvm: no flags supported\n");
		return -EINVAL;
	}

1170
	return 0;
1171 1172
}

1173
/* Kept for compatibility reasons */
1174 1175 1176 1177 1178 1179 1180 1181 1182 1183 1184 1185
static long nvm_ioctl_dev_factory(struct file *file, void __user *arg)
{
	struct nvm_ioctl_dev_factory fact;

	if (copy_from_user(&fact, arg, sizeof(struct nvm_ioctl_dev_factory)))
		return -EFAULT;

	fact.dev[DISK_NAME_LEN - 1] = '\0';

	if (fact.flags & ~(NVM_FACTORY_NR_BITS - 1))
		return -EINVAL;

1186
	return 0;
1187 1188
}

1189 1190 1191 1192
/*
 * ioctl entry point of the control device.
 *
 * Requires CAP_SYS_ADMIN (-EPERM otherwise) and dispatches @cmd to the
 * matching handler. Commands that are not recognised return 0.
 */
static long nvm_ctl_ioctl(struct file *file, uint cmd, unsigned long arg)
{
	void __user *argp = (void __user *)arg;
	long ret = 0;

	if (!capable(CAP_SYS_ADMIN))
		return -EPERM;

	switch (cmd) {
	case NVM_INFO:
		ret = nvm_ioctl_info(file, argp);
		break;
	case NVM_GET_DEVICES:
		ret = nvm_ioctl_get_devices(file, argp);
		break;
	case NVM_DEV_CREATE:
		ret = nvm_ioctl_dev_create(file, argp);
		break;
	case NVM_DEV_REMOVE:
		ret = nvm_ioctl_dev_remove(file, argp);
		break;
	case NVM_DEV_INIT:
		ret = nvm_ioctl_dev_init(file, argp);
		break;
	case NVM_DEV_FACTORY:
		ret = nvm_ioctl_dev_factory(file, argp);
		break;
	default:
		break;
	}

	return ret;
}

/*
 * File operations of the control device: a non-seekable file whose only
 * real operation is the ioctl handled by nvm_ctl_ioctl().
 */
static const struct file_operations _ctl_fops = {
	.open = nonseekable_open,
	.unlocked_ioctl = nvm_ctl_ioctl,
	.owner = THIS_MODULE,
	.llseek  = noop_llseek,
};

/*
 * Misc device description of the control node: dynamically assigned
 * minor, named "lightnvm", node name "lightnvm/control", served by
 * _ctl_fops.
 */
static struct miscdevice _nvm_misc = {
	.minor		= MISC_DYNAMIC_MINOR,
	.name		= "lightnvm",
	.nodename	= "lightnvm/control",
	.fops		= &_ctl_fops,
};
1226
/* Hook _nvm_misc up through the builtin_misc_device() helper. */
builtin_misc_device(_nvm_misc);