lightnvm.c 30.3 KB
Newer Older
M
Matias Bjørling 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28
/*
 * nvme-lightnvm.c - LightNVM NVMe device
 *
 * Copyright (C) 2014-2015 IT University of Copenhagen
 * Initial release: Matias Bjorling <mb@lightnvm.io>
 *
 * This program is free software; you can redistribute it and/or
 * modify it under the terms of the GNU General Public License version
 * 2 as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful, but
 * WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program; see the file COPYING.  If not, write to
 * the Free Software Foundation, 675 Mass Ave, Cambridge, MA 02139,
 * USA.
 *
 */

#include "nvme.h"

#include <linux/nvme.h>
#include <linux/bitops.h>
#include <linux/lightnvm.h>
#include <linux/vmalloc.h>
29 30
#include <linux/sched/sysctl.h>
#include <uapi/linux/lightnvm.h>
M
Matias Bjørling 已提交
31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53

/*
 * Admin-queue opcodes for the LightNVM commands issued by this file:
 * device identity and reading/updating the bad block table.
 */
enum nvme_nvm_admin_opcode {
	nvme_nvm_admin_identity		= 0xe2,
	nvme_nvm_admin_get_bb_tbl	= 0xf2,
	nvme_nvm_admin_set_bb_tbl	= 0xf1,
};

/*
 * Command layout used for physical read/write I/O.  The structure must stay
 * 64 bytes in size; _nvme_nvm_check_size() enforces this at build time.
 */
struct nvme_nvm_ph_rw {
	__u8			opcode;
	__u8			flags;
	__u16			command_id;
	__le32			nsid;
	__u64			rsvd2;
	__le64			metadata;	/* DMA address of the metadata buffer */
	__le64			prp1;
	__le64			prp2;
	__le64			spba;		/* PPA, or DMA address of a PPA list */
	__le16			length;		/* filled with nr_ppas - 1 by nvme_nvm_rqtocmd() */
	__le16			control;
	__le32			dsmgmt;
	__le64			resv;
};

54 55 56 57 58 59 60 61 62 63 64 65 66 67 68
/*
 * Command layout for the erase command.  The structure must stay 64 bytes in
 * size; _nvme_nvm_check_size() enforces this at build time.
 */
struct nvme_nvm_erase_blk {
	__u8			opcode;
	__u8			flags;
	__u16			command_id;
	__le32			nsid;
	__u64			rsvd[2];
	__le64			prp1;
	__le64			prp2;
	__le64			spba;
	__le16			length;
	__le16			control;
	__le32			dsmgmt;
	__le64			resv;
};

M
Matias Bjørling 已提交
69 70 71 72 73 74 75 76
struct nvme_nvm_identity {
	__u8			opcode;
	__u8			flags;
	__u16			command_id;
	__le32			nsid;
	__u64			rsvd[2];
	__le64			prp1;
	__le64			prp2;
77
	__u32			rsvd11[6];
M
Matias Bjørling 已提交
78 79
};

80
struct nvme_nvm_getbbtbl {
M
Matias Bjørling 已提交
81 82 83 84 85 86 87
	__u8			opcode;
	__u8			flags;
	__u16			command_id;
	__le32			nsid;
	__u64			rsvd[2];
	__le64			prp1;
	__le64			prp2;
88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104
	__le64			spba;
	__u32			rsvd4[4];
};

/*
 * Command layout for updating the bad block table.  The structure must stay
 * 64 bytes (see _nvme_nvm_check_size()).
 */
struct nvme_nvm_setbbtbl {
	__u8			opcode;
	__u8			flags;
	__u16			command_id;
	__le32			nsid;
	__le64			rsvd[2];
	__le64			prp1;
	__le64			prp2;
	__le64			spba;		/* first PPA to update */
	__le16			nlb;		/* filled with nr_ppas - 1 */
	__u8			value;		/* new block state ("type") */
	__u8			rsvd3;
	__u32			rsvd4[3];
};

struct nvme_nvm_command {
	union {
		struct nvme_common_command common;
		struct nvme_nvm_ph_rw ph_rw;
111 112
		struct nvme_nvm_erase_blk erase;
		struct nvme_nvm_identity identity;
113 114
		struct nvme_nvm_getbbtbl get_bb;
		struct nvme_nvm_setbbtbl set_bb;
M
Matias Bjørling 已提交
115 116 117
	};
};

118
struct nvme_nvm_id12_grp {
M
Matias Bjørling 已提交
119 120 121 122 123 124
	__u8			mtype;
	__u8			fmtype;
	__le16			res16;
	__u8			num_ch;
	__u8			num_lun;
	__u8			num_pln;
125
	__u8			rsvd1;
126
	__le16			num_chk;
M
Matias Bjørling 已提交
127 128 129 130
	__le16			num_pg;
	__le16			fpg_sz;
	__le16			csecs;
	__le16			sos;
131
	__le16			rsvd2;
M
Matias Bjørling 已提交
132 133 134 135 136 137 138
	__le32			trdt;
	__le32			trdm;
	__le32			tprt;
	__le32			tprm;
	__le32			tbet;
	__le32			tbem;
	__le32			mpos;
139
	__le32			mccap;
M
Matias Bjørling 已提交
140
	__le16			cpar;
141
	__u8			reserved[906];
M
Matias Bjørling 已提交
142 143
} __packed;

144
struct nvme_nvm_id12_addrf {
M
Matias Bjørling 已提交
145 146 147 148 149 150 151 152 153 154
	__u8			ch_offset;
	__u8			ch_len;
	__u8			lun_offset;
	__u8			lun_len;
	__u8			pln_offset;
	__u8			pln_len;
	__u8			blk_offset;
	__u8			blk_len;
	__u8			pg_offset;
	__u8			pg_len;
155 156
	__u8			sec_offset;
	__u8			sec_len;
M
Matias Bjørling 已提交
157 158 159
	__u8			res[4];
} __packed;

160
struct nvme_nvm_id12 {
M
Matias Bjørling 已提交
161 162 163
	__u8			ver_id;
	__u8			vmnt;
	__u8			cgrps;
164
	__u8			res;
M
Matias Bjørling 已提交
165 166
	__le32			cap;
	__le32			dom;
167
	struct nvme_nvm_id12_addrf ppaf;
168
	__u8			resv[228];
169
	struct nvme_nvm_id12_grp grp;
170
	__u8			resv2[2880];
M
Matias Bjørling 已提交
171 172
} __packed;

173 174 175 176 177 178 179 180 181 182 183 184 185 186
/*
 * Bad block table as returned by the get-bad-block-table command: a 64-byte
 * header (checked in _nvme_nvm_check_size()) followed by one state byte per
 * block.  nvme_nvm_get_bb_tbl() validates tblid, verid and tblks before
 * copying blk[] out.
 */
struct nvme_nvm_bb_tbl {
	__u8	tblid[4];	/* expected to read 'B','B','L','T' */
	__le16	verid;		/* only version 1 is accepted */
	__le16	revid;
	__le32	rvsd1;
	__le32	tblks;		/* number of entries in blk[] */
	__le32	tfact;
	__le32	tgrown;
	__le32	tdresv;
	__le32	thresv;
	__le32	rsvd2[8];
	__u8	blk[];		/* flexible array member; does not add to sizeof */
};

187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238
/*
 * Address format reported in the 2.0 identify data: only bit lengths are
 * given; nvme_nvm_set_addr_20() derives offsets and masks from them.
 * Must stay 8 bytes (see _nvme_nvm_check_size()).
 */
struct nvme_nvm_id20_addrf {
	__u8			grp_len;
	__u8			pu_len;
	__u8			chk_len;
	__u8			lba_len;
	__u8			resv[4];
};

/*
 * Identify data returned by a 2.0 device.  The first byte (mjr) occupies the
 * same position as ver_id in the 1.2 layout, which is how nvme_nvm_identity()
 * tells the two apart.  Must be NVME_IDENTIFY_DATA_SIZE bytes
 * (see _nvme_nvm_check_size()).
 */
struct nvme_nvm_id20 {
	__u8			mjr;
	__u8			mnr;
	__u8			resv[6];

	struct nvme_nvm_id20_addrf lbaf;

	__le32			mccap;
	__u8			resv2[12];

	__u8			wit;
	__u8			resv3[31];

	/* Geometry */
	__le16			num_grp;
	__le16			num_pu;
	__le32			num_chk;
	__le32			clba;
	__u8			resv4[52];

	/* Write data requirements */
	__le32			ws_min;
	__le32			ws_opt;
	__le32			mw_cunits;
	__le32			maxoc;
	__le32			maxocpu;
	__u8			resv5[44];

	/* Performance related metrics */
	__le32			trdt;
	__le32			trdm;
	__le32			twrt;
	__le32			twrm;
	__le32			tcrst;
	__le32			tcrsm;
	__u8			resv6[40];

	/* Reserved area */
	__u8			resv7[2816];

	/* Vendor specific */
	__u8			vs[1024];
};

M
Matias Bjørling 已提交
239 240 241 242 243 244 245
/*
 * Check we didn't inadvertently grow the command struct
 */
static inline void _nvme_nvm_check_size(void)
{
	BUILD_BUG_ON(sizeof(struct nvme_nvm_identity) != 64);
	BUILD_BUG_ON(sizeof(struct nvme_nvm_ph_rw) != 64);
246
	BUILD_BUG_ON(sizeof(struct nvme_nvm_erase_blk) != 64);
247 248
	BUILD_BUG_ON(sizeof(struct nvme_nvm_getbbtbl) != 64);
	BUILD_BUG_ON(sizeof(struct nvme_nvm_setbbtbl) != 64);
249 250 251
	BUILD_BUG_ON(sizeof(struct nvme_nvm_id12_grp) != 960);
	BUILD_BUG_ON(sizeof(struct nvme_nvm_id12_addrf) != 16);
	BUILD_BUG_ON(sizeof(struct nvme_nvm_id12) != NVME_IDENTIFY_DATA_SIZE);
252
	BUILD_BUG_ON(sizeof(struct nvme_nvm_bb_tbl) != 64);
253 254
	BUILD_BUG_ON(sizeof(struct nvme_nvm_id20_addrf) != 8);
	BUILD_BUG_ON(sizeof(struct nvme_nvm_id20) != NVME_IDENTIFY_DATA_SIZE);
M
Matias Bjørling 已提交
255 256
}

257 258 259 260 261 262 263 264 265 266 267 268 269 270 271 272 273 274 275 276 277 278 279 280 281 282 283
/*
 * Copy the 1.2 address format reported by the device into @dst and derive a
 * bit mask for each address component from its offset and length.
 */
static void nvme_nvm_set_addr_12(struct nvm_addrf_12 *dst,
				 struct nvme_nvm_id12_addrf *src)
{
	/* channel */
	dst->ch_len = src->ch_len;
	dst->ch_offset = src->ch_offset;
	dst->ch_mask = ((1ULL << dst->ch_len) - 1) << dst->ch_offset;

	/* LUN */
	dst->lun_len = src->lun_len;
	dst->lun_offset = src->lun_offset;
	dst->lun_mask = ((1ULL << dst->lun_len) - 1) << dst->lun_offset;

	/* block */
	dst->blk_len = src->blk_len;
	dst->blk_offset = src->blk_offset;
	dst->blk_mask = ((1ULL << dst->blk_len) - 1) << dst->blk_offset;

	/* page */
	dst->pg_len = src->pg_len;
	dst->pg_offset = src->pg_offset;
	dst->pg_mask = ((1ULL << dst->pg_len) - 1) << dst->pg_offset;

	/* plane */
	dst->pln_len = src->pln_len;
	dst->pln_offset = src->pln_offset;
	dst->pln_mask = ((1ULL << dst->pln_len) - 1) << dst->pln_offset;

	/* sector */
	dst->sect_len = src->sec_len;
	dst->sect_offset = src->sec_offset;
	dst->sec_mask = ((1ULL << dst->sect_len) - 1) << dst->sect_offset;
}

static int nvme_nvm_setup_12(struct nvme_nvm_id12 *id,
			     struct nvm_geo *geo)
M
Matias Bjørling 已提交
284
{
285
	struct nvme_nvm_id12_grp *src;
286
	int sec_per_pg, sec_per_pl, pg_per_blk;
287

288 289 290 291 292 293 294
	if (id->cgrps != 1)
		return -EINVAL;

	src = &id->grp;

	if (src->mtype != 0) {
		pr_err("nvm: memory type not supported\n");
295
		return -EINVAL;
296
	}
297

298
	geo->ver_id = id->ver_id;
299

300 301 302
	geo->nr_chnls = src->num_ch;
	geo->nr_luns = src->num_lun;
	geo->all_luns = geo->nr_chnls * geo->nr_luns;
303

304
	geo->nr_chks = le16_to_cpu(src->num_chk);
305

306 307
	geo->csecs = le16_to_cpu(src->csecs);
	geo->sos = le16_to_cpu(src->sos);
308 309

	pg_per_blk = le16_to_cpu(src->num_pg);
310
	sec_per_pg = le16_to_cpu(src->fpg_sz) / geo->csecs;
311
	sec_per_pl = sec_per_pg * src->num_pln;
312 313 314 315 316 317 318 319
	geo->clba = sec_per_pl * pg_per_blk;

	geo->all_chunks = geo->all_luns * geo->nr_chks;
	geo->total_secs = geo->clba * geo->all_chunks;

	geo->ws_min = sec_per_pg;
	geo->ws_opt = sec_per_pg;
	geo->mw_cunits = geo->ws_opt << 3;	/* default to MLC safe values */
320

321 322 323 324 325 326 327 328
	geo->mccap = le32_to_cpu(src->mccap);

	geo->trdt = le32_to_cpu(src->trdt);
	geo->trdm = le32_to_cpu(src->trdm);
	geo->tprt = le32_to_cpu(src->tprt);
	geo->tprm = le32_to_cpu(src->tprm);
	geo->tbet = le32_to_cpu(src->tbet);
	geo->tbem = le32_to_cpu(src->tbem);
329 330

	/* 1.2 compatibility */
331 332 333 334 335 336 337 338 339 340 341 342 343 344 345 346 347 348 349 350 351 352 353 354 355
	geo->vmnt = id->vmnt;
	geo->cap = le32_to_cpu(id->cap);
	geo->dom = le32_to_cpu(id->dom);

	geo->mtype = src->mtype;
	geo->fmtype = src->fmtype;

	geo->cpar = le16_to_cpu(src->cpar);
	geo->mpos = le32_to_cpu(src->mpos);

	geo->plane_mode = NVM_PLANE_SINGLE;

	if (geo->mpos & 0x020202) {
		geo->plane_mode = NVM_PLANE_DOUBLE;
		geo->ws_opt <<= 1;
	} else if (geo->mpos & 0x040404) {
		geo->plane_mode = NVM_PLANE_QUAD;
		geo->ws_opt <<= 2;
	}

	geo->num_pln = src->num_pln;
	geo->num_pg = le16_to_cpu(src->num_pg);
	geo->fpg_sz = le16_to_cpu(src->fpg_sz);

	nvme_nvm_set_addr_12((struct nvm_addrf_12 *)&geo->addrf, &id->ppaf);
356

M
Matias Bjørling 已提交
357 358 359
	return 0;
}

360 361
static void nvme_nvm_set_addr_20(struct nvm_addrf *dst,
				 struct nvme_nvm_id20_addrf *src)
362
{
363 364 365 366 367 368 369 370 371 372 373 374 375 376
	dst->ch_len = src->grp_len;
	dst->lun_len = src->pu_len;
	dst->chk_len = src->chk_len;
	dst->sec_len = src->lba_len;

	dst->sec_offset = 0;
	dst->chk_offset = dst->sec_len;
	dst->lun_offset = dst->chk_offset + dst->chk_len;
	dst->ch_offset = dst->lun_offset + dst->lun_len;

	dst->ch_mask = ((1ULL << dst->ch_len) - 1) << dst->ch_offset;
	dst->lun_mask = ((1ULL << dst->lun_len) - 1) << dst->lun_offset;
	dst->chk_mask = ((1ULL << dst->chk_len) - 1) << dst->chk_offset;
	dst->sec_mask = ((1ULL << dst->sec_len) - 1) << dst->sec_offset;
377 378
}

379 380
static int nvme_nvm_setup_20(struct nvme_nvm_id20 *id,
			     struct nvm_geo *geo)
381
{
382
	geo->ver_id = id->mjr;
383

384 385 386
	geo->nr_chnls = le16_to_cpu(id->num_grp);
	geo->nr_luns = le16_to_cpu(id->num_pu);
	geo->all_luns = geo->nr_chnls * geo->nr_luns;
387

388 389
	geo->nr_chks = le32_to_cpu(id->num_chk);
	geo->clba = le32_to_cpu(id->clba);
390

391 392
	geo->all_chunks = geo->all_luns * geo->nr_chks;
	geo->total_secs = geo->clba * geo->all_chunks;
393

394 395 396
	geo->ws_min = le32_to_cpu(id->ws_min);
	geo->ws_opt = le32_to_cpu(id->ws_opt);
	geo->mw_cunits = le32_to_cpu(id->mw_cunits);
397

398 399 400 401 402 403 404 405
	geo->trdt = le32_to_cpu(id->trdt);
	geo->trdm = le32_to_cpu(id->trdm);
	geo->tprt = le32_to_cpu(id->twrt);
	geo->tprm = le32_to_cpu(id->twrm);
	geo->tbet = le32_to_cpu(id->tcrst);
	geo->tbem = le32_to_cpu(id->tcrsm);

	nvme_nvm_set_addr_20(&geo->addrf, &id->lbaf);
406 407 408 409

	return 0;
}

410
static int nvme_nvm_identity(struct nvm_dev *nvmdev)
M
Matias Bjørling 已提交
411
{
412
	struct nvme_ns *ns = nvmdev->q->queuedata;
413
	struct nvme_nvm_id12 *id;
M
Matias Bjørling 已提交
414 415 416 417
	struct nvme_nvm_command c = {};
	int ret;

	c.identity.opcode = nvme_nvm_admin_identity;
C
Christoph Hellwig 已提交
418
	c.identity.nsid = cpu_to_le32(ns->head->ns_id);
M
Matias Bjørling 已提交
419

420 421
	id = kmalloc(sizeof(struct nvme_nvm_id12), GFP_KERNEL);
	if (!id)
M
Matias Bjørling 已提交
422 423
		return -ENOMEM;

424
	ret = nvme_submit_sync_cmd(ns->ctrl->admin_q, (struct nvme_command *)&c,
425
				id, sizeof(struct nvme_nvm_id12));
M
Matias Bjørling 已提交
426 427 428 429 430
	if (ret) {
		ret = -EIO;
		goto out;
	}

431 432 433 434 435 436
	/*
	 * The 1.2 and 2.0 specifications share the first byte in their geometry
	 * command to make it possible to know what version a device implements.
	 */
	switch (id->ver_id) {
	case 1:
437
		ret = nvme_nvm_setup_12(id, &nvmdev->geo);
438 439
		break;
	case 2:
440 441
		ret = nvme_nvm_setup_20((struct nvme_nvm_id20 *)id,
							&nvmdev->geo);
442 443
		break;
	default:
444 445
		dev_err(ns->ctrl->device, "OCSSD revision not supported (%d)\n",
							id->ver_id);
446 447
		ret = -EINVAL;
	}
448

M
Matias Bjørling 已提交
449
out:
450
	kfree(id);
M
Matias Bjørling 已提交
451 452 453
	return ret;
}

454
static int nvme_nvm_get_bb_tbl(struct nvm_dev *nvmdev, struct ppa_addr ppa,
455
								u8 *blks)
M
Matias Bjørling 已提交
456
{
457
	struct request_queue *q = nvmdev->q;
458
	struct nvm_geo *geo = &nvmdev->geo;
M
Matias Bjørling 已提交
459
	struct nvme_ns *ns = q->queuedata;
460
	struct nvme_ctrl *ctrl = ns->ctrl;
M
Matias Bjørling 已提交
461
	struct nvme_nvm_command c = {};
462
	struct nvme_nvm_bb_tbl *bb_tbl;
463
	int nr_blks = geo->nr_chks * geo->num_pln;
464
	int tblsz = sizeof(struct nvme_nvm_bb_tbl) + nr_blks;
M
Matias Bjørling 已提交
465 466 467
	int ret = 0;

	c.get_bb.opcode = nvme_nvm_admin_get_bb_tbl;
C
Christoph Hellwig 已提交
468
	c.get_bb.nsid = cpu_to_le32(ns->head->ns_id);
469
	c.get_bb.spba = cpu_to_le64(ppa.ppa);
M
Matias Bjørling 已提交
470

471 472 473
	bb_tbl = kzalloc(tblsz, GFP_KERNEL);
	if (!bb_tbl)
		return -ENOMEM;
M
Matias Bjørling 已提交
474

475
	ret = nvme_submit_sync_cmd(ctrl->admin_q, (struct nvme_command *)&c,
476
								bb_tbl, tblsz);
M
Matias Bjørling 已提交
477
	if (ret) {
478
		dev_err(ctrl->device, "get bad block table failed (%d)\n", ret);
M
Matias Bjørling 已提交
479 480 481 482
		ret = -EIO;
		goto out;
	}

483 484
	if (bb_tbl->tblid[0] != 'B' || bb_tbl->tblid[1] != 'B' ||
		bb_tbl->tblid[2] != 'L' || bb_tbl->tblid[3] != 'T') {
485
		dev_err(ctrl->device, "bbt format mismatch\n");
486 487 488 489 490 491
		ret = -EINVAL;
		goto out;
	}

	if (le16_to_cpu(bb_tbl->verid) != 1) {
		ret = -EINVAL;
492
		dev_err(ctrl->device, "bbt version not supported\n");
493 494 495
		goto out;
	}

496
	if (le32_to_cpu(bb_tbl->tblks) != nr_blks) {
497
		ret = -EINVAL;
498 499
		dev_err(ctrl->device,
				"bbt unsuspected blocks returned (%u!=%u)",
500
				le32_to_cpu(bb_tbl->tblks), nr_blks);
501 502 503
		goto out;
	}

504
	memcpy(blks, bb_tbl->blk, geo->nr_chks * geo->num_pln);
M
Matias Bjørling 已提交
505
out:
506 507 508 509
	kfree(bb_tbl);
	return ret;
}

510 511
static int nvme_nvm_set_bb_tbl(struct nvm_dev *nvmdev, struct ppa_addr *ppas,
							int nr_ppas, int type)
512
{
513
	struct nvme_ns *ns = nvmdev->q->queuedata;
514 515 516 517
	struct nvme_nvm_command c = {};
	int ret = 0;

	c.set_bb.opcode = nvme_nvm_admin_set_bb_tbl;
C
Christoph Hellwig 已提交
518
	c.set_bb.nsid = cpu_to_le32(ns->head->ns_id);
519 520
	c.set_bb.spba = cpu_to_le64(ppas->ppa);
	c.set_bb.nlb = cpu_to_le16(nr_ppas - 1);
521 522
	c.set_bb.value = type;

523
	ret = nvme_submit_sync_cmd(ns->ctrl->admin_q, (struct nvme_command *)&c,
524
								NULL, 0);
525
	if (ret)
526 527
		dev_err(ns->ctrl->device, "set bad block table failed (%d)\n",
									ret);
M
Matias Bjørling 已提交
528 529 530
	return ret;
}

531 532
static inline void nvme_nvm_rqtocmd(struct nvm_rq *rqd, struct nvme_ns *ns,
				    struct nvme_nvm_command *c)
M
Matias Bjørling 已提交
533 534
{
	c->ph_rw.opcode = rqd->opcode;
C
Christoph Hellwig 已提交
535
	c->ph_rw.nsid = cpu_to_le32(ns->head->ns_id);
M
Matias Bjørling 已提交
536
	c->ph_rw.spba = cpu_to_le64(rqd->ppa_addr.ppa);
537
	c->ph_rw.metadata = cpu_to_le64(rqd->dma_meta_list);
M
Matias Bjørling 已提交
538
	c->ph_rw.control = cpu_to_le16(rqd->flags);
539
	c->ph_rw.length = cpu_to_le16(rqd->nr_ppas - 1);
M
Matias Bjørling 已提交
540 541
}

542
/*
 * Completion callback for requests issued by nvme_nvm_submit_io(): record
 * the completion result in the nvm_rq, notify the LightNVM core, then
 * release the command buffer and the request.
 */
static void nvme_nvm_end_io(struct request *rq, blk_status_t status)
{
	struct nvm_rq *rqd = rq->end_io_data;

	rqd->ppa_status = le64_to_cpu(nvme_req(rq)->result.u64);
	rqd->error = nvme_req(rq)->status;
	nvm_end_io(rqd);

	/* the command was allocated in nvme_nvm_submit_io() */
	kfree(nvme_req(rq)->cmd);
	blk_mq_free_request(rq);
}

554 555 556
static struct request *nvme_nvm_alloc_request(struct request_queue *q,
					      struct nvm_rq *rqd,
					      struct nvme_nvm_command *cmd)
M
Matias Bjørling 已提交
557 558 559 560
{
	struct nvme_ns *ns = q->queuedata;
	struct request *rq;

561
	nvme_nvm_rqtocmd(rqd, ns, cmd);
562

563
	rq = nvme_alloc_request(q, (struct nvme_command *)cmd, 0, NVME_QID_ANY);
564 565 566
	if (IS_ERR(rq))
		return rq;

567
	rq->cmd_flags &= ~REQ_FAILFAST_DRIVER;
M
Matias Bjørling 已提交
568

569 570
	if (rqd->bio) {
		blk_init_request_from_bio(rq, rqd->bio);
571 572 573 574
	} else {
		rq->ioprio = IOPRIO_PRIO_VALUE(IOPRIO_CLASS_BE, IOPRIO_NORM);
		rq->__data_len = 0;
	}
M
Matias Bjørling 已提交
575

576 577 578 579 580 581 582 583 584 585 586 587 588 589 590 591 592 593 594
	return rq;
}

static int nvme_nvm_submit_io(struct nvm_dev *dev, struct nvm_rq *rqd)
{
	struct request_queue *q = dev->q;
	struct nvme_nvm_command *cmd;
	struct request *rq;

	cmd = kzalloc(sizeof(struct nvme_nvm_command), GFP_KERNEL);
	if (!cmd)
		return -ENOMEM;

	rq = nvme_nvm_alloc_request(q, rqd, cmd);
	if (IS_ERR(rq)) {
		kfree(cmd);
		return PTR_ERR(rq);
	}

M
Matias Bjørling 已提交
595 596 597 598 599 600 601
	rq->end_io_data = rqd;

	blk_execute_rq_nowait(q, NULL, rq, 0, nvme_nvm_end_io);

	return 0;
}

602 603 604 605 606 607 608 609 610 611 612 613 614 615 616 617 618 619 620 621 622 623 624 625 626 627 628 629
/*
 * Submit @rqd and wait for it to complete.
 *
 * Returns -EINTR if the request was cancelled, the error from
 * nvme_nvm_alloc_request() if no request could be allocated, and 0
 * otherwise.  Device-level failures are reported through rqd->error and
 * rqd->ppa_status, not through the return value.
 */
static int nvme_nvm_submit_io_sync(struct nvm_dev *dev, struct nvm_rq *rqd)
{
	struct request_queue *q = dev->q;
	struct nvme_nvm_command cmd;
	struct request *rq;
	int ret;

	memset(&cmd, 0, sizeof(cmd));

	rq = nvme_nvm_alloc_request(q, rqd, &cmd);
	if (IS_ERR(rq))
		return PTR_ERR(rq);

	/* I/Os can fail and the error is signaled through rqd. Callers must
	 * handle the error accordingly.
	 */
	blk_execute_rq(q, NULL, rq, 0);

	ret = (nvme_req(rq)->flags & NVME_REQ_CANCELLED) ? -EINTR : 0;

	rqd->ppa_status = le64_to_cpu(nvme_req(rq)->result.u64);
	rqd->error = nvme_req(rq)->status;

	blk_mq_free_request(rq);

	return ret;
}

630
static void *nvme_nvm_create_dma_pool(struct nvm_dev *nvmdev, char *name)
M
Matias Bjørling 已提交
631
{
632
	struct nvme_ns *ns = nvmdev->q->queuedata;
M
Matias Bjørling 已提交
633

634
	return dma_pool_create(name, ns->ctrl->dev, PAGE_SIZE, PAGE_SIZE, 0);
M
Matias Bjørling 已提交
635 636 637 638 639 640 641 642 643
}

/* Destroy a DMA pool; @pool is handed over as an opaque pointer. */
static void nvme_nvm_destroy_dma_pool(void *pool)
{
	dma_pool_destroy(pool);
}

644
static void *nvme_nvm_dev_dma_alloc(struct nvm_dev *dev, void *pool,
M
Matias Bjørling 已提交
645 646 647 648 649
				    gfp_t mem_flags, dma_addr_t *dma_handler)
{
	return dma_pool_alloc(pool, mem_flags, dma_handler);
}

650
static void nvme_nvm_dev_dma_free(void *pool, void *addr,
M
Matias Bjørling 已提交
651 652
							dma_addr_t dma_handler)
{
653
	dma_pool_free(pool, addr, dma_handler);
M
Matias Bjørling 已提交
654 655 656 657 658 659
}

static struct nvm_dev_ops nvme_nvm_dev_ops = {
	.identity		= nvme_nvm_identity,

	.get_bb_tbl		= nvme_nvm_get_bb_tbl,
660
	.set_bb_tbl		= nvme_nvm_set_bb_tbl,
M
Matias Bjørling 已提交
661 662

	.submit_io		= nvme_nvm_submit_io,
663
	.submit_io_sync		= nvme_nvm_submit_io_sync,
M
Matias Bjørling 已提交
664 665 666 667 668 669 670

	.create_dma_pool	= nvme_nvm_create_dma_pool,
	.destroy_dma_pool	= nvme_nvm_destroy_dma_pool,
	.dev_dma_alloc		= nvme_nvm_dev_dma_alloc,
	.dev_dma_free		= nvme_nvm_dev_dma_free,
};

671 672 673 674 675 676 677 678 679 680 681 682 683 684 685 686 687 688
/*
 * Execute a user-supplied LightNVM command synchronously.
 *
 * @q:        queue to submit on
 * @ns:       namespace the command targets
 * @vcmd:     command to send; its spba and metadata fields are filled in here
 * @ubuf:     user data buffer, @bufflen bytes (may be NULL)
 * @meta_buf: user metadata buffer, @meta_len bytes; only used when a data
 *            buffer is also supplied
 * @ppa_buf:  user PPA list holding @ppa_len + 1 entries.  When @ppa_len is 0
 *            the value of @ppa_buf itself is placed in the command.
 * @result:   if non-NULL, receives the command status masked with 0x7ff
 * @status:   if non-NULL, receives the 64-bit completion result
 * @timeout:  request timeout in jiffies; 0 selects ADMIN_TIMEOUT
 *
 * The PPA list and the metadata are staged in elements of dev->dma_pool.
 * NOTE(review): the bounds below assume those elements are PAGE_SIZE bytes,
 * which is what nvme_nvm_create_dma_pool() creates - confirm for dev->dma_pool.
 *
 * Returns 0 on success, -EINVAL if the PPA list or metadata would not fit in
 * a pool element, -ENOMEM, -EFAULT, -EINTR if the request was cancelled,
 * -EIO if the device reported an error status, or the error from request
 * allocation / user buffer mapping.
 */
static int nvme_nvm_submit_user_cmd(struct request_queue *q,
				struct nvme_ns *ns,
				struct nvme_nvm_command *vcmd,
				void __user *ubuf, unsigned int bufflen,
				void __user *meta_buf, unsigned int meta_len,
				void __user *ppa_buf, unsigned int ppa_len,
				u32 *result, u64 *status, unsigned int timeout)
{
	bool write = nvme_is_write((struct nvme_command *)vcmd);
	struct nvm_dev *dev = ns->ndev;
	struct gendisk *disk = ns->disk;
	struct request *rq;
	struct bio *bio = NULL;
	__le64 *ppa_list = NULL;
	dma_addr_t ppa_dma;
	__le64 *metadata = NULL;
	dma_addr_t metadata_dma;
	int ret = 0;

	rq = nvme_alloc_request(q, (struct nvme_command *)vcmd, 0,
			NVME_QID_ANY);
	if (IS_ERR(rq))
		return PTR_ERR(rq);	/* keep the real reason, not -ENOMEM */

	rq->timeout = timeout ? timeout : ADMIN_TIMEOUT;

	if (ppa_buf && ppa_len) {
		/* ppa_len + 1 entries are copied; they must fit in one element */
		if (ppa_len >= PAGE_SIZE / sizeof(u64)) {
			ret = -EINVAL;
			goto err_rq;
		}
		ppa_list = dma_pool_alloc(dev->dma_pool, GFP_KERNEL, &ppa_dma);
		if (!ppa_list) {
			ret = -ENOMEM;
			goto err_rq;
		}
		if (copy_from_user(ppa_list, (void __user *)ppa_buf,
						sizeof(u64) * (ppa_len + 1))) {
			ret = -EFAULT;
			goto err_ppa;
		}
		vcmd->ph_rw.spba = cpu_to_le64(ppa_dma);
	} else {
		vcmd->ph_rw.spba = cpu_to_le64((uintptr_t)ppa_buf);
	}

	if (ubuf && bufflen) {
		ret = blk_rq_map_user(q, rq, NULL, ubuf, bufflen, GFP_KERNEL);
		if (ret)
			goto err_ppa;
		bio = rq->bio;

		if (meta_buf && meta_len) {
			/* metadata is staged in a single pool element */
			if (meta_len > PAGE_SIZE) {
				ret = -EINVAL;
				goto err_map;
			}
			metadata = dma_pool_alloc(dev->dma_pool, GFP_KERNEL,
								&metadata_dma);
			if (!metadata) {
				ret = -ENOMEM;
				goto err_map;
			}

			if (write) {
				if (copy_from_user(metadata,
						(void __user *)meta_buf,
						meta_len)) {
					ret = -EFAULT;
					goto err_meta;
				}
			}
			vcmd->ph_rw.metadata = cpu_to_le64(metadata_dma);
		}

		bio->bi_disk = disk;
	}

	blk_execute_rq(q, NULL, rq, 0);

	if (nvme_req(rq)->flags & NVME_REQ_CANCELLED)
		ret = -EINTR;
	else if (nvme_req(rq)->status & 0x7ff)
		ret = -EIO;
	if (result)
		*result = nvme_req(rq)->status & 0x7ff;
	if (status)
		*status = le64_to_cpu(nvme_req(rq)->result.u64);

	if (metadata && !ret && !write) {
		if (copy_to_user(meta_buf, (void *)metadata, meta_len))
			ret = -EFAULT;
	}
err_meta:
	/*
	 * Free only what was actually allocated: metadata stays NULL when no
	 * data buffer was supplied, even if meta_buf/meta_len are set.
	 */
	if (metadata)
		dma_pool_free(dev->dma_pool, metadata, metadata_dma);
err_map:
	if (bio)
		blk_rq_unmap_user(bio);
err_ppa:
	if (ppa_list)
		dma_pool_free(dev->dma_pool, ppa_list, ppa_dma);
err_rq:
	blk_mq_free_request(rq);
	return ret;
}

/*
 * Handle NVME_NVM_IOCTL_SUBMIT_VIO: build a physical read/write command
 * from the user's nvm_user_vio and execute it on the namespace queue.
 *
 * Returns -EFAULT if the descriptor cannot be copied, -EINVAL if any flag
 * is set, otherwise the result of nvme_nvm_submit_user_cmd().
 *
 * NOTE(review): result and status are copied back to user space only when
 * the command returns non-zero - confirm this is intended.
 */
static int nvme_nvm_submit_vio(struct nvme_ns *ns,
					struct nvm_user_vio __user *uvio)
{
	struct nvm_user_vio vio;
	struct nvme_nvm_command c;
	unsigned int length;
	int ret;

	if (copy_from_user(&vio, uvio, sizeof(vio)))
		return -EFAULT;
	if (vio.flags)
		return -EINVAL;

	/* nppas is passed through as-is; the data covers nppas + 1 sectors */
	length = (vio.nppas + 1) << ns->lba_shift;

	memset(&c, 0, sizeof(c));
	c.ph_rw.opcode = vio.opcode;
	c.ph_rw.nsid = cpu_to_le32(ns->head->ns_id);
	c.ph_rw.control = cpu_to_le16(vio.control);
	c.ph_rw.length = cpu_to_le16(vio.nppas);

	ret = nvme_nvm_submit_user_cmd(ns->queue, ns, &c,
			(void __user *)(uintptr_t)vio.addr, length,
			(void __user *)(uintptr_t)vio.metadata,
							vio.metadata_len,
			(void __user *)(uintptr_t)vio.ppa_list, vio.nppas,
			&vio.result, &vio.status, 0);

	if (ret && copy_to_user(uvio, &vio, sizeof(vio)))
		return -EFAULT;

	return ret;
}

/*
 * Handle the passthrough ioctls: build a command from the user's
 * nvm_passthru_vio and execute it on the admin queue (@admin non-zero) or
 * on the namespace queue.
 *
 * Every opcode except 0xF2 requires CAP_SYS_ADMIN.
 *
 * Returns -EFAULT if the descriptor cannot be copied, -EACCES if the caller
 * lacks the capability, -EINVAL if any flag is set, otherwise the result of
 * nvme_nvm_submit_user_cmd().
 */
static int nvme_nvm_user_vcmd(struct nvme_ns *ns, int admin,
					struct nvm_passthru_vio __user *uvcmd)
{
	struct nvm_passthru_vio vcmd;
	struct nvme_nvm_command c;
	struct request_queue *q;
	unsigned int timeout = 0;
	int ret;

	if (copy_from_user(&vcmd, uvcmd, sizeof(vcmd)))
		return -EFAULT;
	/* 0xF2 has the same value as nvme_nvm_admin_get_bb_tbl */
	if (vcmd.opcode != 0xF2 && !capable(CAP_SYS_ADMIN))
		return -EACCES;
	if (vcmd.flags)
		return -EINVAL;

	memset(&c, 0, sizeof(c));
	c.common.opcode = vcmd.opcode;
	c.common.nsid = cpu_to_le32(ns->head->ns_id);
	c.common.cdw2[0] = cpu_to_le32(vcmd.cdw2);
	c.common.cdw2[1] = cpu_to_le32(vcmd.cdw3);
	/* cdw11-12 */
	c.ph_rw.length = cpu_to_le16(vcmd.nppas);
	c.ph_rw.control  = cpu_to_le16(vcmd.control);
	c.common.cdw10[3] = cpu_to_le32(vcmd.cdw13);
	c.common.cdw10[4] = cpu_to_le32(vcmd.cdw14);
	c.common.cdw10[5] = cpu_to_le32(vcmd.cdw15);

	/* a zero timeout_ms leaves the choice to the submit helper */
	if (vcmd.timeout_ms)
		timeout = msecs_to_jiffies(vcmd.timeout_ms);

	if (admin)
		q = ns->ctrl->admin_q;
	else
		q = ns->queue;

	ret = nvme_nvm_submit_user_cmd(q, ns, &c,
			(void __user *)(uintptr_t)vcmd.addr, vcmd.data_len,
			(void __user *)(uintptr_t)vcmd.metadata,
							vcmd.metadata_len,
			(void __user *)(uintptr_t)vcmd.ppa_list, vcmd.nppas,
			&vcmd.result, &vcmd.status, timeout);

	if (ret && copy_to_user(uvcmd, &vcmd, sizeof(vcmd)))
		return -EFAULT;

	return ret;
}

int nvme_nvm_ioctl(struct nvme_ns *ns, unsigned int cmd, unsigned long arg)
{
	switch (cmd) {
	case NVME_NVM_IOCTL_ADMIN_VIO:
		return nvme_nvm_user_vcmd(ns, 1, (void __user *)arg);
	case NVME_NVM_IOCTL_IO_VIO:
		return nvme_nvm_user_vcmd(ns, 0, (void __user *)arg);
	case NVME_NVM_IOCTL_SUBMIT_VIO:
		return nvme_nvm_submit_vio(ns, (void __user *)arg);
	default:
		return -ENOTTY;
	}
}

869 870 871
void nvme_nvm_update_nvm_info(struct nvme_ns *ns)
{
	struct nvm_dev *ndev = ns->ndev;
872
	struct nvm_geo *geo = &ndev->geo;
873

874 875
	geo->csecs = 1 << ns->lba_shift;
	geo->sos = ns->ms;
876 877
}

878
int nvme_nvm_register(struct nvme_ns *ns, char *disk_name, int node)
M
Matias Bjørling 已提交
879
{
880 881 882
	struct request_queue *q = ns->queue;
	struct nvm_dev *dev;

883 884
	_nvme_nvm_check_size();

885 886 887 888 889 890 891
	dev = nvm_alloc_dev(node);
	if (!dev)
		return -ENOMEM;

	dev->q = q;
	memcpy(dev->name, disk_name, DISK_NAME_LEN);
	dev->ops = &nvme_nvm_dev_ops;
892
	dev->private_data = ns;
893 894
	ns->ndev = dev;

895
	return nvm_register(dev);
M
Matias Bjørling 已提交
896 897
}

898
void nvme_nvm_unregister(struct nvme_ns *ns)
M
Matias Bjørling 已提交
899
{
900
	nvm_unregister(ns->ndev);
M
Matias Bjørling 已提交
901 902
}

903
static ssize_t nvm_dev_attr_show(struct device *dev,
904
		struct device_attribute *dattr, char *page)
905 906 907
{
	struct nvme_ns *ns = nvme_get_ns_from_dev(dev);
	struct nvm_dev *ndev = ns->ndev;
908
	struct nvm_geo *geo = &ndev->geo;
909 910 911 912 913 914 915 916
	struct attribute *attr;

	if (!ndev)
		return 0;

	attr = &dattr->attr;

	if (strcmp(attr->name, "version") == 0) {
917
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->ver_id);
918
	} else if (strcmp(attr->name, "capabilities") == 0) {
919
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->cap);
920
	} else if (strcmp(attr->name, "read_typ") == 0) {
921
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->trdt);
922
	} else if (strcmp(attr->name, "read_max") == 0) {
923
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->trdm);
924 925 926 927 928 929 930 931
	} else {
		return scnprintf(page,
				 PAGE_SIZE,
				 "Unhandled attr(%s) in `nvm_dev_attr_show`\n",
				 attr->name);
	}
}

932 933 934 935 936 937 938 939 940 941 942 943
/*
 * Format the 1.2 address format into @page as "0x" followed by twelve
 * two-digit hex values: offset then length for channel, LUN, plane, block,
 * page and sector, in that order.  Returns the number of bytes written.
 */
static ssize_t nvm_dev_attr_show_ppaf(struct nvm_addrf_12 *ppaf, char *page)
{
	return scnprintf(page, PAGE_SIZE,
		"0x%02x%02x%02x%02x%02x%02x%02x%02x%02x%02x%02x%02x\n",
				ppaf->ch_offset, ppaf->ch_len,
				ppaf->lun_offset, ppaf->lun_len,
				ppaf->pln_offset, ppaf->pln_len,
				ppaf->blk_offset, ppaf->blk_len,
				ppaf->pg_offset, ppaf->pg_len,
				ppaf->sect_offset, ppaf->sect_len);
}

944 945 946 947 948
static ssize_t nvm_dev_attr_show_12(struct device *dev,
		struct device_attribute *dattr, char *page)
{
	struct nvme_ns *ns = nvme_get_ns_from_dev(dev);
	struct nvm_dev *ndev = ns->ndev;
949
	struct nvm_geo *geo = &ndev->geo;
950 951 952 953 954 955 956 957
	struct attribute *attr;

	if (!ndev)
		return 0;

	attr = &dattr->attr;

	if (strcmp(attr->name, "vendor_opcode") == 0) {
958
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->vmnt);
959
	} else if (strcmp(attr->name, "device_mode") == 0) {
960
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->dom);
961
	/* kept for compatibility */
962
	} else if (strcmp(attr->name, "media_manager") == 0) {
963
		return scnprintf(page, PAGE_SIZE, "%s\n", "gennvm");
964
	} else if (strcmp(attr->name, "ppa_format") == 0) {
965
		return nvm_dev_attr_show_ppaf((void *)&geo->addrf, page);
966
	} else if (strcmp(attr->name, "media_type") == 0) {	/* u8 */
967
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->mtype);
968
	} else if (strcmp(attr->name, "flash_media_type") == 0) {
969
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->fmtype);
970
	} else if (strcmp(attr->name, "num_channels") == 0) {
971
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->nr_chnls);
972
	} else if (strcmp(attr->name, "num_luns") == 0) {
973
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->nr_luns);
974
	} else if (strcmp(attr->name, "num_planes") == 0) {
975
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->num_pln);
976
	} else if (strcmp(attr->name, "num_blocks") == 0) {	/* u16 */
977
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->nr_chks);
978
	} else if (strcmp(attr->name, "num_pages") == 0) {
979
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->num_pg);
980
	} else if (strcmp(attr->name, "page_size") == 0) {
981
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->fpg_sz);
982
	} else if (strcmp(attr->name, "hw_sector_size") == 0) {
983
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->csecs);
984
	} else if (strcmp(attr->name, "oob_sector_size") == 0) {/* u32 */
985
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->sos);
986
	} else if (strcmp(attr->name, "prog_typ") == 0) {
987
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->tprt);
988
	} else if (strcmp(attr->name, "prog_max") == 0) {
989
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->tprm);
990
	} else if (strcmp(attr->name, "erase_typ") == 0) {
991
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->tbet);
992
	} else if (strcmp(attr->name, "erase_max") == 0) {
993
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->tbem);
994
	} else if (strcmp(attr->name, "multiplane_modes") == 0) {
995
		return scnprintf(page, PAGE_SIZE, "0x%08x\n", geo->mpos);
996
	} else if (strcmp(attr->name, "media_capabilities") == 0) {
997
		return scnprintf(page, PAGE_SIZE, "0x%08x\n", geo->mccap);
998
	} else if (strcmp(attr->name, "max_phys_secs") == 0) {
999
		return scnprintf(page, PAGE_SIZE, "%u\n", NVM_MAX_VLBA);
1000
	} else {
1001 1002 1003
		return scnprintf(page, PAGE_SIZE,
			"Unhandled attr(%s) in `nvm_dev_attr_show_12`\n",
			attr->name);
1004 1005 1006
	}
}

1007 1008 1009 1010 1011
static ssize_t nvm_dev_attr_show_20(struct device *dev,
		struct device_attribute *dattr, char *page)
{
	struct nvme_ns *ns = nvme_get_ns_from_dev(dev);
	struct nvm_dev *ndev = ns->ndev;
1012
	struct nvm_geo *geo = &ndev->geo;
1013 1014 1015 1016 1017 1018 1019 1020
	struct attribute *attr;

	if (!ndev)
		return 0;

	attr = &dattr->attr;

	if (strcmp(attr->name, "groups") == 0) {
1021
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->nr_chnls);
1022
	} else if (strcmp(attr->name, "punits") == 0) {
1023
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->nr_luns);
1024
	} else if (strcmp(attr->name, "chunks") == 0) {
1025
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->nr_chks);
1026
	} else if (strcmp(attr->name, "clba") == 0) {
1027
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->clba);
1028
	} else if (strcmp(attr->name, "ws_min") == 0) {
1029
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->ws_min);
1030
	} else if (strcmp(attr->name, "ws_opt") == 0) {
1031
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->ws_opt);
1032
	} else if (strcmp(attr->name, "mw_cunits") == 0) {
1033
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->mw_cunits);
1034
	} else if (strcmp(attr->name, "write_typ") == 0) {
1035
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->tprt);
1036
	} else if (strcmp(attr->name, "write_max") == 0) {
1037
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->tprm);
1038
	} else if (strcmp(attr->name, "reset_typ") == 0) {
1039
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->tbet);
1040
	} else if (strcmp(attr->name, "reset_max") == 0) {
1041
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->tbem);
1042
	} else {
1043 1044 1045
		return scnprintf(page, PAGE_SIZE,
			"Unhandled attr(%s) in `nvm_dev_attr_show_20`\n",
			attr->name);
1046 1047 1048 1049
	}
}

/*
 * Declare a read-only (mode 0444) device attribute called _name.  The three
 * variants differ only in the show handler they install:
 * nvm_dev_attr_show, nvm_dev_attr_show_12 or nvm_dev_attr_show_20.
 * No store handler is provided.
 */
#define NVM_DEV_ATTR_RO(_name)					\
	DEVICE_ATTR(_name, 0444, nvm_dev_attr_show, NULL)
#define NVM_DEV_ATTR_12_RO(_name)					\
	DEVICE_ATTR(_name, 0444, nvm_dev_attr_show_12, NULL)
#define NVM_DEV_ATTR_20_RO(_name)					\
	DEVICE_ATTR(_name, 0444, nvm_dev_attr_show_20, NULL)
1055

1056
/* general attributes */
static NVM_DEV_ATTR_RO(version);
static NVM_DEV_ATTR_RO(capabilities);

/* referenced from both nvm_dev_attrs_12 and nvm_dev_attrs_20 */
static NVM_DEV_ATTR_RO(read_typ);
static NVM_DEV_ATTR_RO(read_max);
1062 1063 1064 1065 1066 1067 1068 1069 1070 1071 1072 1073 1074 1075 1076 1077 1078 1079 1080 1081 1082 1083 1084 1085 1086

/*
 * 1.2 values.  Each attribute is served by nvm_dev_attr_show_12() and is
 * declared here in the order it is listed in nvm_dev_attrs_12.
 */
static NVM_DEV_ATTR_12_RO(vendor_opcode);
static NVM_DEV_ATTR_12_RO(device_mode);
static NVM_DEV_ATTR_12_RO(media_manager);
static NVM_DEV_ATTR_12_RO(ppa_format);
static NVM_DEV_ATTR_12_RO(media_type);
static NVM_DEV_ATTR_12_RO(flash_media_type);

static NVM_DEV_ATTR_12_RO(num_channels);
static NVM_DEV_ATTR_12_RO(num_luns);
static NVM_DEV_ATTR_12_RO(num_planes);
static NVM_DEV_ATTR_12_RO(num_blocks);
static NVM_DEV_ATTR_12_RO(num_pages);

static NVM_DEV_ATTR_12_RO(page_size);
static NVM_DEV_ATTR_12_RO(hw_sector_size);
static NVM_DEV_ATTR_12_RO(oob_sector_size);

static NVM_DEV_ATTR_12_RO(prog_typ);
static NVM_DEV_ATTR_12_RO(prog_max);
static NVM_DEV_ATTR_12_RO(erase_typ);
static NVM_DEV_ATTR_12_RO(erase_max);

static NVM_DEV_ATTR_12_RO(multiplane_modes);
static NVM_DEV_ATTR_12_RO(media_capabilities);
static NVM_DEV_ATTR_12_RO(max_phys_secs);

static struct attribute *nvm_dev_attrs_12[] = {
1087 1088
	&dev_attr_version.attr,
	&dev_attr_capabilities.attr,
1089 1090

	&dev_attr_vendor_opcode.attr,
1091 1092 1093 1094 1095 1096 1097 1098 1099 1100 1101 1102 1103 1104 1105 1106 1107 1108 1109 1110 1111 1112
	&dev_attr_device_mode.attr,
	&dev_attr_media_manager.attr,
	&dev_attr_ppa_format.attr,
	&dev_attr_media_type.attr,
	&dev_attr_flash_media_type.attr,
	&dev_attr_num_channels.attr,
	&dev_attr_num_luns.attr,
	&dev_attr_num_planes.attr,
	&dev_attr_num_blocks.attr,
	&dev_attr_num_pages.attr,
	&dev_attr_page_size.attr,
	&dev_attr_hw_sector_size.attr,
	&dev_attr_oob_sector_size.attr,
	&dev_attr_read_typ.attr,
	&dev_attr_read_max.attr,
	&dev_attr_prog_typ.attr,
	&dev_attr_prog_max.attr,
	&dev_attr_erase_typ.attr,
	&dev_attr_erase_max.attr,
	&dev_attr_multiplane_modes.attr,
	&dev_attr_media_capabilities.attr,
	&dev_attr_max_phys_secs.attr,
1113

1114 1115 1116
	NULL,
};

1117
static const struct attribute_group nvm_dev_attr_group_12 = {
1118
	.name		= "lightnvm",
1119 1120 1121 1122 1123 1124 1125 1126 1127 1128 1129 1130 1131 1132 1133 1134 1135 1136 1137 1138 1139 1140 1141 1142 1143 1144 1145 1146 1147 1148 1149 1150 1151 1152 1153 1154 1155 1156 1157 1158 1159
	.attrs		= nvm_dev_attrs_12,
};

/*
 * 2.0 values.  NVM_DEV_ATTR_20_RO() wires each of these to
 * nvm_dev_attr_show_20(), which picks the value to print by attribute name.
 */
static NVM_DEV_ATTR_20_RO(groups);
static NVM_DEV_ATTR_20_RO(punits);
static NVM_DEV_ATTR_20_RO(chunks);
static NVM_DEV_ATTR_20_RO(clba);
static NVM_DEV_ATTR_20_RO(ws_min);
static NVM_DEV_ATTR_20_RO(ws_opt);
static NVM_DEV_ATTR_20_RO(mw_cunits);
static NVM_DEV_ATTR_20_RO(write_typ);
static NVM_DEV_ATTR_20_RO(write_max);
static NVM_DEV_ATTR_20_RO(reset_typ);
static NVM_DEV_ATTR_20_RO(reset_max);

/*
 * Attribute table used by nvm_dev_attr_group_20.  The trailing NULL
 * terminates the list.
 */
static struct attribute *nvm_dev_attrs_20[] = {
	/* declared with NVM_DEV_ATTR_RO; also listed in nvm_dev_attrs_12 */
	&dev_attr_version.attr,
	&dev_attr_capabilities.attr,

	/* declared with NVM_DEV_ATTR_20_RO */
	&dev_attr_groups.attr,
	&dev_attr_punits.attr,
	&dev_attr_chunks.attr,
	&dev_attr_clba.attr,
	&dev_attr_ws_min.attr,
	&dev_attr_ws_opt.attr,
	&dev_attr_mw_cunits.attr,

	/* read_* come from NVM_DEV_ATTR_RO, the rest from NVM_DEV_ATTR_20_RO */
	&dev_attr_read_typ.attr,
	&dev_attr_read_max.attr,
	&dev_attr_write_typ.attr,
	&dev_attr_write_max.attr,
	&dev_attr_reset_typ.attr,
	&dev_attr_reset_max.attr,

	NULL,
};

/*
 * Named attribute group for version-2 geometry; registered and removed by
 * nvme_nvm_register_sysfs() / nvme_nvm_unregister_sysfs() when ver_id is 2.
 */
static const struct attribute_group nvm_dev_attr_group_20 = {
	.name		= "lightnvm",
	.attrs		= nvm_dev_attrs_20,
};

int nvme_nvm_register_sysfs(struct nvme_ns *ns)
{
1164 1165 1166 1167
	struct nvm_dev *ndev = ns->ndev;
	struct nvm_geo *geo = &ndev->geo;

	if (!ndev)
1168 1169
		return -EINVAL;

1170
	switch (geo->ver_id) {
1171 1172 1173 1174 1175 1176 1177 1178 1179
	case 1:
		return sysfs_create_group(&disk_to_dev(ns->disk)->kobj,
					&nvm_dev_attr_group_12);
	case 2:
		return sysfs_create_group(&disk_to_dev(ns->disk)->kobj,
					&nvm_dev_attr_group_20);
	}

	return -EINVAL;
1180 1181 1182 1183
}

void nvme_nvm_unregister_sysfs(struct nvme_ns *ns)
{
1184 1185 1186 1187
	struct nvm_dev *ndev = ns->ndev;
	struct nvm_geo *geo = &ndev->geo;

	switch (geo->ver_id) {
1188 1189 1190 1191 1192 1193 1194 1195 1196
	case 1:
		sysfs_remove_group(&disk_to_dev(ns->disk)->kobj,
					&nvm_dev_attr_group_12);
		break;
	case 2:
		sysfs_remove_group(&disk_to_dev(ns->disk)->kobj,
					&nvm_dev_attr_group_20);
		break;
	}
1197
}