// SPDX-License-Identifier: GPL-2.0
/*
 * nvme-lightnvm.c - LightNVM NVMe device
 *
 * Copyright (C) 2014-2015 IT University of Copenhagen
 * Initial release: Matias Bjorling <mb@lightnvm.io>
 */

#include "nvme.h"

#include <linux/nvme.h>
#include <linux/bitops.h>
#include <linux/lightnvm.h>
#include <linux/vmalloc.h>
#include <linux/sched/sysctl.h>
#include <uapi/linux/lightnvm.h>

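/*
 * Vendor-specific admin opcodes implemented by open-channel (OCSSD 1.2)
 * devices on top of the regular NVMe admin command set.
 */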
enum nvme_nvm_admin_opcode {
	nvme_nvm_admin_identity		= 0xe2,
	nvme_nvm_admin_get_bb_tbl	= 0xf2,
	nvme_nvm_admin_set_bb_tbl	= 0xf1,
};

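/*
 * 2.0 log page identifier for the chunk information log, fetched through
 * the standard Get Log Page admin command.
 */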
enum nvme_nvm_log_page {
	NVME_NVM_LOG_REPORT_CHUNK	= 0xca,
};

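/*
 * The command structures below mirror the 64-byte NVMe command layout.
 * For the physical read/write command, spba holds either a single physical
 * page address or the DMA address of a PPA list for vector I/O.
 */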
struct nvme_nvm_ph_rw {
	__u8			opcode;
	__u8			flags;
	__u16			command_id;
	__le32			nsid;
	__u64			rsvd2;
	__le64			metadata;
	__le64			prp1;
	__le64			prp2;
	__le64			spba;
	__le16			length;
	__le16			control;
	__le32			dsmgmt;
	__le64			resv;
};

struct nvme_nvm_erase_blk {
	__u8			opcode;
	__u8			flags;
	__u16			command_id;
	__le32			nsid;
	__u64			rsvd[2];
	__le64			prp1;
	__le64			prp2;
	__le64			spba;
	__le16			length;
	__le16			control;
	__le32			dsmgmt;
	__le64			resv;
};

struct nvme_nvm_identity {
	__u8			opcode;
	__u8			flags;
	__u16			command_id;
	__le32			nsid;
	__u64			rsvd[2];
	__le64			prp1;
	__le64			prp2;
	__u32			rsvd11[6];
};

struct nvme_nvm_getbbtbl {
	__u8			opcode;
	__u8			flags;
	__u16			command_id;
	__le32			nsid;
	__u64			rsvd[2];
	__le64			prp1;
	__le64			prp2;
	__le64			spba;
	__u32			rsvd4[4];
};

struct nvme_nvm_setbbtbl {
	__u8			opcode;
	__u8			flags;
	__u16			command_id;
	__le32			nsid;
	__le64			rsvd[2];
	__le64			prp1;
	__le64			prp2;
	__le64			spba;
	__le16			nlb;
	__u8			value;
	__u8			rsvd3;
	__u32			rsvd4[3];
};

struct nvme_nvm_command {
	union {
		struct nvme_common_command common;
		struct nvme_nvm_ph_rw ph_rw;
		struct nvme_nvm_erase_blk erase;
		struct nvme_nvm_identity identity;
		struct nvme_nvm_getbbtbl get_bb;
		struct nvme_nvm_setbbtbl set_bb;
	};
};

struct nvme_nvm_id12_grp {
	__u8			mtype;
	__u8			fmtype;
	__le16			res16;
	__u8			num_ch;
	__u8			num_lun;
	__u8			num_pln;
	__u8			rsvd1;
	__le16			num_chk;
	__le16			num_pg;
	__le16			fpg_sz;
	__le16			csecs;
	__le16			sos;
	__le16			rsvd2;
	__le32			trdt;
	__le32			trdm;
	__le32			tprt;
	__le32			tprm;
	__le32			tbet;
	__le32			tbem;
	__le32			mpos;
	__le32			mccap;
	__le16			cpar;
	__u8			reserved[906];
} __packed;

struct nvme_nvm_id12_addrf {
	__u8			ch_offset;
	__u8			ch_len;
	__u8			lun_offset;
	__u8			lun_len;
	__u8			pln_offset;
	__u8			pln_len;
	__u8			blk_offset;
	__u8			blk_len;
	__u8			pg_offset;
	__u8			pg_len;
	__u8			sec_offset;
	__u8			sec_len;
	__u8			res[4];
} __packed;

struct nvme_nvm_id12 {
	__u8			ver_id;
	__u8			vmnt;
	__u8			cgrps;
	__u8			res;
	__le32			cap;
	__le32			dom;
	struct nvme_nvm_id12_addrf ppaf;
	__u8			resv[228];
	struct nvme_nvm_id12_grp grp;
	__u8			resv2[2880];
} __packed;

struct nvme_nvm_bb_tbl {
	__u8	tblid[4];
	__le16	verid;
	__le16	revid;
	__le32	rvsd1;
	__le32	tblks;
	__le32	tfact;
	__le32	tgrown;
	__le32	tdresv;
	__le32	thresv;
	__le32	rsvd2[8];
	__u8	blk[0];
};

struct nvme_nvm_id20_addrf {
	__u8			grp_len;
	__u8			pu_len;
	__u8			chk_len;
	__u8			lba_len;
	__u8			resv[4];
};

struct nvme_nvm_id20 {
	__u8			mjr;
	__u8			mnr;
	__u8			resv[6];

	struct nvme_nvm_id20_addrf lbaf;

	__le32			mccap;
	__u8			resv2[12];

	__u8			wit;
	__u8			resv3[31];

	/* Geometry */
	__le16			num_grp;
	__le16			num_pu;
	__le32			num_chk;
	__le32			clba;
	__u8			resv4[52];

	/* Write data requirements */
	__le32			ws_min;
	__le32			ws_opt;
	__le32			mw_cunits;
	__le32			maxoc;
	__le32			maxocpu;
	__u8			resv5[44];

	/* Performance related metrics */
	__le32			trdt;
	__le32			trdm;
	__le32			twrt;
	__le32			twrm;
	__le32			tcrst;
	__le32			tcrsm;
	__u8			resv6[40];

	/* Reserved area */
	__u8			resv7[2816];

	/* Vendor specific */
	__u8			vs[1024];
};

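/*
 * Per-chunk metadata entry as returned by the 2.0 chunk information log
 * page; it must stay in sync with the generic struct nvm_chk_meta (see the
 * BUILD_BUG_ON checks below).
 */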
struct nvme_nvm_chk_meta {
	__u8	state;
	__u8	type;
	__u8	wi;
	__u8	rsvd[5];
	__le64	slba;
	__le64	cnlb;
	__le64	wp;
};

/*
 * Check we didn't inadvertently grow the command struct
 */
static inline void _nvme_nvm_check_size(void)
{
	BUILD_BUG_ON(sizeof(struct nvme_nvm_identity) != 64);
	BUILD_BUG_ON(sizeof(struct nvme_nvm_ph_rw) != 64);
	BUILD_BUG_ON(sizeof(struct nvme_nvm_erase_blk) != 64);
	BUILD_BUG_ON(sizeof(struct nvme_nvm_getbbtbl) != 64);
	BUILD_BUG_ON(sizeof(struct nvme_nvm_setbbtbl) != 64);
	BUILD_BUG_ON(sizeof(struct nvme_nvm_id12_grp) != 960);
	BUILD_BUG_ON(sizeof(struct nvme_nvm_id12_addrf) != 16);
	BUILD_BUG_ON(sizeof(struct nvme_nvm_id12) != NVME_IDENTIFY_DATA_SIZE);
	BUILD_BUG_ON(sizeof(struct nvme_nvm_bb_tbl) != 64);
	BUILD_BUG_ON(sizeof(struct nvme_nvm_id20_addrf) != 8);
	BUILD_BUG_ON(sizeof(struct nvme_nvm_id20) != NVME_IDENTIFY_DATA_SIZE);
	BUILD_BUG_ON(sizeof(struct nvme_nvm_chk_meta) != 32);
	BUILD_BUG_ON(sizeof(struct nvme_nvm_chk_meta) !=
						sizeof(struct nvm_chk_meta));
}

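/*
 * Unpack the 1.2 PPA address format: copy each field's bit length and
 * offset as reported by the device and precompute the extraction mask,
 * ((1 << len) - 1) << offset, for every field.
 */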
static void nvme_nvm_set_addr_12(struct nvm_addrf_12 *dst,
				 struct nvme_nvm_id12_addrf *src)
{
	dst->ch_len = src->ch_len;
	dst->lun_len = src->lun_len;
	dst->blk_len = src->blk_len;
	dst->pg_len = src->pg_len;
	dst->pln_len = src->pln_len;
	dst->sec_len = src->sec_len;

	dst->ch_offset = src->ch_offset;
	dst->lun_offset = src->lun_offset;
	dst->blk_offset = src->blk_offset;
	dst->pg_offset = src->pg_offset;
	dst->pln_offset = src->pln_offset;
	dst->sec_offset = src->sec_offset;

	dst->ch_mask = ((1ULL << dst->ch_len) - 1) << dst->ch_offset;
	dst->lun_mask = ((1ULL << dst->lun_len) - 1) << dst->lun_offset;
	dst->blk_mask = ((1ULL << dst->blk_len) - 1) << dst->blk_offset;
	dst->pg_mask = ((1ULL << dst->pg_len) - 1) << dst->pg_offset;
	dst->pln_mask = ((1ULL << dst->pln_len) - 1) << dst->pln_offset;
	dst->sec_mask = ((1ULL << dst->sec_len) - 1) << dst->sec_offset;
}

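/* Translate a 1.2 identify geometry into the generic nvm_geo layout */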
static int nvme_nvm_setup_12(struct nvme_nvm_id12 *id,
			     struct nvm_geo *geo)
{
	struct nvme_nvm_id12_grp *src;
	int sec_per_pg, sec_per_pl, pg_per_blk;

	if (id->cgrps != 1)
		return -EINVAL;

	src = &id->grp;

	if (src->mtype != 0) {
		pr_err("nvm: memory type not supported\n");
		return -EINVAL;
	}

	/* 1.2 spec. only reports a single version id - unfold */
	geo->major_ver_id = id->ver_id;
	geo->minor_ver_id = 2;

	/* Set compacted version for upper layers */
	geo->version = NVM_OCSSD_SPEC_12;

	geo->num_ch = src->num_ch;
	geo->num_lun = src->num_lun;
	geo->all_luns = geo->num_ch * geo->num_lun;

	geo->num_chk = le16_to_cpu(src->num_chk);

	geo->csecs = le16_to_cpu(src->csecs);
	geo->sos = le16_to_cpu(src->sos);

	pg_per_blk = le16_to_cpu(src->num_pg);
	sec_per_pg = le16_to_cpu(src->fpg_sz) / geo->csecs;
	sec_per_pl = sec_per_pg * src->num_pln;
	geo->clba = sec_per_pl * pg_per_blk;

	geo->all_chunks = geo->all_luns * geo->num_chk;
	geo->total_secs = geo->clba * geo->all_chunks;

	geo->ws_min = sec_per_pg;
	geo->ws_opt = sec_per_pg;
	geo->mw_cunits = geo->ws_opt << 3;	/* default to MLC safe values */

	/* Do not impose values for the maximum number of open blocks, as they
	 * are unspecified in 1.2. Users of 1.2 devices must be aware of this
	 * and, if restrictions apply, specify the values through a quirk.
	 */
	geo->maxoc = geo->all_luns * geo->num_chk;
	geo->maxocpu = geo->num_chk;

	geo->mccap = le32_to_cpu(src->mccap);

	geo->trdt = le32_to_cpu(src->trdt);
	geo->trdm = le32_to_cpu(src->trdm);
	geo->tprt = le32_to_cpu(src->tprt);
	geo->tprm = le32_to_cpu(src->tprm);
	geo->tbet = le32_to_cpu(src->tbet);
	geo->tbem = le32_to_cpu(src->tbem);

	/* 1.2 compatibility */
	geo->vmnt = id->vmnt;
	geo->cap = le32_to_cpu(id->cap);
	geo->dom = le32_to_cpu(id->dom);

	geo->mtype = src->mtype;
	geo->fmtype = src->fmtype;

	geo->cpar = le16_to_cpu(src->cpar);
	geo->mpos = le32_to_cpu(src->mpos);

	geo->pln_mode = NVM_PLANE_SINGLE;

	if (geo->mpos & 0x020202) {
		geo->pln_mode = NVM_PLANE_DOUBLE;
		geo->ws_opt <<= 1;
	} else if (geo->mpos & 0x040404) {
		geo->pln_mode = NVM_PLANE_QUAD;
		geo->ws_opt <<= 2;
	}

	geo->num_pln = src->num_pln;
	geo->num_pg = le16_to_cpu(src->num_pg);
	geo->fpg_sz = le16_to_cpu(src->fpg_sz);

	nvme_nvm_set_addr_12((struct nvm_addrf_12 *)&geo->addrf, &id->ppaf);

	return 0;
}

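/*
 * Unpack the 2.0 LBA format. Unlike 1.2, the fields are packed
 * contiguously from bit 0: sector, then chunk, parallel unit and group.
 */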
static void nvme_nvm_set_addr_20(struct nvm_addrf *dst,
				 struct nvme_nvm_id20_addrf *src)
{
	dst->ch_len = src->grp_len;
	dst->lun_len = src->pu_len;
	dst->chk_len = src->chk_len;
	dst->sec_len = src->lba_len;

	dst->sec_offset = 0;
	dst->chk_offset = dst->sec_len;
	dst->lun_offset = dst->chk_offset + dst->chk_len;
	dst->ch_offset = dst->lun_offset + dst->lun_len;

	dst->ch_mask = ((1ULL << dst->ch_len) - 1) << dst->ch_offset;
	dst->lun_mask = ((1ULL << dst->lun_len) - 1) << dst->lun_offset;
	dst->chk_mask = ((1ULL << dst->chk_len) - 1) << dst->chk_offset;
	dst->sec_mask = ((1ULL << dst->sec_len) - 1) << dst->sec_offset;
}

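/* Translate a 2.0 identify geometry into the generic nvm_geo layout */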
static int nvme_nvm_setup_20(struct nvme_nvm_id20 *id,
			     struct nvm_geo *geo)
{
	geo->major_ver_id = id->mjr;
	geo->minor_ver_id = id->mnr;

	/* Set compacted version for upper layers */
	geo->version = NVM_OCSSD_SPEC_20;

	geo->num_ch = le16_to_cpu(id->num_grp);
	geo->num_lun = le16_to_cpu(id->num_pu);
	geo->all_luns = geo->num_ch * geo->num_lun;

	geo->num_chk = le32_to_cpu(id->num_chk);
	geo->clba = le32_to_cpu(id->clba);

	geo->all_chunks = geo->all_luns * geo->num_chk;
	geo->total_secs = geo->clba * geo->all_chunks;

	geo->ws_min = le32_to_cpu(id->ws_min);
	geo->ws_opt = le32_to_cpu(id->ws_opt);
	geo->mw_cunits = le32_to_cpu(id->mw_cunits);
	geo->maxoc = le32_to_cpu(id->maxoc);
	geo->maxocpu = le32_to_cpu(id->maxocpu);

	geo->trdt = le32_to_cpu(id->trdt);
	geo->trdm = le32_to_cpu(id->trdm);
	geo->tprt = le32_to_cpu(id->twrt);
	geo->tprm = le32_to_cpu(id->twrm);
	geo->tbet = le32_to_cpu(id->tcrst);
	geo->tbem = le32_to_cpu(id->tcrsm);

	nvme_nvm_set_addr_20(&geo->addrf, &id->lbaf);

	return 0;
}

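/*
 * Issue the vendor-specific identity admin command and set up the device
 * geometry according to the spec revision reported in the first byte.
 */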
static int nvme_nvm_identity(struct nvm_dev *nvmdev)
{
	struct nvme_ns *ns = nvmdev->q->queuedata;
	struct nvme_nvm_id12 *id;
	struct nvme_nvm_command c = {};
	int ret;

	c.identity.opcode = nvme_nvm_admin_identity;
	c.identity.nsid = cpu_to_le32(ns->head->ns_id);

	id = kmalloc(sizeof(struct nvme_nvm_id12), GFP_KERNEL);
	if (!id)
		return -ENOMEM;

	ret = nvme_submit_sync_cmd(ns->ctrl->admin_q, (struct nvme_command *)&c,
				id, sizeof(struct nvme_nvm_id12));
	if (ret) {
		ret = -EIO;
		goto out;
	}

	/*
	 * The 1.2 and 2.0 specifications share the first byte in their geometry
	 * command to make it possible to know what version a device implements.
	 */
	switch (id->ver_id) {
	case 1:
		ret = nvme_nvm_setup_12(id, &nvmdev->geo);
		break;
	case 2:
		ret = nvme_nvm_setup_20((struct nvme_nvm_id20 *)id,
							&nvmdev->geo);
		break;
	default:
		dev_err(ns->ctrl->device, "OCSSD revision not supported (%d)\n",
							id->ver_id);
		ret = -EINVAL;
	}

out:
	kfree(id);
	return ret;
}

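/* Read the 1.2 bad block table for the LUN addressed by ppa */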
static int nvme_nvm_get_bb_tbl(struct nvm_dev *nvmdev, struct ppa_addr ppa,
								u8 *blks)
{
	struct request_queue *q = nvmdev->q;
	struct nvm_geo *geo = &nvmdev->geo;
	struct nvme_ns *ns = q->queuedata;
	struct nvme_ctrl *ctrl = ns->ctrl;
	struct nvme_nvm_command c = {};
	struct nvme_nvm_bb_tbl *bb_tbl;
	int nr_blks = geo->num_chk * geo->num_pln;
	int tblsz = sizeof(struct nvme_nvm_bb_tbl) + nr_blks;
	int ret = 0;

	c.get_bb.opcode = nvme_nvm_admin_get_bb_tbl;
	c.get_bb.nsid = cpu_to_le32(ns->head->ns_id);
	c.get_bb.spba = cpu_to_le64(ppa.ppa);

	bb_tbl = kzalloc(tblsz, GFP_KERNEL);
	if (!bb_tbl)
		return -ENOMEM;

	ret = nvme_submit_sync_cmd(ctrl->admin_q, (struct nvme_command *)&c,
								bb_tbl, tblsz);
	if (ret) {
		dev_err(ctrl->device, "get bad block table failed (%d)\n", ret);
		ret = -EIO;
		goto out;
	}

	if (bb_tbl->tblid[0] != 'B' || bb_tbl->tblid[1] != 'B' ||
		bb_tbl->tblid[2] != 'L' || bb_tbl->tblid[3] != 'T') {
		dev_err(ctrl->device, "bbt format mismatch\n");
		ret = -EINVAL;
		goto out;
	}

	if (le16_to_cpu(bb_tbl->verid) != 1) {
		ret = -EINVAL;
		dev_err(ctrl->device, "bbt version not supported\n");
		goto out;
	}

	if (le32_to_cpu(bb_tbl->tblks) != nr_blks) {
		ret = -EINVAL;
		dev_err(ctrl->device,
				"bbt unexpected blocks returned (%u!=%u)\n",
				le32_to_cpu(bb_tbl->tblks), nr_blks);
		goto out;
	}

	memcpy(blks, bb_tbl->blk, geo->num_chk * geo->num_pln);
out:
	kfree(bb_tbl);
	return ret;
}

static int nvme_nvm_set_bb_tbl(struct nvm_dev *nvmdev, struct ppa_addr *ppas,
							int nr_ppas, int type)
{
	struct nvme_ns *ns = nvmdev->q->queuedata;
	struct nvme_nvm_command c = {};
	int ret = 0;

	c.set_bb.opcode = nvme_nvm_admin_set_bb_tbl;
	c.set_bb.nsid = cpu_to_le32(ns->head->ns_id);
	c.set_bb.spba = cpu_to_le64(ppas->ppa);
	c.set_bb.nlb = cpu_to_le16(nr_ppas - 1);
	c.set_bb.value = type;

	ret = nvme_submit_sync_cmd(ns->ctrl->admin_q, (struct nvme_command *)&c,
								NULL, 0);
	if (ret)
		dev_err(ns->ctrl->device, "set bad block table failed (%d)\n",
									ret);
	return ret;
}

/*
 * Expects the slba to be given in device format
 */
static int nvme_nvm_get_chk_meta(struct nvm_dev *ndev,
				 sector_t slba, int nchks,
				 struct nvm_chk_meta *meta)
{
	struct nvm_geo *geo = &ndev->geo;
	struct nvme_ns *ns = ndev->q->queuedata;
	struct nvme_ctrl *ctrl = ns->ctrl;
	struct nvme_nvm_chk_meta *dev_meta, *dev_meta_off;
	struct ppa_addr ppa;
	size_t left = nchks * sizeof(struct nvme_nvm_chk_meta);
	size_t log_pos, offset, len;
	int i, max_len;
	int ret = 0;

	/*
	 * Limit requests to a maximum of 256K to avoid issuing arbitrarily
	 * large requests when the device does not specify a maximum transfer
	 * size.
	 */
	max_len = min_t(unsigned int, ctrl->max_hw_sectors << 9, 256 * 1024);

	dev_meta = kmalloc(max_len, GFP_KERNEL);
	if (!dev_meta)
		return -ENOMEM;

	/* Normalize lba address space to obtain log offset */
	ppa.ppa = slba;
	ppa = dev_to_generic_addr(ndev, ppa);

	log_pos = ppa.m.chk;
	log_pos += ppa.m.pu * geo->num_chk;
	log_pos += ppa.m.grp * geo->num_lun * geo->num_chk;

	offset = log_pos * sizeof(struct nvme_nvm_chk_meta);

	while (left) {
		len = min_t(unsigned int, left, max_len);

		memset(dev_meta, 0, max_len);
		dev_meta_off = dev_meta;

		ret = nvme_get_log(ctrl, ns->head->ns_id,
				NVME_NVM_LOG_REPORT_CHUNK, 0, dev_meta, len,
				offset);
		if (ret) {
			dev_err(ctrl->device, "Get REPORT CHUNK log error\n");
			break;
		}

		for (i = 0; i < len; i += sizeof(struct nvme_nvm_chk_meta)) {
			meta->state = dev_meta_off->state;
			meta->type = dev_meta_off->type;
			meta->wi = dev_meta_off->wi;
			meta->slba = le64_to_cpu(dev_meta_off->slba);
			meta->cnlb = le64_to_cpu(dev_meta_off->cnlb);
			meta->wp = le64_to_cpu(dev_meta_off->wp);

			meta++;
			dev_meta_off++;
		}

		offset += len;
		left -= len;
	}

	kfree(dev_meta);

	return ret;
}

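/* Fill a 64-byte OCSSD I/O command from the generic nvm_rq descriptor */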
static inline void nvme_nvm_rqtocmd(struct nvm_rq *rqd, struct nvme_ns *ns,
				    struct nvme_nvm_command *c)
{
	c->ph_rw.opcode = rqd->opcode;
	c->ph_rw.nsid = cpu_to_le32(ns->head->ns_id);
	c->ph_rw.spba = cpu_to_le64(rqd->ppa_addr.ppa);
	c->ph_rw.metadata = cpu_to_le64(rqd->dma_meta_list);
	c->ph_rw.control = cpu_to_le16(rqd->flags);
	c->ph_rw.length = cpu_to_le16(rqd->nr_ppas - 1);
}

static void nvme_nvm_end_io(struct request *rq, blk_status_t status)
{
	struct nvm_rq *rqd = rq->end_io_data;

	rqd->ppa_status = le64_to_cpu(nvme_req(rq)->result.u64);
	rqd->error = nvme_req(rq)->status;
	nvm_end_io(rqd);

	kfree(nvme_req(rq)->cmd);
	blk_mq_free_request(rq);
}

static struct request *nvme_nvm_alloc_request(struct request_queue *q,
					      struct nvm_rq *rqd,
					      struct nvme_nvm_command *cmd)
{
	struct nvme_ns *ns = q->queuedata;
	struct request *rq;

	nvme_nvm_rqtocmd(rqd, ns, cmd);

	rq = nvme_alloc_request(q, (struct nvme_command *)cmd, 0, NVME_QID_ANY);
	if (IS_ERR(rq))
		return rq;

	rq->cmd_flags &= ~REQ_FAILFAST_DRIVER;

	if (rqd->bio)
		blk_init_request_from_bio(rq, rqd->bio);
	else
		rq->ioprio = IOPRIO_PRIO_VALUE(IOPRIO_CLASS_BE, IOPRIO_NORM);

	return rq;
}

static int nvme_nvm_submit_io(struct nvm_dev *dev, struct nvm_rq *rqd)
{
	struct request_queue *q = dev->q;
	struct nvme_nvm_command *cmd;
	struct request *rq;

	cmd = kzalloc(sizeof(struct nvme_nvm_command), GFP_KERNEL);
	if (!cmd)
		return -ENOMEM;

	rq = nvme_nvm_alloc_request(q, rqd, cmd);
	if (IS_ERR(rq)) {
		kfree(cmd);
		return PTR_ERR(rq);
	}

	rq->end_io_data = rqd;

	blk_execute_rq_nowait(q, NULL, rq, 0, nvme_nvm_end_io);

	return 0;
}

static int nvme_nvm_submit_io_sync(struct nvm_dev *dev, struct nvm_rq *rqd)
{
	struct request_queue *q = dev->q;
	struct request *rq;
	struct nvme_nvm_command cmd;
	int ret = 0;

	memset(&cmd, 0, sizeof(struct nvme_nvm_command));

	rq = nvme_nvm_alloc_request(q, rqd, &cmd);
	if (IS_ERR(rq))
		return PTR_ERR(rq);

	/* I/Os can fail and the error is signaled through rqd. Callers must
	 * handle the error accordingly.
	 */
	blk_execute_rq(q, NULL, rq, 0);
	if (nvme_req(rq)->flags & NVME_REQ_CANCELLED)
		ret = -EINTR;

	rqd->ppa_status = le64_to_cpu(nvme_req(rq)->result.u64);
	rqd->error = nvme_req(rq)->status;

	blk_mq_free_request(rq);

	return ret;
}

static void *nvme_nvm_create_dma_pool(struct nvm_dev *nvmdev, char *name,
					int size)
{
	struct nvme_ns *ns = nvmdev->q->queuedata;

	return dma_pool_create(name, ns->ctrl->dev, size, PAGE_SIZE, 0);
}

static void nvme_nvm_destroy_dma_pool(void *pool)
{
	struct dma_pool *dma_pool = pool;

	dma_pool_destroy(dma_pool);
}

static void *nvme_nvm_dev_dma_alloc(struct nvm_dev *dev, void *pool,
				    gfp_t mem_flags, dma_addr_t *dma_handler)
{
	return dma_pool_alloc(pool, mem_flags, dma_handler);
}

static void nvme_nvm_dev_dma_free(void *pool, void *addr,
							dma_addr_t dma_handler)
{
	dma_pool_free(pool, addr, dma_handler);
}

static struct nvm_dev_ops nvme_nvm_dev_ops = {
	.identity		= nvme_nvm_identity,

	.get_bb_tbl		= nvme_nvm_get_bb_tbl,
	.set_bb_tbl		= nvme_nvm_set_bb_tbl,

	.get_chk_meta		= nvme_nvm_get_chk_meta,

	.submit_io		= nvme_nvm_submit_io,
	.submit_io_sync		= nvme_nvm_submit_io_sync,

	.create_dma_pool	= nvme_nvm_create_dma_pool,
	.destroy_dma_pool	= nvme_nvm_destroy_dma_pool,
	.dev_dma_alloc		= nvme_nvm_dev_dma_alloc,
	.dev_dma_free		= nvme_nvm_dev_dma_free,
};

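/*
 * Common helper for the LightNVM ioctls below: build a passthrough
 * request, map the user data, metadata and PPA list buffers, execute the
 * command synchronously and copy the results back to user space.
 */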
static int nvme_nvm_submit_user_cmd(struct request_queue *q,
				struct nvme_ns *ns,
				struct nvme_nvm_command *vcmd,
				void __user *ubuf, unsigned int bufflen,
				void __user *meta_buf, unsigned int meta_len,
				void __user *ppa_buf, unsigned int ppa_len,
				u32 *result, u64 *status, unsigned int timeout)
{
	bool write = nvme_is_write((struct nvme_command *)vcmd);
	struct nvm_dev *dev = ns->ndev;
	struct gendisk *disk = ns->disk;
	struct request *rq;
	struct bio *bio = NULL;
	__le64 *ppa_list = NULL;
	dma_addr_t ppa_dma;
	__le64 *metadata = NULL;
	dma_addr_t metadata_dma;
	DECLARE_COMPLETION_ONSTACK(wait);
	int ret = 0;

	rq = nvme_alloc_request(q, (struct nvme_command *)vcmd, 0,
			NVME_QID_ANY);
	if (IS_ERR(rq)) {
		ret = -ENOMEM;
		goto err_cmd;
	}

	rq->timeout = timeout ? timeout : ADMIN_TIMEOUT;

	if (ppa_buf && ppa_len) {
		ppa_list = dma_pool_alloc(dev->dma_pool, GFP_KERNEL, &ppa_dma);
		if (!ppa_list) {
			ret = -ENOMEM;
			goto err_rq;
		}
		if (copy_from_user(ppa_list, (void __user *)ppa_buf,
						sizeof(u64) * (ppa_len + 1))) {
			ret = -EFAULT;
			goto err_ppa;
		}
		vcmd->ph_rw.spba = cpu_to_le64(ppa_dma);
	} else {
		vcmd->ph_rw.spba = cpu_to_le64((uintptr_t)ppa_buf);
	}

	if (ubuf && bufflen) {
		ret = blk_rq_map_user(q, rq, NULL, ubuf, bufflen, GFP_KERNEL);
		if (ret)
			goto err_ppa;
		bio = rq->bio;

		if (meta_buf && meta_len) {
			metadata = dma_pool_alloc(dev->dma_pool, GFP_KERNEL,
								&metadata_dma);
			if (!metadata) {
				ret = -ENOMEM;
				goto err_map;
			}

			if (write) {
				if (copy_from_user(metadata,
						(void __user *)meta_buf,
						meta_len)) {
					ret = -EFAULT;
					goto err_meta;
				}
			}
			vcmd->ph_rw.metadata = cpu_to_le64(metadata_dma);
		}

		bio->bi_disk = disk;
	}

	blk_execute_rq(q, NULL, rq, 0);

	if (nvme_req(rq)->flags & NVME_REQ_CANCELLED)
		ret = -EINTR;
	else if (nvme_req(rq)->status & 0x7ff)
		ret = -EIO;
	if (result)
		*result = nvme_req(rq)->status & 0x7ff;
	if (status)
		*status = le64_to_cpu(nvme_req(rq)->result.u64);

	if (metadata && !ret && !write) {
		if (copy_to_user(meta_buf, (void *)metadata, meta_len))
			ret = -EFAULT;
	}
err_meta:
	if (meta_buf && meta_len)
		dma_pool_free(dev->dma_pool, metadata, metadata_dma);
err_map:
	if (bio)
		blk_rq_unmap_user(bio);
err_ppa:
	if (ppa_buf && ppa_len)
		dma_pool_free(dev->dma_pool, ppa_list, ppa_dma);
err_rq:
	blk_mq_free_request(rq);
err_cmd:
	return ret;
}

static int nvme_nvm_submit_vio(struct nvme_ns *ns,
					struct nvm_user_vio __user *uvio)
{
	struct nvm_user_vio vio;
	struct nvme_nvm_command c;
	unsigned int length;
	int ret;

	if (copy_from_user(&vio, uvio, sizeof(vio)))
		return -EFAULT;
	if (vio.flags)
		return -EINVAL;

	memset(&c, 0, sizeof(c));
	c.ph_rw.opcode = vio.opcode;
	c.ph_rw.nsid = cpu_to_le32(ns->head->ns_id);
	c.ph_rw.control = cpu_to_le16(vio.control);
	c.ph_rw.length = cpu_to_le16(vio.nppas);

	length = (vio.nppas + 1) << ns->lba_shift;

	ret = nvme_nvm_submit_user_cmd(ns->queue, ns, &c,
			(void __user *)(uintptr_t)vio.addr, length,
			(void __user *)(uintptr_t)vio.metadata,
							vio.metadata_len,
			(void __user *)(uintptr_t)vio.ppa_list, vio.nppas,
			&vio.result, &vio.status, 0);

	if (ret && copy_to_user(uvio, &vio, sizeof(vio)))
		return -EFAULT;

	return ret;
}

static int nvme_nvm_user_vcmd(struct nvme_ns *ns, int admin,
					struct nvm_passthru_vio __user *uvcmd)
{
	struct nvm_passthru_vio vcmd;
	struct nvme_nvm_command c;
	struct request_queue *q;
	unsigned int timeout = 0;
	int ret;

	if (copy_from_user(&vcmd, uvcmd, sizeof(vcmd)))
		return -EFAULT;
	if ((vcmd.opcode != 0xF2) && (!capable(CAP_SYS_ADMIN)))
		return -EACCES;
	if (vcmd.flags)
		return -EINVAL;

	memset(&c, 0, sizeof(c));
	c.common.opcode = vcmd.opcode;
	c.common.nsid = cpu_to_le32(ns->head->ns_id);
	c.common.cdw2[0] = cpu_to_le32(vcmd.cdw2);
	c.common.cdw2[1] = cpu_to_le32(vcmd.cdw3);
	/* cdw11-12 */
	c.ph_rw.length = cpu_to_le16(vcmd.nppas);
	c.ph_rw.control = cpu_to_le16(vcmd.control);
	c.common.cdw13 = cpu_to_le32(vcmd.cdw13);
	c.common.cdw14 = cpu_to_le32(vcmd.cdw14);
	c.common.cdw15 = cpu_to_le32(vcmd.cdw15);

	if (vcmd.timeout_ms)
		timeout = msecs_to_jiffies(vcmd.timeout_ms);

	q = admin ? ns->ctrl->admin_q : ns->queue;

	ret = nvme_nvm_submit_user_cmd(q, ns,
			(struct nvme_nvm_command *)&c,
			(void __user *)(uintptr_t)vcmd.addr, vcmd.data_len,
			(void __user *)(uintptr_t)vcmd.metadata,
							vcmd.metadata_len,
			(void __user *)(uintptr_t)vcmd.ppa_list, vcmd.nppas,
			&vcmd.result, &vcmd.status, timeout);

	if (ret && copy_to_user(uvcmd, &vcmd, sizeof(vcmd)))
		return -EFAULT;

	return ret;
}

int nvme_nvm_ioctl(struct nvme_ns *ns, unsigned int cmd, unsigned long arg)
{
	switch (cmd) {
	case NVME_NVM_IOCTL_ADMIN_VIO:
		return nvme_nvm_user_vcmd(ns, 1, (void __user *)arg);
	case NVME_NVM_IOCTL_IO_VIO:
		return nvme_nvm_user_vcmd(ns, 0, (void __user *)arg);
	case NVME_NVM_IOCTL_SUBMIT_VIO:
		return nvme_nvm_submit_vio(ns, (void __user *)arg);
	default:
		return -ENOTTY;
	}
}

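/*
 * Register the namespace as an open-channel device; the detailed geometry
 * is filled in via the ->identity() callback from within nvm_register().
 */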
int nvme_nvm_register(struct nvme_ns *ns, char *disk_name, int node)
{
	struct request_queue *q = ns->queue;
	struct nvm_dev *dev;
	struct nvm_geo *geo;

	_nvme_nvm_check_size();

	dev = nvm_alloc_dev(node);
	if (!dev)
		return -ENOMEM;

	/* Note that csecs and sos will be overridden if it is a 1.2 drive. */
	geo = &dev->geo;
	geo->csecs = 1 << ns->lba_shift;
	geo->sos = ns->ms;
	geo->ext = ns->ext;

	dev->q = q;
	memcpy(dev->name, disk_name, DISK_NAME_LEN);
	dev->ops = &nvme_nvm_dev_ops;
	dev->private_data = ns;
	ns->ndev = dev;

	return nvm_register(dev);
}

void nvme_nvm_unregister(struct nvme_ns *ns)
{
	nvm_unregister(ns->ndev);
}

static ssize_t nvm_dev_attr_show(struct device *dev,
		struct device_attribute *dattr, char *page)
{
	struct nvme_ns *ns = nvme_get_ns_from_dev(dev);
	struct nvm_dev *ndev = ns->ndev;
	struct nvm_geo *geo = &ndev->geo;
	struct attribute *attr;

	if (!ndev)
		return 0;

	attr = &dattr->attr;

	if (strcmp(attr->name, "version") == 0) {
		if (geo->major_ver_id == 1)
			return scnprintf(page, PAGE_SIZE, "%u\n",
						geo->major_ver_id);
		else
			return scnprintf(page, PAGE_SIZE, "%u.%u\n",
						geo->major_ver_id,
						geo->minor_ver_id);
	} else if (strcmp(attr->name, "capabilities") == 0) {
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->cap);
	} else if (strcmp(attr->name, "read_typ") == 0) {
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->trdt);
	} else if (strcmp(attr->name, "read_max") == 0) {
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->trdm);
	} else {
		return scnprintf(page,
				 PAGE_SIZE,
				 "Unhandled attr(%s) in `%s`\n",
				 attr->name, __func__);
	}
}

static ssize_t nvm_dev_attr_show_ppaf(struct nvm_addrf_12 *ppaf, char *page)
{
	return scnprintf(page, PAGE_SIZE,
		"0x%02x%02x%02x%02x%02x%02x%02x%02x%02x%02x%02x%02x\n",
				ppaf->ch_offset, ppaf->ch_len,
				ppaf->lun_offset, ppaf->lun_len,
				ppaf->pln_offset, ppaf->pln_len,
				ppaf->blk_offset, ppaf->blk_len,
				ppaf->pg_offset, ppaf->pg_len,
				ppaf->sec_offset, ppaf->sec_len);
}

static ssize_t nvm_dev_attr_show_12(struct device *dev,
		struct device_attribute *dattr, char *page)
{
	struct nvme_ns *ns = nvme_get_ns_from_dev(dev);
	struct nvm_dev *ndev = ns->ndev;
	struct nvm_geo *geo = &ndev->geo;
	struct attribute *attr;

	if (!ndev)
		return 0;

	attr = &dattr->attr;

	if (strcmp(attr->name, "vendor_opcode") == 0) {
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->vmnt);
	} else if (strcmp(attr->name, "device_mode") == 0) {
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->dom);
	/* kept for compatibility */
	} else if (strcmp(attr->name, "media_manager") == 0) {
		return scnprintf(page, PAGE_SIZE, "%s\n", "gennvm");
	} else if (strcmp(attr->name, "ppa_format") == 0) {
		return nvm_dev_attr_show_ppaf((void *)&geo->addrf, page);
	} else if (strcmp(attr->name, "media_type") == 0) {	/* u8 */
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->mtype);
	} else if (strcmp(attr->name, "flash_media_type") == 0) {
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->fmtype);
	} else if (strcmp(attr->name, "num_channels") == 0) {
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->num_ch);
	} else if (strcmp(attr->name, "num_luns") == 0) {
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->num_lun);
	} else if (strcmp(attr->name, "num_planes") == 0) {
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->num_pln);
	} else if (strcmp(attr->name, "num_blocks") == 0) {	/* u16 */
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->num_chk);
	} else if (strcmp(attr->name, "num_pages") == 0) {
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->num_pg);
	} else if (strcmp(attr->name, "page_size") == 0) {
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->fpg_sz);
	} else if (strcmp(attr->name, "hw_sector_size") == 0) {
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->csecs);
	} else if (strcmp(attr->name, "oob_sector_size") == 0) {/* u32 */
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->sos);
	} else if (strcmp(attr->name, "prog_typ") == 0) {
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->tprt);
	} else if (strcmp(attr->name, "prog_max") == 0) {
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->tprm);
	} else if (strcmp(attr->name, "erase_typ") == 0) {
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->tbet);
	} else if (strcmp(attr->name, "erase_max") == 0) {
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->tbem);
	} else if (strcmp(attr->name, "multiplane_modes") == 0) {
		return scnprintf(page, PAGE_SIZE, "0x%08x\n", geo->mpos);
	} else if (strcmp(attr->name, "media_capabilities") == 0) {
		return scnprintf(page, PAGE_SIZE, "0x%08x\n", geo->mccap);
	} else if (strcmp(attr->name, "max_phys_secs") == 0) {
		return scnprintf(page, PAGE_SIZE, "%u\n", NVM_MAX_VLBA);
	} else {
		return scnprintf(page, PAGE_SIZE,
			"Unhandled attr(%s) in `%s`\n",
			attr->name, __func__);
	}
}

static ssize_t nvm_dev_attr_show_20(struct device *dev,
		struct device_attribute *dattr, char *page)
{
	struct nvme_ns *ns = nvme_get_ns_from_dev(dev);
	struct nvm_dev *ndev = ns->ndev;
	struct nvm_geo *geo = &ndev->geo;
	struct attribute *attr;

	if (!ndev)
		return 0;

	attr = &dattr->attr;

	if (strcmp(attr->name, "groups") == 0) {
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->num_ch);
	} else if (strcmp(attr->name, "punits") == 0) {
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->num_lun);
	} else if (strcmp(attr->name, "chunks") == 0) {
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->num_chk);
	} else if (strcmp(attr->name, "clba") == 0) {
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->clba);
	} else if (strcmp(attr->name, "ws_min") == 0) {
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->ws_min);
	} else if (strcmp(attr->name, "ws_opt") == 0) {
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->ws_opt);
	} else if (strcmp(attr->name, "maxoc") == 0) {
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->maxoc);
	} else if (strcmp(attr->name, "maxocpu") == 0) {
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->maxocpu);
	} else if (strcmp(attr->name, "mw_cunits") == 0) {
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->mw_cunits);
	} else if (strcmp(attr->name, "write_typ") == 0) {
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->tprt);
	} else if (strcmp(attr->name, "write_max") == 0) {
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->tprm);
	} else if (strcmp(attr->name, "reset_typ") == 0) {
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->tbet);
	} else if (strcmp(attr->name, "reset_max") == 0) {
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->tbem);
	} else {
		return scnprintf(page, PAGE_SIZE,
			"Unhandled attr(%s) in `%s`\n",
			attr->name, __func__);
	}
}

#define NVM_DEV_ATTR_RO(_name)					\
	DEVICE_ATTR(_name, S_IRUGO, nvm_dev_attr_show, NULL)
#define NVM_DEV_ATTR_12_RO(_name)					\
	DEVICE_ATTR(_name, S_IRUGO, nvm_dev_attr_show_12, NULL)
#define NVM_DEV_ATTR_20_RO(_name)					\
	DEVICE_ATTR(_name, S_IRUGO, nvm_dev_attr_show_20, NULL)

/* general attributes */
static NVM_DEV_ATTR_RO(version);
static NVM_DEV_ATTR_RO(capabilities);

static NVM_DEV_ATTR_RO(read_typ);
static NVM_DEV_ATTR_RO(read_max);

/* 1.2 values */
static NVM_DEV_ATTR_12_RO(vendor_opcode);
static NVM_DEV_ATTR_12_RO(device_mode);
static NVM_DEV_ATTR_12_RO(ppa_format);
static NVM_DEV_ATTR_12_RO(media_manager);
static NVM_DEV_ATTR_12_RO(media_type);
static NVM_DEV_ATTR_12_RO(flash_media_type);
static NVM_DEV_ATTR_12_RO(num_channels);
static NVM_DEV_ATTR_12_RO(num_luns);
static NVM_DEV_ATTR_12_RO(num_planes);
static NVM_DEV_ATTR_12_RO(num_blocks);
static NVM_DEV_ATTR_12_RO(num_pages);
static NVM_DEV_ATTR_12_RO(page_size);
static NVM_DEV_ATTR_12_RO(hw_sector_size);
static NVM_DEV_ATTR_12_RO(oob_sector_size);
static NVM_DEV_ATTR_12_RO(prog_typ);
static NVM_DEV_ATTR_12_RO(prog_max);
static NVM_DEV_ATTR_12_RO(erase_typ);
static NVM_DEV_ATTR_12_RO(erase_max);
static NVM_DEV_ATTR_12_RO(multiplane_modes);
static NVM_DEV_ATTR_12_RO(media_capabilities);
static NVM_DEV_ATTR_12_RO(max_phys_secs);

/* 2.0 values */
static NVM_DEV_ATTR_20_RO(groups);
static NVM_DEV_ATTR_20_RO(punits);
static NVM_DEV_ATTR_20_RO(chunks);
static NVM_DEV_ATTR_20_RO(clba);
static NVM_DEV_ATTR_20_RO(ws_min);
static NVM_DEV_ATTR_20_RO(ws_opt);
static NVM_DEV_ATTR_20_RO(maxoc);
static NVM_DEV_ATTR_20_RO(maxocpu);
static NVM_DEV_ATTR_20_RO(mw_cunits);
static NVM_DEV_ATTR_20_RO(write_typ);
static NVM_DEV_ATTR_20_RO(write_max);
static NVM_DEV_ATTR_20_RO(reset_typ);
static NVM_DEV_ATTR_20_RO(reset_max);

static struct attribute *nvm_dev_attrs[] = {
	/* version agnostic attrs */
	&dev_attr_version.attr,
	&dev_attr_capabilities.attr,
	&dev_attr_read_typ.attr,
	&dev_attr_read_max.attr,

	/* 1.2 attrs */
	&dev_attr_vendor_opcode.attr,
	&dev_attr_device_mode.attr,
	&dev_attr_media_manager.attr,
	&dev_attr_ppa_format.attr,
	&dev_attr_media_type.attr,
	&dev_attr_flash_media_type.attr,
	&dev_attr_num_channels.attr,
	&dev_attr_num_luns.attr,
	&dev_attr_num_planes.attr,
	&dev_attr_num_blocks.attr,
	&dev_attr_num_pages.attr,
	&dev_attr_page_size.attr,
	&dev_attr_hw_sector_size.attr,
	&dev_attr_oob_sector_size.attr,
	&dev_attr_prog_typ.attr,
	&dev_attr_prog_max.attr,
	&dev_attr_erase_typ.attr,
	&dev_attr_erase_max.attr,
	&dev_attr_multiplane_modes.attr,
	&dev_attr_media_capabilities.attr,
	&dev_attr_max_phys_secs.attr,

	/* 2.0 attrs */
	&dev_attr_groups.attr,
	&dev_attr_punits.attr,
	&dev_attr_chunks.attr,
	&dev_attr_clba.attr,
	&dev_attr_ws_min.attr,
	&dev_attr_ws_opt.attr,
	&dev_attr_maxoc.attr,
	&dev_attr_maxocpu.attr,
	&dev_attr_mw_cunits.attr,

	&dev_attr_write_typ.attr,
	&dev_attr_write_max.attr,
	&dev_attr_reset_typ.attr,
	&dev_attr_reset_max.attr,

	NULL,
};

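/*
 * Expose only the sysfs attributes that match the OCSSD revision the
 * device reports; version-agnostic attributes are always visible.
 */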
static umode_t nvm_dev_attrs_visible(struct kobject *kobj,
				     struct attribute *attr, int index)
{
	struct device *dev = container_of(kobj, struct device, kobj);
	struct gendisk *disk = dev_to_disk(dev);
	struct nvme_ns *ns = disk->private_data;
	struct nvm_dev *ndev = ns->ndev;
	struct device_attribute *dev_attr =
		container_of(attr, typeof(*dev_attr), attr);

	if (!ndev)
		return 0;

	if (dev_attr->show == nvm_dev_attr_show)
		return attr->mode;

	switch (ndev->geo.major_ver_id) {
	case 1:
		if (dev_attr->show == nvm_dev_attr_show_12)
			return attr->mode;
		break;
	case 2:
		if (dev_attr->show == nvm_dev_attr_show_20)
			return attr->mode;
		break;
	}

	return 0;
}

const struct attribute_group nvme_nvm_attr_group = {
	.name		= "lightnvm",
	.attrs		= nvm_dev_attrs,
	.is_visible	= nvm_dev_attrs_visible,
};