lightnvm.c 33.3 KB
Newer Older
M
Matias Bjørling 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28
/*
 * nvme-lightnvm.c - LightNVM NVMe device
 *
 * Copyright (C) 2014-2015 IT University of Copenhagen
 * Initial release: Matias Bjorling <mb@lightnvm.io>
 *
 * This program is free software; you can redistribute it and/or
 * modify it under the terms of the GNU General Public License version
 * 2 as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful, but
 * WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program; see the file COPYING.  If not, write to
 * the Free Software Foundation, 675 Mass Ave, Cambridge, MA 02139,
 * USA.
 *
 */

#include "nvme.h"

#include <linux/nvme.h>
#include <linux/bitops.h>
#include <linux/lightnvm.h>
#include <linux/vmalloc.h>
29 30
#include <linux/sched/sysctl.h>
#include <uapi/linux/lightnvm.h>
M
Matias Bjørling 已提交
31 32 33 34 35 36 37

/*
 * Admin opcodes this file places in the opcode field of the identity and
 * bad block table get/set commands it builds.
 */
enum nvme_nvm_admin_opcode {
	nvme_nvm_admin_identity		= 0xe2,
	nvme_nvm_admin_get_bb_tbl	= 0xf2,
	nvme_nvm_admin_set_bb_tbl	= 0xf1,
};

38 39 40 41
/* Log page identifier passed to nvme_get_log() when reading chunk metadata. */
enum nvme_nvm_log_page {
	NVME_NVM_LOG_REPORT_CHUNK	= 0xca,
};

M
Matias Bjørling 已提交
42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57
/*
 * Command layout used for I/O requests built by nvme_nvm_rqtocmd() and the
 * user vio paths. Must stay exactly 64 bytes (checked at build time in
 * _nvme_nvm_check_size()).
 */
struct nvme_nvm_ph_rw {
	__u8			opcode;
	__u8			flags;
	__u16			command_id;
	__le32			nsid;
	__u64			rsvd2;
	__le64			metadata;	/* DMA address of the metadata buffer */
	__le64			prp1;
	__le64			prp2;
	__le64			spba;		/* a ppa, or DMA address of a ppa list */
	__le16			length;		/* set to (number of ppas - 1) by rqtocmd */
	__le16			control;
	__le32			dsmgmt;
	__le64			resv;
};

58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
/*
 * Erase command layout. Must stay exactly 64 bytes (checked at build time
 * in _nvme_nvm_check_size()).
 */
struct nvme_nvm_erase_blk {
	__u8			opcode;
	__u8			flags;
	__u16			command_id;
	__le32			nsid;
	__u64			rsvd[2];
	__le64			prp1;
	__le64			prp2;
	__le64			spba;
	__le16			length;
	__le16			control;
	__le32			dsmgmt;
	__le64			resv;
};

M
Matias Bjørling 已提交
73 74 75 76 77 78 79 80
struct nvme_nvm_identity {
	__u8			opcode;
	__u8			flags;
	__u16			command_id;
	__le32			nsid;
	__u64			rsvd[2];
	__le64			prp1;
	__le64			prp2;
81
	__u32			rsvd11[6];
M
Matias Bjørling 已提交
82 83
};

84
struct nvme_nvm_getbbtbl {
M
Matias Bjørling 已提交
85 86 87 88 89 90 91
	__u8			opcode;
	__u8			flags;
	__u16			command_id;
	__le32			nsid;
	__u64			rsvd[2];
	__le64			prp1;
	__le64			prp2;
92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108
	__le64			spba;
	__u32			rsvd4[4];
};

/*
 * Admin command layout used to update bad block state (see
 * nvme_nvm_set_bb_tbl()). Must stay exactly 64 bytes (checked at build
 * time in _nvme_nvm_check_size()).
 */
struct nvme_nvm_setbbtbl {
	__u8			opcode;
	__u8			flags;
	__u16			command_id;
	__le32			nsid;
	__le64			rsvd[2];
	__le64			prp1;
	__le64			prp2;
	__le64			spba;
	__le16			nlb;		/* set to (number of ppas - 1) */
	__u8			value;		/* block state to record */
	__u8			rsvd3;
	__u32			rsvd4[3];
};

struct nvme_nvm_command {
	union {
		struct nvme_common_command common;
		struct nvme_nvm_ph_rw ph_rw;
115 116
		struct nvme_nvm_erase_blk erase;
		struct nvme_nvm_identity identity;
117 118
		struct nvme_nvm_getbbtbl get_bb;
		struct nvme_nvm_setbbtbl set_bb;
M
Matias Bjørling 已提交
119 120 121
	};
};

122
struct nvme_nvm_id12_grp {
M
Matias Bjørling 已提交
123 124 125 126 127 128
	__u8			mtype;
	__u8			fmtype;
	__le16			res16;
	__u8			num_ch;
	__u8			num_lun;
	__u8			num_pln;
129
	__u8			rsvd1;
130
	__le16			num_chk;
M
Matias Bjørling 已提交
131 132 133 134
	__le16			num_pg;
	__le16			fpg_sz;
	__le16			csecs;
	__le16			sos;
135
	__le16			rsvd2;
M
Matias Bjørling 已提交
136 137 138 139 140 141 142
	__le32			trdt;
	__le32			trdm;
	__le32			tprt;
	__le32			tprm;
	__le32			tbet;
	__le32			tbem;
	__le32			mpos;
143
	__le32			mccap;
M
Matias Bjørling 已提交
144
	__le16			cpar;
145
	__u8			reserved[906];
M
Matias Bjørling 已提交
146 147
} __packed;

148
struct nvme_nvm_id12_addrf {
M
Matias Bjørling 已提交
149 150 151 152 153 154 155 156 157 158
	__u8			ch_offset;
	__u8			ch_len;
	__u8			lun_offset;
	__u8			lun_len;
	__u8			pln_offset;
	__u8			pln_len;
	__u8			blk_offset;
	__u8			blk_len;
	__u8			pg_offset;
	__u8			pg_len;
159 160
	__u8			sec_offset;
	__u8			sec_len;
M
Matias Bjørling 已提交
161 162 163
	__u8			res[4];
} __packed;

164
struct nvme_nvm_id12 {
M
Matias Bjørling 已提交
165 166 167
	__u8			ver_id;
	__u8			vmnt;
	__u8			cgrps;
168
	__u8			res;
M
Matias Bjørling 已提交
169 170
	__le32			cap;
	__le32			dom;
171
	struct nvme_nvm_id12_addrf ppaf;
172
	__u8			resv[228];
173
	struct nvme_nvm_id12_grp grp;
174
	__u8			resv2[2880];
M
Matias Bjørling 已提交
175 176
} __packed;

177 178 179 180 181 182 183 184 185 186 187 188 189 190
/*
 * Bad block table as returned by the device: a 64-byte header (checked at
 * build time in _nvme_nvm_check_size()) followed by one state byte per
 * block. nvme_nvm_get_bb_tbl() validates tblid, verid and tblks before
 * copying blk[] out.
 */
struct nvme_nvm_bb_tbl {
	__u8	tblid[4];
	__le16	verid;
	__le16	revid;
	__le32	rvsd1;
	__le32	tblks;
	__le32	tfact;
	__le32	tgrown;
	__le32	tdresv;
	__le32	thresv;
	__le32	rsvd2[8];
	__u8	blk[];		/* flexible array member; does not add to sizeof */
};

191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242
/*
 * Address format reported in the 2.0 identify payload: only bit lengths are
 * given; nvme_nvm_set_addr_20() derives the offsets by packing the fields
 * from bit 0 upwards. Must stay exactly 8 bytes (checked at build time).
 */
struct nvme_nvm_id20_addrf {
	__u8			grp_len;
	__u8			pu_len;
	__u8			chk_len;
	__u8			lba_len;
	__u8			resv[4];
};

/*
 * 2.0 identify payload, parsed by nvme_nvm_setup_20(). mjr is the first
 * byte, which is what nvme_nvm_identity() switches on. Must be exactly
 * NVME_IDENTIFY_DATA_SIZE bytes (checked at build time).
 */
struct nvme_nvm_id20 {
	__u8			mjr;
	__u8			mnr;
	__u8			resv[6];

	struct nvme_nvm_id20_addrf lbaf;

	__le32			mccap;
	__u8			resv2[12];

	__u8			wit;
	__u8			resv3[31];

	/* Geometry */
	__le16			num_grp;
	__le16			num_pu;
	__le32			num_chk;
	__le32			clba;
	__u8			resv4[52];

	/* Write data requirements */
	__le32			ws_min;
	__le32			ws_opt;
	__le32			mw_cunits;
	__le32			maxoc;
	__le32			maxocpu;
	__u8			resv5[44];

	/* Performance related metrics */
	__le32			trdt;
	__le32			trdm;
	__le32			twrt;
	__le32			twrm;
	__le32			tcrst;
	__le32			tcrsm;
	__u8			resv6[40];

	/* Reserved area */
	__u8			resv7[2816];

	/* Vendor specific */
	__u8			vs[1024];
};

243 244 245 246 247 248 249 250 251 252
/*
 * Per-chunk metadata entry as read from the report-chunk log page. Must be
 * 32 bytes and the same size as struct nvm_chk_meta (both checked at build
 * time), because nvme_nvm_get_chk_meta() converts entries in place inside
 * the caller's struct nvm_chk_meta buffer.
 */
struct nvme_nvm_chk_meta {
	__u8	state;
	__u8	type;
	__u8	wi;
	__u8	rsvd[5];
	__le64	slba;
	__le64	cnlb;
	__le64	wp;
};

M
Matias Bjørling 已提交
253 254 255 256 257 258 259
/*
 * Check we didn't inadvertently grow the command struct
 */
static inline void _nvme_nvm_check_size(void)
{
	BUILD_BUG_ON(sizeof(struct nvme_nvm_identity) != 64);
	BUILD_BUG_ON(sizeof(struct nvme_nvm_ph_rw) != 64);
260
	BUILD_BUG_ON(sizeof(struct nvme_nvm_erase_blk) != 64);
261 262
	BUILD_BUG_ON(sizeof(struct nvme_nvm_getbbtbl) != 64);
	BUILD_BUG_ON(sizeof(struct nvme_nvm_setbbtbl) != 64);
263 264 265
	BUILD_BUG_ON(sizeof(struct nvme_nvm_id12_grp) != 960);
	BUILD_BUG_ON(sizeof(struct nvme_nvm_id12_addrf) != 16);
	BUILD_BUG_ON(sizeof(struct nvme_nvm_id12) != NVME_IDENTIFY_DATA_SIZE);
266
	BUILD_BUG_ON(sizeof(struct nvme_nvm_bb_tbl) != 64);
267 268
	BUILD_BUG_ON(sizeof(struct nvme_nvm_id20_addrf) != 8);
	BUILD_BUG_ON(sizeof(struct nvme_nvm_id20) != NVME_IDENTIFY_DATA_SIZE);
269 270 271
	BUILD_BUG_ON(sizeof(struct nvme_nvm_chk_meta) != 32);
	BUILD_BUG_ON(sizeof(struct nvme_nvm_chk_meta) !=
						sizeof(struct nvm_chk_meta));
M
Matias Bjørling 已提交
272 273
}

274 275 276 277 278 279 280 281
/*
 * Copy the 1.2 address format reported by the device into @dst and derive
 * the per-field bit masks from each (offset, length) pair.
 *
 * NOTE(review): the lengths and offsets come straight from the device and
 * are used as shift counts; this assumes they are all below 64 - confirm
 * whether validation is wanted here.
 */
static void nvme_nvm_set_addr_12(struct nvm_addrf_12 *dst,
				 struct nvme_nvm_id12_addrf *src)
{
	dst->ch_len = src->ch_len;
	dst->lun_len = src->lun_len;
	dst->blk_len = src->blk_len;
	dst->pg_len = src->pg_len;
	dst->pln_len = src->pln_len;
	dst->sec_len = src->sec_len;

	dst->ch_offset = src->ch_offset;
	dst->lun_offset = src->lun_offset;
	dst->blk_offset = src->blk_offset;
	dst->pg_offset = src->pg_offset;
	dst->pln_offset = src->pln_offset;
	dst->sec_offset = src->sec_offset;

	/* mask = <len> one-bits, shifted up to the field's offset */
	dst->ch_mask = ((1ULL << dst->ch_len) - 1) << dst->ch_offset;
	dst->lun_mask = ((1ULL << dst->lun_len) - 1) << dst->lun_offset;
	dst->blk_mask = ((1ULL << dst->blk_len) - 1) << dst->blk_offset;
	dst->pg_mask = ((1ULL << dst->pg_len) - 1) << dst->pg_offset;
	dst->pln_mask = ((1ULL << dst->pln_len) - 1) << dst->pln_offset;
	dst->sec_mask = ((1ULL << dst->sec_len) - 1) << dst->sec_offset;
}

static int nvme_nvm_setup_12(struct nvme_nvm_id12 *id,
			     struct nvm_geo *geo)
M
Matias Bjørling 已提交
301
{
302
	struct nvme_nvm_id12_grp *src;
303
	int sec_per_pg, sec_per_pl, pg_per_blk;
304

305 306 307 308 309 310 311
	if (id->cgrps != 1)
		return -EINVAL;

	src = &id->grp;

	if (src->mtype != 0) {
		pr_err("nvm: memory type not supported\n");
312
		return -EINVAL;
313
	}
314

315 316 317
	/* 1.2 spec. only reports a single version id - unfold */
	geo->major_ver_id = id->ver_id;
	geo->minor_ver_id = 2;
318

319 320 321
	/* Set compacted version for upper layers */
	geo->version = NVM_OCSSD_SPEC_12;

322 323 324
	geo->num_ch = src->num_ch;
	geo->num_lun = src->num_lun;
	geo->all_luns = geo->num_ch * geo->num_lun;
325

326
	geo->num_chk = le16_to_cpu(src->num_chk);
327

328 329
	geo->csecs = le16_to_cpu(src->csecs);
	geo->sos = le16_to_cpu(src->sos);
330 331

	pg_per_blk = le16_to_cpu(src->num_pg);
332
	sec_per_pg = le16_to_cpu(src->fpg_sz) / geo->csecs;
333
	sec_per_pl = sec_per_pg * src->num_pln;
334 335
	geo->clba = sec_per_pl * pg_per_blk;

336
	geo->all_chunks = geo->all_luns * geo->num_chk;
337 338 339 340 341
	geo->total_secs = geo->clba * geo->all_chunks;

	geo->ws_min = sec_per_pg;
	geo->ws_opt = sec_per_pg;
	geo->mw_cunits = geo->ws_opt << 3;	/* default to MLC safe values */
342

343 344 345 346
	/* Do not impose values for maximum number of open blocks as it is
	 * unspecified in 1.2. Users of 1.2 must be aware of this and eventually
	 * specify these values through a quirk if restrictions apply.
	 */
347 348
	geo->maxoc = geo->all_luns * geo->num_chk;
	geo->maxocpu = geo->num_chk;
349

350 351 352 353 354 355 356 357
	geo->mccap = le32_to_cpu(src->mccap);

	geo->trdt = le32_to_cpu(src->trdt);
	geo->trdm = le32_to_cpu(src->trdm);
	geo->tprt = le32_to_cpu(src->tprt);
	geo->tprm = le32_to_cpu(src->tprm);
	geo->tbet = le32_to_cpu(src->tbet);
	geo->tbem = le32_to_cpu(src->tbem);
358 359

	/* 1.2 compatibility */
360 361 362 363 364 365 366 367 368 369
	geo->vmnt = id->vmnt;
	geo->cap = le32_to_cpu(id->cap);
	geo->dom = le32_to_cpu(id->dom);

	geo->mtype = src->mtype;
	geo->fmtype = src->fmtype;

	geo->cpar = le16_to_cpu(src->cpar);
	geo->mpos = le32_to_cpu(src->mpos);

370
	geo->pln_mode = NVM_PLANE_SINGLE;
371 372

	if (geo->mpos & 0x020202) {
373
		geo->pln_mode = NVM_PLANE_DOUBLE;
374 375
		geo->ws_opt <<= 1;
	} else if (geo->mpos & 0x040404) {
376
		geo->pln_mode = NVM_PLANE_QUAD;
377 378 379 380 381 382 383 384
		geo->ws_opt <<= 2;
	}

	geo->num_pln = src->num_pln;
	geo->num_pg = le16_to_cpu(src->num_pg);
	geo->fpg_sz = le16_to_cpu(src->fpg_sz);

	nvme_nvm_set_addr_12((struct nvm_addrf_12 *)&geo->addrf, &id->ppaf);
385

M
Matias Bjørling 已提交
386 387 388
	return 0;
}

389 390
static void nvme_nvm_set_addr_20(struct nvm_addrf *dst,
				 struct nvme_nvm_id20_addrf *src)
391
{
392 393 394 395 396 397 398 399 400 401 402 403 404 405
	dst->ch_len = src->grp_len;
	dst->lun_len = src->pu_len;
	dst->chk_len = src->chk_len;
	dst->sec_len = src->lba_len;

	dst->sec_offset = 0;
	dst->chk_offset = dst->sec_len;
	dst->lun_offset = dst->chk_offset + dst->chk_len;
	dst->ch_offset = dst->lun_offset + dst->lun_len;

	dst->ch_mask = ((1ULL << dst->ch_len) - 1) << dst->ch_offset;
	dst->lun_mask = ((1ULL << dst->lun_len) - 1) << dst->lun_offset;
	dst->chk_mask = ((1ULL << dst->chk_len) - 1) << dst->chk_offset;
	dst->sec_mask = ((1ULL << dst->sec_len) - 1) << dst->sec_offset;
406 407
}

408 409
static int nvme_nvm_setup_20(struct nvme_nvm_id20 *id,
			     struct nvm_geo *geo)
410
{
411 412 413
	geo->major_ver_id = id->mjr;
	geo->minor_ver_id = id->mnr;

414 415 416
	/* Set compacted version for upper layers */
	geo->version = NVM_OCSSD_SPEC_20;

417 418 419
	geo->num_ch = le16_to_cpu(id->num_grp);
	geo->num_lun = le16_to_cpu(id->num_pu);
	geo->all_luns = geo->num_ch * geo->num_lun;
420

421
	geo->num_chk = le32_to_cpu(id->num_chk);
422
	geo->clba = le32_to_cpu(id->clba);
423

424
	geo->all_chunks = geo->all_luns * geo->num_chk;
425
	geo->total_secs = geo->clba * geo->all_chunks;
426

427 428 429
	geo->ws_min = le32_to_cpu(id->ws_min);
	geo->ws_opt = le32_to_cpu(id->ws_opt);
	geo->mw_cunits = le32_to_cpu(id->mw_cunits);
430 431
	geo->maxoc = le32_to_cpu(id->maxoc);
	geo->maxocpu = le32_to_cpu(id->maxocpu);
432

433 434 435 436 437 438 439 440
	geo->trdt = le32_to_cpu(id->trdt);
	geo->trdm = le32_to_cpu(id->trdm);
	geo->tprt = le32_to_cpu(id->twrt);
	geo->tprm = le32_to_cpu(id->twrm);
	geo->tbet = le32_to_cpu(id->tcrst);
	geo->tbem = le32_to_cpu(id->tcrsm);

	nvme_nvm_set_addr_20(&geo->addrf, &id->lbaf);
441 442 443 444

	return 0;
}

445
static int nvme_nvm_identity(struct nvm_dev *nvmdev)
M
Matias Bjørling 已提交
446
{
447
	struct nvme_ns *ns = nvmdev->q->queuedata;
448
	struct nvme_nvm_id12 *id;
M
Matias Bjørling 已提交
449 450 451 452
	struct nvme_nvm_command c = {};
	int ret;

	c.identity.opcode = nvme_nvm_admin_identity;
C
Christoph Hellwig 已提交
453
	c.identity.nsid = cpu_to_le32(ns->head->ns_id);
M
Matias Bjørling 已提交
454

455 456
	id = kmalloc(sizeof(struct nvme_nvm_id12), GFP_KERNEL);
	if (!id)
M
Matias Bjørling 已提交
457 458
		return -ENOMEM;

459
	ret = nvme_submit_sync_cmd(ns->ctrl->admin_q, (struct nvme_command *)&c,
460
				id, sizeof(struct nvme_nvm_id12));
M
Matias Bjørling 已提交
461 462 463 464 465
	if (ret) {
		ret = -EIO;
		goto out;
	}

466 467 468 469 470 471
	/*
	 * The 1.2 and 2.0 specifications share the first byte in their geometry
	 * command to make it possible to know what version a device implements.
	 */
	switch (id->ver_id) {
	case 1:
472
		ret = nvme_nvm_setup_12(id, &nvmdev->geo);
473 474
		break;
	case 2:
475 476
		ret = nvme_nvm_setup_20((struct nvme_nvm_id20 *)id,
							&nvmdev->geo);
477 478
		break;
	default:
479 480
		dev_err(ns->ctrl->device, "OCSSD revision not supported (%d)\n",
							id->ver_id);
481 482
		ret = -EINVAL;
	}
483

M
Matias Bjørling 已提交
484
out:
485
	kfree(id);
M
Matias Bjørling 已提交
486 487 488
	return ret;
}

489
static int nvme_nvm_get_bb_tbl(struct nvm_dev *nvmdev, struct ppa_addr ppa,
490
								u8 *blks)
M
Matias Bjørling 已提交
491
{
492
	struct request_queue *q = nvmdev->q;
493
	struct nvm_geo *geo = &nvmdev->geo;
M
Matias Bjørling 已提交
494
	struct nvme_ns *ns = q->queuedata;
495
	struct nvme_ctrl *ctrl = ns->ctrl;
M
Matias Bjørling 已提交
496
	struct nvme_nvm_command c = {};
497
	struct nvme_nvm_bb_tbl *bb_tbl;
498
	int nr_blks = geo->num_chk * geo->num_pln;
499
	int tblsz = sizeof(struct nvme_nvm_bb_tbl) + nr_blks;
M
Matias Bjørling 已提交
500 501 502
	int ret = 0;

	c.get_bb.opcode = nvme_nvm_admin_get_bb_tbl;
C
Christoph Hellwig 已提交
503
	c.get_bb.nsid = cpu_to_le32(ns->head->ns_id);
504
	c.get_bb.spba = cpu_to_le64(ppa.ppa);
M
Matias Bjørling 已提交
505

506 507 508
	bb_tbl = kzalloc(tblsz, GFP_KERNEL);
	if (!bb_tbl)
		return -ENOMEM;
M
Matias Bjørling 已提交
509

510
	ret = nvme_submit_sync_cmd(ctrl->admin_q, (struct nvme_command *)&c,
511
								bb_tbl, tblsz);
M
Matias Bjørling 已提交
512
	if (ret) {
513
		dev_err(ctrl->device, "get bad block table failed (%d)\n", ret);
M
Matias Bjørling 已提交
514 515 516 517
		ret = -EIO;
		goto out;
	}

518 519
	if (bb_tbl->tblid[0] != 'B' || bb_tbl->tblid[1] != 'B' ||
		bb_tbl->tblid[2] != 'L' || bb_tbl->tblid[3] != 'T') {
520
		dev_err(ctrl->device, "bbt format mismatch\n");
521 522 523 524 525 526
		ret = -EINVAL;
		goto out;
	}

	if (le16_to_cpu(bb_tbl->verid) != 1) {
		ret = -EINVAL;
527
		dev_err(ctrl->device, "bbt version not supported\n");
528 529 530
		goto out;
	}

531
	if (le32_to_cpu(bb_tbl->tblks) != nr_blks) {
532
		ret = -EINVAL;
533 534
		dev_err(ctrl->device,
				"bbt unsuspected blocks returned (%u!=%u)",
535
				le32_to_cpu(bb_tbl->tblks), nr_blks);
536 537 538
		goto out;
	}

539
	memcpy(blks, bb_tbl->blk, geo->num_chk * geo->num_pln);
M
Matias Bjørling 已提交
540
out:
541 542 543 544
	kfree(bb_tbl);
	return ret;
}

545 546
static int nvme_nvm_set_bb_tbl(struct nvm_dev *nvmdev, struct ppa_addr *ppas,
							int nr_ppas, int type)
547
{
548
	struct nvme_ns *ns = nvmdev->q->queuedata;
549 550 551 552
	struct nvme_nvm_command c = {};
	int ret = 0;

	c.set_bb.opcode = nvme_nvm_admin_set_bb_tbl;
C
Christoph Hellwig 已提交
553
	c.set_bb.nsid = cpu_to_le32(ns->head->ns_id);
554 555
	c.set_bb.spba = cpu_to_le64(ppas->ppa);
	c.set_bb.nlb = cpu_to_le16(nr_ppas - 1);
556 557
	c.set_bb.value = type;

558
	ret = nvme_submit_sync_cmd(ns->ctrl->admin_q, (struct nvme_command *)&c,
559
								NULL, 0);
560
	if (ret)
561 562
		dev_err(ns->ctrl->device, "set bad block table failed (%d)\n",
									ret);
M
Matias Bjørling 已提交
563 564 565
	return ret;
}

566 567 568 569 570 571 572 573 574 575 576 577 578 579
/*
 * Read metadata for @nchks chunks, starting at the chunk containing @slba,
 * from the report-chunk log page into @meta.
 *
 * Expect the lba in device format
 *
 * The log is fetched directly into @meta and each entry is then converted
 * in place from the little-endian device layout to the host layout.
 *
 * Returns 0 on success (including when @nchks is 0), or the non-zero
 * result of nvme_get_log() on failure.
 */
static int nvme_nvm_get_chk_meta(struct nvm_dev *ndev,
				 struct nvm_chk_meta *meta,
				 sector_t slba, int nchks)
{
	struct nvm_geo *geo = &ndev->geo;
	struct nvme_ns *ns = ndev->q->queuedata;
	struct nvme_ctrl *ctrl = ns->ctrl;
	struct nvme_nvm_chk_meta *dev_meta = (struct nvme_nvm_chk_meta *)meta;
	struct ppa_addr ppa;
	size_t left = nchks * sizeof(struct nvme_nvm_chk_meta);
	size_t log_pos, offset, len;
	/* ret must be defined even if the loop below never runs */
	int ret = 0, i, max_len;

	/*
	 * limit requests to maximum 256K to avoid issuing arbitrary large
	 * requests when the device does not specify a maximum transfer size.
	 */
	max_len = min_t(unsigned int, ctrl->max_hw_sectors << 9, 256 * 1024);

	/* Normalize lba address space to obtain log offset */
	ppa.ppa = slba;
	ppa = dev_to_generic_addr(ndev, ppa);

	/* linear chunk index: group-major, then parallel unit, then chunk */
	log_pos = ppa.m.chk;
	log_pos += ppa.m.pu * geo->num_chk;
	log_pos += ppa.m.grp * geo->num_lun * geo->num_chk;

	offset = log_pos * sizeof(struct nvme_nvm_chk_meta);

	while (left) {
		len = min_t(unsigned int, left, max_len);

		ret = nvme_get_log(ctrl, ns->head->ns_id,
				NVME_NVM_LOG_REPORT_CHUNK, 0, dev_meta, len,
				offset);
		if (ret) {
			dev_err(ctrl->device, "Get REPORT CHUNK log error\n");
			break;
		}

		/* meta and dev_meta alias the same buffer; convert in place */
		for (i = 0; i < len; i += sizeof(struct nvme_nvm_chk_meta)) {
			meta->state = dev_meta->state;
			meta->type = dev_meta->type;
			meta->wi = dev_meta->wi;
			meta->slba = le64_to_cpu(dev_meta->slba);
			meta->cnlb = le64_to_cpu(dev_meta->cnlb);
			meta->wp = le64_to_cpu(dev_meta->wp);

			meta++;
			dev_meta++;
		}

		offset += len;
		left -= len;
	}

	return ret;
}

628 629
static inline void nvme_nvm_rqtocmd(struct nvm_rq *rqd, struct nvme_ns *ns,
				    struct nvme_nvm_command *c)
M
Matias Bjørling 已提交
630 631
{
	c->ph_rw.opcode = rqd->opcode;
C
Christoph Hellwig 已提交
632
	c->ph_rw.nsid = cpu_to_le32(ns->head->ns_id);
M
Matias Bjørling 已提交
633
	c->ph_rw.spba = cpu_to_le64(rqd->ppa_addr.ppa);
634
	c->ph_rw.metadata = cpu_to_le64(rqd->dma_meta_list);
M
Matias Bjørling 已提交
635
	c->ph_rw.control = cpu_to_le16(rqd->flags);
636
	c->ph_rw.length = cpu_to_le16(rqd->nr_ppas - 1);
M
Matias Bjørling 已提交
637 638
}

639
/*
 * Completion callback for requests issued by nvme_nvm_submit_io(): copies
 * the completion result and status into the nvm_rq, completes it via
 * nvm_end_io(), then frees the command buffer allocated at submission and
 * the request itself.
 */
static void nvme_nvm_end_io(struct request *rq, blk_status_t status)
{
	struct nvm_rq *rqd = rq->end_io_data;

	rqd->ppa_status = le64_to_cpu(nvme_req(rq)->result.u64);
	rqd->error = nvme_req(rq)->status;
	nvm_end_io(rqd);

	kfree(nvme_req(rq)->cmd);
	blk_mq_free_request(rq);
}

651 652 653
static struct request *nvme_nvm_alloc_request(struct request_queue *q,
					      struct nvm_rq *rqd,
					      struct nvme_nvm_command *cmd)
M
Matias Bjørling 已提交
654 655 656 657
{
	struct nvme_ns *ns = q->queuedata;
	struct request *rq;

658
	nvme_nvm_rqtocmd(rqd, ns, cmd);
659

660
	rq = nvme_alloc_request(q, (struct nvme_command *)cmd, 0, NVME_QID_ANY);
661 662 663
	if (IS_ERR(rq))
		return rq;

664
	rq->cmd_flags &= ~REQ_FAILFAST_DRIVER;
M
Matias Bjørling 已提交
665

666
	if (rqd->bio)
667
		blk_init_request_from_bio(rq, rqd->bio);
668
	else
669
		rq->ioprio = IOPRIO_PRIO_VALUE(IOPRIO_CLASS_BE, IOPRIO_NORM);
M
Matias Bjørling 已提交
670

671 672 673 674 675 676 677 678 679 680 681 682 683 684 685 686 687 688 689
	return rq;
}

static int nvme_nvm_submit_io(struct nvm_dev *dev, struct nvm_rq *rqd)
{
	struct request_queue *q = dev->q;
	struct nvme_nvm_command *cmd;
	struct request *rq;

	cmd = kzalloc(sizeof(struct nvme_nvm_command), GFP_KERNEL);
	if (!cmd)
		return -ENOMEM;

	rq = nvme_nvm_alloc_request(q, rqd, cmd);
	if (IS_ERR(rq)) {
		kfree(cmd);
		return PTR_ERR(rq);
	}

M
Matias Bjørling 已提交
690 691 692 693 694 695 696
	rq->end_io_data = rqd;

	blk_execute_rq_nowait(q, NULL, rq, 0, nvme_nvm_end_io);

	return 0;
}

697 698 699 700 701 702 703 704 705 706 707 708 709 710 711 712 713 714 715 716 717 718 719 720 721 722 723 724
static int nvme_nvm_submit_io_sync(struct nvm_dev *dev, struct nvm_rq *rqd)
{
	struct request_queue *q = dev->q;
	struct request *rq;
	struct nvme_nvm_command cmd;
	int ret = 0;

	memset(&cmd, 0, sizeof(struct nvme_nvm_command));

	rq = nvme_nvm_alloc_request(q, rqd, &cmd);
	if (IS_ERR(rq))
		return PTR_ERR(rq);

	/* I/Os can fail and the error is signaled through rqd. Callers must
	 * handle the error accordingly.
	 */
	blk_execute_rq(q, NULL, rq, 0);
	if (nvme_req(rq)->flags & NVME_REQ_CANCELLED)
		ret = -EINTR;

	rqd->ppa_status = le64_to_cpu(nvme_req(rq)->result.u64);
	rqd->error = nvme_req(rq)->status;

	blk_mq_free_request(rq);

	return ret;
}

725
static void *nvme_nvm_create_dma_pool(struct nvm_dev *nvmdev, char *name)
M
Matias Bjørling 已提交
726
{
727
	struct nvme_ns *ns = nvmdev->q->queuedata;
M
Matias Bjørling 已提交
728

729
	return dma_pool_create(name, ns->ctrl->dev, PAGE_SIZE, PAGE_SIZE, 0);
M
Matias Bjørling 已提交
730 731 732 733 734 735 736 737 738
}

/* Destroy a pool previously returned by nvme_nvm_create_dma_pool(). */
static void nvme_nvm_destroy_dma_pool(void *pool)
{
	dma_pool_destroy((struct dma_pool *)pool);
}

739
static void *nvme_nvm_dev_dma_alloc(struct nvm_dev *dev, void *pool,
M
Matias Bjørling 已提交
740 741 742 743 744
				    gfp_t mem_flags, dma_addr_t *dma_handler)
{
	return dma_pool_alloc(pool, mem_flags, dma_handler);
}

745
static void nvme_nvm_dev_dma_free(void *pool, void *addr,
M
Matias Bjørling 已提交
746 747
							dma_addr_t dma_handler)
{
748
	dma_pool_free(pool, addr, dma_handler);
M
Matias Bjørling 已提交
749 750 751 752 753 754
}

static struct nvm_dev_ops nvme_nvm_dev_ops = {
	.identity		= nvme_nvm_identity,

	.get_bb_tbl		= nvme_nvm_get_bb_tbl,
755
	.set_bb_tbl		= nvme_nvm_set_bb_tbl,
M
Matias Bjørling 已提交
756

757 758
	.get_chk_meta		= nvme_nvm_get_chk_meta,

M
Matias Bjørling 已提交
759
	.submit_io		= nvme_nvm_submit_io,
760
	.submit_io_sync		= nvme_nvm_submit_io_sync,
M
Matias Bjørling 已提交
761 762 763 764 765 766 767

	.create_dma_pool	= nvme_nvm_create_dma_pool,
	.destroy_dma_pool	= nvme_nvm_destroy_dma_pool,
	.dev_dma_alloc		= nvme_nvm_dev_dma_alloc,
	.dev_dma_free		= nvme_nvm_dev_dma_free,
};

768 769 770 771 772 773 774 775 776 777 778 779 780 781 782 783 784 785
/*
 * Execute a user-supplied LightNVM command synchronously on @q.
 *
 * @vcmd:     command to issue; its spba and metadata fields are filled here
 * @ubuf:     user data buffer of @bufflen bytes (may be NULL)
 * @meta_buf: user metadata buffer of @meta_len bytes; only used when a data
 *            buffer is also given
 * @ppa_buf:  user ppa list holding @ppa_len + 1 entries; when @ppa_len is 0
 *            the value of @ppa_buf itself is used as the single address
 * @result:   if non-NULL, receives the masked completion status
 * @status:   if non-NULL, receives the 64-bit completion result
 * @timeout:  request timeout in jiffies, 0 for ADMIN_TIMEOUT
 *
 * The ppa list and metadata are bounced through single elements of
 * dev->dma_pool, so both are rejected with -EINVAL when they would not fit
 * in one element.
 * NOTE(review): the bound assumes PAGE_SIZE elements, which is what
 * nvme_nvm_create_dma_pool() creates - confirm dev->dma_pool comes from it.
 *
 * Returns 0 on success, -EINVAL/-ENOMEM/-EFAULT on setup failures, -EINTR
 * if the request was cancelled, or -EIO if the device reported an error.
 */
static int nvme_nvm_submit_user_cmd(struct request_queue *q,
				struct nvme_ns *ns,
				struct nvme_nvm_command *vcmd,
				void __user *ubuf, unsigned int bufflen,
				void __user *meta_buf, unsigned int meta_len,
				void __user *ppa_buf, unsigned int ppa_len,
				u32 *result, u64 *status, unsigned int timeout)
{
	bool write = nvme_is_write((struct nvme_command *)vcmd);
	struct nvm_dev *dev = ns->ndev;
	struct gendisk *disk = ns->disk;
	struct request *rq;
	struct bio *bio = NULL;
	__le64 *ppa_list = NULL;
	dma_addr_t ppa_dma;
	__le64 *metadata = NULL;
	dma_addr_t metadata_dma;
	int ret = 0;

	/* ppa_len + 1 entries must fit in one pool element */
	if (ppa_buf && ppa_len >= PAGE_SIZE / sizeof(u64))
		return -EINVAL;
	/* metadata is only bounced when a data buffer is present */
	if (ubuf && bufflen && meta_buf && meta_len > PAGE_SIZE)
		return -EINVAL;

	rq = nvme_alloc_request(q, (struct nvme_command *)vcmd, 0,
			NVME_QID_ANY);
	if (IS_ERR(rq)) {
		ret = -ENOMEM;
		goto err_cmd;
	}

	rq->timeout = timeout ? timeout : ADMIN_TIMEOUT;

	if (ppa_buf && ppa_len) {
		ppa_list = dma_pool_alloc(dev->dma_pool, GFP_KERNEL, &ppa_dma);
		if (!ppa_list) {
			ret = -ENOMEM;
			goto err_rq;
		}
		if (copy_from_user(ppa_list, (void __user *)ppa_buf,
						sizeof(u64) * (ppa_len + 1))) {
			ret = -EFAULT;
			goto err_ppa;
		}
		vcmd->ph_rw.spba = cpu_to_le64(ppa_dma);
	} else {
		/* single address: the "pointer" value is the ppa itself */
		vcmd->ph_rw.spba = cpu_to_le64((uintptr_t)ppa_buf);
	}

	if (ubuf && bufflen) {
		ret = blk_rq_map_user(q, rq, NULL, ubuf, bufflen, GFP_KERNEL);
		if (ret)
			goto err_ppa;
		bio = rq->bio;

		if (meta_buf && meta_len) {
			metadata = dma_pool_alloc(dev->dma_pool, GFP_KERNEL,
								&metadata_dma);
			if (!metadata) {
				ret = -ENOMEM;
				goto err_map;
			}

			if (write) {
				if (copy_from_user(metadata,
						(void __user *)meta_buf,
						meta_len)) {
					ret = -EFAULT;
					goto err_meta;
				}
			}
			vcmd->ph_rw.metadata = cpu_to_le64(metadata_dma);
		}

		bio->bi_disk = disk;
	}

	blk_execute_rq(q, NULL, rq, 0);

	if (nvme_req(rq)->flags & NVME_REQ_CANCELLED)
		ret = -EINTR;
	else if (nvme_req(rq)->status & 0x7ff)
		ret = -EIO;
	if (result)
		*result = nvme_req(rq)->status & 0x7ff;
	if (status)
		*status = le64_to_cpu(nvme_req(rq)->result.u64);

	if (metadata && !ret && !write) {
		if (copy_to_user(meta_buf, (void *)metadata, meta_len))
			ret = -EFAULT;
	}
err_meta:
	/*
	 * Free only what was actually allocated: metadata stays NULL when the
	 * caller passed a metadata buffer without a data buffer.
	 */
	if (metadata)
		dma_pool_free(dev->dma_pool, metadata, metadata_dma);
err_map:
	if (bio)
		blk_rq_unmap_user(bio);
err_ppa:
	if (ppa_list)
		dma_pool_free(dev->dma_pool, ppa_list, ppa_dma);
err_rq:
	blk_mq_free_request(rq);
err_cmd:
	return ret;
}

/*
 * Handle the SUBMIT_VIO ioctl: build a read/write command from the user's
 * struct nvm_user_vio and run it on the namespace I/O queue.
 *
 * Returns -EFAULT if the user structure cannot be copied in or out,
 * -EINVAL if vio.flags is non-zero, otherwise the result of
 * nvme_nvm_submit_user_cmd().
 */
static int nvme_nvm_submit_vio(struct nvme_ns *ns,
					struct nvm_user_vio __user *uvio)
{
	struct nvm_user_vio vio;
	struct nvme_nvm_command c;
	unsigned int length;
	int ret;

	if (copy_from_user(&vio, uvio, sizeof(vio)))
		return -EFAULT;
	if (vio.flags)
		return -EINVAL;

	memset(&c, 0, sizeof(c));
	c.ph_rw.opcode = vio.opcode;
	c.ph_rw.nsid = cpu_to_le32(ns->head->ns_id);
	c.ph_rw.control = cpu_to_le16(vio.control);
	c.ph_rw.length = cpu_to_le16(vio.nppas);

	/* nppas is passed through as a zero-based count, hence the + 1 */
	length = (vio.nppas + 1) << ns->lba_shift;

	ret = nvme_nvm_submit_user_cmd(ns->queue, ns, &c,
			(void __user *)(uintptr_t)vio.addr, length,
			(void __user *)(uintptr_t)vio.metadata,
							vio.metadata_len,
			(void __user *)(uintptr_t)vio.ppa_list, vio.nppas,
			&vio.result, &vio.status, 0);

	/*
	 * NOTE(review): result/status are only copied back to user space when
	 * the command failed - confirm that is the intended contract.
	 */
	if (ret && copy_to_user(uvio, &vio, sizeof(vio)))
		return -EFAULT;

	return ret;
}

/*
 * Handle the ADMIN_VIO / IO_VIO passthrough ioctls: build a command from
 * the user's struct nvm_passthru_vio and run it on the admin queue
 * (@admin != 0) or the namespace I/O queue.
 *
 * Any opcode other than 0xF2 requires CAP_SYS_ADMIN.
 *
 * Returns -EFAULT if the user structure cannot be copied in or out,
 * -EACCES on insufficient privilege, -EINVAL if vcmd.flags is non-zero,
 * otherwise the result of nvme_nvm_submit_user_cmd().
 */
static int nvme_nvm_user_vcmd(struct nvme_ns *ns, int admin,
					struct nvm_passthru_vio __user *uvcmd)
{
	struct nvm_passthru_vio vcmd;
	struct nvme_nvm_command c;
	struct request_queue *q;
	unsigned int timeout = 0;
	int ret;

	if (copy_from_user(&vcmd, uvcmd, sizeof(vcmd)))
		return -EFAULT;
	if ((vcmd.opcode != 0xF2) && (!capable(CAP_SYS_ADMIN)))
		return -EACCES;
	if (vcmd.flags)
		return -EINVAL;

	memset(&c, 0, sizeof(c));
	c.common.opcode = vcmd.opcode;
	c.common.nsid = cpu_to_le32(ns->head->ns_id);
	c.common.cdw2[0] = cpu_to_le32(vcmd.cdw2);
	c.common.cdw2[1] = cpu_to_le32(vcmd.cdw3);
	/* cdw11-12 */
	c.ph_rw.length = cpu_to_le16(vcmd.nppas);
	c.ph_rw.control  = cpu_to_le16(vcmd.control);
	c.common.cdw10[3] = cpu_to_le32(vcmd.cdw13);
	c.common.cdw10[4] = cpu_to_le32(vcmd.cdw14);
	c.common.cdw10[5] = cpu_to_le32(vcmd.cdw15);

	if (vcmd.timeout_ms)
		timeout = msecs_to_jiffies(vcmd.timeout_ms);

	q = admin ? ns->ctrl->admin_q : ns->queue;

	ret = nvme_nvm_submit_user_cmd(q, ns,
			(struct nvme_nvm_command *)&c,
			(void __user *)(uintptr_t)vcmd.addr, vcmd.data_len,
			(void __user *)(uintptr_t)vcmd.metadata,
							vcmd.metadata_len,
			(void __user *)(uintptr_t)vcmd.ppa_list, vcmd.nppas,
			&vcmd.result, &vcmd.status, timeout);

	/*
	 * NOTE(review): result/status are only copied back to user space when
	 * the command failed - confirm that is the intended contract.
	 */
	if (ret && copy_to_user(uvcmd, &vcmd, sizeof(vcmd)))
		return -EFAULT;

	return ret;
}

int nvme_nvm_ioctl(struct nvme_ns *ns, unsigned int cmd, unsigned long arg)
{
	switch (cmd) {
	case NVME_NVM_IOCTL_ADMIN_VIO:
		return nvme_nvm_user_vcmd(ns, 1, (void __user *)arg);
	case NVME_NVM_IOCTL_IO_VIO:
		return nvme_nvm_user_vcmd(ns, 0, (void __user *)arg);
	case NVME_NVM_IOCTL_SUBMIT_VIO:
		return nvme_nvm_submit_vio(ns, (void __user *)arg);
	default:
		return -ENOTTY;
	}
}

966 967 968
void nvme_nvm_update_nvm_info(struct nvme_ns *ns)
{
	struct nvm_dev *ndev = ns->ndev;
969
	struct nvm_geo *geo = &ndev->geo;
970

971 972
	geo->csecs = 1 << ns->lba_shift;
	geo->sos = ns->ms;
973 974
}

975
int nvme_nvm_register(struct nvme_ns *ns, char *disk_name, int node)
M
Matias Bjørling 已提交
976
{
977 978 979
	struct request_queue *q = ns->queue;
	struct nvm_dev *dev;

980 981
	_nvme_nvm_check_size();

982 983 984 985 986 987 988
	dev = nvm_alloc_dev(node);
	if (!dev)
		return -ENOMEM;

	dev->q = q;
	memcpy(dev->name, disk_name, DISK_NAME_LEN);
	dev->ops = &nvme_nvm_dev_ops;
989
	dev->private_data = ns;
990 991
	ns->ndev = dev;

992
	return nvm_register(dev);
M
Matias Bjørling 已提交
993 994
}

995
void nvme_nvm_unregister(struct nvme_ns *ns)
M
Matias Bjørling 已提交
996
{
997
	nvm_unregister(ns->ndev);
M
Matias Bjørling 已提交
998 999
}

1000
static ssize_t nvm_dev_attr_show(struct device *dev,
1001
		struct device_attribute *dattr, char *page)
1002 1003 1004
{
	struct nvme_ns *ns = nvme_get_ns_from_dev(dev);
	struct nvm_dev *ndev = ns->ndev;
1005
	struct nvm_geo *geo = &ndev->geo;
1006 1007 1008 1009 1010 1011 1012 1013
	struct attribute *attr;

	if (!ndev)
		return 0;

	attr = &dattr->attr;

	if (strcmp(attr->name, "version") == 0) {
1014 1015 1016 1017 1018 1019 1020
		if (geo->major_ver_id == 1)
			return scnprintf(page, PAGE_SIZE, "%u\n",
						geo->major_ver_id);
		else
			return scnprintf(page, PAGE_SIZE, "%u.%u\n",
						geo->major_ver_id,
						geo->minor_ver_id);
1021
	} else if (strcmp(attr->name, "capabilities") == 0) {
1022
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->cap);
1023
	} else if (strcmp(attr->name, "read_typ") == 0) {
1024
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->trdt);
1025
	} else if (strcmp(attr->name, "read_max") == 0) {
1026
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->trdm);
1027 1028 1029
	} else {
		return scnprintf(page,
				 PAGE_SIZE,
1030 1031
				 "Unhandled attr(%s) in `%s`\n",
				 attr->name, __func__);
1032 1033 1034
	}
}

1035 1036 1037 1038 1039 1040 1041 1042 1043
/*
 * Format the 1.2 address format as one hex string: an (offset, length)
 * byte pair for each of channel, lun, plane, block, page and sector, in
 * that order. Returns the number of bytes written to @page.
 */
static ssize_t nvm_dev_attr_show_ppaf(struct nvm_addrf_12 *ppaf, char *page)
{
	return scnprintf(page, PAGE_SIZE,
		"0x%02x%02x%02x%02x%02x%02x%02x%02x%02x%02x%02x%02x\n",
				ppaf->ch_offset, ppaf->ch_len,
				ppaf->lun_offset, ppaf->lun_len,
				ppaf->pln_offset, ppaf->pln_len,
				ppaf->blk_offset, ppaf->blk_len,
				ppaf->pg_offset, ppaf->pg_len,
				ppaf->sec_offset, ppaf->sec_len);
}

1047 1048 1049 1050 1051
static ssize_t nvm_dev_attr_show_12(struct device *dev,
		struct device_attribute *dattr, char *page)
{
	struct nvme_ns *ns = nvme_get_ns_from_dev(dev);
	struct nvm_dev *ndev = ns->ndev;
1052
	struct nvm_geo *geo = &ndev->geo;
1053 1054 1055 1056 1057 1058 1059 1060
	struct attribute *attr;

	if (!ndev)
		return 0;

	attr = &dattr->attr;

	if (strcmp(attr->name, "vendor_opcode") == 0) {
1061
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->vmnt);
1062
	} else if (strcmp(attr->name, "device_mode") == 0) {
1063
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->dom);
1064
	/* kept for compatibility */
1065
	} else if (strcmp(attr->name, "media_manager") == 0) {
1066
		return scnprintf(page, PAGE_SIZE, "%s\n", "gennvm");
1067
	} else if (strcmp(attr->name, "ppa_format") == 0) {
1068
		return nvm_dev_attr_show_ppaf((void *)&geo->addrf, page);
1069
	} else if (strcmp(attr->name, "media_type") == 0) {	/* u8 */
1070
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->mtype);
1071
	} else if (strcmp(attr->name, "flash_media_type") == 0) {
1072
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->fmtype);
1073
	} else if (strcmp(attr->name, "num_channels") == 0) {
1074
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->num_ch);
1075
	} else if (strcmp(attr->name, "num_luns") == 0) {
1076
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->num_lun);
1077
	} else if (strcmp(attr->name, "num_planes") == 0) {
1078
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->num_pln);
1079
	} else if (strcmp(attr->name, "num_blocks") == 0) {	/* u16 */
1080
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->num_chk);
1081
	} else if (strcmp(attr->name, "num_pages") == 0) {
1082
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->num_pg);
1083
	} else if (strcmp(attr->name, "page_size") == 0) {
1084
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->fpg_sz);
1085
	} else if (strcmp(attr->name, "hw_sector_size") == 0) {
1086
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->csecs);
1087
	} else if (strcmp(attr->name, "oob_sector_size") == 0) {/* u32 */
1088
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->sos);
1089
	} else if (strcmp(attr->name, "prog_typ") == 0) {
1090
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->tprt);
1091
	} else if (strcmp(attr->name, "prog_max") == 0) {
1092
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->tprm);
1093
	} else if (strcmp(attr->name, "erase_typ") == 0) {
1094
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->tbet);
1095
	} else if (strcmp(attr->name, "erase_max") == 0) {
1096
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->tbem);
1097
	} else if (strcmp(attr->name, "multiplane_modes") == 0) {
1098
		return scnprintf(page, PAGE_SIZE, "0x%08x\n", geo->mpos);
1099
	} else if (strcmp(attr->name, "media_capabilities") == 0) {
1100
		return scnprintf(page, PAGE_SIZE, "0x%08x\n", geo->mccap);
1101
	} else if (strcmp(attr->name, "max_phys_secs") == 0) {
1102
		return scnprintf(page, PAGE_SIZE, "%u\n", NVM_MAX_VLBA);
1103
	} else {
1104
		return scnprintf(page, PAGE_SIZE,
1105 1106
			"Unhandled attr(%s) in `%s`\n",
			attr->name, __func__);
1107 1108 1109
	}
}

1110 1111 1112 1113 1114
static ssize_t nvm_dev_attr_show_20(struct device *dev,
		struct device_attribute *dattr, char *page)
{
	struct nvme_ns *ns = nvme_get_ns_from_dev(dev);
	struct nvm_dev *ndev = ns->ndev;
1115
	struct nvm_geo *geo = &ndev->geo;
1116 1117 1118 1119 1120 1121 1122 1123
	struct attribute *attr;

	if (!ndev)
		return 0;

	attr = &dattr->attr;

	if (strcmp(attr->name, "groups") == 0) {
1124
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->num_ch);
1125
	} else if (strcmp(attr->name, "punits") == 0) {
1126
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->num_lun);
1127
	} else if (strcmp(attr->name, "chunks") == 0) {
1128
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->num_chk);
1129
	} else if (strcmp(attr->name, "clba") == 0) {
1130
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->clba);
1131
	} else if (strcmp(attr->name, "ws_min") == 0) {
1132
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->ws_min);
1133
	} else if (strcmp(attr->name, "ws_opt") == 0) {
1134
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->ws_opt);
1135 1136 1137 1138
	} else if (strcmp(attr->name, "maxoc") == 0) {
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->maxoc);
	} else if (strcmp(attr->name, "maxocpu") == 0) {
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->maxocpu);
1139
	} else if (strcmp(attr->name, "mw_cunits") == 0) {
1140
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->mw_cunits);
1141
	} else if (strcmp(attr->name, "write_typ") == 0) {
1142
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->tprt);
1143
	} else if (strcmp(attr->name, "write_max") == 0) {
1144
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->tprm);
1145
	} else if (strcmp(attr->name, "reset_typ") == 0) {
1146
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->tbet);
1147
	} else if (strcmp(attr->name, "reset_max") == 0) {
1148
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->tbem);
1149
	} else {
1150
		return scnprintf(page, PAGE_SIZE,
1151 1152
			"Unhandled attr(%s) in `%s`\n",
			attr->name, __func__);
1153 1154 1155 1156
	}
}

/*
 * Helpers declaring a read-only (mode 0444) device attribute named _name.
 * The three variants differ only in the show callback they bind:
 * the shared one, the 1.2-specific one, or the 2.0-specific one.
 * No store callback is installed.
 */
#define NVM_DEV_ATTR_RO(_name)					\
	DEVICE_ATTR(_name, 0444, nvm_dev_attr_show, NULL)
#define NVM_DEV_ATTR_12_RO(_name)					\
	DEVICE_ATTR(_name, 0444, nvm_dev_attr_show_12, NULL)
#define NVM_DEV_ATTR_20_RO(_name)					\
	DEVICE_ATTR(_name, 0444, nvm_dev_attr_show_20, NULL)
1162

1163
/* general attributes: served by nvm_dev_attr_show() */
static NVM_DEV_ATTR_RO(version);
static NVM_DEV_ATTR_RO(capabilities);

static NVM_DEV_ATTR_RO(read_typ);
static NVM_DEV_ATTR_RO(read_max);

/* 1.2 values: served by nvm_dev_attr_show_12() */
static NVM_DEV_ATTR_12_RO(vendor_opcode);
static NVM_DEV_ATTR_12_RO(device_mode);
static NVM_DEV_ATTR_12_RO(ppa_format);
static NVM_DEV_ATTR_12_RO(media_manager);
static NVM_DEV_ATTR_12_RO(media_type);
static NVM_DEV_ATTR_12_RO(flash_media_type);
static NVM_DEV_ATTR_12_RO(num_channels);
static NVM_DEV_ATTR_12_RO(num_luns);
static NVM_DEV_ATTR_12_RO(num_planes);
static NVM_DEV_ATTR_12_RO(num_blocks);
static NVM_DEV_ATTR_12_RO(num_pages);
static NVM_DEV_ATTR_12_RO(page_size);
static NVM_DEV_ATTR_12_RO(hw_sector_size);
static NVM_DEV_ATTR_12_RO(oob_sector_size);
static NVM_DEV_ATTR_12_RO(prog_typ);
static NVM_DEV_ATTR_12_RO(prog_max);
static NVM_DEV_ATTR_12_RO(erase_typ);
static NVM_DEV_ATTR_12_RO(erase_max);
static NVM_DEV_ATTR_12_RO(multiplane_modes);
static NVM_DEV_ATTR_12_RO(media_capabilities);
static NVM_DEV_ATTR_12_RO(max_phys_secs);

static struct attribute *nvm_dev_attrs_12[] = {
1194 1195
	&dev_attr_version.attr,
	&dev_attr_capabilities.attr,
1196 1197

	&dev_attr_vendor_opcode.attr,
1198 1199 1200 1201 1202 1203 1204 1205 1206 1207 1208 1209 1210 1211 1212 1213 1214 1215 1216 1217 1218 1219
	&dev_attr_device_mode.attr,
	&dev_attr_media_manager.attr,
	&dev_attr_ppa_format.attr,
	&dev_attr_media_type.attr,
	&dev_attr_flash_media_type.attr,
	&dev_attr_num_channels.attr,
	&dev_attr_num_luns.attr,
	&dev_attr_num_planes.attr,
	&dev_attr_num_blocks.attr,
	&dev_attr_num_pages.attr,
	&dev_attr_page_size.attr,
	&dev_attr_hw_sector_size.attr,
	&dev_attr_oob_sector_size.attr,
	&dev_attr_read_typ.attr,
	&dev_attr_read_max.attr,
	&dev_attr_prog_typ.attr,
	&dev_attr_prog_max.attr,
	&dev_attr_erase_typ.attr,
	&dev_attr_erase_max.attr,
	&dev_attr_multiplane_modes.attr,
	&dev_attr_media_capabilities.attr,
	&dev_attr_max_phys_secs.attr,
1220

1221 1222 1223
	NULL,
};

1224
static const struct attribute_group nvm_dev_attr_group_12 = {
1225
	.name		= "lightnvm",
1226 1227 1228 1229 1230 1231 1232 1233 1234 1235
	.attrs		= nvm_dev_attrs_12,
};

/* 2.0 values: served by nvm_dev_attr_show_20() */
static NVM_DEV_ATTR_20_RO(groups);
static NVM_DEV_ATTR_20_RO(punits);
static NVM_DEV_ATTR_20_RO(chunks);
static NVM_DEV_ATTR_20_RO(clba);
static NVM_DEV_ATTR_20_RO(ws_min);
static NVM_DEV_ATTR_20_RO(ws_opt);
static NVM_DEV_ATTR_20_RO(maxoc);
static NVM_DEV_ATTR_20_RO(maxocpu);
static NVM_DEV_ATTR_20_RO(mw_cunits);
static NVM_DEV_ATTR_20_RO(write_typ);
static NVM_DEV_ATTR_20_RO(write_max);
static NVM_DEV_ATTR_20_RO(reset_typ);
static NVM_DEV_ATTR_20_RO(reset_max);

static struct attribute *nvm_dev_attrs_20[] = {
	&dev_attr_version.attr,
	&dev_attr_capabilities.attr,

	&dev_attr_groups.attr,
	&dev_attr_punits.attr,
	&dev_attr_chunks.attr,
	&dev_attr_clba.attr,
	&dev_attr_ws_min.attr,
	&dev_attr_ws_opt.attr,
1254 1255
	&dev_attr_maxoc.attr,
	&dev_attr_maxocpu.attr,
1256 1257 1258 1259 1260 1261 1262 1263 1264 1265 1266 1267 1268 1269 1270
	&dev_attr_mw_cunits.attr,

	&dev_attr_read_typ.attr,
	&dev_attr_read_max.attr,
	&dev_attr_write_typ.attr,
	&dev_attr_write_max.attr,
	&dev_attr_reset_typ.attr,
	&dev_attr_reset_max.attr,

	NULL,
};

/* 2.0 attribute group; its attributes are grouped under the name "lightnvm". */
static const struct attribute_group nvm_dev_attr_group_20 = {
	.name		= "lightnvm",
	.attrs		= nvm_dev_attrs_20,
};

int nvme_nvm_register_sysfs(struct nvme_ns *ns)
{
1275 1276 1277 1278
	struct nvm_dev *ndev = ns->ndev;
	struct nvm_geo *geo = &ndev->geo;

	if (!ndev)
1279 1280
		return -EINVAL;

1281
	switch (geo->major_ver_id) {
1282 1283 1284 1285 1286 1287 1288 1289 1290
	case 1:
		return sysfs_create_group(&disk_to_dev(ns->disk)->kobj,
					&nvm_dev_attr_group_12);
	case 2:
		return sysfs_create_group(&disk_to_dev(ns->disk)->kobj,
					&nvm_dev_attr_group_20);
	}

	return -EINVAL;
1291 1292 1293 1294
}

void nvme_nvm_unregister_sysfs(struct nvme_ns *ns)
{
1295 1296 1297
	struct nvm_dev *ndev = ns->ndev;
	struct nvm_geo *geo = &ndev->geo;

1298
	switch (geo->major_ver_id) {
1299 1300 1301 1302 1303 1304 1305 1306 1307
	case 1:
		sysfs_remove_group(&disk_to_dev(ns->disk)->kobj,
					&nvm_dev_attr_group_12);
		break;
	case 2:
		sysfs_remove_group(&disk_to_dev(ns->disk)->kobj,
					&nvm_dev_attr_group_20);
		break;
	}
1308
}