lightnvm.c 33.5 KB
Newer Older
M
Matias Bjørling 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28
/*
 * nvme-lightnvm.c - LightNVM NVMe device
 *
 * Copyright (C) 2014-2015 IT University of Copenhagen
 * Initial release: Matias Bjorling <mb@lightnvm.io>
 *
 * This program is free software; you can redistribute it and/or
 * modify it under the terms of the GNU General Public License version
 * 2 as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful, but
 * WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program; see the file COPYING.  If not, write to
 * the Free Software Foundation, 675 Mass Ave, Cambridge, MA 02139,
 * USA.
 *
 */

#include "nvme.h"

#include <linux/nvme.h>
#include <linux/bitops.h>
#include <linux/lightnvm.h>
#include <linux/vmalloc.h>
29 30
#include <linux/sched/sysctl.h>
#include <uapi/linux/lightnvm.h>
M
Matias Bjørling 已提交
31 32 33 34 35 36 37

/* Admin opcodes issued by this driver, listed in ascending numeric order. */
enum nvme_nvm_admin_opcode {
	nvme_nvm_admin_identity		= 0xe2,
	nvme_nvm_admin_set_bb_tbl	= 0xf1,
	nvme_nvm_admin_get_bb_tbl	= 0xf2,
};

38 39 40 41
/* Log page identifier passed to nvme_get_log_ext() for chunk metadata. */
enum nvme_nvm_log_page {
	NVME_NVM_LOG_REPORT_CHUNK	= 0xca,
};

M
Matias Bjørling 已提交
42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57
/*
 * Read/write command layout. Filled in by nvme_nvm_rqtocmd() and by the
 * user vector I/O paths. Must be exactly 64 bytes, which is enforced in
 * _nvme_nvm_check_size().
 */
struct nvme_nvm_ph_rw {
	/* common command header */
	__u8			opcode;
	__u8			flags;
	__u16			command_id;
	__le32			nsid;
	__u64			rsvd2;

	/* buffers */
	__le64			metadata;	/* DMA address of the metadata */
	__le64			prp1;
	__le64			prp2;

	/* addressing and control */
	__le64			spba;		/* ppa, or DMA address of a ppa list */
	__le16			length;		/* callers store (number of ppas - 1) */
	__le16			control;
	__le32			dsmgmt;
	__le64			resv;
};

58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
/*
 * Erase command layout. Must be exactly 64 bytes, which is enforced in
 * _nvme_nvm_check_size().
 */
struct nvme_nvm_erase_blk {
	/* common command header */
	__u8			opcode;
	__u8			flags;
	__u16			command_id;
	__le32			nsid;
	__u64			rsvd[2];

	/* buffers */
	__le64			prp1;
	__le64			prp2;

	/* addressing and control */
	__le64			spba;
	__le16			length;
	__le16			control;
	__le32			dsmgmt;
	__le64			resv;
};

M
Matias Bjørling 已提交
73 74 75 76 77 78 79 80
struct nvme_nvm_identity {
	__u8			opcode;
	__u8			flags;
	__u16			command_id;
	__le32			nsid;
	__u64			rsvd[2];
	__le64			prp1;
	__le64			prp2;
81
	__u32			rsvd11[6];
M
Matias Bjørling 已提交
82 83
};

84
struct nvme_nvm_getbbtbl {
M
Matias Bjørling 已提交
85 86 87 88 89 90 91
	__u8			opcode;
	__u8			flags;
	__u16			command_id;
	__le32			nsid;
	__u64			rsvd[2];
	__le64			prp1;
	__le64			prp2;
92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108
	__le64			spba;
	__u32			rsvd4[4];
};

/*
 * "Set bad block table" admin command layout. Must be exactly 64 bytes,
 * which is enforced in _nvme_nvm_check_size().
 */
struct nvme_nvm_setbbtbl {
	/* common command header */
	__u8			opcode;
	__u8			flags;
	__u16			command_id;
	__le32			nsid;
	__le64			rsvd[2];

	/* buffers */
	__le64			prp1;
	__le64			prp2;

	/* blocks to update and the state to record for them */
	__le64			spba;
	__le16			nlb;		/* callers store (number of ppas - 1) */
	__u8			value;
	__u8			rsvd3;
	__u32			rsvd4[3];
};

struct nvme_nvm_command {
	union {
		struct nvme_common_command common;
		struct nvme_nvm_ph_rw ph_rw;
115 116
		struct nvme_nvm_erase_blk erase;
		struct nvme_nvm_identity identity;
117 118
		struct nvme_nvm_getbbtbl get_bb;
		struct nvme_nvm_setbbtbl set_bb;
M
Matias Bjørling 已提交
119 120 121
	};
};

122
struct nvme_nvm_id12_grp {
M
Matias Bjørling 已提交
123 124 125 126 127 128
	__u8			mtype;
	__u8			fmtype;
	__le16			res16;
	__u8			num_ch;
	__u8			num_lun;
	__u8			num_pln;
129
	__u8			rsvd1;
130
	__le16			num_chk;
M
Matias Bjørling 已提交
131 132 133 134
	__le16			num_pg;
	__le16			fpg_sz;
	__le16			csecs;
	__le16			sos;
135
	__le16			rsvd2;
M
Matias Bjørling 已提交
136 137 138 139 140 141 142
	__le32			trdt;
	__le32			trdm;
	__le32			tprt;
	__le32			tprm;
	__le32			tbet;
	__le32			tbem;
	__le32			mpos;
143
	__le32			mccap;
M
Matias Bjørling 已提交
144
	__le16			cpar;
145
	__u8			reserved[906];
M
Matias Bjørling 已提交
146 147
} __packed;

148
struct nvme_nvm_id12_addrf {
M
Matias Bjørling 已提交
149 150 151 152 153 154 155 156 157 158
	__u8			ch_offset;
	__u8			ch_len;
	__u8			lun_offset;
	__u8			lun_len;
	__u8			pln_offset;
	__u8			pln_len;
	__u8			blk_offset;
	__u8			blk_len;
	__u8			pg_offset;
	__u8			pg_len;
159 160
	__u8			sec_offset;
	__u8			sec_len;
M
Matias Bjørling 已提交
161 162 163
	__u8			res[4];
} __packed;

164
struct nvme_nvm_id12 {
M
Matias Bjørling 已提交
165 166 167
	__u8			ver_id;
	__u8			vmnt;
	__u8			cgrps;
168
	__u8			res;
M
Matias Bjørling 已提交
169 170
	__le32			cap;
	__le32			dom;
171
	struct nvme_nvm_id12_addrf ppaf;
172
	__u8			resv[228];
173
	struct nvme_nvm_id12_grp grp;
174
	__u8			resv2[2880];
M
Matias Bjørling 已提交
175 176
} __packed;

177 178 179 180 181 182 183 184 185 186 187 188 189 190
/*
 * Bad block table returned by the "get bad block table" admin command.
 *
 * The fixed header must be exactly 64 bytes, which is enforced in
 * _nvme_nvm_check_size(). It is followed by one state byte per block.
 * The trailing array is a C99 flexible array member, so it does not
 * contribute to sizeof().
 */
struct nvme_nvm_bb_tbl {
	__u8	tblid[4];	/* checked against the bytes 'B','B','L','T' */
	__le16	verid;		/* only version 1 is accepted */
	__le16	revid;
	__le32	rvsd1;
	__le32	tblks;		/* number of entries in blk[] */
	__le32	tfact;
	__le32	tgrown;
	__le32	tdresv;
	__le32	thresv;
	__le32	rsvd2[8];
	__u8	blk[];
};

191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242
/*
 * 2.0 address format: bit length of each address component. Must be
 * exactly 8 bytes, which is enforced in _nvme_nvm_check_size().
 */
struct nvme_nvm_id20_addrf {
	__u8			grp_len;	/* group */
	__u8			pu_len;		/* parallel unit */
	__u8			chk_len;	/* chunk */
	__u8			lba_len;	/* logical block */
	__u8			resv[4];
};

/*
 * 2.0 identity (geometry) page, parsed by nvme_nvm_setup_20(). Must be
 * exactly NVME_IDENTIFY_DATA_SIZE bytes, which is enforced in
 * _nvme_nvm_check_size().
 */
struct nvme_nvm_id20 {
	/* Version */
	__u8			mjr;
	__u8			mnr;
	__u8			resv[6];

	/* Address format */
	struct nvme_nvm_id20_addrf lbaf;

	/* Capabilities */
	__le32			mccap;
	__u8			resv2[12];

	__u8			wit;
	__u8			resv3[31];

	/* Geometry */
	__le16			num_grp;
	__le16			num_pu;
	__le32			num_chk;
	__le32			clba;
	__u8			resv4[52];

	/* Write data requirements */
	__le32			ws_min;
	__le32			ws_opt;
	__le32			mw_cunits;
	__le32			maxoc;
	__le32			maxocpu;
	__u8			resv5[44];

	/* Performance related metrics */
	__le32			trdt;
	__le32			trdm;
	__le32			twrt;
	__le32			twrm;
	__le32			tcrst;
	__le32			tcrsm;
	__u8			resv6[40];

	/* Reserved area */
	__u8			resv7[2816];

	/* Vendor specific */
	__u8			vs[1024];
};

243 244 245 246 247 248 249 250 251 252
/*
 * One chunk descriptor as it appears in the REPORT CHUNK log page.
 * Must be 32 bytes and the same size as struct nvm_chk_meta (both are
 * enforced in _nvme_nvm_check_size()), because nvme_nvm_get_chk_meta()
 * converts entries in place.
 */
struct nvme_nvm_chk_meta {
	__u8	state;
	__u8	type;
	__u8	wi;
	__u8	rsvd[5];
	__le64	slba;
	__le64	cnlb;
	__le64	wp;
};

M
Matias Bjørling 已提交
253 254 255 256 257 258 259
/*
 * Check we didn't inadvertently grow the command struct
 */
static inline void _nvme_nvm_check_size(void)
{
	BUILD_BUG_ON(sizeof(struct nvme_nvm_identity) != 64);
	BUILD_BUG_ON(sizeof(struct nvme_nvm_ph_rw) != 64);
260
	BUILD_BUG_ON(sizeof(struct nvme_nvm_erase_blk) != 64);
261 262
	BUILD_BUG_ON(sizeof(struct nvme_nvm_getbbtbl) != 64);
	BUILD_BUG_ON(sizeof(struct nvme_nvm_setbbtbl) != 64);
263 264 265
	BUILD_BUG_ON(sizeof(struct nvme_nvm_id12_grp) != 960);
	BUILD_BUG_ON(sizeof(struct nvme_nvm_id12_addrf) != 16);
	BUILD_BUG_ON(sizeof(struct nvme_nvm_id12) != NVME_IDENTIFY_DATA_SIZE);
266
	BUILD_BUG_ON(sizeof(struct nvme_nvm_bb_tbl) != 64);
267 268
	BUILD_BUG_ON(sizeof(struct nvme_nvm_id20_addrf) != 8);
	BUILD_BUG_ON(sizeof(struct nvme_nvm_id20) != NVME_IDENTIFY_DATA_SIZE);
269 270 271
	BUILD_BUG_ON(sizeof(struct nvme_nvm_chk_meta) != 32);
	BUILD_BUG_ON(sizeof(struct nvme_nvm_chk_meta) !=
						sizeof(struct nvm_chk_meta));
M
Matias Bjørling 已提交
272 273
}

274 275 276 277 278 279 280 281
/*
 * Copy the 1.2 address format reported by the device into @dst and derive
 * a bit mask for every component from its length and offset.
 */
static void nvme_nvm_set_addr_12(struct nvm_addrf_12 *dst,
				 struct nvme_nvm_id12_addrf *src)
{
	/* channel */
	dst->ch_len = src->ch_len;
	dst->ch_offset = src->ch_offset;
	dst->ch_mask = ((1ULL << dst->ch_len) - 1) << dst->ch_offset;

	/* LUN */
	dst->lun_len = src->lun_len;
	dst->lun_offset = src->lun_offset;
	dst->lun_mask = ((1ULL << dst->lun_len) - 1) << dst->lun_offset;

	/* block */
	dst->blk_len = src->blk_len;
	dst->blk_offset = src->blk_offset;
	dst->blk_mask = ((1ULL << dst->blk_len) - 1) << dst->blk_offset;

	/* page */
	dst->pg_len = src->pg_len;
	dst->pg_offset = src->pg_offset;
	dst->pg_mask = ((1ULL << dst->pg_len) - 1) << dst->pg_offset;

	/* plane */
	dst->pln_len = src->pln_len;
	dst->pln_offset = src->pln_offset;
	dst->pln_mask = ((1ULL << dst->pln_len) - 1) << dst->pln_offset;

	/* sector */
	dst->sec_len = src->sec_len;
	dst->sec_offset = src->sec_offset;
	dst->sec_mask = ((1ULL << dst->sec_len) - 1) << dst->sec_offset;
}

static int nvme_nvm_setup_12(struct nvme_nvm_id12 *id,
			     struct nvm_geo *geo)
M
Matias Bjørling 已提交
301
{
302
	struct nvme_nvm_id12_grp *src;
303
	int sec_per_pg, sec_per_pl, pg_per_blk;
304

305 306 307 308 309 310 311
	if (id->cgrps != 1)
		return -EINVAL;

	src = &id->grp;

	if (src->mtype != 0) {
		pr_err("nvm: memory type not supported\n");
312
		return -EINVAL;
313
	}
314

315 316 317
	/* 1.2 spec. only reports a single version id - unfold */
	geo->major_ver_id = id->ver_id;
	geo->minor_ver_id = 2;
318

319 320 321
	/* Set compacted version for upper layers */
	geo->version = NVM_OCSSD_SPEC_12;

322 323 324
	geo->num_ch = src->num_ch;
	geo->num_lun = src->num_lun;
	geo->all_luns = geo->num_ch * geo->num_lun;
325

326
	geo->num_chk = le16_to_cpu(src->num_chk);
327

328 329
	geo->csecs = le16_to_cpu(src->csecs);
	geo->sos = le16_to_cpu(src->sos);
330 331

	pg_per_blk = le16_to_cpu(src->num_pg);
332
	sec_per_pg = le16_to_cpu(src->fpg_sz) / geo->csecs;
333
	sec_per_pl = sec_per_pg * src->num_pln;
334 335
	geo->clba = sec_per_pl * pg_per_blk;

336
	geo->all_chunks = geo->all_luns * geo->num_chk;
337 338 339 340 341
	geo->total_secs = geo->clba * geo->all_chunks;

	geo->ws_min = sec_per_pg;
	geo->ws_opt = sec_per_pg;
	geo->mw_cunits = geo->ws_opt << 3;	/* default to MLC safe values */
342

343 344 345 346
	/* Do not impose values for maximum number of open blocks as it is
	 * unspecified in 1.2. Users of 1.2 must be aware of this and eventually
	 * specify these values through a quirk if restrictions apply.
	 */
347 348
	geo->maxoc = geo->all_luns * geo->num_chk;
	geo->maxocpu = geo->num_chk;
349

350 351 352 353 354 355 356 357
	geo->mccap = le32_to_cpu(src->mccap);

	geo->trdt = le32_to_cpu(src->trdt);
	geo->trdm = le32_to_cpu(src->trdm);
	geo->tprt = le32_to_cpu(src->tprt);
	geo->tprm = le32_to_cpu(src->tprm);
	geo->tbet = le32_to_cpu(src->tbet);
	geo->tbem = le32_to_cpu(src->tbem);
358 359

	/* 1.2 compatibility */
360 361 362 363 364 365 366 367 368 369
	geo->vmnt = id->vmnt;
	geo->cap = le32_to_cpu(id->cap);
	geo->dom = le32_to_cpu(id->dom);

	geo->mtype = src->mtype;
	geo->fmtype = src->fmtype;

	geo->cpar = le16_to_cpu(src->cpar);
	geo->mpos = le32_to_cpu(src->mpos);

370
	geo->pln_mode = NVM_PLANE_SINGLE;
371 372

	if (geo->mpos & 0x020202) {
373
		geo->pln_mode = NVM_PLANE_DOUBLE;
374 375
		geo->ws_opt <<= 1;
	} else if (geo->mpos & 0x040404) {
376
		geo->pln_mode = NVM_PLANE_QUAD;
377 378 379 380 381 382 383 384
		geo->ws_opt <<= 2;
	}

	geo->num_pln = src->num_pln;
	geo->num_pg = le16_to_cpu(src->num_pg);
	geo->fpg_sz = le16_to_cpu(src->fpg_sz);

	nvme_nvm_set_addr_12((struct nvm_addrf_12 *)&geo->addrf, &id->ppaf);
385

M
Matias Bjørling 已提交
386 387 388
	return 0;
}

389 390
static void nvme_nvm_set_addr_20(struct nvm_addrf *dst,
				 struct nvme_nvm_id20_addrf *src)
391
{
392 393 394 395 396 397 398 399 400 401 402 403 404 405
	dst->ch_len = src->grp_len;
	dst->lun_len = src->pu_len;
	dst->chk_len = src->chk_len;
	dst->sec_len = src->lba_len;

	dst->sec_offset = 0;
	dst->chk_offset = dst->sec_len;
	dst->lun_offset = dst->chk_offset + dst->chk_len;
	dst->ch_offset = dst->lun_offset + dst->lun_len;

	dst->ch_mask = ((1ULL << dst->ch_len) - 1) << dst->ch_offset;
	dst->lun_mask = ((1ULL << dst->lun_len) - 1) << dst->lun_offset;
	dst->chk_mask = ((1ULL << dst->chk_len) - 1) << dst->chk_offset;
	dst->sec_mask = ((1ULL << dst->sec_len) - 1) << dst->sec_offset;
406 407
}

408 409
static int nvme_nvm_setup_20(struct nvme_nvm_id20 *id,
			     struct nvm_geo *geo)
410
{
411 412 413
	geo->major_ver_id = id->mjr;
	geo->minor_ver_id = id->mnr;

414 415 416
	/* Set compacted version for upper layers */
	geo->version = NVM_OCSSD_SPEC_20;

417 418 419 420 421
	if (!(geo->major_ver_id == 2 && geo->minor_ver_id == 0)) {
		pr_err("nvm: OCSSD version not supported (v%d.%d)\n",
				geo->major_ver_id, geo->minor_ver_id);
		return -EINVAL;
	}
422

423 424 425
	geo->num_ch = le16_to_cpu(id->num_grp);
	geo->num_lun = le16_to_cpu(id->num_pu);
	geo->all_luns = geo->num_ch * geo->num_lun;
426

427
	geo->num_chk = le32_to_cpu(id->num_chk);
428
	geo->clba = le32_to_cpu(id->clba);
429

430
	geo->all_chunks = geo->all_luns * geo->num_chk;
431
	geo->total_secs = geo->clba * geo->all_chunks;
432

433 434 435
	geo->ws_min = le32_to_cpu(id->ws_min);
	geo->ws_opt = le32_to_cpu(id->ws_opt);
	geo->mw_cunits = le32_to_cpu(id->mw_cunits);
436 437
	geo->maxoc = le32_to_cpu(id->maxoc);
	geo->maxocpu = le32_to_cpu(id->maxocpu);
438

439 440 441 442 443 444 445 446
	geo->trdt = le32_to_cpu(id->trdt);
	geo->trdm = le32_to_cpu(id->trdm);
	geo->tprt = le32_to_cpu(id->twrt);
	geo->tprm = le32_to_cpu(id->twrm);
	geo->tbet = le32_to_cpu(id->tcrst);
	geo->tbem = le32_to_cpu(id->tcrsm);

	nvme_nvm_set_addr_20(&geo->addrf, &id->lbaf);
447 448 449 450

	return 0;
}

451
static int nvme_nvm_identity(struct nvm_dev *nvmdev)
M
Matias Bjørling 已提交
452
{
453
	struct nvme_ns *ns = nvmdev->q->queuedata;
454
	struct nvme_nvm_id12 *id;
M
Matias Bjørling 已提交
455 456 457 458
	struct nvme_nvm_command c = {};
	int ret;

	c.identity.opcode = nvme_nvm_admin_identity;
C
Christoph Hellwig 已提交
459
	c.identity.nsid = cpu_to_le32(ns->head->ns_id);
M
Matias Bjørling 已提交
460

461 462
	id = kmalloc(sizeof(struct nvme_nvm_id12), GFP_KERNEL);
	if (!id)
M
Matias Bjørling 已提交
463 464
		return -ENOMEM;

465
	ret = nvme_submit_sync_cmd(ns->ctrl->admin_q, (struct nvme_command *)&c,
466
				id, sizeof(struct nvme_nvm_id12));
M
Matias Bjørling 已提交
467 468 469 470 471
	if (ret) {
		ret = -EIO;
		goto out;
	}

472 473 474 475 476 477
	/*
	 * The 1.2 and 2.0 specifications share the first byte in their geometry
	 * command to make it possible to know what version a device implements.
	 */
	switch (id->ver_id) {
	case 1:
478
		ret = nvme_nvm_setup_12(id, &nvmdev->geo);
479 480
		break;
	case 2:
481 482
		ret = nvme_nvm_setup_20((struct nvme_nvm_id20 *)id,
							&nvmdev->geo);
483 484
		break;
	default:
485 486
		dev_err(ns->ctrl->device, "OCSSD revision not supported (%d)\n",
							id->ver_id);
487 488
		ret = -EINVAL;
	}
489

M
Matias Bjørling 已提交
490
out:
491
	kfree(id);
M
Matias Bjørling 已提交
492 493 494
	return ret;
}

495
static int nvme_nvm_get_bb_tbl(struct nvm_dev *nvmdev, struct ppa_addr ppa,
496
								u8 *blks)
M
Matias Bjørling 已提交
497
{
498
	struct request_queue *q = nvmdev->q;
499
	struct nvm_geo *geo = &nvmdev->geo;
M
Matias Bjørling 已提交
500
	struct nvme_ns *ns = q->queuedata;
501
	struct nvme_ctrl *ctrl = ns->ctrl;
M
Matias Bjørling 已提交
502
	struct nvme_nvm_command c = {};
503
	struct nvme_nvm_bb_tbl *bb_tbl;
504
	int nr_blks = geo->num_chk * geo->num_pln;
505
	int tblsz = sizeof(struct nvme_nvm_bb_tbl) + nr_blks;
M
Matias Bjørling 已提交
506 507 508
	int ret = 0;

	c.get_bb.opcode = nvme_nvm_admin_get_bb_tbl;
C
Christoph Hellwig 已提交
509
	c.get_bb.nsid = cpu_to_le32(ns->head->ns_id);
510
	c.get_bb.spba = cpu_to_le64(ppa.ppa);
M
Matias Bjørling 已提交
511

512 513 514
	bb_tbl = kzalloc(tblsz, GFP_KERNEL);
	if (!bb_tbl)
		return -ENOMEM;
M
Matias Bjørling 已提交
515

516
	ret = nvme_submit_sync_cmd(ctrl->admin_q, (struct nvme_command *)&c,
517
								bb_tbl, tblsz);
M
Matias Bjørling 已提交
518
	if (ret) {
519
		dev_err(ctrl->device, "get bad block table failed (%d)\n", ret);
M
Matias Bjørling 已提交
520 521 522 523
		ret = -EIO;
		goto out;
	}

524 525
	if (bb_tbl->tblid[0] != 'B' || bb_tbl->tblid[1] != 'B' ||
		bb_tbl->tblid[2] != 'L' || bb_tbl->tblid[3] != 'T') {
526
		dev_err(ctrl->device, "bbt format mismatch\n");
527 528 529 530 531 532
		ret = -EINVAL;
		goto out;
	}

	if (le16_to_cpu(bb_tbl->verid) != 1) {
		ret = -EINVAL;
533
		dev_err(ctrl->device, "bbt version not supported\n");
534 535 536
		goto out;
	}

537
	if (le32_to_cpu(bb_tbl->tblks) != nr_blks) {
538
		ret = -EINVAL;
539 540
		dev_err(ctrl->device,
				"bbt unsuspected blocks returned (%u!=%u)",
541
				le32_to_cpu(bb_tbl->tblks), nr_blks);
542 543 544
		goto out;
	}

545
	memcpy(blks, bb_tbl->blk, geo->num_chk * geo->num_pln);
M
Matias Bjørling 已提交
546
out:
547 548 549 550
	kfree(bb_tbl);
	return ret;
}

551 552
static int nvme_nvm_set_bb_tbl(struct nvm_dev *nvmdev, struct ppa_addr *ppas,
							int nr_ppas, int type)
553
{
554
	struct nvme_ns *ns = nvmdev->q->queuedata;
555 556 557 558
	struct nvme_nvm_command c = {};
	int ret = 0;

	c.set_bb.opcode = nvme_nvm_admin_set_bb_tbl;
C
Christoph Hellwig 已提交
559
	c.set_bb.nsid = cpu_to_le32(ns->head->ns_id);
560 561
	c.set_bb.spba = cpu_to_le64(ppas->ppa);
	c.set_bb.nlb = cpu_to_le16(nr_ppas - 1);
562 563
	c.set_bb.value = type;

564
	ret = nvme_submit_sync_cmd(ns->ctrl->admin_q, (struct nvme_command *)&c,
565
								NULL, 0);
566
	if (ret)
567 568
		dev_err(ns->ctrl->device, "set bad block table failed (%d)\n",
									ret);
M
Matias Bjørling 已提交
569 570 571
	return ret;
}

572 573 574 575 576 577 578 579 580 581 582 583 584 585
/*
 * Read metadata for @nchks chunks starting at @slba from the REPORT CHUNK
 * log page into @meta, converting each entry to CPU byte order in place.
 *
 * Expect the lba in device format.
 *
 * Returns 0 on success (including when @nchks is 0) or the error returned
 * by nvme_get_log_ext().
 */
static int nvme_nvm_get_chk_meta(struct nvm_dev *ndev,
				 struct nvm_chk_meta *meta,
				 sector_t slba, int nchks)
{
	struct nvm_geo *geo = &ndev->geo;
	struct nvme_ns *ns = ndev->q->queuedata;
	struct nvme_ctrl *ctrl = ns->ctrl;
	/*
	 * The device and generic layouts have the same size (enforced in
	 * _nvme_nvm_check_size()), so the log is read straight into @meta.
	 */
	struct nvme_nvm_chk_meta *dev_meta = (struct nvme_nvm_chk_meta *)meta;
	struct ppa_addr ppa;
	size_t left = nchks * sizeof(struct nvme_nvm_chk_meta);
	size_t log_pos, offset, len, i;
	/* ret must start at 0: the loop below does not run when left is 0 */
	int ret = 0, max_len;

	/*
	 * limit requests to maximum 256K to avoid issuing arbitrary large
	 * requests when the device does not specify a maximum transfer size.
	 */
	max_len = min_t(unsigned int, ctrl->max_hw_sectors << 9, 256 * 1024);

	/* Normalize lba address space to obtain log offset */
	ppa.ppa = slba;
	ppa = dev_to_generic_addr(ndev, ppa);

	log_pos = ppa.m.chk;
	log_pos += ppa.m.pu * geo->num_chk;
	log_pos += ppa.m.grp * geo->num_lun * geo->num_chk;

	offset = log_pos * sizeof(struct nvme_nvm_chk_meta);

	while (left) {
		len = min_t(unsigned int, left, max_len);

		ret = nvme_get_log_ext(ctrl, ns, NVME_NVM_LOG_REPORT_CHUNK,
				dev_meta, len, offset);
		if (ret) {
			dev_err(ctrl->device, "Get REPORT CHUNK log error\n");
			break;
		}

		/* Convert every entry of this batch in place. */
		for (i = 0; i < len; i += sizeof(struct nvme_nvm_chk_meta)) {
			meta->state = dev_meta->state;
			meta->type = dev_meta->type;
			meta->wi = dev_meta->wi;
			meta->slba = le64_to_cpu(dev_meta->slba);
			meta->cnlb = le64_to_cpu(dev_meta->cnlb);
			meta->wp = le64_to_cpu(dev_meta->wp);

			meta++;
			dev_meta++;
		}

		offset += len;
		left -= len;
	}

	return ret;
}

633 634
static inline void nvme_nvm_rqtocmd(struct nvm_rq *rqd, struct nvme_ns *ns,
				    struct nvme_nvm_command *c)
M
Matias Bjørling 已提交
635 636
{
	c->ph_rw.opcode = rqd->opcode;
C
Christoph Hellwig 已提交
637
	c->ph_rw.nsid = cpu_to_le32(ns->head->ns_id);
M
Matias Bjørling 已提交
638
	c->ph_rw.spba = cpu_to_le64(rqd->ppa_addr.ppa);
639
	c->ph_rw.metadata = cpu_to_le64(rqd->dma_meta_list);
M
Matias Bjørling 已提交
640
	c->ph_rw.control = cpu_to_le16(rqd->flags);
641
	c->ph_rw.length = cpu_to_le16(rqd->nr_ppas - 1);
M
Matias Bjørling 已提交
642 643
}

644
/*
 * Completion callback for requests submitted by nvme_nvm_submit_io().
 * Copies the result and status into the nvm_rq stored in end_io_data,
 * completes it, then frees the command buffer and the request.
 * @status is not used.
 */
static void nvme_nvm_end_io(struct request *rq, blk_status_t status)
{
	struct nvm_rq *rqd = rq->end_io_data;

	/* Report the outcome to the upper layer first. */
	rqd->ppa_status = le64_to_cpu(nvme_req(rq)->result.u64);
	rqd->error = nvme_req(rq)->status;
	nvm_end_io(rqd);

	/* The command buffer is the one allocated in nvme_nvm_submit_io(). */
	kfree(nvme_req(rq)->cmd);
	blk_mq_free_request(rq);
}

656 657 658
static struct request *nvme_nvm_alloc_request(struct request_queue *q,
					      struct nvm_rq *rqd,
					      struct nvme_nvm_command *cmd)
M
Matias Bjørling 已提交
659 660 661 662
{
	struct nvme_ns *ns = q->queuedata;
	struct request *rq;

663
	nvme_nvm_rqtocmd(rqd, ns, cmd);
664

665
	rq = nvme_alloc_request(q, (struct nvme_command *)cmd, 0, NVME_QID_ANY);
666 667 668
	if (IS_ERR(rq))
		return rq;

669
	rq->cmd_flags &= ~REQ_FAILFAST_DRIVER;
M
Matias Bjørling 已提交
670

671
	if (rqd->bio)
672
		blk_init_request_from_bio(rq, rqd->bio);
673
	else
674
		rq->ioprio = IOPRIO_PRIO_VALUE(IOPRIO_CLASS_BE, IOPRIO_NORM);
M
Matias Bjørling 已提交
675

676 677 678 679 680 681 682 683 684 685 686 687 688 689 690 691 692 693 694
	return rq;
}

static int nvme_nvm_submit_io(struct nvm_dev *dev, struct nvm_rq *rqd)
{
	struct request_queue *q = dev->q;
	struct nvme_nvm_command *cmd;
	struct request *rq;

	cmd = kzalloc(sizeof(struct nvme_nvm_command), GFP_KERNEL);
	if (!cmd)
		return -ENOMEM;

	rq = nvme_nvm_alloc_request(q, rqd, cmd);
	if (IS_ERR(rq)) {
		kfree(cmd);
		return PTR_ERR(rq);
	}

M
Matias Bjørling 已提交
695 696 697 698 699 700 701
	rq->end_io_data = rqd;

	blk_execute_rq_nowait(q, NULL, rq, 0, nvme_nvm_end_io);

	return 0;
}

702 703 704 705 706 707 708 709 710 711 712 713 714 715 716 717 718 719 720 721 722 723 724 725 726 727 728 729
static int nvme_nvm_submit_io_sync(struct nvm_dev *dev, struct nvm_rq *rqd)
{
	struct request_queue *q = dev->q;
	struct request *rq;
	struct nvme_nvm_command cmd;
	int ret = 0;

	memset(&cmd, 0, sizeof(struct nvme_nvm_command));

	rq = nvme_nvm_alloc_request(q, rqd, &cmd);
	if (IS_ERR(rq))
		return PTR_ERR(rq);

	/* I/Os can fail and the error is signaled through rqd. Callers must
	 * handle the error accordingly.
	 */
	blk_execute_rq(q, NULL, rq, 0);
	if (nvme_req(rq)->flags & NVME_REQ_CANCELLED)
		ret = -EINTR;

	rqd->ppa_status = le64_to_cpu(nvme_req(rq)->result.u64);
	rqd->error = nvme_req(rq)->status;

	blk_mq_free_request(rq);

	return ret;
}

730
static void *nvme_nvm_create_dma_pool(struct nvm_dev *nvmdev, char *name)
M
Matias Bjørling 已提交
731
{
732
	struct nvme_ns *ns = nvmdev->q->queuedata;
M
Matias Bjørling 已提交
733

734
	return dma_pool_create(name, ns->ctrl->dev, PAGE_SIZE, PAGE_SIZE, 0);
M
Matias Bjørling 已提交
735 736 737 738 739 740 741 742 743
}

/* Destroy the DMA pool passed in as the opaque pointer @pool. */
static void nvme_nvm_destroy_dma_pool(void *pool)
{
	dma_pool_destroy((struct dma_pool *)pool);
}

744
static void *nvme_nvm_dev_dma_alloc(struct nvm_dev *dev, void *pool,
M
Matias Bjørling 已提交
745 746 747 748 749
				    gfp_t mem_flags, dma_addr_t *dma_handler)
{
	return dma_pool_alloc(pool, mem_flags, dma_handler);
}

750
static void nvme_nvm_dev_dma_free(void *pool, void *addr,
M
Matias Bjørling 已提交
751 752
							dma_addr_t dma_handler)
{
753
	dma_pool_free(pool, addr, dma_handler);
M
Matias Bjørling 已提交
754 755 756 757 758 759
}

static struct nvm_dev_ops nvme_nvm_dev_ops = {
	.identity		= nvme_nvm_identity,

	.get_bb_tbl		= nvme_nvm_get_bb_tbl,
760
	.set_bb_tbl		= nvme_nvm_set_bb_tbl,
M
Matias Bjørling 已提交
761

762 763
	.get_chk_meta		= nvme_nvm_get_chk_meta,

M
Matias Bjørling 已提交
764
	.submit_io		= nvme_nvm_submit_io,
765
	.submit_io_sync		= nvme_nvm_submit_io_sync,
M
Matias Bjørling 已提交
766 767 768 769 770 771 772

	.create_dma_pool	= nvme_nvm_create_dma_pool,
	.destroy_dma_pool	= nvme_nvm_destroy_dma_pool,
	.dev_dma_alloc		= nvme_nvm_dev_dma_alloc,
	.dev_dma_free		= nvme_nvm_dev_dma_free,
};

773 774 775 776 777 778 779 780 781 782 783 784 785 786 787 788 789 790
/*
 * Execute a user-supplied command synchronously on @q.
 *
 * @ubuf/@bufflen:      user data buffer, mapped into the request.
 * @meta_buf/@meta_len: user metadata, bounced through a DMA pool element.
 *                      It is only used when a data buffer is also given.
 * @ppa_buf/@ppa_len:   user ppa list of (@ppa_len + 1) 64-bit entries,
 *                      bounced through a DMA pool element. When @ppa_len
 *                      is 0, @ppa_buf itself is placed in the command.
 * @result/@status:     optional outputs for the status code and the
 *                      64-bit completion result.
 * @timeout:            request timeout; 0 selects ADMIN_TIMEOUT.
 *
 * Both bounce buffers come from dev->dma_pool. The only pool this file
 * creates has PAGE_SIZE elements (nvme_nvm_create_dma_pool()), so any
 * user length that does not fit in one page is rejected.
 * NOTE(review): assumes dev->dma_pool is that pool - confirm in the
 * lightnvm core.
 *
 * Returns 0 on success, -EINVAL for oversized buffers, -ENOMEM, -EFAULT,
 * -EINTR if the request was cancelled, -EIO if the device reported an
 * error status, or the error from blk_rq_map_user().
 */
static int nvme_nvm_submit_user_cmd(struct request_queue *q,
				struct nvme_ns *ns,
				struct nvme_nvm_command *vcmd,
				void __user *ubuf, unsigned int bufflen,
				void __user *meta_buf, unsigned int meta_len,
				void __user *ppa_buf, unsigned int ppa_len,
				u32 *result, u64 *status, unsigned int timeout)
{
	bool write = nvme_is_write((struct nvme_command *)vcmd);
	struct nvm_dev *dev = ns->ndev;
	struct gendisk *disk = ns->disk;
	struct request *rq;
	struct bio *bio = NULL;
	__le64 *ppa_list = NULL;
	dma_addr_t ppa_dma;
	__le64 *metadata = NULL;
	dma_addr_t metadata_dma;
	int ret = 0;

	rq = nvme_alloc_request(q, (struct nvme_command *)vcmd, 0,
			NVME_QID_ANY);
	if (IS_ERR(rq)) {
		ret = -ENOMEM;
		goto err_cmd;
	}

	rq->timeout = timeout ? timeout : ADMIN_TIMEOUT;

	if (ppa_buf && ppa_len) {
		/* (ppa_len + 1) entries must fit in one pool element. */
		if (ppa_len >= PAGE_SIZE / sizeof(u64)) {
			ret = -EINVAL;
			goto err_rq;
		}

		ppa_list = dma_pool_alloc(dev->dma_pool, GFP_KERNEL, &ppa_dma);
		if (!ppa_list) {
			ret = -ENOMEM;
			goto err_rq;
		}
		if (copy_from_user(ppa_list, (void __user *)ppa_buf,
						sizeof(u64) * (ppa_len + 1))) {
			ret = -EFAULT;
			goto err_ppa;
		}
		vcmd->ph_rw.spba = cpu_to_le64(ppa_dma);
	} else {
		vcmd->ph_rw.spba = cpu_to_le64((uintptr_t)ppa_buf);
	}

	if (ubuf && bufflen) {
		ret = blk_rq_map_user(q, rq, NULL, ubuf, bufflen, GFP_KERNEL);
		if (ret)
			goto err_ppa;
		bio = rq->bio;

		if (meta_buf && meta_len) {
			/* The metadata must fit in one pool element. */
			if (meta_len > PAGE_SIZE) {
				ret = -EINVAL;
				goto err_map;
			}

			metadata = dma_pool_alloc(dev->dma_pool, GFP_KERNEL,
								&metadata_dma);
			if (!metadata) {
				ret = -ENOMEM;
				goto err_map;
			}

			if (write) {
				if (copy_from_user(metadata,
						(void __user *)meta_buf,
						meta_len)) {
					ret = -EFAULT;
					goto err_meta;
				}
			}
			vcmd->ph_rw.metadata = cpu_to_le64(metadata_dma);
		}

		bio->bi_disk = disk;
	}

	blk_execute_rq(q, NULL, rq, 0);

	if (nvme_req(rq)->flags & NVME_REQ_CANCELLED)
		ret = -EINTR;
	else if (nvme_req(rq)->status & 0x7ff)
		ret = -EIO;
	if (result)
		*result = nvme_req(rq)->status & 0x7ff;
	if (status)
		*status = le64_to_cpu(nvme_req(rq)->result.u64);

	if (metadata && !ret && !write) {
		if (copy_to_user(meta_buf, (void *)metadata, meta_len))
			ret = -EFAULT;
	}
err_meta:
	/*
	 * Free only what was allocated: metadata stays NULL when the caller
	 * passed meta_buf without a data buffer.
	 */
	if (metadata)
		dma_pool_free(dev->dma_pool, metadata, metadata_dma);
err_map:
	if (bio)
		blk_rq_unmap_user(bio);
err_ppa:
	if (ppa_list)
		dma_pool_free(dev->dma_pool, ppa_list, ppa_dma);
err_rq:
	blk_mq_free_request(rq);
err_cmd:
	return ret;
}

/*
 * Handle NVME_NVM_IOCTL_SUBMIT_VIO: build a read/write command from the
 * user's nvm_user_vio and execute it on the namespace I/O queue.
 *
 * The structure is copied back to user space only when the command
 * returns an error. Returns -EFAULT on a failed user copy, -EINVAL when
 * vio.flags is set, otherwise the result of nvme_nvm_submit_user_cmd().
 */
static int nvme_nvm_submit_vio(struct nvme_ns *ns,
					struct nvm_user_vio __user *uvio)
{
	struct nvm_user_vio vio;
	struct nvme_nvm_command cmd;
	unsigned int data_len;
	int ret;

	if (copy_from_user(&vio, uvio, sizeof(vio)))
		return -EFAULT;
	if (vio.flags)
		return -EINVAL;

	memset(&cmd, 0, sizeof(cmd));
	cmd.ph_rw.opcode = vio.opcode;
	cmd.ph_rw.nsid = cpu_to_le32(ns->head->ns_id);
	cmd.ph_rw.control = cpu_to_le16(vio.control);
	cmd.ph_rw.length = cpu_to_le16(vio.nppas);

	/* the data buffer holds (nppas + 1) logical blocks */
	data_len = (vio.nppas + 1) << ns->lba_shift;

	ret = nvme_nvm_submit_user_cmd(ns->queue, ns, &cmd,
			(void __user *)(uintptr_t)vio.addr, data_len,
			(void __user *)(uintptr_t)vio.metadata,
							vio.metadata_len,
			(void __user *)(uintptr_t)vio.ppa_list, vio.nppas,
			&vio.result, &vio.status, 0);
	if (!ret)
		return 0;

	if (copy_to_user(uvio, &vio, sizeof(vio)))
		return -EFAULT;

	return ret;
}

/*
 * Handle the pass-through vector ioctls: build a command from the user's
 * nvm_passthru_vio and run it on the admin queue (@admin != 0) or on the
 * namespace I/O queue.
 *
 * Every opcode except "get bad block table" requires CAP_SYS_ADMIN. The
 * structure is copied back to user space only when the command returns
 * an error. Returns -EFAULT, -EACCES, -EINVAL, or the result of
 * nvme_nvm_submit_user_cmd().
 */
static int nvme_nvm_user_vcmd(struct nvme_ns *ns, int admin,
					struct nvm_passthru_vio __user *uvcmd)
{
	struct nvm_passthru_vio vcmd;
	struct nvme_nvm_command cmd;
	struct request_queue *queue;
	unsigned int timeout = 0;
	int ret;

	if (copy_from_user(&vcmd, uvcmd, sizeof(vcmd)))
		return -EFAULT;
	/* capable() is only consulted for privileged opcodes */
	if (vcmd.opcode != nvme_nvm_admin_get_bb_tbl &&
	    !capable(CAP_SYS_ADMIN))
		return -EACCES;
	if (vcmd.flags)
		return -EINVAL;

	memset(&cmd, 0, sizeof(cmd));
	cmd.common.opcode = vcmd.opcode;
	cmd.common.nsid = cpu_to_le32(ns->head->ns_id);
	cmd.common.cdw2[0] = cpu_to_le32(vcmd.cdw2);
	cmd.common.cdw2[1] = cpu_to_le32(vcmd.cdw3);
	/* cdw11-12 */
	cmd.ph_rw.length = cpu_to_le16(vcmd.nppas);
	cmd.ph_rw.control  = cpu_to_le16(vcmd.control);
	cmd.common.cdw10[3] = cpu_to_le32(vcmd.cdw13);
	cmd.common.cdw10[4] = cpu_to_le32(vcmd.cdw14);
	cmd.common.cdw10[5] = cpu_to_le32(vcmd.cdw15);

	if (vcmd.timeout_ms)
		timeout = msecs_to_jiffies(vcmd.timeout_ms);

	if (admin)
		queue = ns->ctrl->admin_q;
	else
		queue = ns->queue;

	ret = nvme_nvm_submit_user_cmd(queue, ns, &cmd,
			(void __user *)(uintptr_t)vcmd.addr, vcmd.data_len,
			(void __user *)(uintptr_t)vcmd.metadata,
							vcmd.metadata_len,
			(void __user *)(uintptr_t)vcmd.ppa_list, vcmd.nppas,
			&vcmd.result, &vcmd.status, timeout);
	if (!ret)
		return 0;

	if (copy_to_user(uvcmd, &vcmd, sizeof(vcmd)))
		return -EFAULT;

	return ret;
}

int nvme_nvm_ioctl(struct nvme_ns *ns, unsigned int cmd, unsigned long arg)
{
	switch (cmd) {
	case NVME_NVM_IOCTL_ADMIN_VIO:
		return nvme_nvm_user_vcmd(ns, 1, (void __user *)arg);
	case NVME_NVM_IOCTL_IO_VIO:
		return nvme_nvm_user_vcmd(ns, 0, (void __user *)arg);
	case NVME_NVM_IOCTL_SUBMIT_VIO:
		return nvme_nvm_submit_vio(ns, (void __user *)arg);
	default:
		return -ENOTTY;
	}
}

971 972 973
void nvme_nvm_update_nvm_info(struct nvme_ns *ns)
{
	struct nvm_dev *ndev = ns->ndev;
974
	struct nvm_geo *geo = &ndev->geo;
975

976 977
	geo->csecs = 1 << ns->lba_shift;
	geo->sos = ns->ms;
978 979
}

980
int nvme_nvm_register(struct nvme_ns *ns, char *disk_name, int node)
M
Matias Bjørling 已提交
981
{
982 983 984
	struct request_queue *q = ns->queue;
	struct nvm_dev *dev;

985 986
	_nvme_nvm_check_size();

987 988 989 990 991 992 993
	dev = nvm_alloc_dev(node);
	if (!dev)
		return -ENOMEM;

	dev->q = q;
	memcpy(dev->name, disk_name, DISK_NAME_LEN);
	dev->ops = &nvme_nvm_dev_ops;
994
	dev->private_data = ns;
995 996
	ns->ndev = dev;

997
	return nvm_register(dev);
M
Matias Bjørling 已提交
998 999
}

1000
void nvme_nvm_unregister(struct nvme_ns *ns)
M
Matias Bjørling 已提交
1001
{
1002
	nvm_unregister(ns->ndev);
M
Matias Bjørling 已提交
1003 1004
}

1005
static ssize_t nvm_dev_attr_show(struct device *dev,
1006
		struct device_attribute *dattr, char *page)
1007 1008 1009
{
	struct nvme_ns *ns = nvme_get_ns_from_dev(dev);
	struct nvm_dev *ndev = ns->ndev;
1010
	struct nvm_geo *geo = &ndev->geo;
1011 1012 1013 1014 1015 1016 1017 1018
	struct attribute *attr;

	if (!ndev)
		return 0;

	attr = &dattr->attr;

	if (strcmp(attr->name, "version") == 0) {
1019 1020 1021 1022 1023 1024 1025
		if (geo->major_ver_id == 1)
			return scnprintf(page, PAGE_SIZE, "%u\n",
						geo->major_ver_id);
		else
			return scnprintf(page, PAGE_SIZE, "%u.%u\n",
						geo->major_ver_id,
						geo->minor_ver_id);
1026
	} else if (strcmp(attr->name, "capabilities") == 0) {
1027
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->cap);
1028
	} else if (strcmp(attr->name, "read_typ") == 0) {
1029
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->trdt);
1030
	} else if (strcmp(attr->name, "read_max") == 0) {
1031
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->trdm);
1032 1033 1034
	} else {
		return scnprintf(page,
				 PAGE_SIZE,
1035 1036
				 "Unhandled attr(%s) in `%s`\n",
				 attr->name, __func__);
1037 1038 1039
	}
}

1040 1041 1042 1043 1044 1045 1046 1047 1048
/*
 * Print the 1.2 address format as one hex string: an (offset, len) byte
 * pair for channel, LUN, plane, block, page and sector, in that order.
 * Returns the number of bytes written to @page.
 */
static ssize_t nvm_dev_attr_show_ppaf(struct nvm_addrf_12 *ppaf, char *page)
{
	static const char fmt[] =
		"0x%02x%02x%02x%02x%02x%02x%02x%02x%02x%02x%02x%02x\n";

	return scnprintf(page, PAGE_SIZE, fmt,
			 ppaf->ch_offset, ppaf->ch_len,
			 ppaf->lun_offset, ppaf->lun_len,
			 ppaf->pln_offset, ppaf->pln_len,
			 ppaf->blk_offset, ppaf->blk_len,
			 ppaf->pg_offset, ppaf->pg_len,
			 ppaf->sec_offset, ppaf->sec_len);
}

1052 1053 1054 1055 1056
static ssize_t nvm_dev_attr_show_12(struct device *dev,
		struct device_attribute *dattr, char *page)
{
	struct nvme_ns *ns = nvme_get_ns_from_dev(dev);
	struct nvm_dev *ndev = ns->ndev;
1057
	struct nvm_geo *geo = &ndev->geo;
1058 1059 1060 1061 1062 1063 1064 1065
	struct attribute *attr;

	if (!ndev)
		return 0;

	attr = &dattr->attr;

	if (strcmp(attr->name, "vendor_opcode") == 0) {
1066
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->vmnt);
1067
	} else if (strcmp(attr->name, "device_mode") == 0) {
1068
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->dom);
1069
	/* kept for compatibility */
1070
	} else if (strcmp(attr->name, "media_manager") == 0) {
1071
		return scnprintf(page, PAGE_SIZE, "%s\n", "gennvm");
1072
	} else if (strcmp(attr->name, "ppa_format") == 0) {
1073
		return nvm_dev_attr_show_ppaf((void *)&geo->addrf, page);
1074
	} else if (strcmp(attr->name, "media_type") == 0) {	/* u8 */
1075
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->mtype);
1076
	} else if (strcmp(attr->name, "flash_media_type") == 0) {
1077
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->fmtype);
1078
	} else if (strcmp(attr->name, "num_channels") == 0) {
1079
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->num_ch);
1080
	} else if (strcmp(attr->name, "num_luns") == 0) {
1081
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->num_lun);
1082
	} else if (strcmp(attr->name, "num_planes") == 0) {
1083
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->num_pln);
1084
	} else if (strcmp(attr->name, "num_blocks") == 0) {	/* u16 */
1085
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->num_chk);
1086
	} else if (strcmp(attr->name, "num_pages") == 0) {
1087
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->num_pg);
1088
	} else if (strcmp(attr->name, "page_size") == 0) {
1089
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->fpg_sz);
1090
	} else if (strcmp(attr->name, "hw_sector_size") == 0) {
1091
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->csecs);
1092
	} else if (strcmp(attr->name, "oob_sector_size") == 0) {/* u32 */
1093
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->sos);
1094
	} else if (strcmp(attr->name, "prog_typ") == 0) {
1095
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->tprt);
1096
	} else if (strcmp(attr->name, "prog_max") == 0) {
1097
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->tprm);
1098
	} else if (strcmp(attr->name, "erase_typ") == 0) {
1099
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->tbet);
1100
	} else if (strcmp(attr->name, "erase_max") == 0) {
1101
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->tbem);
1102
	} else if (strcmp(attr->name, "multiplane_modes") == 0) {
1103
		return scnprintf(page, PAGE_SIZE, "0x%08x\n", geo->mpos);
1104
	} else if (strcmp(attr->name, "media_capabilities") == 0) {
1105
		return scnprintf(page, PAGE_SIZE, "0x%08x\n", geo->mccap);
1106
	} else if (strcmp(attr->name, "max_phys_secs") == 0) {
1107
		return scnprintf(page, PAGE_SIZE, "%u\n", NVM_MAX_VLBA);
1108
	} else {
1109
		return scnprintf(page, PAGE_SIZE,
1110 1111
			"Unhandled attr(%s) in `%s`\n",
			attr->name, __func__);
1112 1113 1114
	}
}

1115 1116 1117 1118 1119
static ssize_t nvm_dev_attr_show_20(struct device *dev,
		struct device_attribute *dattr, char *page)
{
	struct nvme_ns *ns = nvme_get_ns_from_dev(dev);
	struct nvm_dev *ndev = ns->ndev;
1120
	struct nvm_geo *geo = &ndev->geo;
1121 1122 1123 1124 1125 1126 1127 1128
	struct attribute *attr;

	if (!ndev)
		return 0;

	attr = &dattr->attr;

	if (strcmp(attr->name, "groups") == 0) {
1129
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->num_ch);
1130
	} else if (strcmp(attr->name, "punits") == 0) {
1131
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->num_lun);
1132
	} else if (strcmp(attr->name, "chunks") == 0) {
1133
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->num_chk);
1134
	} else if (strcmp(attr->name, "clba") == 0) {
1135
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->clba);
1136
	} else if (strcmp(attr->name, "ws_min") == 0) {
1137
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->ws_min);
1138
	} else if (strcmp(attr->name, "ws_opt") == 0) {
1139
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->ws_opt);
1140 1141 1142 1143
	} else if (strcmp(attr->name, "maxoc") == 0) {
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->maxoc);
	} else if (strcmp(attr->name, "maxocpu") == 0) {
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->maxocpu);
1144
	} else if (strcmp(attr->name, "mw_cunits") == 0) {
1145
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->mw_cunits);
1146
	} else if (strcmp(attr->name, "write_typ") == 0) {
1147
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->tprt);
1148
	} else if (strcmp(attr->name, "write_max") == 0) {
1149
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->tprm);
1150
	} else if (strcmp(attr->name, "reset_typ") == 0) {
1151
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->tbet);
1152
	} else if (strcmp(attr->name, "reset_max") == 0) {
1153
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->tbem);
1154
	} else {
1155
		return scnprintf(page, PAGE_SIZE,
1156 1157
			"Unhandled attr(%s) in `%s`\n",
			attr->name, __func__);
1158 1159 1160 1161
	}
}

/*
 * Helpers that expand to a read-only (mode 0444, no store callback)
 * DEVICE_ATTR for @_name.  The three variants differ only in which show
 * callback is wired up: the shared one, the 1.2 one or the 2.0 one.
 */
#define NVM_DEV_ATTR_RO(_name)					\
	DEVICE_ATTR(_name, 0444, nvm_dev_attr_show, NULL)
#define NVM_DEV_ATTR_12_RO(_name)					\
	DEVICE_ATTR(_name, 0444, nvm_dev_attr_show_12, NULL)
#define NVM_DEV_ATTR_20_RO(_name)					\
	DEVICE_ATTR(_name, 0444, nvm_dev_attr_show_20, NULL)
1167

1168
/* general attributes: served by nvm_dev_attr_show() */
static NVM_DEV_ATTR_RO(version);
static NVM_DEV_ATTR_RO(capabilities);
static NVM_DEV_ATTR_RO(read_typ);
static NVM_DEV_ATTR_RO(read_max);
1174 1175 1176 1177 1178 1179 1180 1181 1182 1183 1184 1185 1186 1187 1188 1189 1190 1191 1192 1193 1194 1195 1196 1197 1198

/* 1.2 values: served by nvm_dev_attr_show_12() */

/* device identification and address format */
static NVM_DEV_ATTR_12_RO(vendor_opcode);
static NVM_DEV_ATTR_12_RO(device_mode);
static NVM_DEV_ATTR_12_RO(media_manager);
static NVM_DEV_ATTR_12_RO(ppa_format);
static NVM_DEV_ATTR_12_RO(media_type);
static NVM_DEV_ATTR_12_RO(flash_media_type);

/* geometry counts and sizes */
static NVM_DEV_ATTR_12_RO(num_channels);
static NVM_DEV_ATTR_12_RO(num_luns);
static NVM_DEV_ATTR_12_RO(num_planes);
static NVM_DEV_ATTR_12_RO(num_blocks);
static NVM_DEV_ATTR_12_RO(num_pages);
static NVM_DEV_ATTR_12_RO(page_size);
static NVM_DEV_ATTR_12_RO(hw_sector_size);
static NVM_DEV_ATTR_12_RO(oob_sector_size);

/* program / erase timings */
static NVM_DEV_ATTR_12_RO(prog_typ);
static NVM_DEV_ATTR_12_RO(prog_max);
static NVM_DEV_ATTR_12_RO(erase_typ);
static NVM_DEV_ATTR_12_RO(erase_max);

/* mode and capability masks, command size limit */
static NVM_DEV_ATTR_12_RO(multiplane_modes);
static NVM_DEV_ATTR_12_RO(media_capabilities);
static NVM_DEV_ATTR_12_RO(max_phys_secs);

static struct attribute *nvm_dev_attrs_12[] = {
1199 1200
	&dev_attr_version.attr,
	&dev_attr_capabilities.attr,
1201 1202

	&dev_attr_vendor_opcode.attr,
1203 1204 1205 1206 1207 1208 1209 1210 1211 1212 1213 1214 1215 1216 1217 1218 1219 1220 1221 1222 1223 1224
	&dev_attr_device_mode.attr,
	&dev_attr_media_manager.attr,
	&dev_attr_ppa_format.attr,
	&dev_attr_media_type.attr,
	&dev_attr_flash_media_type.attr,
	&dev_attr_num_channels.attr,
	&dev_attr_num_luns.attr,
	&dev_attr_num_planes.attr,
	&dev_attr_num_blocks.attr,
	&dev_attr_num_pages.attr,
	&dev_attr_page_size.attr,
	&dev_attr_hw_sector_size.attr,
	&dev_attr_oob_sector_size.attr,
	&dev_attr_read_typ.attr,
	&dev_attr_read_max.attr,
	&dev_attr_prog_typ.attr,
	&dev_attr_prog_max.attr,
	&dev_attr_erase_typ.attr,
	&dev_attr_erase_max.attr,
	&dev_attr_multiplane_modes.attr,
	&dev_attr_media_capabilities.attr,
	&dev_attr_max_phys_secs.attr,
1225

1226 1227 1228
	NULL,
};

1229
static const struct attribute_group nvm_dev_attr_group_12 = {
1230
	.name		= "lightnvm",
1231 1232 1233 1234 1235 1236 1237 1238 1239 1240
	.attrs		= nvm_dev_attrs_12,
};

/* 2.0 values: served by nvm_dev_attr_show_20() */

/* geometry */
static NVM_DEV_ATTR_20_RO(groups);
static NVM_DEV_ATTR_20_RO(punits);
static NVM_DEV_ATTR_20_RO(chunks);
static NVM_DEV_ATTR_20_RO(clba);

/* write sizes and open-chunk limits */
static NVM_DEV_ATTR_20_RO(ws_min);
static NVM_DEV_ATTR_20_RO(ws_opt);
static NVM_DEV_ATTR_20_RO(maxoc);
static NVM_DEV_ATTR_20_RO(maxocpu);
static NVM_DEV_ATTR_20_RO(mw_cunits);

/* write / reset timings */
static NVM_DEV_ATTR_20_RO(write_typ);
static NVM_DEV_ATTR_20_RO(write_max);
static NVM_DEV_ATTR_20_RO(reset_typ);
static NVM_DEV_ATTR_20_RO(reset_max);

static struct attribute *nvm_dev_attrs_20[] = {
	&dev_attr_version.attr,
	&dev_attr_capabilities.attr,

	&dev_attr_groups.attr,
	&dev_attr_punits.attr,
	&dev_attr_chunks.attr,
	&dev_attr_clba.attr,
	&dev_attr_ws_min.attr,
	&dev_attr_ws_opt.attr,
1259 1260
	&dev_attr_maxoc.attr,
	&dev_attr_maxocpu.attr,
1261 1262 1263 1264 1265 1266 1267 1268 1269 1270 1271 1272 1273 1274 1275
	&dev_attr_mw_cunits.attr,

	&dev_attr_read_typ.attr,
	&dev_attr_read_max.attr,
	&dev_attr_write_typ.attr,
	&dev_attr_write_max.attr,
	&dev_attr_reset_typ.attr,
	&dev_attr_reset_max.attr,

	NULL,
};

/* Attribute group named "lightnvm" that carries the 2.0 attribute list. */
static const struct attribute_group nvm_dev_attr_group_20 = {
	.attrs		= nvm_dev_attrs_20,
	.name		= "lightnvm",
};

int nvme_nvm_register_sysfs(struct nvme_ns *ns)
{
1280 1281 1282 1283
	struct nvm_dev *ndev = ns->ndev;
	struct nvm_geo *geo = &ndev->geo;

	if (!ndev)
1284 1285
		return -EINVAL;

1286
	switch (geo->major_ver_id) {
1287 1288 1289 1290 1291 1292 1293 1294 1295
	case 1:
		return sysfs_create_group(&disk_to_dev(ns->disk)->kobj,
					&nvm_dev_attr_group_12);
	case 2:
		return sysfs_create_group(&disk_to_dev(ns->disk)->kobj,
					&nvm_dev_attr_group_20);
	}

	return -EINVAL;
1296 1297 1298 1299
}

void nvme_nvm_unregister_sysfs(struct nvme_ns *ns)
{
1300 1301 1302
	struct nvm_dev *ndev = ns->ndev;
	struct nvm_geo *geo = &ndev->geo;

1303
	switch (geo->major_ver_id) {
1304 1305 1306 1307 1308 1309 1310 1311 1312
	case 1:
		sysfs_remove_group(&disk_to_dev(ns->disk)->kobj,
					&nvm_dev_attr_group_12);
		break;
	case 2:
		sysfs_remove_group(&disk_to_dev(ns->disk)->kobj,
					&nvm_dev_attr_group_20);
		break;
	}
1313
}