lightnvm.c 33.3 KB
Newer Older
M
Matias Bjørling 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28
/*
 * nvme-lightnvm.c - LightNVM NVMe device
 *
 * Copyright (C) 2014-2015 IT University of Copenhagen
 * Initial release: Matias Bjorling <mb@lightnvm.io>
 *
 * This program is free software; you can redistribute it and/or
 * modify it under the terms of the GNU General Public License version
 * 2 as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful, but
 * WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program; see the file COPYING.  If not, write to
 * the Free Software Foundation, 675 Mass Ave, Cambridge, MA 02139,
 * USA.
 *
 */

#include "nvme.h"

#include <linux/nvme.h>
#include <linux/bitops.h>
#include <linux/lightnvm.h>
#include <linux/vmalloc.h>
29 30
#include <linux/sched/sysctl.h>
#include <uapi/linux/lightnvm.h>
M
Matias Bjørling 已提交
31 32 33 34 35 36 37

/*
 * Admin opcodes placed in the opcode field of the identity and bad block
 * table commands built in this file.
 */
enum nvme_nvm_admin_opcode {
	nvme_nvm_admin_identity		= 0xe2,
	nvme_nvm_admin_get_bb_tbl	= 0xf2,
	nvme_nvm_admin_set_bb_tbl	= 0xf1,
};

38 39 40 41
/* Log page identifier passed to nvme_get_log_ext() when reading chunk metadata */
enum nvme_nvm_log_page {
	NVME_NVM_LOG_REPORT_CHUNK	= 0xca,
};

M
Matias Bjørling 已提交
42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57
/*
 * Command layout used for I/O requests built by nvme_nvm_rqtocmd() and by
 * the user passthrough paths. Must be exactly 64 bytes; this is enforced at
 * build time by _nvme_nvm_check_size().
 */
struct nvme_nvm_ph_rw {
	__u8			opcode;
	__u8			flags;
	__u16			command_id;
	__le32			nsid;
	__u64			rsvd2;
	__le64			metadata;	/* DMA address of the metadata buffer */
	__le64			prp1;
	__le64			prp2;
	__le64			spba;		/* PPA, or DMA address of a PPA list */
	__le16			length;		/* nvme_nvm_rqtocmd() stores nr_ppas - 1 */
	__le16			control;
	__le32			dsmgmt;
	__le64			resv;
};

58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
/*
 * Erase command layout (the "erase" member of struct nvme_nvm_command).
 * Must be exactly 64 bytes; enforced by _nvme_nvm_check_size().
 */
struct nvme_nvm_erase_blk {
	__u8			opcode;
	__u8			flags;
	__u16			command_id;
	__le32			nsid;
	__u64			rsvd[2];
	__le64			prp1;
	__le64			prp2;
	__le64			spba;
	__le16			length;
	__le16			control;
	__le32			dsmgmt;
	__le64			resv;
};

M
Matias Bjørling 已提交
73 74 75 76 77 78 79 80
struct nvme_nvm_identity {
	__u8			opcode;
	__u8			flags;
	__u16			command_id;
	__le32			nsid;
	__u64			rsvd[2];
	__le64			prp1;
	__le64			prp2;
81
	__u32			rsvd11[6];
M
Matias Bjørling 已提交
82 83
};

84
struct nvme_nvm_getbbtbl {
M
Matias Bjørling 已提交
85 86 87 88 89 90 91
	__u8			opcode;
	__u8			flags;
	__u16			command_id;
	__le32			nsid;
	__u64			rsvd[2];
	__le64			prp1;
	__le64			prp2;
92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108
	__le64			spba;
	__u32			rsvd4[4];
};

/*
 * Set-bad-block-table admin command layout, filled in by
 * nvme_nvm_set_bb_tbl(). Must be exactly 64 bytes; enforced by
 * _nvme_nvm_check_size().
 */
struct nvme_nvm_setbbtbl {
	__u8			opcode;
	__u8			flags;
	__u16			command_id;
	__le32			nsid;
	__le64			rsvd[2];
	__le64			prp1;
	__le64			prp2;
	__le64			spba;		/* first PPA to update */
	__le16			nlb;		/* nvme_nvm_set_bb_tbl() stores nr_ppas - 1 */
	__u8			value;		/* block type passed in by the caller */
	__u8			rsvd3;
	__u32			rsvd4[3];
};

struct nvme_nvm_command {
	union {
		struct nvme_common_command common;
		struct nvme_nvm_ph_rw ph_rw;
115 116
		struct nvme_nvm_erase_blk erase;
		struct nvme_nvm_identity identity;
117 118
		struct nvme_nvm_getbbtbl get_bb;
		struct nvme_nvm_setbbtbl set_bb;
M
Matias Bjørling 已提交
119 120 121
	};
};

122
struct nvme_nvm_id12_grp {
M
Matias Bjørling 已提交
123 124 125 126 127 128
	__u8			mtype;
	__u8			fmtype;
	__le16			res16;
	__u8			num_ch;
	__u8			num_lun;
	__u8			num_pln;
129
	__u8			rsvd1;
130
	__le16			num_chk;
M
Matias Bjørling 已提交
131 132 133 134
	__le16			num_pg;
	__le16			fpg_sz;
	__le16			csecs;
	__le16			sos;
135
	__le16			rsvd2;
M
Matias Bjørling 已提交
136 137 138 139 140 141 142
	__le32			trdt;
	__le32			trdm;
	__le32			tprt;
	__le32			tprm;
	__le32			tbet;
	__le32			tbem;
	__le32			mpos;
143
	__le32			mccap;
M
Matias Bjørling 已提交
144
	__le16			cpar;
145
	__u8			reserved[906];
M
Matias Bjørling 已提交
146 147
} __packed;

148
struct nvme_nvm_id12_addrf {
M
Matias Bjørling 已提交
149 150 151 152 153 154 155 156 157 158
	__u8			ch_offset;
	__u8			ch_len;
	__u8			lun_offset;
	__u8			lun_len;
	__u8			pln_offset;
	__u8			pln_len;
	__u8			blk_offset;
	__u8			blk_len;
	__u8			pg_offset;
	__u8			pg_len;
159 160
	__u8			sec_offset;
	__u8			sec_len;
M
Matias Bjørling 已提交
161 162 163
	__u8			res[4];
} __packed;

164
struct nvme_nvm_id12 {
M
Matias Bjørling 已提交
165 166 167
	__u8			ver_id;
	__u8			vmnt;
	__u8			cgrps;
168
	__u8			res;
M
Matias Bjørling 已提交
169 170
	__le32			cap;
	__le32			dom;
171
	struct nvme_nvm_id12_addrf ppaf;
172
	__u8			resv[228];
173
	struct nvme_nvm_id12_grp grp;
174
	__u8			resv2[2880];
M
Matias Bjørling 已提交
175 176
} __packed;

177 178 179 180 181 182 183 184 185 186 187 188 189 190
/*
 * Bad block table as returned by the get-bad-block-table admin command:
 * a 64-byte header (enforced by _nvme_nvm_check_size()) followed by one
 * byte per block.
 */
struct nvme_nvm_bb_tbl {
	__u8	tblid[4];	/* checked against "BBLT" by nvme_nvm_get_bb_tbl() */
	__le16	verid;		/* only version 1 is accepted */
	__le16	revid;
	__le32	rvsd1;
	__le32	tblks;		/* number of entries in blk[] */
	__le32	tfact;
	__le32	tgrown;
	__le32	tdresv;
	__le32	thresv;
	__le32	rsvd2[8];
	__u8	blk[];		/* flexible array member; does not add to sizeof */
};

191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242
/*
 * Address format of the 2.0 identity page: bit lengths only; the offsets
 * are derived in nvme_nvm_set_addr_20(). Must be exactly 8 bytes; enforced
 * by _nvme_nvm_check_size().
 */
struct nvme_nvm_id20_addrf {
	__u8			grp_len;
	__u8			pu_len;
	__u8			chk_len;
	__u8			lba_len;
	__u8			resv[4];
};

/*
 * 2.0 identity page, parsed by nvme_nvm_setup_20(). The size must equal
 * NVME_IDENTIFY_DATA_SIZE; enforced by _nvme_nvm_check_size().
 */
struct nvme_nvm_id20 {
	__u8			mjr;
	__u8			mnr;
	__u8			resv[6];

	struct nvme_nvm_id20_addrf lbaf;

	__le32			mccap;
	__u8			resv2[12];

	__u8			wit;
	__u8			resv3[31];

	/* Geometry */
	__le16			num_grp;
	__le16			num_pu;
	__le32			num_chk;
	__le32			clba;
	__u8			resv4[52];

	/* Write data requirements */
	__le32			ws_min;
	__le32			ws_opt;
	__le32			mw_cunits;
	__le32			maxoc;
	__le32			maxocpu;
	__u8			resv5[44];

	/* Performance related metrics */
	__le32			trdt;
	__le32			trdm;
	__le32			twrt;
	__le32			twrm;
	__le32			tcrst;
	__le32			tcrsm;
	__u8			resv6[40];

	/* Reserved area */
	__u8			resv7[2816];

	/* Vendor specific */
	__u8			vs[1024];
};

243 244 245 246 247 248 249 250 251 252
/*
 * One chunk descriptor as read from the report-chunk log page.
 * nvme_nvm_get_chk_meta() converts it field by field into
 * struct nvm_chk_meta. Must be 32 bytes and the same size as
 * struct nvm_chk_meta; enforced by _nvme_nvm_check_size().
 */
struct nvme_nvm_chk_meta {
	__u8	state;
	__u8	type;
	__u8	wi;
	__u8	rsvd[5];
	__le64	slba;
	__le64	cnlb;
	__le64	wp;
};

M
Matias Bjørling 已提交
253 254 255 256 257 258 259
/*
 * Check we didn't inadvertently grow the command struct
 */
static inline void _nvme_nvm_check_size(void)
{
	BUILD_BUG_ON(sizeof(struct nvme_nvm_identity) != 64);
	BUILD_BUG_ON(sizeof(struct nvme_nvm_ph_rw) != 64);
260
	BUILD_BUG_ON(sizeof(struct nvme_nvm_erase_blk) != 64);
261 262
	BUILD_BUG_ON(sizeof(struct nvme_nvm_getbbtbl) != 64);
	BUILD_BUG_ON(sizeof(struct nvme_nvm_setbbtbl) != 64);
263 264 265
	BUILD_BUG_ON(sizeof(struct nvme_nvm_id12_grp) != 960);
	BUILD_BUG_ON(sizeof(struct nvme_nvm_id12_addrf) != 16);
	BUILD_BUG_ON(sizeof(struct nvme_nvm_id12) != NVME_IDENTIFY_DATA_SIZE);
266
	BUILD_BUG_ON(sizeof(struct nvme_nvm_bb_tbl) != 64);
267 268
	BUILD_BUG_ON(sizeof(struct nvme_nvm_id20_addrf) != 8);
	BUILD_BUG_ON(sizeof(struct nvme_nvm_id20) != NVME_IDENTIFY_DATA_SIZE);
269 270 271
	BUILD_BUG_ON(sizeof(struct nvme_nvm_chk_meta) != 32);
	BUILD_BUG_ON(sizeof(struct nvme_nvm_chk_meta) !=
						sizeof(struct nvm_chk_meta));
M
Matias Bjørling 已提交
272 273
}

274 275 276 277 278 279 280 281
/*
 * Copy the 1.2 address format from the identity page into @dst and derive
 * a bit mask for every address component from its length and offset.
 */
static void nvme_nvm_set_addr_12(struct nvm_addrf_12 *dst,
				 struct nvme_nvm_id12_addrf *src)
{
	/* channel */
	dst->ch_len = src->ch_len;
	dst->ch_offset = src->ch_offset;
	dst->ch_mask = ((1ULL << dst->ch_len) - 1) << dst->ch_offset;

	/* LUN */
	dst->lun_len = src->lun_len;
	dst->lun_offset = src->lun_offset;
	dst->lun_mask = ((1ULL << dst->lun_len) - 1) << dst->lun_offset;

	/* block */
	dst->blk_len = src->blk_len;
	dst->blk_offset = src->blk_offset;
	dst->blk_mask = ((1ULL << dst->blk_len) - 1) << dst->blk_offset;

	/* page */
	dst->pg_len = src->pg_len;
	dst->pg_offset = src->pg_offset;
	dst->pg_mask = ((1ULL << dst->pg_len) - 1) << dst->pg_offset;

	/* plane */
	dst->pln_len = src->pln_len;
	dst->pln_offset = src->pln_offset;
	dst->pln_mask = ((1ULL << dst->pln_len) - 1) << dst->pln_offset;

	/* sector */
	dst->sec_len = src->sec_len;
	dst->sec_offset = src->sec_offset;
	dst->sec_mask = ((1ULL << dst->sec_len) - 1) << dst->sec_offset;
}

static int nvme_nvm_setup_12(struct nvme_nvm_id12 *id,
			     struct nvm_geo *geo)
M
Matias Bjørling 已提交
301
{
302
	struct nvme_nvm_id12_grp *src;
303
	int sec_per_pg, sec_per_pl, pg_per_blk;
304

305 306 307 308 309 310 311
	if (id->cgrps != 1)
		return -EINVAL;

	src = &id->grp;

	if (src->mtype != 0) {
		pr_err("nvm: memory type not supported\n");
312
		return -EINVAL;
313
	}
314

315 316 317
	/* 1.2 spec. only reports a single version id - unfold */
	geo->major_ver_id = id->ver_id;
	geo->minor_ver_id = 2;
318

319 320 321
	/* Set compacted version for upper layers */
	geo->version = NVM_OCSSD_SPEC_12;

322 323 324
	geo->num_ch = src->num_ch;
	geo->num_lun = src->num_lun;
	geo->all_luns = geo->num_ch * geo->num_lun;
325

326
	geo->num_chk = le16_to_cpu(src->num_chk);
327

328 329
	geo->csecs = le16_to_cpu(src->csecs);
	geo->sos = le16_to_cpu(src->sos);
330 331

	pg_per_blk = le16_to_cpu(src->num_pg);
332
	sec_per_pg = le16_to_cpu(src->fpg_sz) / geo->csecs;
333
	sec_per_pl = sec_per_pg * src->num_pln;
334 335
	geo->clba = sec_per_pl * pg_per_blk;

336
	geo->all_chunks = geo->all_luns * geo->num_chk;
337 338 339 340 341
	geo->total_secs = geo->clba * geo->all_chunks;

	geo->ws_min = sec_per_pg;
	geo->ws_opt = sec_per_pg;
	geo->mw_cunits = geo->ws_opt << 3;	/* default to MLC safe values */
342

343 344 345 346
	/* Do not impose values for maximum number of open blocks as it is
	 * unspecified in 1.2. Users of 1.2 must be aware of this and eventually
	 * specify these values through a quirk if restrictions apply.
	 */
347 348
	geo->maxoc = geo->all_luns * geo->num_chk;
	geo->maxocpu = geo->num_chk;
349

350 351 352 353 354 355 356 357
	geo->mccap = le32_to_cpu(src->mccap);

	geo->trdt = le32_to_cpu(src->trdt);
	geo->trdm = le32_to_cpu(src->trdm);
	geo->tprt = le32_to_cpu(src->tprt);
	geo->tprm = le32_to_cpu(src->tprm);
	geo->tbet = le32_to_cpu(src->tbet);
	geo->tbem = le32_to_cpu(src->tbem);
358 359

	/* 1.2 compatibility */
360 361 362 363 364 365 366 367 368 369
	geo->vmnt = id->vmnt;
	geo->cap = le32_to_cpu(id->cap);
	geo->dom = le32_to_cpu(id->dom);

	geo->mtype = src->mtype;
	geo->fmtype = src->fmtype;

	geo->cpar = le16_to_cpu(src->cpar);
	geo->mpos = le32_to_cpu(src->mpos);

370
	geo->pln_mode = NVM_PLANE_SINGLE;
371 372

	if (geo->mpos & 0x020202) {
373
		geo->pln_mode = NVM_PLANE_DOUBLE;
374 375
		geo->ws_opt <<= 1;
	} else if (geo->mpos & 0x040404) {
376
		geo->pln_mode = NVM_PLANE_QUAD;
377 378 379 380 381 382 383 384
		geo->ws_opt <<= 2;
	}

	geo->num_pln = src->num_pln;
	geo->num_pg = le16_to_cpu(src->num_pg);
	geo->fpg_sz = le16_to_cpu(src->fpg_sz);

	nvme_nvm_set_addr_12((struct nvm_addrf_12 *)&geo->addrf, &id->ppaf);
385

M
Matias Bjørling 已提交
386 387 388
	return 0;
}

389 390
static void nvme_nvm_set_addr_20(struct nvm_addrf *dst,
				 struct nvme_nvm_id20_addrf *src)
391
{
392 393 394 395 396 397 398 399 400 401 402 403 404 405
	dst->ch_len = src->grp_len;
	dst->lun_len = src->pu_len;
	dst->chk_len = src->chk_len;
	dst->sec_len = src->lba_len;

	dst->sec_offset = 0;
	dst->chk_offset = dst->sec_len;
	dst->lun_offset = dst->chk_offset + dst->chk_len;
	dst->ch_offset = dst->lun_offset + dst->lun_len;

	dst->ch_mask = ((1ULL << dst->ch_len) - 1) << dst->ch_offset;
	dst->lun_mask = ((1ULL << dst->lun_len) - 1) << dst->lun_offset;
	dst->chk_mask = ((1ULL << dst->chk_len) - 1) << dst->chk_offset;
	dst->sec_mask = ((1ULL << dst->sec_len) - 1) << dst->sec_offset;
406 407
}

408 409
static int nvme_nvm_setup_20(struct nvme_nvm_id20 *id,
			     struct nvm_geo *geo)
410
{
411 412 413
	geo->major_ver_id = id->mjr;
	geo->minor_ver_id = id->mnr;

414 415 416
	/* Set compacted version for upper layers */
	geo->version = NVM_OCSSD_SPEC_20;

417 418 419 420 421
	if (!(geo->major_ver_id == 2 && geo->minor_ver_id == 0)) {
		pr_err("nvm: OCSSD version not supported (v%d.%d)\n",
				geo->major_ver_id, geo->minor_ver_id);
		return -EINVAL;
	}
422

423 424 425
	geo->num_ch = le16_to_cpu(id->num_grp);
	geo->num_lun = le16_to_cpu(id->num_pu);
	geo->all_luns = geo->num_ch * geo->num_lun;
426

427
	geo->num_chk = le32_to_cpu(id->num_chk);
428
	geo->clba = le32_to_cpu(id->clba);
429

430
	geo->all_chunks = geo->all_luns * geo->num_chk;
431
	geo->total_secs = geo->clba * geo->all_chunks;
432

433 434 435
	geo->ws_min = le32_to_cpu(id->ws_min);
	geo->ws_opt = le32_to_cpu(id->ws_opt);
	geo->mw_cunits = le32_to_cpu(id->mw_cunits);
436 437
	geo->maxoc = le32_to_cpu(id->maxoc);
	geo->maxocpu = le32_to_cpu(id->maxocpu);
438

439 440 441 442 443 444 445 446
	geo->trdt = le32_to_cpu(id->trdt);
	geo->trdm = le32_to_cpu(id->trdm);
	geo->tprt = le32_to_cpu(id->twrt);
	geo->tprm = le32_to_cpu(id->twrm);
	geo->tbet = le32_to_cpu(id->tcrst);
	geo->tbem = le32_to_cpu(id->tcrsm);

	nvme_nvm_set_addr_20(&geo->addrf, &id->lbaf);
447 448 449 450

	return 0;
}

451
static int nvme_nvm_identity(struct nvm_dev *nvmdev)
M
Matias Bjørling 已提交
452
{
453
	struct nvme_ns *ns = nvmdev->q->queuedata;
454
	struct nvme_nvm_id12 *id;
M
Matias Bjørling 已提交
455 456 457 458
	struct nvme_nvm_command c = {};
	int ret;

	c.identity.opcode = nvme_nvm_admin_identity;
C
Christoph Hellwig 已提交
459
	c.identity.nsid = cpu_to_le32(ns->head->ns_id);
M
Matias Bjørling 已提交
460

461 462
	id = kmalloc(sizeof(struct nvme_nvm_id12), GFP_KERNEL);
	if (!id)
M
Matias Bjørling 已提交
463 464
		return -ENOMEM;

465
	ret = nvme_submit_sync_cmd(ns->ctrl->admin_q, (struct nvme_command *)&c,
466
				id, sizeof(struct nvme_nvm_id12));
M
Matias Bjørling 已提交
467 468 469 470 471
	if (ret) {
		ret = -EIO;
		goto out;
	}

472 473 474 475 476 477
	/*
	 * The 1.2 and 2.0 specifications share the first byte in their geometry
	 * command to make it possible to know what version a device implements.
	 */
	switch (id->ver_id) {
	case 1:
478
		ret = nvme_nvm_setup_12(id, &nvmdev->geo);
479 480
		break;
	case 2:
481 482
		ret = nvme_nvm_setup_20((struct nvme_nvm_id20 *)id,
							&nvmdev->geo);
483 484
		break;
	default:
485 486
		dev_err(ns->ctrl->device, "OCSSD revision not supported (%d)\n",
							id->ver_id);
487 488
		ret = -EINVAL;
	}
489

M
Matias Bjørling 已提交
490
out:
491
	kfree(id);
M
Matias Bjørling 已提交
492 493 494
	return ret;
}

495
static int nvme_nvm_get_bb_tbl(struct nvm_dev *nvmdev, struct ppa_addr ppa,
496
								u8 *blks)
M
Matias Bjørling 已提交
497
{
498
	struct request_queue *q = nvmdev->q;
499
	struct nvm_geo *geo = &nvmdev->geo;
M
Matias Bjørling 已提交
500
	struct nvme_ns *ns = q->queuedata;
501
	struct nvme_ctrl *ctrl = ns->ctrl;
M
Matias Bjørling 已提交
502
	struct nvme_nvm_command c = {};
503
	struct nvme_nvm_bb_tbl *bb_tbl;
504
	int nr_blks = geo->num_chk * geo->num_pln;
505
	int tblsz = sizeof(struct nvme_nvm_bb_tbl) + nr_blks;
M
Matias Bjørling 已提交
506 507 508
	int ret = 0;

	c.get_bb.opcode = nvme_nvm_admin_get_bb_tbl;
C
Christoph Hellwig 已提交
509
	c.get_bb.nsid = cpu_to_le32(ns->head->ns_id);
510
	c.get_bb.spba = cpu_to_le64(ppa.ppa);
M
Matias Bjørling 已提交
511

512 513 514
	bb_tbl = kzalloc(tblsz, GFP_KERNEL);
	if (!bb_tbl)
		return -ENOMEM;
M
Matias Bjørling 已提交
515

516
	ret = nvme_submit_sync_cmd(ctrl->admin_q, (struct nvme_command *)&c,
517
								bb_tbl, tblsz);
M
Matias Bjørling 已提交
518
	if (ret) {
519
		dev_err(ctrl->device, "get bad block table failed (%d)\n", ret);
M
Matias Bjørling 已提交
520 521 522 523
		ret = -EIO;
		goto out;
	}

524 525
	if (bb_tbl->tblid[0] != 'B' || bb_tbl->tblid[1] != 'B' ||
		bb_tbl->tblid[2] != 'L' || bb_tbl->tblid[3] != 'T') {
526
		dev_err(ctrl->device, "bbt format mismatch\n");
527 528 529 530 531 532
		ret = -EINVAL;
		goto out;
	}

	if (le16_to_cpu(bb_tbl->verid) != 1) {
		ret = -EINVAL;
533
		dev_err(ctrl->device, "bbt version not supported\n");
534 535 536
		goto out;
	}

537
	if (le32_to_cpu(bb_tbl->tblks) != nr_blks) {
538
		ret = -EINVAL;
539 540
		dev_err(ctrl->device,
				"bbt unsuspected blocks returned (%u!=%u)",
541
				le32_to_cpu(bb_tbl->tblks), nr_blks);
542 543 544
		goto out;
	}

545
	memcpy(blks, bb_tbl->blk, geo->num_chk * geo->num_pln);
M
Matias Bjørling 已提交
546
out:
547 548 549 550
	kfree(bb_tbl);
	return ret;
}

551 552
static int nvme_nvm_set_bb_tbl(struct nvm_dev *nvmdev, struct ppa_addr *ppas,
							int nr_ppas, int type)
553
{
554
	struct nvme_ns *ns = nvmdev->q->queuedata;
555 556 557 558
	struct nvme_nvm_command c = {};
	int ret = 0;

	c.set_bb.opcode = nvme_nvm_admin_set_bb_tbl;
C
Christoph Hellwig 已提交
559
	c.set_bb.nsid = cpu_to_le32(ns->head->ns_id);
560 561
	c.set_bb.spba = cpu_to_le64(ppas->ppa);
	c.set_bb.nlb = cpu_to_le16(nr_ppas - 1);
562 563
	c.set_bb.value = type;

564
	ret = nvme_submit_sync_cmd(ns->ctrl->admin_q, (struct nvme_command *)&c,
565
								NULL, 0);
566
	if (ret)
567 568
		dev_err(ns->ctrl->device, "set bad block table failed (%d)\n",
									ret);
M
Matias Bjørling 已提交
569 570 571
	return ret;
}

572 573 574 575 576 577 578 579 580 581 582 583 584 585 586 587 588 589 590 591 592 593 594 595 596 597 598 599 600 601 602 603 604 605 606 607 608 609 610 611 612 613 614 615 616 617 618 619 620 621 622 623 624 625 626
/*
 * nvme_nvm_get_chk_meta - read chunk descriptors from the report-chunk log
 * @ndev:  lightnvm device
 * @meta:  output array; also used as the raw read buffer and converted in
 *         place (both descriptor forms have the same size)
 * @slba:  start address in device format
 * @nchks: number of chunk descriptors to read
 *
 * The log is read in pieces of at most ctrl->max_hw_sectors << 9 bytes.
 *
 * Returns 0 on success (including when @nchks is 0) or the error returned
 * by nvme_get_log_ext().
 */
static int nvme_nvm_get_chk_meta(struct nvm_dev *ndev,
				 struct nvm_chk_meta *meta,
				 sector_t slba, int nchks)
{
	struct nvm_geo *geo = &ndev->geo;
	struct nvme_ns *ns = ndev->q->queuedata;
	struct nvme_ctrl *ctrl = ns->ctrl;
	struct nvme_nvm_chk_meta *dev_meta = (struct nvme_nvm_chk_meta *)meta;
	struct ppa_addr ppa;
	size_t left = nchks * sizeof(struct nvme_nvm_chk_meta);
	size_t log_pos, offset, len, i;
	int ret = 0;	/* the loop below never runs when nothing is requested */

	/* Normalize lba address space to obtain log offset */
	ppa.ppa = slba;
	ppa = dev_to_generic_addr(ndev, ppa);

	log_pos = ppa.m.chk;
	log_pos += ppa.m.pu * geo->num_chk;
	log_pos += ppa.m.grp * geo->num_lun * geo->num_chk;

	offset = log_pos * sizeof(struct nvme_nvm_chk_meta);

	while (left) {
		len = min_t(unsigned int, left, ctrl->max_hw_sectors << 9);

		ret = nvme_get_log_ext(ctrl, ns, NVME_NVM_LOG_REPORT_CHUNK,
				dev_meta, len, offset);
		if (ret) {
			dev_err(ctrl->device, "Get REPORT CHUNK log error\n");
			break;
		}

		/* convert the descriptors just read to CPU byte order */
		for (i = 0; i < len; i += sizeof(struct nvme_nvm_chk_meta)) {
			meta->state = dev_meta->state;
			meta->type = dev_meta->type;
			meta->wi = dev_meta->wi;
			meta->slba = le64_to_cpu(dev_meta->slba);
			meta->cnlb = le64_to_cpu(dev_meta->cnlb);
			meta->wp = le64_to_cpu(dev_meta->wp);

			meta++;
			dev_meta++;
		}

		offset += len;
		left -= len;
	}

	return ret;
}

627 628
static inline void nvme_nvm_rqtocmd(struct nvm_rq *rqd, struct nvme_ns *ns,
				    struct nvme_nvm_command *c)
M
Matias Bjørling 已提交
629 630
{
	c->ph_rw.opcode = rqd->opcode;
C
Christoph Hellwig 已提交
631
	c->ph_rw.nsid = cpu_to_le32(ns->head->ns_id);
M
Matias Bjørling 已提交
632
	c->ph_rw.spba = cpu_to_le64(rqd->ppa_addr.ppa);
633
	c->ph_rw.metadata = cpu_to_le64(rqd->dma_meta_list);
M
Matias Bjørling 已提交
634
	c->ph_rw.control = cpu_to_le16(rqd->flags);
635
	c->ph_rw.length = cpu_to_le16(rqd->nr_ppas - 1);
M
Matias Bjørling 已提交
636 637
}

638
/*
 * Completion callback for requests issued by nvme_nvm_submit_io(): hand
 * status and result to the lightnvm request, complete it, then release the
 * heap-allocated command and the block request.
 */
static void nvme_nvm_end_io(struct request *rq, blk_status_t status)
{
	struct nvm_rq *rqd = rq->end_io_data;

	rqd->error = nvme_req(rq)->status;
	rqd->ppa_status = le64_to_cpu(nvme_req(rq)->result.u64);
	nvm_end_io(rqd);

	/* the command was allocated with kzalloc() by the submitter */
	kfree(nvme_req(rq)->cmd);
	blk_mq_free_request(rq);
}

650 651 652
static struct request *nvme_nvm_alloc_request(struct request_queue *q,
					      struct nvm_rq *rqd,
					      struct nvme_nvm_command *cmd)
M
Matias Bjørling 已提交
653 654 655 656
{
	struct nvme_ns *ns = q->queuedata;
	struct request *rq;

657
	nvme_nvm_rqtocmd(rqd, ns, cmd);
658

659
	rq = nvme_alloc_request(q, (struct nvme_command *)cmd, 0, NVME_QID_ANY);
660 661 662
	if (IS_ERR(rq))
		return rq;

663
	rq->cmd_flags &= ~REQ_FAILFAST_DRIVER;
M
Matias Bjørling 已提交
664

665
	if (rqd->bio)
666
		blk_init_request_from_bio(rq, rqd->bio);
667
	else
668
		rq->ioprio = IOPRIO_PRIO_VALUE(IOPRIO_CLASS_BE, IOPRIO_NORM);
M
Matias Bjørling 已提交
669

670 671 672 673 674 675 676 677 678 679 680 681 682 683 684 685 686 687 688
	return rq;
}

static int nvme_nvm_submit_io(struct nvm_dev *dev, struct nvm_rq *rqd)
{
	struct request_queue *q = dev->q;
	struct nvme_nvm_command *cmd;
	struct request *rq;

	cmd = kzalloc(sizeof(struct nvme_nvm_command), GFP_KERNEL);
	if (!cmd)
		return -ENOMEM;

	rq = nvme_nvm_alloc_request(q, rqd, cmd);
	if (IS_ERR(rq)) {
		kfree(cmd);
		return PTR_ERR(rq);
	}

M
Matias Bjørling 已提交
689 690 691 692 693 694 695
	rq->end_io_data = rqd;

	blk_execute_rq_nowait(q, NULL, rq, 0, nvme_nvm_end_io);

	return 0;
}

696 697 698 699 700 701 702 703 704 705 706 707 708 709 710 711 712 713 714 715 716 717 718 719 720 721 722 723
static int nvme_nvm_submit_io_sync(struct nvm_dev *dev, struct nvm_rq *rqd)
{
	struct request_queue *q = dev->q;
	struct request *rq;
	struct nvme_nvm_command cmd;
	int ret = 0;

	memset(&cmd, 0, sizeof(struct nvme_nvm_command));

	rq = nvme_nvm_alloc_request(q, rqd, &cmd);
	if (IS_ERR(rq))
		return PTR_ERR(rq);

	/* I/Os can fail and the error is signaled through rqd. Callers must
	 * handle the error accordingly.
	 */
	blk_execute_rq(q, NULL, rq, 0);
	if (nvme_req(rq)->flags & NVME_REQ_CANCELLED)
		ret = -EINTR;

	rqd->ppa_status = le64_to_cpu(nvme_req(rq)->result.u64);
	rqd->error = nvme_req(rq)->status;

	blk_mq_free_request(rq);

	return ret;
}

724
static void *nvme_nvm_create_dma_pool(struct nvm_dev *nvmdev, char *name)
M
Matias Bjørling 已提交
725
{
726
	struct nvme_ns *ns = nvmdev->q->queuedata;
M
Matias Bjørling 已提交
727

728
	return dma_pool_create(name, ns->ctrl->dev, PAGE_SIZE, PAGE_SIZE, 0);
M
Matias Bjørling 已提交
729 730 731 732 733 734 735 736 737
}

/* Destroy a pool obtained from nvme_nvm_create_dma_pool(). */
static void nvme_nvm_destroy_dma_pool(void *pool)
{
	dma_pool_destroy(pool);
}

738
static void *nvme_nvm_dev_dma_alloc(struct nvm_dev *dev, void *pool,
M
Matias Bjørling 已提交
739 740 741 742 743
				    gfp_t mem_flags, dma_addr_t *dma_handler)
{
	return dma_pool_alloc(pool, mem_flags, dma_handler);
}

744
static void nvme_nvm_dev_dma_free(void *pool, void *addr,
M
Matias Bjørling 已提交
745 746
							dma_addr_t dma_handler)
{
747
	dma_pool_free(pool, addr, dma_handler);
M
Matias Bjørling 已提交
748 749 750 751 752 753
}

static struct nvm_dev_ops nvme_nvm_dev_ops = {
	.identity		= nvme_nvm_identity,

	.get_bb_tbl		= nvme_nvm_get_bb_tbl,
754
	.set_bb_tbl		= nvme_nvm_set_bb_tbl,
M
Matias Bjørling 已提交
755

756 757
	.get_chk_meta		= nvme_nvm_get_chk_meta,

M
Matias Bjørling 已提交
758
	.submit_io		= nvme_nvm_submit_io,
759
	.submit_io_sync		= nvme_nvm_submit_io_sync,
M
Matias Bjørling 已提交
760 761 762 763 764 765 766

	.create_dma_pool	= nvme_nvm_create_dma_pool,
	.destroy_dma_pool	= nvme_nvm_destroy_dma_pool,
	.dev_dma_alloc		= nvme_nvm_dev_dma_alloc,
	.dev_dma_free		= nvme_nvm_dev_dma_free,
};

767 768 769 770 771 772 773 774 775 776 777 778 779 780 781 782 783 784
/*
 * nvme_nvm_submit_user_cmd - execute a user supplied command synchronously
 * @q:        queue the request is allocated on and executed through
 * @ns:       namespace; supplies the lightnvm device (DMA pool) and gendisk
 * @vcmd:     prepared command; its spba and metadata fields are set here
 * @ubuf:     user data buffer mapped into the request, may be NULL
 * @bufflen:  length of @ubuf in bytes
 * @meta_buf: user metadata buffer, bounced through the DMA pool; only used
 *            when a data buffer is given as well
 * @meta_len: length of @meta_buf in bytes
 * @ppa_buf:  user PPA list, bounced through the DMA pool
 * @ppa_len:  zero-based entry count: @ppa_len + 1 entries are copied in
 * @result:   if non-NULL, receives the completion status masked with 0x7ff
 * @status:   if non-NULL, receives the 64-bit completion result
 * @timeout:  request timeout; 0 selects ADMIN_TIMEOUT
 *
 * Returns 0 on success, -ENOMEM on allocation failure, -EFAULT if a user
 * copy fails, -EINVAL if a bounce buffer would be overrun, -EINTR if the
 * request was cancelled, -EIO if the masked status is non-zero, or the
 * error from blk_rq_map_user().
 */
static int nvme_nvm_submit_user_cmd(struct request_queue *q,
				struct nvme_ns *ns,
				struct nvme_nvm_command *vcmd,
				void __user *ubuf, unsigned int bufflen,
				void __user *meta_buf, unsigned int meta_len,
				void __user *ppa_buf, unsigned int ppa_len,
				u32 *result, u64 *status, unsigned int timeout)
{
	bool write = nvme_is_write((struct nvme_command *)vcmd);
	struct nvm_dev *dev = ns->ndev;
	struct gendisk *disk = ns->disk;
	struct request *rq;
	struct bio *bio = NULL;
	__le64 *ppa_list = NULL;
	dma_addr_t ppa_dma;
	__le64 *metadata = NULL;
	dma_addr_t metadata_dma;
	int ret = 0;

	rq = nvme_alloc_request(q, (struct nvme_command *)vcmd, 0,
			NVME_QID_ANY);
	if (IS_ERR(rq)) {
		ret = -ENOMEM;
		goto err_cmd;
	}

	rq->timeout = timeout ? timeout : ADMIN_TIMEOUT;

	if (ppa_buf && ppa_len) {
		/*
		 * ppa_len + 1 entries are copied into one pool element.
		 * NOTE(review): assumes dev->dma_pool elements are PAGE_SIZE
		 * bytes, the size nvme_nvm_create_dma_pool() uses - confirm.
		 */
		if (ppa_len >= PAGE_SIZE / sizeof(u64)) {
			ret = -EINVAL;
			goto err_rq;
		}

		ppa_list = dma_pool_alloc(dev->dma_pool, GFP_KERNEL, &ppa_dma);
		if (!ppa_list) {
			ret = -ENOMEM;
			goto err_rq;
		}
		if (copy_from_user(ppa_list, (void __user *)ppa_buf,
						sizeof(u64) * (ppa_len + 1))) {
			ret = -EFAULT;
			goto err_ppa;
		}
		vcmd->ph_rw.spba = cpu_to_le64(ppa_dma);
	} else {
		/* no list: the value itself is passed as the address */
		vcmd->ph_rw.spba = cpu_to_le64((uintptr_t)ppa_buf);
	}

	if (ubuf && bufflen) {
		ret = blk_rq_map_user(q, rq, NULL, ubuf, bufflen, GFP_KERNEL);
		if (ret)
			goto err_ppa;
		bio = rq->bio;

		if (meta_buf && meta_len) {
			/* metadata is bounced through one pool element too */
			if (meta_len > PAGE_SIZE) {
				ret = -EINVAL;
				goto err_map;
			}

			metadata = dma_pool_alloc(dev->dma_pool, GFP_KERNEL,
								&metadata_dma);
			if (!metadata) {
				ret = -ENOMEM;
				goto err_map;
			}

			if (write) {
				if (copy_from_user(metadata,
						(void __user *)meta_buf,
						meta_len)) {
					ret = -EFAULT;
					goto err_meta;
				}
			}
			vcmd->ph_rw.metadata = cpu_to_le64(metadata_dma);
		}

		bio->bi_disk = disk;
	}

	blk_execute_rq(q, NULL, rq, 0);

	if (nvme_req(rq)->flags & NVME_REQ_CANCELLED)
		ret = -EINTR;
	else if (nvme_req(rq)->status & 0x7ff)
		ret = -EIO;
	if (result)
		*result = nvme_req(rq)->status & 0x7ff;
	if (status)
		*status = le64_to_cpu(nvme_req(rq)->result.u64);

	if (metadata && !ret && !write) {
		if (copy_to_user(meta_buf, (void *)metadata, meta_len))
			ret = -EFAULT;
	}
err_meta:
	/*
	 * Free only what was allocated: a metadata buffer given without a
	 * data buffer never gets a pool element.
	 */
	if (metadata)
		dma_pool_free(dev->dma_pool, metadata, metadata_dma);
err_map:
	if (bio)
		blk_rq_unmap_user(bio);
err_ppa:
	if (ppa_list)
		dma_pool_free(dev->dma_pool, ppa_list, ppa_dma);
err_rq:
	blk_mq_free_request(rq);
err_cmd:
	return ret;
}

/*
 * Handle the submit-vio ioctl: copy the request in from @uvio, build a
 * read/write command from it and execute it on the namespace queue.
 *
 * Returns -EFAULT if a user copy fails, -EINVAL if vio.flags is set,
 * otherwise the result of nvme_nvm_submit_user_cmd().
 * NOTE(review): the structure is copied back to user space only when the
 * command fails - confirm that this is intended.
 */
static int nvme_nvm_submit_vio(struct nvme_ns *ns,
					struct nvm_user_vio __user *uvio)
{
	struct nvm_user_vio vio;
	struct nvme_nvm_command cmd;
	unsigned int data_len;
	int ret;

	if (copy_from_user(&vio, uvio, sizeof(vio)))
		return -EFAULT;
	if (vio.flags)
		return -EINVAL;

	memset(&cmd, 0, sizeof(cmd));
	cmd.ph_rw.opcode = vio.opcode;
	cmd.ph_rw.nsid = cpu_to_le32(ns->head->ns_id);
	cmd.ph_rw.control = cpu_to_le16(vio.control);
	cmd.ph_rw.length = cpu_to_le16(vio.nppas);

	/* nppas is zero-based: one logical block of data per address */
	data_len = (vio.nppas + 1) << ns->lba_shift;

	ret = nvme_nvm_submit_user_cmd(ns->queue, ns, &cmd,
			(void __user *)(uintptr_t)vio.addr, data_len,
			(void __user *)(uintptr_t)vio.metadata,
							vio.metadata_len,
			(void __user *)(uintptr_t)vio.ppa_list, vio.nppas,
			&vio.result, &vio.status, 0);
	if (!ret)
		return 0;

	if (copy_to_user(uvio, &vio, sizeof(vio)))
		return -EFAULT;

	return ret;
}

/*
 * Handle the passthrough ioctls: copy the request in from @uvcmd, build a
 * command from its raw dwords and execute it on the admin queue (@admin
 * non-zero) or on the namespace I/O queue.
 *
 * Every opcode except 0xF2 (the value of nvme_nvm_admin_get_bb_tbl)
 * requires CAP_SYS_ADMIN. Returns -EFAULT if a user copy fails, -EACCES
 * without the capability, -EINVAL if vcmd.flags is set, otherwise the
 * result of nvme_nvm_submit_user_cmd().
 * NOTE(review): the structure is copied back to user space only when the
 * command fails - confirm that this is intended.
 */
static int nvme_nvm_user_vcmd(struct nvme_ns *ns, int admin,
					struct nvm_passthru_vio __user *uvcmd)
{
	struct nvm_passthru_vio vcmd;
	struct nvme_nvm_command cmd;
	struct request_queue *queue;
	unsigned int timeout;
	int ret;

	if (copy_from_user(&vcmd, uvcmd, sizeof(vcmd)))
		return -EFAULT;
	if (vcmd.opcode != 0xF2 && !capable(CAP_SYS_ADMIN))
		return -EACCES;
	if (vcmd.flags)
		return -EINVAL;

	memset(&cmd, 0, sizeof(cmd));
	cmd.common.opcode = vcmd.opcode;
	cmd.common.nsid = cpu_to_le32(ns->head->ns_id);
	cmd.common.cdw2[0] = cpu_to_le32(vcmd.cdw2);
	cmd.common.cdw2[1] = cpu_to_le32(vcmd.cdw3);
	/* cdw11-12 */
	cmd.ph_rw.length = cpu_to_le16(vcmd.nppas);
	cmd.ph_rw.control  = cpu_to_le16(vcmd.control);
	cmd.common.cdw10[3] = cpu_to_le32(vcmd.cdw13);
	cmd.common.cdw10[4] = cpu_to_le32(vcmd.cdw14);
	cmd.common.cdw10[5] = cpu_to_le32(vcmd.cdw15);

	/* 0 lets nvme_nvm_submit_user_cmd() pick its default timeout */
	timeout = vcmd.timeout_ms ? msecs_to_jiffies(vcmd.timeout_ms) : 0;

	if (admin)
		queue = ns->ctrl->admin_q;
	else
		queue = ns->queue;

	ret = nvme_nvm_submit_user_cmd(queue, ns, &cmd,
			(void __user *)(uintptr_t)vcmd.addr, vcmd.data_len,
			(void __user *)(uintptr_t)vcmd.metadata,
							vcmd.metadata_len,
			(void __user *)(uintptr_t)vcmd.ppa_list, vcmd.nppas,
			&vcmd.result, &vcmd.status, timeout);
	if (!ret)
		return 0;

	if (copy_to_user(uvcmd, &vcmd, sizeof(vcmd)))
		return -EFAULT;

	return ret;
}

int nvme_nvm_ioctl(struct nvme_ns *ns, unsigned int cmd, unsigned long arg)
{
	switch (cmd) {
	case NVME_NVM_IOCTL_ADMIN_VIO:
		return nvme_nvm_user_vcmd(ns, 1, (void __user *)arg);
	case NVME_NVM_IOCTL_IO_VIO:
		return nvme_nvm_user_vcmd(ns, 0, (void __user *)arg);
	case NVME_NVM_IOCTL_SUBMIT_VIO:
		return nvme_nvm_submit_vio(ns, (void __user *)arg);
	default:
		return -ENOTTY;
	}
}

965 966 967
void nvme_nvm_update_nvm_info(struct nvme_ns *ns)
{
	struct nvm_dev *ndev = ns->ndev;
968
	struct nvm_geo *geo = &ndev->geo;
969

970 971
	geo->csecs = 1 << ns->lba_shift;
	geo->sos = ns->ms;
972 973
}

974
int nvme_nvm_register(struct nvme_ns *ns, char *disk_name, int node)
M
Matias Bjørling 已提交
975
{
976 977 978
	struct request_queue *q = ns->queue;
	struct nvm_dev *dev;

979 980
	_nvme_nvm_check_size();

981 982 983 984 985 986 987
	dev = nvm_alloc_dev(node);
	if (!dev)
		return -ENOMEM;

	dev->q = q;
	memcpy(dev->name, disk_name, DISK_NAME_LEN);
	dev->ops = &nvme_nvm_dev_ops;
988
	dev->private_data = ns;
989 990
	ns->ndev = dev;

991
	return nvm_register(dev);
M
Matias Bjørling 已提交
992 993
}

994
void nvme_nvm_unregister(struct nvme_ns *ns)
M
Matias Bjørling 已提交
995
{
996
	nvm_unregister(ns->ndev);
M
Matias Bjørling 已提交
997 998
}

999
static ssize_t nvm_dev_attr_show(struct device *dev,
1000
		struct device_attribute *dattr, char *page)
1001 1002 1003
{
	struct nvme_ns *ns = nvme_get_ns_from_dev(dev);
	struct nvm_dev *ndev = ns->ndev;
1004
	struct nvm_geo *geo = &ndev->geo;
1005 1006 1007 1008 1009 1010 1011 1012
	struct attribute *attr;

	if (!ndev)
		return 0;

	attr = &dattr->attr;

	if (strcmp(attr->name, "version") == 0) {
1013 1014 1015 1016 1017 1018 1019
		if (geo->major_ver_id == 1)
			return scnprintf(page, PAGE_SIZE, "%u\n",
						geo->major_ver_id);
		else
			return scnprintf(page, PAGE_SIZE, "%u.%u\n",
						geo->major_ver_id,
						geo->minor_ver_id);
1020
	} else if (strcmp(attr->name, "capabilities") == 0) {
1021
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->cap);
1022
	} else if (strcmp(attr->name, "read_typ") == 0) {
1023
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->trdt);
1024
	} else if (strcmp(attr->name, "read_max") == 0) {
1025
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->trdm);
1026 1027 1028
	} else {
		return scnprintf(page,
				 PAGE_SIZE,
1029 1030
				 "Unhandled attr(%s) in `%s`\n",
				 attr->name, __func__);
1031 1032 1033
	}
}

1034 1035 1036 1037 1038 1039 1040 1041 1042
/*
 * Format the 1.2 address format into @page as one hexadecimal string: an
 * offset/length byte pair for channel, LUN, plane, block, page and sector,
 * in that order. Returns the number of bytes written.
 */
static ssize_t nvm_dev_attr_show_ppaf(struct nvm_addrf_12 *ppaf, char *page)
{
	ssize_t written;

	written = scnprintf(page, PAGE_SIZE,
		"0x%02x%02x%02x%02x%02x%02x%02x%02x%02x%02x%02x%02x\n",
				ppaf->ch_offset, ppaf->ch_len,
				ppaf->lun_offset, ppaf->lun_len,
				ppaf->pln_offset, ppaf->pln_len,
				ppaf->blk_offset, ppaf->blk_len,
				ppaf->pg_offset, ppaf->pg_len,
				ppaf->sec_offset, ppaf->sec_len);

	return written;
}

1046 1047 1048 1049 1050
static ssize_t nvm_dev_attr_show_12(struct device *dev,
		struct device_attribute *dattr, char *page)
{
	struct nvme_ns *ns = nvme_get_ns_from_dev(dev);
	struct nvm_dev *ndev = ns->ndev;
1051
	struct nvm_geo *geo = &ndev->geo;
1052 1053 1054 1055 1056 1057 1058 1059
	struct attribute *attr;

	if (!ndev)
		return 0;

	attr = &dattr->attr;

	if (strcmp(attr->name, "vendor_opcode") == 0) {
1060
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->vmnt);
1061
	} else if (strcmp(attr->name, "device_mode") == 0) {
1062
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->dom);
1063
	/* kept for compatibility */
1064
	} else if (strcmp(attr->name, "media_manager") == 0) {
1065
		return scnprintf(page, PAGE_SIZE, "%s\n", "gennvm");
1066
	} else if (strcmp(attr->name, "ppa_format") == 0) {
1067
		return nvm_dev_attr_show_ppaf((void *)&geo->addrf, page);
1068
	} else if (strcmp(attr->name, "media_type") == 0) {	/* u8 */
1069
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->mtype);
1070
	} else if (strcmp(attr->name, "flash_media_type") == 0) {
1071
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->fmtype);
1072
	} else if (strcmp(attr->name, "num_channels") == 0) {
1073
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->num_ch);
1074
	} else if (strcmp(attr->name, "num_luns") == 0) {
1075
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->num_lun);
1076
	} else if (strcmp(attr->name, "num_planes") == 0) {
1077
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->num_pln);
1078
	} else if (strcmp(attr->name, "num_blocks") == 0) {	/* u16 */
1079
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->num_chk);
1080
	} else if (strcmp(attr->name, "num_pages") == 0) {
1081
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->num_pg);
1082
	} else if (strcmp(attr->name, "page_size") == 0) {
1083
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->fpg_sz);
1084
	} else if (strcmp(attr->name, "hw_sector_size") == 0) {
1085
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->csecs);
1086
	} else if (strcmp(attr->name, "oob_sector_size") == 0) {/* u32 */
1087
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->sos);
1088
	} else if (strcmp(attr->name, "prog_typ") == 0) {
1089
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->tprt);
1090
	} else if (strcmp(attr->name, "prog_max") == 0) {
1091
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->tprm);
1092
	} else if (strcmp(attr->name, "erase_typ") == 0) {
1093
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->tbet);
1094
	} else if (strcmp(attr->name, "erase_max") == 0) {
1095
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->tbem);
1096
	} else if (strcmp(attr->name, "multiplane_modes") == 0) {
1097
		return scnprintf(page, PAGE_SIZE, "0x%08x\n", geo->mpos);
1098
	} else if (strcmp(attr->name, "media_capabilities") == 0) {
1099
		return scnprintf(page, PAGE_SIZE, "0x%08x\n", geo->mccap);
1100
	} else if (strcmp(attr->name, "max_phys_secs") == 0) {
1101
		return scnprintf(page, PAGE_SIZE, "%u\n", NVM_MAX_VLBA);
1102
	} else {
1103
		return scnprintf(page, PAGE_SIZE,
1104 1105
			"Unhandled attr(%s) in `%s`\n",
			attr->name, __func__);
1106 1107 1108
	}
}

1109 1110 1111 1112 1113
static ssize_t nvm_dev_attr_show_20(struct device *dev,
		struct device_attribute *dattr, char *page)
{
	struct nvme_ns *ns = nvme_get_ns_from_dev(dev);
	struct nvm_dev *ndev = ns->ndev;
1114
	struct nvm_geo *geo = &ndev->geo;
1115 1116 1117 1118 1119 1120 1121 1122
	struct attribute *attr;

	if (!ndev)
		return 0;

	attr = &dattr->attr;

	if (strcmp(attr->name, "groups") == 0) {
1123
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->num_ch);
1124
	} else if (strcmp(attr->name, "punits") == 0) {
1125
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->num_lun);
1126
	} else if (strcmp(attr->name, "chunks") == 0) {
1127
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->num_chk);
1128
	} else if (strcmp(attr->name, "clba") == 0) {
1129
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->clba);
1130
	} else if (strcmp(attr->name, "ws_min") == 0) {
1131
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->ws_min);
1132
	} else if (strcmp(attr->name, "ws_opt") == 0) {
1133
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->ws_opt);
1134 1135 1136 1137
	} else if (strcmp(attr->name, "maxoc") == 0) {
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->maxoc);
	} else if (strcmp(attr->name, "maxocpu") == 0) {
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->maxocpu);
1138
	} else if (strcmp(attr->name, "mw_cunits") == 0) {
1139
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->mw_cunits);
1140
	} else if (strcmp(attr->name, "write_typ") == 0) {
1141
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->tprt);
1142
	} else if (strcmp(attr->name, "write_max") == 0) {
1143
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->tprm);
1144
	} else if (strcmp(attr->name, "reset_typ") == 0) {
1145
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->tbet);
1146
	} else if (strcmp(attr->name, "reset_max") == 0) {
1147
		return scnprintf(page, PAGE_SIZE, "%u\n", geo->tbem);
1148
	} else {
1149
		return scnprintf(page, PAGE_SIZE,
1150 1151
			"Unhandled attr(%s) in `%s`\n",
			attr->name, __func__);
1152 1153 1154 1155
	}
}

/*
 * Declare a read-only (0444) device attribute named _name with no store
 * handler.  The three variants differ only in the show callback they bind:
 * nvm_dev_attr_show, nvm_dev_attr_show_12 or nvm_dev_attr_show_20.
 */
#define NVM_DEV_ATTR_RO(_name)						\
	DEVICE_ATTR(_name, 0444, nvm_dev_attr_show, NULL)
#define NVM_DEV_ATTR_12_RO(_name)					\
	DEVICE_ATTR(_name, 0444, nvm_dev_attr_show_12, NULL)
#define NVM_DEV_ATTR_20_RO(_name)					\
	DEVICE_ATTR(_name, 0444, nvm_dev_attr_show_20, NULL)
1161

1162
/*
 * General attributes, all served by nvm_dev_attr_show(): the version and
 * capability fields plus the read_typ/read_max pair.
 */
static NVM_DEV_ATTR_RO(version);
static NVM_DEV_ATTR_RO(capabilities);
static NVM_DEV_ATTR_RO(read_typ);
static NVM_DEV_ATTR_RO(read_max);
1168 1169 1170 1171 1172 1173 1174 1175 1176 1177 1178 1179 1180 1181 1182 1183 1184 1185 1186 1187 1188 1189 1190 1191 1192

/* 1.2 values, all served by nvm_dev_attr_show_12() */

/* device identification and addressing */
static NVM_DEV_ATTR_12_RO(vendor_opcode);
static NVM_DEV_ATTR_12_RO(device_mode);
static NVM_DEV_ATTR_12_RO(ppa_format);
static NVM_DEV_ATTR_12_RO(media_manager);
static NVM_DEV_ATTR_12_RO(media_type);
static NVM_DEV_ATTR_12_RO(flash_media_type);

/* counts and sizes */
static NVM_DEV_ATTR_12_RO(num_channels);
static NVM_DEV_ATTR_12_RO(num_luns);
static NVM_DEV_ATTR_12_RO(num_planes);
static NVM_DEV_ATTR_12_RO(num_blocks);
static NVM_DEV_ATTR_12_RO(num_pages);
static NVM_DEV_ATTR_12_RO(page_size);
static NVM_DEV_ATTR_12_RO(hw_sector_size);
static NVM_DEV_ATTR_12_RO(oob_sector_size);

/* typ/max values for program and erase */
static NVM_DEV_ATTR_12_RO(prog_typ);
static NVM_DEV_ATTR_12_RO(prog_max);
static NVM_DEV_ATTR_12_RO(erase_typ);
static NVM_DEV_ATTR_12_RO(erase_max);

/* remaining 1.2 fields */
static NVM_DEV_ATTR_12_RO(multiplane_modes);
static NVM_DEV_ATTR_12_RO(media_capabilities);
static NVM_DEV_ATTR_12_RO(max_phys_secs);

static struct attribute *nvm_dev_attrs_12[] = {
1193 1194
	&dev_attr_version.attr,
	&dev_attr_capabilities.attr,
1195 1196

	&dev_attr_vendor_opcode.attr,
1197 1198 1199 1200 1201 1202 1203 1204 1205 1206 1207 1208 1209 1210 1211 1212 1213 1214 1215 1216 1217 1218
	&dev_attr_device_mode.attr,
	&dev_attr_media_manager.attr,
	&dev_attr_ppa_format.attr,
	&dev_attr_media_type.attr,
	&dev_attr_flash_media_type.attr,
	&dev_attr_num_channels.attr,
	&dev_attr_num_luns.attr,
	&dev_attr_num_planes.attr,
	&dev_attr_num_blocks.attr,
	&dev_attr_num_pages.attr,
	&dev_attr_page_size.attr,
	&dev_attr_hw_sector_size.attr,
	&dev_attr_oob_sector_size.attr,
	&dev_attr_read_typ.attr,
	&dev_attr_read_max.attr,
	&dev_attr_prog_typ.attr,
	&dev_attr_prog_max.attr,
	&dev_attr_erase_typ.attr,
	&dev_attr_erase_max.attr,
	&dev_attr_multiplane_modes.attr,
	&dev_attr_media_capabilities.attr,
	&dev_attr_max_phys_secs.attr,
1219

1220 1221 1222
	NULL,
};

1223
static const struct attribute_group nvm_dev_attr_group_12 = {
1224
	.name		= "lightnvm",
1225 1226 1227 1228 1229 1230 1231 1232 1233 1234
	.attrs		= nvm_dev_attrs_12,
};

/* 2.0 values, all served by nvm_dev_attr_show_20() */

/* counts and sizes */
static NVM_DEV_ATTR_20_RO(groups);
static NVM_DEV_ATTR_20_RO(punits);
static NVM_DEV_ATTR_20_RO(chunks);
static NVM_DEV_ATTR_20_RO(clba);
static NVM_DEV_ATTR_20_RO(ws_min);
static NVM_DEV_ATTR_20_RO(ws_opt);
static NVM_DEV_ATTR_20_RO(maxoc);
static NVM_DEV_ATTR_20_RO(maxocpu);
static NVM_DEV_ATTR_20_RO(mw_cunits);

/* typ/max values for write and reset */
static NVM_DEV_ATTR_20_RO(write_typ);
static NVM_DEV_ATTR_20_RO(write_max);
static NVM_DEV_ATTR_20_RO(reset_typ);
static NVM_DEV_ATTR_20_RO(reset_max);

static struct attribute *nvm_dev_attrs_20[] = {
	&dev_attr_version.attr,
	&dev_attr_capabilities.attr,

	&dev_attr_groups.attr,
	&dev_attr_punits.attr,
	&dev_attr_chunks.attr,
	&dev_attr_clba.attr,
	&dev_attr_ws_min.attr,
	&dev_attr_ws_opt.attr,
1253 1254
	&dev_attr_maxoc.attr,
	&dev_attr_maxocpu.attr,
1255 1256 1257 1258 1259 1260 1261 1262 1263 1264 1265 1266 1267 1268 1269
	&dev_attr_mw_cunits.attr,

	&dev_attr_read_typ.attr,
	&dev_attr_read_max.attr,
	&dev_attr_write_typ.attr,
	&dev_attr_write_max.attr,
	&dev_attr_reset_typ.attr,
	&dev_attr_reset_max.attr,

	NULL,
};

/* Attribute group named "lightnvm" carrying the nvm_dev_attrs_20 list. */
static const struct attribute_group nvm_dev_attr_group_20 = {
	.attrs	= nvm_dev_attrs_20,
	.name	= "lightnvm",
};

int nvme_nvm_register_sysfs(struct nvme_ns *ns)
{
1274 1275 1276 1277
	struct nvm_dev *ndev = ns->ndev;
	struct nvm_geo *geo = &ndev->geo;

	if (!ndev)
1278 1279
		return -EINVAL;

1280
	switch (geo->major_ver_id) {
1281 1282 1283 1284 1285 1286 1287 1288 1289
	case 1:
		return sysfs_create_group(&disk_to_dev(ns->disk)->kobj,
					&nvm_dev_attr_group_12);
	case 2:
		return sysfs_create_group(&disk_to_dev(ns->disk)->kobj,
					&nvm_dev_attr_group_20);
	}

	return -EINVAL;
1290 1291 1292 1293
}

void nvme_nvm_unregister_sysfs(struct nvme_ns *ns)
{
1294 1295 1296
	struct nvm_dev *ndev = ns->ndev;
	struct nvm_geo *geo = &ndev->geo;

1297
	switch (geo->major_ver_id) {
1298 1299 1300 1301 1302 1303 1304 1305 1306
	case 1:
		sysfs_remove_group(&disk_to_dev(ns->disk)->kobj,
					&nvm_dev_attr_group_12);
		break;
	case 2:
		sysfs_remove_group(&disk_to_dev(ns->disk)->kobj,
					&nvm_dev_attr_group_20);
		break;
	}
1307
}