// SPDX-License-Identifier: GPL-2.0
/*
 * Discovery service for the NVMe over Fabrics target.
 * Copyright (C) 2016 Intel Corporation. All rights reserved.
 */
#define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
#include <linux/slab.h>
#include <generated/utsrelease.h>
#include "nvmet.h"

/*
 * The discovery subsystem.  Assigned by nvmet_init_discovery(); its ->ctrls
 * list is walked under its ->lock when discovery controllers have to be
 * notified of a change.
 */
struct nvmet_subsys *nvmet_disc_subsys;

13
/*
 * Discovery log generation counter: incremented by the *_disc_changed()
 * entry points and reported to hosts in the genctr field of the discovery
 * log page header.
 */
static u64 nvmet_genctr;
14

15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32
/*
 * Queue a "discovery log changed" notice on @ctrl.
 *
 * Nothing is queued when @ctrl is not attached to @port, or when
 * nvmet_aen_bit_disabled() reports the discovery-change event as disabled
 * for that controller.
 */
static void __nvmet_disc_changed(struct nvmet_port *port,
				 struct nvmet_ctrl *ctrl)
{
	/* The port test comes first so the AEN bit is only probed on a match. */
	if (ctrl->port != port ||
	    nvmet_aen_bit_disabled(ctrl, NVME_AEN_BIT_DISC_CHANGE))
		return;

	nvmet_add_async_event(ctrl, NVME_AER_TYPE_NOTICE,
			      NVME_AER_NOTICE_DISC_CHANGED, NVME_LOG_DISC);
}

void nvmet_port_disc_changed(struct nvmet_port *port,
			     struct nvmet_subsys *subsys)
{
	struct nvmet_ctrl *ctrl;

33
	lockdep_assert_held(&nvmet_config_sem);
34 35
	nvmet_genctr++;

36
	mutex_lock(&nvmet_disc_subsys->lock);
37 38 39 40 41 42
	list_for_each_entry(ctrl, &nvmet_disc_subsys->ctrls, subsys_entry) {
		if (subsys && !nvmet_host_allowed(subsys, ctrl->hostnqn))
			continue;

		__nvmet_disc_changed(port, ctrl);
	}
43
	mutex_unlock(&nvmet_disc_subsys->lock);
44 45 46 47

	/* If transport can signal change, notify transport */
	if (port->tr_ops && port->tr_ops->discovery_chg)
		port->tr_ops->discovery_chg(port);
48 49 50 51 52 53 54 55
}

static void __nvmet_subsys_disc_changed(struct nvmet_port *port,
					struct nvmet_subsys *subsys,
					struct nvmet_host *host)
{
	struct nvmet_ctrl *ctrl;

56
	mutex_lock(&nvmet_disc_subsys->lock);
57 58 59 60 61 62
	list_for_each_entry(ctrl, &nvmet_disc_subsys->ctrls, subsys_entry) {
		if (host && strcmp(nvmet_host_name(host), ctrl->hostnqn))
			continue;

		__nvmet_disc_changed(port, ctrl);
	}
63
	mutex_unlock(&nvmet_disc_subsys->lock);
64 65 66 67 68 69 70 71
}

void nvmet_subsys_disc_changed(struct nvmet_subsys *subsys,
			       struct nvmet_host *host)
{
	struct nvmet_port *port;
	struct nvmet_subsys_link *s;

72
	lockdep_assert_held(&nvmet_config_sem);
73 74 75 76 77 78 79 80 81 82
	nvmet_genctr++;

	list_for_each_entry(port, nvmet_ports, global_entry)
		list_for_each_entry(s, &port->subsystems, entry) {
			if (s->subsys != subsys)
				continue;
			__nvmet_subsys_disc_changed(port, subsys, host);
		}
}

83 84 85 86 87 88
void nvmet_referral_enable(struct nvmet_port *parent, struct nvmet_port *port)
{
	down_write(&nvmet_config_sem);
	if (list_empty(&port->entry)) {
		list_add_tail(&port->entry, &parent->referrals);
		port->enabled = true;
89
		nvmet_port_disc_changed(parent, NULL);
90 91 92 93
	}
	up_write(&nvmet_config_sem);
}

94
void nvmet_referral_disable(struct nvmet_port *parent, struct nvmet_port *port)
95 96 97 98 99
{
	down_write(&nvmet_config_sem);
	if (!list_empty(&port->entry)) {
		port->enabled = false;
		list_del_init(&port->entry);
100
		nvmet_port_disc_changed(parent, NULL);
101 102 103 104 105
	}
	up_write(&nvmet_config_sem);
}

/*
 * Fill discovery log entry number @numrec of @hdr.
 *
 * Transport type, address family, requirements, port id, service id and
 * transport specific address subtype are taken from @port->disc_addr; the
 * transport address and subsystem NQN come from @traddr and @subsys_nqn,
 * and @type becomes the entry's subtype.
 */
static void nvmet_format_discovery_entry(struct nvmf_disc_rsp_page_hdr *hdr,
		struct nvmet_port *port, char *subsys_nqn, char *traddr,
		u8 type, u32 numrec)
{
	struct nvmf_disc_rsp_page_entry *entry = &hdr->entries[numrec];

	/* Fixed-size scalar fields. */
	entry->trtype = port->disc_addr.trtype;
	entry->adrfam = port->disc_addr.adrfam;
	entry->subtype = type;
	entry->treq = port->disc_addr.treq;
	entry->portid = port->disc_addr.portid;
	/* we support only dynamic controllers */
	entry->cntlid = cpu_to_le16(NVME_CNTLID_DYNAMIC);
	entry->asqsz = cpu_to_le16(NVME_AQ_DEPTH);

	/* Address and name fields. */
	memcpy(entry->trsvcid, port->disc_addr.trsvcid, NVMF_TRSVCID_SIZE);
	memcpy(entry->traddr, traddr, NVMF_TRADDR_SIZE);
	memcpy(entry->tsas.common, port->disc_addr.tsas.common,
	       NVMF_TSAS_SIZE);
	strncpy(entry->subnqn, subsys_nqn, NVMF_NQN_SIZE);
}

125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143
/*
 * nvmet_set_disc_traddr - choose the traddr reported in a discovery log entry
 *
 * IP based transports (e.g. RDMA) may listen on the "any" IPv4/IPv6 address
 * (INADDR_ANY or IN6ADDR_ANY_INIT), which must never be returned in a
 * discovery log page.  A transport that implements .disc_traddr gets to
 * fill in @traddr itself, deriving it from the request's port when the
 * port listens on "any".  Without that callback the address configured in
 * @port->disc_addr is copied verbatim.
 */
static void nvmet_set_disc_traddr(struct nvmet_req *req, struct nvmet_port *port,
		char *traddr)
{
	if (!req->ops->disc_traddr) {
		memcpy(traddr, port->disc_addr.traddr, NVMF_TRADDR_SIZE);
		return;
	}

	req->ops->disc_traddr(req, port, traddr);
}

144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160
static size_t discovery_log_entries(struct nvmet_req *req)
{
	struct nvmet_ctrl *ctrl = req->sq->ctrl;
	struct nvmet_subsys_link *p;
	struct nvmet_port *r;
	size_t entries = 0;

	list_for_each_entry(p, &req->port->subsystems, entry) {
		if (!nvmet_host_allowed(p->subsys, ctrl->hostnqn))
			continue;
		entries++;
	}
	list_for_each_entry(r, &req->port->referrals, entry)
		entries++;
	return entries;
}

161
static void nvmet_execute_disc_get_log_page(struct nvmet_req *req)
162 163 164 165
{
	const int entry_size = sizeof(struct nvmf_disc_rsp_page_entry);
	struct nvmet_ctrl *ctrl = req->sq->ctrl;
	struct nvmf_disc_rsp_page_hdr *hdr;
166
	u64 offset = nvmet_get_log_page_offset(req->cmd);
167
	size_t data_len = nvmet_get_log_page_len(req->cmd);
168
	size_t alloc_len;
169 170 171 172
	struct nvmet_subsys_link *p;
	struct nvmet_port *r;
	u32 numrec = 0;
	u16 status = 0;
173 174
	void *buffer;

175
	if (!nvmet_check_transfer_len(req, data_len))
176 177
		return;

178 179 180
	if (req->cmd->get_log_page.lid != NVME_LOG_DISC) {
		req->error_loc =
			offsetof(struct nvme_get_log_page_command, lid);
181
		status = NVME_SC_INVALID_FIELD | NVME_SC_DNR;
182 183 184
		goto out;
	}

185 186
	/* Spec requires dword aligned offsets */
	if (offset & 0x3) {
187 188
		req->error_loc =
			offsetof(struct nvme_get_log_page_command, lpo);
189 190 191
		status = NVME_SC_INVALID_FIELD | NVME_SC_DNR;
		goto out;
	}
192 193 194 195 196 197

	/*
	 * Make sure we're passing at least a buffer of response header size.
	 * If host provided data len is less than the header size, only the
	 * number of bytes requested by host will be sent to host.
	 */
198 199 200 201 202
	down_read(&nvmet_config_sem);
	alloc_len = sizeof(*hdr) + entry_size * discovery_log_entries(req);
	buffer = kzalloc(alloc_len, GFP_KERNEL);
	if (!buffer) {
		up_read(&nvmet_config_sem);
203 204 205 206
		status = NVME_SC_INTERNAL;
		goto out;
	}

207
	hdr = buffer;
208
	list_for_each_entry(p, &req->port->subsystems, entry) {
209 210
		char traddr[NVMF_TRADDR_SIZE];

211
		if (!nvmet_host_allowed(p->subsys, ctrl->hostnqn))
212
			continue;
213 214 215 216 217

		nvmet_set_disc_traddr(req, req->port, traddr);
		nvmet_format_discovery_entry(hdr, req->port,
				p->subsys->subsysnqn, traddr,
				NVME_NQN_NVME, numrec);
218 219 220 221
		numrec++;
	}

	list_for_each_entry(r, &req->port->referrals, entry) {
222 223 224 225
		nvmet_format_discovery_entry(hdr, r,
				NVME_DISC_SUBSYS_NAME,
				r->disc_addr.traddr,
				NVME_NQN_DISC, numrec);
226 227 228 229 230 231 232
		numrec++;
	}

	hdr->genctr = cpu_to_le64(nvmet_genctr);
	hdr->numrec = cpu_to_le64(numrec);
	hdr->recfmt = cpu_to_le16(0);

233 234
	nvmet_clear_aen_bit(req, NVME_AEN_BIT_DISC_CHANGE);

235 236
	up_read(&nvmet_config_sem);

237 238
	status = nvmet_copy_to_sgl(req, 0, buffer + offset, data_len);
	kfree(buffer);
239 240 241 242
out:
	nvmet_req_complete(req, status);
}

243
static void nvmet_execute_disc_identify(struct nvmet_req *req)
244 245 246
{
	struct nvmet_ctrl *ctrl = req->sq->ctrl;
	struct nvme_id_ctrl *id;
247
	const char model[] = "Linux";
248 249
	u16 status = 0;

250
	if (!nvmet_check_transfer_len(req, NVME_IDENTIFY_DATA_SIZE))
251 252
		return;

253 254
	if (req->cmd->identify.cns != NVME_ID_CNS_CTRL) {
		req->error_loc = offsetof(struct nvme_identify, cns);
255
		status = NVME_SC_INVALID_FIELD | NVME_SC_DNR;
256 257 258
		goto out;
	}

259 260 261 262 263 264
	id = kzalloc(sizeof(*id), GFP_KERNEL);
	if (!id) {
		status = NVME_SC_INTERNAL;
		goto out;
	}

265 266 267
	memset(id->sn, ' ', sizeof(id->sn));
	bin2hex(id->sn, &ctrl->subsys->serial,
		min(sizeof(ctrl->subsys->serial), sizeof(id->sn) / 2));
268
	memset(id->fr, ' ', sizeof(id->fr));
269 270 271
	memcpy_and_pad(id->mn, sizeof(id->mn), model, sizeof(model) - 1, ' ');
	memcpy_and_pad(id->fr, sizeof(id->fr),
		       UTS_RELEASE, strlen(UTS_RELEASE), ' ');
272 273 274 275 276 277 278 279 280 281 282

	/* no limit on data transfer sizes for now */
	id->mdts = 0;
	id->cntlid = cpu_to_le16(ctrl->cntlid);
	id->ver = cpu_to_le32(ctrl->subsys->ver);
	id->lpa = (1 << 2);

	/* no enforcement soft-limit for maxcmd - pick arbitrary high value */
	id->maxcmd = cpu_to_le16(NVMET_MAX_CMD);

	id->sgls = cpu_to_le32(1 << 0);	/* we always support SGLs */
283
	if (ctrl->ops->flags & NVMF_KEYED_SGLS)
284
		id->sgls |= cpu_to_le32(1 << 2);
285
	if (req->port->inline_data_size)
286 287
		id->sgls |= cpu_to_le32(1 << 20);

288 289
	id->oaes = cpu_to_le32(NVMET_DISC_AEN_CFG_OPTIONAL);

290
	strlcpy(id->subnqn, ctrl->subsys->subsysnqn, sizeof(id->subnqn));
291 292 293 294 295 296 297 298

	status = nvmet_copy_to_sgl(req, 0, id, sizeof(*id));

	kfree(id);
out:
	nvmet_req_complete(req, status);
}

299 300
static void nvmet_execute_disc_set_features(struct nvmet_req *req)
{
301
	u32 cdw10 = le32_to_cpu(req->cmd->common.cdw10);
302 303
	u16 stat;

304
	if (!nvmet_check_transfer_len(req, 0))
305 306
		return;

307 308 309 310 311 312 313 314 315
	switch (cdw10 & 0xff) {
	case NVME_FEAT_KATO:
		stat = nvmet_set_feat_kato(req);
		break;
	case NVME_FEAT_ASYNC_EVENT:
		stat = nvmet_set_feat_async_event(req,
						  NVMET_DISC_AEN_CFG_OPTIONAL);
		break;
	default:
316 317
		req->error_loc =
			offsetof(struct nvme_common_command, cdw10);
318 319 320 321 322 323 324 325 326
		stat = NVME_SC_INVALID_FIELD | NVME_SC_DNR;
		break;
	}

	nvmet_req_complete(req, stat);
}

static void nvmet_execute_disc_get_features(struct nvmet_req *req)
{
327
	u32 cdw10 = le32_to_cpu(req->cmd->common.cdw10);
328 329
	u16 stat = 0;

330
	if (!nvmet_check_transfer_len(req, 0))
331 332
		return;

333 334 335 336 337 338 339 340
	switch (cdw10 & 0xff) {
	case NVME_FEAT_KATO:
		nvmet_get_feat_kato(req);
		break;
	case NVME_FEAT_ASYNC_EVENT:
		nvmet_get_feat_async_event(req);
		break;
	default:
341 342
		req->error_loc =
			offsetof(struct nvme_common_command, cdw10);
343 344 345 346 347 348 349
		stat = NVME_SC_INVALID_FIELD | NVME_SC_DNR;
		break;
	}

	nvmet_req_complete(req, stat);
}

350
u16 nvmet_parse_discovery_cmd(struct nvmet_req *req)
351 352 353 354
{
	struct nvme_command *cmd = req->cmd;

	if (unlikely(!(req->sq->ctrl->csts & NVME_CSTS_RDY))) {
355 356
		pr_err("got cmd %d while not ready\n",
		       cmd->common.opcode);
357 358
		req->error_loc =
			offsetof(struct nvme_common_command, opcode);
359 360 361 362
		return NVME_SC_INVALID_OPCODE | NVME_SC_DNR;
	}

	switch (cmd->common.opcode) {
363 364 365 366 367 368 369 370 371
	case nvme_admin_set_features:
		req->execute = nvmet_execute_disc_set_features;
		return 0;
	case nvme_admin_get_features:
		req->execute = nvmet_execute_disc_get_features;
		return 0;
	case nvme_admin_async_event:
		req->execute = nvmet_execute_async_event;
		return 0;
372 373 374
	case nvme_admin_keep_alive:
		req->execute = nvmet_execute_keep_alive;
		return 0;
375
	case nvme_admin_get_log_page:
376 377
		req->execute = nvmet_execute_disc_get_log_page;
		return 0;
378
	case nvme_admin_identify:
379 380
		req->execute = nvmet_execute_disc_identify;
		return 0;
381
	default:
382
		pr_debug("unhandled cmd %d\n", cmd->common.opcode);
383
		req->error_loc = offsetof(struct nvme_common_command, opcode);
384 385 386 387 388 389 390 391 392
		return NVME_SC_INVALID_OPCODE | NVME_SC_DNR;
	}

}

/*
 * Allocate the discovery subsystem and publish it in nvmet_disc_subsys.
 *
 * Returns 0 on success or the error encoded in the pointer returned by
 * nvmet_subsys_alloc().  The global is assigned unconditionally, so after a
 * failure it holds that error-encoded pointer.
 */
int __init nvmet_init_discovery(void)
{
	struct nvmet_subsys *subsys;

	subsys = nvmet_subsys_alloc(NVME_DISC_SUBSYS_NAME, NVME_NQN_DISC);
	nvmet_disc_subsys = subsys;

	return PTR_ERR_OR_ZERO(subsys);
}

void nvmet_exit_discovery(void)
{
	nvmet_subsys_put(nvmet_disc_subsys);
}