intel_rdt_ctrlmondata.c 11.4 KB
Newer Older
T
Tony Luck 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28
/*
 * Resource Director Technology(RDT)
 * - Cache Allocation code.
 *
 * Copyright (C) 2016 Intel Corporation
 *
 * Authors:
 *    Fenghua Yu <fenghua.yu@intel.com>
 *    Tony Luck <tony.luck@intel.com>
 *
 * This program is free software; you can redistribute it and/or modify it
 * under the terms and conditions of the GNU General Public License,
 * version 2, as published by the Free Software Foundation.
 *
 * This program is distributed in the hope it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License for
 * more details.
 *
 * More information about RDT can be found in the Intel (R) x86 Architecture
 * Software Developer Manual June 2016, volume 3, section 17.17.
 */

#define pr_fmt(fmt)	KBUILD_MODNAME ": " fmt

#include <linux/kernfs.h>
#include <linux/seq_file.h>
#include <linux/slab.h>
29
#include "intel_rdt.h"
T
Tony Luck 已提交
30

31 32 33 34 35 36 37 38 39 40 41 42 43 44
/*
 * Check whether MBA bandwidth percentage value is correct. The value is
 * checked against the minimum and max bandwidth values specified by the
 * hardware. The allocated bandwidth percentage is rounded to the next
 * control step available on the hardware.
 */
static bool bw_validate(char *buf, unsigned long *data, struct rdt_resource *r)
{
	unsigned long bw;
	int ret;

	/*
	 * Only linear delay values is supported for current Intel SKUs.
	 */
45 46
	if (!r->membw.delay_linear) {
		rdt_last_cmd_puts("No support for non-linear MB domains\n");
47
		return false;
48
	}
49 50

	ret = kstrtoul(buf, 10, &bw);
51 52
	if (ret) {
		rdt_last_cmd_printf("Non-decimal digit in MB value %s\n", buf);
53
		return false;
54
	}
55

56 57
	if ((bw < r->membw.min_bw || bw > r->default_ctrl) &&
	    !is_mba_sc(r)) {
58 59
		rdt_last_cmd_printf("MB value %ld out of range [%d,%d]\n", bw,
				    r->membw.min_bw, r->default_ctrl);
60
		return false;
61
	}
62 63 64 65 66

	*data = roundup(bw, (unsigned long)r->membw.bw_gran);
	return true;
}

67
int parse_bw(void *_buf, struct rdt_resource *r, struct rdt_domain *d)
68 69
{
	unsigned long data;
70
	char *buf = _buf;
71

72 73
	if (d->have_new_ctrl) {
		rdt_last_cmd_printf("duplicate domain %d\n", d->id);
74
		return -EINVAL;
75
	}
76 77 78 79 80 81 82 83 84

	if (!bw_validate(buf, &data, r))
		return -EINVAL;
	d->new_ctrl = data;
	d->have_new_ctrl = true;

	return 0;
}

T
Tony Luck 已提交
85 86 87 88 89 90
/*
 * Check whether a cache bit mask is valid. The SDM says:
 *	Please note that all (and only) contiguous '1' combinations
 *	are allowed (e.g. FFFFH, 0FF0H, 003CH, etc.).
 * Additionally Haswell requires at least two bits set.
 */
91
static bool cbm_validate(char *buf, u32 *data, struct rdt_resource *r)
T
Tony Luck 已提交
92
{
93
	unsigned long first_bit, zero_bit, val;
94
	unsigned int cbm_len = r->cache.cbm_len;
95 96 97
	int ret;

	ret = kstrtoul(buf, 16, &val);
98 99
	if (ret) {
		rdt_last_cmd_printf("non-hex character in mask %s\n", buf);
100
		return false;
101
	}
T
Tony Luck 已提交
102

103 104
	if (val == 0 || val > r->default_ctrl) {
		rdt_last_cmd_puts("mask out of range\n");
T
Tony Luck 已提交
105
		return false;
106
	}
T
Tony Luck 已提交
107

108 109
	first_bit = find_first_bit(&val, cbm_len);
	zero_bit = find_next_zero_bit(&val, cbm_len, first_bit);
T
Tony Luck 已提交
110

111 112
	if (find_next_bit(&val, cbm_len, zero_bit) < cbm_len) {
		rdt_last_cmd_printf("mask %lx has non-consecutive 1-bits\n", val);
T
Tony Luck 已提交
113
		return false;
114
	}
T
Tony Luck 已提交
115

116 117 118
	if ((zero_bit - first_bit) < r->cache.min_cbm_bits) {
		rdt_last_cmd_printf("Need at least %d bits in mask\n",
				    r->cache.min_cbm_bits);
T
Tony Luck 已提交
119
		return false;
120
	}
121 122

	*data = val;
T
Tony Luck 已提交
123 124 125
	return true;
}

126 127 128 129 130
struct rdt_cbm_parse_data {
	struct rdtgroup		*rdtgrp;
	char			*buf;
};

T
Tony Luck 已提交
131 132 133 134
/*
 * Read one cache bit mask (hex). Check that it is valid for the current
 * resource type.
 */
135
int parse_cbm(void *_data, struct rdt_resource *r, struct rdt_domain *d)
T
Tony Luck 已提交
136
{
137 138
	struct rdt_cbm_parse_data *data = _data;
	struct rdtgroup *rdtgrp = data->rdtgrp;
139
	u32 cbm_val;
T
Tony Luck 已提交
140

141 142
	if (d->have_new_ctrl) {
		rdt_last_cmd_printf("duplicate domain %d\n", d->id);
143
		return -EINVAL;
144
	}
145

146 147 148 149 150 151 152 153 154 155
	/*
	 * Cannot set up more than one pseudo-locked region in a cache
	 * hierarchy.
	 */
	if (rdtgrp->mode == RDT_MODE_PSEUDO_LOCKSETUP &&
	    rdtgroup_pseudo_locked_in_hierarchy(d)) {
		rdt_last_cmd_printf("pseudo-locked region in hierarchy\n");
		return -EINVAL;
	}

156 157 158
	if (!cbm_validate(data->buf, &cbm_val, r))
		return -EINVAL;

159 160 161 162 163 164 165
	if ((rdtgrp->mode == RDT_MODE_EXCLUSIVE ||
	     rdtgrp->mode == RDT_MODE_SHAREABLE) &&
	    rdtgroup_cbm_overlaps_pseudo_locked(d, cbm_val)) {
		rdt_last_cmd_printf("CBM overlaps with pseudo-locked region\n");
		return -EINVAL;
	}

166 167 168 169 170 171
	/*
	 * The CBM may not overlap with the CBM of another closid if
	 * either is exclusive.
	 */
	if (rdtgroup_cbm_overlaps(r, d, cbm_val, rdtgrp->closid, true)) {
		rdt_last_cmd_printf("overlaps with exclusive group\n");
T
Tony Luck 已提交
172
		return -EINVAL;
173 174 175
	}

	if (rdtgroup_cbm_overlaps(r, d, cbm_val, rdtgrp->closid, false)) {
176 177
		if (rdtgrp->mode == RDT_MODE_EXCLUSIVE ||
		    rdtgrp->mode == RDT_MODE_PSEUDO_LOCKSETUP) {
178 179 180 181
			rdt_last_cmd_printf("overlaps with other group\n");
			return -EINVAL;
		}
	}
182 183

	d->new_ctrl = cbm_val;
184
	d->have_new_ctrl = true;
T
Tony Luck 已提交
185 186 187 188 189 190 191

	return 0;
}

/*
 * For each domain in this resource we expect to find a series of:
 *	id=mask
192 193
 * separated by ";". The "id" is in decimal, and must match one of
 * the "id"s for this resource.
T
Tony Luck 已提交
194
 */
195 196
static int parse_line(char *line, struct rdt_resource *r,
		      struct rdtgroup *rdtgrp)
T
Tony Luck 已提交
197
{
198
	struct rdt_cbm_parse_data data;
T
Tony Luck 已提交
199 200 201 202
	char *dom = NULL, *id;
	struct rdt_domain *d;
	unsigned long dom_id;

203 204 205 206 207
next:
	if (!line || line[0] == '\0')
		return 0;
	dom = strsep(&line, ";");
	id = strsep(&dom, "=");
208 209
	if (!dom || kstrtoul(id, 10, &dom_id)) {
		rdt_last_cmd_puts("Missing '=' or non-numeric domain\n");
210
		return -EINVAL;
211
	}
212
	dom = strim(dom);
T
Tony Luck 已提交
213
	list_for_each_entry(d, &r->domains, list) {
214
		if (d->id == dom_id) {
215 216 217
			data.buf = dom;
			data.rdtgrp = rdtgrp;
			if (r->parse_ctrlval(&data, r, d))
218
				return -EINVAL;
219 220 221 222 223 224 225 226 227 228 229 230 231 232 233
			if (rdtgrp->mode ==  RDT_MODE_PSEUDO_LOCKSETUP) {
				/*
				 * In pseudo-locking setup mode and just
				 * parsed a valid CBM that should be
				 * pseudo-locked. Only one locked region per
				 * resource group and domain so just do
				 * the required initialization for single
				 * region and return.
				 */
				rdtgrp->plr->r = r;
				rdtgrp->plr->d = d;
				rdtgrp->plr->cbm = d->new_ctrl;
				d->plr = rdtgrp->plr;
				return 0;
			}
234 235
			goto next;
		}
T
Tony Luck 已提交
236
	}
237
	return -EINVAL;
T
Tony Luck 已提交
238 239
}

240
int update_domains(struct rdt_resource *r, int closid)
T
Tony Luck 已提交
241 242 243 244
{
	struct msr_param msr_param;
	cpumask_var_t cpu_mask;
	struct rdt_domain *d;
245 246
	bool mba_sc;
	u32 *dc;
247
	int cpu;
T
Tony Luck 已提交
248 249 250 251 252 253 254 255

	if (!zalloc_cpumask_var(&cpu_mask, GFP_KERNEL))
		return -ENOMEM;

	msr_param.low = closid;
	msr_param.high = msr_param.low + 1;
	msr_param.res = r;

256
	mba_sc = is_mba_sc(r);
T
Tony Luck 已提交
257
	list_for_each_entry(d, &r->domains, list) {
258 259
		dc = !mba_sc ? d->ctrl_val : d->mbps_val;
		if (d->have_new_ctrl && d->new_ctrl != dc[closid]) {
260
			cpumask_set_cpu(cpumask_any(&d->cpu_mask), cpu_mask);
261
			dc[closid] = d->new_ctrl;
262
		}
T
Tony Luck 已提交
263
	}
264 265 266 267 268 269

	/*
	 * Avoid writing the control msr with control values when
	 * MBA software controller is enabled
	 */
	if (cpumask_empty(cpu_mask) || mba_sc)
270
		goto done;
T
Tony Luck 已提交
271 272 273
	cpu = get_cpu();
	/* Update CBM on this cpu if it's in cpu_mask. */
	if (cpumask_test_cpu(cpu, cpu_mask))
274
		rdt_ctrl_update(&msr_param);
T
Tony Luck 已提交
275
	/* Update CBM on other cpus. */
276
	smp_call_function_many(cpu_mask, rdt_ctrl_update, &msr_param, 1);
T
Tony Luck 已提交
277 278
	put_cpu();

279
done:
T
Tony Luck 已提交
280 281 282 283 284
	free_cpumask_var(cpu_mask);

	return 0;
}

285 286
static int rdtgroup_parse_resource(char *resname, char *tok,
				   struct rdtgroup *rdtgrp)
287 288 289
{
	struct rdt_resource *r;

290
	for_each_alloc_enabled_rdt_resource(r) {
291 292
		if (!strcmp(resname, r->name) && rdtgrp->closid < r->num_closid)
			return parse_line(tok, r, rdtgrp);
293
	}
294
	rdt_last_cmd_printf("unknown/unsupported resource name '%s'\n", resname);
295 296 297
	return -EINVAL;
}

T
Tony Luck 已提交
298 299 300 301
/*
 * kernfs write handler: parse the schemata text in @buf, one
 * "resource:id=value;..." entry per line, stage the values in the domains
 * and then apply them for the group's closid.
 *
 * Returns @nbytes on success or a negative errno.
 */
ssize_t rdtgroup_schemata_write(struct kernfs_open_file *of,
				char *buf, size_t nbytes, loff_t off)
{
	struct rdt_resource *res;
	struct rdt_domain *d;
	struct rdtgroup *grp;
	char *line, *name;
	int ret = 0;

	/* Valid input requires a trailing newline */
	if (nbytes == 0 || buf[nbytes - 1] != '\n')
		return -EINVAL;
	buf[nbytes - 1] = '\0';

	grp = rdtgroup_kn_lock_live(of->kn);
	if (!grp) {
		ret = -ENOENT;
		goto out;
	}
	rdt_last_cmd_clear();

	/*
	 * A pseudo-locked region cannot be modified in place; it has to be
	 * removed and created again.
	 */
	if (grp->mode == RDT_MODE_PSEUDO_LOCKED) {
		ret = -EINVAL;
		rdt_last_cmd_puts("resource group is pseudo-locked\n");
		goto out;
	}

	/* Forget values staged by an earlier write. */
	for_each_alloc_enabled_rdt_resource(res) {
		list_for_each_entry(d, &res->domains, list)
			d->have_new_ctrl = false;
	}

	for (line = strsep(&buf, "\n"); line; line = strsep(&buf, "\n")) {
		/* After this, "line" holds whatever followed the ':'. */
		name = strim(strsep(&line, ":"));
		if (!line) {
			rdt_last_cmd_puts("Missing ':'\n");
			ret = -EINVAL;
			goto out;
		}
		if (line[0] == '\0') {
			rdt_last_cmd_printf("Missing '%s' value\n", name);
			ret = -EINVAL;
			goto out;
		}
		ret = rdtgroup_parse_resource(name, line, grp);
		if (ret)
			goto out;
	}

	for_each_alloc_enabled_rdt_resource(res) {
		ret = update_domains(res, grp->closid);
		if (ret)
			goto out;
	}

	/*
	 * Should pseudo-locking fail, the resource group stays in mode
	 * RDT_MODE_PSEUDO_LOCKSETUP with its class of service active and
	 * updated for just the domain the pseudo-locked region was
	 * requested for.
	 */
	if (grp->mode == RDT_MODE_PSEUDO_LOCKSETUP)
		ret = rdtgroup_pseudo_lock_create(grp);

out:
	rdtgroup_kn_unlock(of->kn);
	return ret ? ret : nbytes;
}

static void show_doms(struct seq_file *s, struct rdt_resource *r, int closid)
{
	struct rdt_domain *dom;
	bool sep = false;
376
	u32 ctrl_val;
T
Tony Luck 已提交
377

378
	seq_printf(s, "%*s:", max_name_width, r->name);
T
Tony Luck 已提交
379 380 381
	list_for_each_entry(dom, &r->domains, list) {
		if (sep)
			seq_puts(s, ";");
382 383 384

		ctrl_val = (!is_mba_sc(r) ? dom->ctrl_val[closid] :
			    dom->mbps_val[closid]);
385
		seq_printf(s, r->format_str, dom->id, max_data_width,
386
			   ctrl_val);
T
Tony Luck 已提交
387 388 389 390 391 392 393 394 395 396
		sep = true;
	}
	seq_puts(s, "\n");
}

int rdtgroup_schemata_show(struct kernfs_open_file *of,
			   struct seq_file *s, void *v)
{
	struct rdtgroup *rdtgrp;
	struct rdt_resource *r;
V
Vikas Shivappa 已提交
397 398
	int ret = 0;
	u32 closid;
T
Tony Luck 已提交
399 400 401

	rdtgrp = rdtgroup_kn_lock_live(of->kn);
	if (rdtgrp) {
402 403 404
		if (rdtgrp->mode == RDT_MODE_PSEUDO_LOCKSETUP) {
			for_each_alloc_enabled_rdt_resource(r)
				seq_printf(s, "%s:uninitialized\n", r->name);
405 406 407
		} else if (rdtgrp->mode == RDT_MODE_PSEUDO_LOCKED) {
			seq_printf(s, "%s:%d=%x\n", rdtgrp->plr->r->name,
				   rdtgrp->plr->d->id, rdtgrp->plr->cbm);
408 409 410 411 412 413
		} else {
			closid = rdtgrp->closid;
			for_each_alloc_enabled_rdt_resource(r) {
				if (closid < r->num_closid)
					show_doms(s, r, closid);
			}
T
Tony Luck 已提交
414 415 416 417 418 419 420
		}
	} else {
		ret = -ENOENT;
	}
	rdtgroup_kn_unlock(of->kn);
	return ret;
}
V
Vikas Shivappa 已提交
421 422

void mon_event_read(struct rmid_read *rr, struct rdt_domain *d,
423
		    struct rdtgroup *rdtgrp, int evtid, int first)
V
Vikas Shivappa 已提交
424 425 426 427 428 429
{
	/*
	 * setup the parameters to send to the IPI to read the data.
	 */
	rr->rgrp = rdtgrp;
	rr->evtid = evtid;
430
	rr->d = d;
V
Vikas Shivappa 已提交
431
	rr->val = 0;
432
	rr->first = first;
V
Vikas Shivappa 已提交
433 434 435 436 437 438 439 440 441 442 443 444 445 446 447 448 449 450 451 452 453 454 455 456 457 458 459 460 461

	smp_call_function_any(&d->cpu_mask, mon_event_count, rr, 1);
}

int rdtgroup_mondata_show(struct seq_file *m, void *arg)
{
	struct kernfs_open_file *of = m->private;
	u32 resid, evtid, domid;
	struct rdtgroup *rdtgrp;
	struct rdt_resource *r;
	union mon_data_bits md;
	struct rdt_domain *d;
	struct rmid_read rr;
	int ret = 0;

	rdtgrp = rdtgroup_kn_lock_live(of->kn);

	md.priv = of->kn->priv;
	resid = md.u.rid;
	domid = md.u.domid;
	evtid = md.u.evtid;

	r = &rdt_resources_all[resid];
	d = rdt_find_domain(r, domid, NULL);
	if (!d) {
		ret = -ENOENT;
		goto out;
	}

462
	mon_event_read(&rr, d, rdtgrp, evtid, false);
V
Vikas Shivappa 已提交
463 464 465 466 467 468 469 470 471 472 473 474

	if (rr.val & RMID_VAL_ERROR)
		seq_puts(m, "Error\n");
	else if (rr.val & RMID_VAL_UNAVAIL)
		seq_puts(m, "Unavailable\n");
	else
		seq_printf(m, "%llu\n", rr.val * r->mon_scale);

out:
	rdtgroup_kn_unlock(of->kn);
	return ret;
}