intel_rdt_ctrlmondata.c 9.5 KB
Newer Older
T
Tony Luck 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28
/*
 * Resource Director Technology(RDT)
 * - Cache Allocation code.
 *
 * Copyright (C) 2016 Intel Corporation
 *
 * Authors:
 *    Fenghua Yu <fenghua.yu@intel.com>
 *    Tony Luck <tony.luck@intel.com>
 *
 * This program is free software; you can redistribute it and/or modify it
 * under the terms and conditions of the GNU General Public License,
 * version 2, as published by the Free Software Foundation.
 *
 * This program is distributed in the hope it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License for
 * more details.
 *
 * More information about RDT can be found in the Intel (R) x86 Architecture
 * Software Developer Manual June 2016, volume 3, section 17.17.
 */

#define pr_fmt(fmt)	KBUILD_MODNAME ": " fmt

#include <linux/kernfs.h>
#include <linux/seq_file.h>
#include <linux/slab.h>
29
#include "intel_rdt.h"
T
Tony Luck 已提交
30

31 32 33 34 35 36 37 38 39 40 41 42 43 44
/*
 * Check whether MBA bandwidth percentage value is correct. The value is
 * checked against the minimum and max bandwidth values specified by the
 * hardware. The allocated bandwidth percentage is rounded to the next
 * control step available on the hardware.
 */
static bool bw_validate(char *buf, unsigned long *data, struct rdt_resource *r)
{
	unsigned long bw;
	int ret;

	/*
	 * Only linear delay values is supported for current Intel SKUs.
	 */
45 46
	if (!r->membw.delay_linear) {
		rdt_last_cmd_puts("No support for non-linear MB domains\n");
47
		return false;
48
	}
49 50

	ret = kstrtoul(buf, 10, &bw);
51 52
	if (ret) {
		rdt_last_cmd_printf("Non-decimal digit in MB value %s\n", buf);
53
		return false;
54
	}
55

56 57
	if ((bw < r->membw.min_bw || bw > r->default_ctrl) &&
	    !is_mba_sc(r)) {
58 59
		rdt_last_cmd_printf("MB value %ld out of range [%d,%d]\n", bw,
				    r->membw.min_bw, r->default_ctrl);
60
		return false;
61
	}
62 63 64 65 66

	*data = roundup(bw, (unsigned long)r->membw.bw_gran);
	return true;
}

67
int parse_bw(void *_buf, struct rdt_resource *r, struct rdt_domain *d)
68 69
{
	unsigned long data;
70
	char *buf = _buf;
71

72 73
	if (d->have_new_ctrl) {
		rdt_last_cmd_printf("duplicate domain %d\n", d->id);
74
		return -EINVAL;
75
	}
76 77 78 79 80 81 82 83 84

	if (!bw_validate(buf, &data, r))
		return -EINVAL;
	d->new_ctrl = data;
	d->have_new_ctrl = true;

	return 0;
}

T
Tony Luck 已提交
85 86 87 88 89 90
/*
 * Check whether a cache bit mask is valid. The SDM says:
 *	Please note that all (and only) contiguous '1' combinations
 *	are allowed (e.g. FFFFH, 0FF0H, 003CH, etc.).
 * Additionally Haswell requires at least two bits set.
 */
91
static bool cbm_validate(char *buf, u32 *data, struct rdt_resource *r)
T
Tony Luck 已提交
92
{
93
	unsigned long first_bit, zero_bit, val;
94
	unsigned int cbm_len = r->cache.cbm_len;
95 96 97
	int ret;

	ret = kstrtoul(buf, 16, &val);
98 99
	if (ret) {
		rdt_last_cmd_printf("non-hex character in mask %s\n", buf);
100
		return false;
101
	}
T
Tony Luck 已提交
102

103 104
	if (val == 0 || val > r->default_ctrl) {
		rdt_last_cmd_puts("mask out of range\n");
T
Tony Luck 已提交
105
		return false;
106
	}
T
Tony Luck 已提交
107

108 109
	first_bit = find_first_bit(&val, cbm_len);
	zero_bit = find_next_zero_bit(&val, cbm_len, first_bit);
T
Tony Luck 已提交
110

111 112
	if (find_next_bit(&val, cbm_len, zero_bit) < cbm_len) {
		rdt_last_cmd_printf("mask %lx has non-consecutive 1-bits\n", val);
T
Tony Luck 已提交
113
		return false;
114
	}
T
Tony Luck 已提交
115

116 117 118
	if ((zero_bit - first_bit) < r->cache.min_cbm_bits) {
		rdt_last_cmd_printf("Need at least %d bits in mask\n",
				    r->cache.min_cbm_bits);
T
Tony Luck 已提交
119
		return false;
120
	}
121 122

	*data = val;
T
Tony Luck 已提交
123 124 125
	return true;
}

126 127 128 129 130
struct rdt_cbm_parse_data {
	struct rdtgroup		*rdtgrp;
	char			*buf;
};

T
Tony Luck 已提交
131 132 133 134
/*
 * Read one cache bit mask (hex). Check that it is valid for the current
 * resource type.
 */
135
int parse_cbm(void *_data, struct rdt_resource *r, struct rdt_domain *d)
T
Tony Luck 已提交
136
{
137 138
	struct rdt_cbm_parse_data *data = _data;
	struct rdtgroup *rdtgrp = data->rdtgrp;
139
	u32 cbm_val;
T
Tony Luck 已提交
140

141 142
	if (d->have_new_ctrl) {
		rdt_last_cmd_printf("duplicate domain %d\n", d->id);
143
		return -EINVAL;
144
	}
145

146 147 148 149 150 151 152 153 154
	if (!cbm_validate(data->buf, &cbm_val, r))
		return -EINVAL;

	/*
	 * The CBM may not overlap with the CBM of another closid if
	 * either is exclusive.
	 */
	if (rdtgroup_cbm_overlaps(r, d, cbm_val, rdtgrp->closid, true)) {
		rdt_last_cmd_printf("overlaps with exclusive group\n");
T
Tony Luck 已提交
155
		return -EINVAL;
156 157 158 159 160 161 162 163
	}

	if (rdtgroup_cbm_overlaps(r, d, cbm_val, rdtgrp->closid, false)) {
		if (rdtgrp->mode == RDT_MODE_EXCLUSIVE) {
			rdt_last_cmd_printf("overlaps with other group\n");
			return -EINVAL;
		}
	}
164 165

	d->new_ctrl = cbm_val;
166
	d->have_new_ctrl = true;
T
Tony Luck 已提交
167 168 169 170 171 172 173

	return 0;
}

/*
 * For each domain in this resource we expect to find a series of:
 *	id=mask
174 175
 * separated by ";". The "id" is in decimal, and must match one of
 * the "id"s for this resource.
T
Tony Luck 已提交
176
 */
177 178
static int parse_line(char *line, struct rdt_resource *r,
		      struct rdtgroup *rdtgrp)
T
Tony Luck 已提交
179
{
180
	struct rdt_cbm_parse_data data;
T
Tony Luck 已提交
181 182 183 184
	char *dom = NULL, *id;
	struct rdt_domain *d;
	unsigned long dom_id;

185 186 187 188 189
next:
	if (!line || line[0] == '\0')
		return 0;
	dom = strsep(&line, ";");
	id = strsep(&dom, "=");
190 191
	if (!dom || kstrtoul(id, 10, &dom_id)) {
		rdt_last_cmd_puts("Missing '=' or non-numeric domain\n");
192
		return -EINVAL;
193
	}
194
	dom = strim(dom);
T
Tony Luck 已提交
195
	list_for_each_entry(d, &r->domains, list) {
196
		if (d->id == dom_id) {
197 198 199
			data.buf = dom;
			data.rdtgrp = rdtgrp;
			if (r->parse_ctrlval(&data, r, d))
200 201 202
				return -EINVAL;
			goto next;
		}
T
Tony Luck 已提交
203
	}
204
	return -EINVAL;
T
Tony Luck 已提交
205 206
}

207
int update_domains(struct rdt_resource *r, int closid)
T
Tony Luck 已提交
208 209 210 211
{
	struct msr_param msr_param;
	cpumask_var_t cpu_mask;
	struct rdt_domain *d;
212 213
	bool mba_sc;
	u32 *dc;
214
	int cpu;
T
Tony Luck 已提交
215 216 217 218 219 220 221 222

	if (!zalloc_cpumask_var(&cpu_mask, GFP_KERNEL))
		return -ENOMEM;

	msr_param.low = closid;
	msr_param.high = msr_param.low + 1;
	msr_param.res = r;

223
	mba_sc = is_mba_sc(r);
T
Tony Luck 已提交
224
	list_for_each_entry(d, &r->domains, list) {
225 226
		dc = !mba_sc ? d->ctrl_val : d->mbps_val;
		if (d->have_new_ctrl && d->new_ctrl != dc[closid]) {
227
			cpumask_set_cpu(cpumask_any(&d->cpu_mask), cpu_mask);
228
			dc[closid] = d->new_ctrl;
229
		}
T
Tony Luck 已提交
230
	}
231 232 233 234 235 236

	/*
	 * Avoid writing the control msr with control values when
	 * MBA software controller is enabled
	 */
	if (cpumask_empty(cpu_mask) || mba_sc)
237
		goto done;
T
Tony Luck 已提交
238 239 240
	cpu = get_cpu();
	/* Update CBM on this cpu if it's in cpu_mask. */
	if (cpumask_test_cpu(cpu, cpu_mask))
241
		rdt_ctrl_update(&msr_param);
T
Tony Luck 已提交
242
	/* Update CBM on other cpus. */
243
	smp_call_function_many(cpu_mask, rdt_ctrl_update, &msr_param, 1);
T
Tony Luck 已提交
244 245
	put_cpu();

246
done:
T
Tony Luck 已提交
247 248 249 250 251
	free_cpumask_var(cpu_mask);

	return 0;
}

252 253
static int rdtgroup_parse_resource(char *resname, char *tok,
				   struct rdtgroup *rdtgrp)
254 255 256
{
	struct rdt_resource *r;

257
	for_each_alloc_enabled_rdt_resource(r) {
258 259
		if (!strcmp(resname, r->name) && rdtgrp->closid < r->num_closid)
			return parse_line(tok, r, rdtgrp);
260
	}
261
	rdt_last_cmd_printf("unknown/unsupported resource name '%s'\n", resname);
262 263 264
	return -EINVAL;
}

T
Tony Luck 已提交
265 266 267 268
/*
 * Write handler for a resource group's schemata file.
 *
 * @buf must end in a newline; it is split into "<resource>:<settings>"
 * lines, each of which is parsed and staged via rdtgroup_parse_resource().
 * Only when every line has been accepted are the staged values committed
 * with update_domains().
 *
 * Return: @nbytes on success, -EINVAL for malformed input, -ENOENT if
 * rdtgroup_kn_lock_live() returns no group, or the error reported by
 * parsing/updating.
 */
ssize_t rdtgroup_schemata_write(struct kernfs_open_file *of,
				char *buf, size_t nbytes, loff_t off)
{
	struct rdt_resource *res;
	struct rdt_domain *d;
	struct rdtgroup *grp;
	char *line, *name;
	int err = 0;

	/* Valid input requires a trailing newline */
	if (!nbytes || buf[nbytes - 1] != '\n')
		return -EINVAL;
	buf[nbytes - 1] = '\0';

	grp = rdtgroup_kn_lock_live(of->kn);
	if (!grp) {
		rdtgroup_kn_unlock(of->kn);
		return -ENOENT;
	}
	rdt_last_cmd_clear();

	/* Forget anything staged by an earlier write. */
	for_each_alloc_enabled_rdt_resource(res) {
		list_for_each_entry(d, &res->domains, list)
			d->have_new_ctrl = false;
	}

	for (line = strsep(&buf, "\n"); line; line = strsep(&buf, "\n")) {
		/* After this call, line points past the ':' or is NULL. */
		name = strim(strsep(&line, ":"));
		if (!line) {
			rdt_last_cmd_puts("Missing ':'\n");
			err = -EINVAL;
			goto unlock;
		}
		if (*line == '\0') {
			rdt_last_cmd_printf("Missing '%s' value\n", name);
			err = -EINVAL;
			goto unlock;
		}

		err = rdtgroup_parse_resource(name, line, grp);
		if (err)
			goto unlock;
	}

	for_each_alloc_enabled_rdt_resource(res) {
		err = update_domains(res, grp->closid);
		if (err)
			goto unlock;
	}

unlock:
	rdtgroup_kn_unlock(of->kn);
	return err ?: nbytes;
}

static void show_doms(struct seq_file *s, struct rdt_resource *r, int closid)
{
	struct rdt_domain *dom;
	bool sep = false;
323
	u32 ctrl_val;
T
Tony Luck 已提交
324

325
	seq_printf(s, "%*s:", max_name_width, r->name);
T
Tony Luck 已提交
326 327 328
	list_for_each_entry(dom, &r->domains, list) {
		if (sep)
			seq_puts(s, ";");
329 330 331

		ctrl_val = (!is_mba_sc(r) ? dom->ctrl_val[closid] :
			    dom->mbps_val[closid]);
332
		seq_printf(s, r->format_str, dom->id, max_data_width,
333
			   ctrl_val);
T
Tony Luck 已提交
334 335 336 337 338 339 340 341 342 343
		sep = true;
	}
	seq_puts(s, "\n");
}

int rdtgroup_schemata_show(struct kernfs_open_file *of,
			   struct seq_file *s, void *v)
{
	struct rdtgroup *rdtgrp;
	struct rdt_resource *r;
V
Vikas Shivappa 已提交
344 345
	int ret = 0;
	u32 closid;
T
Tony Luck 已提交
346 347 348 349

	rdtgrp = rdtgroup_kn_lock_live(of->kn);
	if (rdtgrp) {
		closid = rdtgrp->closid;
350
		for_each_alloc_enabled_rdt_resource(r) {
T
Tony Luck 已提交
351 352 353 354 355 356 357 358 359
			if (closid < r->num_closid)
				show_doms(s, r, closid);
		}
	} else {
		ret = -ENOENT;
	}
	rdtgroup_kn_unlock(of->kn);
	return ret;
}
V
Vikas Shivappa 已提交
360 361

void mon_event_read(struct rmid_read *rr, struct rdt_domain *d,
362
		    struct rdtgroup *rdtgrp, int evtid, int first)
V
Vikas Shivappa 已提交
363 364 365 366 367 368
{
	/*
	 * setup the parameters to send to the IPI to read the data.
	 */
	rr->rgrp = rdtgrp;
	rr->evtid = evtid;
369
	rr->d = d;
V
Vikas Shivappa 已提交
370
	rr->val = 0;
371
	rr->first = first;
V
Vikas Shivappa 已提交
372 373 374 375 376 377 378 379 380 381 382 383 384 385 386 387 388 389 390 391 392 393 394 395 396 397 398 399 400

	smp_call_function_any(&d->cpu_mask, mon_event_count, rr, 1);
}

int rdtgroup_mondata_show(struct seq_file *m, void *arg)
{
	struct kernfs_open_file *of = m->private;
	u32 resid, evtid, domid;
	struct rdtgroup *rdtgrp;
	struct rdt_resource *r;
	union mon_data_bits md;
	struct rdt_domain *d;
	struct rmid_read rr;
	int ret = 0;

	rdtgrp = rdtgroup_kn_lock_live(of->kn);

	md.priv = of->kn->priv;
	resid = md.u.rid;
	domid = md.u.domid;
	evtid = md.u.evtid;

	r = &rdt_resources_all[resid];
	d = rdt_find_domain(r, domid, NULL);
	if (!d) {
		ret = -ENOENT;
		goto out;
	}

401
	mon_event_read(&rr, d, rdtgrp, evtid, false);
V
Vikas Shivappa 已提交
402 403 404 405 406 407 408 409 410 411 412 413

	if (rr.val & RMID_VAL_ERROR)
		seq_puts(m, "Error\n");
	else if (rr.val & RMID_VAL_UNAVAIL)
		seq_puts(m, "Unavailable\n");
	else
		seq_printf(m, "%llu\n", rr.val * r->mon_scale);

out:
	rdtgroup_kn_unlock(of->kn);
	return ret;
}