record.c 7.1 KB
Newer Older
1
// SPDX-License-Identifier: GPL-2.0
2 3 4
#include "evlist.h"
#include "evsel.h"
#include "cpumap.h"
5
#include "parse-events.h"
6
#include <errno.h>
7
#include <api/fs/fs.h>
8
#include <subcmd/parse-options.h>
9
#include <perf/cpumap.h>
10
#include "util.h"
11
#include "cloexec.h"
12

13
/*
 * Callback used by the API probing helpers in this file: it receives the
 * evsel being probed and adjusts it (the callbacks defined below each set
 * one field of evsel->core.attr) before the event is opened a second time.
 */
typedef void (*setup_probe_fn_t)(struct evsel *evsel);
14 15 16

/*
 * Probe whether the kernel accepts the attribute tweak applied by @fn.
 *
 * The event described by @str is parsed into a temporary evlist and its
 * first evsel is opened on @cpu to check that the plain event works at
 * all.  @fn then modifies the evsel and the event is opened a second time.
 *
 * Returns:
 *   0        both opens succeeded
 *   -ENOMEM  the temporary evlist could not be allocated
 *   -EINVAL  the second (modified) open failed with errno EINVAL
 *   -EAGAIN  any other failure (parse error, first open failed, or the
 *            second open failed with a different errno)
 */
static int perf_do_probe_api(setup_probe_fn_t fn, int cpu, const char *str)
{
	/*
	 * Kept across calls: once an EACCES forces the fallback to pid 0,
	 * later probes start directly with pid 0.
	 */
	static pid_t pid = -1;
	unsigned long open_flags = perf_event_open_cloexec_flag();
	struct evlist *probe_list;
	struct evsel *probe;
	int err = -EAGAIN;
	int fd;

	probe_list = evlist__new();
	if (probe_list == NULL)
		return -ENOMEM;

	if (parse_events(probe_list, str, NULL) != 0)
		goto out_delete;

	probe = perf_evlist__first(probe_list);

	/* First open: the unmodified event, retried once with pid 0 on EACCES. */
	for (;;) {
		fd = sys_perf_event_open(&probe->core.attr, pid, cpu, -1, open_flags);
		if (fd >= 0)
			break;
		if (pid != -1 || errno != EACCES)
			goto out_delete;
		pid = 0;
	}
	close(fd);

	/* Second open: the same event after @fn has adjusted it. */
	fn(probe);

	fd = sys_perf_event_open(&probe->core.attr, pid, cpu, -1, open_flags);
	if (fd >= 0) {
		close(fd);
		err = 0;
	} else if (errno == EINVAL) {
		err = -EINVAL;
	}

out_delete:
	evlist__delete(probe_list);
	return err;
}

/*
 * Run perf_do_probe_api() with @fn against a short list of candidate
 * events, using the first CPU of a newly created CPU map.
 *
 * The next candidate is tried only while the previous probe returned
 * -EAGAIN.  Returns true as soon as one probe returns 0, false otherwise
 * (including when the CPU map cannot be created).
 */
static bool perf_probe_api(setup_probe_fn_t fn)
{
	const char *candidates[] = {"cycles:u", "instructions:u", "cpu-clock:u", NULL};
	struct perf_cpu_map *cpu_map;
	int first_cpu;
	int idx;

	cpu_map = perf_cpu_map__new(NULL);
	if (cpu_map == NULL)
		return false;
	first_cpu = cpu_map->map[0];
	perf_cpu_map__put(cpu_map);

	for (idx = 0; candidates[idx] != NULL; idx++) {
		int rc = perf_do_probe_api(fn, first_cpu, candidates[idx]);

		if (rc == 0)
			return true;
		/* Anything other than -EAGAIN ends the search. */
		if (rc != -EAGAIN)
			break;
	}

	return false;
}

82
static void perf_probe_sample_identifier(struct evsel *evsel)
83
{
84
	evsel->core.attr.sample_type |= PERF_SAMPLE_IDENTIFIER;
85 86
}

87
static void perf_probe_comm_exec(struct evsel *evsel)
88
{
89
	evsel->core.attr.comm_exec = 1;
90 91
}

92
static void perf_probe_context_switch(struct evsel *evsel)
93
{
94
	evsel->core.attr.context_switch = 1;
95 96
}

97 98 99 100
/*
 * Returns true when a probe event can be opened with
 * PERF_SAMPLE_IDENTIFIER set in its sample_type.
 */
bool perf_can_sample_identifier(void)
{
	bool supported = perf_probe_api(perf_probe_sample_identifier);

	return supported;
}
101

102 103 104 105 106
/* Returns true when a probe event can be opened with attr.comm_exec set. */
static bool perf_can_comm_exec(void)
{
	bool supported = perf_probe_api(perf_probe_comm_exec);

	return supported;
}

107 108 109 110 111
/* Returns true when a probe event can be opened with attr.context_switch set. */
bool perf_can_record_switch_events(void)
{
	bool supported = perf_probe_api(perf_probe_context_switch);

	return supported;
}

112 113 114 115 116 117 118
bool perf_can_record_cpu_wide(void)
{
	struct perf_event_attr attr = {
		.type = PERF_TYPE_SOFTWARE,
		.config = PERF_COUNT_SW_CPU_CLOCK,
		.exclude_kernel = 1,
	};
119
	struct perf_cpu_map *cpus;
120 121
	int cpu, fd;

122
	cpus = perf_cpu_map__new(NULL);
123 124 125
	if (!cpus)
		return false;
	cpu = cpus->map[0];
126
	perf_cpu_map__put(cpus);
127 128 129 130 131 132 133 134 135

	fd = sys_perf_event_open(&attr, -1, cpu, -1, 0);
	if (fd < 0)
		return false;
	close(fd);

	return true;
}

136
void perf_evlist__config(struct evlist *evlist, struct record_opts *opts,
137
			 struct callchain_param *callchain)
138
{
139
	struct evsel *evsel;
140
	bool use_sample_identifier = false;
141
	bool use_comm_exec;
J
Jiri Olsa 已提交
142
	bool sample_id = opts->sample_id;
143

144 145 146 147 148 149 150
	/*
	 * Set the evsel leader links before we configure attributes,
	 * since some might depend on this info.
	 */
	if (opts->group)
		perf_evlist__set_leader(evlist);

151
	if (evlist->core.cpus->map[0] < 0)
152 153
		opts->no_inherit = true;

154 155
	use_comm_exec = perf_can_comm_exec();

156
	evlist__for_each_entry(evlist, evsel) {
157
		perf_evsel__config(evsel, opts, callchain);
158
		if (evsel->tracking && use_comm_exec)
159
			evsel->core.attr.comm_exec = 1;
160
	}
161

162 163 164 165 166 167 168
	if (opts->full_auxtrace) {
		/*
		 * Need to be able to synthesize and parse selected events with
		 * arbitrary sample types, which requires always being able to
		 * match the id.
		 */
		use_sample_identifier = perf_can_sample_identifier();
J
Jiri Olsa 已提交
169
		sample_id = true;
170
	} else if (evlist->core.nr_entries > 1) {
171
		struct evsel *first = perf_evlist__first(evlist);
172

173
		evlist__for_each_entry(evlist, evsel) {
174
			if (evsel->core.attr.sample_type == first->core.attr.sample_type)
175 176 177 178
				continue;
			use_sample_identifier = perf_can_sample_identifier();
			break;
		}
J
Jiri Olsa 已提交
179 180 181 182
		sample_id = true;
	}

	if (sample_id) {
183
		evlist__for_each_entry(evlist, evsel)
184
			perf_evsel__set_sample_id(evsel, use_sample_identifier);
185
	}
186 187

	perf_evlist__set_id_pos(evlist);
188
}
189 190 191

/*
 * Read the kernel/perf_event_max_sample_rate sysctl into @rate.
 * Returns whatever sysctl__read_int() returns; callers in this file treat
 * a non-zero result as failure.
 */
static int get_max_rate(unsigned int *rate)
{
	int *value = (int *)rate;

	return sysctl__read_int("kernel/perf_event_max_sample_rate", value);
}

195
static int record_opts__config_freq(struct record_opts *opts)
196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223
{
	bool user_freq = opts->user_freq != UINT_MAX;
	unsigned int max_rate;

	if (opts->user_interval != ULLONG_MAX)
		opts->default_interval = opts->user_interval;
	if (user_freq)
		opts->freq = opts->user_freq;

	/*
	 * User specified count overrides default frequency.
	 */
	if (opts->default_interval)
		opts->freq = 0;
	else if (opts->freq) {
		opts->default_interval = opts->freq;
	} else {
		pr_err("frequency and count are zero, aborting\n");
		return -1;
	}

	if (get_max_rate(&max_rate))
		return 0;

	/*
	 * User specified frequency is over current maximum.
	 */
	if (user_freq && (max_rate < opts->freq)) {
224 225 226 227 228 229 230 231 232 233 234 235 236 237 238
		if (opts->strict_freq) {
			pr_err("error: Maximum frequency rate (%'u Hz) exceeded.\n"
			       "       Please use -F freq option with a lower value or consider\n"
			       "       tweaking /proc/sys/kernel/perf_event_max_sample_rate.\n",
			       max_rate);
			return -1;
		} else {
			pr_warning("warning: Maximum frequency rate (%'u Hz) exceeded, throttling from %'u Hz to %'u Hz.\n"
				   "         The limit can be raised via /proc/sys/kernel/perf_event_max_sample_rate.\n"
				   "         The kernel will lower it when perf's interrupts take too long.\n"
				   "         Use --strict-freq to disable this throttling, refusing to record.\n",
				   max_rate, opts->freq, max_rate);

			opts->freq = max_rate;
		}
239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254
	}

	/*
	 * Default frequency is over current maximum.
	 */
	if (max_rate < opts->freq) {
		pr_warning("Lowering default frequency rate to %u.\n"
			   "Please consider tweaking "
			   "/proc/sys/kernel/perf_event_max_sample_rate.\n",
			   max_rate);
		opts->freq = max_rate;
	}

	return 0;
}

255
/*
 * Validate and finalize @opts; currently this only resolves the sampling
 * frequency/interval.  Returns the result of record_opts__config_freq().
 */
int record_opts__config(struct record_opts *opts)
{
	int rc = record_opts__config_freq(opts);

	return rc;
}
259

260
bool perf_evlist__can_select_event(struct evlist *evlist, const char *str)
261
{
262
	struct evlist *temp_evlist;
263
	struct evsel *evsel;
264 265
	int err, fd, cpu;
	bool ret = false;
266
	pid_t pid = -1;
267

268
	temp_evlist = evlist__new();
269 270 271
	if (!temp_evlist)
		return false;

272
	err = parse_events(temp_evlist, str, NULL);
273 274 275 276 277
	if (err)
		goto out_delete;

	evsel = perf_evlist__last(temp_evlist);

278
	if (!evlist || cpu_map__empty(evlist->core.cpus)) {
279
		struct perf_cpu_map *cpus = perf_cpu_map__new(NULL);
280 281

		cpu =  cpus ? cpus->map[0] : 0;
282
		perf_cpu_map__put(cpus);
283
	} else {
284
		cpu = evlist->core.cpus->map[0];
285 286
	}

287
	while (1) {
288
		fd = sys_perf_event_open(&evsel->core.attr, pid, cpu, -1,
289 290 291 292 293 294 295 296 297
					 perf_event_open_cloexec_flag());
		if (fd < 0) {
			if (pid == -1 && errno == EACCES) {
				pid = 0;
				continue;
			}
			goto out_delete;
		}
		break;
298
	}
299 300
	close(fd);
	ret = true;
301 302

out_delete:
303
	evlist__delete(temp_evlist);
304 305
	return ret;
}
306 307 308 309 310 311 312 313 314 315 316 317 318 319 320 321 322 323 324 325 326 327

/*
 * Option callback that parses a sampling frequency argument.
 *
 * @opt:   option descriptor; opt->value points to the struct record_opts
 *         whose user_freq field is filled in.
 * @str:   either "max" (case-insensitive), meaning the current value of
 *         kernel/perf_event_max_sample_rate, or a non-negative decimal
 *         number.
 * @unset: unused.
 *
 * Returns 0 on success, -EINVAL when @str is NULL or is not a valid
 * frequency, and -1 when "max" was requested but the sysctl could not be
 * read.
 */
int record__parse_freq(const struct option *opt, const char *str, int unset __maybe_unused)
{
	struct record_opts *opts = opt->value;
	unsigned int freq;

	if (!str)
		return -EINVAL;

	if (strcasecmp(str, "max") == 0) {
		if (get_max_rate(&freq)) {
			pr_err("couldn't read /proc/sys/kernel/perf_event_max_sample_rate\n");
			return -1;
		}
		/* freq is unsigned, so it is printed with %u rather than %d. */
		pr_info("info: Using a maximum frequency rate of %'u Hz\n", freq);
	} else {
		char *end;
		long val;

		/*
		 * strtol() instead of atoi(): reject empty input, trailing
		 * garbage, negative numbers and out-of-range values instead
		 * of silently turning them into 0 or a wrapped unsigned.
		 * UINT_MAX itself is refused as well, because
		 * record_opts__config_freq() treats it as "no user frequency".
		 */
		errno = 0;
		val = strtol(str, &end, 10);
		if (end == str || *end != '\0' || errno == ERANGE ||
		    val < 0 || (unsigned long)val >= UINT_MAX) {
			pr_err("invalid frequency '%s'\n", str);
			return -EINVAL;
		}
		freq = (unsigned int)val;
	}

	opts->user_freq = freq;
	return 0;
}