turbostat.c 112.7 KB
Newer Older
L
Len Brown 已提交
1 2 3 4
/*
 * turbostat -- show CPU frequency and C-state residency
 * on modern Intel turbo-capable processors.
 *
 * Copyright (c) 2013 Intel Corporation.
 * Len Brown <len.brown@intel.com>
 *
 * This program is free software; you can redistribute it and/or modify it
 * under the terms and conditions of the GNU General Public License,
 * version 2, as published by the Free Software Foundation.
 *
 * This program is distributed in the hope it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License for
 * more details.
 *
 * You should have received a copy of the GNU General Public License along with
 * this program; if not, write to the Free Software Foundation, Inc.,
 * 51 Franklin St - Fifth Floor, Boston, MA 02110-1301 USA.
 */

22
#define _GNU_SOURCE
23
#include MSRHEADER
24
#include INTEL_FAMILY_HEADER
25
#include <stdarg.h>
L
Len Brown 已提交
26
#include <stdio.h>
27
#include <err.h>
L
Len Brown 已提交
28 29 30 31 32 33 34 35 36
#include <unistd.h>
#include <sys/types.h>
#include <sys/wait.h>
#include <sys/stat.h>
#include <sys/resource.h>
#include <fcntl.h>
#include <signal.h>
#include <sys/time.h>
#include <stdlib.h>
37
#include <getopt.h>
L
Len Brown 已提交
38 39 40
#include <dirent.h>
#include <string.h>
#include <ctype.h>
41
#include <sched.h>
42
#include <time.h>
43
#include <cpuid.h>
44 45
#include <linux/capability.h>
#include <errno.h>
L
Len Brown 已提交
46 47

/*
 * File-scope state.  Objects without an explicit initializer start out as
 * zero / NULL, as for any C object with static storage duration.
 */
char *proc_stat = "/proc/stat";
FILE *outf;
int *fd_percpu;			/* indexed by cpu number, see get_msr_fd() */
struct timespec interval_ts = { .tv_sec = 5, .tv_nsec = 0 };

unsigned int debug;
unsigned int rapl_joules;
unsigned int summary_only;
unsigned int dump_only;

unsigned int do_snb_cstates;
unsigned int do_knl_cstates;
unsigned int do_pc2;
unsigned int do_pc3;
unsigned int do_pc6;
unsigned int do_pc7;
unsigned int do_c8_c9_c10;
unsigned int do_skl_residency;
unsigned int do_slm_cstates;
unsigned int use_c1_residency_msr;

unsigned int has_aperf;
unsigned int has_epb;
unsigned int do_irtl_snb;
unsigned int do_irtl_hsw;
unsigned int units = 1000000;	/* MHz etc */
unsigned int genuine_intel;
unsigned int has_invariant_tsc;
unsigned int do_nhm_platform_info;
unsigned int no_MSR_MISC_PWR_MGMT;
unsigned int aperf_mperf_multiplier = 1;

double bclk;
double base_hz;
unsigned int has_base_hz;
double tsc_tweak = 1.0;

unsigned int show_pkg_only;
unsigned int show_core_only;

/* output_buffer is the start of the text buffer, outp the current write position */
char *output_buffer;
char *outp;

unsigned int do_rapl;
unsigned int do_dts;
unsigned int do_ptm;

unsigned long long gfx_cur_rc6_ms;
unsigned int gfx_cur_mhz;

unsigned int tcc_activation_temp;
unsigned int tcc_activation_temp_override;

double rapl_power_units;
double rapl_time_units;
double rapl_dram_energy_units;
double rapl_energy_units;
double rapl_joule_counter_range;

unsigned int do_core_perf_limit_reasons;
unsigned int do_gfx_perf_limit_reasons;
unsigned int do_ring_perf_limit_reasons;

unsigned int crystal_hz;
unsigned long long tsc_hz;
int base_cpu;

double discover_bclk(unsigned int family, unsigned int model);

unsigned int has_hwp;			/* IA32_PM_ENABLE, IA32_HWP_CAPABILITIES */
					/* IA32_HWP_REQUEST, IA32_HWP_STATUS */
unsigned int has_hwp_notify;		/* IA32_HWP_INTERRUPT */
unsigned int has_hwp_activity_window;	/* IA32_HWP_REQUEST[bits 41:32] */
unsigned int has_hwp_epp;		/* IA32_HWP_REQUEST[bits 31:24] */
unsigned int has_hwp_pkg;		/* IA32_HWP_REQUEST_PKG */
105

L
Len Brown 已提交
106 107 108 109 110 111 112 113 114 115 116 117 118
/*
 * RAPL capability bits.  The MSRs listed next to each bit are the ones
 * the original author associated with it.
 */

/* 0x610 MSR_PKG_POWER_LIMIT, 0x611 MSR_PKG_ENERGY_STATUS */
#define RAPL_PKG			0x001
/* 0x613 MSR_PKG_PERF_STATUS */
#define RAPL_PKG_PERF_STATUS		0x002
/* 0x614 MSR_PKG_POWER_INFO */
#define RAPL_PKG_POWER_INFO		0x004

/* 0x618 MSR_DRAM_POWER_LIMIT, 0x619 MSR_DRAM_ENERGY_STATUS */
#define RAPL_DRAM			0x008
/* 0x61b MSR_DRAM_PERF_STATUS */
#define RAPL_DRAM_PERF_STATUS		0x010
/* 0x61c MSR_DRAM_POWER_INFO */
#define RAPL_DRAM_POWER_INFO		0x020

/* 0x638 MSR_PP0_POWER_LIMIT */
#define RAPL_CORES_POWER_LIMIT		0x040
/* 0x63a MSR_PP0_POLICY */
#define RAPL_CORE_POLICY		0x080

/* 0x640 MSR_PP1_POWER_LIMIT, 0x641 MSR_PP1_ENERGY_STATUS, 0x642 MSR_PP1_POLICY */
#define RAPL_GFX			0x100

/* 0x639 MSR_PP0_ENERGY_STATUS */
#define RAPL_CORES_ENERGY_STATUS	0x200

/* Both PP0 (cores) bits together. */
#define RAPL_CORES	(RAPL_CORES_POWER_LIMIT | RAPL_CORES_ENERGY_STATUS)

#define TJMAX_DEFAULT	100

/* Larger of two values; note that each argument may be evaluated twice. */
#define MAX(a, b)	(((a) > (b)) ? (a) : (b))

/*
 * Buffer size used by sscanf() for added column names.
 * Names are usually truncated to 7 characters, but 18 columns are
 * needed for raw 64-bit counters.
 */
#define NAME_BYTES	20

L
Len Brown 已提交
145 146 147
int backwards_count;
char *progname;

/* cpu sets together with the byte sizes handed to the CPU_*_S() macros */
cpu_set_t *cpu_present_set;
cpu_set_t *cpu_affinity_set;
size_t cpu_present_setsize;
size_t cpu_affinity_setsize;
150
/* Capacity of the counter[] array in each of the three records below. */
#define MAX_ADDED_COUNTERS 16

/* Bits tested in thread_data.flags. */
#define CPU_IS_FIRST_THREAD_IN_CORE	0x2
#define CPU_IS_FIRST_CORE_IN_PACKAGE	0x4

/* Per-thread counter record. */
struct thread_data {
	unsigned long long tsc;
	unsigned long long aperf;
	unsigned long long mperf;
	unsigned long long c1;
	unsigned int irq_count;
	unsigned int smi_count;
	unsigned int cpu_id;
	unsigned int flags;
	unsigned long long counter[MAX_ADDED_COUNTERS];
};
struct thread_data *thread_even;
struct thread_data *thread_odd;

/* Per-core counter record. */
struct core_data {
	unsigned long long c3;
	unsigned long long c6;
	unsigned long long c7;
	unsigned int core_temp_c;
	unsigned int core_id;
	unsigned long long counter[MAX_ADDED_COUNTERS];
};
struct core_data *core_even;
struct core_data *core_odd;

/* Per-package counter record. */
struct pkg_data {
	unsigned long long pc2;
	unsigned long long pc3;
	unsigned long long pc6;
	unsigned long long pc7;
	unsigned long long pc8;
	unsigned long long pc9;
	unsigned long long pc10;
	unsigned long long pkg_wtd_core_c0;
	unsigned long long pkg_any_core_c0;
	unsigned long long pkg_any_gfxe_c0;
	unsigned long long pkg_both_core_gfxe_c0;
	long long gfx_rc6_ms;		/* signed: -1 marks a counter reset, see delta_package() */
	unsigned int gfx_mhz;
	unsigned int package_id;
	unsigned int energy_pkg;	/* MSR_PKG_ENERGY_STATUS */
	unsigned int energy_dram;	/* MSR_DRAM_ENERGY_STATUS */
	unsigned int energy_cores;	/* MSR_PP0_ENERGY_STATUS */
	unsigned int energy_gfx;	/* MSR_PP1_ENERGY_STATUS */
	unsigned int rapl_pkg_perf_status;	/* MSR_PKG_PERF_STATUS */
	unsigned int rapl_dram_perf_status;	/* MSR_DRAM_PERF_STATUS */
	unsigned int pkg_temp_c;
	unsigned long long counter[MAX_ADDED_COUNTERS];
};
struct pkg_data *package_even;
struct pkg_data *package_odd;

/* Argument triples (thread, core, package bases) for the two counter sets. */
#define ODD_COUNTERS thread_odd, core_odd, package_odd
#define EVEN_COUNTERS thread_even, core_even, package_even

/*
 * Index helpers: each yields a pointer to one element of a flat array
 * starting at the given base, using the dimensions stored in the global
 * `topo`.  Every argument is parenthesized so that arbitrary expressions
 * can be passed safely.
 */
#define GET_THREAD(thread_base, thread_no, core_no, pkg_no) \
	((thread_base) + (pkg_no) * topo.num_cores_per_pkg * \
		topo.num_threads_per_core + \
		(core_no) * topo.num_threads_per_core + (thread_no))
#define GET_CORE(core_base, core_no, pkg_no) \
	((core_base) + (pkg_no) * topo.num_cores_per_pkg + (core_no))
#define GET_PKG(pkg_base, pkg_no) ((pkg_base) + (pkg_no))

211 212 213 214 215 216 217 218 219 220 221
enum counter_scope {
	SCOPE_CPU,
	SCOPE_CORE,
	SCOPE_PACKAGE
};

enum counter_type {
	COUNTER_CYCLES,
	COUNTER_SECONDS
};

enum counter_format {
	FORMAT_RAW,
	FORMAT_DELTA,
	FORMAT_PERCENT
};

/* Bit values for msr_counter.flags. */
#define	FLAGS_HIDE	(1 << 0)
#define	FLAGS_SHOW	(1 << 1)

/* One counter description; `next` chains descriptions into a list. */
struct msr_counter {
	unsigned int msr_num;
	char name[NAME_BYTES];
	unsigned int width;
	enum counter_type type;
	enum counter_format format;
	struct msr_counter *next;
	unsigned int flags;
};

/*
 * Heads of the three added-counter lists: tp is walked together with
 * thread_data.counter[], cp with core_data.counter[] and pp with
 * pkg_data.counter[].
 */
struct sys_counters {
	unsigned int added_thread_counters;
	unsigned int added_core_counters;
	unsigned int added_package_counters;
	struct msr_counter *tp;
	struct msr_counter *cp;
	struct msr_counter *pp;
};
struct sys_counters sys;

236 237 238 239
/* One record of each kind; format_all_counters() prints it as the summary row. */
struct system_summary {
	struct thread_data threads;
	struct core_data cores;
	struct pkg_data packages;
};
struct system_summary average;

/* Topology dimensions; used by GET_THREAD()/GET_CORE() and for_all_cpus(). */
struct topo_params {
	int num_packages;
	int num_cpus;
	int num_cores;
	int max_cpu_num;
	int num_cores_per_pkg;
	int num_threads_per_core;
};
struct topo_params topo;

struct timeval tv_even;
struct timeval tv_odd;
struct timeval tv_delta;

int *irq_column_2_cpu;	/* /proc/interrupts column numbers */
int *irqs_per_cpu;	/* indexed by cpu_num */

void setup_all_buffers(void);

int cpu_is_not_present(int cpu)
260
{
261
	return !CPU_ISSET_S(cpu, cpu_present_setsize, cpu_present_set);
262
}
263
/*
264 265
 * run func(thread, core, package) in topology order
 * skip non-present cpus
266
 */
267 268 269

int for_all_cpus(int (func)(struct thread_data *, struct core_data *, struct pkg_data *),
	struct thread_data *thread_base, struct core_data *core_base, struct pkg_data *pkg_base)
270
{
271
	int retval, pkg_no, core_no, thread_no;
272

273 274 275 276 277 278 279
	for (pkg_no = 0; pkg_no < topo.num_packages; ++pkg_no) {
		for (core_no = 0; core_no < topo.num_cores_per_pkg; ++core_no) {
			for (thread_no = 0; thread_no <
				topo.num_threads_per_core; ++thread_no) {
				struct thread_data *t;
				struct core_data *c;
				struct pkg_data *p;
280

281 282 283 284 285 286 287 288 289 290 291 292 293 294 295
				t = GET_THREAD(thread_base, thread_no, core_no, pkg_no);

				if (cpu_is_not_present(t->cpu_id))
					continue;

				c = GET_CORE(core_base, core_no, pkg_no);
				p = GET_PKG(pkg_base, pkg_no);

				retval = func(t, c, p);
				if (retval)
					return retval;
			}
		}
	}
	return 0;
296 297 298 299
}

/*
 * Restrict the calling thread (pid 0) to @cpu via sched_setaffinity(),
 * using cpu_affinity_set as scratch space.
 * Returns 0 on success, -1 when sched_setaffinity() reports -1.
 */
int cpu_migrate(int cpu)
{
	int rc;

	CPU_ZERO_S(cpu_affinity_setsize, cpu_affinity_set);
	CPU_SET_S(cpu, cpu_affinity_setsize, cpu_affinity_set);

	rc = sched_setaffinity(0, cpu_affinity_setsize, cpu_affinity_set);

	return (rc == -1) ? -1 : 0;
}
307
int get_msr_fd(int cpu)
L
Len Brown 已提交
308 309 310 311
{
	char pathname[32];
	int fd;

312 313 314 315 316
	fd = fd_percpu[cpu];

	if (fd)
		return fd;

L
Len Brown 已提交
317 318
	sprintf(pathname, "/dev/cpu/%d/msr", cpu);
	fd = open(pathname, O_RDONLY);
319
	if (fd < 0)
320
		err(-1, "%s open failed, try chown or chmod +r /dev/cpu/*/msr, or run as root", pathname);
L
Len Brown 已提交
321

322 323 324 325 326 327 328 329 330 331
	fd_percpu[cpu] = fd;

	return fd;
}

/*
 * Read sizeof(*msr) bytes at @offset from the msr device of @cpu into *msr.
 * A short or failed read terminates the program through err(); otherwise
 * 0 is returned.
 */
int get_msr(int cpu, off_t offset, unsigned long long *msr)
{
	int fd = get_msr_fd(cpu);
	ssize_t nread = pread(fd, msr, sizeof(*msr), offset);

	if (nread != sizeof(*msr))
		err(-1, "cpu%d: msr offset 0x%llx read failed", cpu, (unsigned long long)offset);

	return 0;
}

339
/*
340 341
 * Each string in this array is compared in --show and --hide cmdline.
 * Thus, strings that are proper sub-sets must follow their more specific peers.
342
 */
343 344 345 346 347 348 349 350 351 352 353 354 355 356 357 358 359 360 361 362 363 364 365 366 367 368 369 370 371 372 373 374 375 376 377 378 379 380 381 382 383 384 385 386 387 388 389 390 391 392 393 394 395 396 397 398 399 400 401 402 403 404 405 406 407 408 409 410 411 412 413 414 415 416 417 418 419 420 421 422 423 424 425 426 427 428 429 430 431 432 433 434 435 436 437 438 439 440 441 442 443 444 445 446 447 448 449 450 451 452 453 454 455 456 457
struct msr_counter bic[] = {
	{ 0x0, "Package" },
	{ 0x0, "Avg_MHz" },
	{ 0x0, "Bzy_MHz" },
	{ 0x0, "TSC_MHz" },
	{ 0x0, "IRQ" },
	{ 0x0, "SMI", 32, 0, FORMAT_DELTA, NULL},
	{ 0x0, "Busy%" },
	{ 0x0, "CPU%c1" },
	{ 0x0, "CPU%c3" },
	{ 0x0, "CPU%c6" },
	{ 0x0, "CPU%c7" },
	{ 0x0, "ThreadC" },
	{ 0x0, "CoreTmp" },
	{ 0x0, "CoreCnt" },
	{ 0x0, "PkgTmp" },
	{ 0x0, "GFX%rc6" },
	{ 0x0, "GFXMHz" },
	{ 0x0, "Pkg%pc2" },
	{ 0x0, "Pkg%pc3" },
	{ 0x0, "Pkg%pc6" },
	{ 0x0, "Pkg%pc7" },
	{ 0x0, "PkgWatt" },
	{ 0x0, "CorWatt" },
	{ 0x0, "GFXWatt" },
	{ 0x0, "PkgCnt" },
	{ 0x0, "RAMWatt" },
	{ 0x0, "PKG_%" },
	{ 0x0, "RAM_%" },
	{ 0x0, "Pkg_J" },
	{ 0x0, "Cor_J" },
	{ 0x0, "GFX_J" },
	{ 0x0, "RAM_J" },
	{ 0x0, "Core" },
	{ 0x0, "CPU" },
};

/* Number of entries in bic[]. */
#define MAX_BIC (sizeof(bic) / sizeof(struct msr_counter))

/*
 * One mask per built-in counter.  The bit number of each mask MUST equal
 * the index of the matching name in bic[], because bic_lookup() returns
 * (1ULL << index) for a name given on the command line.
 */
#define	BIC_Package	(1ULL << 0)
#define	BIC_Avg_MHz	(1ULL << 1)
#define	BIC_Bzy_MHz	(1ULL << 2)
#define	BIC_TSC_MHz	(1ULL << 3)
#define	BIC_IRQ		(1ULL << 4)
#define	BIC_SMI		(1ULL << 5)
#define	BIC_Busy	(1ULL << 6)
#define	BIC_CPU_c1	(1ULL << 7)
#define	BIC_CPU_c3	(1ULL << 8)
#define	BIC_CPU_c6	(1ULL << 9)
#define	BIC_CPU_c7	(1ULL << 10)
#define	BIC_ThreadC	(1ULL << 11)
#define	BIC_CoreTmp	(1ULL << 12)
#define	BIC_CoreCnt	(1ULL << 13)
#define	BIC_PkgTmp	(1ULL << 14)
#define	BIC_GFX_rc6	(1ULL << 15)
#define	BIC_GFXMHz	(1ULL << 16)
#define	BIC_Pkgpc2	(1ULL << 17)
#define	BIC_Pkgpc3	(1ULL << 18)
#define	BIC_Pkgpc6	(1ULL << 19)
#define	BIC_Pkgpc7	(1ULL << 20)
#define	BIC_PkgWatt	(1ULL << 21)
#define	BIC_CorWatt	(1ULL << 22)
#define	BIC_GFXWatt	(1ULL << 23)
#define	BIC_PkgCnt	(1ULL << 24)
#define	BIC_RAMWatt	(1ULL << 25)
#define	BIC_PKG__	(1ULL << 26)
#define	BIC_RAM__	(1ULL << 27)
#define	BIC_Pkg_J	(1ULL << 28)
#define	BIC_Cor_J	(1ULL << 29)
#define	BIC_GFX_J	(1ULL << 30)
#define	BIC_RAM_J	(1ULL << 31)
#define	BIC_Core	(1ULL << 32)
#define	BIC_CPU		(1ULL << 33)

/* All counters start enabled; bic_present collects the bits set through BIC_PRESENT(). */
unsigned long long bic_enabled = 0xFFFFFFFFFFFFFFFFULL;
unsigned long long bic_present;

/* Non-zero when the counter is both enabled and present. */
#define DO_BIC(COUNTER_NAME) (bic_enabled & bic_present & (COUNTER_NAME))
/* Mark a counter as present. */
#define BIC_PRESENT(COUNTER_BIT) (bic_present |= (COUNTER_BIT))

/*
 * bic_lookup
 * For every name in the comma-separated name_list, set the appropriate
 * bit in the return value: the name found at bic[i] contributes
 * (1ULL << i).
 *
 * name_list is modified in place (each ',' is overwritten with '\0').
 * A name that is not in bic[] is reported on stderr and the program
 * exits.  A NULL name_list yields 0.
 */
unsigned long long bic_lookup(char *name_list)
{
	unsigned long long mask = 0;
	char *name = name_list;

	while (name != NULL) {
		char *sep = strchr(name, ',');
		int idx = 0;

		/* terminate the current name so strcmp() sees only this token */
		if (sep != NULL)
			*sep = '\0';

		while (idx < MAX_BIC && strcmp(name, bic[idx].name) != 0)
			++idx;

		if (idx == MAX_BIC) {
			fprintf(stderr, "Invalid counter name: %s\n", name);
			exit(-1);
		}

		mask |= (1ULL << idx);

		name = (sep != NULL) ? sep + 1 : NULL;
	}

	return mask;
}
458

L
Len Brown 已提交
459
void print_header(void)
L
Len Brown 已提交
460
{
461 462
	struct msr_counter *mp;

463
	if (DO_BIC(BIC_Package))
464
		outp += sprintf(outp, "\tPackage");
465
	if (DO_BIC(BIC_Core))
466
		outp += sprintf(outp, "\tCore");
467
	if (DO_BIC(BIC_CPU))
468
		outp += sprintf(outp, "\tCPU");
469
	if (DO_BIC(BIC_Avg_MHz))
470
		outp += sprintf(outp, "\tAvg_MHz");
471
	if (DO_BIC(BIC_Busy))
472
		outp += sprintf(outp, "\tBusy%%");
473
	if (DO_BIC(BIC_Bzy_MHz))
474
		outp += sprintf(outp, "\tBzy_MHz");
475 476
	if (DO_BIC(BIC_TSC_MHz))
		outp += sprintf(outp, "\tTSC_MHz");
477 478 479 480

	if (!debug)
		goto done;

481
	if (DO_BIC(BIC_IRQ))
482
		outp += sprintf(outp, "\tIRQ");
483
	if (DO_BIC(BIC_SMI))
484
		outp += sprintf(outp, "\tSMI");
485

486
	if (DO_BIC(BIC_CPU_c1))
487
		outp += sprintf(outp, "\tCPU%%c1");
488

489 490 491 492 493 494 495 496 497 498 499
	for (mp = sys.tp; mp; mp = mp->next) {
		if (mp->format == FORMAT_RAW) {
			if (mp->width == 64)
				outp += sprintf(outp, "\t%18.18s", mp->name);
			else
				outp += sprintf(outp, "\t%10.10s", mp->name);
		} else {
			outp += sprintf(outp, "\t%-7.7s", mp->name);
		}
	}

500
	if (DO_BIC(BIC_CPU_c3) && !do_slm_cstates && !do_knl_cstates)
501
		outp += sprintf(outp, "\tCPU%%c3");
502
	if (DO_BIC(BIC_CPU_c6))
503
		outp += sprintf(outp, "\tCPU%%c6");
504
	if (DO_BIC(BIC_CPU_c7))
505 506 507
		outp += sprintf(outp, "\tCPU%%c7");


508
	if (DO_BIC(BIC_CoreTmp))
509
		outp += sprintf(outp, "\tCoreTmp");
510 511 512 513 514 515 516 517 518 519 520 521

	for (mp = sys.cp; mp; mp = mp->next) {
		if (mp->format == FORMAT_RAW) {
			if (mp->width == 64)
				outp += sprintf(outp, "\t%18.18s", mp->name);
			else
				outp += sprintf(outp, "\t%10.10s", mp->name);
		} else {
			outp += sprintf(outp, "\t%-7.7s", mp->name);
		}
	}

522
	if (DO_BIC(BIC_PkgTmp))
523
		outp += sprintf(outp, "\tPkgTmp");
524

525
	if (DO_BIC(BIC_GFX_rc6))
526
		outp += sprintf(outp, "\tGFX%%rc6");
L
Len Brown 已提交
527

528
	if (DO_BIC(BIC_GFXMHz))
529
		outp += sprintf(outp, "\tGFXMHz");
L
Len Brown 已提交
530

531
	if (do_skl_residency) {
532 533 534 535
		outp += sprintf(outp, "\tTotl%%C0");
		outp += sprintf(outp, "\tAny%%C0");
		outp += sprintf(outp, "\tGFX%%C0");
		outp += sprintf(outp, "\tCPUGFX%%");
536 537
	}

538
	if (do_pc2)
539
		outp += sprintf(outp, "\tPkg%%pc2");
540
	if (do_pc3)
541
		outp += sprintf(outp, "\tPkg%%pc3");
542
	if (do_pc6)
543
		outp += sprintf(outp, "\tPkg%%pc6");
544
	if (do_pc7)
545
		outp += sprintf(outp, "\tPkg%%pc7");
546
	if (do_c8_c9_c10) {
547 548 549
		outp += sprintf(outp, "\tPkg%%pc8");
		outp += sprintf(outp, "\tPkg%%pc9");
		outp += sprintf(outp, "\tPk%%pc10");
550
	}
L
Len Brown 已提交
551

552
	if (do_rapl && !rapl_joules) {
553
		if (DO_BIC(BIC_PkgWatt))
554
			outp += sprintf(outp, "\tPkgWatt");
555
		if (DO_BIC(BIC_CorWatt))
556
			outp += sprintf(outp, "\tCorWatt");
557
		if (DO_BIC(BIC_GFXWatt))
558
			outp += sprintf(outp, "\tGFXWatt");
559
		if (DO_BIC(BIC_RAMWatt))
560
			outp += sprintf(outp, "\tRAMWatt");
561
		if (DO_BIC(BIC_PKG__))
562
			outp += sprintf(outp, "\tPKG_%%");
563
		if (DO_BIC(BIC_RAM__))
564
			outp += sprintf(outp, "\tRAM_%%");
565
	} else if (do_rapl && rapl_joules) {
566
		if (DO_BIC(BIC_Pkg_J))
567
			outp += sprintf(outp, "\tPkg_J");
568
		if (DO_BIC(BIC_Cor_J))
569
			outp += sprintf(outp, "\tCor_J");
570
		if (DO_BIC(BIC_GFX_J))
571
			outp += sprintf(outp, "\tGFX_J");
572
		if (DO_BIC(BIC_RAM_J))
573
			outp += sprintf(outp, "\tRAM_J");
574
		if (DO_BIC(BIC_PKG__))
575
			outp += sprintf(outp, "\tPKG_%%");
576
		if (DO_BIC(BIC_RAM__))
577
			outp += sprintf(outp, "\tRAM_%%");
578
	}
579 580 581 582 583 584 585 586 587 588 589 590
	for (mp = sys.pp; mp; mp = mp->next) {
		if (mp->format == FORMAT_RAW) {
			if (mp->width == 64)
				outp += sprintf(outp, "\t%18.18s", mp->name);
			else
				outp += sprintf(outp, "\t%10.10s", mp->name);
		} else {
			outp += sprintf(outp, "\t%-7.7s", mp->name);
		}
	}

done:
591
	outp += sprintf(outp, "\n");
L
Len Brown 已提交
592 593
}

594 595
int dump_counters(struct thread_data *t, struct core_data *c,
	struct pkg_data *p)
L
Len Brown 已提交
596
{
597 598 599
	int i;
	struct msr_counter *mp;

600
	outp += sprintf(outp, "t %p, c %p, p %p\n", t, c, p);
601 602

	if (t) {
603 604 605 606 607 608
		outp += sprintf(outp, "CPU: %d flags 0x%x\n",
			t->cpu_id, t->flags);
		outp += sprintf(outp, "TSC: %016llX\n", t->tsc);
		outp += sprintf(outp, "aperf: %016llX\n", t->aperf);
		outp += sprintf(outp, "mperf: %016llX\n", t->mperf);
		outp += sprintf(outp, "c1: %016llX\n", t->c1);
609

610
		if (DO_BIC(BIC_IRQ))
611
			outp += sprintf(outp, "IRQ: %08X\n", t->irq_count);
612
		if (DO_BIC(BIC_SMI))
613
			outp += sprintf(outp, "SMI: %08X\n", t->smi_count);
614 615 616 617 618

		for (i = 0, mp = sys.tp; mp; i++, mp = mp->next) {
			outp += sprintf(outp, "tADDED [%d] msr0x%x: %08llX\n",
				i, mp->msr_num, t->counter[i]);
		}
619
	}
L
Len Brown 已提交
620

621
	if (c) {
622 623 624 625 626
		outp += sprintf(outp, "core: %d\n", c->core_id);
		outp += sprintf(outp, "c3: %016llX\n", c->c3);
		outp += sprintf(outp, "c6: %016llX\n", c->c6);
		outp += sprintf(outp, "c7: %016llX\n", c->c7);
		outp += sprintf(outp, "DTS: %dC\n", c->core_temp_c);
627 628 629 630 631

		for (i = 0, mp = sys.cp; mp; i++, mp = mp->next) {
			outp += sprintf(outp, "cADDED [%d] msr0x%x: %08llX\n",
				i, mp->msr_num, c->counter[i]);
		}
632
	}
L
Len Brown 已提交
633

634
	if (p) {
635
		outp += sprintf(outp, "package: %d\n", p->package_id);
636 637 638 639 640 641

		outp += sprintf(outp, "Weighted cores: %016llX\n", p->pkg_wtd_core_c0);
		outp += sprintf(outp, "Any cores: %016llX\n", p->pkg_any_core_c0);
		outp += sprintf(outp, "Any GFX: %016llX\n", p->pkg_any_gfxe_c0);
		outp += sprintf(outp, "CPU + GFX: %016llX\n", p->pkg_both_core_gfxe_c0);

642
		outp += sprintf(outp, "pc2: %016llX\n", p->pc2);
643 644 645 646 647 648
		if (do_pc3)
			outp += sprintf(outp, "pc3: %016llX\n", p->pc3);
		if (do_pc6)
			outp += sprintf(outp, "pc6: %016llX\n", p->pc6);
		if (do_pc7)
			outp += sprintf(outp, "pc7: %016llX\n", p->pc7);
649 650 651 652 653 654 655 656 657 658 659 660
		outp += sprintf(outp, "pc8: %016llX\n", p->pc8);
		outp += sprintf(outp, "pc9: %016llX\n", p->pc9);
		outp += sprintf(outp, "pc10: %016llX\n", p->pc10);
		outp += sprintf(outp, "Joules PKG: %0X\n", p->energy_pkg);
		outp += sprintf(outp, "Joules COR: %0X\n", p->energy_cores);
		outp += sprintf(outp, "Joules GFX: %0X\n", p->energy_gfx);
		outp += sprintf(outp, "Joules RAM: %0X\n", p->energy_dram);
		outp += sprintf(outp, "Throttle PKG: %0X\n",
			p->rapl_pkg_perf_status);
		outp += sprintf(outp, "Throttle RAM: %0X\n",
			p->rapl_dram_perf_status);
		outp += sprintf(outp, "PTM: %dC\n", p->pkg_temp_c);
661 662 663 664 665

		for (i = 0, mp = sys.pp; mp; i++, mp = mp->next) {
			outp += sprintf(outp, "pADDED [%d] msr0x%x: %08llX\n",
				i, mp->msr_num, p->counter[i]);
		}
666
	}
667 668 669

	outp += sprintf(outp, "\n");

670
	return 0;
L
Len Brown 已提交
671 672
}

L
Len Brown 已提交
673 674 675
/*
 * column formatting convention & formats
 */
676 677
int format_counters(struct thread_data *t, struct core_data *c,
	struct pkg_data *p)
L
Len Brown 已提交
678 679
{
	double interval_float;
680
	char *fmt8;
681 682
	int i;
	struct msr_counter *mp;
L
Len Brown 已提交
683

684 685 686 687 688 689 690 691
	 /* if showing only 1st thread in core and this isn't one, bail out */
	if (show_core_only && !(t->flags & CPU_IS_FIRST_THREAD_IN_CORE))
		return 0;

	 /* if showing only 1st thread in pkg and this isn't one, bail out */
	if (show_pkg_only && !(t->flags & CPU_IS_FIRST_CORE_IN_PACKAGE))
		return 0;

L
Len Brown 已提交
692 693
	interval_float = tv_delta.tv_sec + tv_delta.tv_usec/1000000.0;

694 695
	/* topo columns, print blanks on 1st (average) line */
	if (t == &average.threads) {
696
		if (DO_BIC(BIC_Package))
697
			outp += sprintf(outp, "\t-");
698
		if (DO_BIC(BIC_Core))
699
			outp += sprintf(outp, "\t-");
700
		if (DO_BIC(BIC_CPU))
701
			outp += sprintf(outp, "\t-");
L
Len Brown 已提交
702
	} else {
703
		if (DO_BIC(BIC_Package)) {
704
			if (p)
705
				outp += sprintf(outp, "\t%d", p->package_id);
706
			else
707
				outp += sprintf(outp, "\t-");
708
		}
709
		if (DO_BIC(BIC_Core)) {
710
			if (c)
711
				outp += sprintf(outp, "\t%d", c->core_id);
712
			else
713
				outp += sprintf(outp, "\t-");
714
		}
715
		if (DO_BIC(BIC_CPU))
716
			outp += sprintf(outp, "\t%d", t->cpu_id);
L
Len Brown 已提交
717
	}
718

719
	if (DO_BIC(BIC_Avg_MHz))
720
		outp += sprintf(outp, "\t%.0f",
721 722
			1.0 / units * t->aperf / interval_float);

723
	if (DO_BIC(BIC_Busy))
724
		outp += sprintf(outp, "\t%.2f", 100.0 * t->mperf/t->tsc/tsc_tweak);
L
Len Brown 已提交
725

726
	if (DO_BIC(BIC_Bzy_MHz)) {
727
		if (has_base_hz)
728
			outp += sprintf(outp, "\t%.0f", base_hz / units * t->aperf / t->mperf);
729
		else
730
			outp += sprintf(outp, "\t%.0f",
731 732
				1.0 * t->tsc / units * t->aperf / t->mperf / interval_float);
	}
L
Len Brown 已提交
733

734 735
	if (DO_BIC(BIC_TSC_MHz))
		outp += sprintf(outp, "\t%.0f", 1.0 * t->tsc/units/interval_float);
L
Len Brown 已提交
736

737 738 739
	if (!debug)
		goto done;

740
	/* IRQ */
741
	if (DO_BIC(BIC_IRQ))
742
		outp += sprintf(outp, "\t%d", t->irq_count);
743

744
	/* SMI */
745
	if (DO_BIC(BIC_SMI))
746
		outp += sprintf(outp, "\t%d", t->smi_count);
747

748
	/* C1 */
749
	if (DO_BIC(BIC_CPU_c1))
750
		outp += sprintf(outp, "\t%.2f", 100.0 * t->c1/t->tsc);
751

752
	/* Added counters */
753 754 755 756 757 758 759
	for (i = 0, mp = sys.tp; mp; i++, mp = mp->next) {
		if (mp->format == FORMAT_RAW) {
			if (mp->width == 32)
				outp += sprintf(outp, "\t0x%08lx", (unsigned long) t->counter[i]);
			else
				outp += sprintf(outp, "\t0x%016llx", t->counter[i]);
		} else if (mp->format == FORMAT_DELTA) {
760
			outp += sprintf(outp, "\t%lld", t->counter[i]);
761 762 763 764 765
		} else if (mp->format == FORMAT_PERCENT) {
			outp += sprintf(outp, "\t%.2f", 100.0 * t->counter[i]/t->tsc);
		}
	}

766 767 768 769
	/* print per-core data only for 1st thread in core */
	if (!(t->flags & CPU_IS_FIRST_THREAD_IN_CORE))
		goto done;

770
	if (DO_BIC(BIC_CPU_c3) && !do_slm_cstates && !do_knl_cstates)
771
		outp += sprintf(outp, "\t%.2f", 100.0 * c->c3/t->tsc);
772
	if (DO_BIC(BIC_CPU_c6))
773
		outp += sprintf(outp, "\t%.2f", 100.0 * c->c6/t->tsc);
774
	if (DO_BIC(BIC_CPU_c7))
775 776
		outp += sprintf(outp, "\t%.2f", 100.0 * c->c7/t->tsc);

777
	if (DO_BIC(BIC_CoreTmp))
778
		outp += sprintf(outp, "\t%d", c->core_temp_c);
779

780 781 782 783 784 785 786
	for (i = 0, mp = sys.cp; mp; i++, mp = mp->next) {
		if (mp->format == FORMAT_RAW) {
			if (mp->width == 32)
				outp += sprintf(outp, "\t0x%08lx", (unsigned long) c->counter[i]);
			else
				outp += sprintf(outp, "\t0x%016llx", c->counter[i]);
		} else if (mp->format == FORMAT_DELTA) {
787
			outp += sprintf(outp, "\t%lld", c->counter[i]);
788 789 790 791 792
		} else if (mp->format == FORMAT_PERCENT) {
			outp += sprintf(outp, "\t%.2f", 100.0 * c->counter[i]/t->tsc);
		}
	}

793 794 795 796
	/* print per-package data only for 1st core in package */
	if (!(t->flags & CPU_IS_FIRST_CORE_IN_PACKAGE))
		goto done;

797
	/* PkgTmp */
798
	if (DO_BIC(BIC_PkgTmp))
799
		outp += sprintf(outp, "\t%d", p->pkg_temp_c);
800

L
Len Brown 已提交
801
	/* GFXrc6 */
802
	if (DO_BIC(BIC_GFX_rc6)) {
803
		if (p->gfx_rc6_ms == -1) {	/* detect GFX counter reset */
804
			outp += sprintf(outp, "\t**.**");
805
		} else {
806
			outp += sprintf(outp, "\t%.2f",
807 808 809
				p->gfx_rc6_ms / 10.0 / interval_float);
		}
	}
L
Len Brown 已提交
810

L
Len Brown 已提交
811
	/* GFXMHz */
812
	if (DO_BIC(BIC_GFXMHz))
813
		outp += sprintf(outp, "\t%d", p->gfx_mhz);
L
Len Brown 已提交
814

815 816
	/* Totl%C0, Any%C0 GFX%C0 CPUGFX% */
	if (do_skl_residency) {
817 818 819 820
		outp += sprintf(outp, "\t%.2f", 100.0 * p->pkg_wtd_core_c0/t->tsc);
		outp += sprintf(outp, "\t%.2f", 100.0 * p->pkg_any_core_c0/t->tsc);
		outp += sprintf(outp, "\t%.2f", 100.0 * p->pkg_any_gfxe_c0/t->tsc);
		outp += sprintf(outp, "\t%.2f", 100.0 * p->pkg_both_core_gfxe_c0/t->tsc);
821 822
	}

823
	if (do_pc2)
824
		outp += sprintf(outp, "\t%.2f", 100.0 * p->pc2/t->tsc);
825
	if (do_pc3)
826
		outp += sprintf(outp, "\t%.2f", 100.0 * p->pc3/t->tsc);
827
	if (do_pc6)
828
		outp += sprintf(outp, "\t%.2f", 100.0 * p->pc6/t->tsc);
829
	if (do_pc7)
830
		outp += sprintf(outp, "\t%.2f", 100.0 * p->pc7/t->tsc);
831
	if (do_c8_c9_c10) {
832 833 834
		outp += sprintf(outp, "\t%.2f", 100.0 * p->pc8/t->tsc);
		outp += sprintf(outp, "\t%.2f", 100.0 * p->pc9/t->tsc);
		outp += sprintf(outp, "\t%.2f", 100.0 * p->pc10/t->tsc);
835
	}
836 837 838 839 840

	/*
 	 * If measurement interval exceeds minimum RAPL Joule Counter range,
 	 * indicate that results are suspect by printing "**" in fraction place.
 	 */
841
	if (interval_float < rapl_joule_counter_range)
842
		fmt8 = "\t%.2f";
843
	else
844
		fmt8 = "%6.0f**";
845

846 847 848 849 850 851 852 853 854 855 856 857 858 859 860 861 862 863 864 865 866
	if (DO_BIC(BIC_PkgWatt))
		outp += sprintf(outp, fmt8, p->energy_pkg * rapl_energy_units / interval_float);
	if (DO_BIC(BIC_CorWatt))
		outp += sprintf(outp, fmt8, p->energy_cores * rapl_energy_units / interval_float);
	if (DO_BIC(BIC_GFXWatt))
		outp += sprintf(outp, fmt8, p->energy_gfx * rapl_energy_units / interval_float);
	if (DO_BIC(BIC_RAMWatt))
		outp += sprintf(outp, fmt8, p->energy_dram * rapl_dram_energy_units / interval_float);
	if (DO_BIC(BIC_Pkg_J))
		outp += sprintf(outp, fmt8, p->energy_pkg * rapl_energy_units);
	if (DO_BIC(BIC_Cor_J))
		outp += sprintf(outp, fmt8, p->energy_cores * rapl_energy_units);
	if (DO_BIC(BIC_GFX_J))
		outp += sprintf(outp, fmt8, p->energy_gfx * rapl_energy_units);
	if (DO_BIC(BIC_RAM_J))
		outp += sprintf(outp, fmt8, p->energy_dram * rapl_dram_energy_units);
	if (DO_BIC(BIC_PKG__))
		outp += sprintf(outp, fmt8, 100.0 * p->rapl_pkg_perf_status * rapl_time_units / interval_float);
	if (DO_BIC(BIC_RAM__))
		outp += sprintf(outp, fmt8, 100.0 * p->rapl_dram_perf_status * rapl_time_units / interval_float);

867 868 869 870 871 872 873
	for (i = 0, mp = sys.pp; mp; i++, mp = mp->next) {
		if (mp->format == FORMAT_RAW) {
			if (mp->width == 32)
				outp += sprintf(outp, "\t0x%08lx", (unsigned long) p->counter[i]);
			else
				outp += sprintf(outp, "\t0x%016llx", p->counter[i]);
		} else if (mp->format == FORMAT_DELTA) {
874
			outp += sprintf(outp, "\t%lld", p->counter[i]);
875 876 877 878 879
		} else if (mp->format == FORMAT_PERCENT) {
			outp += sprintf(outp, "\t%.2f", 100.0 * p->counter[i]/t->tsc);
		}
	}

880 881 882 883
done:
	outp += sprintf(outp, "\n");

	return 0;
L
Len Brown 已提交
884 885
}

886
void flush_output_stdout(void)
887
{
888 889 890 891 892 893 894 895 896 897
	FILE *filep;

	if (outf == stderr)
		filep = stdout;
	else
		filep = outf;

	fputs(output_buffer, filep);
	fflush(filep);

898 899
	outp = output_buffer;
}
900
void flush_output_stderr(void)
901
{
902 903
	fputs(output_buffer, outf);
	fflush(outf);
904 905 906
	outp = output_buffer;
}
void format_all_counters(struct thread_data *t, struct core_data *c, struct pkg_data *p)
L
Len Brown 已提交
907
{
L
Len Brown 已提交
908
	static int printed;
L
Len Brown 已提交
909

L
Len Brown 已提交
910 911
	if (!printed || !summary_only)
		print_header();
L
Len Brown 已提交
912

913 914 915
	if (topo.num_cpus > 1)
		format_counters(&average.threads, &average.cores,
			&average.packages);
L
Len Brown 已提交
916

L
Len Brown 已提交
917 918 919 920 921
	printed = 1;

	if (summary_only)
		return;

922
	for_all_cpus(format_counters, t, c, p);
L
Len Brown 已提交
923 924
}

925 926 927 928 929 930 931
/*
 * DELTA_WRAP32(new, old): old = new - old, for a counter that wraps at 2^32.
 *
 * If the counter went backwards, one 32-bit wrap is assumed and 2^32 is
 * added to the difference.  Equal samples yield a delta of 0.
 *
 * Wrapped in do { } while (0) so it behaves as a single statement, e.g.
 * in an unbraced if/else.  Both arguments are evaluated more than once,
 * so they must be free of side effects; 'old' must be an lvalue.
 */
#define DELTA_WRAP32(new, old)					\
	do {							\
		if ((new) >= (old))				\
			(old) = (new) - (old);			\
		else						\
			(old) = 0x100000000ULL + (new) - (old);	\
	} while (0)

932
int
933 934
delta_package(struct pkg_data *new, struct pkg_data *old)
{
935 936
	int i;
	struct msr_counter *mp;
937 938 939 940 941 942 943

	if (do_skl_residency) {
		old->pkg_wtd_core_c0 = new->pkg_wtd_core_c0 - old->pkg_wtd_core_c0;
		old->pkg_any_core_c0 = new->pkg_any_core_c0 - old->pkg_any_core_c0;
		old->pkg_any_gfxe_c0 = new->pkg_any_gfxe_c0 - old->pkg_any_gfxe_c0;
		old->pkg_both_core_gfxe_c0 = new->pkg_both_core_gfxe_c0 - old->pkg_both_core_gfxe_c0;
	}
944
	old->pc2 = new->pc2 - old->pc2;
945 946 947 948 949 950
	if (do_pc3)
		old->pc3 = new->pc3 - old->pc3;
	if (do_pc6)
		old->pc6 = new->pc6 - old->pc6;
	if (do_pc7)
		old->pc7 = new->pc7 - old->pc7;
951 952 953
	old->pc8 = new->pc8 - old->pc8;
	old->pc9 = new->pc9 - old->pc9;
	old->pc10 = new->pc10 - old->pc10;
954 955
	old->pkg_temp_c = new->pkg_temp_c;

956 957 958 959 960 961
	/* flag an error when rc6 counter resets/wraps */
	if (old->gfx_rc6_ms >  new->gfx_rc6_ms)
		old->gfx_rc6_ms = -1;
	else
		old->gfx_rc6_ms = new->gfx_rc6_ms - old->gfx_rc6_ms;

L
Len Brown 已提交
962 963
	old->gfx_mhz = new->gfx_mhz;

964 965 966 967 968 969
	DELTA_WRAP32(new->energy_pkg, old->energy_pkg);
	DELTA_WRAP32(new->energy_cores, old->energy_cores);
	DELTA_WRAP32(new->energy_gfx, old->energy_gfx);
	DELTA_WRAP32(new->energy_dram, old->energy_dram);
	DELTA_WRAP32(new->rapl_pkg_perf_status, old->rapl_pkg_perf_status);
	DELTA_WRAP32(new->rapl_dram_perf_status, old->rapl_dram_perf_status);
970

971 972 973 974 975 976 977
	for (i = 0, mp = sys.pp; mp; i++, mp = mp->next) {
		if (mp->format == FORMAT_RAW)
			old->counter[i] = new->counter[i];
		else
			old->counter[i] = new->counter[i] - old->counter[i];
	}

978
	return 0;
979
}
L
Len Brown 已提交
980

981 982
void
delta_core(struct core_data *new, struct core_data *old)
L
Len Brown 已提交
983
{
984 985 986
	int i;
	struct msr_counter *mp;

987 988 989
	old->c3 = new->c3 - old->c3;
	old->c6 = new->c6 - old->c6;
	old->c7 = new->c7 - old->c7;
990
	old->core_temp_c = new->core_temp_c;
991 992 993 994 995 996 997

	for (i = 0, mp = sys.cp; mp; i++, mp = mp->next) {
		if (mp->format == FORMAT_RAW)
			old->counter[i] = new->counter[i];
		else
			old->counter[i] = new->counter[i] - old->counter[i];
	}
998
}
L
Len Brown 已提交
999

1000 1001 1002
/*
 * old = new - old
 */
1003
int
1004 1005 1006
delta_thread(struct thread_data *new, struct thread_data *old,
	struct core_data *core_delta)
{
1007 1008 1009
	int i;
	struct msr_counter *mp;

1010 1011 1012
	old->tsc = new->tsc - old->tsc;

	/* check for TSC < 1 Mcycles over interval */
1013 1014 1015 1016
	if (old->tsc < (1000 * 1000))
		errx(-3, "Insanely slow TSC rate, TSC stops in idle?\n"
		     "You can disable all c-states by booting with \"idle=poll\"\n"
		     "or just the deep ones with \"processor.max_cstate=1\"");
L
Len Brown 已提交
1017

1018
	old->c1 = new->c1 - old->c1;
L
Len Brown 已提交
1019

1020
	if (DO_BIC(BIC_Avg_MHz) || DO_BIC(BIC_Busy) || DO_BIC(BIC_Bzy_MHz)) {
1021 1022 1023 1024
		if ((new->aperf > old->aperf) && (new->mperf > old->mperf)) {
			old->aperf = new->aperf - old->aperf;
			old->mperf = new->mperf - old->mperf;
		} else {
1025
			return -1;
L
Len Brown 已提交
1026
		}
1027
	}
L
Len Brown 已提交
1028 1029


1030 1031 1032 1033 1034 1035 1036 1037 1038 1039 1040 1041 1042 1043 1044 1045
	if (use_c1_residency_msr) {
		/*
		 * Some models have a dedicated C1 residency MSR,
		 * which should be more accurate than the derivation below.
		 */
	} else {
		/*
		 * As counter collection is not atomic,
		 * it is possible for mperf's non-halted cycles + idle states
		 * to exceed TSC's all cycles: show c1 = 0% in that case.
		 */
		if ((old->mperf + core_delta->c3 + core_delta->c6 + core_delta->c7) > old->tsc)
			old->c1 = 0;
		else {
			/* normal case, derive c1 */
			old->c1 = old->tsc - old->mperf - core_delta->c3
1046
				- core_delta->c6 - core_delta->c7;
1047
		}
1048
	}
1049

1050
	if (old->mperf == 0) {
1051 1052
		if (debug > 1)
			fprintf(outf, "cpu%d MPERF 0!\n", old->cpu_id);
1053
		old->mperf = 1;	/* divide by 0 protection */
L
Len Brown 已提交
1054
	}
1055

1056
	if (DO_BIC(BIC_IRQ))
1057 1058
		old->irq_count = new->irq_count - old->irq_count;

1059
	if (DO_BIC(BIC_SMI))
1060
		old->smi_count = new->smi_count - old->smi_count;
1061

1062 1063 1064 1065 1066 1067
	for (i = 0, mp = sys.tp; mp; i++, mp = mp->next) {
		if (mp->format == FORMAT_RAW)
			old->counter[i] = new->counter[i];
		else
			old->counter[i] = new->counter[i] - old->counter[i];
	}
1068
	return 0;
1069 1070 1071 1072 1073 1074
}

int delta_cpu(struct thread_data *t, struct core_data *c,
	struct pkg_data *p, struct thread_data *t2,
	struct core_data *c2, struct pkg_data *p2)
{
1075 1076
	int retval = 0;

1077 1078 1079 1080 1081
	/* calculate core delta only for 1st thread in core */
	if (t->flags & CPU_IS_FIRST_THREAD_IN_CORE)
		delta_core(c, c2);

	/* always calculate thread delta */
1082 1083 1084
	retval = delta_thread(t, t2, c2);	/* c2 is core delta */
	if (retval)
		return retval;
1085 1086 1087

	/* calculate package delta only for 1st core in package */
	if (t->flags & CPU_IS_FIRST_CORE_IN_PACKAGE)
1088
		retval = delta_package(p, p2);
1089

1090
	return retval;
L
Len Brown 已提交
1091 1092
}

1093 1094
void clear_counters(struct thread_data *t, struct core_data *c, struct pkg_data *p)
{
1095 1096 1097
	int i;
	struct msr_counter  *mp;

1098 1099 1100 1101 1102
	t->tsc = 0;
	t->aperf = 0;
	t->mperf = 0;
	t->c1 = 0;

1103 1104 1105
	t->irq_count = 0;
	t->smi_count = 0;

1106 1107 1108 1109 1110 1111
	/* tells format_counters to dump all fields from this set */
	t->flags = CPU_IS_FIRST_THREAD_IN_CORE | CPU_IS_FIRST_CORE_IN_PACKAGE;

	c->c3 = 0;
	c->c6 = 0;
	c->c7 = 0;
1112
	c->core_temp_c = 0;
1113

1114 1115 1116 1117 1118
	p->pkg_wtd_core_c0 = 0;
	p->pkg_any_core_c0 = 0;
	p->pkg_any_gfxe_c0 = 0;
	p->pkg_both_core_gfxe_c0 = 0;

1119
	p->pc2 = 0;
1120 1121 1122 1123 1124 1125
	if (do_pc3)
		p->pc3 = 0;
	if (do_pc6)
		p->pc6 = 0;
	if (do_pc7)
		p->pc7 = 0;
1126 1127 1128
	p->pc8 = 0;
	p->pc9 = 0;
	p->pc10 = 0;
1129 1130 1131 1132 1133 1134 1135 1136

	p->energy_pkg = 0;
	p->energy_dram = 0;
	p->energy_cores = 0;
	p->energy_gfx = 0;
	p->rapl_pkg_perf_status = 0;
	p->rapl_dram_perf_status = 0;
	p->pkg_temp_c = 0;
L
Len Brown 已提交
1137

L
Len Brown 已提交
1138
	p->gfx_rc6_ms = 0;
L
Len Brown 已提交
1139
	p->gfx_mhz = 0;
1140 1141 1142 1143 1144 1145 1146 1147
	for (i = 0, mp = sys.tp; mp; i++, mp = mp->next)
		t->counter[i] = 0;

	for (i = 0, mp = sys.cp; mp; i++, mp = mp->next)
		c->counter[i] = 0;

	for (i = 0, mp = sys.pp; mp; i++, mp = mp->next)
		p->counter[i] = 0;
1148 1149 1150
}
int sum_counters(struct thread_data *t, struct core_data *c,
	struct pkg_data *p)
L
Len Brown 已提交
1151
{
1152 1153 1154
	int i;
	struct msr_counter *mp;

1155 1156 1157 1158
	average.threads.tsc += t->tsc;
	average.threads.aperf += t->aperf;
	average.threads.mperf += t->mperf;
	average.threads.c1 += t->c1;
L
Len Brown 已提交
1159

1160 1161 1162
	average.threads.irq_count += t->irq_count;
	average.threads.smi_count += t->smi_count;

1163 1164 1165 1166 1167 1168
	for (i = 0, mp = sys.tp; mp; i++, mp = mp->next) {
		if (mp->format == FORMAT_RAW)
			continue;
		average.threads.counter[i] += t->counter[i];
	}

1169 1170 1171
	/* sum per-core values only for 1st thread in core */
	if (!(t->flags & CPU_IS_FIRST_THREAD_IN_CORE))
		return 0;
L
Len Brown 已提交
1172

1173 1174 1175 1176
	average.cores.c3 += c->c3;
	average.cores.c6 += c->c6;
	average.cores.c7 += c->c7;

1177 1178
	average.cores.core_temp_c = MAX(average.cores.core_temp_c, c->core_temp_c);

1179 1180 1181 1182 1183 1184
	for (i = 0, mp = sys.cp; mp; i++, mp = mp->next) {
		if (mp->format == FORMAT_RAW)
			continue;
		average.cores.counter[i] += c->counter[i];
	}

1185 1186 1187 1188
	/* sum per-pkg values only for 1st core in pkg */
	if (!(t->flags & CPU_IS_FIRST_CORE_IN_PACKAGE))
		return 0;

1189 1190 1191 1192 1193 1194 1195
	if (do_skl_residency) {
		average.packages.pkg_wtd_core_c0 += p->pkg_wtd_core_c0;
		average.packages.pkg_any_core_c0 += p->pkg_any_core_c0;
		average.packages.pkg_any_gfxe_c0 += p->pkg_any_gfxe_c0;
		average.packages.pkg_both_core_gfxe_c0 += p->pkg_both_core_gfxe_c0;
	}

1196
	average.packages.pc2 += p->pc2;
1197 1198 1199 1200 1201 1202
	if (do_pc3)
		average.packages.pc3 += p->pc3;
	if (do_pc6)
		average.packages.pc6 += p->pc6;
	if (do_pc7)
		average.packages.pc7 += p->pc7;
1203 1204 1205
	average.packages.pc8 += p->pc8;
	average.packages.pc9 += p->pc9;
	average.packages.pc10 += p->pc10;
1206

1207 1208 1209 1210 1211
	average.packages.energy_pkg += p->energy_pkg;
	average.packages.energy_dram += p->energy_dram;
	average.packages.energy_cores += p->energy_cores;
	average.packages.energy_gfx += p->energy_gfx;

L
Len Brown 已提交
1212
	average.packages.gfx_rc6_ms = p->gfx_rc6_ms;
L
Len Brown 已提交
1213 1214
	average.packages.gfx_mhz = p->gfx_mhz;

1215 1216 1217 1218
	average.packages.pkg_temp_c = MAX(average.packages.pkg_temp_c, p->pkg_temp_c);

	average.packages.rapl_pkg_perf_status += p->rapl_pkg_perf_status;
	average.packages.rapl_dram_perf_status += p->rapl_dram_perf_status;
1219 1220 1221 1222 1223 1224

	for (i = 0, mp = sys.pp; mp; i++, mp = mp->next) {
		if (mp->format == FORMAT_RAW)
			continue;
		average.packages.counter[i] += p->counter[i];
	}
1225 1226 1227 1228 1229 1230 1231 1232 1233
	return 0;
}
/*
 * sum the counters for all cpus in the system
 * compute the weighted average
 */
void compute_average(struct thread_data *t, struct core_data *c,
	struct pkg_data *p)
{
1234 1235 1236
	int i;
	struct msr_counter *mp;

1237 1238 1239 1240 1241 1242 1243 1244 1245 1246 1247 1248 1249
	clear_counters(&average.threads, &average.cores, &average.packages);

	for_all_cpus(sum_counters, t, c, p);

	average.threads.tsc /= topo.num_cpus;
	average.threads.aperf /= topo.num_cpus;
	average.threads.mperf /= topo.num_cpus;
	average.threads.c1 /= topo.num_cpus;

	average.cores.c3 /= topo.num_cores;
	average.cores.c6 /= topo.num_cores;
	average.cores.c7 /= topo.num_cores;

1250 1251 1252 1253 1254 1255 1256
	if (do_skl_residency) {
		average.packages.pkg_wtd_core_c0 /= topo.num_packages;
		average.packages.pkg_any_core_c0 /= topo.num_packages;
		average.packages.pkg_any_gfxe_c0 /= topo.num_packages;
		average.packages.pkg_both_core_gfxe_c0 /= topo.num_packages;
	}

1257
	average.packages.pc2 /= topo.num_packages;
1258 1259 1260 1261 1262 1263
	if (do_pc3)
		average.packages.pc3 /= topo.num_packages;
	if (do_pc6)
		average.packages.pc6 /= topo.num_packages;
	if (do_pc7)
		average.packages.pc7 /= topo.num_packages;
1264 1265 1266 1267

	average.packages.pc8 /= topo.num_packages;
	average.packages.pc9 /= topo.num_packages;
	average.packages.pc10 /= topo.num_packages;
1268 1269 1270 1271 1272 1273 1274 1275 1276 1277 1278 1279 1280 1281 1282 1283

	for (i = 0, mp = sys.tp; mp; i++, mp = mp->next) {
		if (mp->format == FORMAT_RAW)
			continue;
		average.threads.counter[i] /= topo.num_cpus;
	}
	for (i = 0, mp = sys.cp; mp; i++, mp = mp->next) {
		if (mp->format == FORMAT_RAW)
			continue;
		average.cores.counter[i] /= topo.num_cores;
	}
	for (i = 0, mp = sys.pp; mp; i++, mp = mp->next) {
		if (mp->format == FORMAT_RAW)
			continue;
		average.packages.counter[i] /= topo.num_packages;
	}
L
Len Brown 已提交
1284 1285
}

1286
/*
 * Execute the x86 RDTSC instruction and return the 64-bit result,
 * assembled from the low half in EAX and the high half in EDX.
 */
static unsigned long long rdtsc(void)
{
	unsigned int low, high;

	/* __asm__ spelling also compiles in strict ISO C modes */
	__asm__ volatile("rdtsc" : "=a" (low), "=d" (high));

	return low | (((unsigned long long)high) << 32);
}
1294

1295 1296 1297 1298 1299 1300 1301 1302
/*
 * get_counters(...)
 * migrate to cpu
 * acquire and record local counters for that cpu
 */
int get_counters(struct thread_data *t, struct core_data *c, struct pkg_data *p)
{
	int cpu = t->cpu_id;
1303
	unsigned long long msr;
1304
	int aperf_mperf_retry_count = 0;
1305 1306
	struct msr_counter *mp;
	int i;
1307

1308
	if (cpu_migrate(cpu)) {
1309
		fprintf(outf, "Could not migrate to CPU %d\n", cpu);
1310
		return -1;
1311
	}
1312

1313
retry:
1314 1315
	t->tsc = rdtsc();	/* we are running on local CPU of interest */

1316
	if (DO_BIC(BIC_Avg_MHz) || DO_BIC(BIC_Busy) || DO_BIC(BIC_Bzy_MHz)) {
1317 1318 1319 1320 1321 1322 1323 1324 1325 1326 1327 1328 1329 1330 1331 1332 1333 1334 1335 1336 1337 1338 1339 1340
		unsigned long long tsc_before, tsc_between, tsc_after, aperf_time, mperf_time;

		/*
		 * The TSC, APERF and MPERF must be read together for
		 * APERF/MPERF and MPERF/TSC to give accurate results.
		 *
		 * Unfortunately, APERF and MPERF are read by
		 * individual system call, so delays may occur
		 * between them.  If the time to read them
		 * varies by a large amount, we re-read them.
		 */

		/*
		 * This initial dummy APERF read has been seen to
		 * reduce jitter in the subsequent reads.
		 */

		if (get_msr(cpu, MSR_IA32_APERF, &t->aperf))
			return -3;

		t->tsc = rdtsc();	/* re-read close to APERF */

		tsc_before = t->tsc;

1341
		if (get_msr(cpu, MSR_IA32_APERF, &t->aperf))
1342
			return -3;
1343 1344 1345

		tsc_between = rdtsc();

1346
		if (get_msr(cpu, MSR_IA32_MPERF, &t->mperf))
1347
			return -4;
1348 1349 1350 1351 1352 1353 1354 1355 1356 1357 1358 1359 1360 1361 1362 1363 1364 1365 1366 1367

		tsc_after = rdtsc();

		aperf_time = tsc_between - tsc_before;
		mperf_time = tsc_after - tsc_between;

		/*
		 * If the system call latency to read APERF and MPERF
		 * differ by more than 2x, then try again.
		 */
		if ((aperf_time > (2 * mperf_time)) || (mperf_time > (2 * aperf_time))) {
			aperf_mperf_retry_count++;
			if (aperf_mperf_retry_count < 5)
				goto retry;
			else
				warnx("cpu%d jitter %lld %lld",
					cpu, aperf_time, mperf_time);
		}
		aperf_mperf_retry_count = 0;

1368 1369
		t->aperf = t->aperf * aperf_mperf_multiplier;
		t->mperf = t->mperf * aperf_mperf_multiplier;
1370 1371
	}

1372
	if (DO_BIC(BIC_IRQ))
1373
		t->irq_count = irqs_per_cpu[cpu];
1374
	if (DO_BIC(BIC_SMI)) {
1375 1376 1377 1378
		if (get_msr(cpu, MSR_SMI_COUNT, &msr))
			return -5;
		t->smi_count = msr & 0xFFFFFFFF;
	}
1379

1380 1381 1382 1383 1384
	if (use_c1_residency_msr) {
		if (get_msr(cpu, MSR_CORE_C1_RES, &t->c1))
			return -6;
	}

1385 1386 1387 1388 1389 1390
	for (i = 0, mp = sys.tp; mp; i++, mp = mp->next) {
		if (get_msr(cpu, mp->msr_num, &t->counter[i]))
			return -10;
	}


1391 1392 1393 1394
	/* collect core counters only for 1st thread in core */
	if (!(t->flags & CPU_IS_FIRST_THREAD_IN_CORE))
		return 0;

1395
	if (DO_BIC(BIC_CPU_c3) && !do_slm_cstates && !do_knl_cstates) {
1396 1397
		if (get_msr(cpu, MSR_CORE_C3_RESIDENCY, &c->c3))
			return -6;
1398 1399
	}

1400
	if (DO_BIC(BIC_CPU_c6) && !do_knl_cstates) {
1401 1402
		if (get_msr(cpu, MSR_CORE_C6_RESIDENCY, &c->c6))
			return -7;
1403 1404 1405
	} else if (do_knl_cstates) {
		if (get_msr(cpu, MSR_KNL_CORE_C6_RESIDENCY, &c->c6))
			return -7;
1406 1407
	}

1408
	if (DO_BIC(BIC_CPU_c7))
1409 1410 1411
		if (get_msr(cpu, MSR_CORE_C7_RESIDENCY, &c->c7))
			return -8;

1412
	if (DO_BIC(BIC_CoreTmp)) {
1413 1414 1415 1416 1417
		if (get_msr(cpu, MSR_IA32_THERM_STATUS, &msr))
			return -9;
		c->core_temp_c = tcc_activation_temp - ((msr >> 16) & 0x7F);
	}

1418 1419 1420 1421
	for (i = 0, mp = sys.cp; mp; i++, mp = mp->next) {
		if (get_msr(cpu, mp->msr_num, &c->counter[i]))
			return -10;
	}
1422

1423 1424 1425 1426
	/* collect package counters only for 1st core in package */
	if (!(t->flags & CPU_IS_FIRST_CORE_IN_PACKAGE))
		return 0;

1427 1428 1429 1430 1431 1432 1433 1434 1435 1436
	if (do_skl_residency) {
		if (get_msr(cpu, MSR_PKG_WEIGHTED_CORE_C0_RES, &p->pkg_wtd_core_c0))
			return -10;
		if (get_msr(cpu, MSR_PKG_ANY_CORE_C0_RES, &p->pkg_any_core_c0))
			return -11;
		if (get_msr(cpu, MSR_PKG_ANY_GFXE_C0_RES, &p->pkg_any_gfxe_c0))
			return -12;
		if (get_msr(cpu, MSR_PKG_BOTH_CORE_GFXE_C0_RES, &p->pkg_both_core_gfxe_c0))
			return -13;
	}
1437
	if (do_pc3)
1438 1439
		if (get_msr(cpu, MSR_PKG_C3_RESIDENCY, &p->pc3))
			return -9;
1440
	if (do_pc6)
1441 1442
		if (get_msr(cpu, MSR_PKG_C6_RESIDENCY, &p->pc6))
			return -10;
1443
	if (do_pc2)
1444 1445
		if (get_msr(cpu, MSR_PKG_C2_RESIDENCY, &p->pc2))
			return -11;
1446
	if (do_pc7)
1447 1448
		if (get_msr(cpu, MSR_PKG_C7_RESIDENCY, &p->pc7))
			return -12;
1449 1450 1451 1452 1453 1454 1455 1456
	if (do_c8_c9_c10) {
		if (get_msr(cpu, MSR_PKG_C8_RESIDENCY, &p->pc8))
			return -13;
		if (get_msr(cpu, MSR_PKG_C9_RESIDENCY, &p->pc9))
			return -13;
		if (get_msr(cpu, MSR_PKG_C10_RESIDENCY, &p->pc10))
			return -13;
	}
1457 1458 1459 1460 1461
	if (do_rapl & RAPL_PKG) {
		if (get_msr(cpu, MSR_PKG_ENERGY_STATUS, &msr))
			return -13;
		p->energy_pkg = msr & 0xFFFFFFFF;
	}
1462
	if (do_rapl & RAPL_CORES_ENERGY_STATUS) {
1463 1464 1465 1466 1467 1468 1469 1470 1471 1472 1473 1474 1475 1476 1477 1478 1479 1480 1481 1482 1483 1484 1485 1486
		if (get_msr(cpu, MSR_PP0_ENERGY_STATUS, &msr))
			return -14;
		p->energy_cores = msr & 0xFFFFFFFF;
	}
	if (do_rapl & RAPL_DRAM) {
		if (get_msr(cpu, MSR_DRAM_ENERGY_STATUS, &msr))
			return -15;
		p->energy_dram = msr & 0xFFFFFFFF;
	}
	if (do_rapl & RAPL_GFX) {
		if (get_msr(cpu, MSR_PP1_ENERGY_STATUS, &msr))
			return -16;
		p->energy_gfx = msr & 0xFFFFFFFF;
	}
	if (do_rapl & RAPL_PKG_PERF_STATUS) {
		if (get_msr(cpu, MSR_PKG_PERF_STATUS, &msr))
			return -16;
		p->rapl_pkg_perf_status = msr & 0xFFFFFFFF;
	}
	if (do_rapl & RAPL_DRAM_PERF_STATUS) {
		if (get_msr(cpu, MSR_DRAM_PERF_STATUS, &msr))
			return -16;
		p->rapl_dram_perf_status = msr & 0xFFFFFFFF;
	}
1487
	if (DO_BIC(BIC_PkgTmp)) {
1488 1489 1490 1491
		if (get_msr(cpu, MSR_IA32_PACKAGE_THERM_STATUS, &msr))
			return -17;
		p->pkg_temp_c = tcc_activation_temp - ((msr >> 16) & 0x7F);
	}
L
Len Brown 已提交
1492

1493
	if (DO_BIC(BIC_GFX_rc6))
L
Len Brown 已提交
1494 1495
		p->gfx_rc6_ms = gfx_cur_rc6_ms;

1496
	if (DO_BIC(BIC_GFXMHz))
L
Len Brown 已提交
1497 1498
		p->gfx_mhz = gfx_cur_mhz;

1499 1500 1501 1502 1503
	for (i = 0, mp = sys.pp; mp; i++, mp = mp->next) {
		if (get_msr(cpu, mp->msr_num, &p->counter[i]))
			return -10;
	}

1504
	return 0;
L
Len Brown 已提交
1505 1506
}

1507 1508 1509 1510 1511 1512 1513 1514 1515 1516 1517 1518 1519 1520 1521 1522 1523 1524
/*
 * MSR_PKG_CST_CONFIG_CONTROL decoding for pkg_cstate_limit:
 * If you change the values, note they are used both in comparisons
 * (>= PCL__7) and to index pkg_cstate_limit_strings[].
 */

#define PCLUKN 0 /* Unknown */
#define PCLRSV 1 /* Reserved */
#define PCL__0 2 /* PC0 */
#define PCL__1 3 /* PC1 */
#define PCL__2 4 /* PC2 */
#define PCL__3 5 /* PC3 */
#define PCL__4 6 /* PC4 */
#define PCL__6 7 /* PC6 */
#define PCL_6N 8 /* PC6 No Retention */
#define PCL_6R 9 /* PC6 Retention */
#define PCL__7 10 /* PC7 */
#define PCL_7S 11 /* PC7 Shrink */
#define PCL__8 12 /* PC8 */
#define PCL__9 13 /* PC9 */
#define PCLUNL 14 /* Unlimited */

int pkg_cstate_limit = PCLUKN;

/* Indexed by the PCL* values above, so the order must match them exactly. */
char *pkg_cstate_limit_strings[] = { "unknown", "reserved", "pc0", "pc1", "pc2",
	"pc3", "pc4", "pc6", "pc6n", "pc6r", "pc7", "pc7s", "pc8", "pc9", "unlimited"};

/* Per-family tables with 16 entries each, holding PCL* codes. */
int nhm_pkg_cstate_limits[16] = {PCL__0, PCL__1, PCL__3, PCL__6, PCL__7, PCLRSV, PCLRSV, PCLUNL, PCLRSV, PCLRSV, PCLRSV, PCLRSV, PCLRSV, PCLRSV, PCLRSV, PCLRSV};
int snb_pkg_cstate_limits[16] = {PCL__0, PCL__2, PCL_6N, PCL_6R, PCL__7, PCL_7S, PCLRSV, PCLUNL, PCLRSV, PCLRSV, PCLRSV, PCLRSV, PCLRSV, PCLRSV, PCLRSV, PCLRSV};
int hsw_pkg_cstate_limits[16] = {PCL__0, PCL__2, PCL__3, PCL__6, PCL__7, PCL_7S, PCL__8, PCL__9, PCLUNL, PCLRSV, PCLRSV, PCLRSV, PCLRSV, PCLRSV, PCLRSV, PCLRSV};
int slv_pkg_cstate_limits[16] = {PCL__0, PCL__1, PCLRSV, PCLRSV, PCL__4, PCLRSV, PCL__6, PCL__7, PCLRSV, PCLRSV, PCLRSV, PCLRSV, PCLRSV, PCLRSV, PCLRSV, PCLRSV};
int amt_pkg_cstate_limits[16] = {PCLUNL, PCL__1, PCL__2, PCLRSV, PCLRSV, PCLRSV, PCL__6, PCL__7, PCLRSV, PCLRSV, PCLRSV, PCLRSV, PCLRSV, PCLRSV, PCLRSV, PCLRSV};
int phi_pkg_cstate_limits[16] = {PCL__0, PCL__2, PCL_6N, PCL_6R, PCLRSV, PCLRSV, PCLRSV, PCLUNL, PCLRSV, PCLRSV, PCLRSV, PCLRSV, PCLRSV, PCLRSV, PCLRSV, PCLRSV};
int bxt_pkg_cstate_limits[16] = {PCL__0, PCL__2, PCLUNL, PCLRSV, PCLRSV, PCLRSV, PCLRSV, PCLRSV, PCLRSV, PCLRSV, PCLRSV, PCLRSV, PCLRSV, PCLRSV, PCLRSV, PCLRSV};
int skx_pkg_cstate_limits[16] = {PCL__0, PCL__2, PCL_6N, PCL_6R, PCLRSV, PCLRSV, PCLRSV, PCLRSV, PCLUNL, PCLRSV, PCLRSV, PCLRSV, PCLRSV, PCLRSV, PCLRSV, PCLRSV};
1541

1542 1543 1544 1545 1546 1547 1548

/*
 * Set tsc_tweak to the ratio base_hz / tsc_hz.
 */
static void
calculate_tsc_tweak(void)
{
	tsc_tweak = base_hz / tsc_hz;
}

1549 1550
static void
dump_nhm_platform_info(void)
L
Len Brown 已提交
1551 1552 1553 1554
{
	unsigned long long msr;
	unsigned int ratio;

1555
	get_msr(base_cpu, MSR_PLATFORM_INFO, &msr);
L
Len Brown 已提交
1556

1557
	fprintf(outf, "cpu%d: MSR_PLATFORM_INFO: 0x%08llx\n", base_cpu, msr);
1558

L
Len Brown 已提交
1559
	ratio = (msr >> 40) & 0xFF;
1560
	fprintf(outf, "%d * %.0f = %.0f MHz max efficiency frequency\n",
L
Len Brown 已提交
1561 1562 1563
		ratio, bclk, ratio * bclk);

	ratio = (msr >> 8) & 0xFF;
1564
	fprintf(outf, "%d * %.0f = %.0f MHz base frequency\n",
L
Len Brown 已提交
1565 1566
		ratio, bclk, ratio * bclk);

1567
	get_msr(base_cpu, MSR_IA32_POWER_CTL, &msr);
1568
	fprintf(outf, "cpu%d: MSR_IA32_POWER_CTL: 0x%08llx (C1E auto-promotion: %sabled)\n",
1569
		base_cpu, msr, msr & 0x2 ? "EN" : "DIS");
1570

1571 1572 1573 1574 1575 1576 1577 1578 1579
	return;
}

static void
dump_hsw_turbo_ratio_limits(void)
{
	unsigned long long msr;
	unsigned int ratio;

1580
	get_msr(base_cpu, MSR_TURBO_RATIO_LIMIT2, &msr);
1581

1582
	fprintf(outf, "cpu%d: MSR_TURBO_RATIO_LIMIT2: 0x%08llx\n", base_cpu, msr);
1583 1584 1585

	ratio = (msr >> 8) & 0xFF;
	if (ratio)
1586
		fprintf(outf, "%d * %.0f = %.0f MHz max turbo 18 active cores\n",
1587 1588 1589 1590
			ratio, bclk, ratio * bclk);

	ratio = (msr >> 0) & 0xFF;
	if (ratio)
1591
		fprintf(outf, "%d * %.0f = %.0f MHz max turbo 17 active cores\n",
1592 1593 1594 1595 1596 1597 1598 1599 1600
			ratio, bclk, ratio * bclk);
	return;
}

static void
dump_ivt_turbo_ratio_limits(void)
{
	unsigned long long msr;
	unsigned int ratio;
1601

1602
	get_msr(base_cpu, MSR_TURBO_RATIO_LIMIT1, &msr);
1603

1604
	fprintf(outf, "cpu%d: MSR_TURBO_RATIO_LIMIT1: 0x%08llx\n", base_cpu, msr);
1605 1606 1607

	ratio = (msr >> 56) & 0xFF;
	if (ratio)
1608
		fprintf(outf, "%d * %.0f = %.0f MHz max turbo 16 active cores\n",
1609 1610 1611 1612
			ratio, bclk, ratio * bclk);

	ratio = (msr >> 48) & 0xFF;
	if (ratio)
1613
		fprintf(outf, "%d * %.0f = %.0f MHz max turbo 15 active cores\n",
1614 1615 1616 1617
			ratio, bclk, ratio * bclk);

	ratio = (msr >> 40) & 0xFF;
	if (ratio)
1618
		fprintf(outf, "%d * %.0f = %.0f MHz max turbo 14 active cores\n",
1619 1620 1621 1622
			ratio, bclk, ratio * bclk);

	ratio = (msr >> 32) & 0xFF;
	if (ratio)
1623
		fprintf(outf, "%d * %.0f = %.0f MHz max turbo 13 active cores\n",
1624 1625 1626 1627
			ratio, bclk, ratio * bclk);

	ratio = (msr >> 24) & 0xFF;
	if (ratio)
1628
		fprintf(outf, "%d * %.0f = %.0f MHz max turbo 12 active cores\n",
1629 1630 1631 1632
			ratio, bclk, ratio * bclk);

	ratio = (msr >> 16) & 0xFF;
	if (ratio)
1633
		fprintf(outf, "%d * %.0f = %.0f MHz max turbo 11 active cores\n",
1634 1635 1636 1637
			ratio, bclk, ratio * bclk);

	ratio = (msr >> 8) & 0xFF;
	if (ratio)
1638
		fprintf(outf, "%d * %.0f = %.0f MHz max turbo 10 active cores\n",
1639 1640 1641 1642
			ratio, bclk, ratio * bclk);

	ratio = (msr >> 0) & 0xFF;
	if (ratio)
1643
		fprintf(outf, "%d * %.0f = %.0f MHz max turbo 9 active cores\n",
1644
			ratio, bclk, ratio * bclk);
1645 1646
	return;
}
1647

1648 1649 1650 1651 1652
static void
dump_nhm_turbo_ratio_limits(void)
{
	unsigned long long msr;
	unsigned int ratio;
L
Len Brown 已提交
1653

1654
	get_msr(base_cpu, MSR_TURBO_RATIO_LIMIT, &msr);
L
Len Brown 已提交
1655

1656
	fprintf(outf, "cpu%d: MSR_TURBO_RATIO_LIMIT: 0x%08llx\n", base_cpu, msr);
1657 1658 1659

	ratio = (msr >> 56) & 0xFF;
	if (ratio)
1660
		fprintf(outf, "%d * %.0f = %.0f MHz max turbo 8 active cores\n",
1661 1662 1663 1664
			ratio, bclk, ratio * bclk);

	ratio = (msr >> 48) & 0xFF;
	if (ratio)
1665
		fprintf(outf, "%d * %.0f = %.0f MHz max turbo 7 active cores\n",
1666 1667 1668 1669
			ratio, bclk, ratio * bclk);

	ratio = (msr >> 40) & 0xFF;
	if (ratio)
1670
		fprintf(outf, "%d * %.0f = %.0f MHz max turbo 6 active cores\n",
1671 1672 1673 1674
			ratio, bclk, ratio * bclk);

	ratio = (msr >> 32) & 0xFF;
	if (ratio)
1675
		fprintf(outf, "%d * %.0f = %.0f MHz max turbo 5 active cores\n",
1676 1677
			ratio, bclk, ratio * bclk);

L
Len Brown 已提交
1678 1679
	ratio = (msr >> 24) & 0xFF;
	if (ratio)
1680
		fprintf(outf, "%d * %.0f = %.0f MHz max turbo 4 active cores\n",
L
Len Brown 已提交
1681 1682 1683 1684
			ratio, bclk, ratio * bclk);

	ratio = (msr >> 16) & 0xFF;
	if (ratio)
1685
		fprintf(outf, "%d * %.0f = %.0f MHz max turbo 3 active cores\n",
L
Len Brown 已提交
1686 1687 1688 1689
			ratio, bclk, ratio * bclk);

	ratio = (msr >> 8) & 0xFF;
	if (ratio)
1690
		fprintf(outf, "%d * %.0f = %.0f MHz max turbo 2 active cores\n",
L
Len Brown 已提交
1691 1692 1693 1694
			ratio, bclk, ratio * bclk);

	ratio = (msr >> 0) & 0xFF;
	if (ratio)
1695
		fprintf(outf, "%d * %.0f = %.0f MHz max turbo 1 active cores\n",
L
Len Brown 已提交
1696
			ratio, bclk, ratio * bclk);
1697 1698
	return;
}
1699

1700 1701 1702
static void
dump_knl_turbo_ratio_limits(void)
{
1703 1704
	const unsigned int buckets_no = 7;

1705
	unsigned long long msr;
1706 1707 1708 1709
	int delta_cores, delta_ratio;
	int i, b_nr;
	unsigned int cores[buckets_no];
	unsigned int ratio[buckets_no];
1710

1711
	get_msr(base_cpu, MSR_TURBO_RATIO_LIMIT, &msr);
1712

1713
	fprintf(outf, "cpu%d: MSR_TURBO_RATIO_LIMIT: 0x%08llx\n",
1714
		base_cpu, msr);
1715 1716 1717

	/**
	 * Turbo encoding in KNL is as follows:
1718 1719
	 * [0] -- Reserved
	 * [7:1] -- Base value of number of active cores of bucket 1.
1720 1721 1722 1723 1724 1725 1726 1727 1728 1729 1730 1731 1732 1733 1734 1735 1736 1737
	 * [15:8] -- Base value of freq ratio of bucket 1.
	 * [20:16] -- +ve delta of number of active cores of bucket 2.
	 * i.e. active cores of bucket 2 =
	 * active cores of bucket 1 + delta
	 * [23:21] -- Negative delta of freq ratio of bucket 2.
	 * i.e. freq ratio of bucket 2 =
	 * freq ratio of bucket 1 - delta
	 * [28:24]-- +ve delta of number of active cores of bucket 3.
	 * [31:29]-- -ve delta of freq ratio of bucket 3.
	 * [36:32]-- +ve delta of number of active cores of bucket 4.
	 * [39:37]-- -ve delta of freq ratio of bucket 4.
	 * [44:40]-- +ve delta of number of active cores of bucket 5.
	 * [47:45]-- -ve delta of freq ratio of bucket 5.
	 * [52:48]-- +ve delta of number of active cores of bucket 6.
	 * [55:53]-- -ve delta of freq ratio of bucket 6.
	 * [60:56]-- +ve delta of number of active cores of bucket 7.
	 * [63:61]-- -ve delta of freq ratio of bucket 7.
	 */
1738 1739 1740 1741 1742 1743

	b_nr = 0;
	cores[b_nr] = (msr & 0xFF) >> 1;
	ratio[b_nr] = (msr >> 8) & 0xFF;

	for (i = 16; i < 64; i += 8) {
1744
		delta_cores = (msr >> i) & 0x1F;
1745 1746 1747 1748 1749
		delta_ratio = (msr >> (i + 5)) & 0x7;

		cores[b_nr + 1] = cores[b_nr] + delta_cores;
		ratio[b_nr + 1] = ratio[b_nr] - delta_ratio;
		b_nr++;
1750
	}
1751 1752 1753

	for (i = buckets_no - 1; i >= 0; i--)
		if (i > 0 ? ratio[i] != ratio[i - 1] : 1)
1754
			fprintf(outf,
1755
				"%d * %.0f = %.0f MHz max turbo %d active cores\n",
1756
				ratio[i], bclk, ratio[i] * bclk, cores[i]);
1757 1758
}

1759 1760 1761 1762 1763
static void
dump_nhm_cst_cfg(void)
{
	unsigned long long msr;

1764
	get_msr(base_cpu, MSR_PKG_CST_CONFIG_CONTROL, &msr);
1765 1766 1767 1768

#define SNB_C1_AUTO_UNDEMOTE              (1UL << 27)
#define SNB_C3_AUTO_UNDEMOTE              (1UL << 28)

1769
	fprintf(outf, "cpu%d: MSR_PKG_CST_CONFIG_CONTROL: 0x%08llx", base_cpu, msr);
1770

1771
	fprintf(outf, " (%s%s%s%s%slocked: pkg-cstate-limit=%d: %s)\n",
1772 1773 1774 1775 1776
		(msr & SNB_C3_AUTO_UNDEMOTE) ? "UNdemote-C3, " : "",
		(msr & SNB_C1_AUTO_UNDEMOTE) ? "UNdemote-C1, " : "",
		(msr & NHM_C3_AUTO_DEMOTE) ? "demote-C3, " : "",
		(msr & NHM_C1_AUTO_DEMOTE) ? "demote-C1, " : "",
		(msr & (1 << 15)) ? "" : "UN",
1777
		(unsigned int)msr & 0xF,
1778 1779
		pkg_cstate_limit_strings[pkg_cstate_limit]);
	return;
L
Len Brown 已提交
1780 1781
}

1782 1783 1784 1785 1786 1787
static void
dump_config_tdp(void)
{
	unsigned long long msr;

	get_msr(base_cpu, MSR_CONFIG_TDP_NOMINAL, &msr);
1788
	fprintf(outf, "cpu%d: MSR_CONFIG_TDP_NOMINAL: 0x%08llx", base_cpu, msr);
1789
	fprintf(outf, " (base_ratio=%d)\n", (unsigned int)msr & 0xFF);
1790 1791

	get_msr(base_cpu, MSR_CONFIG_TDP_LEVEL_1, &msr);
1792
	fprintf(outf, "cpu%d: MSR_CONFIG_TDP_LEVEL_1: 0x%08llx (", base_cpu, msr);
1793
	if (msr) {
1794 1795 1796 1797
		fprintf(outf, "PKG_MIN_PWR_LVL1=%d ", (unsigned int)(msr >> 48) & 0x7FFF);
		fprintf(outf, "PKG_MAX_PWR_LVL1=%d ", (unsigned int)(msr >> 32) & 0x7FFF);
		fprintf(outf, "LVL1_RATIO=%d ", (unsigned int)(msr >> 16) & 0xFF);
		fprintf(outf, "PKG_TDP_LVL1=%d", (unsigned int)(msr) & 0x7FFF);
1798
	}
1799
	fprintf(outf, ")\n");
1800 1801

	get_msr(base_cpu, MSR_CONFIG_TDP_LEVEL_2, &msr);
1802
	fprintf(outf, "cpu%d: MSR_CONFIG_TDP_LEVEL_2: 0x%08llx (", base_cpu, msr);
1803
	if (msr) {
1804 1805 1806 1807
		fprintf(outf, "PKG_MIN_PWR_LVL2=%d ", (unsigned int)(msr >> 48) & 0x7FFF);
		fprintf(outf, "PKG_MAX_PWR_LVL2=%d ", (unsigned int)(msr >> 32) & 0x7FFF);
		fprintf(outf, "LVL2_RATIO=%d ", (unsigned int)(msr >> 16) & 0xFF);
		fprintf(outf, "PKG_TDP_LVL2=%d", (unsigned int)(msr) & 0x7FFF);
1808
	}
1809
	fprintf(outf, ")\n");
1810 1811

	get_msr(base_cpu, MSR_CONFIG_TDP_CONTROL, &msr);
1812
	fprintf(outf, "cpu%d: MSR_CONFIG_TDP_CONTROL: 0x%08llx (", base_cpu, msr);
1813
	if ((msr) & 0x3)
1814 1815 1816
		fprintf(outf, "TDP_LEVEL=%d ", (unsigned int)(msr) & 0x3);
	fprintf(outf, " lock=%d", (unsigned int)(msr >> 31) & 1);
	fprintf(outf, ")\n");
1817

1818
	get_msr(base_cpu, MSR_TURBO_ACTIVATION_RATIO, &msr);
1819
	fprintf(outf, "cpu%d: MSR_TURBO_ACTIVATION_RATIO: 0x%08llx (", base_cpu, msr);
1820
	fprintf(outf, "MAX_NON_TURBO_RATIO=%d", (unsigned int)(msr) & 0xFF);
1821 1822
	fprintf(outf, " lock=%d", (unsigned int)(msr >> 31) & 1);
	fprintf(outf, ")\n");
1823
}
1824 1825 1826 1827 1828 1829 1830 1831 1832 1833 1834 1835 1836 1837 1838 1839 1840 1841 1842 1843 1844 1845 1846 1847 1848 1849 1850 1851 1852 1853 1854 1855 1856 1857 1858 1859 1860 1861 1862 1863 1864

/*
 * Multiplier in ns for each value of the IRTL time-unit field.
 * The table has 8 entries, one per value of a 3-bit field.
 */
unsigned int irtl_time_units[] = {1, 32, 1024, 32768, 1048576, 33554432, 0, 0 };

/*
 * Print one IRTL register value that has already been read: the raw
 * value, whether bit 15 (valid) is set, and the latency computed as
 * bits 9:0 multiplied by the unit selected by bits 12:10.
 */
static void print_irtl_value(const char *name, unsigned long long msr)
{
	fprintf(outf, "cpu%d: %s: 0x%08llx (", base_cpu, name, msr);
	/* 0x7: use all three time-unit bits so every table entry is reachable */
	fprintf(outf, "%svalid, %lld ns)\n", msr & (1 << 15) ? "" : "NOT",
		(msr & 0x3FF) * irtl_time_units[(msr >> 10) & 0x7]);
}

/*
 * Print the package C-state interrupt response time limit registers as
 * read on base_cpu: PKGC3/6/7 always, PKGC8/9/10 only when do_irtl_hsw
 * is set.
 */
void print_irtl(void)
{
	unsigned long long msr;

	get_msr(base_cpu, MSR_PKGC3_IRTL, &msr);
	print_irtl_value("MSR_PKGC3_IRTL", msr);

	get_msr(base_cpu, MSR_PKGC6_IRTL, &msr);
	print_irtl_value("MSR_PKGC6_IRTL", msr);

	get_msr(base_cpu, MSR_PKGC7_IRTL, &msr);
	print_irtl_value("MSR_PKGC7_IRTL", msr);

	if (!do_irtl_hsw)
		return;

	get_msr(base_cpu, MSR_PKGC8_IRTL, &msr);
	print_irtl_value("MSR_PKGC8_IRTL", msr);

	get_msr(base_cpu, MSR_PKGC9_IRTL, &msr);
	print_irtl_value("MSR_PKGC9_IRTL", msr);

	get_msr(base_cpu, MSR_PKGC10_IRTL, &msr);
	print_irtl_value("MSR_PKGC10_IRTL", msr);
}
1865 1866 1867 1868
void free_fd_percpu(void)
{
	int i;

1869
	for (i = 0; i < topo.max_cpu_num + 1; ++i) {
1870 1871 1872 1873 1874
		if (fd_percpu[i] != 0)
			close(fd_percpu[i]);
	}

	free(fd_percpu);
1875 1876
}

1877
void free_all_buffers(void)
L
Len Brown 已提交
1878
{
1879 1880
	CPU_FREE(cpu_present_set);
	cpu_present_set = NULL;
1881
	cpu_present_setsize = 0;
L
Len Brown 已提交
1882

1883 1884 1885
	CPU_FREE(cpu_affinity_set);
	cpu_affinity_set = NULL;
	cpu_affinity_setsize = 0;
L
Len Brown 已提交
1886

1887 1888 1889
	free(thread_even);
	free(core_even);
	free(package_even);
L
Len Brown 已提交
1890

1891 1892 1893
	thread_even = NULL;
	core_even = NULL;
	package_even = NULL;
L
Len Brown 已提交
1894

1895 1896 1897
	free(thread_odd);
	free(core_odd);
	free(package_odd);
L
Len Brown 已提交
1898

1899 1900 1901
	thread_odd = NULL;
	core_odd = NULL;
	package_odd = NULL;
L
Len Brown 已提交
1902

1903 1904 1905
	free(output_buffer);
	output_buffer = NULL;
	outp = NULL;
1906 1907

	free_fd_percpu();
1908 1909 1910

	free(irq_column_2_cpu);
	free(irqs_per_cpu);
L
Len Brown 已提交
1911 1912
}

1913 1914 1915 1916 1917
/*
 * fopen_or_die()
 * fopen() wrapper that never returns NULL: if the open fails, the
 * program terminates through err() with exit status 1.
 */
FILE *fopen_or_die(const char *path, const char *mode)
{
	FILE *stream;

	stream = fopen(path, mode);
	if (stream == NULL)
		err(1, "%s: open failed", path);

	return stream;
}

1924
/*
1925
 * Parse a file containing a single int.
1926
 */
1927
int parse_int_file(const char *fmt, ...)
L
Len Brown 已提交
1928
{
1929 1930
	va_list args;
	char path[PATH_MAX];
1931
	FILE *filep;
1932
	int value;
L
Len Brown 已提交
1933

1934 1935 1936
	va_start(args, fmt);
	vsnprintf(path, sizeof(path), fmt, args);
	va_end(args);
1937
	filep = fopen_or_die(path, "r");
1938 1939
	if (fscanf(filep, "%d", &value) != 1)
		err(1, "%s: failed to parse number from file", path);
1940
	fclose(filep);
1941 1942 1943 1944
	return value;
}

/*
1945 1946 1947
 * get_cpu_position_in_core(cpu)
 * return the position of the CPU among its HT siblings in the core
 * return -1 if the sibling is not in list
1948
 */
1949
int get_cpu_position_in_core(int cpu)
1950
{
1951 1952 1953 1954 1955 1956 1957 1958 1959 1960 1961 1962 1963 1964 1965 1966 1967 1968 1969 1970 1971 1972 1973 1974 1975 1976 1977 1978 1979
	char path[64];
	FILE *filep;
	int this_cpu;
	char character;
	int i;

	sprintf(path,
		"/sys/devices/system/cpu/cpu%d/topology/thread_siblings_list",
		cpu);
	filep = fopen(path, "r");
	if (filep == NULL) {
		perror(path);
		exit(1);
	}

	for (i = 0; i < topo.num_threads_per_core; i++) {
		fscanf(filep, "%d", &this_cpu);
		if (this_cpu == cpu) {
			fclose(filep);
			return i;
		}

		/* Account for no separator after last thread*/
		if (i != (topo.num_threads_per_core - 1))
			fscanf(filep, "%c", &character);
	}

	fclose(filep);
	return -1;
L
Len Brown 已提交
1980 1981
}

1982 1983 1984 1985 1986
/*
 * cpu_is_first_core_in_package(cpu)
 * return 1 if the first number in the CPU's core_siblings_list file
 * is the CPU itself, else 0
 */
int cpu_is_first_core_in_package(int cpu)
{
	int first_sibling;

	first_sibling = parse_int_file("/sys/devices/system/cpu/cpu%d/topology/core_siblings_list", cpu);

	return first_sibling == cpu;
}

/*
 * get_physical_package_id(cpu)
 * return the integer stored in the CPU's physical_package_id sysfs file
 */
int get_physical_package_id(int cpu)
{
	int pkg_id;

	pkg_id = parse_int_file("/sys/devices/system/cpu/cpu%d/topology/physical_package_id", cpu);

	return pkg_id;
}

/*
 * get_core_id(cpu)
 * return the integer stored in the CPU's core_id sysfs file
 */
int get_core_id(int cpu)
{
	int core_id;

	core_id = parse_int_file("/sys/devices/system/cpu/cpu%d/topology/core_id", cpu);

	return core_id;
}

2001 2002 2003 2004
/*
 * count_cpu_list_entries()
 * Count the CPUs named by a cpu list string: numbers separated by ','
 * where each item may also be a "first-last" range
 * (eg "0", "1-2" or "1,3,4,5").
 * Returns 0 if the string does not start with a number.
 */
static int count_cpu_list_entries(const char *list)
{
	const char *p = list;
	int count = 0;

	while (*p != '\0') {
		char *end;
		long first, last;

		first = strtol(p, &end, 10);
		if (end == p)
			break;	/* no number here, e.g. the trailing newline */
		last = first;
		p = end;

		if (*p == '-') {
			last = strtol(p + 1, &end, 10);
			if (end == p + 1)
				break;	/* '-' without an upper bound */
			p = end;
		}

		if (last >= first)
			count += (int)(last - first + 1);

		if (*p != ',')
			break;
		p++;
	}

	return count;
}

/*
 * get_num_ht_siblings(cpu)
 * return the number of CPUs listed in the CPU's thread_siblings_list
 * file, never less than 1
 * exits if the file cannot be opened or read
 */
int get_num_ht_siblings(int cpu)
{
	char path[80];
	char str[100];
	FILE *filep;
	int siblings;

	snprintf(path, sizeof(path), "/sys/devices/system/cpu/cpu%d/topology/thread_siblings_list", cpu);
	filep = fopen_or_die(path, "r");

	/*
	 * file format:
	 * A ',' separated or '-' separated set of numbers
	 * (eg 1-2 or 1,3,4,5)
	 */
	if (fgets(str, sizeof(str), filep) == NULL)
		err(1, "%s: failed to read sibling list", path);

	fclose(filep);

	/* a lone CPU ("0\n") must count as one sibling, not two */
	siblings = count_cpu_list_entries(str);
	return siblings > 0 ? siblings : 1;
}

L
Len Brown 已提交
2032
/*
2033 2034
 * run func(thread, core, package) in topology order
 * skip non-present cpus
L
Len Brown 已提交
2035 2036
 */

2037 2038 2039 2040 2041 2042 2043 2044 2045 2046 2047 2048 2049 2050 2051 2052 2053 2054 2055 2056 2057 2058 2059 2060 2061 2062 2063 2064 2065 2066 2067 2068 2069 2070 2071 2072 2073 2074 2075 2076 2077 2078 2079 2080
int for_all_cpus_2(int (func)(struct thread_data *, struct core_data *,
	struct pkg_data *, struct thread_data *, struct core_data *,
	struct pkg_data *), struct thread_data *thread_base,
	struct core_data *core_base, struct pkg_data *pkg_base,
	struct thread_data *thread_base2, struct core_data *core_base2,
	struct pkg_data *pkg_base2)
{
	int retval, pkg_no, core_no, thread_no;

	for (pkg_no = 0; pkg_no < topo.num_packages; ++pkg_no) {
		for (core_no = 0; core_no < topo.num_cores_per_pkg; ++core_no) {
			for (thread_no = 0; thread_no <
				topo.num_threads_per_core; ++thread_no) {
				struct thread_data *t, *t2;
				struct core_data *c, *c2;
				struct pkg_data *p, *p2;

				t = GET_THREAD(thread_base, thread_no, core_no, pkg_no);

				if (cpu_is_not_present(t->cpu_id))
					continue;

				t2 = GET_THREAD(thread_base2, thread_no, core_no, pkg_no);

				c = GET_CORE(core_base, core_no, pkg_no);
				c2 = GET_CORE(core_base2, core_no, pkg_no);

				p = GET_PKG(pkg_base, pkg_no);
				p2 = GET_PKG(pkg_base2, pkg_no);

				retval = func(t, c, p, t2, c2, p2);
				if (retval)
					return retval;
			}
		}
	}
	return 0;
}

/*
 * run func(cpu) on every cpu in /proc/stat
 * return max_cpu number
 */
int for_all_proc_cpus(int (func)(int))
L
Len Brown 已提交
2081 2082
{
	FILE *fp;
2083
	int cpu_num;
L
Len Brown 已提交
2084 2085
	int retval;

2086
	fp = fopen_or_die(proc_stat, "r");
L
Len Brown 已提交
2087 2088

	retval = fscanf(fp, "cpu %*d %*d %*d %*d %*d %*d %*d %*d %*d %*d\n");
2089 2090
	if (retval != 0)
		err(1, "%s: failed to parse format", proc_stat);
L
Len Brown 已提交
2091

2092 2093
	while (1) {
		retval = fscanf(fp, "cpu%u %*d %*d %*d %*d %*d %*d %*d %*d %*d %*d\n", &cpu_num);
L
Len Brown 已提交
2094 2095 2096
		if (retval != 1)
			break;

2097 2098 2099 2100 2101
		retval = func(cpu_num);
		if (retval) {
			fclose(fp);
			return(retval);
		}
L
Len Brown 已提交
2102 2103
	}
	fclose(fp);
2104
	return 0;
L
Len Brown 已提交
2105 2106 2107 2108
}

/*
 * re_initialize()
 * Throw away every buffer, set them up again, and report the
 * resulting CPU count on stdout.
 */
void re_initialize(void)
{
	free_all_buffers();
	setup_all_buffers();

	fprintf(stdout, "turbostat: re-initialized with num_cpus %d\n", topo.num_cpus);
}

2114

L
Len Brown 已提交
2115
/*
2116 2117
 * count_cpus()
 * remember the last one seen, it will be the max
L
Len Brown 已提交
2118
 */
2119
int count_cpus(int cpu)
L
Len Brown 已提交
2120
{
2121 2122
	if (topo.max_cpu_num < cpu)
		topo.max_cpu_num = cpu;
L
Len Brown 已提交
2123

2124 2125 2126 2127 2128 2129
	topo.num_cpus += 1;
	return 0;
}
/*
 * mark_cpu_present()
 * Per-CPU callback: set this CPU's bit in cpu_present_set.
 * Always returns 0.
 */
int mark_cpu_present(int cpu)
{
	CPU_SET_S(cpu, cpu_present_setsize, cpu_present_set);

	return 0;
}

2133 2134 2135 2136 2137 2138 2139 2140 2141 2142 2143 2144 2145 2146 2147 2148 2149 2150 2151 2152 2153 2154 2155 2156 2157 2158 2159 2160 2161 2162 2163 2164 2165 2166 2167 2168 2169 2170 2171 2172 2173 2174 2175 2176 2177 2178 2179 2180 2181 2182 2183 2184 2185 2186 2187 2188 2189 2190 2191 2192 2193 2194 2195
/*
 * snapshot_proc_interrupts()
 *
 * read and record summary of /proc/interrupts:
 * irq_column_2_cpu[] maps each header column to its CPU number and
 * irqs_per_cpu[] receives the per-CPU sum of all count lines
 *
 * the file is opened on first use and rewound on later calls
 *
 * return 1 if config change requires a restart (a CPU number above
 * topo.max_cpu_num appears in the header), else return 0
 */
int snapshot_proc_interrupts(void)
{
	static FILE *fp;
	int column, retval;

	if (fp == NULL)
		fp = fopen_or_die("/proc/interrupts", "r");
	else
		rewind(fp);

	/* read 1st line of /proc/interrupts to get cpu* name for each column */
	for (column = 0; column < topo.num_cpus; ++column) {
		int cpu_number;

		retval = fscanf(fp, " CPU%d", &cpu_number);
		if (retval != 1)
			break;

		if (cpu_number > topo.max_cpu_num) {
			warn("/proc/interrupts: cpu%d: > %d", cpu_number, topo.max_cpu_num);
			return 1;
		}

		irq_column_2_cpu[column] = cpu_number;
		irqs_per_cpu[cpu_number] = 0;
	}

	/* read /proc/interrupt count lines and sum up irqs per cpu */
	while (1) {
		char buf[64];
		int ch;

		/* field width keeps an over-long label from overrunning buf */
		retval = fscanf(fp, " %63s:", buf);	/* flush irq# "N:" */
		if (retval != 1)
			break;

		/* read the count per cpu */
		for (column = 0; column < topo.num_cpus; ++column) {

			int cpu_number, irq_count;

			retval = fscanf(fp, " %d", &irq_count);
			if (retval != 1)
				break;

			cpu_number = irq_column_2_cpu[column];
			irqs_per_cpu[cpu_number] += irq_count;

		}

		/* flush interrupt description; stop at EOF instead of spinning */
		do {
			ch = getc(fp);
		} while (ch != '\n' && ch != EOF);

	}
	return 0;
}
L
Len Brown 已提交
2196 2197 2198 2199 2200 2201 2202 2203 2204 2205 2206 2207 2208 2209 2210 2211 2212 2213 2214 2215 2216 2217 2218
/*
 * snapshot_gfx_rc6_ms()
 *
 * store the current value of
 * /sys/class/drm/card0/power/rc6_residency_ms
 * in gfx_cur_rc6_ms
 *
 * exits if the file cannot be opened or parsed; otherwise returns 0
 */
int snapshot_gfx_rc6_ms(void)
{
	FILE *rc6_file;

	rc6_file = fopen_or_die("/sys/class/drm/card0/power/rc6_residency_ms", "r");

	if (fscanf(rc6_file, "%lld", &gfx_cur_rc6_ms) != 1)
		err(1, "GFX rc6");

	fclose(rc6_file);
	return 0;
}
L
Len Brown 已提交
2219 2220 2221 2222 2223 2224 2225 2226 2227 2228 2229 2230 2231 2232 2233 2234 2235 2236 2237 2238 2239 2240 2241 2242
/*
 * snapshot_gfx_mhz()
 *
 * store the current value of
 * /sys/class/graphics/fb0/device/drm/card0/gt_cur_freq_mhz
 * in gfx_cur_mhz
 *
 * the file is opened once and rewound on every later call
 *
 * exits if the file cannot be opened or parsed; otherwise returns 0
 */
int snapshot_gfx_mhz(void)
{
	static FILE *fp;

	if (fp != NULL)
		rewind(fp);
	else
		fp = fopen_or_die("/sys/class/graphics/fb0/device/drm/card0/gt_cur_freq_mhz", "r");

	if (fscanf(fp, "%d", &gfx_cur_mhz) != 1)
		err(1, "GFX MHz");

	return 0;
}
2243 2244 2245 2246 2247 2248 2249 2250 2251 2252 2253

/*
 * snapshot /proc and /sys files
 *
 * return 1 if configuration restart needed, else return 0
 */
int snapshot_proc_sysfs_files(void)
{
	if (snapshot_proc_interrupts())
		return 1;

2254
	if (DO_BIC(BIC_GFX_rc6))
L
Len Brown 已提交
2255 2256
		snapshot_gfx_rc6_ms();

2257
	if (DO_BIC(BIC_GFXMHz))
L
Len Brown 已提交
2258 2259
		snapshot_gfx_mhz();

2260 2261 2262
	return 0;
}

L
Len Brown 已提交
2263 2264
void turbostat_loop()
{
2265
	int retval;
2266
	int restarted = 0;
2267

L
Len Brown 已提交
2268
restart:
2269 2270
	restarted++;

2271
	snapshot_proc_sysfs_files();
2272
	retval = for_all_cpus(get_counters, EVEN_COUNTERS);
2273 2274 2275
	if (retval < -1) {
		exit(retval);
	} else if (retval == -1) {
2276 2277 2278
		if (restarted > 1) {
			exit(retval);
		}
2279 2280 2281
		re_initialize();
		goto restart;
	}
2282
	restarted = 0;
L
Len Brown 已提交
2283 2284 2285
	gettimeofday(&tv_even, (struct timezone *)NULL);

	while (1) {
2286
		if (for_all_proc_cpus(cpu_is_not_present)) {
L
Len Brown 已提交
2287 2288 2289
			re_initialize();
			goto restart;
		}
2290
		nanosleep(&interval_ts, NULL);
2291 2292
		if (snapshot_proc_sysfs_files())
			goto restart;
2293
		retval = for_all_cpus(get_counters, ODD_COUNTERS);
2294 2295 2296
		if (retval < -1) {
			exit(retval);
		} else if (retval == -1) {
2297 2298 2299
			re_initialize();
			goto restart;
		}
L
Len Brown 已提交
2300 2301
		gettimeofday(&tv_odd, (struct timezone *)NULL);
		timersub(&tv_odd, &tv_even, &tv_delta);
2302 2303 2304 2305
		if (for_all_cpus_2(delta_cpu, ODD_COUNTERS, EVEN_COUNTERS)) {
			re_initialize();
			goto restart;
		}
2306 2307
		compute_average(EVEN_COUNTERS);
		format_all_counters(EVEN_COUNTERS);
2308
		flush_output_stdout();
2309
		nanosleep(&interval_ts, NULL);
2310 2311
		if (snapshot_proc_sysfs_files())
			goto restart;
2312
		retval = for_all_cpus(get_counters, EVEN_COUNTERS);
2313 2314 2315
		if (retval < -1) {
			exit(retval);
		} else if (retval == -1) {
L
Len Brown 已提交
2316 2317 2318 2319 2320
			re_initialize();
			goto restart;
		}
		gettimeofday(&tv_even, (struct timezone *)NULL);
		timersub(&tv_even, &tv_odd, &tv_delta);
2321 2322 2323 2324
		if (for_all_cpus_2(delta_cpu, EVEN_COUNTERS, ODD_COUNTERS)) {
			re_initialize();
			goto restart;
		}
2325 2326
		compute_average(ODD_COUNTERS);
		format_all_counters(ODD_COUNTERS);
2327
		flush_output_stdout();
L
Len Brown 已提交
2328 2329 2330 2331 2332 2333
	}
}

void check_dev_msr()
{
	struct stat sb;
2334
	char pathname[32];
L
Len Brown 已提交
2335

2336 2337
	sprintf(pathname, "/dev/cpu/%d/msr", base_cpu);
	if (stat(pathname, &sb))
2338 2339
 		if (system("/sbin/modprobe msr > /dev/null 2>&1"))
			err(-5, "no /dev/cpu/0/msr, Try \"# modprobe msr\" ");
L
Len Brown 已提交
2340 2341
}

2342
void check_permissions()
L
Len Brown 已提交
2343
{
2344 2345 2346 2347 2348 2349
	struct __user_cap_header_struct cap_header_data;
	cap_user_header_t cap_header = &cap_header_data;
	struct __user_cap_data_struct cap_data_data;
	cap_user_data_t cap_data = &cap_data_data;
	extern int capget(cap_user_header_t hdrp, cap_user_data_t datap);
	int do_exit = 0;
2350
	char pathname[32];
2351 2352 2353 2354 2355 2356 2357 2358 2359 2360 2361 2362 2363 2364

	/* check for CAP_SYS_RAWIO */
	cap_header->pid = getpid();
	cap_header->version = _LINUX_CAPABILITY_VERSION;
	if (capget(cap_header, cap_data) < 0)
		err(-6, "capget(2) failed");

	if ((cap_data->effective & (1 << CAP_SYS_RAWIO)) == 0) {
		do_exit++;
		warnx("capget(CAP_SYS_RAWIO) failed,"
			" try \"# setcap cap_sys_rawio=ep %s\"", progname);
	}

	/* test file permissions */
2365 2366
	sprintf(pathname, "/dev/cpu/%d/msr", base_cpu);
	if (euidaccess(pathname, R_OK)) {
2367 2368 2369 2370 2371 2372 2373
		do_exit++;
		warn("/dev/cpu/0/msr open failed, try chown or chmod +r /dev/cpu/*/msr");
	}

	/* if all else fails, thell them to be root */
	if (do_exit)
		if (getuid() != 0)
2374
			warnx("... or simply run as root");
2375 2376 2377

	if (do_exit)
		exit(-6);
L
Len Brown 已提交
2378 2379
}

2380 2381 2382 2383 2384
/*
 * NHM adds support for additional MSRs:
 *
 * MSR_SMI_COUNT                   0x00000034
 *
2385
 * MSR_PLATFORM_INFO               0x000000ce
2386
 * MSR_PKG_CST_CONFIG_CONTROL     0x000000e2
2387
 *
2388 2389
 * MSR_MISC_PWR_MGMT               0x000001aa
 *
2390 2391 2392 2393 2394
 * MSR_PKG_C3_RESIDENCY            0x000003f8
 * MSR_PKG_C6_RESIDENCY            0x000003f9
 * MSR_CORE_C3_RESIDENCY           0x000003fc
 * MSR_CORE_C6_RESIDENCY           0x000003fd
 *
2395
 * Side effect:
2396
 * sets global pkg_cstate_limit to decode MSR_PKG_CST_CONFIG_CONTROL
2397
 */
2398
int probe_nhm_msrs(unsigned int family, unsigned int model)
L
Len Brown 已提交
2399
{
2400
	unsigned long long msr;
2401
	unsigned int base_ratio;
2402 2403
	int *pkg_cstate_limits;

L
Len Brown 已提交
2404 2405 2406 2407 2408 2409
	if (!genuine_intel)
		return 0;

	if (family != 6)
		return 0;

2410 2411
	bclk = discover_bclk(family, model);

L
Len Brown 已提交
2412
	switch (model) {
2413 2414
	case INTEL_FAM6_NEHALEM_EP:	/* Core i7, Xeon 5500 series - Bloomfield, Gainstown NHM-EP */
	case INTEL_FAM6_NEHALEM:	/* Core i7 and i5 Processor - Clarksfield, Lynnfield, Jasper Forest */
L
Len Brown 已提交
2415
	case 0x1F:	/* Core i7 and i5 Processor - Nehalem */
2416 2417 2418 2419
	case INTEL_FAM6_WESTMERE:	/* Westmere Client - Clarkdale, Arrandale */
	case INTEL_FAM6_WESTMERE_EP:	/* Westmere EP - Gulftown */
	case INTEL_FAM6_NEHALEM_EX:	/* Nehalem-EX Xeon - Beckton */
	case INTEL_FAM6_WESTMERE_EX:	/* Westmere-EX Xeon - Eagleton */
2420 2421
		pkg_cstate_limits = nhm_pkg_cstate_limits;
		break;
2422 2423 2424 2425
	case INTEL_FAM6_SANDYBRIDGE:	/* SNB */
	case INTEL_FAM6_SANDYBRIDGE_X:	/* SNB Xeon */
	case INTEL_FAM6_IVYBRIDGE:	/* IVB */
	case INTEL_FAM6_IVYBRIDGE_X:	/* IVB Xeon */
2426 2427
		pkg_cstate_limits = snb_pkg_cstate_limits;
		break;
2428 2429 2430 2431 2432 2433 2434 2435 2436 2437 2438 2439
	case INTEL_FAM6_HASWELL_CORE:	/* HSW */
	case INTEL_FAM6_HASWELL_X:	/* HSX */
	case INTEL_FAM6_HASWELL_ULT:	/* HSW */
	case INTEL_FAM6_HASWELL_GT3E:	/* HSW */
	case INTEL_FAM6_BROADWELL_CORE:	/* BDW */
	case INTEL_FAM6_BROADWELL_GT3E:	/* BDW */
	case INTEL_FAM6_BROADWELL_X:	/* BDX */
	case INTEL_FAM6_BROADWELL_XEON_D:	/* BDX-DE */
	case INTEL_FAM6_SKYLAKE_MOBILE:	/* SKL */
	case INTEL_FAM6_SKYLAKE_DESKTOP:	/* SKL */
	case INTEL_FAM6_KABYLAKE_MOBILE:	/* KBL */
	case INTEL_FAM6_KABYLAKE_DESKTOP:	/* KBL */
2440 2441
		pkg_cstate_limits = hsw_pkg_cstate_limits;
		break;
2442 2443 2444
	case INTEL_FAM6_SKYLAKE_X:	/* SKX */
		pkg_cstate_limits = skx_pkg_cstate_limits;
		break;
2445
	case INTEL_FAM6_ATOM_SILVERMONT1:	/* BYT */
2446
		no_MSR_MISC_PWR_MGMT = 1;
2447
	case INTEL_FAM6_ATOM_SILVERMONT2:	/* AVN */
2448 2449
		pkg_cstate_limits = slv_pkg_cstate_limits;
		break;
2450
	case INTEL_FAM6_ATOM_AIRMONT:	/* AMT */
2451
		pkg_cstate_limits = amt_pkg_cstate_limits;
2452
		no_MSR_MISC_PWR_MGMT = 1;
2453
		break;
2454
	case INTEL_FAM6_XEON_PHI_KNL:	/* PHI */
2455
	case INTEL_FAM6_XEON_PHI_KNM:
2456 2457
		pkg_cstate_limits = phi_pkg_cstate_limits;
		break;
2458 2459
	case INTEL_FAM6_ATOM_GOLDMONT:	/* BXT */
	case INTEL_FAM6_ATOM_DENVERTON:	/* DNV */
2460 2461
		pkg_cstate_limits = bxt_pkg_cstate_limits;
		break;
L
Len Brown 已提交
2462 2463 2464
	default:
		return 0;
	}
2465
	get_msr(base_cpu, MSR_PKG_CST_CONFIG_CONTROL, &msr);
2466
	pkg_cstate_limit = pkg_cstate_limits[msr & 0xF];
2467

2468
	get_msr(base_cpu, MSR_PLATFORM_INFO, &msr);
2469 2470 2471 2472
	base_ratio = (msr >> 8) & 0xFF;

	base_hz = base_ratio * bclk * 1000000;
	has_base_hz = 1;
2473
	return 1;
L
Len Brown 已提交
2474
}
2475 2476 2477 2478
int has_nhm_turbo_ratio_limit(unsigned int family, unsigned int model)
{
	switch (model) {
	/* Nehalem compatible, but do not include turbo-ratio limit support */
2479 2480 2481
	case INTEL_FAM6_NEHALEM_EX:	/* Nehalem-EX Xeon - Beckton */
	case INTEL_FAM6_WESTMERE_EX:	/* Westmere-EX Xeon - Eagleton */
	case INTEL_FAM6_XEON_PHI_KNL:	/* PHI - Knights Landing (different MSR definition) */
2482
	case INTEL_FAM6_XEON_PHI_KNM:
2483 2484 2485 2486 2487
		return 0;
	default:
		return 1;
	}
}
2488 2489 2490 2491 2492 2493 2494 2495 2496
int has_ivt_turbo_ratio_limit(unsigned int family, unsigned int model)
{
	if (!genuine_intel)
		return 0;

	if (family != 6)
		return 0;

	switch (model) {
2497 2498
	case INTEL_FAM6_IVYBRIDGE_X:	/* IVB Xeon */
	case INTEL_FAM6_HASWELL_X:	/* HSW Xeon */
2499 2500 2501 2502 2503 2504 2505 2506 2507 2508 2509 2510 2511 2512
		return 1;
	default:
		return 0;
	}
}
int has_hsw_turbo_ratio_limit(unsigned int family, unsigned int model)
{
	if (!genuine_intel)
		return 0;

	if (family != 6)
		return 0;

	switch (model) {
2513
	case INTEL_FAM6_HASWELL_X:	/* HSW Xeon */
2514 2515 2516 2517 2518 2519
		return 1;
	default:
		return 0;
	}
}

2520 2521 2522 2523 2524 2525 2526 2527 2528
int has_knl_turbo_ratio_limit(unsigned int family, unsigned int model)
{
	if (!genuine_intel)
		return 0;

	if (family != 6)
		return 0;

	switch (model) {
2529
	case INTEL_FAM6_XEON_PHI_KNL:	/* Knights Landing */
2530
	case INTEL_FAM6_XEON_PHI_KNM:
2531 2532 2533 2534 2535
		return 1;
	default:
		return 0;
	}
}
2536 2537 2538 2539 2540 2541 2542 2543 2544
int has_config_tdp(unsigned int family, unsigned int model)
{
	if (!genuine_intel)
		return 0;

	if (family != 6)
		return 0;

	switch (model) {
2545 2546 2547 2548 2549 2550 2551 2552 2553 2554 2555 2556 2557 2558 2559 2560
	case INTEL_FAM6_IVYBRIDGE:	/* IVB */
	case INTEL_FAM6_HASWELL_CORE:	/* HSW */
	case INTEL_FAM6_HASWELL_X:	/* HSX */
	case INTEL_FAM6_HASWELL_ULT:	/* HSW */
	case INTEL_FAM6_HASWELL_GT3E:	/* HSW */
	case INTEL_FAM6_BROADWELL_CORE:	/* BDW */
	case INTEL_FAM6_BROADWELL_GT3E:	/* BDW */
	case INTEL_FAM6_BROADWELL_X:	/* BDX */
	case INTEL_FAM6_BROADWELL_XEON_D:	/* BDX-DE */
	case INTEL_FAM6_SKYLAKE_MOBILE:	/* SKL */
	case INTEL_FAM6_SKYLAKE_DESKTOP:	/* SKL */
	case INTEL_FAM6_KABYLAKE_MOBILE:	/* KBL */
	case INTEL_FAM6_KABYLAKE_DESKTOP:	/* KBL */
	case INTEL_FAM6_SKYLAKE_X:	/* SKX */

	case INTEL_FAM6_XEON_PHI_KNL:	/* Knights Landing */
2561
	case INTEL_FAM6_XEON_PHI_KNM:
2562 2563 2564 2565 2566 2567
		return 1;
	default:
		return 0;
	}
}

2568
static void
2569
dump_cstate_pstate_config_info(unsigned int family, unsigned int model)
2570 2571 2572 2573 2574 2575 2576 2577 2578 2579 2580 2581 2582 2583 2584
{
	if (!do_nhm_platform_info)
		return;

	dump_nhm_platform_info();

	if (has_hsw_turbo_ratio_limit(family, model))
		dump_hsw_turbo_ratio_limits();

	if (has_ivt_turbo_ratio_limit(family, model))
		dump_ivt_turbo_ratio_limits();

	if (has_nhm_turbo_ratio_limit(family, model))
		dump_nhm_turbo_ratio_limits();

2585 2586 2587
	if (has_knl_turbo_ratio_limit(family, model))
		dump_knl_turbo_ratio_limits();

2588 2589 2590
	if (has_config_tdp(family, model))
		dump_config_tdp();

2591 2592 2593 2594
	dump_nhm_cst_cfg();
}


2595 2596 2597 2598 2599 2600 2601 2602 2603 2604 2605 2606 2607 2608 2609 2610 2611 2612 2613 2614
/*
 * print_epb()
 * Decode the ENERGY_PERF_BIAS MSR
 */
int print_epb(struct thread_data *t, struct core_data *c, struct pkg_data *p)
{
	unsigned long long msr;
	char *epb_string;
	int cpu;

	if (!has_epb)
		return 0;

	cpu = t->cpu_id;

	/* EPB is per-package */
	if (!(t->flags & CPU_IS_FIRST_THREAD_IN_CORE) || !(t->flags & CPU_IS_FIRST_CORE_IN_PACKAGE))
		return 0;

	if (cpu_migrate(cpu)) {
2615
		fprintf(outf, "Could not migrate to CPU %d\n", cpu);
2616 2617 2618 2619 2620 2621
		return -1;
	}

	if (get_msr(cpu, MSR_IA32_ENERGY_PERF_BIAS, &msr))
		return 0;

2622
	switch (msr & 0xF) {
2623 2624 2625 2626 2627 2628 2629 2630 2631 2632 2633 2634 2635
	case ENERGY_PERF_BIAS_PERFORMANCE:
		epb_string = "performance";
		break;
	case ENERGY_PERF_BIAS_NORMAL:
		epb_string = "balanced";
		break;
	case ENERGY_PERF_BIAS_POWERSAVE:
		epb_string = "powersave";
		break;
	default:
		epb_string = "custom";
		break;
	}
2636
	fprintf(outf, "cpu%d: MSR_IA32_ENERGY_PERF_BIAS: 0x%08llx (%s)\n", cpu, msr, epb_string);
2637 2638 2639

	return 0;
}
2640 2641 2642 2643 2644 2645 2646 2647 2648 2649 2650 2651 2652 2653 2654 2655 2656 2657 2658
/*
 * print_hwp()
 * Decode the MSR_HWP_CAPABILITIES
 */
int print_hwp(struct thread_data *t, struct core_data *c, struct pkg_data *p)
{
	unsigned long long msr;
	int cpu;

	if (!has_hwp)
		return 0;

	cpu = t->cpu_id;

	/* MSR_HWP_CAPABILITIES is per-package */
	if (!(t->flags & CPU_IS_FIRST_THREAD_IN_CORE) || !(t->flags & CPU_IS_FIRST_CORE_IN_PACKAGE))
		return 0;

	if (cpu_migrate(cpu)) {
2659
		fprintf(outf, "Could not migrate to CPU %d\n", cpu);
2660 2661 2662 2663 2664 2665
		return -1;
	}

	if (get_msr(cpu, MSR_PM_ENABLE, &msr))
		return 0;

2666
	fprintf(outf, "cpu%d: MSR_PM_ENABLE: 0x%08llx (%sHWP)\n",
2667 2668 2669 2670 2671 2672 2673 2674 2675
		cpu, msr, (msr & (1 << 0)) ? "" : "No-");

	/* MSR_PM_ENABLE[1] == 1 if HWP is enabled and MSRs visible */
	if ((msr & (1 << 0)) == 0)
		return 0;

	if (get_msr(cpu, MSR_HWP_CAPABILITIES, &msr))
		return 0;

2676
	fprintf(outf, "cpu%d: MSR_HWP_CAPABILITIES: 0x%08llx "
2677 2678 2679 2680 2681 2682 2683 2684 2685 2686
			"(high 0x%x guar 0x%x eff 0x%x low 0x%x)\n",
			cpu, msr,
			(unsigned int)HWP_HIGHEST_PERF(msr),
			(unsigned int)HWP_GUARANTEED_PERF(msr),
			(unsigned int)HWP_MOSTEFFICIENT_PERF(msr),
			(unsigned int)HWP_LOWEST_PERF(msr));

	if (get_msr(cpu, MSR_HWP_REQUEST, &msr))
		return 0;

2687
	fprintf(outf, "cpu%d: MSR_HWP_REQUEST: 0x%08llx "
2688 2689 2690 2691 2692 2693 2694 2695 2696 2697 2698 2699 2700
			"(min 0x%x max 0x%x des 0x%x epp 0x%x window 0x%x pkg 0x%x)\n",
			cpu, msr,
			(unsigned int)(((msr) >> 0) & 0xff),
			(unsigned int)(((msr) >> 8) & 0xff),
			(unsigned int)(((msr) >> 16) & 0xff),
			(unsigned int)(((msr) >> 24) & 0xff),
			(unsigned int)(((msr) >> 32) & 0xff3),
			(unsigned int)(((msr) >> 42) & 0x1));

	if (has_hwp_pkg) {
		if (get_msr(cpu, MSR_HWP_REQUEST_PKG, &msr))
			return 0;

2701
		fprintf(outf, "cpu%d: MSR_HWP_REQUEST_PKG: 0x%08llx "
2702 2703 2704 2705 2706 2707 2708 2709 2710 2711 2712 2713
			"(min 0x%x max 0x%x des 0x%x epp 0x%x window 0x%x)\n",
			cpu, msr,
			(unsigned int)(((msr) >> 0) & 0xff),
			(unsigned int)(((msr) >> 8) & 0xff),
			(unsigned int)(((msr) >> 16) & 0xff),
			(unsigned int)(((msr) >> 24) & 0xff),
			(unsigned int)(((msr) >> 32) & 0xff3));
	}
	if (has_hwp_notify) {
		if (get_msr(cpu, MSR_HWP_INTERRUPT, &msr))
			return 0;

2714
		fprintf(outf, "cpu%d: MSR_HWP_INTERRUPT: 0x%08llx "
2715 2716 2717 2718 2719 2720 2721 2722
			"(%s_Guaranteed_Perf_Change, %s_Excursion_Min)\n",
			cpu, msr,
			((msr) & 0x1) ? "EN" : "Dis",
			((msr) & 0x2) ? "EN" : "Dis");
	}
	if (get_msr(cpu, MSR_HWP_STATUS, &msr))
		return 0;

2723
	fprintf(outf, "cpu%d: MSR_HWP_STATUS: 0x%08llx "
2724 2725 2726 2727
			"(%sGuaranteed_Perf_Change, %sExcursion_Min)\n",
			cpu, msr,
			((msr) & 0x1) ? "" : "No-",
			((msr) & 0x2) ? "" : "No-");
2728 2729 2730 2731

	return 0;
}

2732 2733 2734 2735 2736 2737 2738 2739 2740 2741 2742 2743 2744 2745 2746
/*
 * print_perf_limit()
 * Decode the core, graphics and ring PERF_LIMIT_REASONS MSRs, each one
 * only when its do_*_perf_limit_reasons flag is set.  For every register
 * the low 16 bits are printed as "Active" reasons and bits 31:16 as
 * "Logged" reasons.
 *
 * Does nothing unless t is both the first thread in its core and in the
 * first core of its package.
 * Returns -1 if migrating to the CPU fails, 0 otherwise.
 *
 * All bit masks are built from 1ULL so that bit 31 is tested without
 * overflowing a signed int or sign-extending into the upper half of msr.
 */
int print_perf_limit(struct thread_data *t, struct core_data *c, struct pkg_data *p)
{
	unsigned long long msr;
	int cpu;

	cpu = t->cpu_id;

	/* per-package */
	if (!(t->flags & CPU_IS_FIRST_THREAD_IN_CORE) || !(t->flags & CPU_IS_FIRST_CORE_IN_PACKAGE))
		return 0;

	if (cpu_migrate(cpu)) {
		fprintf(outf, "Could not migrate to CPU %d\n", cpu);
		return -1;
	}

	if (do_core_perf_limit_reasons) {
		get_msr(cpu, MSR_CORE_PERF_LIMIT_REASONS, &msr);
		fprintf(outf, "cpu%d: MSR_CORE_PERF_LIMIT_REASONS, 0x%08llx", cpu, msr);
		fprintf(outf, " (Active: %s%s%s%s%s%s%s%s%s%s%s%s%s%s)",
			(msr & (1ULL << 15)) ? "bit15, " : "",
			(msr & (1ULL << 14)) ? "bit14, " : "",
			(msr & (1ULL << 13)) ? "Transitions, " : "",
			(msr & (1ULL << 12)) ? "MultiCoreTurbo, " : "",
			(msr & (1ULL << 11)) ? "PkgPwrL2, " : "",
			(msr & (1ULL << 10)) ? "PkgPwrL1, " : "",
			(msr & (1ULL << 9)) ? "CorePwr, " : "",
			(msr & (1ULL << 8)) ? "Amps, " : "",
			(msr & (1ULL << 6)) ? "VR-Therm, " : "",
			(msr & (1ULL << 5)) ? "Auto-HWP, " : "",
			(msr & (1ULL << 4)) ? "Graphics, " : "",
			(msr & (1ULL << 2)) ? "bit2, " : "",
			(msr & (1ULL << 1)) ? "ThermStatus, " : "",
			(msr & (1ULL << 0)) ? "PROCHOT, " : "");
		fprintf(outf, " (Logged: %s%s%s%s%s%s%s%s%s%s%s%s%s%s)\n",
			(msr & (1ULL << 31)) ? "bit31, " : "",
			(msr & (1ULL << 30)) ? "bit30, " : "",
			(msr & (1ULL << 29)) ? "Transitions, " : "",
			(msr & (1ULL << 28)) ? "MultiCoreTurbo, " : "",
			(msr & (1ULL << 27)) ? "PkgPwrL2, " : "",
			(msr & (1ULL << 26)) ? "PkgPwrL1, " : "",
			(msr & (1ULL << 25)) ? "CorePwr, " : "",
			(msr & (1ULL << 24)) ? "Amps, " : "",
			(msr & (1ULL << 22)) ? "VR-Therm, " : "",
			(msr & (1ULL << 21)) ? "Auto-HWP, " : "",
			(msr & (1ULL << 20)) ? "Graphics, " : "",
			(msr & (1ULL << 18)) ? "bit18, " : "",
			(msr & (1ULL << 17)) ? "ThermStatus, " : "",
			(msr & (1ULL << 16)) ? "PROCHOT, " : "");

	}
	if (do_gfx_perf_limit_reasons) {
		get_msr(cpu, MSR_GFX_PERF_LIMIT_REASONS, &msr);
		fprintf(outf, "cpu%d: MSR_GFX_PERF_LIMIT_REASONS, 0x%08llx", cpu, msr);
		fprintf(outf, " (Active: %s%s%s%s%s%s%s%s)",
			(msr & (1ULL << 0)) ? "PROCHOT, " : "",
			(msr & (1ULL << 1)) ? "ThermStatus, " : "",
			(msr & (1ULL << 4)) ? "Graphics, " : "",
			(msr & (1ULL << 6)) ? "VR-Therm, " : "",
			(msr & (1ULL << 8)) ? "Amps, " : "",
			(msr & (1ULL << 9)) ? "GFXPwr, " : "",
			(msr & (1ULL << 10)) ? "PkgPwrL1, " : "",
			(msr & (1ULL << 11)) ? "PkgPwrL2, " : "");
		fprintf(outf, " (Logged: %s%s%s%s%s%s%s%s)\n",
			(msr & (1ULL << 16)) ? "PROCHOT, " : "",
			(msr & (1ULL << 17)) ? "ThermStatus, " : "",
			(msr & (1ULL << 20)) ? "Graphics, " : "",
			(msr & (1ULL << 22)) ? "VR-Therm, " : "",
			(msr & (1ULL << 24)) ? "Amps, " : "",
			(msr & (1ULL << 25)) ? "GFXPwr, " : "",
			(msr & (1ULL << 26)) ? "PkgPwrL1, " : "",
			(msr & (1ULL << 27)) ? "PkgPwrL2, " : "");
	}
	if (do_ring_perf_limit_reasons) {
		get_msr(cpu, MSR_RING_PERF_LIMIT_REASONS, &msr);
		fprintf(outf, "cpu%d: MSR_RING_PERF_LIMIT_REASONS, 0x%08llx", cpu, msr);
		fprintf(outf, " (Active: %s%s%s%s%s%s)",
			(msr & (1ULL << 0)) ? "PROCHOT, " : "",
			(msr & (1ULL << 1)) ? "ThermStatus, " : "",
			(msr & (1ULL << 6)) ? "VR-Therm, " : "",
			(msr & (1ULL << 8)) ? "Amps, " : "",
			(msr & (1ULL << 10)) ? "PkgPwrL1, " : "",
			(msr & (1ULL << 11)) ? "PkgPwrL2, " : "");
		fprintf(outf, " (Logged: %s%s%s%s%s%s)\n",
			(msr & (1ULL << 16)) ? "PROCHOT, " : "",
			(msr & (1ULL << 17)) ? "ThermStatus, " : "",
			(msr & (1ULL << 22)) ? "VR-Therm, " : "",
			(msr & (1ULL << 24)) ? "Amps, " : "",
			(msr & (1ULL << 26)) ? "PkgPwrL1, " : "",
			(msr & (1ULL << 27)) ? "PkgPwrL2, " : "");
	}
	return 0;
}

2829 2830 2831
#define	RAPL_POWER_GRANULARITY	0x7FFF	/* 15 bit power granularity */
#define	RAPL_TIME_GRANULARITY	0x3F /* 6 bit time granularity */

2832
double get_tdp(unsigned int model)
2833 2834 2835 2836
{
	unsigned long long msr;

	if (do_rapl & RAPL_PKG_POWER_INFO)
2837
		if (!get_msr(base_cpu, MSR_PKG_POWER_INFO, &msr))
2838 2839 2840
			return ((msr >> 0) & RAPL_POWER_GRANULARITY) * rapl_power_units;

	switch (model) {
2841 2842
	case INTEL_FAM6_ATOM_SILVERMONT1:
	case INTEL_FAM6_ATOM_SILVERMONT2:
2843 2844 2845 2846 2847 2848
		return 30.0;
	default:
		return 135.0;
	}
}

2849 2850 2851 2852 2853 2854 2855 2856 2857 2858
/*
 * rapl_dram_energy_units_probe()
 * Energy units are either hard-coded, or come from RAPL Energy Unit MSR.
 */
static double
rapl_dram_energy_units_probe(int  model, double rapl_energy_units)
{
	/* only called for genuine_intel, family 6 */

	switch (model) {
2859 2860 2861 2862
	case INTEL_FAM6_HASWELL_X:	/* HSX */
	case INTEL_FAM6_BROADWELL_X:	/* BDX */
	case INTEL_FAM6_BROADWELL_XEON_D:	/* BDX-DE */
	case INTEL_FAM6_XEON_PHI_KNL:	/* KNL */
2863
	case INTEL_FAM6_XEON_PHI_KNM:
2864 2865 2866 2867 2868 2869
		return (rapl_dram_energy_units = 15.3 / 1000000);
	default:
		return (rapl_energy_units);
	}
}

2870

2871 2872 2873
/*
 * rapl_probe()
 *
2874
 * sets do_rapl, rapl_power_units, rapl_energy_units, rapl_time_units
2875 2876 2877 2878
 */
void rapl_probe(unsigned int family, unsigned int model)
{
	unsigned long long msr;
2879
	unsigned int time_unit;
2880 2881 2882 2883 2884 2885 2886 2887 2888
	double tdp;

	if (!genuine_intel)
		return;

	if (family != 6)
		return;

	switch (model) {
2889 2890 2891 2892 2893 2894 2895
	case INTEL_FAM6_SANDYBRIDGE:
	case INTEL_FAM6_IVYBRIDGE:
	case INTEL_FAM6_HASWELL_CORE:	/* HSW */
	case INTEL_FAM6_HASWELL_ULT:	/* HSW */
	case INTEL_FAM6_HASWELL_GT3E:	/* HSW */
	case INTEL_FAM6_BROADWELL_CORE:	/* BDW */
	case INTEL_FAM6_BROADWELL_GT3E:	/* BDW */
2896
		do_rapl = RAPL_PKG | RAPL_CORES | RAPL_CORE_POLICY | RAPL_GFX | RAPL_PKG_POWER_INFO;
2897 2898 2899 2900 2901 2902 2903 2904 2905
		if (rapl_joules) {
			BIC_PRESENT(BIC_Pkg_J);
			BIC_PRESENT(BIC_Cor_J);
			BIC_PRESENT(BIC_GFX_J);
		} else {
			BIC_PRESENT(BIC_PkgWatt);
			BIC_PRESENT(BIC_CorWatt);
			BIC_PRESENT(BIC_GFXWatt);
		}
2906
		break;
2907
	case INTEL_FAM6_ATOM_GOLDMONT:	/* BXT */
2908
		do_rapl = RAPL_PKG | RAPL_PKG_POWER_INFO;
2909 2910 2911 2912
		if (rapl_joules)
			BIC_PRESENT(BIC_Pkg_J);
		else
			BIC_PRESENT(BIC_PkgWatt);
2913
		break;
2914 2915 2916 2917
	case INTEL_FAM6_SKYLAKE_MOBILE:	/* SKL */
	case INTEL_FAM6_SKYLAKE_DESKTOP:	/* SKL */
	case INTEL_FAM6_KABYLAKE_MOBILE:	/* KBL */
	case INTEL_FAM6_KABYLAKE_DESKTOP:	/* KBL */
2918
		do_rapl = RAPL_PKG | RAPL_DRAM | RAPL_DRAM_PERF_STATUS | RAPL_PKG_PERF_STATUS | RAPL_PKG_POWER_INFO;
2919 2920 2921 2922 2923 2924 2925 2926 2927 2928 2929
		BIC_PRESENT(BIC_PKG__);
		BIC_PRESENT(BIC_RAM__);
		if (rapl_joules) {
			BIC_PRESENT(BIC_Pkg_J);
			BIC_PRESENT(BIC_Cor_J);
			BIC_PRESENT(BIC_RAM_J);
		} else {
			BIC_PRESENT(BIC_PkgWatt);
			BIC_PRESENT(BIC_CorWatt);
			BIC_PRESENT(BIC_RAMWatt);
		}
2930
		break;
2931 2932 2933 2934 2935
	case INTEL_FAM6_HASWELL_X:	/* HSX */
	case INTEL_FAM6_BROADWELL_X:	/* BDX */
	case INTEL_FAM6_BROADWELL_XEON_D:	/* BDX-DE */
	case INTEL_FAM6_SKYLAKE_X:	/* SKX */
	case INTEL_FAM6_XEON_PHI_KNL:	/* KNL */
2936
	case INTEL_FAM6_XEON_PHI_KNM:
2937
		do_rapl = RAPL_PKG | RAPL_DRAM | RAPL_DRAM_POWER_INFO | RAPL_DRAM_PERF_STATUS | RAPL_PKG_PERF_STATUS | RAPL_PKG_POWER_INFO;
2938 2939 2940 2941 2942 2943 2944 2945 2946
		BIC_PRESENT(BIC_PKG__);
		BIC_PRESENT(BIC_RAM__);
		if (rapl_joules) {
			BIC_PRESENT(BIC_Pkg_J);
			BIC_PRESENT(BIC_RAM_J);
		} else {
			BIC_PRESENT(BIC_PkgWatt);
			BIC_PRESENT(BIC_RAMWatt);
		}
L
Len Brown 已提交
2947
		break;
2948 2949
	case INTEL_FAM6_SANDYBRIDGE_X:
	case INTEL_FAM6_IVYBRIDGE_X:
2950
		do_rapl = RAPL_PKG | RAPL_CORES | RAPL_CORE_POLICY | RAPL_DRAM | RAPL_DRAM_POWER_INFO | RAPL_PKG_PERF_STATUS | RAPL_DRAM_PERF_STATUS | RAPL_PKG_POWER_INFO;
2951 2952 2953 2954 2955 2956 2957 2958 2959 2960 2961
		BIC_PRESENT(BIC_PKG__);
		BIC_PRESENT(BIC_RAM__);
		if (rapl_joules) {
			BIC_PRESENT(BIC_Pkg_J);
			BIC_PRESENT(BIC_Cor_J);
			BIC_PRESENT(BIC_RAM_J);
		} else {
			BIC_PRESENT(BIC_PkgWatt);
			BIC_PRESENT(BIC_CorWatt);
			BIC_PRESENT(BIC_RAMWatt);
		}
2962
		break;
2963 2964
	case INTEL_FAM6_ATOM_SILVERMONT1:	/* BYT */
	case INTEL_FAM6_ATOM_SILVERMONT2:	/* AVN */
2965
		do_rapl = RAPL_PKG | RAPL_CORES;
2966 2967 2968 2969 2970 2971 2972
		if (rapl_joules) {
			BIC_PRESENT(BIC_Pkg_J);
			BIC_PRESENT(BIC_Cor_J);
		} else {
			BIC_PRESENT(BIC_PkgWatt);
			BIC_PRESENT(BIC_CorWatt);
		}
2973
		break;
2974
	case INTEL_FAM6_ATOM_DENVERTON:	/* DNV */
2975
		do_rapl = RAPL_PKG | RAPL_DRAM | RAPL_DRAM_POWER_INFO | RAPL_DRAM_PERF_STATUS | RAPL_PKG_PERF_STATUS | RAPL_PKG_POWER_INFO | RAPL_CORES_ENERGY_STATUS;
2976 2977 2978 2979 2980 2981 2982 2983 2984 2985 2986
		BIC_PRESENT(BIC_PKG__);
		BIC_PRESENT(BIC_RAM__);
		if (rapl_joules) {
			BIC_PRESENT(BIC_Pkg_J);
			BIC_PRESENT(BIC_Cor_J);
			BIC_PRESENT(BIC_RAM_J);
		} else {
			BIC_PRESENT(BIC_PkgWatt);
			BIC_PRESENT(BIC_CorWatt);
			BIC_PRESENT(BIC_RAMWatt);
		}
2987
		break;
2988 2989 2990 2991 2992
	default:
		return;
	}

	/* units on package 0, verify later other packages match */
2993
	if (get_msr(base_cpu, MSR_RAPL_POWER_UNIT, &msr))
2994 2995 2996
		return;

	rapl_power_units = 1.0 / (1 << (msr & 0xF));
2997
	if (model == INTEL_FAM6_ATOM_SILVERMONT1)
2998 2999 3000
		rapl_energy_units = 1.0 * (1 << (msr >> 8 & 0x1F)) / 1000000;
	else
		rapl_energy_units = 1.0 / (1 << (msr >> 8 & 0x1F));
3001

3002 3003
	rapl_dram_energy_units = rapl_dram_energy_units_probe(model, rapl_energy_units);

3004 3005 3006
	time_unit = msr >> 16 & 0xF;
	if (time_unit == 0)
		time_unit = 0xA;
3007

3008
	rapl_time_units = 1.0 / (1 << (time_unit));
3009

3010
	tdp = get_tdp(model);
3011

3012
	rapl_joule_counter_range = 0xFFFFFFFF * rapl_energy_units / tdp;
3013
	if (debug)
3014
		fprintf(outf, "RAPL: %.0f sec. Joule Counter Range, at %.0f Watts\n", rapl_joule_counter_range, tdp);
3015 3016 3017 3018

	return;
}

3019
void perf_limit_reasons_probe(unsigned int family, unsigned int model)
3020 3021 3022 3023 3024 3025 3026 3027
{
	if (!genuine_intel)
		return;

	if (family != 6)
		return;

	switch (model) {
3028 3029 3030
	case INTEL_FAM6_HASWELL_CORE:	/* HSW */
	case INTEL_FAM6_HASWELL_ULT:	/* HSW */
	case INTEL_FAM6_HASWELL_GT3E:	/* HSW */
3031
		do_gfx_perf_limit_reasons = 1;
3032
	case INTEL_FAM6_HASWELL_X:	/* HSX */
3033 3034 3035 3036 3037 3038 3039
		do_core_perf_limit_reasons = 1;
		do_ring_perf_limit_reasons = 1;
	default:
		return;
	}
}

3040 3041 3042 3043 3044 3045 3046 3047 3048 3049 3050 3051
int print_thermal(struct thread_data *t, struct core_data *c, struct pkg_data *p)
{
	unsigned long long msr;
	unsigned int dts;
	int cpu;

	if (!(do_dts || do_ptm))
		return 0;

	cpu = t->cpu_id;

	/* DTS is per-core, no need to print for each thread */
3052
	if (!(t->flags & CPU_IS_FIRST_THREAD_IN_CORE))
3053 3054 3055
		return 0;

	if (cpu_migrate(cpu)) {
3056
		fprintf(outf, "Could not migrate to CPU %d\n", cpu);
3057 3058 3059 3060 3061 3062 3063 3064
		return -1;
	}

	if (do_ptm && (t->flags & CPU_IS_FIRST_CORE_IN_PACKAGE)) {
		if (get_msr(cpu, MSR_IA32_PACKAGE_THERM_STATUS, &msr))
			return 0;

		dts = (msr >> 16) & 0x7F;
3065
		fprintf(outf, "cpu%d: MSR_IA32_PACKAGE_THERM_STATUS: 0x%08llx (%d C)\n",
3066 3067 3068 3069 3070 3071 3072 3073
			cpu, msr, tcc_activation_temp - dts);

#ifdef	THERM_DEBUG
		if (get_msr(cpu, MSR_IA32_PACKAGE_THERM_INTERRUPT, &msr))
			return 0;

		dts = (msr >> 16) & 0x7F;
		dts2 = (msr >> 8) & 0x7F;
3074
		fprintf(outf, "cpu%d: MSR_IA32_PACKAGE_THERM_INTERRUPT: 0x%08llx (%d C, %d C)\n",
3075 3076 3077 3078 3079 3080 3081 3082 3083 3084 3085 3086 3087
			cpu, msr, tcc_activation_temp - dts, tcc_activation_temp - dts2);
#endif
	}


	if (do_dts) {
		unsigned int resolution;

		if (get_msr(cpu, MSR_IA32_THERM_STATUS, &msr))
			return 0;

		dts = (msr >> 16) & 0x7F;
		resolution = (msr >> 27) & 0xF;
3088
		fprintf(outf, "cpu%d: MSR_IA32_THERM_STATUS: 0x%08llx (%d C +/- %d)\n",
3089 3090 3091 3092 3093 3094 3095 3096
			cpu, msr, tcc_activation_temp - dts, resolution);

#ifdef THERM_DEBUG
		if (get_msr(cpu, MSR_IA32_THERM_INTERRUPT, &msr))
			return 0;

		dts = (msr >> 16) & 0x7F;
		dts2 = (msr >> 8) & 0x7F;
3097
		fprintf(outf, "cpu%d: MSR_IA32_THERM_INTERRUPT: 0x%08llx (%d C, %d C)\n",
3098 3099 3100 3101 3102 3103
			cpu, msr, tcc_activation_temp - dts, tcc_activation_temp - dts2);
#endif
	}

	return 0;
}
3104

3105 3106
void print_power_limit_msr(int cpu, unsigned long long msr, char *label)
{
3107
	fprintf(outf, "cpu%d: %s: %sabled (%f Watts, %f sec, clamp %sabled)\n",
3108 3109 3110 3111 3112 3113 3114 3115 3116 3117 3118 3119 3120 3121 3122 3123 3124 3125 3126 3127 3128 3129 3130
		cpu, label,
		((msr >> 15) & 1) ? "EN" : "DIS",
		((msr >> 0) & 0x7FFF) * rapl_power_units,
		(1.0 + (((msr >> 22) & 0x3)/4.0)) * (1 << ((msr >> 17) & 0x1F)) * rapl_time_units,
		(((msr >> 16) & 1) ? "EN" : "DIS"));

	return;
}

int print_rapl(struct thread_data *t, struct core_data *c, struct pkg_data *p)
{
	unsigned long long msr;
	int cpu;

	if (!do_rapl)
		return 0;

	/* RAPL counters are per package, so print only for 1st thread/package */
	if (!(t->flags & CPU_IS_FIRST_THREAD_IN_CORE) || !(t->flags & CPU_IS_FIRST_CORE_IN_PACKAGE))
		return 0;

	cpu = t->cpu_id;
	if (cpu_migrate(cpu)) {
3131
		fprintf(outf, "Could not migrate to CPU %d\n", cpu);
3132 3133 3134 3135 3136 3137
		return -1;
	}

	if (get_msr(cpu, MSR_RAPL_POWER_UNIT, &msr))
		return -1;

3138
	if (debug) {
3139
		fprintf(outf, "cpu%d: MSR_RAPL_POWER_UNIT: 0x%08llx "
3140
			"(%f Watts, %f Joules, %f sec.)\n", cpu, msr,
3141
			rapl_power_units, rapl_energy_units, rapl_time_units);
3142
	}
3143 3144
	if (do_rapl & RAPL_PKG_POWER_INFO) {

3145 3146 3147 3148
		if (get_msr(cpu, MSR_PKG_POWER_INFO, &msr))
                	return -5;


3149
		fprintf(outf, "cpu%d: MSR_PKG_POWER_INFO: 0x%08llx (%.0f W TDP, RAPL %.0f - %.0f W, %f sec.)\n",
3150 3151 3152 3153 3154 3155
			cpu, msr,
			((msr >>  0) & RAPL_POWER_GRANULARITY) * rapl_power_units,
			((msr >> 16) & RAPL_POWER_GRANULARITY) * rapl_power_units,
			((msr >> 32) & RAPL_POWER_GRANULARITY) * rapl_power_units,
			((msr >> 48) & RAPL_TIME_GRANULARITY) * rapl_time_units);

3156 3157 3158
	}
	if (do_rapl & RAPL_PKG) {

3159 3160 3161
		if (get_msr(cpu, MSR_PKG_POWER_LIMIT, &msr))
			return -9;

3162
		fprintf(outf, "cpu%d: MSR_PKG_POWER_LIMIT: 0x%08llx (%slocked)\n",
3163 3164 3165
			cpu, msr, (msr >> 63) & 1 ? "": "UN");

		print_power_limit_msr(cpu, msr, "PKG Limit #1");
3166
		fprintf(outf, "cpu%d: PKG Limit #2: %sabled (%f Watts, %f* sec, clamp %sabled)\n",
3167 3168 3169 3170 3171 3172 3173
			cpu,
			((msr >> 47) & 1) ? "EN" : "DIS",
			((msr >> 32) & 0x7FFF) * rapl_power_units,
			(1.0 + (((msr >> 54) & 0x3)/4.0)) * (1 << ((msr >> 49) & 0x1F)) * rapl_time_units,
			((msr >> 48) & 1) ? "EN" : "DIS");
	}

3174
	if (do_rapl & RAPL_DRAM_POWER_INFO) {
3175 3176 3177
		if (get_msr(cpu, MSR_DRAM_POWER_INFO, &msr))
                	return -6;

3178
		fprintf(outf, "cpu%d: MSR_DRAM_POWER_INFO,: 0x%08llx (%.0f W TDP, RAPL %.0f - %.0f W, %f sec.)\n",
3179 3180 3181 3182 3183
			cpu, msr,
			((msr >>  0) & RAPL_POWER_GRANULARITY) * rapl_power_units,
			((msr >> 16) & RAPL_POWER_GRANULARITY) * rapl_power_units,
			((msr >> 32) & RAPL_POWER_GRANULARITY) * rapl_power_units,
			((msr >> 48) & RAPL_TIME_GRANULARITY) * rapl_time_units);
3184 3185
	}
	if (do_rapl & RAPL_DRAM) {
3186 3187
		if (get_msr(cpu, MSR_DRAM_POWER_LIMIT, &msr))
			return -9;
3188
		fprintf(outf, "cpu%d: MSR_DRAM_POWER_LIMIT: 0x%08llx (%slocked)\n",
3189 3190 3191 3192
				cpu, msr, (msr >> 31) & 1 ? "": "UN");

		print_power_limit_msr(cpu, msr, "DRAM Limit");
	}
3193
	if (do_rapl & RAPL_CORE_POLICY) {
3194
		if (debug) {
3195 3196 3197
			if (get_msr(cpu, MSR_PP0_POLICY, &msr))
				return -7;

3198
			fprintf(outf, "cpu%d: MSR_PP0_POLICY: %lld\n", cpu, msr & 0xF);
3199 3200
		}
	}
3201
	if (do_rapl & RAPL_CORES_POWER_LIMIT) {
3202
		if (debug) {
3203 3204
			if (get_msr(cpu, MSR_PP0_POWER_LIMIT, &msr))
				return -9;
3205
			fprintf(outf, "cpu%d: MSR_PP0_POWER_LIMIT: 0x%08llx (%slocked)\n",
3206 3207 3208 3209 3210
					cpu, msr, (msr >> 31) & 1 ? "": "UN");
			print_power_limit_msr(cpu, msr, "Cores Limit");
		}
	}
	if (do_rapl & RAPL_GFX) {
3211
		if (debug) {
3212 3213 3214
			if (get_msr(cpu, MSR_PP1_POLICY, &msr))
				return -8;

3215
			fprintf(outf, "cpu%d: MSR_PP1_POLICY: %lld\n", cpu, msr & 0xF);
3216 3217 3218

			if (get_msr(cpu, MSR_PP1_POWER_LIMIT, &msr))
				return -9;
3219
			fprintf(outf, "cpu%d: MSR_PP1_POWER_LIMIT: 0x%08llx (%slocked)\n",
3220 3221 3222 3223 3224 3225 3226
					cpu, msr, (msr >> 31) & 1 ? "": "UN");
			print_power_limit_msr(cpu, msr, "GFX Limit");
		}
	}
	return 0;
}

3227 3228 3229 3230 3231 3232 3233
/*
 * SNB adds support for additional MSRs:
 *
 * MSR_PKG_C7_RESIDENCY            0x000003fa
 * MSR_CORE_C7_RESIDENCY           0x000003fe
 * MSR_PKG_C2_RESIDENCY            0x0000060d
 */
L
Len Brown 已提交
3234

3235
int has_snb_msrs(unsigned int family, unsigned int model)
L
Len Brown 已提交
3236 3237 3238 3239 3240
{
	if (!genuine_intel)
		return 0;

	switch (model) {
3241 3242 3243 3244 3245 3246 3247 3248 3249 3250 3251 3252 3253 3254 3255 3256 3257 3258
	case INTEL_FAM6_SANDYBRIDGE:
	case INTEL_FAM6_SANDYBRIDGE_X:
	case INTEL_FAM6_IVYBRIDGE:	/* IVB */
	case INTEL_FAM6_IVYBRIDGE_X:	/* IVB Xeon */
	case INTEL_FAM6_HASWELL_CORE:	/* HSW */
	case INTEL_FAM6_HASWELL_X:	/* HSW */
	case INTEL_FAM6_HASWELL_ULT:	/* HSW */
	case INTEL_FAM6_HASWELL_GT3E:	/* HSW */
	case INTEL_FAM6_BROADWELL_CORE:	/* BDW */
	case INTEL_FAM6_BROADWELL_GT3E:	/* BDW */
	case INTEL_FAM6_BROADWELL_X:	/* BDX */
	case INTEL_FAM6_BROADWELL_XEON_D:	/* BDX-DE */
	case INTEL_FAM6_SKYLAKE_MOBILE:	/* SKL */
	case INTEL_FAM6_SKYLAKE_DESKTOP:	/* SKL */
	case INTEL_FAM6_KABYLAKE_MOBILE:	/* KBL */
	case INTEL_FAM6_KABYLAKE_DESKTOP:	/* KBL */
	case INTEL_FAM6_SKYLAKE_X:	/* SKX */
	case INTEL_FAM6_ATOM_GOLDMONT:	/* BXT */
3259
	case INTEL_FAM6_ATOM_DENVERTON:	/* DNV */
L
Len Brown 已提交
3260 3261 3262 3263 3264
		return 1;
	}
	return 0;
}

3265 3266 3267 3268 3269 3270 3271 3272 3273 3274 3275 3276 3277 3278 3279 3280 3281 3282 3283 3284 3285
/*
 * SLV client has support for unique MSRs:
 *
 * MSR_CC6_DEMOTION_POLICY_CONFIG
 * MSR_MC6_DEMOTION_POLICY_CONFIG
 *
 * Returns 1 for genuine Intel parts whose model is in the list below,
 * 0 otherwise.  The family argument is not examined.
 */

int has_slv_msrs(unsigned int family, unsigned int model)
{
	int found = 0;

	if (genuine_intel) {
		switch (model) {
		case INTEL_FAM6_ATOM_SILVERMONT1:
		case INTEL_FAM6_ATOM_MERRIFIELD:
		case INTEL_FAM6_ATOM_MOOREFIELD:
			found = 1;
			break;
		default:
			break;
		}
	}

	return found;
}

3286 3287 3288
/*
 * HSW adds support for additional MSRs:
 *
3289 3290 3291 3292 3293 3294 3295 3296
 * MSR_PKG_C8_RESIDENCY		0x00000630
 * MSR_PKG_C9_RESIDENCY		0x00000631
 * MSR_PKG_C10_RESIDENCY	0x00000632
 *
 * MSR_PKGC8_IRTL		0x00000633
 * MSR_PKGC9_IRTL		0x00000634
 * MSR_PKGC10_IRTL		0x00000635
 *
3297 3298
 */
int has_hsw_msrs(unsigned int family, unsigned int model)
3299 3300 3301 3302 3303
{
	if (!genuine_intel)
		return 0;

	switch (model) {
3304 3305 3306 3307 3308 3309 3310
	case INTEL_FAM6_HASWELL_ULT:	/* HSW */
	case INTEL_FAM6_BROADWELL_CORE:	/* BDW */
	case INTEL_FAM6_SKYLAKE_MOBILE:	/* SKL */
	case INTEL_FAM6_SKYLAKE_DESKTOP:	/* SKL */
	case INTEL_FAM6_KABYLAKE_MOBILE:	/* KBL */
	case INTEL_FAM6_KABYLAKE_DESKTOP:	/* KBL */
	case INTEL_FAM6_ATOM_GOLDMONT:	/* BXT */
3311 3312 3313 3314 3315 3316 3317 3318 3319 3320 3321 3322 3323 3324 3325 3326 3327 3328 3329
		return 1;
	}
	return 0;
}

/*
 * SKL adds support for additional MSRS:
 *
 * MSR_PKG_WEIGHTED_CORE_C0_RES    0x00000658
 * MSR_PKG_ANY_CORE_C0_RES         0x00000659
 * MSR_PKG_ANY_GFXE_C0_RES         0x0000065A
 * MSR_PKG_BOTH_CORE_GFXE_C0_RES   0x0000065B
 */
int has_skl_msrs(unsigned int family, unsigned int model)
{
	if (!genuine_intel)
		return 0;

	switch (model) {
3330 3331 3332 3333
	case INTEL_FAM6_SKYLAKE_MOBILE:	/* SKL */
	case INTEL_FAM6_SKYLAKE_DESKTOP:	/* SKL */
	case INTEL_FAM6_KABYLAKE_MOBILE:	/* KBL */
	case INTEL_FAM6_KABYLAKE_DESKTOP:	/* KBL */
3334 3335 3336 3337 3338 3339
		return 1;
	}
	return 0;
}


3340

3341 3342 3343 3344 3345
int is_slm(unsigned int family, unsigned int model)
{
	if (!genuine_intel)
		return 0;
	switch (model) {
3346 3347
	case INTEL_FAM6_ATOM_SILVERMONT1:	/* BYT */
	case INTEL_FAM6_ATOM_SILVERMONT2:	/* AVN */
3348 3349 3350 3351 3352
		return 1;
	}
	return 0;
}

3353 3354 3355 3356 3357
int is_knl(unsigned int family, unsigned int model)
{
	if (!genuine_intel)
		return 0;
	switch (model) {
3358
	case INTEL_FAM6_XEON_PHI_KNL:	/* KNL */
3359
	case INTEL_FAM6_XEON_PHI_KNM:
3360 3361 3362 3363 3364
		return 1;
	}
	return 0;
}

3365 3366 3367 3368 3369 3370 3371
/*
 * Returns the APERF/MPERF multiplier: 1024 when is_knl() matches,
 * 1 for everything else.
 */
unsigned int get_aperf_mperf_multiplier(unsigned int family, unsigned int model)
{
	return is_knl(family, model) ? 1024 : 1;
}

3372 3373 3374 3375 3376 3377 3378 3379 3380
#define SLM_BCLK_FREQS 5
double slm_freq_table[SLM_BCLK_FREQS] = { 83.3, 100.0, 133.3, 116.7, 80.0};

double slm_bclk(void)
{
	unsigned long long msr = 3;
	unsigned int i;
	double freq;

3381
	if (get_msr(base_cpu, MSR_FSB_FREQ, &msr))
3382
		fprintf(outf, "SLM BCLK: unknown\n");
3383 3384 3385

	i = msr & 0xf;
	if (i >= SLM_BCLK_FREQS) {
3386
		fprintf(outf, "SLM BCLK[%d] invalid\n", i);
3387
		i = 3;
3388 3389 3390
	}
	freq = slm_freq_table[i];

3391 3392
	if (debug)
		fprintf(outf, "SLM BCLK: %.1f Mhz\n", freq);
3393 3394 3395 3396

	return freq;
}

L
Len Brown 已提交
3397 3398
/*
 * discover_bclk()
 *
 * Return the bus clock: 100.00 when has_snb_msrs() or is_knl() matches,
 * the slm_bclk() lookup when is_slm() matches, 133.33 otherwise.
 */
double discover_bclk(unsigned int family, unsigned int model)
{
	if (has_snb_msrs(family, model) || is_knl(family, model))
		return 100.00;

	if (is_slm(family, model))
		return slm_bclk();

	return 133.33;
}

3407 3408 3409 3410 3411 3412 3413 3414 3415 3416 3417 3418 3419 3420 3421 3422 3423 3424 3425 3426 3427 3428 3429 3430 3431 3432 3433 3434
/*
 * MSR_IA32_TEMPERATURE_TARGET indicates the temperature where
 * the Thermal Control Circuit (TCC) activates.
 * This is usually equal to tjMax.
 *
 * Older processors do not have this MSR, so there we guess,
 * but also allow cmdline over-ride with -T.
 *
 * Several MSR temperature values are in units of degrees-C
 * below this value, including the Digital Thermal Sensor (DTS),
 * Package Thermal Management Sensor (PTM), and thermal event thresholds.
 */
int set_temperature_target(struct thread_data *t, struct core_data *c, struct pkg_data *p)
{
	unsigned long long msr;
	unsigned int target_c_local;
	int cpu;

	/* tcc_activation_temp is used only for dts or ptm */
	if (!(do_dts || do_ptm))
		return 0;

	/* this is a per-package concept */
	if (!(t->flags & CPU_IS_FIRST_THREAD_IN_CORE) || !(t->flags & CPU_IS_FIRST_CORE_IN_PACKAGE))
		return 0;

	cpu = t->cpu_id;
	if (cpu_migrate(cpu)) {
3435
		fprintf(outf, "Could not migrate to CPU %d\n", cpu);
3436 3437 3438 3439 3440
		return -1;
	}

	if (tcc_activation_temp_override != 0) {
		tcc_activation_temp = tcc_activation_temp_override;
3441
		fprintf(outf, "cpu%d: Using cmdline TCC Target (%d C)\n",
3442 3443 3444 3445 3446
			cpu, tcc_activation_temp);
		return 0;
	}

	/* Temperature Target MSR is Nehalem and newer only */
3447
	if (!do_nhm_platform_info)
3448 3449
		goto guess;

3450
	if (get_msr(base_cpu, MSR_IA32_TEMPERATURE_TARGET, &msr))
3451 3452
		goto guess;

3453
	target_c_local = (msr >> 16) & 0xFF;
3454

3455
	if (debug)
3456
		fprintf(outf, "cpu%d: MSR_IA32_TEMPERATURE_TARGET: 0x%08llx (%d C)\n",
3457 3458
			cpu, msr, target_c_local);

3459
	if (!target_c_local)
3460 3461 3462 3463 3464 3465 3466 3467
		goto guess;

	tcc_activation_temp = target_c_local;

	return 0;

guess:
	tcc_activation_temp = TJMAX_DEFAULT;
3468
	fprintf(outf, "cpu%d: Guessing tjMax %d C, Please use -T to specify\n",
3469 3470 3471 3472
		cpu, tcc_activation_temp);

	return 0;
}
3473

3474 3475 3476 3477 3478 3479 3480 3481 3482 3483 3484
/*
 * Print MSR_IA32_FEATURE_CONTROL from base_cpu with its lock bit and
 * bit 18 (shown as "SGX") decoded.  Silent if the MSR cannot be read.
 */
void decode_feature_control_msr(void)
{
	unsigned long long msr;
	const char *lock_prefix;
	const char *sgx;

	if (get_msr(base_cpu, MSR_IA32_FEATURE_CONTROL, &msr))
		return;

	lock_prefix = (msr & FEATURE_CONTROL_LOCKED) ? "" : "UN-";
	sgx = (msr & (1 << 18)) ? "SGX" : "";

	fprintf(outf, "cpu%d: MSR_IA32_FEATURE_CONTROL: 0x%08llx (%sLocked %s)\n",
		base_cpu, msr, lock_prefix, sgx);
}

3485 3486 3487 3488 3489
void decode_misc_enable_msr(void)
{
	unsigned long long msr;

	if (!get_msr(base_cpu, MSR_IA32_MISC_ENABLE, &msr))
3490
		fprintf(outf, "cpu%d: MSR_IA32_MISC_ENABLE: 0x%08llx (%s %s %s)\n",
3491 3492 3493 3494 3495 3496
			base_cpu, msr,
			msr & (1 << 3) ? "TCC" : "",
			msr & (1 << 16) ? "EIST" : "",
			msr & (1 << 18) ? "MONITOR" : "");
}

3497 3498 3499 3500 3501 3502 3503 3504 3505 3506 3507 3508 3509 3510
/*
 * Decode MSR_MISC_PWR_MGMT
 *
 * Decode the bits according to the Nehalem documentation
 * bit[0] seems to continue to have same meaning going forward
 * bit[1] less so...
 */
void decode_misc_pwr_mgmt_msr(void)
{
	unsigned long long msr;

	if (!do_nhm_platform_info)
		return;

3511 3512 3513
	if (no_MSR_MISC_PWR_MGMT)
		return;

3514
	if (!get_msr(base_cpu, MSR_MISC_PWR_MGMT, &msr))
3515
		fprintf(outf, "cpu%d: MSR_MISC_PWR_MGMT: 0x%08llx (%sable-EIST_Coordination %sable-EPB %sable-OOB)\n",
3516 3517
			base_cpu, msr,
			msr & (1 << 0) ? "DIS" : "EN",
3518 3519
			msr & (1 << 1) ? "EN" : "DIS",
			msr & (1 << 8) ? "EN" : "DIS");
3520
}
3521 3522 3523 3524 3525 3526 3527 3528 3529 3530 3531 3532 3533 3534 3535 3536 3537 3538
/*
 * Decode MSR_CC6_DEMOTION_POLICY_CONFIG, MSR_MC6_DEMOTION_POLICY_CONFIG
 *
 * These MSRs are present on Silvermont processors,
 * Intel Atom processor E3000 series (Baytrail), and friends.
 *
 * Each MSR is read on base_cpu and printed independently; one that
 * cannot be read is silently skipped.  Bit 0 is shown as EN/DIS.
 */
void decode_c6_demotion_policy_msr(void)
{
	unsigned long long msr;

	if (get_msr(base_cpu, MSR_CC6_DEMOTION_POLICY_CONFIG, &msr) == 0) {
		const char *state = (msr & (1 << 0)) ? "EN" : "DIS";

		fprintf(outf, "cpu%d: MSR_CC6_DEMOTION_POLICY_CONFIG: 0x%08llx (%sable-CC6-Demotion)\n",
			base_cpu, msr, state);
	}

	if (get_msr(base_cpu, MSR_MC6_DEMOTION_POLICY_CONFIG, &msr) == 0) {
		const char *state = (msr & (1 << 0)) ? "EN" : "DIS";

		fprintf(outf, "cpu%d: MSR_MC6_DEMOTION_POLICY_CONFIG: 0x%08llx (%sable-MC6-Demotion)\n",
			base_cpu, msr, state);
	}
}
3539

3540
void process_cpuid()
L
Len Brown 已提交
3541
{
3542
	unsigned int eax, ebx, ecx, edx, max_level, max_extended_level;
L
Len Brown 已提交
3543 3544 3545 3546
	unsigned int fms, family, model, stepping;

	eax = ebx = ecx = edx = 0;

3547
	__cpuid(0, max_level, ebx, ecx, edx);
L
Len Brown 已提交
3548 3549 3550 3551

	if (ebx == 0x756e6547 && edx == 0x49656e69 && ecx == 0x6c65746e)
		genuine_intel = 1;

3552
	if (debug)
3553
		fprintf(outf, "CPUID(0): %.4s%.4s%.4s ",
L
Len Brown 已提交
3554 3555
			(char *)&ebx, (char *)&edx, (char *)&ecx);

3556
	__cpuid(1, fms, ebx, ecx, edx);
L
Len Brown 已提交
3557 3558 3559 3560 3561 3562
	family = (fms >> 8) & 0xf;
	model = (fms >> 4) & 0xf;
	stepping = fms & 0xf;
	if (family == 6 || family == 0xf)
		model += ((fms >> 16) & 0xf) << 4;

3563
	if (debug) {
3564
		fprintf(outf, "%d CPUID levels; family:model:stepping 0x%x:%x:%x (%d:%d:%d)\n",
L
Len Brown 已提交
3565
			max_level, family, model, stepping, family, model, stepping);
3566
		fprintf(outf, "CPUID(1): %s %s %s %s %s %s %s %s %s\n",
3567 3568
			ecx & (1 << 0) ? "SSE3" : "-",
			ecx & (1 << 3) ? "MONITOR" : "-",
3569
			ecx & (1 << 6) ? "SMX" : "-",
3570 3571 3572 3573 3574 3575 3576
			ecx & (1 << 7) ? "EIST" : "-",
			ecx & (1 << 8) ? "TM2" : "-",
			edx & (1 << 4) ? "TSC" : "-",
			edx & (1 << 5) ? "MSR" : "-",
			edx & (1 << 22) ? "ACPI-TM" : "-",
			edx & (1 << 29) ? "TM" : "-");
	}
L
Len Brown 已提交
3577

3578 3579
	if (!(edx & (1 << 5)))
		errx(1, "CPUID: no MSR");
L
Len Brown 已提交
3580 3581 3582 3583 3584 3585 3586

	/*
	 * check max extended function levels of CPUID.
	 * This is needed to check for invariant TSC.
	 * This check is valid for both Intel and AMD.
	 */
	ebx = ecx = edx = 0;
3587
	__cpuid(0x80000000, max_extended_level, ebx, ecx, edx);
L
Len Brown 已提交
3588

3589
	if (max_extended_level >= 0x80000007) {
L
Len Brown 已提交
3590

3591 3592 3593 3594
		/*
		 * Non-Stop TSC is advertised by CPUID.EAX=0x80000007: EDX.bit8
		 * this check is valid for both Intel and AMD
		 */
3595
		__cpuid(0x80000007, eax, ebx, ecx, edx);
3596 3597
		has_invariant_tsc = edx & (1 << 8);
	}
L
Len Brown 已提交
3598 3599 3600 3601 3602 3603

	/*
	 * APERF/MPERF is advertised by CPUID.EAX=0x6: ECX.bit0
	 * this check is valid for both Intel and AMD
	 */

3604
	__cpuid(0x6, eax, ebx, ecx, edx);
3605
	has_aperf = ecx & (1 << 0);
3606 3607 3608 3609 3610
	if (has_aperf) {
		BIC_PRESENT(BIC_Avg_MHz);
		BIC_PRESENT(BIC_Busy);
		BIC_PRESENT(BIC_Bzy_MHz);
	}
3611
	do_dts = eax & (1 << 0);
3612 3613
	if (do_dts)
		BIC_PRESENT(BIC_CoreTmp);
3614
	do_ptm = eax & (1 << 6);
3615 3616
	if (do_ptm)
		BIC_PRESENT(BIC_PkgTmp);
3617 3618 3619 3620 3621
	has_hwp = eax & (1 << 7);
	has_hwp_notify = eax & (1 << 8);
	has_hwp_activity_window = eax & (1 << 9);
	has_hwp_epp = eax & (1 << 10);
	has_hwp_pkg = eax & (1 << 11);
3622 3623
	has_epb = ecx & (1 << 3);

3624
	if (debug)
3625
		fprintf(outf, "CPUID(6): %sAPERF, %sDTS, %sPTM, %sHWP, "
3626 3627 3628 3629 3630 3631 3632 3633 3634 3635
			"%sHWPnotify, %sHWPwindow, %sHWPepp, %sHWPpkg, %sEPB\n",
			has_aperf ? "" : "No-",
			do_dts ? "" : "No-",
			do_ptm ? "" : "No-",
			has_hwp ? "" : "No-",
			has_hwp_notify ? "" : "No-",
			has_hwp_activity_window ? "" : "No-",
			has_hwp_epp ? "" : "No-",
			has_hwp_pkg ? "" : "No-",
			has_epb ? "" : "No-");
L
Len Brown 已提交
3636

3637 3638 3639
	if (debug)
		decode_misc_enable_msr();

3640
	if (max_level >= 0x7 && debug) {
3641
		int has_sgx;
L
Len Brown 已提交
3642

3643 3644 3645 3646 3647 3648 3649 3650 3651 3652 3653
		ecx = 0;

		__cpuid_count(0x7, 0, eax, ebx, ecx, edx);

		has_sgx = ebx & (1 << 2);
		fprintf(outf, "CPUID(7): %sSGX\n", has_sgx ? "" : "No-");

		if (has_sgx)
			decode_feature_control_msr();
	}

3654
	if (max_level >= 0x15) {
3655 3656 3657 3658 3659 3660 3661
		unsigned int eax_crystal;
		unsigned int ebx_tsc;

		/*
		 * CPUID 15H TSC/Crystal ratio, possibly Crystal Hz
		 */
		eax_crystal = ebx_tsc = crystal_hz = edx = 0;
3662
		__cpuid(0x15, eax_crystal, ebx_tsc, crystal_hz, edx);
3663 3664 3665 3666

		if (ebx_tsc != 0) {

			if (debug && (ebx != 0))
3667
				fprintf(outf, "CPUID(0x15): eax_crystal: %d ebx_tsc: %d ecx_crystal_hz: %d\n",
3668 3669 3670 3671
					eax_crystal, ebx_tsc, crystal_hz);

			if (crystal_hz == 0)
				switch(model) {
3672 3673 3674 3675
				case INTEL_FAM6_SKYLAKE_MOBILE:	/* SKL */
				case INTEL_FAM6_SKYLAKE_DESKTOP:	/* SKL */
				case INTEL_FAM6_KABYLAKE_MOBILE:	/* KBL */
				case INTEL_FAM6_KABYLAKE_DESKTOP:	/* KBL */
3676 3677
					crystal_hz = 24000000;	/* 24.0 MHz */
					break;
3678
				case INTEL_FAM6_SKYLAKE_X:	/* SKX */
3679
				case INTEL_FAM6_ATOM_DENVERTON:	/* DNV */
3680 3681
					crystal_hz = 25000000;	/* 25.0 MHz */
					break;
3682
				case INTEL_FAM6_ATOM_GOLDMONT:	/* BXT */
3683
					crystal_hz = 19200000;	/* 19.2 MHz */
3684 3685 3686 3687 3688 3689 3690 3691
					break;
				default:
					crystal_hz = 0;
			}

			if (crystal_hz) {
				tsc_hz =  (unsigned long long) crystal_hz * ebx_tsc / eax_crystal;
				if (debug)
3692
					fprintf(outf, "TSC: %lld MHz (%d Hz * %d / %d / 1000000)\n",
3693 3694 3695 3696
						tsc_hz / 1000000, crystal_hz, ebx_tsc,  eax_crystal);
			}
		}
	}
3697 3698 3699 3700 3701 3702 3703 3704
	if (max_level >= 0x16) {
		unsigned int base_mhz, max_mhz, bus_mhz, edx;

		/*
		 * CPUID 16H Base MHz, Max MHz, Bus MHz
		 */
		base_mhz = max_mhz = bus_mhz = edx = 0;

3705
		__cpuid(0x16, base_mhz, max_mhz, bus_mhz, edx);
3706
		if (debug)
3707
			fprintf(outf, "CPUID(0x16): base_mhz: %d max_mhz: %d bus_mhz: %d\n",
3708 3709
				base_mhz, max_mhz, bus_mhz);
	}
3710

3711 3712 3713
	if (has_aperf)
		aperf_mperf_multiplier = get_aperf_mperf_multiplier(family, model);

3714 3715 3716 3717 3718 3719 3720 3721 3722 3723
	BIC_PRESENT(BIC_IRQ);
	BIC_PRESENT(BIC_TSC_MHz);

	if (probe_nhm_msrs(family, model)) {
		do_nhm_platform_info = 1;
		BIC_PRESENT(BIC_CPU_c1);
		BIC_PRESENT(BIC_CPU_c3);
		BIC_PRESENT(BIC_CPU_c6);
		BIC_PRESENT(BIC_SMI);
	}
3724
	do_snb_cstates = has_snb_msrs(family, model);
3725 3726 3727 3728

	if (do_snb_cstates)
		BIC_PRESENT(BIC_CPU_c7);

3729
	do_irtl_snb = has_snb_msrs(family, model);
3730 3731 3732 3733
	do_pc2 = do_snb_cstates && (pkg_cstate_limit >= PCL__2);
	do_pc3 = (pkg_cstate_limit >= PCL__3);
	do_pc6 = (pkg_cstate_limit >= PCL__6);
	do_pc7 = do_snb_cstates && (pkg_cstate_limit >= PCL__7);
3734
	do_c8_c9_c10 = has_hsw_msrs(family, model);
3735
	do_irtl_hsw = has_hsw_msrs(family, model);
3736
	do_skl_residency = has_skl_msrs(family, model);
3737
	do_slm_cstates = is_slm(family, model);
3738
	do_knl_cstates  = is_knl(family, model);
L
Len Brown 已提交
3739

3740 3741 3742
	if (debug)
		decode_misc_pwr_mgmt_msr();

3743 3744 3745
	if (debug && has_slv_msrs(family, model))
		decode_c6_demotion_policy_msr();

3746
	rapl_probe(family, model);
3747
	perf_limit_reasons_probe(family, model);
3748

3749
	if (debug)
3750
		dump_cstate_pstate_config_info(family, model);
3751

3752 3753 3754
	if (has_skl_msrs(family, model))
		calculate_tsc_tweak();

3755 3756
	if (!access("/sys/class/drm/card0/power/rc6_residency_ms", R_OK))
		BIC_PRESENT(BIC_GFX_rc6);
L
Len Brown 已提交
3757

3758 3759
	if (!access("/sys/class/graphics/fb0/device/drm/card0/gt_cur_freq_mhz", R_OK))
		BIC_PRESENT(BIC_GFXMHz);
L
Len Brown 已提交
3760

3761
	return;
L
Len Brown 已提交
3762 3763
}

3764
void help()
L
Len Brown 已提交
3765
{
3766
	fprintf(outf,
3767 3768 3769 3770 3771 3772
	"Usage: turbostat [OPTIONS][(--interval seconds) | COMMAND ...]\n"
	"\n"
	"Turbostat forks the specified COMMAND and prints statistics\n"
	"when COMMAND completes.\n"
	"If no COMMAND is specified, turbostat wakes every 5-seconds\n"
	"to print statistics, until interrupted.\n"
3773 3774
	"--add		add a counter\n"
	"		eg. --add msr0x10,u64,cpu,delta,MY_TSC\n"
3775 3776 3777
	"--debug	run in \"debug\" mode\n"
	"--interval sec	Override default 5-second measurement interval\n"
	"--help		print this help message\n"
3778
	"--out file	create or truncate \"file\" for all output\n"
3779 3780 3781
	"--version	print version information\n"
	"\n"
	"For more help, run \"man turbostat\"\n");
L
Len Brown 已提交
3782 3783 3784 3785 3786 3787 3788 3789 3790 3791 3792 3793 3794 3795 3796 3797 3798 3799 3800 3801
}


/*
 * in /dev/cpu/ return success for names that are numbers
 * ie. filter out ".", "..", "microcode".
 *
 * Returns 1 when the entry name starts with a decimal digit, 0 otherwise.
 */
int dir_filter(const struct dirent *dirp)
{
	/*
	 * isdigit() is only defined for EOF and values representable as
	 * unsigned char; a plain char may be negative for non-ASCII names.
	 */
	return isdigit((unsigned char)dirp->d_name[0]) ? 1 : 0;
}

/*
 * Stub: ignores its argument and always returns 0.
 */
int open_dev_cpu_msr(int dummy1)
{
	(void)dummy1;	/* intentionally unused */

	return 0;
}

3802 3803 3804 3805 3806 3807 3808 3809 3810 3811 3812 3813 3814 3815 3816 3817
void topology_probe()
{
	int i;
	int max_core_id = 0;
	int max_package_id = 0;
	int max_siblings = 0;
	struct cpu_topology {
		int core_id;
		int physical_package_id;
	} *cpus;

	/* Initialize num_cpus, max_cpu_num */
	topo.num_cpus = 0;
	topo.max_cpu_num = 0;
	for_all_proc_cpus(count_cpus);
	if (!summary_only && topo.num_cpus > 1)
3818
		BIC_PRESENT(BIC_CPU);
3819

3820
	if (debug > 1)
3821
		fprintf(outf, "num_cpus %d max_cpu_num %d\n", topo.num_cpus, topo.max_cpu_num);
3822 3823

	cpus = calloc(1, (topo.max_cpu_num  + 1) * sizeof(struct cpu_topology));
3824 3825
	if (cpus == NULL)
		err(1, "calloc cpus");
3826 3827 3828 3829 3830

	/*
	 * Allocate and initialize cpu_present_set
	 */
	cpu_present_set = CPU_ALLOC((topo.max_cpu_num + 1));
3831 3832
	if (cpu_present_set == NULL)
		err(3, "CPU_ALLOC");
3833 3834 3835 3836 3837 3838 3839 3840
	cpu_present_setsize = CPU_ALLOC_SIZE((topo.max_cpu_num + 1));
	CPU_ZERO_S(cpu_present_setsize, cpu_present_set);
	for_all_proc_cpus(mark_cpu_present);

	/*
	 * Allocate and initialize cpu_affinity_set
	 */
	cpu_affinity_set = CPU_ALLOC((topo.max_cpu_num + 1));
3841 3842
	if (cpu_affinity_set == NULL)
		err(3, "CPU_ALLOC");
3843 3844 3845 3846 3847 3848 3849 3850 3851 3852 3853 3854
	cpu_affinity_setsize = CPU_ALLOC_SIZE((topo.max_cpu_num + 1));
	CPU_ZERO_S(cpu_affinity_setsize, cpu_affinity_set);


	/*
	 * For online cpus
	 * find max_core_id, max_package_id
	 */
	for (i = 0; i <= topo.max_cpu_num; ++i) {
		int siblings;

		if (cpu_is_not_present(i)) {
3855
			if (debug > 1)
3856
				fprintf(outf, "cpu%d NOT PRESENT\n", i);
3857 3858 3859 3860 3861 3862 3863 3864 3865 3866 3867 3868 3869
			continue;
		}
		cpus[i].core_id = get_core_id(i);
		if (cpus[i].core_id > max_core_id)
			max_core_id = cpus[i].core_id;

		cpus[i].physical_package_id = get_physical_package_id(i);
		if (cpus[i].physical_package_id > max_package_id)
			max_package_id = cpus[i].physical_package_id;

		siblings = get_num_ht_siblings(i);
		if (siblings > max_siblings)
			max_siblings = siblings;
3870
		if (debug > 1)
3871
			fprintf(outf, "cpu %d pkg %d core %d\n",
3872 3873 3874
				i, cpus[i].physical_package_id, cpus[i].core_id);
	}
	topo.num_cores_per_pkg = max_core_id + 1;
3875
	if (debug > 1)
3876
		fprintf(outf, "max_core_id %d, sizing for %d cores per package\n",
3877
			max_core_id, topo.num_cores_per_pkg);
3878
	if (debug && !summary_only && topo.num_cores_per_pkg > 1)
3879
		BIC_PRESENT(BIC_Core);
3880 3881

	topo.num_packages = max_package_id + 1;
3882
	if (debug > 1)
3883
		fprintf(outf, "max_package_id %d, sizing for %d packages\n",
3884
			max_package_id, topo.num_packages);
3885
	if (debug && !summary_only && topo.num_packages > 1)
3886
		BIC_PRESENT(BIC_Package);
3887 3888

	topo.num_threads_per_core = max_siblings;
3889
	if (debug > 1)
3890
		fprintf(outf, "max_siblings %d\n", max_siblings);
3891 3892 3893 3894 3895 3896 3897 3898 3899 3900

	free(cpus);
}

void
allocate_counters(struct thread_data **t, struct core_data **c, struct pkg_data **p)
{
	int i;

	*t = calloc(topo.num_threads_per_core * topo.num_cores_per_pkg *
3901
		topo.num_packages, sizeof(struct thread_data));
3902 3903 3904 3905 3906 3907 3908 3909
	if (*t == NULL)
		goto error;

	for (i = 0; i < topo.num_threads_per_core *
		topo.num_cores_per_pkg * topo.num_packages; i++)
		(*t)[i].cpu_id = -1;

	*c = calloc(topo.num_cores_per_pkg * topo.num_packages,
3910
		sizeof(struct core_data));
3911 3912 3913 3914 3915 3916
	if (*c == NULL)
		goto error;

	for (i = 0; i < topo.num_cores_per_pkg * topo.num_packages; i++)
		(*c)[i].core_id = -1;

3917
	*p = calloc(topo.num_packages, sizeof(struct pkg_data));
3918 3919 3920 3921 3922 3923 3924 3925
	if (*p == NULL)
		goto error;

	for (i = 0; i < topo.num_packages; i++)
		(*p)[i].package_id = i;

	return;
error:
3926
	err(1, "calloc counters");
3927 3928 3929 3930 3931 3932 3933 3934 3935 3936 3937 3938 3939 3940 3941 3942 3943 3944 3945 3946 3947 3948 3949 3950 3951 3952 3953 3954 3955 3956 3957 3958 3959 3960 3961 3962 3963 3964 3965
}
/*
 * init_counter()
 *
 * Fill in the identity of one thread/core/package slot:
 * set the thread's cpu_id, the core's core_id and the package's package_id.
 * Thread 0 of a core is flagged CPU_IS_FIRST_THREAD_IN_CORE, and also
 * CPU_IS_FIRST_CORE_IN_PACKAGE when cpu_is_first_core_in_package() says so.
 */
void init_counter(struct thread_data *thread_base, struct core_data *core_base,
	struct pkg_data *pkg_base, int thread_num, int core_num,
	int pkg_num, int cpu_id)
{
	struct thread_data *thread = GET_THREAD(thread_base, thread_num, core_num, pkg_num);
	struct core_data *core = GET_CORE(core_base, core_num, pkg_num);
	struct pkg_data *pkg = GET_PKG(pkg_base, pkg_num);

	thread->cpu_id = cpu_id;
	core->core_id = core_num;
	pkg->package_id = pkg_num;

	/* only the first thread of a core carries the "first" flags */
	if (thread_num != 0)
		return;

	thread->flags |= CPU_IS_FIRST_THREAD_IN_CORE;
	if (cpu_is_first_core_in_package(cpu_id))
		thread->flags |= CPU_IS_FIRST_CORE_IN_PACKAGE;
}


int initialize_counters(int cpu_id)
{
	int my_thread_id, my_core_id, my_package_id;

	my_package_id = get_physical_package_id(cpu_id);
	my_core_id = get_core_id(cpu_id);
3966 3967
	my_thread_id = get_cpu_position_in_core(cpu_id);
	if (!my_thread_id)
3968 3969 3970 3971 3972 3973 3974 3975 3976
		topo.num_cores++;

	init_counter(EVEN_COUNTERS, my_thread_id, my_core_id, my_package_id, cpu_id);
	init_counter(ODD_COUNTERS, my_thread_id, my_core_id, my_package_id, cpu_id);
	return 0;
}

void allocate_output_buffer()
{
3977
	output_buffer = calloc(1, (1 + topo.num_cpus) * 1024);
3978
	outp = output_buffer;
3979 3980
	if (outp == NULL)
		err(-1, "calloc output buffer");
3981
}
3982 3983
void allocate_fd_percpu(void)
{
3984
	fd_percpu = calloc(topo.max_cpu_num + 1, sizeof(int));
3985 3986 3987
	if (fd_percpu == NULL)
		err(-1, "calloc fd_percpu");
}
3988 3989 3990 3991 3992
void allocate_irq_buffers(void)
{
	irq_column_2_cpu = calloc(topo.num_cpus, sizeof(int));
	if (irq_column_2_cpu == NULL)
		err(-1, "calloc %d", topo.num_cpus);
3993

3994
	irqs_per_cpu = calloc(topo.max_cpu_num + 1, sizeof(int));
3995
	if (irqs_per_cpu == NULL)
3996
		err(-1, "calloc %d", topo.max_cpu_num + 1);
3997
}
3998 3999 4000
void setup_all_buffers(void)
{
	topology_probe();
4001
	allocate_irq_buffers();
4002
	allocate_fd_percpu();
4003 4004 4005 4006 4007
	allocate_counters(&thread_even, &core_even, &package_even);
	allocate_counters(&thread_odd, &core_odd, &package_odd);
	allocate_output_buffer();
	for_all_proc_cpus(initialize_counters);
}
4008

4009 4010 4011 4012 4013 4014 4015
void set_base_cpu(void)
{
	base_cpu = sched_getcpu();
	if (base_cpu < 0)
		err(-ENODEV, "No valid cpus found");

	if (debug > 1)
4016
		fprintf(outf, "base_cpu = %d\n", base_cpu);
4017 4018
}

L
Len Brown 已提交
4019 4020
void turbostat_init()
{
4021 4022
	setup_all_buffers();
	set_base_cpu();
L
Len Brown 已提交
4023
	check_dev_msr();
4024
	check_permissions();
4025
	process_cpuid();
L
Len Brown 已提交
4026 4027


4028 4029 4030
	if (debug)
		for_all_cpus(print_hwp, ODD_COUNTERS);

4031
	if (debug)
4032 4033
		for_all_cpus(print_epb, ODD_COUNTERS);

4034
	if (debug)
4035 4036
		for_all_cpus(print_perf_limit, ODD_COUNTERS);

4037
	if (debug)
4038 4039 4040 4041
		for_all_cpus(print_rapl, ODD_COUNTERS);

	for_all_cpus(set_temperature_target, ODD_COUNTERS);

4042
	if (debug)
4043
		for_all_cpus(print_thermal, ODD_COUNTERS);
4044 4045 4046

	if (debug && do_irtl_snb)
		print_irtl();
L
Len Brown 已提交
4047 4048 4049 4050 4051
}

int fork_it(char **argv)
{
	pid_t child_pid;
4052
	int status;
4053

4054 4055 4056
	status = for_all_cpus(get_counters, EVEN_COUNTERS);
	if (status)
		exit(status);
4057 4058
	/* clear affinity side-effect of get_counters() */
	sched_setaffinity(0, cpu_present_setsize, cpu_present_set);
L
Len Brown 已提交
4059 4060 4061 4062 4063 4064 4065 4066 4067
	gettimeofday(&tv_even, (struct timezone *)NULL);

	child_pid = fork();
	if (!child_pid) {
		/* child */
		execvp(argv[0], argv);
	} else {

		/* parent */
4068 4069
		if (child_pid == -1)
			err(1, "fork");
L
Len Brown 已提交
4070 4071 4072

		signal(SIGINT, SIG_IGN);
		signal(SIGQUIT, SIG_IGN);
4073 4074
		if (waitpid(child_pid, &status, 0) == -1)
			err(status, "waitpid");
L
Len Brown 已提交
4075
	}
4076 4077 4078 4079 4080
	/*
	 * n.b. fork_it() does not check for errors from for_all_cpus()
	 * because re-starting is problematic when forking
	 */
	for_all_cpus(get_counters, ODD_COUNTERS);
L
Len Brown 已提交
4081 4082
	gettimeofday(&tv_odd, (struct timezone *)NULL);
	timersub(&tv_odd, &tv_even, &tv_delta);
4083 4084 4085 4086 4087 4088
	if (for_all_cpus_2(delta_cpu, ODD_COUNTERS, EVEN_COUNTERS))
		fprintf(outf, "%s: Counter reset detected\n", progname);
	else {
		compute_average(EVEN_COUNTERS);
		format_all_counters(EVEN_COUNTERS);
	}
L
Len Brown 已提交
4089

4090 4091 4092
	fprintf(outf, "%.6f sec\n", tv_delta.tv_sec + tv_delta.tv_usec/1000000.0);

	flush_output_stderr();
L
Len Brown 已提交
4093

4094
	return status;
L
Len Brown 已提交
4095 4096
}

4097 4098 4099 4100 4101 4102 4103 4104 4105 4106 4107 4108
/*
 * get_and_dump_counters()
 *
 * Read the ODD counter set on every CPU, dump it, and flush the output.
 *
 * Returns 0 on success, or the first non-zero status reported by
 * for_all_cpus(); in that case nothing is flushed.
 */
int get_and_dump_counters(void)
{
	int status;

	status = for_all_cpus(get_counters, ODD_COUNTERS);
	if (status)
		return status;

	status = for_all_cpus(dump_counters, ODD_COUNTERS);
	if (status)
		return status;

	flush_output_stdout();

	return status;
}

4114
void print_version() {
4115
	fprintf(outf, "turbostat version 4.17 1 Jan 2017"
4116 4117 4118
		" - Len Brown <lenb@kernel.org>\n");
}

4119 4120 4121 4122 4123 4124 4125 4126 4127 4128 4129 4130 4131 4132 4133 4134 4135 4136 4137 4138 4139 4140 4141
/*
 * add_counter()
 *
 * Allocate a struct msr_counter describing a user-added MSR column and
 * push it onto the head of the list matching its scope (sys.tp, sys.cp
 * or sys.pp), incrementing that scope's added-counter total.
 *
 * msr_num - MSR number to read
 * name    - column header; truncated to NAME_BYTES - 1 characters
 * width   - counter width, stored as given
 * scope   - SCOPE_CPU, SCOPE_CORE or SCOPE_PACKAGE
 * type    - counter type, stored as given
 * format  - counter format, stored as given
 *
 * Returns 0.  Exits if the allocation fails or if a scope would hold
 * more than MAX_ADDED_COUNTERS counters.
 */
int add_counter(unsigned int msr_num, char *name, unsigned int width,
	enum counter_scope scope, enum counter_type type,
	enum counter_format format)
{
	struct msr_counter *msrp;

	msrp = calloc(1, sizeof(struct msr_counter));
	if (msrp == NULL) {
		perror("calloc");
		exit(1);
	}

	msrp->msr_num = msr_num;
	/*
	 * calloc() zeroed the record, so copying at most NAME_BYTES - 1
	 * bytes always leaves the name NUL-terminated.
	 */
	strncpy(msrp->name, name, NAME_BYTES - 1);
	msrp->width = width;
	msrp->type = type;
	msrp->format = format;

	switch (scope) {

	case SCOPE_CPU:
		msrp->next = sys.tp;
		sys.tp = msrp;
		sys.added_thread_counters++;
		if (sys.added_thread_counters > MAX_ADDED_COUNTERS) {
			fprintf(stderr, "exceeded max %d added thread counters\n",
				MAX_ADDED_COUNTERS);
			exit(-1);
		}
		break;

	case SCOPE_CORE:
		msrp->next = sys.cp;
		sys.cp = msrp;
		sys.added_core_counters++;
		if (sys.added_core_counters > MAX_ADDED_COUNTERS) {
			fprintf(stderr, "exceeded max %d added core counters\n",
				MAX_ADDED_COUNTERS);
			exit(-1);
		}
		break;

	case SCOPE_PACKAGE:
		msrp->next = sys.pp;
		sys.pp = msrp;
		sys.added_package_counters++;
		if (sys.added_package_counters > MAX_ADDED_COUNTERS) {
			fprintf(stderr, "exceeded max %d added package counters\n",
				MAX_ADDED_COUNTERS);
			exit(-1);
		}
		break;
	}

	return 0;
}

/*
 * parse_add_command()
 *
 * Parse the comma-separated argument of --add and register the counter
 * it describes through add_counter().
 *
 * Each token is tested in this order and the first match wins:
 *   msr0xXXX | msrDDD            MSR number (hex or decimal) - required
 *   u32 | u64                    counter width              [default 64]
 *   cpu | core | package         scope                      [default cpu]
 *   cycles | seconds             type                       [default cycles]
 *   raw | delta | percent        format                     [default delta]
 *   anything else                column name, at most 18 characters
 *
 * Keywords are matched by prefix, so a column name that begins with a
 * keyword is consumed as that keyword.
 *
 * When no name is given a default header is built from the MSR number.
 * Prints help and exits if no MSR number was supplied or add_counter()
 * fails.
 */
void parse_add_command(char *add_command)
{
	int msr_num = 0;
	/* start empty: the default-header test below reads the first byte */
	char name_buffer[NAME_BYTES] = "";
	int width = 64;
	int fail = 0;
	enum counter_scope scope = SCOPE_CPU;
	enum counter_type type = COUNTER_CYCLES;
	enum counter_format format = FORMAT_DELTA;

	while (add_command) {

		/* %x stores through an unsigned int pointer */
		if (sscanf(add_command, "msr0x%x", (unsigned int *)&msr_num) == 1)
			goto next;

		if (sscanf(add_command, "msr%d", &msr_num) == 1)
			goto next;

		if (sscanf(add_command, "u%d", &width) == 1) {
			if ((width == 32) || (width == 64))
				goto next;
			/* unsupported width: restore the default and keep matching */
			width = 64;
		}
		if (!strncmp(add_command, "cpu", strlen("cpu"))) {
			scope = SCOPE_CPU;
			goto next;
		}
		if (!strncmp(add_command, "core", strlen("core"))) {
			scope = SCOPE_CORE;
			goto next;
		}
		if (!strncmp(add_command, "package", strlen("package"))) {
			scope = SCOPE_PACKAGE;
			goto next;
		}
		if (!strncmp(add_command, "cycles", strlen("cycles"))) {
			type = COUNTER_CYCLES;
			goto next;
		}
		if (!strncmp(add_command, "seconds", strlen("seconds"))) {
			type = COUNTER_SECONDS;
			goto next;
		}
		if (!strncmp(add_command, "raw", strlen("raw"))) {
			format = FORMAT_RAW;
			goto next;
		}
		if (!strncmp(add_command, "delta", strlen("delta"))) {
			format = FORMAT_DELTA;
			goto next;
		}
		if (!strncmp(add_command, "percent", strlen("percent"))) {
			format = FORMAT_PERCENT;
			goto next;
		}

		if (sscanf(add_command, "%18s,%*s", name_buffer) == 1) {	/* 18 < NAME_BYTES */
			char *eos;

			/* %s does not stop at ',', so cut the name there by hand */
			eos = strchr(name_buffer, ',');
			if (eos)
				*eos = '\0';
			goto next;
		}

next:
		/* advance to the token after the next comma, if any */
		add_command = strchr(add_command, ',');
		if (add_command)
			add_command++;

	}
	if (msr_num == 0) {
		fprintf(stderr, "--add: (msrDDD | msr0xXXX) required\n");
		fail++;
	}

	/* generate default column header */
	if (*name_buffer == '\0') {
		if (format == FORMAT_RAW) {
			if (width == 32)
				snprintf(name_buffer, sizeof(name_buffer), "msr%d", msr_num);
			else
				snprintf(name_buffer, sizeof(name_buffer), "MSR%d", msr_num);
		} else if (format == FORMAT_DELTA) {
			if (width == 32)
				snprintf(name_buffer, sizeof(name_buffer), "cnt%d", msr_num);
			else
				snprintf(name_buffer, sizeof(name_buffer), "CNT%d", msr_num);
		} else if (format == FORMAT_PERCENT) {
			if (width == 32)
				snprintf(name_buffer, sizeof(name_buffer), "msr%d%%", msr_num);
			else
				snprintf(name_buffer, sizeof(name_buffer), "MSR%d%%", msr_num);
		}
	}

	if (add_counter(msr_num, name_buffer, width, scope, type, format))
		fail++;

	if (fail) {
		help();
		exit(1);
	}
}
4280 4281 4282 4283 4284 4285 4286 4287 4288 4289 4290 4291 4292 4293 4294 4295 4296 4297 4298 4299 4300 4301 4302 4303 4304 4305 4306 4307 4308 4309 4310 4311 4312 4313
/*
 * Counter selection modes:
 *   SHOW_LIST - show this list of counters, hide the rest
 *   HIDE_LIST - hide this list of counters, show the rest [default]
 */
enum show_hide_mode {
	SHOW_LIST,
	HIDE_LIST
};

enum show_hide_mode global_show_hide_mode = HIDE_LIST;

/* set to 1 by parse_show_hide() once a SHOW_LIST request has been processed */
int shown;
/*
 * parse_show_hide() - apply one --show or --hide list to bic_enabled
 *
 * optarg   - counter list, translated to a bit mask by bic_lookup()
 * new_mode - SHOW_LIST for --show, anything else is handled as --hide
 */
void parse_show_hide(char *optarg, enum show_hide_mode new_mode)
{
	/*
	 * --hide: do not show those specified
	 *  every invocation just clears more bits in the enabled mask
	 */
	if (new_mode != SHOW_LIST) {
		bic_enabled &= ~bic_lookup(optarg);
		return;
	}

	/*
	 * --show: show only those specified
	 *  the first invocation replaces the enabled mask,
	 *  later invocations add to it
	 */
	if (shown)
		bic_enabled |= bic_lookup(optarg);
	else
		bic_enabled = bic_lookup(optarg);

	shown = 1;
}

L
Len Brown 已提交
4314 4315 4316
void cmdline(int argc, char **argv)
{
	int opt;
4317 4318
	int option_index = 0;
	static struct option long_options[] = {
4319
		{"add",		required_argument,	0, 'a'},
4320 4321 4322 4323
		{"Dump",	no_argument,		0, 'D'},
		{"debug",	no_argument,		0, 'd'},
		{"interval",	required_argument,	0, 'i'},
		{"help",	no_argument,		0, 'h'},
4324
		{"hide",	required_argument,	0, 'H'},	// meh, -h taken by --help
4325
		{"Joules",	no_argument,		0, 'J'},
4326
		{"out",		required_argument,	0, 'o'},
4327 4328
		{"Package",	no_argument,		0, 'p'},
		{"processor",	no_argument,		0, 'p'},
4329
		{"show",	required_argument,	0, 's'},
4330 4331 4332 4333 4334
		{"Summary",	no_argument,		0, 'S'},
		{"TCC",		required_argument,	0, 'T'},
		{"version",	no_argument,		0, 'v' },
		{0,		0,			0,  0 }
	};
L
Len Brown 已提交
4335 4336 4337

	progname = argv[0];

4338
	while ((opt = getopt_long_only(argc, argv, "+C:c:Ddhi:JM:m:o:PpST:v",
4339
				long_options, &option_index)) != -1) {
L
Len Brown 已提交
4340
		switch (opt) {
4341 4342 4343
		case 'a':
			parse_add_command(optarg);
			break;
4344
		case 'D':
4345 4346
			dump_only++;
			break;
4347 4348
		case 'd':
			debug++;
L
Len Brown 已提交
4349
			break;
4350 4351 4352
		case 'H':
			parse_show_hide(optarg, HIDE_LIST);
			break;
4353 4354 4355 4356
		case 'h':
		default:
			help();
			exit(1);
L
Len Brown 已提交
4357
		case 'i':
4358 4359 4360 4361
			{
				double interval = strtod(optarg, NULL);

				if (interval < 0.001) {
4362
					fprintf(outf, "interval %f seconds is too small\n",
4363 4364 4365 4366 4367 4368 4369
						interval);
					exit(2);
				}

				interval_ts.tv_sec = interval;
				interval_ts.tv_nsec = (interval - interval_ts.tv_sec) * 1000000000;
			}
L
Len Brown 已提交
4370
			break;
4371 4372
		case 'J':
			rapl_joules++;
4373
			break;
4374 4375 4376
		case 'o':
			outf = fopen_or_die(optarg, "w");
			break;
4377 4378 4379 4380 4381
		case 'P':
			show_pkg_only++;
			break;
		case 'p':
			show_core_only++;
L
Len Brown 已提交
4382
			break;
4383 4384 4385
		case 's':
			parse_show_hide(optarg, SHOW_LIST);
			break;
4386 4387
		case 'S':
			summary_only++;
4388 4389 4390 4391
			break;
		case 'T':
			tcc_activation_temp_override = atoi(optarg);
			break;
4392 4393 4394
		case 'v':
			print_version();
			exit(0);
4395
			break;
L
Len Brown 已提交
4396 4397 4398 4399 4400 4401
		}
	}
}

int main(int argc, char **argv)
{
4402 4403
	outf = stderr;

L
Len Brown 已提交
4404 4405
	cmdline(argc, argv);

4406 4407
	if (debug)
		print_version();
L
Len Brown 已提交
4408 4409 4410

	turbostat_init();

4411 4412 4413 4414
	/* dump counters and exit */
	if (dump_only)
		return get_and_dump_counters();

L
Len Brown 已提交
4415 4416 4417 4418 4419 4420 4421 4422 4423 4424
	/*
	 * if any params left, it must be a command to fork
	 */
	if (argc - optind)
		return fork_it(argv + optind);
	else
		turbostat_loop();

	return 0;
}