perf.h 5.1 KB
Newer Older
1 2 3
#ifndef _PERF_PERF_H
#define _PERF_PERF_H

4 5
#include <asm/unistd.h>

V
Vince Weaver 已提交
6 7 8
#if defined(__i386__)
/*
 * 32-bit x86 primitives.
 *
 * rmb():       locked add of zero to the top of the stack, with a compiler
 *              memory clobber.
 * cpu_relax(): "rep; nop" spin-wait hint.  Deliberately has no trailing
 *              semicolon so that "if (x) cpu_relax(); else ..." parses.
 */
#define rmb()		asm volatile("lock; addl $0,0(%%esp)" ::: "memory")
#define cpu_relax()	asm volatile("rep; nop" ::: "memory")
#define CPUINFO_PROC	"model name"
/* Fallback syscall number, used only when the system headers lack it. */
#ifndef __NR_perf_event_open
# define __NR_perf_event_open 336
#endif
#endif

#if defined(__x86_64__)
/*
 * 64-bit x86 primitives.
 *
 * rmb():       "lfence" with a compiler memory clobber.
 * cpu_relax(): "rep; nop" spin-wait hint.  Deliberately has no trailing
 *              semicolon so that "if (x) cpu_relax(); else ..." parses.
 */
#define rmb()		asm volatile("lfence" ::: "memory")
#define cpu_relax()	asm volatile("rep; nop" ::: "memory")
#define CPUINFO_PROC	"model name"
/* Fallback syscall number, used only when the system headers lack it. */
#ifndef __NR_perf_event_open
# define __NR_perf_event_open 298
#endif
#endif

#ifdef __powerpc__
/*
 * PowerPC primitives.  The syscall numbers come from the in-tree uapi
 * header rather than from the system headers.
 *
 * rmb():       "sync" with a compiler memory clobber.
 * cpu_relax(): compiler barrier only.  Deliberately has no trailing
 *              semicolon so that "if (x) cpu_relax(); else ..." parses.
 */
#include "../../arch/powerpc/include/uapi/asm/unistd.h"
#define rmb()		asm volatile ("sync" ::: "memory")
#define cpu_relax()	asm volatile ("" ::: "memory")
#define CPUINFO_PROC	"cpu"
#endif

31 32 33 34 35
#ifdef __s390__
/*
 * s390 primitives.
 *
 * rmb():       "bcr 15,0" with a compiler memory clobber.
 * cpu_relax(): compiler barrier only.  Deliberately has no trailing
 *              semicolon so that "if (x) cpu_relax(); else ..." parses.
 */
#define rmb()		asm volatile("bcr 15,0" ::: "memory")
#define cpu_relax()	asm volatile("" ::: "memory")
#endif

36 37 38 39 40 41 42
#ifdef __sh__
/*
 * SuperH primitives.  SH4A and SH5 builds use "synco" for rmb(); every
 * other SH variant gets a compiler barrier only.
 */
#if defined(__SH4A__) || defined(__SH5__)
# define rmb()		asm volatile("synco" ::: "memory")
#else
# define rmb()		asm volatile("" ::: "memory")
#endif
#define cpu_relax()	asm volatile("" ::: "memory")
#define CPUINFO_PROC	"cpu type"
#endif

46 47 48
#ifdef __hppa__
/*
 * PA-RISC primitives: both macros are compiler barriers only.
 * cpu_relax() deliberately has no trailing semicolon so that
 * "if (x) cpu_relax(); else ..." parses.
 */
#define rmb()		asm volatile("" ::: "memory")
#define cpu_relax()	asm volatile("" ::: "memory")
#define CPUINFO_PROC	"cpu"
#endif

J
Jens Axboe 已提交
52 53 54
#ifdef __sparc__
/* SPARC primitives: both macros are compiler barriers only. */
#define rmb()		asm volatile("":::"memory")
#define cpu_relax()	asm volatile("":::"memory")
#define CPUINFO_PROC	"cpu"
#endif

58 59 60
#ifdef __alpha__
/*
 * Alpha primitives.
 *
 * rmb():       "mb" with a compiler memory clobber.
 * cpu_relax(): compiler barrier only.
 */
#define rmb()		asm volatile("mb" ::: "memory")
#define cpu_relax()	asm volatile("" ::: "memory")
#define CPUINFO_PROC	"cpu model"
#endif

64 65 66
#ifdef __ia64__
/*
 * IA-64 primitives.
 *
 * rmb():       "mf" with a compiler memory clobber.
 * cpu_relax(): "hint @pause" with a compiler memory clobber.
 */
#define rmb()		asm volatile ("mf" ::: "memory")
#define cpu_relax()	asm volatile ("hint @pause" ::: "memory")
#define CPUINFO_PROC	"model name"
#endif

J
Jamie Iles 已提交
70 71 72 73 74
#ifdef __arm__
/*
 * Use the __kuser_memory_barrier helper in the CPU helper page. See
 * arch/arm/kernel/entry-armv.S in the kernel source for details.
 *
 * rmb() is therefore an indirect call through the fixed address
 * 0xffff0fa0 rather than an inline instruction; cpu_relax() is a
 * compiler barrier only.
 */
#define rmb()		((void(*)(void))0xffff0fa0)()
#define cpu_relax()	asm volatile("":::"memory")
#define CPUINFO_PROC	"Processor"
#endif

80 81 82 83 84
#ifdef __aarch64__
/*
 * AArch64 primitives.
 *
 * rmb():       "dmb ld" with a compiler memory clobber.
 * cpu_relax(): "yield" with a compiler memory clobber.
 *
 * NOTE(review): unlike most other architectures in this header, no
 * CPUINFO_PROC is defined here - confirm whether that is intentional.
 */
#define rmb()		asm volatile("dmb ld" ::: "memory")
#define cpu_relax()	asm volatile("yield" ::: "memory")
#endif

85 86 87 88 89 90 91 92 93
#ifdef __mips__
/*
 * MIPS primitives.
 *
 * rmb():       "sync", bracketed by ".set mips2" / ".set mips0" assembler
 *              directives, with a compiler memory clobber.
 * cpu_relax(): compiler barrier only.
 */
#define rmb()		asm volatile(					\
				".set	mips2\n\t"			\
				"sync\n\t"				\
				".set	mips0"				\
				: /* no output */			\
				: /* no input */			\
				: "memory")
#define cpu_relax()	asm volatile("" ::: "memory")
#define CPUINFO_PROC	"cpu model"
#endif

97 98 99 100 101 102
#ifdef __arc__
/*
 * ARC primitives: rmb() is a compiler barrier only, and cpu_relax()
 * simply expands to rmb().
 */
#define rmb()		asm volatile("" ::: "memory")
#define cpu_relax()	rmb()
#define CPUINFO_PROC	"Processor"
#endif

103 104 105 106 107 108
#ifdef __metag__
/* Meta primitives: both macros are compiler barriers only. */
#define rmb()		asm volatile("" ::: "memory")
#define cpu_relax()	asm volatile("" ::: "memory")
#define CPUINFO_PROC	"CPU"
#endif

109 110 111 112 113
#include <time.h>
#include <unistd.h>
#include <sys/types.h>
#include <sys/syscall.h>

114
#include <linux/perf_event.h>
115
#include "util/types.h"
116
#include <stdbool.h>
117

118
/*
 * prctl(PR_TASK_PERF_EVENTS_DISABLE) will (cheaply) disable all
 * counters in the current task.
 *
 * PR_TASK_PERF_EVENTS_ENABLE is the companion option (presumably it
 * re-enables them - confirm against the prctl documentation).
 */
#define PR_TASK_PERF_EVENTS_DISABLE   31
#define PR_TASK_PERF_EVENTS_ENABLE    32
124

125 126 127 128 129 130 131 132 133 134 135
#ifndef NSEC_PER_SEC
# define NSEC_PER_SEC			1000000000ULL
#endif

/*
 * rdclock - read CLOCK_MONOTONIC as a single nanosecond count.
 *
 * Returns tv_sec * NSEC_PER_SEC + tv_nsec for the current monotonic time,
 * or 0 if clock_gettime() fails (the timespec would otherwise be read
 * uninitialized).
 */
static inline unsigned long long rdclock(void)
{
	struct timespec ts;

	if (clock_gettime(CLOCK_MONOTONIC, &ts) != 0)
		return 0;

	/*
	 * Widen before multiplying: NSEC_PER_SEC may have been defined by
	 * another header with a narrower type than the fallback above.
	 */
	return (unsigned long long)ts.tv_sec * NSEC_PER_SEC + ts.tv_nsec;
}
136 137 138 139 140 141 142 143 144 145 146 147 148 149

/*
 * Pick up some kernel type conventions:
 *
 * __user and asmlinkage expand to nothing here, so declarations that
 * carry those annotations still compile in this userspace build.
 */
#define __user
#define asmlinkage

/* Branch hint: normalise x to 0/1 and tell the compiler to expect 0. */
#define unlikely(x)	__builtin_expect(!!(x), 0)
/*
 * min - minimum of two values, evaluating each argument exactly once.
 *
 * The otherwise unused pointer comparison makes the compiler diagnose
 * calls whose arguments have different types.  __typeof__ is used rather
 * than typeof so the macro also works in strict ISO modes (-std=c99/c11),
 * where the plain typeof keyword is not available.
 */
#define min(x, y) ({				\
	__typeof__(x) _min1 = (x);		\
	__typeof__(y) _min2 = (y);		\
	(void) (&_min1 == &_min2);		\
	_min1 < _min2 ? _min1 : _min2; })

150 151 152 153 154
/*
 * Attribute test hooks, defined outside this header.  In this file
 * sys_perf_event_open() calls test_attr__open() after the syscall whenever
 * test_attr__enabled is set, passing the syscall arguments plus the
 * returned fd.
 */
extern bool test_attr__enabled;
void test_attr__init(void);
void test_attr__open(struct perf_event_attr *attr, pid_t pid, int cpu,
		     int fd, int group_fd, unsigned long flags);

155
static inline int
156
sys_perf_event_open(struct perf_event_attr *attr,
157 158 159
		      pid_t pid, int cpu, int group_fd,
		      unsigned long flags)
{
160 161 162 163 164 165 166 167 168
	int fd;

	fd = syscall(__NR_perf_event_open, attr, pid, cpu,
		     group_fd, flags);

	if (unlikely(test_attr__enabled))
		test_attr__open(attr, pid, cpu, fd, group_fd, flags);

	return fd;
169 170
}

171 172
/* Fixed upper bounds; NOTE(review): their users are outside this header. */
#define MAX_COUNTERS			256
#define MAX_NR_CPUS			256
173

174 175 176
/*
 * Variable-length call chain: a count followed by a trailing array.
 * NOTE(review): nr is presumably the number of valid entries in ips[] -
 * confirm against the code that fills this in.
 */
struct ip_callchain {
	u64 nr;
	u64 ips[0];	/* trailing storage, sized by whoever allocates the struct */
};

179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195
/*
 * Per-branch flag bits packed into a single u64: two 1-bit flags and
 * 62 reserved bits.
 */
struct branch_flags {
	u64 mispred:1;
	u64 predicted:1;
	u64 reserved:62;
};

/*
 * One branch record: a from/to pair plus its flag bits.
 * NOTE(review): from/to are presumably source and target addresses - confirm.
 */
struct branch_entry {
	u64				from;
	u64				to;
	struct branch_flags flags;
};

/*
 * Variable-length list of branch entries: a count followed by a trailing
 * array.  NOTE(review): nr is presumably the number of valid entries - confirm.
 */
struct branch_stack {
	u64				nr;
	struct branch_entry	entries[0];
};

196
/* Globals shared across the tool; each is defined in some other translation unit. */
extern const char *input_name;
extern bool perf_host, perf_guest;
extern const char perf_version_string[];
199

200 201
/* Defined elsewhere; NOTE(review): by its name it unblocks SIGWINCH for the calling thread - confirm. */
void pthread__unblock_sigwinch(void);

202
#include "util/target.h"
203

204 205 206 207 208 209
/*
 * Call-graph collection modes.  CALLCHAIN_NONE is 0, so a zero-initialised
 * mode means "none".
 * NOTE(review): FP / DWARF presumably select frame-pointer and DWARF-based
 * unwinding - confirm against the users of this enum.
 */
enum perf_call_graph_mode {
	CALLCHAIN_NONE,
	CALLCHAIN_FP,
	CALLCHAIN_DWARF
};

210 211
struct perf_record_opts {
	struct perf_target target;
212
	int	     call_graph;
213
	bool	     group;
214 215 216 217
	bool	     inherit_stat;
	bool	     no_delay;
	bool	     no_inherit;
	bool	     no_samples;
218
	bool	     pipe_output;
219 220
	bool	     raw_samples;
	bool	     sample_address;
221
	bool	     sample_weight;
222
	bool	     sample_time;
223
	bool	     period;
224
	unsigned int freq;
225
	unsigned int mmap_pages;
226
	unsigned int user_freq;
227
	u64          branch_stack;
228 229
	u64	     default_interval;
	u64	     user_interval;
230
	u16	     stack_dump_size;
231 232
};

233
#endif