• Home
  • Line#
  • Scopes#
  • Navigate#
  • Raw
  • Download
1  /* SPDX-License-Identifier: GPL-2.0 */
2  #ifndef __PERF_RECORD_H
3  #define __PERF_RECORD_H
/*
 * The linux/stddef.h include isn't needed here itself, but it is needed for
 * __always_inline, which is used in files included from
 * uapi/linux/perf_event.h such as /usr/include/linux/swab.h and
 * /usr/include/linux/byteorder/little_endian.h. This was detected at least
 * with musl libc, used in Alpine Linux. -acme
 */
10  #include <stdio.h>
11  #include <linux/stddef.h>
12  #include <perf/event.h>
13  #include <linux/types.h>
14  
15  #include "perf_regs.h"
16  
17  struct dso;
18  struct machine;
19  struct perf_event_attr;
20  
#ifdef __LP64__
/*
 * /usr/include/inttypes.h uses just 'lu' for PRIu64, but we end up defining
 * __u64 as long long unsigned int, and then -Werror=format= kicks in and
 * complains of the mismatched types, so use these special extra PRI
 * macros to overcome that.
 *
 * When __LP64__ is defined, each macro prepends an extra "l" length modifier
 * to the corresponding inttypes.h macro; otherwise (the #else branch below)
 * each macro is a plain alias for it.
 *
 * NOTE(review): PRIu64/PRIx64/PRId64 come from <inttypes.h>, which this header
 * does not include directly - presumably the user is expected to have it in
 * scope; confirm.
 */
#define PRI_lu64 "l" PRIu64
#define PRI_lx64 "l" PRIx64
#define PRI_ld64 "l" PRId64
#else
#define PRI_lu64 PRIu64
#define PRI_lx64 PRIx64
#define PRI_ld64 PRId64
#endif
36  
/*
 * Union of the IP, TID, TIME, ADDR, ID, STREAM_ID, CPU, PERIOD and IDENTIFIER
 * sample-type bits.
 */
#define PERF_SAMPLE_MASK		\
	(PERF_SAMPLE_IP		|	\
	 PERF_SAMPLE_TID	|	\
	 PERF_SAMPLE_TIME	|	\
	 PERF_SAMPLE_ADDR	|	\
	 PERF_SAMPLE_ID		|	\
	 PERF_SAMPLE_STREAM_ID	|	\
	 PERF_SAMPLE_CPU	|	\
	 PERF_SAMPLE_PERIOD	|	\
	 PERF_SAMPLE_IDENTIFIER)
43  
/*
 * perf sample has 16 bits size limit, hence the bound of 1 << 16 (65536)
 * bytes.
 */
#define PERF_SAMPLE_MAX_SIZE (1 << 16)
46  
/*
 * Register dump carried by a sample; struct perf_sample embeds two of these
 * (user_regs and intr_regs).
 */
struct regs_dump {
	u64 abi;	/* NOTE(review): presumably a PERF_SAMPLE_REGS_ABI_* value - confirm */
	u64 mask;	/* NOTE(review): presumably the bitmask of registers present in regs - confirm */
	u64 *regs;	/* register values; storage is not owned by anything visible here */

	/* Cached values/mask filled by first register access. */
	u64 cache_regs[PERF_REGS_MAX];
	u64 cache_mask;
};
56  
/*
 * Stack dump carried by a sample (see perf_sample::user_stack): a data
 * pointer plus its size and an offset.
 */
struct stack_dump {
	u16 offset;	/* NOTE(review): meaning of the offset is not visible here - confirm against users */
	u64 size;	/* NOTE(review): presumably the number of bytes at data - confirm */
	char *data;
};
62  
/*
 * A single counter reading: a value paired with an id. Used by struct
 * sample_read both directly ('one') and via pointer ('group.values').
 */
struct sample_read_value {
	u64 value;
	u64 id;
};
67  
/*
 * Counter read data carried by a sample: enabled/running times plus either a
 * group of readings or a single reading, overlaid in an anonymous union.
 *
 * NOTE(review): nothing in this struct says which union member is valid;
 * presumably that is decided by the event's read_format - confirm.
 */
struct sample_read {
	u64 time_enabled;
	u64 time_running;
	union {
		struct {
			u64 nr;	/* NOTE(review): presumably the number of entries in values - confirm */
			struct sample_read_value *values;
		} group;
		struct sample_read_value one;
	};
};
79  
/*
 * Callchain: a count followed by a flexible array of u64 entries.
 * NOTE(review): presumably nr is the number of valid entries in ips - confirm.
 */
struct ip_callchain {
	u64 nr;
	u64 ips[];
};
84  
85  struct branch_stack;
86  
/*
 * PERF_IP_FLAG_* bit flags, one distinct bit each, occupying bits 0 to 12.
 * NOTE(review): presumably these are the values stored in perf_sample::flags
 * - confirm against users.
 */
enum {
	PERF_IP_FLAG_BRANCH		= 1ULL << 0,
	PERF_IP_FLAG_CALL		= 1ULL << 1,
	PERF_IP_FLAG_RETURN		= 1ULL << 2,
	PERF_IP_FLAG_CONDITIONAL	= 1ULL << 3,
	PERF_IP_FLAG_SYSCALLRET		= 1ULL << 4,
	PERF_IP_FLAG_ASYNC		= 1ULL << 5,
	PERF_IP_FLAG_INTERRUPT		= 1ULL << 6,
	PERF_IP_FLAG_TX_ABORT		= 1ULL << 7,
	PERF_IP_FLAG_TRACE_BEGIN	= 1ULL << 8,
	PERF_IP_FLAG_TRACE_END		= 1ULL << 9,
	PERF_IP_FLAG_IN_TX		= 1ULL << 10,
	PERF_IP_FLAG_VMENTRY		= 1ULL << 11,
	PERF_IP_FLAG_VMEXIT		= 1ULL << 12,
};
102  
/*
 * Thirteen characters, matching the thirteen PERF_IP_FLAG_* bits (0 to 12).
 * NOTE(review): presumably character i is the display letter for flag bit i
 * - confirm against the code that prints flags.
 */
#define PERF_IP_FLAG_CHARS "bcrosyiABExgh"
104  
/*
 * Every PERF_IP_FLAG_* bit except PERF_IP_FLAG_IN_TX, OR-ed into one mask.
 */
#define PERF_BRANCH_MASK					\
	(PERF_IP_FLAG_BRANCH | PERF_IP_FLAG_CALL |		\
	 PERF_IP_FLAG_RETURN | PERF_IP_FLAG_CONDITIONAL |	\
	 PERF_IP_FLAG_SYSCALLRET | PERF_IP_FLAG_ASYNC |		\
	 PERF_IP_FLAG_INTERRUPT | PERF_IP_FLAG_TX_ABORT |	\
	 PERF_IP_FLAG_TRACE_BEGIN | PERF_IP_FLAG_TRACE_END |	\
	 PERF_IP_FLAG_VMENTRY | PERF_IP_FLAG_VMEXIT)
118  
/* Size, in bytes, of the perf_sample::insn buffer. */
#define MAX_INSN 16
120  
/*
 * AUX data carried by a sample (see perf_sample::aux_sample): a data pointer
 * and a size.
 * NOTE(review): presumably size is the number of bytes at data - confirm.
 */
struct aux_sample {
	u64 size;
	void *data;
};
125  
/*
 * One perf sample in parsed form: scalar fields followed by pointers to, or
 * embedded copies of, the variable-sized parts (raw data, callchain, branch
 * stack, register dumps, user stack, counter reads, AUX data).
 *
 * NOTE(review): presumably only the fields selected by the originating
 * event's sample_type are meaningful - confirm against the parsing code.
 */
struct perf_sample {
	u64 ip;
	u32 pid, tid;
	u64 time;
	u64 addr;
	u64 id;
	u64 stream_id;
	u64 period;
	u64 weight;
	u64 transaction;
	u64 insn_cnt;
	u64 cyc_cnt;
	u32 cpu;
	u32 raw_size;		/* NOTE(review): presumably the byte count of raw_data - confirm */
	u64 data_src;
	u64 phys_addr;
	u64 data_page_size;
	u64 code_page_size;
	u64 cgroup;
	u32 flags;		/* NOTE(review): presumably PERF_IP_FLAG_* bits - confirm */
	u16 insn_len;		/* NOTE(review): presumably the number of valid bytes in insn - confirm */
	u8  cpumode;
	u16 misc;
	u16 ins_lat;
	u16 p_stage_cyc;
	bool no_hw_idx;		/* No hw_idx collected in branch_stack */
	char insn[MAX_INSN];
	void *raw_data;
	struct ip_callchain *callchain;
	struct branch_stack *branch_stack;
	struct regs_dump  user_regs;
	struct regs_dump  intr_regs;
	struct stack_dump user_stack;
	struct sample_read read;
	struct aux_sample aux_sample;
};
162  
/*
 * Data-source value with the OP, LVL, SNOOP, LOCK and TLB fields all set to
 * their NA encoding via PERF_MEM_S().
 */
#define PERF_MEM_DATA_SRC_NONE \
	(PERF_MEM_S(OP, NA) |\
	 PERF_MEM_S(LVL, NA) |\
	 PERF_MEM_S(SNOOP, NA) |\
	 PERF_MEM_S(LOCK, NA) |\
	 PERF_MEM_S(TLB, NA))
169  
/*
 * Attribute type for custom synthesized events.
 *
 * The 1U operand makes the addition unsigned, so the value is INT_MAX + 1
 * without signed overflow.
 * NOTE(review): INT_MAX comes from <limits.h>, which this header does not
 * include directly - presumably it is in scope wherever this is used; confirm.
 */
#define PERF_TYPE_SYNTH		(INT_MAX + 1U)
172  
/*
 * Attribute config for custom synthesized events.
 *
 * Enumerators take the implicit values 0 (PTWRITE) through 6 (PSB).
 */
enum perf_synth_id {
	PERF_SYNTH_INTEL_PTWRITE,
	PERF_SYNTH_INTEL_MWAIT,
	PERF_SYNTH_INTEL_PWRE,
	PERF_SYNTH_INTEL_EXSTOP,
	PERF_SYNTH_INTEL_PWRX,
	PERF_SYNTH_INTEL_CBR,
	PERF_SYNTH_INTEL_PSB,
};
183  
/*
 * Raw data formats for synthesized events. Note that 4 bytes of padding are
 * present to match the 'size' member of PERF_SAMPLE_RAW data, which is always
 * 8-byte aligned. That means we must dereference raw_data with an offset of 4.
 * Refer to perf_sample__synth_ptr() and perf_synth__raw_data(). It also means
 * the structure sizes are 4 bytes bigger than the raw_size; refer to
 * perf_synth__raw_size().
 */
192  
/*
 * Raw data layout for PERF_SYNTH_INTEL_PTWRITE events (name-matched; the
 * association is by naming convention only in this header).
 */
struct perf_synth_intel_ptwrite {
	u32 padding;	/* leading 4 bytes not counted by perf_synth__raw_size() */
	union {
		struct {
			u32	ip		:  1,
				reserved	: 31;
		};
		u32	flags;	/* the same 32 bits as the bitfields above */
	};
	u64	payload;
};
204  
/*
 * Raw data layout for PERF_SYNTH_INTEL_MWAIT events (name-matched; the
 * association is by naming convention only in this header).
 */
struct perf_synth_intel_mwait {
	u32 padding;	/* leading 4 bytes not counted by perf_synth__raw_size() */
	u32 reserved;
	union {
		struct {
			u64	hints		:  8,
				reserved1	: 24,
				extensions	:  2,
				reserved2	: 30;
		};
		u64	payload;	/* the same 64 bits as the bitfields above */
	};
};
218  
/*
 * Raw data layout for PERF_SYNTH_INTEL_PWRE events (name-matched; the
 * association is by naming convention only in this header).
 */
struct perf_synth_intel_pwre {
	u32 padding;	/* leading 4 bytes not counted by perf_synth__raw_size() */
	u32 reserved;
	union {
		struct {
			u64	reserved1	:  7,
				hw		:  1,
				subcstate	:  4,
				cstate		:  4,
				reserved2	: 48;
		};
		u64	payload;	/* the same 64 bits as the bitfields above */
	};
};
233  
/*
 * Raw data layout for PERF_SYNTH_INTEL_EXSTOP events (name-matched; the
 * association is by naming convention only in this header).
 */
struct perf_synth_intel_exstop {
	u32 padding;	/* leading 4 bytes not counted by perf_synth__raw_size() */
	union {
		struct {
			u32	ip		:  1,
				reserved	: 31;
		};
		u32	flags;	/* the same 32 bits as the bitfields above */
	};
};
244  
/*
 * Raw data layout for PERF_SYNTH_INTEL_PWRX events (name-matched; the
 * association is by naming convention only in this header).
 */
struct perf_synth_intel_pwrx {
	u32 padding;	/* leading 4 bytes not counted by perf_synth__raw_size() */
	u32 reserved;
	union {
		struct {
			u64	deepest_cstate	:  4,
				last_cstate	:  4,
				wake_reason	:  4,
				reserved1	: 52;
		};
		u64	payload;	/* the same 64 bits as the bitfields above */
	};
};
258  
/*
 * Raw data layout for PERF_SYNTH_INTEL_CBR events (name-matched; the
 * association is by naming convention only in this header).
 */
struct perf_synth_intel_cbr {
	u32 padding;	/* leading 4 bytes not counted by perf_synth__raw_size() */
	union {
		struct {
			u32	cbr		:  8,
				reserved1	:  8,
				max_nonturbo	:  8,
				reserved2	:  8;
		};
		u32	flags;	/* the same 32 bits as the bitfields above */
	};
	u32 freq;	/* NOTE(review): units are not visible in this header - confirm */
	u32 reserved3;
};
273  
/*
 * Raw data layout for PERF_SYNTH_INTEL_PSB events (name-matched; the
 * association is by naming convention only in this header).
 */
struct perf_synth_intel_psb {
	u32 padding;	/* leading 4 bytes not counted by perf_synth__raw_size() */
	u32 reserved;
	u64 offset;
};
279  
280  /*
281   * raw_data is always 4 bytes from an 8-byte boundary, so subtract 4 to get
282   * 8-byte alignment.
283   */
perf_sample__synth_ptr(struct perf_sample * sample)284  static inline void *perf_sample__synth_ptr(struct perf_sample *sample)
285  {
286  	return sample->raw_data - 4;
287  }
288  
/*
 * Inverse of the 4-byte adjustment applied to raw_data for synthesized
 * events: skip the leading 4 bytes of padding.
 *
 * @p: pointer to the start of a synthesized-event structure (its padding).
 *
 * Returns @p advanced by 4 bytes. The arithmetic is done on a char * because
 * arithmetic on void * is a GNU extension rather than ISO C; the resulting
 * address is the same.
 */
static inline void *perf_synth__raw_data(void *p)
{
	return (char *)p + 4;
}
293  
/*
 * Size of the raw data for synthesized-event structure (or type) d: the
 * structure size minus its 4 leading padding bytes.
 */
#define perf_synth__raw_size(d) (sizeof(d) - 4)

/*
 * True when sample s carries fewer raw bytes than structure (or type) d
 * requires, i.e. (s)->raw_size is below perf_synth__raw_size(d).
 */
#define perf_sample__bad_synth_size(s, d) \
	((s)->raw_size < perf_synth__raw_size(d))
297  
/* Stat round types: INTERVAL is 0 and FINAL is 1. */
enum {
	PERF_STAT_ROUND_TYPE__INTERVAL	= 0,
	PERF_STAT_ROUND_TYPE__FINAL	= 1,
};
302  
/* Takes no arguments and returns nothing; defined outside this header. */
void perf_event__print_totals(void);

/* Forward declarations: only pointers to these types are used below. */
struct perf_cpu_map;
struct perf_record_stat_config;
struct perf_stat_config;
struct perf_tool;

/*
 * NOTE(review): presumably fills *config from the stat-config record *event
 * (neither pointer is const) - confirm against the implementation.
 */
void perf_event__read_stat_config(struct perf_stat_config *config,
				  struct perf_record_stat_config *event);
312  
/*
 * Per-record-type event handlers. All share one signature - the tool, the
 * event, the parsed sample and the machine - and return int.
 * NOTE(review): presumably 0 on success and negative on error, and
 * perf_event__process() presumably dispatches on the event type - confirm
 * against the implementations.
 */
int perf_event__process_comm(struct perf_tool *tool,
			     union perf_event *event,
			     struct perf_sample *sample,
			     struct machine *machine);
int perf_event__process_lost(struct perf_tool *tool,
			     union perf_event *event,
			     struct perf_sample *sample,
			     struct machine *machine);
int perf_event__process_lost_samples(struct perf_tool *tool,
				     union perf_event *event,
				     struct perf_sample *sample,
				     struct machine *machine);
int perf_event__process_aux(struct perf_tool *tool,
			    union perf_event *event,
			    struct perf_sample *sample,
			    struct machine *machine);
int perf_event__process_itrace_start(struct perf_tool *tool,
				     union perf_event *event,
				     struct perf_sample *sample,
				     struct machine *machine);
int perf_event__process_switch(struct perf_tool *tool,
			       union perf_event *event,
			       struct perf_sample *sample,
			       struct machine *machine);
int perf_event__process_namespaces(struct perf_tool *tool,
				   union perf_event *event,
				   struct perf_sample *sample,
				   struct machine *machine);
int perf_event__process_cgroup(struct perf_tool *tool,
			       union perf_event *event,
			       struct perf_sample *sample,
			       struct machine *machine);
int perf_event__process_mmap(struct perf_tool *tool,
			     union perf_event *event,
			     struct perf_sample *sample,
			     struct machine *machine);
int perf_event__process_mmap2(struct perf_tool *tool,
			     union perf_event *event,
			     struct perf_sample *sample,
			     struct machine *machine);
int perf_event__process_fork(struct perf_tool *tool,
			     union perf_event *event,
			     struct perf_sample *sample,
			     struct machine *machine);
int perf_event__process_exit(struct perf_tool *tool,
			     union perf_event *event,
			     struct perf_sample *sample,
			     struct machine *machine);
int perf_event__process_ksymbol(struct perf_tool *tool,
				union perf_event *event,
				struct perf_sample *sample,
				struct machine *machine);
int perf_event__process_bpf(struct perf_tool *tool,
			    union perf_event *event,
			    struct perf_sample *sample,
			    struct machine *machine);
int perf_event__process_text_poke(struct perf_tool *tool,
				  union perf_event *event,
				  struct perf_sample *sample,
				  struct machine *machine);
int perf_event__process(struct perf_tool *tool,
			union perf_event *event,
			struct perf_sample *sample,
			struct machine *machine);
377  
/* Forward declaration: only pointers to addr_location are used here. */
struct addr_location;

/*
 * NOTE(review): presumably resolves the sample's address within 'machine'
 * into *al, with addr_location__put() releasing what was obtained - confirm
 * against the implementations.
 */
int machine__resolve(struct machine *machine, struct addr_location *al,
		     struct perf_sample *sample);

void addr_location__put(struct addr_location *al);

/* Forward declaration: only pointers to thread are used here. */
struct thread;

/* Predicates over an event attribute; semantics are defined elsewhere. */
bool is_bts_event(struct perf_event_attr *attr);
bool sample_addr_correlates_sym(struct perf_event_attr *attr);
void thread__resolve(struct thread *thread, struct addr_location *al,
		     struct perf_sample *sample);
391  
/* Maps an unsigned id to a string; the id space is defined by the implementation. */
const char *perf_event__name(unsigned int id);

/*
 * Per-record-type printers writing to the stdio stream fp and returning a
 * size_t.
 * NOTE(review): presumably the return value is the number of characters
 * written - confirm. The text_poke and generic variants additionally take
 * the machine.
 */
size_t perf_event__fprintf_comm(union perf_event *event, FILE *fp);
size_t perf_event__fprintf_mmap(union perf_event *event, FILE *fp);
size_t perf_event__fprintf_mmap2(union perf_event *event, FILE *fp);
size_t perf_event__fprintf_task(union perf_event *event, FILE *fp);
size_t perf_event__fprintf_aux(union perf_event *event, FILE *fp);
size_t perf_event__fprintf_itrace_start(union perf_event *event, FILE *fp);
size_t perf_event__fprintf_switch(union perf_event *event, FILE *fp);
size_t perf_event__fprintf_thread_map(union perf_event *event, FILE *fp);
size_t perf_event__fprintf_cpu_map(union perf_event *event, FILE *fp);
size_t perf_event__fprintf_namespaces(union perf_event *event, FILE *fp);
size_t perf_event__fprintf_cgroup(union perf_event *event, FILE *fp);
size_t perf_event__fprintf_ksymbol(union perf_event *event, FILE *fp);
size_t perf_event__fprintf_bpf(union perf_event *event, FILE *fp);
size_t perf_event__fprintf_text_poke(union perf_event *event, struct machine *machine,FILE *fp);
size_t perf_event__fprintf(union perf_event *event, struct machine *machine, FILE *fp);
409  
/*
 * NOTE(review): presumably looks up symbol_name in the kallsyms file and
 * stores its start address in *addr - confirm against the implementation.
 */
int kallsyms__get_function_start(const char *kallsyms_filename,
				 const char *symbol_name, u64 *addr);

/*
 * cpu map record helpers. cpu_map_data__alloc() has three out-parameters
 * (size, type, max); cpu_map_data__synthesize() takes type and max by value.
 * NOTE(review): presumably the values produced by the former are meant to be
 * fed to the latter, and the returned buffer is owned by the caller - confirm.
 */
void *cpu_map_data__alloc(struct perf_cpu_map *map, size_t *size, u16 *type, int *max);
void  cpu_map_data__synthesize(struct perf_record_cpu_map_data *data, struct perf_cpu_map *map,
			       u16 type, int max);

void event_attr_init(struct perf_event_attr *attr);

int perf_event_paranoid(void);
bool perf_event_paranoid_check(int max_level);

/* Globals defined elsewhere; declared here for users of this header. */
extern int sysctl_perf_event_max_stack;
extern int sysctl_perf_event_max_contexts_per_stack;
extern unsigned int proc_map_timeout;

/*
 * NOTE(review): presumably str must provide at least PAGE_SIZE_NAME_LEN bytes
 * and is what get_page_size_name() returns - confirm against the
 * implementation.
 */
#define PAGE_SIZE_NAME_LEN	32
char *get_page_size_name(u64 size, char *str);

/* Architecture hooks; the arch_ prefix suggests per-architecture definitions. */
void arch_perf_parse_sample_weight(struct perf_sample *data, const __u64 *array, u64 type);
void arch_perf_synthesize_sample_weight(const struct perf_sample *data, __u64 *array, u64 type);
const char *arch_perf_header_entry(const char *se_header);
int arch_support_sort_key(const char *sort_key);
433  
434  #endif /* __PERF_RECORD_H */
435