xref: /openbmc/linux/tools/perf/util/stat.h (revision 248ed9e227e6cf59acb1aaf3aa30d530a0232c1a)
1 /* SPDX-License-Identifier: GPL-2.0 */
2 #ifndef __PERF_STATS_H
3 #define __PERF_STATS_H
4 
5 #include <linux/types.h>
6 #include <stdio.h>
7 #include <sys/types.h>
8 #include <sys/resource.h>
9 #include "cpumap.h"
10 #include "rblist.h"
11 #include "counts.h"
12 
13 struct perf_cpu_map;
14 struct perf_stat_config;
15 struct timespec;
16 
17 struct stats {
18 	double n, mean, M2;
19 	u64 max, min;
20 };
21 
/*
 * Identifier stored in struct perf_stat_evsel::id and tested through
 * perf_stat_evsel__is().
 *
 * Enumerators take consecutive implicit values starting at
 * PERF_STAT_EVSEL_ID__NONE (0).  PERF_STAT_EVSEL_ID__MAX is the last
 * enumerator, so its value equals the number of identifiers before it;
 * add new identifiers above it.
 * NOTE(review): which hardware event each identifier maps to is decided
 * outside this header - confirm in stat.c.
 */
enum perf_stat_evsel_id {
	PERF_STAT_EVSEL_ID__NONE = 0,
	PERF_STAT_EVSEL_ID__CYCLES_IN_TX,
	PERF_STAT_EVSEL_ID__TRANSACTION_START,
	PERF_STAT_EVSEL_ID__ELISION_START,
	PERF_STAT_EVSEL_ID__CYCLES_IN_TX_CP,
	PERF_STAT_EVSEL_ID__TOPDOWN_TOTAL_SLOTS,
	PERF_STAT_EVSEL_ID__TOPDOWN_SLOTS_ISSUED,
	PERF_STAT_EVSEL_ID__TOPDOWN_SLOTS_RETIRED,
	PERF_STAT_EVSEL_ID__TOPDOWN_FETCH_BUBBLES,
	PERF_STAT_EVSEL_ID__TOPDOWN_RECOVERY_BUBBLES,
	PERF_STAT_EVSEL_ID__TOPDOWN_RETIRING,
	PERF_STAT_EVSEL_ID__TOPDOWN_BAD_SPEC,
	PERF_STAT_EVSEL_ID__TOPDOWN_FE_BOUND,
	PERF_STAT_EVSEL_ID__TOPDOWN_BE_BOUND,
	PERF_STAT_EVSEL_ID__TOPDOWN_HEAVY_OPS,
	PERF_STAT_EVSEL_ID__TOPDOWN_BR_MISPREDICT,
	PERF_STAT_EVSEL_ID__TOPDOWN_FETCH_LAT,
	PERF_STAT_EVSEL_ID__TOPDOWN_MEM_BOUND,
	PERF_STAT_EVSEL_ID__SMI_NUM,
	PERF_STAT_EVSEL_ID__APERF,
	/* sentinel: keep last */
	PERF_STAT_EVSEL_ID__MAX,
};
45 
/*
 * Holds the aggregated information of one event for one aggregation entry.
 * struct perf_stat_evsel::aggr points at these, with nr_aggr giving the
 * number allocated.
 */
struct perf_stat_aggr {
	/* aggregated values */
	struct perf_counts_values	counts;
	/* number of entries (CPUs) aggregated into 'counts' */
	int				nr;
	/* whether any entry has failed to read/process event */
	bool				failed;
	/* marks this data as already processed */
	bool				used;
};
57 
/*
 * Per-evsel event stats.
 * NOTE(review): how this is attached to a struct evsel is not visible in
 * this header - confirm in stat.c (evlist__alloc_stats()).
 */
struct perf_stat_evsel {
	/* used for repeated runs */
	struct stats		 res_stats;
	/* evsel id for quick check, see perf_stat_evsel__is() */
	enum perf_stat_evsel_id	 id;
	/* number of allocated 'aggr' */
	int			 nr_aggr;
	/* aggregated event values, 'nr_aggr' entries */
	struct perf_stat_aggr	*aggr;
	/* used for group read */
	u64			*group_data;
};
71 
/*
 * Aggregation mode selected in struct perf_stat_config::aggr_mode.
 *
 * Values are implicit and consecutive from AGGR_NONE (0) to AGGR_MAX (8).
 * Note that AGGR_UNSET is not the last real mode: AGGR_NODE follows it, so
 * the declaration order, not the name, fixes each numeric value.
 * NOTE(review): if these values are ever stored or exchanged (e.g. in a
 * stat config event), reordering would break compatibility - confirm
 * before moving entries.
 */
enum aggr_mode {
	AGGR_NONE,
	AGGR_GLOBAL,
	AGGR_SOCKET,
	AGGR_DIE,
	AGGR_CORE,
	AGGR_THREAD,
	AGGR_UNSET,
	AGGR_NODE,
	/* sentinel: keep last */
	AGGR_MAX
};
83 
/*
 * Single-bit context flags occupying bit positions 0 to 4.
 * CTX_BIT_MAX is the next bit up (1 << 5 == 32), which is also the count of
 * distinct values a mask built from the five flags can take.
 * NOTE(review): what each context bit is derived from (presumably the
 * event's exclude_* attributes) is not visible in this header - confirm.
 */
enum {
	CTX_BIT_USER	= 1 << 0,
	CTX_BIT_KERNEL	= 1 << 1,
	CTX_BIT_HV	= 1 << 2,
	CTX_BIT_HOST	= 1 << 3,
	CTX_BIT_IDLE	= 1 << 4,
	CTX_BIT_MAX	= 1 << 5,
};

/* Number of possible context masks; same value as CTX_BIT_MAX (32). */
#define NUM_CTX CTX_BIT_MAX
94 
/*
 * Kinds of statistic values.
 *
 * Enumerators take consecutive implicit values starting at STAT_NONE (0);
 * STAT_MAX is the last one and therefore equals the number of kinds before
 * it.  Add new kinds above STAT_MAX.
 * NOTE(review): presumably used to key the entries kept in
 * struct runtime_stat::value_list - confirm in stat-shadow.c.
 */
enum stat_type {
	STAT_NONE = 0,
	STAT_NSECS,
	STAT_CYCLES,
	STAT_STALLED_CYCLES_FRONT,
	STAT_STALLED_CYCLES_BACK,
	STAT_BRANCHES,
	STAT_CACHEREFS,
	STAT_L1_DCACHE,
	STAT_L1_ICACHE,
	STAT_LL_CACHE,
	STAT_ITLB_CACHE,
	STAT_DTLB_CACHE,
	STAT_CYCLES_IN_TX,
	STAT_TRANSACTION,
	STAT_ELISION,
	STAT_TOPDOWN_TOTAL_SLOTS,
	STAT_TOPDOWN_SLOTS_ISSUED,
	STAT_TOPDOWN_SLOTS_RETIRED,
	STAT_TOPDOWN_FETCH_BUBBLES,
	STAT_TOPDOWN_RECOVERY_BUBBLES,
	STAT_TOPDOWN_RETIRING,
	STAT_TOPDOWN_BAD_SPEC,
	STAT_TOPDOWN_FE_BOUND,
	STAT_TOPDOWN_BE_BOUND,
	STAT_TOPDOWN_HEAVY_OPS,
	STAT_TOPDOWN_BR_MISPREDICT,
	STAT_TOPDOWN_FETCH_LAT,
	STAT_TOPDOWN_MEM_BOUND,
	STAT_SMI_NUM,
	STAT_APERF,
	/* sentinel: keep last */
	STAT_MAX
};
128 
/*
 * Container for runtime statistic values, kept in an rblist.
 * Set up and torn down with runtime_stat__init() / runtime_stat__exit().
 * NOTE(review): the node type and key stored in value_list are defined
 * outside this header - confirm in stat-shadow.c.
 */
struct runtime_stat {
	struct rblist value_list;
};
132 
/*
 * Statistics over the user and system CPU times taken from struct rusage.
 *
 * Despite the "usec" in the field names, update_rusage_stats() converts
 * ru_utime / ru_stime to nanoseconds before feeding them in, so the
 * accumulated samples are in nanoseconds.
 */
struct rusage_stats {
	/* samples derived from rusage.ru_utime */
	struct stats ru_utime_usec_stat;
	/* samples derived from rusage.ru_stime */
	struct stats ru_stime_usec_stat;
};
137 
/*
 * Callback type: given the stat config and a CPU, returns a
 * struct aggr_cpu_id.  Stored in struct perf_stat_config::aggr_get_id.
 * NOTE(review): presumably the returned id names the aggregation group
 * (socket, die, core, ...) the CPU belongs to - confirm with the callers.
 */
typedef struct aggr_cpu_id (*aggr_get_id_t)(struct perf_stat_config *config, struct perf_cpu cpu);
139 
/*
 * Configuration and shared state passed to many of the perf stat helpers
 * declared in this header.
 * NOTE(review): the notes on individual fields below are inferred from the
 * field names and types only; confirm against the code that sets and reads
 * them (builtin-stat.c, stat-display.c).
 */
struct perf_stat_config {
	/* selected aggregation mode, see enum aggr_mode */
	enum aggr_mode		 aggr_mode;
	/* boolean switches - presumably mirror perf stat options, TODO confirm */
	bool			 scale;
	bool			 no_inherit;
	bool			 identifier;
	bool			 csv_output;
	bool			 json_output;
	bool			 interval_clear;
	bool			 metric_only;
	bool			 null_run;
	bool			 ru_display;
	bool			 big_num;
	bool			 no_merge;
	bool			 hybrid_merge;
	bool			 walltime_run_table;
	bool			 all_kernel;
	bool			 all_user;
	bool			 percore_show_thread;
	bool			 summary;
	bool			 no_csv_summary;
	bool			 metric_no_group;
	bool			 metric_no_merge;
	bool			 stop_read_counter;
	bool			 iostat_run;
	char			 *user_requested_cpu_list;
	bool			 system_wide;
	/* stdio stream; presumably where results are printed - confirm */
	FILE			*output;
	/* NOTE(review): units of interval/timeout are not visible here - confirm */
	unsigned int		 interval;
	unsigned int		 timeout;
	unsigned int		 unit_width;
	unsigned int		 metric_only_len;
	int			 times;
	int			 run_count;
	int			 print_free_counters_hint;
	int			 print_mixed_hw_group_error;
	const char		*csv_sep;
	/* NOTE(review): likely points at the global walltime_nsecs_stats declared in this header - confirm */
	struct stats		*walltime_nsecs_stats;
	struct rusage		 ru_data;
	/* NOTE(review): likely points at the global ru_stats declared in this header - confirm */
	struct rusage_stats		 *ru_stats;
	struct cpu_aggr_map	*aggr_map;
	/* callback returning the aggr_cpu_id for a CPU, see aggr_get_id_t */
	aggr_get_id_t		 aggr_get_id;
	struct cpu_aggr_map	*cpus_aggr_map;
	u64			*walltime_run;
	struct rblist		 metric_events;
	/* NOTE(review): presumably control/ack file descriptors - confirm */
	int			 ctl_fd;
	int			 ctl_fd_ack;
	bool			 ctl_fd_close;
	const char		*cgroup_list;
	unsigned int		topdown_level;
};
190 
/*
 * Setters implemented outside this header.
 * NOTE(review): presumably override the big_num / no_csv_summary display
 * behaviour - confirm against their definitions.
 */
void perf_stat__set_big_num(int set);
void perf_stat__set_no_csv_summary(int set);

/*
 * Helpers operating on struct stats, implemented outside this header.
 * update_stats() takes one u64 sample for *stats (see update_rusage_stats()
 * below for a caller).
 * NOTE(review): avg_stats/stddev_stats/rel_stddev_stats presumably return
 * the mean, the standard deviation and the deviation relative to the
 * average - confirm exact formulas in stat.c.
 */
void update_stats(struct stats *stats, u64 val);
double avg_stats(struct stats *stats);
double stddev_stats(struct stats *stats);
double rel_stddev_stats(double stddev, double avg);
198 
199 static inline void init_stats(struct stats *stats)
200 {
201 	stats->n    = 0.0;
202 	stats->mean = 0.0;
203 	stats->M2   = 0.0;
204 	stats->min  = (u64) -1;
205 	stats->max  = 0;
206 }
207 
208 static inline void init_rusage_stats(struct rusage_stats *ru_stats) {
209 	init_stats(&ru_stats->ru_utime_usec_stat);
210 	init_stats(&ru_stats->ru_stime_usec_stat);
211 }
212 
213 static inline void update_rusage_stats(struct rusage_stats *ru_stats, struct rusage* rusage) {
214 	const u64 us_to_ns = 1000;
215 	const u64 s_to_ns = 1000000000;
216 	update_stats(&ru_stats->ru_utime_usec_stat,
217 	             (rusage->ru_utime.tv_usec * us_to_ns + rusage->ru_utime.tv_sec * s_to_ns));
218 	update_stats(&ru_stats->ru_stime_usec_stat,
219 	             (rusage->ru_stime.tv_usec * us_to_ns + rusage->ru_stime.tv_sec * s_to_ns));
220 }
221 
/* Forward declarations: only pointers to these are used below. */
struct evsel;
struct evlist;

/*
 * Implemented outside this header.
 * NOTE(review): presumably returns true when evsel's stat id equals 'id' -
 * confirm in stat.c.
 */
bool __perf_stat_evsel__is(struct evsel *evsel, enum perf_stat_evsel_id id);

/*
 * Convenience wrapper that pastes 'id' onto the PERF_STAT_EVSEL_ID__ prefix,
 * so callers pass the short name, e.g. perf_stat_evsel__is(evsel, APERF).
 */
#define perf_stat_evsel__is(evsel, id) \
	__perf_stat_evsel__is(evsel, PERF_STAT_EVSEL_ID__ ## id)
229 
/* Global state shared by the perf stat code; defined in a .c file elsewhere. */
extern struct runtime_stat rt_stat;
extern struct stats walltime_nsecs_stats;
extern struct rusage_stats ru_stats;
233 
/*
 * Output callbacks carried in struct perf_stat_output_ctx.
 * print_metric_t receives the config, an opaque ctx pointer, a color, a
 * unit, a format string and the value; new_line_t receives only the config
 * and ctx.
 * NOTE(review): whether 'color' or 'fmt' may be NULL is not visible here -
 * confirm with the implementations in stat-display.c.
 */
typedef void (*print_metric_t)(struct perf_stat_config *config,
			       void *ctx, const char *color, const char *unit,
			       const char *fmt, double val);
typedef void (*new_line_t)(struct perf_stat_config *config, void *ctx);
238 
/*
 * Runtime/shadow statistics API, implemented outside this header.
 * NOTE(review): descriptions are inferred from the names - init/exit set up
 * and release a struct runtime_stat, the reset helpers clear accumulated
 * values, and update_shadow_stats records 'count' for 'counter' at
 * 'map_idx'; confirm in stat-shadow.c.
 */
void runtime_stat__init(struct runtime_stat *st);
void runtime_stat__exit(struct runtime_stat *st);
void perf_stat__init_shadow_stats(void);
void perf_stat__reset_shadow_stats(void);
void perf_stat__reset_shadow_per_stat(struct runtime_stat *st);
void perf_stat__update_shadow_stats(struct evsel *counter, u64 count,
				    int map_idx, struct runtime_stat *st);
/*
 * Bundle of output callbacks and their context, passed to
 * perf_stat__print_shadow_stats().
 */
struct perf_stat_output_ctx {
	/* opaque pointer; matches the 'ctx' argument of both callback types */
	void *ctx;
	/* callback of type print_metric_t */
	print_metric_t print_metric;
	/* callback of type new_line_t */
	new_line_t new_line;
	/* NOTE(review): presumably forces the header to be printed - confirm */
	bool force_header;
};
252 
/*
 * Implemented outside this header.
 * NOTE(review): presumably prints the derived metrics for 'evsel' (value
 * 'avg', index 'map_idx') through the callbacks in 'out' - confirm in
 * stat-shadow.c.
 */
void perf_stat__print_shadow_stats(struct perf_stat_config *config,
				   struct evsel *evsel,
				   double avg, int map_idx,
				   struct perf_stat_output_ctx *out,
				   struct rblist *metric_events,
				   struct runtime_stat *st);
259 
/*
 * Allocation, release and reset of the per-evsel stats of an evlist;
 * implemented outside this header.
 * NOTE(review): the int-returning functions presumably return 0 on success
 * and a negative value on failure - confirm in stat.c.
 */
int evlist__alloc_stats(struct perf_stat_config *config,
			struct evlist *evlist, bool alloc_raw);
void evlist__free_stats(struct evlist *evlist);
void evlist__reset_stats(struct evlist *evlist);
void evlist__reset_prev_raw_counts(struct evlist *evlist);
void evlist__copy_prev_raw_counts(struct evlist *evlist);
void evlist__save_aggr_prev_raw_counts(struct evlist *evlist);

/* Same for the aggregated stats; nr_aggr is the number of entries requested. */
int evlist__alloc_aggr_stats(struct evlist *evlist, int nr_aggr);
void evlist__reset_aggr_stats(struct evlist *evlist);
270 
/*
 * Counter post-processing steps, implemented outside this header.
 * NOTE(review): the order in which callers are expected to invoke these and
 * the meaning of perf_stat_process_counter()'s return value are not visible
 * here - confirm in stat.c and builtin-stat.c.
 */
int perf_stat_process_counter(struct perf_stat_config *config,
			      struct evsel *counter);
void perf_stat_merge_counters(struct perf_stat_config *config, struct evlist *evlist);
void perf_stat_process_percore(struct perf_stat_config *config, struct evlist *evlist);
void perf_stat_process_shadow_stats(struct perf_stat_config *config, struct evlist *evlist);
276 
/* Forward declarations: only pointers to these are used below. */
struct perf_tool;
union perf_event;
struct perf_session;
struct target;

/*
 * Handler for a stat event read from a session; implemented outside this
 * header.
 * NOTE(review): return convention (presumably 0 / negative error) to be
 * confirmed in stat.c.
 */
int perf_event__process_stat_event(struct perf_session *session,
				   union perf_event *event);

/*
 * Print the given stat-related event to 'fp'.
 * NOTE(review): presumably return the number of characters written, like
 * fprintf() - confirm in stat.c.
 */
size_t perf_event__fprintf_stat(union perf_event *event, FILE *fp);
size_t perf_event__fprintf_stat_round(union perf_event *event, FILE *fp);
size_t perf_event__fprintf_stat_config(union perf_event *event, FILE *fp);
288 
/*
 * Implemented outside this header.
 * NOTE(review): presumably opens the counter for 'evsel' on the CPU at
 * 'cpu_map_idx' according to 'config' and 'target' - confirm in stat.c.
 */
int create_perf_stat_counter(struct evsel *evsel,
			     struct perf_stat_config *config,
			     struct target *target,
			     int cpu_map_idx);
/*
 * Implemented outside this header.
 * NOTE(review): presumably prints the counters of 'evlist'; 'ts' and
 * argc/argv are passed through for the output - confirm in stat-display.c.
 */
void evlist__print_counters(struct evlist *evlist, struct perf_stat_config *config,
			    struct target *_target, struct timespec *ts, int argc, const char **argv);
295 
/* Forward declaration: only a pointer is used below. */
struct metric_expr;
/*
 * Implemented outside this header.
 * NOTE(review): judging by the name this is a hook for the test suite that
 * evaluates one metric expression and returns its value - confirm in
 * stat-shadow.c.
 */
double test_generic_metric(struct metric_expr *mexp, int map_idx, struct runtime_stat *st);
298 #endif
299