xref: /openbmc/linux/tools/perf/util/mem-events.c (revision e3d786a3)
1 // SPDX-License-Identifier: GPL-2.0
2 #include <stddef.h>
3 #include <stdlib.h>
4 #include <string.h>
5 #include <errno.h>
6 #include <sys/types.h>
7 #include <sys/stat.h>
8 #include <unistd.h>
9 #include <api/fs/fs.h>
10 #include <linux/kernel.h>
11 #include "mem-events.h"
12 #include "debug.h"
13 #include "symbol.h"
14 #include "sort.h"
15 
16 unsigned int perf_mem_events__loads_ldlat = 30;
17 
18 #define E(t, n, s) { .tag = t, .name = n, .sysfs_name = s }
19 
20 struct perf_mem_event perf_mem_events[PERF_MEM_EVENTS__MAX] = {
21 	E("ldlat-loads",	"cpu/mem-loads,ldlat=%u/P",	"mem-loads"),
22 	E("ldlat-stores",	"cpu/mem-stores/P",		"mem-stores"),
23 };
24 #undef E
25 
26 #undef E
27 
28 static char mem_loads_name[100];
29 static bool mem_loads_name__init;
30 
31 char *perf_mem_events__name(int i)
32 {
33 	if (i == PERF_MEM_EVENTS__LOAD) {
34 		if (!mem_loads_name__init) {
35 			mem_loads_name__init = true;
36 			scnprintf(mem_loads_name, sizeof(mem_loads_name),
37 				  perf_mem_events[i].name,
38 				  perf_mem_events__loads_ldlat);
39 		}
40 		return mem_loads_name;
41 	}
42 
43 	return (char *)perf_mem_events[i].name;
44 }
45 
46 int perf_mem_events__parse(const char *str)
47 {
48 	char *tok, *saveptr = NULL;
49 	bool found = false;
50 	char *buf;
51 	int j;
52 
53 	/* We need buffer that we know we can write to. */
54 	buf = malloc(strlen(str) + 1);
55 	if (!buf)
56 		return -ENOMEM;
57 
58 	strcpy(buf, str);
59 
60 	tok = strtok_r((char *)buf, ",", &saveptr);
61 
62 	while (tok) {
63 		for (j = 0; j < PERF_MEM_EVENTS__MAX; j++) {
64 			struct perf_mem_event *e = &perf_mem_events[j];
65 
66 			if (strstr(e->tag, tok))
67 				e->record = found = true;
68 		}
69 
70 		tok = strtok_r(NULL, ",", &saveptr);
71 	}
72 
73 	free(buf);
74 
75 	if (found)
76 		return 0;
77 
78 	pr_err("failed: event '%s' not found, use '-e list' to get list of available events\n", str);
79 	return -1;
80 }
81 
82 int perf_mem_events__init(void)
83 {
84 	const char *mnt = sysfs__mount();
85 	bool found = false;
86 	int j;
87 
88 	if (!mnt)
89 		return -ENOENT;
90 
91 	for (j = 0; j < PERF_MEM_EVENTS__MAX; j++) {
92 		char path[PATH_MAX];
93 		struct perf_mem_event *e = &perf_mem_events[j];
94 		struct stat st;
95 
96 		scnprintf(path, PATH_MAX, "%s/devices/cpu/events/%s",
97 			  mnt, e->sysfs_name);
98 
99 		if (!stat(path, &st))
100 			e->supported = found = true;
101 	}
102 
103 	return found ? 0 : -ENOENT;
104 }
105 
106 static const char * const tlb_access[] = {
107 	"N/A",
108 	"HIT",
109 	"MISS",
110 	"L1",
111 	"L2",
112 	"Walker",
113 	"Fault",
114 };
115 
116 int perf_mem__tlb_scnprintf(char *out, size_t sz, struct mem_info *mem_info)
117 {
118 	size_t l = 0, i;
119 	u64 m = PERF_MEM_TLB_NA;
120 	u64 hit, miss;
121 
122 	sz -= 1; /* -1 for null termination */
123 	out[0] = '\0';
124 
125 	if (mem_info)
126 		m = mem_info->data_src.mem_dtlb;
127 
128 	hit = m & PERF_MEM_TLB_HIT;
129 	miss = m & PERF_MEM_TLB_MISS;
130 
131 	/* already taken care of */
132 	m &= ~(PERF_MEM_TLB_HIT|PERF_MEM_TLB_MISS);
133 
134 	for (i = 0; m && i < ARRAY_SIZE(tlb_access); i++, m >>= 1) {
135 		if (!(m & 0x1))
136 			continue;
137 		if (l) {
138 			strcat(out, " or ");
139 			l += 4;
140 		}
141 		l += scnprintf(out + l, sz - l, tlb_access[i]);
142 	}
143 	if (*out == '\0')
144 		l += scnprintf(out, sz - l, "N/A");
145 	if (hit)
146 		l += scnprintf(out + l, sz - l, " hit");
147 	if (miss)
148 		l += scnprintf(out + l, sz - l, " miss");
149 
150 	return l;
151 }
152 
153 static const char * const mem_lvl[] = {
154 	"N/A",
155 	"HIT",
156 	"MISS",
157 	"L1",
158 	"LFB",
159 	"L2",
160 	"L3",
161 	"Local RAM",
162 	"Remote RAM (1 hop)",
163 	"Remote RAM (2 hops)",
164 	"Remote Cache (1 hop)",
165 	"Remote Cache (2 hops)",
166 	"I/O",
167 	"Uncached",
168 };
169 
170 static const char * const mem_lvlnum[] = {
171 	[PERF_MEM_LVLNUM_ANY_CACHE] = "Any cache",
172 	[PERF_MEM_LVLNUM_LFB] = "LFB",
173 	[PERF_MEM_LVLNUM_RAM] = "RAM",
174 	[PERF_MEM_LVLNUM_PMEM] = "PMEM",
175 	[PERF_MEM_LVLNUM_NA] = "N/A",
176 };
177 
178 int perf_mem__lvl_scnprintf(char *out, size_t sz, struct mem_info *mem_info)
179 {
180 	size_t i, l = 0;
181 	u64 m =  PERF_MEM_LVL_NA;
182 	u64 hit, miss;
183 	int printed;
184 
185 	if (mem_info)
186 		m  = mem_info->data_src.mem_lvl;
187 
188 	sz -= 1; /* -1 for null termination */
189 	out[0] = '\0';
190 
191 	hit = m & PERF_MEM_LVL_HIT;
192 	miss = m & PERF_MEM_LVL_MISS;
193 
194 	/* already taken care of */
195 	m &= ~(PERF_MEM_LVL_HIT|PERF_MEM_LVL_MISS);
196 
197 
198 	if (mem_info && mem_info->data_src.mem_remote) {
199 		strcat(out, "Remote ");
200 		l += 7;
201 	}
202 
203 	printed = 0;
204 	for (i = 0; m && i < ARRAY_SIZE(mem_lvl); i++, m >>= 1) {
205 		if (!(m & 0x1))
206 			continue;
207 		if (printed++) {
208 			strcat(out, " or ");
209 			l += 4;
210 		}
211 		l += scnprintf(out + l, sz - l, mem_lvl[i]);
212 	}
213 
214 	if (mem_info && mem_info->data_src.mem_lvl_num) {
215 		int lvl = mem_info->data_src.mem_lvl_num;
216 		if (printed++) {
217 			strcat(out, " or ");
218 			l += 4;
219 		}
220 		if (mem_lvlnum[lvl])
221 			l += scnprintf(out + l, sz - l, mem_lvlnum[lvl]);
222 		else
223 			l += scnprintf(out + l, sz - l, "L%d", lvl);
224 	}
225 
226 	if (l == 0)
227 		l += scnprintf(out + l, sz - l, "N/A");
228 	if (hit)
229 		l += scnprintf(out + l, sz - l, " hit");
230 	if (miss)
231 		l += scnprintf(out + l, sz - l, " miss");
232 
233 	return l;
234 }
235 
236 static const char * const snoop_access[] = {
237 	"N/A",
238 	"None",
239 	"Hit",
240 	"Miss",
241 	"HitM",
242 };
243 
244 int perf_mem__snp_scnprintf(char *out, size_t sz, struct mem_info *mem_info)
245 {
246 	size_t i, l = 0;
247 	u64 m = PERF_MEM_SNOOP_NA;
248 
249 	sz -= 1; /* -1 for null termination */
250 	out[0] = '\0';
251 
252 	if (mem_info)
253 		m = mem_info->data_src.mem_snoop;
254 
255 	for (i = 0; m && i < ARRAY_SIZE(snoop_access); i++, m >>= 1) {
256 		if (!(m & 0x1))
257 			continue;
258 		if (l) {
259 			strcat(out, " or ");
260 			l += 4;
261 		}
262 		l += scnprintf(out + l, sz - l, snoop_access[i]);
263 	}
264 	if (mem_info &&
265 	     (mem_info->data_src.mem_snoopx & PERF_MEM_SNOOPX_FWD)) {
266 		if (l) {
267 			strcat(out, " or ");
268 			l += 4;
269 		}
270 		l += scnprintf(out + l, sz - l, "Fwd");
271 	}
272 
273 	if (*out == '\0')
274 		l += scnprintf(out, sz - l, "N/A");
275 
276 	return l;
277 }
278 
279 int perf_mem__lck_scnprintf(char *out, size_t sz, struct mem_info *mem_info)
280 {
281 	u64 mask = PERF_MEM_LOCK_NA;
282 	int l;
283 
284 	if (mem_info)
285 		mask = mem_info->data_src.mem_lock;
286 
287 	if (mask & PERF_MEM_LOCK_NA)
288 		l = scnprintf(out, sz, "N/A");
289 	else if (mask & PERF_MEM_LOCK_LOCKED)
290 		l = scnprintf(out, sz, "Yes");
291 	else
292 		l = scnprintf(out, sz, "No");
293 
294 	return l;
295 }
296 
297 int perf_script__meminfo_scnprintf(char *out, size_t sz, struct mem_info *mem_info)
298 {
299 	int i = 0;
300 
301 	i += perf_mem__lvl_scnprintf(out, sz, mem_info);
302 	i += scnprintf(out + i, sz - i, "|SNP ");
303 	i += perf_mem__snp_scnprintf(out + i, sz - i, mem_info);
304 	i += scnprintf(out + i, sz - i, "|TLB ");
305 	i += perf_mem__tlb_scnprintf(out + i, sz - i, mem_info);
306 	i += scnprintf(out + i, sz - i, "|LCK ");
307 	i += perf_mem__lck_scnprintf(out + i, sz - i, mem_info);
308 
309 	return i;
310 }
311 
312 int c2c_decode_stats(struct c2c_stats *stats, struct mem_info *mi)
313 {
314 	union perf_mem_data_src *data_src = &mi->data_src;
315 	u64 daddr  = mi->daddr.addr;
316 	u64 op     = data_src->mem_op;
317 	u64 lvl    = data_src->mem_lvl;
318 	u64 snoop  = data_src->mem_snoop;
319 	u64 lock   = data_src->mem_lock;
320 	/*
321 	 * Skylake might report unknown remote level via this
322 	 * bit, consider it when evaluating remote HITMs.
323 	 */
324 	bool mrem  = data_src->mem_remote;
325 	int err = 0;
326 
327 #define HITM_INC(__f)		\
328 do {				\
329 	stats->__f++;		\
330 	stats->tot_hitm++;	\
331 } while (0)
332 
333 #define P(a, b) PERF_MEM_##a##_##b
334 
335 	stats->nr_entries++;
336 
337 	if (lock & P(LOCK, LOCKED)) stats->locks++;
338 
339 	if (op & P(OP, LOAD)) {
340 		/* load */
341 		stats->load++;
342 
343 		if (!daddr) {
344 			stats->ld_noadrs++;
345 			return -1;
346 		}
347 
348 		if (lvl & P(LVL, HIT)) {
349 			if (lvl & P(LVL, UNC)) stats->ld_uncache++;
350 			if (lvl & P(LVL, IO))  stats->ld_io++;
351 			if (lvl & P(LVL, LFB)) stats->ld_fbhit++;
352 			if (lvl & P(LVL, L1 )) stats->ld_l1hit++;
353 			if (lvl & P(LVL, L2 )) stats->ld_l2hit++;
354 			if (lvl & P(LVL, L3 )) {
355 				if (snoop & P(SNOOP, HITM))
356 					HITM_INC(lcl_hitm);
357 				else
358 					stats->ld_llchit++;
359 			}
360 
361 			if (lvl & P(LVL, LOC_RAM)) {
362 				stats->lcl_dram++;
363 				if (snoop & P(SNOOP, HIT))
364 					stats->ld_shared++;
365 				else
366 					stats->ld_excl++;
367 			}
368 
369 			if ((lvl & P(LVL, REM_RAM1)) ||
370 			    (lvl & P(LVL, REM_RAM2)) ||
371 			     mrem) {
372 				stats->rmt_dram++;
373 				if (snoop & P(SNOOP, HIT))
374 					stats->ld_shared++;
375 				else
376 					stats->ld_excl++;
377 			}
378 		}
379 
380 		if ((lvl & P(LVL, REM_CCE1)) ||
381 		    (lvl & P(LVL, REM_CCE2)) ||
382 		     mrem) {
383 			if (snoop & P(SNOOP, HIT))
384 				stats->rmt_hit++;
385 			else if (snoop & P(SNOOP, HITM))
386 				HITM_INC(rmt_hitm);
387 		}
388 
389 		if ((lvl & P(LVL, MISS)))
390 			stats->ld_miss++;
391 
392 	} else if (op & P(OP, STORE)) {
393 		/* store */
394 		stats->store++;
395 
396 		if (!daddr) {
397 			stats->st_noadrs++;
398 			return -1;
399 		}
400 
401 		if (lvl & P(LVL, HIT)) {
402 			if (lvl & P(LVL, UNC)) stats->st_uncache++;
403 			if (lvl & P(LVL, L1 )) stats->st_l1hit++;
404 		}
405 		if (lvl & P(LVL, MISS))
406 			if (lvl & P(LVL, L1)) stats->st_l1miss++;
407 	} else {
408 		/* unparsable data_src? */
409 		stats->noparse++;
410 		return -1;
411 	}
412 
413 	if (!mi->daddr.map || !mi->iaddr.map) {
414 		stats->nomap++;
415 		return -1;
416 	}
417 
418 #undef P
419 #undef HITM_INC
420 	return err;
421 }
422 
423 void c2c_add_stats(struct c2c_stats *stats, struct c2c_stats *add)
424 {
425 	stats->nr_entries	+= add->nr_entries;
426 
427 	stats->locks		+= add->locks;
428 	stats->store		+= add->store;
429 	stats->st_uncache	+= add->st_uncache;
430 	stats->st_noadrs	+= add->st_noadrs;
431 	stats->st_l1hit		+= add->st_l1hit;
432 	stats->st_l1miss	+= add->st_l1miss;
433 	stats->load		+= add->load;
434 	stats->ld_excl		+= add->ld_excl;
435 	stats->ld_shared	+= add->ld_shared;
436 	stats->ld_uncache	+= add->ld_uncache;
437 	stats->ld_io		+= add->ld_io;
438 	stats->ld_miss		+= add->ld_miss;
439 	stats->ld_noadrs	+= add->ld_noadrs;
440 	stats->ld_fbhit		+= add->ld_fbhit;
441 	stats->ld_l1hit		+= add->ld_l1hit;
442 	stats->ld_l2hit		+= add->ld_l2hit;
443 	stats->ld_llchit	+= add->ld_llchit;
444 	stats->lcl_hitm		+= add->lcl_hitm;
445 	stats->rmt_hitm		+= add->rmt_hitm;
446 	stats->tot_hitm		+= add->tot_hitm;
447 	stats->rmt_hit		+= add->rmt_hit;
448 	stats->lcl_dram		+= add->lcl_dram;
449 	stats->rmt_dram		+= add->rmt_dram;
450 	stats->nomap		+= add->nomap;
451 	stats->noparse		+= add->noparse;
452 }
453