xref: /openbmc/linux/tools/perf/util/header.c (revision 9cfc5c90)
1 #include "util.h"
2 #include <sys/types.h>
3 #include <byteswap.h>
4 #include <unistd.h>
5 #include <stdio.h>
6 #include <stdlib.h>
7 #include <linux/list.h>
8 #include <linux/kernel.h>
9 #include <linux/bitops.h>
10 #include <sys/utsname.h>
11 
12 #include "evlist.h"
13 #include "evsel.h"
14 #include "header.h"
15 #include "../perf.h"
16 #include "trace-event.h"
17 #include "session.h"
18 #include "symbol.h"
19 #include "debug.h"
20 #include "cpumap.h"
21 #include "pmu.h"
22 #include "vdso.h"
23 #include "strbuf.h"
24 #include "build-id.h"
25 #include "data.h"
26 
27 /*
28  * magic2 = "PERFILE2"
29  * must be a numerical value to let the endianness
30  * determine the memory layout. That way we are able
31  * to detect endianness when reading the perf.data file
32  * back.
33  *
34  * we check for legacy (PERFFILE) format.
35  */
36 static const char *__perf_magic1 = "PERFFILE";
37 static const u64 __perf_magic2    = 0x32454c4946524550ULL;
38 static const u64 __perf_magic2_sw = 0x50455246494c4532ULL;
39 
40 #define PERF_MAGIC	__perf_magic2
41 
42 struct perf_file_attr {
43 	struct perf_event_attr	attr;
44 	struct perf_file_section	ids;
45 };
46 
47 void perf_header__set_feat(struct perf_header *header, int feat)
48 {
49 	set_bit(feat, header->adds_features);
50 }
51 
52 void perf_header__clear_feat(struct perf_header *header, int feat)
53 {
54 	clear_bit(feat, header->adds_features);
55 }
56 
57 bool perf_header__has_feat(const struct perf_header *header, int feat)
58 {
59 	return test_bit(feat, header->adds_features);
60 }
61 
62 static int do_write(int fd, const void *buf, size_t size)
63 {
64 	while (size) {
65 		int ret = write(fd, buf, size);
66 
67 		if (ret < 0)
68 			return -errno;
69 
70 		size -= ret;
71 		buf += ret;
72 	}
73 
74 	return 0;
75 }
76 
77 int write_padded(int fd, const void *bf, size_t count, size_t count_aligned)
78 {
79 	static const char zero_buf[NAME_ALIGN];
80 	int err = do_write(fd, bf, count);
81 
82 	if (!err)
83 		err = do_write(fd, zero_buf, count_aligned - count);
84 
85 	return err;
86 }
87 
88 #define string_size(str)						\
89 	(PERF_ALIGN((strlen(str) + 1), NAME_ALIGN) + sizeof(u32))
90 
91 static int do_write_string(int fd, const char *str)
92 {
93 	u32 len, olen;
94 	int ret;
95 
96 	olen = strlen(str) + 1;
97 	len = PERF_ALIGN(olen, NAME_ALIGN);
98 
99 	/* write len, incl. \0 */
100 	ret = do_write(fd, &len, sizeof(len));
101 	if (ret < 0)
102 		return ret;
103 
104 	return write_padded(fd, str, olen, len);
105 }
106 
107 static char *do_read_string(int fd, struct perf_header *ph)
108 {
109 	ssize_t sz, ret;
110 	u32 len;
111 	char *buf;
112 
113 	sz = readn(fd, &len, sizeof(len));
114 	if (sz < (ssize_t)sizeof(len))
115 		return NULL;
116 
117 	if (ph->needs_swap)
118 		len = bswap_32(len);
119 
120 	buf = malloc(len);
121 	if (!buf)
122 		return NULL;
123 
124 	ret = readn(fd, buf, len);
125 	if (ret == (ssize_t)len) {
126 		/*
127 		 * strings are padded by zeroes
128 		 * thus the actual strlen of buf
129 		 * may be less than len
130 		 */
131 		return buf;
132 	}
133 
134 	free(buf);
135 	return NULL;
136 }
137 
138 static int write_tracing_data(int fd, struct perf_header *h __maybe_unused,
139 			    struct perf_evlist *evlist)
140 {
141 	return read_tracing_data(fd, &evlist->entries);
142 }
143 
144 
145 static int write_build_id(int fd, struct perf_header *h,
146 			  struct perf_evlist *evlist __maybe_unused)
147 {
148 	struct perf_session *session;
149 	int err;
150 
151 	session = container_of(h, struct perf_session, header);
152 
153 	if (!perf_session__read_build_ids(session, true))
154 		return -1;
155 
156 	err = perf_session__write_buildid_table(session, fd);
157 	if (err < 0) {
158 		pr_debug("failed to write buildid table\n");
159 		return err;
160 	}
161 	perf_session__cache_build_ids(session);
162 
163 	return 0;
164 }
165 
166 static int write_hostname(int fd, struct perf_header *h __maybe_unused,
167 			  struct perf_evlist *evlist __maybe_unused)
168 {
169 	struct utsname uts;
170 	int ret;
171 
172 	ret = uname(&uts);
173 	if (ret < 0)
174 		return -1;
175 
176 	return do_write_string(fd, uts.nodename);
177 }
178 
179 static int write_osrelease(int fd, struct perf_header *h __maybe_unused,
180 			   struct perf_evlist *evlist __maybe_unused)
181 {
182 	struct utsname uts;
183 	int ret;
184 
185 	ret = uname(&uts);
186 	if (ret < 0)
187 		return -1;
188 
189 	return do_write_string(fd, uts.release);
190 }
191 
192 static int write_arch(int fd, struct perf_header *h __maybe_unused,
193 		      struct perf_evlist *evlist __maybe_unused)
194 {
195 	struct utsname uts;
196 	int ret;
197 
198 	ret = uname(&uts);
199 	if (ret < 0)
200 		return -1;
201 
202 	return do_write_string(fd, uts.machine);
203 }
204 
205 static int write_version(int fd, struct perf_header *h __maybe_unused,
206 			 struct perf_evlist *evlist __maybe_unused)
207 {
208 	return do_write_string(fd, perf_version_string);
209 }
210 
211 static int __write_cpudesc(int fd, const char *cpuinfo_proc)
212 {
213 	FILE *file;
214 	char *buf = NULL;
215 	char *s, *p;
216 	const char *search = cpuinfo_proc;
217 	size_t len = 0;
218 	int ret = -1;
219 
220 	if (!search)
221 		return -1;
222 
223 	file = fopen("/proc/cpuinfo", "r");
224 	if (!file)
225 		return -1;
226 
227 	while (getline(&buf, &len, file) > 0) {
228 		ret = strncmp(buf, search, strlen(search));
229 		if (!ret)
230 			break;
231 	}
232 
233 	if (ret) {
234 		ret = -1;
235 		goto done;
236 	}
237 
238 	s = buf;
239 
240 	p = strchr(buf, ':');
241 	if (p && *(p+1) == ' ' && *(p+2))
242 		s = p + 2;
243 	p = strchr(s, '\n');
244 	if (p)
245 		*p = '\0';
246 
247 	/* squash extra space characters (branding string) */
248 	p = s;
249 	while (*p) {
250 		if (isspace(*p)) {
251 			char *r = p + 1;
252 			char *q = r;
253 			*p = ' ';
254 			while (*q && isspace(*q))
255 				q++;
256 			if (q != (p+1))
257 				while ((*r++ = *q++));
258 		}
259 		p++;
260 	}
261 	ret = do_write_string(fd, s);
262 done:
263 	free(buf);
264 	fclose(file);
265 	return ret;
266 }
267 
268 static int write_cpudesc(int fd, struct perf_header *h __maybe_unused,
269 		       struct perf_evlist *evlist __maybe_unused)
270 {
271 #ifndef CPUINFO_PROC
272 #define CPUINFO_PROC {"model name", }
273 #endif
274 	const char *cpuinfo_procs[] = CPUINFO_PROC;
275 	unsigned int i;
276 
277 	for (i = 0; i < ARRAY_SIZE(cpuinfo_procs); i++) {
278 		int ret;
279 		ret = __write_cpudesc(fd, cpuinfo_procs[i]);
280 		if (ret >= 0)
281 			return ret;
282 	}
283 	return -1;
284 }
285 
286 
287 static int write_nrcpus(int fd, struct perf_header *h __maybe_unused,
288 			struct perf_evlist *evlist __maybe_unused)
289 {
290 	long nr;
291 	u32 nrc, nra;
292 	int ret;
293 
294 	nr = sysconf(_SC_NPROCESSORS_CONF);
295 	if (nr < 0)
296 		return -1;
297 
298 	nrc = (u32)(nr & UINT_MAX);
299 
300 	nr = sysconf(_SC_NPROCESSORS_ONLN);
301 	if (nr < 0)
302 		return -1;
303 
304 	nra = (u32)(nr & UINT_MAX);
305 
306 	ret = do_write(fd, &nrc, sizeof(nrc));
307 	if (ret < 0)
308 		return ret;
309 
310 	return do_write(fd, &nra, sizeof(nra));
311 }
312 
313 static int write_event_desc(int fd, struct perf_header *h __maybe_unused,
314 			    struct perf_evlist *evlist)
315 {
316 	struct perf_evsel *evsel;
317 	u32 nre, nri, sz;
318 	int ret;
319 
320 	nre = evlist->nr_entries;
321 
322 	/*
323 	 * write number of events
324 	 */
325 	ret = do_write(fd, &nre, sizeof(nre));
326 	if (ret < 0)
327 		return ret;
328 
329 	/*
330 	 * size of perf_event_attr struct
331 	 */
332 	sz = (u32)sizeof(evsel->attr);
333 	ret = do_write(fd, &sz, sizeof(sz));
334 	if (ret < 0)
335 		return ret;
336 
337 	evlist__for_each(evlist, evsel) {
338 		ret = do_write(fd, &evsel->attr, sz);
339 		if (ret < 0)
340 			return ret;
341 		/*
342 		 * write number of unique id per event
343 		 * there is one id per instance of an event
344 		 *
345 		 * copy into an nri to be independent of the
346 		 * type of ids,
347 		 */
348 		nri = evsel->ids;
349 		ret = do_write(fd, &nri, sizeof(nri));
350 		if (ret < 0)
351 			return ret;
352 
353 		/*
354 		 * write event string as passed on cmdline
355 		 */
356 		ret = do_write_string(fd, perf_evsel__name(evsel));
357 		if (ret < 0)
358 			return ret;
359 		/*
360 		 * write unique ids for this event
361 		 */
362 		ret = do_write(fd, evsel->id, evsel->ids * sizeof(u64));
363 		if (ret < 0)
364 			return ret;
365 	}
366 	return 0;
367 }
368 
369 static int write_cmdline(int fd, struct perf_header *h __maybe_unused,
370 			 struct perf_evlist *evlist __maybe_unused)
371 {
372 	char buf[MAXPATHLEN];
373 	char proc[32];
374 	u32 n;
375 	int i, ret;
376 
377 	/*
378 	 * actual atual path to perf binary
379 	 */
380 	sprintf(proc, "/proc/%d/exe", getpid());
381 	ret = readlink(proc, buf, sizeof(buf));
382 	if (ret <= 0)
383 		return -1;
384 
385 	/* readlink() does not add null termination */
386 	buf[ret] = '\0';
387 
388 	/* account for binary path */
389 	n = perf_env.nr_cmdline + 1;
390 
391 	ret = do_write(fd, &n, sizeof(n));
392 	if (ret < 0)
393 		return ret;
394 
395 	ret = do_write_string(fd, buf);
396 	if (ret < 0)
397 		return ret;
398 
399 	for (i = 0 ; i < perf_env.nr_cmdline; i++) {
400 		ret = do_write_string(fd, perf_env.cmdline_argv[i]);
401 		if (ret < 0)
402 			return ret;
403 	}
404 	return 0;
405 }
406 
407 #define CORE_SIB_FMT \
408 	"/sys/devices/system/cpu/cpu%d/topology/core_siblings_list"
409 #define THRD_SIB_FMT \
410 	"/sys/devices/system/cpu/cpu%d/topology/thread_siblings_list"
411 
412 struct cpu_topo {
413 	u32 cpu_nr;
414 	u32 core_sib;
415 	u32 thread_sib;
416 	char **core_siblings;
417 	char **thread_siblings;
418 };
419 
420 static int build_cpu_topo(struct cpu_topo *tp, int cpu)
421 {
422 	FILE *fp;
423 	char filename[MAXPATHLEN];
424 	char *buf = NULL, *p;
425 	size_t len = 0;
426 	ssize_t sret;
427 	u32 i = 0;
428 	int ret = -1;
429 
430 	sprintf(filename, CORE_SIB_FMT, cpu);
431 	fp = fopen(filename, "r");
432 	if (!fp)
433 		goto try_threads;
434 
435 	sret = getline(&buf, &len, fp);
436 	fclose(fp);
437 	if (sret <= 0)
438 		goto try_threads;
439 
440 	p = strchr(buf, '\n');
441 	if (p)
442 		*p = '\0';
443 
444 	for (i = 0; i < tp->core_sib; i++) {
445 		if (!strcmp(buf, tp->core_siblings[i]))
446 			break;
447 	}
448 	if (i == tp->core_sib) {
449 		tp->core_siblings[i] = buf;
450 		tp->core_sib++;
451 		buf = NULL;
452 		len = 0;
453 	}
454 	ret = 0;
455 
456 try_threads:
457 	sprintf(filename, THRD_SIB_FMT, cpu);
458 	fp = fopen(filename, "r");
459 	if (!fp)
460 		goto done;
461 
462 	if (getline(&buf, &len, fp) <= 0)
463 		goto done;
464 
465 	p = strchr(buf, '\n');
466 	if (p)
467 		*p = '\0';
468 
469 	for (i = 0; i < tp->thread_sib; i++) {
470 		if (!strcmp(buf, tp->thread_siblings[i]))
471 			break;
472 	}
473 	if (i == tp->thread_sib) {
474 		tp->thread_siblings[i] = buf;
475 		tp->thread_sib++;
476 		buf = NULL;
477 	}
478 	ret = 0;
479 done:
480 	if(fp)
481 		fclose(fp);
482 	free(buf);
483 	return ret;
484 }
485 
486 static void free_cpu_topo(struct cpu_topo *tp)
487 {
488 	u32 i;
489 
490 	if (!tp)
491 		return;
492 
493 	for (i = 0 ; i < tp->core_sib; i++)
494 		zfree(&tp->core_siblings[i]);
495 
496 	for (i = 0 ; i < tp->thread_sib; i++)
497 		zfree(&tp->thread_siblings[i]);
498 
499 	free(tp);
500 }
501 
502 static struct cpu_topo *build_cpu_topology(void)
503 {
504 	struct cpu_topo *tp;
505 	void *addr;
506 	u32 nr, i;
507 	size_t sz;
508 	long ncpus;
509 	int ret = -1;
510 
511 	ncpus = sysconf(_SC_NPROCESSORS_CONF);
512 	if (ncpus < 0)
513 		return NULL;
514 
515 	nr = (u32)(ncpus & UINT_MAX);
516 
517 	sz = nr * sizeof(char *);
518 
519 	addr = calloc(1, sizeof(*tp) + 2 * sz);
520 	if (!addr)
521 		return NULL;
522 
523 	tp = addr;
524 	tp->cpu_nr = nr;
525 	addr += sizeof(*tp);
526 	tp->core_siblings = addr;
527 	addr += sz;
528 	tp->thread_siblings = addr;
529 
530 	for (i = 0; i < nr; i++) {
531 		ret = build_cpu_topo(tp, i);
532 		if (ret < 0)
533 			break;
534 	}
535 	if (ret) {
536 		free_cpu_topo(tp);
537 		tp = NULL;
538 	}
539 	return tp;
540 }
541 
542 static int write_cpu_topology(int fd, struct perf_header *h __maybe_unused,
543 			  struct perf_evlist *evlist __maybe_unused)
544 {
545 	struct cpu_topo *tp;
546 	u32 i;
547 	int ret, j;
548 
549 	tp = build_cpu_topology();
550 	if (!tp)
551 		return -1;
552 
553 	ret = do_write(fd, &tp->core_sib, sizeof(tp->core_sib));
554 	if (ret < 0)
555 		goto done;
556 
557 	for (i = 0; i < tp->core_sib; i++) {
558 		ret = do_write_string(fd, tp->core_siblings[i]);
559 		if (ret < 0)
560 			goto done;
561 	}
562 	ret = do_write(fd, &tp->thread_sib, sizeof(tp->thread_sib));
563 	if (ret < 0)
564 		goto done;
565 
566 	for (i = 0; i < tp->thread_sib; i++) {
567 		ret = do_write_string(fd, tp->thread_siblings[i]);
568 		if (ret < 0)
569 			break;
570 	}
571 
572 	ret = perf_env__read_cpu_topology_map(&perf_env);
573 	if (ret < 0)
574 		goto done;
575 
576 	for (j = 0; j < perf_env.nr_cpus_avail; j++) {
577 		ret = do_write(fd, &perf_env.cpu[j].core_id,
578 			       sizeof(perf_env.cpu[j].core_id));
579 		if (ret < 0)
580 			return ret;
581 		ret = do_write(fd, &perf_env.cpu[j].socket_id,
582 			       sizeof(perf_env.cpu[j].socket_id));
583 		if (ret < 0)
584 			return ret;
585 	}
586 done:
587 	free_cpu_topo(tp);
588 	return ret;
589 }
590 
591 
592 
593 static int write_total_mem(int fd, struct perf_header *h __maybe_unused,
594 			  struct perf_evlist *evlist __maybe_unused)
595 {
596 	char *buf = NULL;
597 	FILE *fp;
598 	size_t len = 0;
599 	int ret = -1, n;
600 	uint64_t mem;
601 
602 	fp = fopen("/proc/meminfo", "r");
603 	if (!fp)
604 		return -1;
605 
606 	while (getline(&buf, &len, fp) > 0) {
607 		ret = strncmp(buf, "MemTotal:", 9);
608 		if (!ret)
609 			break;
610 	}
611 	if (!ret) {
612 		n = sscanf(buf, "%*s %"PRIu64, &mem);
613 		if (n == 1)
614 			ret = do_write(fd, &mem, sizeof(mem));
615 	} else
616 		ret = -1;
617 	free(buf);
618 	fclose(fp);
619 	return ret;
620 }
621 
622 static int write_topo_node(int fd, int node)
623 {
624 	char str[MAXPATHLEN];
625 	char field[32];
626 	char *buf = NULL, *p;
627 	size_t len = 0;
628 	FILE *fp;
629 	u64 mem_total, mem_free, mem;
630 	int ret = -1;
631 
632 	sprintf(str, "/sys/devices/system/node/node%d/meminfo", node);
633 	fp = fopen(str, "r");
634 	if (!fp)
635 		return -1;
636 
637 	while (getline(&buf, &len, fp) > 0) {
638 		/* skip over invalid lines */
639 		if (!strchr(buf, ':'))
640 			continue;
641 		if (sscanf(buf, "%*s %*d %31s %"PRIu64, field, &mem) != 2)
642 			goto done;
643 		if (!strcmp(field, "MemTotal:"))
644 			mem_total = mem;
645 		if (!strcmp(field, "MemFree:"))
646 			mem_free = mem;
647 	}
648 
649 	fclose(fp);
650 	fp = NULL;
651 
652 	ret = do_write(fd, &mem_total, sizeof(u64));
653 	if (ret)
654 		goto done;
655 
656 	ret = do_write(fd, &mem_free, sizeof(u64));
657 	if (ret)
658 		goto done;
659 
660 	ret = -1;
661 	sprintf(str, "/sys/devices/system/node/node%d/cpulist", node);
662 
663 	fp = fopen(str, "r");
664 	if (!fp)
665 		goto done;
666 
667 	if (getline(&buf, &len, fp) <= 0)
668 		goto done;
669 
670 	p = strchr(buf, '\n');
671 	if (p)
672 		*p = '\0';
673 
674 	ret = do_write_string(fd, buf);
675 done:
676 	free(buf);
677 	if (fp)
678 		fclose(fp);
679 	return ret;
680 }
681 
682 static int write_numa_topology(int fd, struct perf_header *h __maybe_unused,
683 			  struct perf_evlist *evlist __maybe_unused)
684 {
685 	char *buf = NULL;
686 	size_t len = 0;
687 	FILE *fp;
688 	struct cpu_map *node_map = NULL;
689 	char *c;
690 	u32 nr, i, j;
691 	int ret = -1;
692 
693 	fp = fopen("/sys/devices/system/node/online", "r");
694 	if (!fp)
695 		return -1;
696 
697 	if (getline(&buf, &len, fp) <= 0)
698 		goto done;
699 
700 	c = strchr(buf, '\n');
701 	if (c)
702 		*c = '\0';
703 
704 	node_map = cpu_map__new(buf);
705 	if (!node_map)
706 		goto done;
707 
708 	nr = (u32)node_map->nr;
709 
710 	ret = do_write(fd, &nr, sizeof(nr));
711 	if (ret < 0)
712 		goto done;
713 
714 	for (i = 0; i < nr; i++) {
715 		j = (u32)node_map->map[i];
716 		ret = do_write(fd, &j, sizeof(j));
717 		if (ret < 0)
718 			break;
719 
720 		ret = write_topo_node(fd, i);
721 		if (ret < 0)
722 			break;
723 	}
724 done:
725 	free(buf);
726 	fclose(fp);
727 	free(node_map);
728 	return ret;
729 }
730 
731 /*
732  * File format:
733  *
734  * struct pmu_mappings {
735  *	u32	pmu_num;
736  *	struct pmu_map {
737  *		u32	type;
738  *		char	name[];
739  *	}[pmu_num];
740  * };
741  */
742 
743 static int write_pmu_mappings(int fd, struct perf_header *h __maybe_unused,
744 			      struct perf_evlist *evlist __maybe_unused)
745 {
746 	struct perf_pmu *pmu = NULL;
747 	off_t offset = lseek(fd, 0, SEEK_CUR);
748 	__u32 pmu_num = 0;
749 	int ret;
750 
751 	/* write real pmu_num later */
752 	ret = do_write(fd, &pmu_num, sizeof(pmu_num));
753 	if (ret < 0)
754 		return ret;
755 
756 	while ((pmu = perf_pmu__scan(pmu))) {
757 		if (!pmu->name)
758 			continue;
759 		pmu_num++;
760 
761 		ret = do_write(fd, &pmu->type, sizeof(pmu->type));
762 		if (ret < 0)
763 			return ret;
764 
765 		ret = do_write_string(fd, pmu->name);
766 		if (ret < 0)
767 			return ret;
768 	}
769 
770 	if (pwrite(fd, &pmu_num, sizeof(pmu_num), offset) != sizeof(pmu_num)) {
771 		/* discard all */
772 		lseek(fd, offset, SEEK_SET);
773 		return -1;
774 	}
775 
776 	return 0;
777 }
778 
779 /*
780  * File format:
781  *
782  * struct group_descs {
783  *	u32	nr_groups;
784  *	struct group_desc {
785  *		char	name[];
786  *		u32	leader_idx;
787  *		u32	nr_members;
788  *	}[nr_groups];
789  * };
790  */
791 static int write_group_desc(int fd, struct perf_header *h __maybe_unused,
792 			    struct perf_evlist *evlist)
793 {
794 	u32 nr_groups = evlist->nr_groups;
795 	struct perf_evsel *evsel;
796 	int ret;
797 
798 	ret = do_write(fd, &nr_groups, sizeof(nr_groups));
799 	if (ret < 0)
800 		return ret;
801 
802 	evlist__for_each(evlist, evsel) {
803 		if (perf_evsel__is_group_leader(evsel) &&
804 		    evsel->nr_members > 1) {
805 			const char *name = evsel->group_name ?: "{anon_group}";
806 			u32 leader_idx = evsel->idx;
807 			u32 nr_members = evsel->nr_members;
808 
809 			ret = do_write_string(fd, name);
810 			if (ret < 0)
811 				return ret;
812 
813 			ret = do_write(fd, &leader_idx, sizeof(leader_idx));
814 			if (ret < 0)
815 				return ret;
816 
817 			ret = do_write(fd, &nr_members, sizeof(nr_members));
818 			if (ret < 0)
819 				return ret;
820 		}
821 	}
822 	return 0;
823 }
824 
825 /*
826  * default get_cpuid(): nothing gets recorded
827  * actual implementation must be in arch/$(ARCH)/util/header.c
828  */
829 int __attribute__ ((weak)) get_cpuid(char *buffer __maybe_unused,
830 				     size_t sz __maybe_unused)
831 {
832 	return -1;
833 }
834 
835 static int write_cpuid(int fd, struct perf_header *h __maybe_unused,
836 		       struct perf_evlist *evlist __maybe_unused)
837 {
838 	char buffer[64];
839 	int ret;
840 
841 	ret = get_cpuid(buffer, sizeof(buffer));
842 	if (!ret)
843 		goto write_it;
844 
845 	return -1;
846 write_it:
847 	return do_write_string(fd, buffer);
848 }
849 
850 static int write_branch_stack(int fd __maybe_unused,
851 			      struct perf_header *h __maybe_unused,
852 		       struct perf_evlist *evlist __maybe_unused)
853 {
854 	return 0;
855 }
856 
857 static int write_auxtrace(int fd, struct perf_header *h,
858 			  struct perf_evlist *evlist __maybe_unused)
859 {
860 	struct perf_session *session;
861 	int err;
862 
863 	session = container_of(h, struct perf_session, header);
864 
865 	err = auxtrace_index__write(fd, &session->auxtrace_index);
866 	if (err < 0)
867 		pr_err("Failed to write auxtrace index\n");
868 	return err;
869 }
870 
871 static void print_hostname(struct perf_header *ph, int fd __maybe_unused,
872 			   FILE *fp)
873 {
874 	fprintf(fp, "# hostname : %s\n", ph->env.hostname);
875 }
876 
877 static void print_osrelease(struct perf_header *ph, int fd __maybe_unused,
878 			    FILE *fp)
879 {
880 	fprintf(fp, "# os release : %s\n", ph->env.os_release);
881 }
882 
883 static void print_arch(struct perf_header *ph, int fd __maybe_unused, FILE *fp)
884 {
885 	fprintf(fp, "# arch : %s\n", ph->env.arch);
886 }
887 
888 static void print_cpudesc(struct perf_header *ph, int fd __maybe_unused,
889 			  FILE *fp)
890 {
891 	fprintf(fp, "# cpudesc : %s\n", ph->env.cpu_desc);
892 }
893 
894 static void print_nrcpus(struct perf_header *ph, int fd __maybe_unused,
895 			 FILE *fp)
896 {
897 	fprintf(fp, "# nrcpus online : %u\n", ph->env.nr_cpus_online);
898 	fprintf(fp, "# nrcpus avail : %u\n", ph->env.nr_cpus_avail);
899 }
900 
901 static void print_version(struct perf_header *ph, int fd __maybe_unused,
902 			  FILE *fp)
903 {
904 	fprintf(fp, "# perf version : %s\n", ph->env.version);
905 }
906 
907 static void print_cmdline(struct perf_header *ph, int fd __maybe_unused,
908 			  FILE *fp)
909 {
910 	int nr, i;
911 
912 	nr = ph->env.nr_cmdline;
913 
914 	fprintf(fp, "# cmdline : ");
915 
916 	for (i = 0; i < nr; i++)
917 		fprintf(fp, "%s ", ph->env.cmdline_argv[i]);
918 	fputc('\n', fp);
919 }
920 
921 static void print_cpu_topology(struct perf_header *ph, int fd __maybe_unused,
922 			       FILE *fp)
923 {
924 	int nr, i;
925 	char *str;
926 	int cpu_nr = ph->env.nr_cpus_online;
927 
928 	nr = ph->env.nr_sibling_cores;
929 	str = ph->env.sibling_cores;
930 
931 	for (i = 0; i < nr; i++) {
932 		fprintf(fp, "# sibling cores   : %s\n", str);
933 		str += strlen(str) + 1;
934 	}
935 
936 	nr = ph->env.nr_sibling_threads;
937 	str = ph->env.sibling_threads;
938 
939 	for (i = 0; i < nr; i++) {
940 		fprintf(fp, "# sibling threads : %s\n", str);
941 		str += strlen(str) + 1;
942 	}
943 
944 	if (ph->env.cpu != NULL) {
945 		for (i = 0; i < cpu_nr; i++)
946 			fprintf(fp, "# CPU %d: Core ID %d, Socket ID %d\n", i,
947 				ph->env.cpu[i].core_id, ph->env.cpu[i].socket_id);
948 	} else
949 		fprintf(fp, "# Core ID and Socket ID information is not available\n");
950 }
951 
952 static void free_event_desc(struct perf_evsel *events)
953 {
954 	struct perf_evsel *evsel;
955 
956 	if (!events)
957 		return;
958 
959 	for (evsel = events; evsel->attr.size; evsel++) {
960 		zfree(&evsel->name);
961 		zfree(&evsel->id);
962 	}
963 
964 	free(events);
965 }
966 
967 static struct perf_evsel *
968 read_event_desc(struct perf_header *ph, int fd)
969 {
970 	struct perf_evsel *evsel, *events = NULL;
971 	u64 *id;
972 	void *buf = NULL;
973 	u32 nre, sz, nr, i, j;
974 	ssize_t ret;
975 	size_t msz;
976 
977 	/* number of events */
978 	ret = readn(fd, &nre, sizeof(nre));
979 	if (ret != (ssize_t)sizeof(nre))
980 		goto error;
981 
982 	if (ph->needs_swap)
983 		nre = bswap_32(nre);
984 
985 	ret = readn(fd, &sz, sizeof(sz));
986 	if (ret != (ssize_t)sizeof(sz))
987 		goto error;
988 
989 	if (ph->needs_swap)
990 		sz = bswap_32(sz);
991 
992 	/* buffer to hold on file attr struct */
993 	buf = malloc(sz);
994 	if (!buf)
995 		goto error;
996 
997 	/* the last event terminates with evsel->attr.size == 0: */
998 	events = calloc(nre + 1, sizeof(*events));
999 	if (!events)
1000 		goto error;
1001 
1002 	msz = sizeof(evsel->attr);
1003 	if (sz < msz)
1004 		msz = sz;
1005 
1006 	for (i = 0, evsel = events; i < nre; evsel++, i++) {
1007 		evsel->idx = i;
1008 
1009 		/*
1010 		 * must read entire on-file attr struct to
1011 		 * sync up with layout.
1012 		 */
1013 		ret = readn(fd, buf, sz);
1014 		if (ret != (ssize_t)sz)
1015 			goto error;
1016 
1017 		if (ph->needs_swap)
1018 			perf_event__attr_swap(buf);
1019 
1020 		memcpy(&evsel->attr, buf, msz);
1021 
1022 		ret = readn(fd, &nr, sizeof(nr));
1023 		if (ret != (ssize_t)sizeof(nr))
1024 			goto error;
1025 
1026 		if (ph->needs_swap) {
1027 			nr = bswap_32(nr);
1028 			evsel->needs_swap = true;
1029 		}
1030 
1031 		evsel->name = do_read_string(fd, ph);
1032 
1033 		if (!nr)
1034 			continue;
1035 
1036 		id = calloc(nr, sizeof(*id));
1037 		if (!id)
1038 			goto error;
1039 		evsel->ids = nr;
1040 		evsel->id = id;
1041 
1042 		for (j = 0 ; j < nr; j++) {
1043 			ret = readn(fd, id, sizeof(*id));
1044 			if (ret != (ssize_t)sizeof(*id))
1045 				goto error;
1046 			if (ph->needs_swap)
1047 				*id = bswap_64(*id);
1048 			id++;
1049 		}
1050 	}
1051 out:
1052 	free(buf);
1053 	return events;
1054 error:
1055 	free_event_desc(events);
1056 	events = NULL;
1057 	goto out;
1058 }
1059 
1060 static int __desc_attr__fprintf(FILE *fp, const char *name, const char *val,
1061 				void *priv __attribute__((unused)))
1062 {
1063 	return fprintf(fp, ", %s = %s", name, val);
1064 }
1065 
1066 static void print_event_desc(struct perf_header *ph, int fd, FILE *fp)
1067 {
1068 	struct perf_evsel *evsel, *events = read_event_desc(ph, fd);
1069 	u32 j;
1070 	u64 *id;
1071 
1072 	if (!events) {
1073 		fprintf(fp, "# event desc: not available or unable to read\n");
1074 		return;
1075 	}
1076 
1077 	for (evsel = events; evsel->attr.size; evsel++) {
1078 		fprintf(fp, "# event : name = %s, ", evsel->name);
1079 
1080 		if (evsel->ids) {
1081 			fprintf(fp, ", id = {");
1082 			for (j = 0, id = evsel->id; j < evsel->ids; j++, id++) {
1083 				if (j)
1084 					fputc(',', fp);
1085 				fprintf(fp, " %"PRIu64, *id);
1086 			}
1087 			fprintf(fp, " }");
1088 		}
1089 
1090 		perf_event_attr__fprintf(fp, &evsel->attr, __desc_attr__fprintf, NULL);
1091 
1092 		fputc('\n', fp);
1093 	}
1094 
1095 	free_event_desc(events);
1096 }
1097 
1098 static void print_total_mem(struct perf_header *ph, int fd __maybe_unused,
1099 			    FILE *fp)
1100 {
1101 	fprintf(fp, "# total memory : %Lu kB\n", ph->env.total_mem);
1102 }
1103 
1104 static void print_numa_topology(struct perf_header *ph, int fd __maybe_unused,
1105 				FILE *fp)
1106 {
1107 	u32 nr, c, i;
1108 	char *str, *tmp;
1109 	uint64_t mem_total, mem_free;
1110 
1111 	/* nr nodes */
1112 	nr = ph->env.nr_numa_nodes;
1113 	str = ph->env.numa_nodes;
1114 
1115 	for (i = 0; i < nr; i++) {
1116 		/* node number */
1117 		c = strtoul(str, &tmp, 0);
1118 		if (*tmp != ':')
1119 			goto error;
1120 
1121 		str = tmp + 1;
1122 		mem_total = strtoull(str, &tmp, 0);
1123 		if (*tmp != ':')
1124 			goto error;
1125 
1126 		str = tmp + 1;
1127 		mem_free = strtoull(str, &tmp, 0);
1128 		if (*tmp != ':')
1129 			goto error;
1130 
1131 		fprintf(fp, "# node%u meminfo  : total = %"PRIu64" kB,"
1132 			    " free = %"PRIu64" kB\n",
1133 			c, mem_total, mem_free);
1134 
1135 		str = tmp + 1;
1136 		fprintf(fp, "# node%u cpu list : %s\n", c, str);
1137 
1138 		str += strlen(str) + 1;
1139 	}
1140 	return;
1141 error:
1142 	fprintf(fp, "# numa topology : not available\n");
1143 }
1144 
1145 static void print_cpuid(struct perf_header *ph, int fd __maybe_unused, FILE *fp)
1146 {
1147 	fprintf(fp, "# cpuid : %s\n", ph->env.cpuid);
1148 }
1149 
1150 static void print_branch_stack(struct perf_header *ph __maybe_unused,
1151 			       int fd __maybe_unused, FILE *fp)
1152 {
1153 	fprintf(fp, "# contains samples with branch stack\n");
1154 }
1155 
1156 static void print_auxtrace(struct perf_header *ph __maybe_unused,
1157 			   int fd __maybe_unused, FILE *fp)
1158 {
1159 	fprintf(fp, "# contains AUX area data (e.g. instruction trace)\n");
1160 }
1161 
1162 static void print_pmu_mappings(struct perf_header *ph, int fd __maybe_unused,
1163 			       FILE *fp)
1164 {
1165 	const char *delimiter = "# pmu mappings: ";
1166 	char *str, *tmp;
1167 	u32 pmu_num;
1168 	u32 type;
1169 
1170 	pmu_num = ph->env.nr_pmu_mappings;
1171 	if (!pmu_num) {
1172 		fprintf(fp, "# pmu mappings: not available\n");
1173 		return;
1174 	}
1175 
1176 	str = ph->env.pmu_mappings;
1177 
1178 	while (pmu_num) {
1179 		type = strtoul(str, &tmp, 0);
1180 		if (*tmp != ':')
1181 			goto error;
1182 
1183 		str = tmp + 1;
1184 		fprintf(fp, "%s%s = %" PRIu32, delimiter, str, type);
1185 
1186 		delimiter = ", ";
1187 		str += strlen(str) + 1;
1188 		pmu_num--;
1189 	}
1190 
1191 	fprintf(fp, "\n");
1192 
1193 	if (!pmu_num)
1194 		return;
1195 error:
1196 	fprintf(fp, "# pmu mappings: unable to read\n");
1197 }
1198 
1199 static void print_group_desc(struct perf_header *ph, int fd __maybe_unused,
1200 			     FILE *fp)
1201 {
1202 	struct perf_session *session;
1203 	struct perf_evsel *evsel;
1204 	u32 nr = 0;
1205 
1206 	session = container_of(ph, struct perf_session, header);
1207 
1208 	evlist__for_each(session->evlist, evsel) {
1209 		if (perf_evsel__is_group_leader(evsel) &&
1210 		    evsel->nr_members > 1) {
1211 			fprintf(fp, "# group: %s{%s", evsel->group_name ?: "",
1212 				perf_evsel__name(evsel));
1213 
1214 			nr = evsel->nr_members - 1;
1215 		} else if (nr) {
1216 			fprintf(fp, ",%s", perf_evsel__name(evsel));
1217 
1218 			if (--nr == 0)
1219 				fprintf(fp, "}\n");
1220 		}
1221 	}
1222 }
1223 
1224 static int __event_process_build_id(struct build_id_event *bev,
1225 				    char *filename,
1226 				    struct perf_session *session)
1227 {
1228 	int err = -1;
1229 	struct machine *machine;
1230 	u16 cpumode;
1231 	struct dso *dso;
1232 	enum dso_kernel_type dso_type;
1233 
1234 	machine = perf_session__findnew_machine(session, bev->pid);
1235 	if (!machine)
1236 		goto out;
1237 
1238 	cpumode = bev->header.misc & PERF_RECORD_MISC_CPUMODE_MASK;
1239 
1240 	switch (cpumode) {
1241 	case PERF_RECORD_MISC_KERNEL:
1242 		dso_type = DSO_TYPE_KERNEL;
1243 		break;
1244 	case PERF_RECORD_MISC_GUEST_KERNEL:
1245 		dso_type = DSO_TYPE_GUEST_KERNEL;
1246 		break;
1247 	case PERF_RECORD_MISC_USER:
1248 	case PERF_RECORD_MISC_GUEST_USER:
1249 		dso_type = DSO_TYPE_USER;
1250 		break;
1251 	default:
1252 		goto out;
1253 	}
1254 
1255 	dso = machine__findnew_dso(machine, filename);
1256 	if (dso != NULL) {
1257 		char sbuild_id[BUILD_ID_SIZE * 2 + 1];
1258 
1259 		dso__set_build_id(dso, &bev->build_id);
1260 
1261 		if (!is_kernel_module(filename, cpumode))
1262 			dso->kernel = dso_type;
1263 
1264 		build_id__sprintf(dso->build_id, sizeof(dso->build_id),
1265 				  sbuild_id);
1266 		pr_debug("build id event received for %s: %s\n",
1267 			 dso->long_name, sbuild_id);
1268 		dso__put(dso);
1269 	}
1270 
1271 	err = 0;
1272 out:
1273 	return err;
1274 }
1275 
1276 static int perf_header__read_build_ids_abi_quirk(struct perf_header *header,
1277 						 int input, u64 offset, u64 size)
1278 {
1279 	struct perf_session *session = container_of(header, struct perf_session, header);
1280 	struct {
1281 		struct perf_event_header   header;
1282 		u8			   build_id[PERF_ALIGN(BUILD_ID_SIZE, sizeof(u64))];
1283 		char			   filename[0];
1284 	} old_bev;
1285 	struct build_id_event bev;
1286 	char filename[PATH_MAX];
1287 	u64 limit = offset + size;
1288 
1289 	while (offset < limit) {
1290 		ssize_t len;
1291 
1292 		if (readn(input, &old_bev, sizeof(old_bev)) != sizeof(old_bev))
1293 			return -1;
1294 
1295 		if (header->needs_swap)
1296 			perf_event_header__bswap(&old_bev.header);
1297 
1298 		len = old_bev.header.size - sizeof(old_bev);
1299 		if (readn(input, filename, len) != len)
1300 			return -1;
1301 
1302 		bev.header = old_bev.header;
1303 
1304 		/*
1305 		 * As the pid is the missing value, we need to fill
1306 		 * it properly. The header.misc value give us nice hint.
1307 		 */
1308 		bev.pid	= HOST_KERNEL_ID;
1309 		if (bev.header.misc == PERF_RECORD_MISC_GUEST_USER ||
1310 		    bev.header.misc == PERF_RECORD_MISC_GUEST_KERNEL)
1311 			bev.pid	= DEFAULT_GUEST_KERNEL_ID;
1312 
1313 		memcpy(bev.build_id, old_bev.build_id, sizeof(bev.build_id));
1314 		__event_process_build_id(&bev, filename, session);
1315 
1316 		offset += bev.header.size;
1317 	}
1318 
1319 	return 0;
1320 }
1321 
1322 static int perf_header__read_build_ids(struct perf_header *header,
1323 				       int input, u64 offset, u64 size)
1324 {
1325 	struct perf_session *session = container_of(header, struct perf_session, header);
1326 	struct build_id_event bev;
1327 	char filename[PATH_MAX];
1328 	u64 limit = offset + size, orig_offset = offset;
1329 	int err = -1;
1330 
1331 	while (offset < limit) {
1332 		ssize_t len;
1333 
1334 		if (readn(input, &bev, sizeof(bev)) != sizeof(bev))
1335 			goto out;
1336 
1337 		if (header->needs_swap)
1338 			perf_event_header__bswap(&bev.header);
1339 
1340 		len = bev.header.size - sizeof(bev);
1341 		if (readn(input, filename, len) != len)
1342 			goto out;
1343 		/*
1344 		 * The a1645ce1 changeset:
1345 		 *
1346 		 * "perf: 'perf kvm' tool for monitoring guest performance from host"
1347 		 *
1348 		 * Added a field to struct build_id_event that broke the file
1349 		 * format.
1350 		 *
1351 		 * Since the kernel build-id is the first entry, process the
1352 		 * table using the old format if the well known
1353 		 * '[kernel.kallsyms]' string for the kernel build-id has the
1354 		 * first 4 characters chopped off (where the pid_t sits).
1355 		 */
1356 		if (memcmp(filename, "nel.kallsyms]", 13) == 0) {
1357 			if (lseek(input, orig_offset, SEEK_SET) == (off_t)-1)
1358 				return -1;
1359 			return perf_header__read_build_ids_abi_quirk(header, input, offset, size);
1360 		}
1361 
1362 		__event_process_build_id(&bev, filename, session);
1363 
1364 		offset += bev.header.size;
1365 	}
1366 	err = 0;
1367 out:
1368 	return err;
1369 }
1370 
1371 static int process_tracing_data(struct perf_file_section *section __maybe_unused,
1372 				struct perf_header *ph __maybe_unused,
1373 				int fd, void *data)
1374 {
1375 	ssize_t ret = trace_report(fd, data, false);
1376 	return ret < 0 ? -1 : 0;
1377 }
1378 
1379 static int process_build_id(struct perf_file_section *section,
1380 			    struct perf_header *ph, int fd,
1381 			    void *data __maybe_unused)
1382 {
1383 	if (perf_header__read_build_ids(ph, fd, section->offset, section->size))
1384 		pr_debug("Failed to read buildids, continuing...\n");
1385 	return 0;
1386 }
1387 
1388 static int process_hostname(struct perf_file_section *section __maybe_unused,
1389 			    struct perf_header *ph, int fd,
1390 			    void *data __maybe_unused)
1391 {
1392 	ph->env.hostname = do_read_string(fd, ph);
1393 	return ph->env.hostname ? 0 : -ENOMEM;
1394 }
1395 
1396 static int process_osrelease(struct perf_file_section *section __maybe_unused,
1397 			     struct perf_header *ph, int fd,
1398 			     void *data __maybe_unused)
1399 {
1400 	ph->env.os_release = do_read_string(fd, ph);
1401 	return ph->env.os_release ? 0 : -ENOMEM;
1402 }
1403 
1404 static int process_version(struct perf_file_section *section __maybe_unused,
1405 			   struct perf_header *ph, int fd,
1406 			   void *data __maybe_unused)
1407 {
1408 	ph->env.version = do_read_string(fd, ph);
1409 	return ph->env.version ? 0 : -ENOMEM;
1410 }
1411 
1412 static int process_arch(struct perf_file_section *section __maybe_unused,
1413 			struct perf_header *ph,	int fd,
1414 			void *data __maybe_unused)
1415 {
1416 	ph->env.arch = do_read_string(fd, ph);
1417 	return ph->env.arch ? 0 : -ENOMEM;
1418 }
1419 
1420 static int process_nrcpus(struct perf_file_section *section __maybe_unused,
1421 			  struct perf_header *ph, int fd,
1422 			  void *data __maybe_unused)
1423 {
1424 	ssize_t ret;
1425 	u32 nr;
1426 
1427 	ret = readn(fd, &nr, sizeof(nr));
1428 	if (ret != sizeof(nr))
1429 		return -1;
1430 
1431 	if (ph->needs_swap)
1432 		nr = bswap_32(nr);
1433 
1434 	ph->env.nr_cpus_avail = nr;
1435 
1436 	ret = readn(fd, &nr, sizeof(nr));
1437 	if (ret != sizeof(nr))
1438 		return -1;
1439 
1440 	if (ph->needs_swap)
1441 		nr = bswap_32(nr);
1442 
1443 	ph->env.nr_cpus_online = nr;
1444 	return 0;
1445 }
1446 
1447 static int process_cpudesc(struct perf_file_section *section __maybe_unused,
1448 			   struct perf_header *ph, int fd,
1449 			   void *data __maybe_unused)
1450 {
1451 	ph->env.cpu_desc = do_read_string(fd, ph);
1452 	return ph->env.cpu_desc ? 0 : -ENOMEM;
1453 }
1454 
1455 static int process_cpuid(struct perf_file_section *section __maybe_unused,
1456 			 struct perf_header *ph,  int fd,
1457 			 void *data __maybe_unused)
1458 {
1459 	ph->env.cpuid = do_read_string(fd, ph);
1460 	return ph->env.cpuid ? 0 : -ENOMEM;
1461 }
1462 
1463 static int process_total_mem(struct perf_file_section *section __maybe_unused,
1464 			     struct perf_header *ph, int fd,
1465 			     void *data __maybe_unused)
1466 {
1467 	uint64_t mem;
1468 	ssize_t ret;
1469 
1470 	ret = readn(fd, &mem, sizeof(mem));
1471 	if (ret != sizeof(mem))
1472 		return -1;
1473 
1474 	if (ph->needs_swap)
1475 		mem = bswap_64(mem);
1476 
1477 	ph->env.total_mem = mem;
1478 	return 0;
1479 }
1480 
1481 static struct perf_evsel *
1482 perf_evlist__find_by_index(struct perf_evlist *evlist, int idx)
1483 {
1484 	struct perf_evsel *evsel;
1485 
1486 	evlist__for_each(evlist, evsel) {
1487 		if (evsel->idx == idx)
1488 			return evsel;
1489 	}
1490 
1491 	return NULL;
1492 }
1493 
1494 static void
1495 perf_evlist__set_event_name(struct perf_evlist *evlist,
1496 			    struct perf_evsel *event)
1497 {
1498 	struct perf_evsel *evsel;
1499 
1500 	if (!event->name)
1501 		return;
1502 
1503 	evsel = perf_evlist__find_by_index(evlist, event->idx);
1504 	if (!evsel)
1505 		return;
1506 
1507 	if (evsel->name)
1508 		return;
1509 
1510 	evsel->name = strdup(event->name);
1511 }
1512 
1513 static int
1514 process_event_desc(struct perf_file_section *section __maybe_unused,
1515 		   struct perf_header *header, int fd,
1516 		   void *data __maybe_unused)
1517 {
1518 	struct perf_session *session;
1519 	struct perf_evsel *evsel, *events = read_event_desc(header, fd);
1520 
1521 	if (!events)
1522 		return 0;
1523 
1524 	session = container_of(header, struct perf_session, header);
1525 	for (evsel = events; evsel->attr.size; evsel++)
1526 		perf_evlist__set_event_name(session->evlist, evsel);
1527 
1528 	free_event_desc(events);
1529 
1530 	return 0;
1531 }
1532 
1533 static int process_cmdline(struct perf_file_section *section,
1534 			   struct perf_header *ph, int fd,
1535 			   void *data __maybe_unused)
1536 {
1537 	ssize_t ret;
1538 	char *str, *cmdline = NULL, **argv = NULL;
1539 	u32 nr, i, len = 0;
1540 
1541 	ret = readn(fd, &nr, sizeof(nr));
1542 	if (ret != sizeof(nr))
1543 		return -1;
1544 
1545 	if (ph->needs_swap)
1546 		nr = bswap_32(nr);
1547 
1548 	ph->env.nr_cmdline = nr;
1549 
1550 	cmdline = zalloc(section->size + nr + 1);
1551 	if (!cmdline)
1552 		return -1;
1553 
1554 	argv = zalloc(sizeof(char *) * (nr + 1));
1555 	if (!argv)
1556 		goto error;
1557 
1558 	for (i = 0; i < nr; i++) {
1559 		str = do_read_string(fd, ph);
1560 		if (!str)
1561 			goto error;
1562 
1563 		argv[i] = cmdline + len;
1564 		memcpy(argv[i], str, strlen(str) + 1);
1565 		len += strlen(str) + 1;
1566 		free(str);
1567 	}
1568 	ph->env.cmdline = cmdline;
1569 	ph->env.cmdline_argv = (const char **) argv;
1570 	return 0;
1571 
1572 error:
1573 	free(argv);
1574 	free(cmdline);
1575 	return -1;
1576 }
1577 
1578 static int process_cpu_topology(struct perf_file_section *section,
1579 				struct perf_header *ph, int fd,
1580 				void *data __maybe_unused)
1581 {
1582 	ssize_t ret;
1583 	u32 nr, i;
1584 	char *str;
1585 	struct strbuf sb;
1586 	int cpu_nr = ph->env.nr_cpus_online;
1587 	u64 size = 0;
1588 
1589 	ph->env.cpu = calloc(cpu_nr, sizeof(*ph->env.cpu));
1590 	if (!ph->env.cpu)
1591 		return -1;
1592 
1593 	ret = readn(fd, &nr, sizeof(nr));
1594 	if (ret != sizeof(nr))
1595 		goto free_cpu;
1596 
1597 	if (ph->needs_swap)
1598 		nr = bswap_32(nr);
1599 
1600 	ph->env.nr_sibling_cores = nr;
1601 	size += sizeof(u32);
1602 	strbuf_init(&sb, 128);
1603 
1604 	for (i = 0; i < nr; i++) {
1605 		str = do_read_string(fd, ph);
1606 		if (!str)
1607 			goto error;
1608 
1609 		/* include a NULL character at the end */
1610 		strbuf_add(&sb, str, strlen(str) + 1);
1611 		size += string_size(str);
1612 		free(str);
1613 	}
1614 	ph->env.sibling_cores = strbuf_detach(&sb, NULL);
1615 
1616 	ret = readn(fd, &nr, sizeof(nr));
1617 	if (ret != sizeof(nr))
1618 		return -1;
1619 
1620 	if (ph->needs_swap)
1621 		nr = bswap_32(nr);
1622 
1623 	ph->env.nr_sibling_threads = nr;
1624 	size += sizeof(u32);
1625 
1626 	for (i = 0; i < nr; i++) {
1627 		str = do_read_string(fd, ph);
1628 		if (!str)
1629 			goto error;
1630 
1631 		/* include a NULL character at the end */
1632 		strbuf_add(&sb, str, strlen(str) + 1);
1633 		size += string_size(str);
1634 		free(str);
1635 	}
1636 	ph->env.sibling_threads = strbuf_detach(&sb, NULL);
1637 
1638 	/*
1639 	 * The header may be from old perf,
1640 	 * which doesn't include core id and socket id information.
1641 	 */
1642 	if (section->size <= size) {
1643 		zfree(&ph->env.cpu);
1644 		return 0;
1645 	}
1646 
1647 	for (i = 0; i < (u32)cpu_nr; i++) {
1648 		ret = readn(fd, &nr, sizeof(nr));
1649 		if (ret != sizeof(nr))
1650 			goto free_cpu;
1651 
1652 		if (ph->needs_swap)
1653 			nr = bswap_32(nr);
1654 
1655 		if (nr > (u32)cpu_nr) {
1656 			pr_debug("core_id number is too big."
1657 				 "You may need to upgrade the perf tool.\n");
1658 			goto free_cpu;
1659 		}
1660 		ph->env.cpu[i].core_id = nr;
1661 
1662 		ret = readn(fd, &nr, sizeof(nr));
1663 		if (ret != sizeof(nr))
1664 			goto free_cpu;
1665 
1666 		if (ph->needs_swap)
1667 			nr = bswap_32(nr);
1668 
1669 		if (nr > (u32)cpu_nr) {
1670 			pr_debug("socket_id number is too big."
1671 				 "You may need to upgrade the perf tool.\n");
1672 			goto free_cpu;
1673 		}
1674 
1675 		ph->env.cpu[i].socket_id = nr;
1676 	}
1677 
1678 	return 0;
1679 
1680 error:
1681 	strbuf_release(&sb);
1682 free_cpu:
1683 	zfree(&ph->env.cpu);
1684 	return -1;
1685 }
1686 
1687 static int process_numa_topology(struct perf_file_section *section __maybe_unused,
1688 				 struct perf_header *ph, int fd,
1689 				 void *data __maybe_unused)
1690 {
1691 	ssize_t ret;
1692 	u32 nr, node, i;
1693 	char *str;
1694 	uint64_t mem_total, mem_free;
1695 	struct strbuf sb;
1696 
1697 	/* nr nodes */
1698 	ret = readn(fd, &nr, sizeof(nr));
1699 	if (ret != sizeof(nr))
1700 		goto error;
1701 
1702 	if (ph->needs_swap)
1703 		nr = bswap_32(nr);
1704 
1705 	ph->env.nr_numa_nodes = nr;
1706 	strbuf_init(&sb, 256);
1707 
1708 	for (i = 0; i < nr; i++) {
1709 		/* node number */
1710 		ret = readn(fd, &node, sizeof(node));
1711 		if (ret != sizeof(node))
1712 			goto error;
1713 
1714 		ret = readn(fd, &mem_total, sizeof(u64));
1715 		if (ret != sizeof(u64))
1716 			goto error;
1717 
1718 		ret = readn(fd, &mem_free, sizeof(u64));
1719 		if (ret != sizeof(u64))
1720 			goto error;
1721 
1722 		if (ph->needs_swap) {
1723 			node = bswap_32(node);
1724 			mem_total = bswap_64(mem_total);
1725 			mem_free = bswap_64(mem_free);
1726 		}
1727 
1728 		strbuf_addf(&sb, "%u:%"PRIu64":%"PRIu64":",
1729 			    node, mem_total, mem_free);
1730 
1731 		str = do_read_string(fd, ph);
1732 		if (!str)
1733 			goto error;
1734 
1735 		/* include a NULL character at the end */
1736 		strbuf_add(&sb, str, strlen(str) + 1);
1737 		free(str);
1738 	}
1739 	ph->env.numa_nodes = strbuf_detach(&sb, NULL);
1740 	return 0;
1741 
1742 error:
1743 	strbuf_release(&sb);
1744 	return -1;
1745 }
1746 
1747 static int process_pmu_mappings(struct perf_file_section *section __maybe_unused,
1748 				struct perf_header *ph, int fd,
1749 				void *data __maybe_unused)
1750 {
1751 	ssize_t ret;
1752 	char *name;
1753 	u32 pmu_num;
1754 	u32 type;
1755 	struct strbuf sb;
1756 
1757 	ret = readn(fd, &pmu_num, sizeof(pmu_num));
1758 	if (ret != sizeof(pmu_num))
1759 		return -1;
1760 
1761 	if (ph->needs_swap)
1762 		pmu_num = bswap_32(pmu_num);
1763 
1764 	if (!pmu_num) {
1765 		pr_debug("pmu mappings not available\n");
1766 		return 0;
1767 	}
1768 
1769 	ph->env.nr_pmu_mappings = pmu_num;
1770 	strbuf_init(&sb, 128);
1771 
1772 	while (pmu_num) {
1773 		if (readn(fd, &type, sizeof(type)) != sizeof(type))
1774 			goto error;
1775 		if (ph->needs_swap)
1776 			type = bswap_32(type);
1777 
1778 		name = do_read_string(fd, ph);
1779 		if (!name)
1780 			goto error;
1781 
1782 		strbuf_addf(&sb, "%u:%s", type, name);
1783 		/* include a NULL character at the end */
1784 		strbuf_add(&sb, "", 1);
1785 
1786 		if (!strcmp(name, "msr"))
1787 			ph->env.msr_pmu_type = type;
1788 
1789 		free(name);
1790 		pmu_num--;
1791 	}
1792 	ph->env.pmu_mappings = strbuf_detach(&sb, NULL);
1793 	return 0;
1794 
1795 error:
1796 	strbuf_release(&sb);
1797 	return -1;
1798 }
1799 
1800 static int process_group_desc(struct perf_file_section *section __maybe_unused,
1801 			      struct perf_header *ph, int fd,
1802 			      void *data __maybe_unused)
1803 {
1804 	size_t ret = -1;
1805 	u32 i, nr, nr_groups;
1806 	struct perf_session *session;
1807 	struct perf_evsel *evsel, *leader = NULL;
1808 	struct group_desc {
1809 		char *name;
1810 		u32 leader_idx;
1811 		u32 nr_members;
1812 	} *desc;
1813 
1814 	if (readn(fd, &nr_groups, sizeof(nr_groups)) != sizeof(nr_groups))
1815 		return -1;
1816 
1817 	if (ph->needs_swap)
1818 		nr_groups = bswap_32(nr_groups);
1819 
1820 	ph->env.nr_groups = nr_groups;
1821 	if (!nr_groups) {
1822 		pr_debug("group desc not available\n");
1823 		return 0;
1824 	}
1825 
1826 	desc = calloc(nr_groups, sizeof(*desc));
1827 	if (!desc)
1828 		return -1;
1829 
1830 	for (i = 0; i < nr_groups; i++) {
1831 		desc[i].name = do_read_string(fd, ph);
1832 		if (!desc[i].name)
1833 			goto out_free;
1834 
1835 		if (readn(fd, &desc[i].leader_idx, sizeof(u32)) != sizeof(u32))
1836 			goto out_free;
1837 
1838 		if (readn(fd, &desc[i].nr_members, sizeof(u32)) != sizeof(u32))
1839 			goto out_free;
1840 
1841 		if (ph->needs_swap) {
1842 			desc[i].leader_idx = bswap_32(desc[i].leader_idx);
1843 			desc[i].nr_members = bswap_32(desc[i].nr_members);
1844 		}
1845 	}
1846 
1847 	/*
1848 	 * Rebuild group relationship based on the group_desc
1849 	 */
1850 	session = container_of(ph, struct perf_session, header);
1851 	session->evlist->nr_groups = nr_groups;
1852 
1853 	i = nr = 0;
1854 	evlist__for_each(session->evlist, evsel) {
1855 		if (evsel->idx == (int) desc[i].leader_idx) {
1856 			evsel->leader = evsel;
1857 			/* {anon_group} is a dummy name */
1858 			if (strcmp(desc[i].name, "{anon_group}")) {
1859 				evsel->group_name = desc[i].name;
1860 				desc[i].name = NULL;
1861 			}
1862 			evsel->nr_members = desc[i].nr_members;
1863 
1864 			if (i >= nr_groups || nr > 0) {
1865 				pr_debug("invalid group desc\n");
1866 				goto out_free;
1867 			}
1868 
1869 			leader = evsel;
1870 			nr = evsel->nr_members - 1;
1871 			i++;
1872 		} else if (nr) {
1873 			/* This is a group member */
1874 			evsel->leader = leader;
1875 
1876 			nr--;
1877 		}
1878 	}
1879 
1880 	if (i != nr_groups || nr != 0) {
1881 		pr_debug("invalid group desc\n");
1882 		goto out_free;
1883 	}
1884 
1885 	ret = 0;
1886 out_free:
1887 	for (i = 0; i < nr_groups; i++)
1888 		zfree(&desc[i].name);
1889 	free(desc);
1890 
1891 	return ret;
1892 }
1893 
1894 static int process_auxtrace(struct perf_file_section *section,
1895 			    struct perf_header *ph, int fd,
1896 			    void *data __maybe_unused)
1897 {
1898 	struct perf_session *session;
1899 	int err;
1900 
1901 	session = container_of(ph, struct perf_session, header);
1902 
1903 	err = auxtrace_index__process(fd, section->size, session,
1904 				      ph->needs_swap);
1905 	if (err < 0)
1906 		pr_err("Failed to process auxtrace index\n");
1907 	return err;
1908 }
1909 
1910 struct feature_ops {
1911 	int (*write)(int fd, struct perf_header *h, struct perf_evlist *evlist);
1912 	void (*print)(struct perf_header *h, int fd, FILE *fp);
1913 	int (*process)(struct perf_file_section *section,
1914 		       struct perf_header *h, int fd, void *data);
1915 	const char *name;
1916 	bool full_only;
1917 };
1918 
1919 #define FEAT_OPA(n, func) \
1920 	[n] = { .name = #n, .write = write_##func, .print = print_##func }
1921 #define FEAT_OPP(n, func) \
1922 	[n] = { .name = #n, .write = write_##func, .print = print_##func, \
1923 		.process = process_##func }
1924 #define FEAT_OPF(n, func) \
1925 	[n] = { .name = #n, .write = write_##func, .print = print_##func, \
1926 		.process = process_##func, .full_only = true }
1927 
1928 /* feature_ops not implemented: */
1929 #define print_tracing_data	NULL
1930 #define print_build_id		NULL
1931 
1932 static const struct feature_ops feat_ops[HEADER_LAST_FEATURE] = {
1933 	FEAT_OPP(HEADER_TRACING_DATA,	tracing_data),
1934 	FEAT_OPP(HEADER_BUILD_ID,	build_id),
1935 	FEAT_OPP(HEADER_HOSTNAME,	hostname),
1936 	FEAT_OPP(HEADER_OSRELEASE,	osrelease),
1937 	FEAT_OPP(HEADER_VERSION,	version),
1938 	FEAT_OPP(HEADER_ARCH,		arch),
1939 	FEAT_OPP(HEADER_NRCPUS,		nrcpus),
1940 	FEAT_OPP(HEADER_CPUDESC,	cpudesc),
1941 	FEAT_OPP(HEADER_CPUID,		cpuid),
1942 	FEAT_OPP(HEADER_TOTAL_MEM,	total_mem),
1943 	FEAT_OPP(HEADER_EVENT_DESC,	event_desc),
1944 	FEAT_OPP(HEADER_CMDLINE,	cmdline),
1945 	FEAT_OPF(HEADER_CPU_TOPOLOGY,	cpu_topology),
1946 	FEAT_OPF(HEADER_NUMA_TOPOLOGY,	numa_topology),
1947 	FEAT_OPA(HEADER_BRANCH_STACK,	branch_stack),
1948 	FEAT_OPP(HEADER_PMU_MAPPINGS,	pmu_mappings),
1949 	FEAT_OPP(HEADER_GROUP_DESC,	group_desc),
1950 	FEAT_OPP(HEADER_AUXTRACE,	auxtrace),
1951 };
1952 
1953 struct header_print_data {
1954 	FILE *fp;
1955 	bool full; /* extended list of headers */
1956 };
1957 
1958 static int perf_file_section__fprintf_info(struct perf_file_section *section,
1959 					   struct perf_header *ph,
1960 					   int feat, int fd, void *data)
1961 {
1962 	struct header_print_data *hd = data;
1963 
1964 	if (lseek(fd, section->offset, SEEK_SET) == (off_t)-1) {
1965 		pr_debug("Failed to lseek to %" PRIu64 " offset for feature "
1966 				"%d, continuing...\n", section->offset, feat);
1967 		return 0;
1968 	}
1969 	if (feat >= HEADER_LAST_FEATURE) {
1970 		pr_warning("unknown feature %d\n", feat);
1971 		return 0;
1972 	}
1973 	if (!feat_ops[feat].print)
1974 		return 0;
1975 
1976 	if (!feat_ops[feat].full_only || hd->full)
1977 		feat_ops[feat].print(ph, fd, hd->fp);
1978 	else
1979 		fprintf(hd->fp, "# %s info available, use -I to display\n",
1980 			feat_ops[feat].name);
1981 
1982 	return 0;
1983 }
1984 
1985 int perf_header__fprintf_info(struct perf_session *session, FILE *fp, bool full)
1986 {
1987 	struct header_print_data hd;
1988 	struct perf_header *header = &session->header;
1989 	int fd = perf_data_file__fd(session->file);
1990 	hd.fp = fp;
1991 	hd.full = full;
1992 
1993 	perf_header__process_sections(header, fd, &hd,
1994 				      perf_file_section__fprintf_info);
1995 	return 0;
1996 }
1997 
1998 static int do_write_feat(int fd, struct perf_header *h, int type,
1999 			 struct perf_file_section **p,
2000 			 struct perf_evlist *evlist)
2001 {
2002 	int err;
2003 	int ret = 0;
2004 
2005 	if (perf_header__has_feat(h, type)) {
2006 		if (!feat_ops[type].write)
2007 			return -1;
2008 
2009 		(*p)->offset = lseek(fd, 0, SEEK_CUR);
2010 
2011 		err = feat_ops[type].write(fd, h, evlist);
2012 		if (err < 0) {
2013 			pr_debug("failed to write feature %d\n", type);
2014 
2015 			/* undo anything written */
2016 			lseek(fd, (*p)->offset, SEEK_SET);
2017 
2018 			return -1;
2019 		}
2020 		(*p)->size = lseek(fd, 0, SEEK_CUR) - (*p)->offset;
2021 		(*p)++;
2022 	}
2023 	return ret;
2024 }
2025 
2026 static int perf_header__adds_write(struct perf_header *header,
2027 				   struct perf_evlist *evlist, int fd)
2028 {
2029 	int nr_sections;
2030 	struct perf_file_section *feat_sec, *p;
2031 	int sec_size;
2032 	u64 sec_start;
2033 	int feat;
2034 	int err;
2035 
2036 	nr_sections = bitmap_weight(header->adds_features, HEADER_FEAT_BITS);
2037 	if (!nr_sections)
2038 		return 0;
2039 
2040 	feat_sec = p = calloc(nr_sections, sizeof(*feat_sec));
2041 	if (feat_sec == NULL)
2042 		return -ENOMEM;
2043 
2044 	sec_size = sizeof(*feat_sec) * nr_sections;
2045 
2046 	sec_start = header->feat_offset;
2047 	lseek(fd, sec_start + sec_size, SEEK_SET);
2048 
2049 	for_each_set_bit(feat, header->adds_features, HEADER_FEAT_BITS) {
2050 		if (do_write_feat(fd, header, feat, &p, evlist))
2051 			perf_header__clear_feat(header, feat);
2052 	}
2053 
2054 	lseek(fd, sec_start, SEEK_SET);
2055 	/*
2056 	 * may write more than needed due to dropped feature, but
2057 	 * this is okay, reader will skip the mising entries
2058 	 */
2059 	err = do_write(fd, feat_sec, sec_size);
2060 	if (err < 0)
2061 		pr_debug("failed to write feature section\n");
2062 	free(feat_sec);
2063 	return err;
2064 }
2065 
2066 int perf_header__write_pipe(int fd)
2067 {
2068 	struct perf_pipe_file_header f_header;
2069 	int err;
2070 
2071 	f_header = (struct perf_pipe_file_header){
2072 		.magic	   = PERF_MAGIC,
2073 		.size	   = sizeof(f_header),
2074 	};
2075 
2076 	err = do_write(fd, &f_header, sizeof(f_header));
2077 	if (err < 0) {
2078 		pr_debug("failed to write perf pipe header\n");
2079 		return err;
2080 	}
2081 
2082 	return 0;
2083 }
2084 
2085 int perf_session__write_header(struct perf_session *session,
2086 			       struct perf_evlist *evlist,
2087 			       int fd, bool at_exit)
2088 {
2089 	struct perf_file_header f_header;
2090 	struct perf_file_attr   f_attr;
2091 	struct perf_header *header = &session->header;
2092 	struct perf_evsel *evsel;
2093 	u64 attr_offset;
2094 	int err;
2095 
2096 	lseek(fd, sizeof(f_header), SEEK_SET);
2097 
2098 	evlist__for_each(session->evlist, evsel) {
2099 		evsel->id_offset = lseek(fd, 0, SEEK_CUR);
2100 		err = do_write(fd, evsel->id, evsel->ids * sizeof(u64));
2101 		if (err < 0) {
2102 			pr_debug("failed to write perf header\n");
2103 			return err;
2104 		}
2105 	}
2106 
2107 	attr_offset = lseek(fd, 0, SEEK_CUR);
2108 
2109 	evlist__for_each(evlist, evsel) {
2110 		f_attr = (struct perf_file_attr){
2111 			.attr = evsel->attr,
2112 			.ids  = {
2113 				.offset = evsel->id_offset,
2114 				.size   = evsel->ids * sizeof(u64),
2115 			}
2116 		};
2117 		err = do_write(fd, &f_attr, sizeof(f_attr));
2118 		if (err < 0) {
2119 			pr_debug("failed to write perf header attribute\n");
2120 			return err;
2121 		}
2122 	}
2123 
2124 	if (!header->data_offset)
2125 		header->data_offset = lseek(fd, 0, SEEK_CUR);
2126 	header->feat_offset = header->data_offset + header->data_size;
2127 
2128 	if (at_exit) {
2129 		err = perf_header__adds_write(header, evlist, fd);
2130 		if (err < 0)
2131 			return err;
2132 	}
2133 
2134 	f_header = (struct perf_file_header){
2135 		.magic	   = PERF_MAGIC,
2136 		.size	   = sizeof(f_header),
2137 		.attr_size = sizeof(f_attr),
2138 		.attrs = {
2139 			.offset = attr_offset,
2140 			.size   = evlist->nr_entries * sizeof(f_attr),
2141 		},
2142 		.data = {
2143 			.offset = header->data_offset,
2144 			.size	= header->data_size,
2145 		},
2146 		/* event_types is ignored, store zeros */
2147 	};
2148 
2149 	memcpy(&f_header.adds_features, &header->adds_features, sizeof(header->adds_features));
2150 
2151 	lseek(fd, 0, SEEK_SET);
2152 	err = do_write(fd, &f_header, sizeof(f_header));
2153 	if (err < 0) {
2154 		pr_debug("failed to write perf header\n");
2155 		return err;
2156 	}
2157 	lseek(fd, header->data_offset + header->data_size, SEEK_SET);
2158 
2159 	return 0;
2160 }
2161 
2162 static int perf_header__getbuffer64(struct perf_header *header,
2163 				    int fd, void *buf, size_t size)
2164 {
2165 	if (readn(fd, buf, size) <= 0)
2166 		return -1;
2167 
2168 	if (header->needs_swap)
2169 		mem_bswap_64(buf, size);
2170 
2171 	return 0;
2172 }
2173 
2174 int perf_header__process_sections(struct perf_header *header, int fd,
2175 				  void *data,
2176 				  int (*process)(struct perf_file_section *section,
2177 						 struct perf_header *ph,
2178 						 int feat, int fd, void *data))
2179 {
2180 	struct perf_file_section *feat_sec, *sec;
2181 	int nr_sections;
2182 	int sec_size;
2183 	int feat;
2184 	int err;
2185 
2186 	nr_sections = bitmap_weight(header->adds_features, HEADER_FEAT_BITS);
2187 	if (!nr_sections)
2188 		return 0;
2189 
2190 	feat_sec = sec = calloc(nr_sections, sizeof(*feat_sec));
2191 	if (!feat_sec)
2192 		return -1;
2193 
2194 	sec_size = sizeof(*feat_sec) * nr_sections;
2195 
2196 	lseek(fd, header->feat_offset, SEEK_SET);
2197 
2198 	err = perf_header__getbuffer64(header, fd, feat_sec, sec_size);
2199 	if (err < 0)
2200 		goto out_free;
2201 
2202 	for_each_set_bit(feat, header->adds_features, HEADER_LAST_FEATURE) {
2203 		err = process(sec++, header, feat, fd, data);
2204 		if (err < 0)
2205 			goto out_free;
2206 	}
2207 	err = 0;
2208 out_free:
2209 	free(feat_sec);
2210 	return err;
2211 }
2212 
2213 static const int attr_file_abi_sizes[] = {
2214 	[0] = PERF_ATTR_SIZE_VER0,
2215 	[1] = PERF_ATTR_SIZE_VER1,
2216 	[2] = PERF_ATTR_SIZE_VER2,
2217 	[3] = PERF_ATTR_SIZE_VER3,
2218 	[4] = PERF_ATTR_SIZE_VER4,
2219 	0,
2220 };
2221 
2222 /*
2223  * In the legacy file format, the magic number is not used to encode endianness.
2224  * hdr_sz was used to encode endianness. But given that hdr_sz can vary based
2225  * on ABI revisions, we need to try all combinations for all endianness to
2226  * detect the endianness.
2227  */
2228 static int try_all_file_abis(uint64_t hdr_sz, struct perf_header *ph)
2229 {
2230 	uint64_t ref_size, attr_size;
2231 	int i;
2232 
2233 	for (i = 0 ; attr_file_abi_sizes[i]; i++) {
2234 		ref_size = attr_file_abi_sizes[i]
2235 			 + sizeof(struct perf_file_section);
2236 		if (hdr_sz != ref_size) {
2237 			attr_size = bswap_64(hdr_sz);
2238 			if (attr_size != ref_size)
2239 				continue;
2240 
2241 			ph->needs_swap = true;
2242 		}
2243 		pr_debug("ABI%d perf.data file detected, need_swap=%d\n",
2244 			 i,
2245 			 ph->needs_swap);
2246 		return 0;
2247 	}
2248 	/* could not determine endianness */
2249 	return -1;
2250 }
2251 
2252 #define PERF_PIPE_HDR_VER0	16
2253 
2254 static const size_t attr_pipe_abi_sizes[] = {
2255 	[0] = PERF_PIPE_HDR_VER0,
2256 	0,
2257 };
2258 
2259 /*
2260  * In the legacy pipe format, there is an implicit assumption that endiannesss
2261  * between host recording the samples, and host parsing the samples is the
2262  * same. This is not always the case given that the pipe output may always be
2263  * redirected into a file and analyzed on a different machine with possibly a
2264  * different endianness and perf_event ABI revsions in the perf tool itself.
2265  */
2266 static int try_all_pipe_abis(uint64_t hdr_sz, struct perf_header *ph)
2267 {
2268 	u64 attr_size;
2269 	int i;
2270 
2271 	for (i = 0 ; attr_pipe_abi_sizes[i]; i++) {
2272 		if (hdr_sz != attr_pipe_abi_sizes[i]) {
2273 			attr_size = bswap_64(hdr_sz);
2274 			if (attr_size != hdr_sz)
2275 				continue;
2276 
2277 			ph->needs_swap = true;
2278 		}
2279 		pr_debug("Pipe ABI%d perf.data file detected\n", i);
2280 		return 0;
2281 	}
2282 	return -1;
2283 }
2284 
2285 bool is_perf_magic(u64 magic)
2286 {
2287 	if (!memcmp(&magic, __perf_magic1, sizeof(magic))
2288 		|| magic == __perf_magic2
2289 		|| magic == __perf_magic2_sw)
2290 		return true;
2291 
2292 	return false;
2293 }
2294 
2295 static int check_magic_endian(u64 magic, uint64_t hdr_sz,
2296 			      bool is_pipe, struct perf_header *ph)
2297 {
2298 	int ret;
2299 
2300 	/* check for legacy format */
2301 	ret = memcmp(&magic, __perf_magic1, sizeof(magic));
2302 	if (ret == 0) {
2303 		ph->version = PERF_HEADER_VERSION_1;
2304 		pr_debug("legacy perf.data format\n");
2305 		if (is_pipe)
2306 			return try_all_pipe_abis(hdr_sz, ph);
2307 
2308 		return try_all_file_abis(hdr_sz, ph);
2309 	}
2310 	/*
2311 	 * the new magic number serves two purposes:
2312 	 * - unique number to identify actual perf.data files
2313 	 * - encode endianness of file
2314 	 */
2315 	ph->version = PERF_HEADER_VERSION_2;
2316 
2317 	/* check magic number with one endianness */
2318 	if (magic == __perf_magic2)
2319 		return 0;
2320 
2321 	/* check magic number with opposite endianness */
2322 	if (magic != __perf_magic2_sw)
2323 		return -1;
2324 
2325 	ph->needs_swap = true;
2326 
2327 	return 0;
2328 }
2329 
2330 int perf_file_header__read(struct perf_file_header *header,
2331 			   struct perf_header *ph, int fd)
2332 {
2333 	ssize_t ret;
2334 
2335 	lseek(fd, 0, SEEK_SET);
2336 
2337 	ret = readn(fd, header, sizeof(*header));
2338 	if (ret <= 0)
2339 		return -1;
2340 
2341 	if (check_magic_endian(header->magic,
2342 			       header->attr_size, false, ph) < 0) {
2343 		pr_debug("magic/endian check failed\n");
2344 		return -1;
2345 	}
2346 
2347 	if (ph->needs_swap) {
2348 		mem_bswap_64(header, offsetof(struct perf_file_header,
2349 			     adds_features));
2350 	}
2351 
2352 	if (header->size != sizeof(*header)) {
2353 		/* Support the previous format */
2354 		if (header->size == offsetof(typeof(*header), adds_features))
2355 			bitmap_zero(header->adds_features, HEADER_FEAT_BITS);
2356 		else
2357 			return -1;
2358 	} else if (ph->needs_swap) {
2359 		/*
2360 		 * feature bitmap is declared as an array of unsigned longs --
2361 		 * not good since its size can differ between the host that
2362 		 * generated the data file and the host analyzing the file.
2363 		 *
2364 		 * We need to handle endianness, but we don't know the size of
2365 		 * the unsigned long where the file was generated. Take a best
2366 		 * guess at determining it: try 64-bit swap first (ie., file
2367 		 * created on a 64-bit host), and check if the hostname feature
2368 		 * bit is set (this feature bit is forced on as of fbe96f2).
2369 		 * If the bit is not, undo the 64-bit swap and try a 32-bit
2370 		 * swap. If the hostname bit is still not set (e.g., older data
2371 		 * file), punt and fallback to the original behavior --
2372 		 * clearing all feature bits and setting buildid.
2373 		 */
2374 		mem_bswap_64(&header->adds_features,
2375 			    BITS_TO_U64(HEADER_FEAT_BITS));
2376 
2377 		if (!test_bit(HEADER_HOSTNAME, header->adds_features)) {
2378 			/* unswap as u64 */
2379 			mem_bswap_64(&header->adds_features,
2380 				    BITS_TO_U64(HEADER_FEAT_BITS));
2381 
2382 			/* unswap as u32 */
2383 			mem_bswap_32(&header->adds_features,
2384 				    BITS_TO_U32(HEADER_FEAT_BITS));
2385 		}
2386 
2387 		if (!test_bit(HEADER_HOSTNAME, header->adds_features)) {
2388 			bitmap_zero(header->adds_features, HEADER_FEAT_BITS);
2389 			set_bit(HEADER_BUILD_ID, header->adds_features);
2390 		}
2391 	}
2392 
2393 	memcpy(&ph->adds_features, &header->adds_features,
2394 	       sizeof(ph->adds_features));
2395 
2396 	ph->data_offset  = header->data.offset;
2397 	ph->data_size	 = header->data.size;
2398 	ph->feat_offset  = header->data.offset + header->data.size;
2399 	return 0;
2400 }
2401 
2402 static int perf_file_section__process(struct perf_file_section *section,
2403 				      struct perf_header *ph,
2404 				      int feat, int fd, void *data)
2405 {
2406 	if (lseek(fd, section->offset, SEEK_SET) == (off_t)-1) {
2407 		pr_debug("Failed to lseek to %" PRIu64 " offset for feature "
2408 			  "%d, continuing...\n", section->offset, feat);
2409 		return 0;
2410 	}
2411 
2412 	if (feat >= HEADER_LAST_FEATURE) {
2413 		pr_debug("unknown feature %d, continuing...\n", feat);
2414 		return 0;
2415 	}
2416 
2417 	if (!feat_ops[feat].process)
2418 		return 0;
2419 
2420 	return feat_ops[feat].process(section, ph, fd, data);
2421 }
2422 
2423 static int perf_file_header__read_pipe(struct perf_pipe_file_header *header,
2424 				       struct perf_header *ph, int fd,
2425 				       bool repipe)
2426 {
2427 	ssize_t ret;
2428 
2429 	ret = readn(fd, header, sizeof(*header));
2430 	if (ret <= 0)
2431 		return -1;
2432 
2433 	if (check_magic_endian(header->magic, header->size, true, ph) < 0) {
2434 		pr_debug("endian/magic failed\n");
2435 		return -1;
2436 	}
2437 
2438 	if (ph->needs_swap)
2439 		header->size = bswap_64(header->size);
2440 
2441 	if (repipe && do_write(STDOUT_FILENO, header, sizeof(*header)) < 0)
2442 		return -1;
2443 
2444 	return 0;
2445 }
2446 
2447 static int perf_header__read_pipe(struct perf_session *session)
2448 {
2449 	struct perf_header *header = &session->header;
2450 	struct perf_pipe_file_header f_header;
2451 
2452 	if (perf_file_header__read_pipe(&f_header, header,
2453 					perf_data_file__fd(session->file),
2454 					session->repipe) < 0) {
2455 		pr_debug("incompatible file format\n");
2456 		return -EINVAL;
2457 	}
2458 
2459 	return 0;
2460 }
2461 
2462 static int read_attr(int fd, struct perf_header *ph,
2463 		     struct perf_file_attr *f_attr)
2464 {
2465 	struct perf_event_attr *attr = &f_attr->attr;
2466 	size_t sz, left;
2467 	size_t our_sz = sizeof(f_attr->attr);
2468 	ssize_t ret;
2469 
2470 	memset(f_attr, 0, sizeof(*f_attr));
2471 
2472 	/* read minimal guaranteed structure */
2473 	ret = readn(fd, attr, PERF_ATTR_SIZE_VER0);
2474 	if (ret <= 0) {
2475 		pr_debug("cannot read %d bytes of header attr\n",
2476 			 PERF_ATTR_SIZE_VER0);
2477 		return -1;
2478 	}
2479 
2480 	/* on file perf_event_attr size */
2481 	sz = attr->size;
2482 
2483 	if (ph->needs_swap)
2484 		sz = bswap_32(sz);
2485 
2486 	if (sz == 0) {
2487 		/* assume ABI0 */
2488 		sz =  PERF_ATTR_SIZE_VER0;
2489 	} else if (sz > our_sz) {
2490 		pr_debug("file uses a more recent and unsupported ABI"
2491 			 " (%zu bytes extra)\n", sz - our_sz);
2492 		return -1;
2493 	}
2494 	/* what we have not yet read and that we know about */
2495 	left = sz - PERF_ATTR_SIZE_VER0;
2496 	if (left) {
2497 		void *ptr = attr;
2498 		ptr += PERF_ATTR_SIZE_VER0;
2499 
2500 		ret = readn(fd, ptr, left);
2501 	}
2502 	/* read perf_file_section, ids are read in caller */
2503 	ret = readn(fd, &f_attr->ids, sizeof(f_attr->ids));
2504 
2505 	return ret <= 0 ? -1 : 0;
2506 }
2507 
2508 static int perf_evsel__prepare_tracepoint_event(struct perf_evsel *evsel,
2509 						struct pevent *pevent)
2510 {
2511 	struct event_format *event;
2512 	char bf[128];
2513 
2514 	/* already prepared */
2515 	if (evsel->tp_format)
2516 		return 0;
2517 
2518 	if (pevent == NULL) {
2519 		pr_debug("broken or missing trace data\n");
2520 		return -1;
2521 	}
2522 
2523 	event = pevent_find_event(pevent, evsel->attr.config);
2524 	if (event == NULL)
2525 		return -1;
2526 
2527 	if (!evsel->name) {
2528 		snprintf(bf, sizeof(bf), "%s:%s", event->system, event->name);
2529 		evsel->name = strdup(bf);
2530 		if (evsel->name == NULL)
2531 			return -1;
2532 	}
2533 
2534 	evsel->tp_format = event;
2535 	return 0;
2536 }
2537 
2538 static int perf_evlist__prepare_tracepoint_events(struct perf_evlist *evlist,
2539 						  struct pevent *pevent)
2540 {
2541 	struct perf_evsel *pos;
2542 
2543 	evlist__for_each(evlist, pos) {
2544 		if (pos->attr.type == PERF_TYPE_TRACEPOINT &&
2545 		    perf_evsel__prepare_tracepoint_event(pos, pevent))
2546 			return -1;
2547 	}
2548 
2549 	return 0;
2550 }
2551 
2552 int perf_session__read_header(struct perf_session *session)
2553 {
2554 	struct perf_data_file *file = session->file;
2555 	struct perf_header *header = &session->header;
2556 	struct perf_file_header	f_header;
2557 	struct perf_file_attr	f_attr;
2558 	u64			f_id;
2559 	int nr_attrs, nr_ids, i, j;
2560 	int fd = perf_data_file__fd(file);
2561 
2562 	session->evlist = perf_evlist__new();
2563 	if (session->evlist == NULL)
2564 		return -ENOMEM;
2565 
2566 	session->evlist->env = &header->env;
2567 	session->machines.host.env = &header->env;
2568 	if (perf_data_file__is_pipe(file))
2569 		return perf_header__read_pipe(session);
2570 
2571 	if (perf_file_header__read(&f_header, header, fd) < 0)
2572 		return -EINVAL;
2573 
2574 	/*
2575 	 * Sanity check that perf.data was written cleanly; data size is
2576 	 * initialized to 0 and updated only if the on_exit function is run.
2577 	 * If data size is still 0 then the file contains only partial
2578 	 * information.  Just warn user and process it as much as it can.
2579 	 */
2580 	if (f_header.data.size == 0) {
2581 		pr_warning("WARNING: The %s file's data size field is 0 which is unexpected.\n"
2582 			   "Was the 'perf record' command properly terminated?\n",
2583 			   file->path);
2584 	}
2585 
2586 	nr_attrs = f_header.attrs.size / f_header.attr_size;
2587 	lseek(fd, f_header.attrs.offset, SEEK_SET);
2588 
2589 	for (i = 0; i < nr_attrs; i++) {
2590 		struct perf_evsel *evsel;
2591 		off_t tmp;
2592 
2593 		if (read_attr(fd, header, &f_attr) < 0)
2594 			goto out_errno;
2595 
2596 		if (header->needs_swap) {
2597 			f_attr.ids.size   = bswap_64(f_attr.ids.size);
2598 			f_attr.ids.offset = bswap_64(f_attr.ids.offset);
2599 			perf_event__attr_swap(&f_attr.attr);
2600 		}
2601 
2602 		tmp = lseek(fd, 0, SEEK_CUR);
2603 		evsel = perf_evsel__new(&f_attr.attr);
2604 
2605 		if (evsel == NULL)
2606 			goto out_delete_evlist;
2607 
2608 		evsel->needs_swap = header->needs_swap;
2609 		/*
2610 		 * Do it before so that if perf_evsel__alloc_id fails, this
2611 		 * entry gets purged too at perf_evlist__delete().
2612 		 */
2613 		perf_evlist__add(session->evlist, evsel);
2614 
2615 		nr_ids = f_attr.ids.size / sizeof(u64);
2616 		/*
2617 		 * We don't have the cpu and thread maps on the header, so
2618 		 * for allocating the perf_sample_id table we fake 1 cpu and
2619 		 * hattr->ids threads.
2620 		 */
2621 		if (perf_evsel__alloc_id(evsel, 1, nr_ids))
2622 			goto out_delete_evlist;
2623 
2624 		lseek(fd, f_attr.ids.offset, SEEK_SET);
2625 
2626 		for (j = 0; j < nr_ids; j++) {
2627 			if (perf_header__getbuffer64(header, fd, &f_id, sizeof(f_id)))
2628 				goto out_errno;
2629 
2630 			perf_evlist__id_add(session->evlist, evsel, 0, j, f_id);
2631 		}
2632 
2633 		lseek(fd, tmp, SEEK_SET);
2634 	}
2635 
2636 	symbol_conf.nr_events = nr_attrs;
2637 
2638 	perf_header__process_sections(header, fd, &session->tevent,
2639 				      perf_file_section__process);
2640 
2641 	if (perf_evlist__prepare_tracepoint_events(session->evlist,
2642 						   session->tevent.pevent))
2643 		goto out_delete_evlist;
2644 
2645 	return 0;
2646 out_errno:
2647 	return -errno;
2648 
2649 out_delete_evlist:
2650 	perf_evlist__delete(session->evlist);
2651 	session->evlist = NULL;
2652 	return -ENOMEM;
2653 }
2654 
2655 int perf_event__synthesize_attr(struct perf_tool *tool,
2656 				struct perf_event_attr *attr, u32 ids, u64 *id,
2657 				perf_event__handler_t process)
2658 {
2659 	union perf_event *ev;
2660 	size_t size;
2661 	int err;
2662 
2663 	size = sizeof(struct perf_event_attr);
2664 	size = PERF_ALIGN(size, sizeof(u64));
2665 	size += sizeof(struct perf_event_header);
2666 	size += ids * sizeof(u64);
2667 
2668 	ev = malloc(size);
2669 
2670 	if (ev == NULL)
2671 		return -ENOMEM;
2672 
2673 	ev->attr.attr = *attr;
2674 	memcpy(ev->attr.id, id, ids * sizeof(u64));
2675 
2676 	ev->attr.header.type = PERF_RECORD_HEADER_ATTR;
2677 	ev->attr.header.size = (u16)size;
2678 
2679 	if (ev->attr.header.size == size)
2680 		err = process(tool, ev, NULL, NULL);
2681 	else
2682 		err = -E2BIG;
2683 
2684 	free(ev);
2685 
2686 	return err;
2687 }
2688 
2689 int perf_event__synthesize_attrs(struct perf_tool *tool,
2690 				   struct perf_session *session,
2691 				   perf_event__handler_t process)
2692 {
2693 	struct perf_evsel *evsel;
2694 	int err = 0;
2695 
2696 	evlist__for_each(session->evlist, evsel) {
2697 		err = perf_event__synthesize_attr(tool, &evsel->attr, evsel->ids,
2698 						  evsel->id, process);
2699 		if (err) {
2700 			pr_debug("failed to create perf header attribute\n");
2701 			return err;
2702 		}
2703 	}
2704 
2705 	return err;
2706 }
2707 
2708 int perf_event__process_attr(struct perf_tool *tool __maybe_unused,
2709 			     union perf_event *event,
2710 			     struct perf_evlist **pevlist)
2711 {
2712 	u32 i, ids, n_ids;
2713 	struct perf_evsel *evsel;
2714 	struct perf_evlist *evlist = *pevlist;
2715 
2716 	if (evlist == NULL) {
2717 		*pevlist = evlist = perf_evlist__new();
2718 		if (evlist == NULL)
2719 			return -ENOMEM;
2720 	}
2721 
2722 	evsel = perf_evsel__new(&event->attr.attr);
2723 	if (evsel == NULL)
2724 		return -ENOMEM;
2725 
2726 	perf_evlist__add(evlist, evsel);
2727 
2728 	ids = event->header.size;
2729 	ids -= (void *)&event->attr.id - (void *)event;
2730 	n_ids = ids / sizeof(u64);
2731 	/*
2732 	 * We don't have the cpu and thread maps on the header, so
2733 	 * for allocating the perf_sample_id table we fake 1 cpu and
2734 	 * hattr->ids threads.
2735 	 */
2736 	if (perf_evsel__alloc_id(evsel, 1, n_ids))
2737 		return -ENOMEM;
2738 
2739 	for (i = 0; i < n_ids; i++) {
2740 		perf_evlist__id_add(evlist, evsel, 0, i, event->attr.id[i]);
2741 	}
2742 
2743 	symbol_conf.nr_events = evlist->nr_entries;
2744 
2745 	return 0;
2746 }
2747 
2748 int perf_event__synthesize_tracing_data(struct perf_tool *tool, int fd,
2749 					struct perf_evlist *evlist,
2750 					perf_event__handler_t process)
2751 {
2752 	union perf_event ev;
2753 	struct tracing_data *tdata;
2754 	ssize_t size = 0, aligned_size = 0, padding;
2755 	int err __maybe_unused = 0;
2756 
2757 	/*
2758 	 * We are going to store the size of the data followed
2759 	 * by the data contents. Since the fd descriptor is a pipe,
2760 	 * we cannot seek back to store the size of the data once
2761 	 * we know it. Instead we:
2762 	 *
2763 	 * - write the tracing data to the temp file
2764 	 * - get/write the data size to pipe
2765 	 * - write the tracing data from the temp file
2766 	 *   to the pipe
2767 	 */
2768 	tdata = tracing_data_get(&evlist->entries, fd, true);
2769 	if (!tdata)
2770 		return -1;
2771 
2772 	memset(&ev, 0, sizeof(ev));
2773 
2774 	ev.tracing_data.header.type = PERF_RECORD_HEADER_TRACING_DATA;
2775 	size = tdata->size;
2776 	aligned_size = PERF_ALIGN(size, sizeof(u64));
2777 	padding = aligned_size - size;
2778 	ev.tracing_data.header.size = sizeof(ev.tracing_data);
2779 	ev.tracing_data.size = aligned_size;
2780 
2781 	process(tool, &ev, NULL, NULL);
2782 
2783 	/*
2784 	 * The put function will copy all the tracing data
2785 	 * stored in temp file to the pipe.
2786 	 */
2787 	tracing_data_put(tdata);
2788 
2789 	write_padded(fd, NULL, 0, padding);
2790 
2791 	return aligned_size;
2792 }
2793 
2794 int perf_event__process_tracing_data(struct perf_tool *tool __maybe_unused,
2795 				     union perf_event *event,
2796 				     struct perf_session *session)
2797 {
2798 	ssize_t size_read, padding, size = event->tracing_data.size;
2799 	int fd = perf_data_file__fd(session->file);
2800 	off_t offset = lseek(fd, 0, SEEK_CUR);
2801 	char buf[BUFSIZ];
2802 
2803 	/* setup for reading amidst mmap */
2804 	lseek(fd, offset + sizeof(struct tracing_data_event),
2805 	      SEEK_SET);
2806 
2807 	size_read = trace_report(fd, &session->tevent,
2808 				 session->repipe);
2809 	padding = PERF_ALIGN(size_read, sizeof(u64)) - size_read;
2810 
2811 	if (readn(fd, buf, padding) < 0) {
2812 		pr_err("%s: reading input file", __func__);
2813 		return -1;
2814 	}
2815 	if (session->repipe) {
2816 		int retw = write(STDOUT_FILENO, buf, padding);
2817 		if (retw <= 0 || retw != padding) {
2818 			pr_err("%s: repiping tracing data padding", __func__);
2819 			return -1;
2820 		}
2821 	}
2822 
2823 	if (size_read + padding != size) {
2824 		pr_err("%s: tracing data size mismatch", __func__);
2825 		return -1;
2826 	}
2827 
2828 	perf_evlist__prepare_tracepoint_events(session->evlist,
2829 					       session->tevent.pevent);
2830 
2831 	return size_read + padding;
2832 }
2833 
2834 int perf_event__synthesize_build_id(struct perf_tool *tool,
2835 				    struct dso *pos, u16 misc,
2836 				    perf_event__handler_t process,
2837 				    struct machine *machine)
2838 {
2839 	union perf_event ev;
2840 	size_t len;
2841 	int err = 0;
2842 
2843 	if (!pos->hit)
2844 		return err;
2845 
2846 	memset(&ev, 0, sizeof(ev));
2847 
2848 	len = pos->long_name_len + 1;
2849 	len = PERF_ALIGN(len, NAME_ALIGN);
2850 	memcpy(&ev.build_id.build_id, pos->build_id, sizeof(pos->build_id));
2851 	ev.build_id.header.type = PERF_RECORD_HEADER_BUILD_ID;
2852 	ev.build_id.header.misc = misc;
2853 	ev.build_id.pid = machine->pid;
2854 	ev.build_id.header.size = sizeof(ev.build_id) + len;
2855 	memcpy(&ev.build_id.filename, pos->long_name, pos->long_name_len);
2856 
2857 	err = process(tool, &ev, NULL, machine);
2858 
2859 	return err;
2860 }
2861 
2862 int perf_event__process_build_id(struct perf_tool *tool __maybe_unused,
2863 				 union perf_event *event,
2864 				 struct perf_session *session)
2865 {
2866 	__event_process_build_id(&event->build_id,
2867 				 event->build_id.filename,
2868 				 session);
2869 	return 0;
2870 }
2871