xref: /openbmc/linux/tools/perf/util/session.c (revision 52168eea)
1 #define _FILE_OFFSET_BITS 64
2 
3 #include <linux/kernel.h>
4 
5 #include <byteswap.h>
6 #include <unistd.h>
7 #include <sys/types.h>
8 #include <sys/mman.h>
9 
10 #include "evlist.h"
11 #include "evsel.h"
12 #include "session.h"
13 #include "tool.h"
14 #include "sort.h"
15 #include "util.h"
16 #include "cpumap.h"
17 #include "event-parse.h"
18 #include "perf_regs.h"
19 #include "vdso.h"
20 
21 static int perf_session__open(struct perf_session *self, bool force)
22 {
23 	struct stat input_stat;
24 
25 	if (!strcmp(self->filename, "-")) {
26 		self->fd_pipe = true;
27 		self->fd = STDIN_FILENO;
28 
29 		if (perf_session__read_header(self, self->fd) < 0)
30 			pr_err("incompatible file format (rerun with -v to learn more)");
31 
32 		return 0;
33 	}
34 
35 	self->fd = open(self->filename, O_RDONLY);
36 	if (self->fd < 0) {
37 		int err = errno;
38 
39 		pr_err("failed to open %s: %s", self->filename, strerror(err));
40 		if (err == ENOENT && !strcmp(self->filename, "perf.data"))
41 			pr_err("  (try 'perf record' first)");
42 		pr_err("\n");
43 		return -errno;
44 	}
45 
46 	if (fstat(self->fd, &input_stat) < 0)
47 		goto out_close;
48 
49 	if (!force && input_stat.st_uid && (input_stat.st_uid != geteuid())) {
50 		pr_err("file %s not owned by current user or root\n",
51 		       self->filename);
52 		goto out_close;
53 	}
54 
55 	if (!input_stat.st_size) {
56 		pr_info("zero-sized file (%s), nothing to do!\n",
57 			self->filename);
58 		goto out_close;
59 	}
60 
61 	if (perf_session__read_header(self, self->fd) < 0) {
62 		pr_err("incompatible file format (rerun with -v to learn more)");
63 		goto out_close;
64 	}
65 
66 	if (!perf_evlist__valid_sample_type(self->evlist)) {
67 		pr_err("non matching sample_type");
68 		goto out_close;
69 	}
70 
71 	if (!perf_evlist__valid_sample_id_all(self->evlist)) {
72 		pr_err("non matching sample_id_all");
73 		goto out_close;
74 	}
75 
76 	self->size = input_stat.st_size;
77 	return 0;
78 
79 out_close:
80 	close(self->fd);
81 	self->fd = -1;
82 	return -1;
83 }
84 
85 void perf_session__set_id_hdr_size(struct perf_session *session)
86 {
87 	u16 id_hdr_size = perf_evlist__id_hdr_size(session->evlist);
88 
89 	session->host_machine.id_hdr_size = id_hdr_size;
90 	machines__set_id_hdr_size(&session->machines, id_hdr_size);
91 }
92 
93 int perf_session__create_kernel_maps(struct perf_session *self)
94 {
95 	int ret = machine__create_kernel_maps(&self->host_machine);
96 
97 	if (ret >= 0)
98 		ret = machines__create_guest_kernel_maps(&self->machines);
99 	return ret;
100 }
101 
102 static void perf_session__destroy_kernel_maps(struct perf_session *self)
103 {
104 	machine__destroy_kernel_maps(&self->host_machine);
105 	machines__destroy_guest_kernel_maps(&self->machines);
106 }
107 
108 struct perf_session *perf_session__new(const char *filename, int mode,
109 				       bool force, bool repipe,
110 				       struct perf_tool *tool)
111 {
112 	struct perf_session *self;
113 	struct stat st;
114 	size_t len;
115 
116 	if (!filename || !strlen(filename)) {
117 		if (!fstat(STDIN_FILENO, &st) && S_ISFIFO(st.st_mode))
118 			filename = "-";
119 		else
120 			filename = "perf.data";
121 	}
122 
123 	len = strlen(filename);
124 	self = zalloc(sizeof(*self) + len);
125 
126 	if (self == NULL)
127 		goto out;
128 
129 	memcpy(self->filename, filename, len);
130 	self->machines = RB_ROOT;
131 	self->repipe = repipe;
132 	INIT_LIST_HEAD(&self->ordered_samples.samples);
133 	INIT_LIST_HEAD(&self->ordered_samples.sample_cache);
134 	INIT_LIST_HEAD(&self->ordered_samples.to_free);
135 	machine__init(&self->host_machine, "", HOST_KERNEL_ID);
136 	hists__init(&self->hists);
137 
138 	if (mode == O_RDONLY) {
139 		if (perf_session__open(self, force) < 0)
140 			goto out_delete;
141 		perf_session__set_id_hdr_size(self);
142 	} else if (mode == O_WRONLY) {
143 		/*
144 		 * In O_RDONLY mode this will be performed when reading the
145 		 * kernel MMAP event, in perf_event__process_mmap().
146 		 */
147 		if (perf_session__create_kernel_maps(self) < 0)
148 			goto out_delete;
149 	}
150 
151 	if (tool && tool->ordering_requires_timestamps &&
152 	    tool->ordered_samples && !perf_evlist__sample_id_all(self->evlist)) {
153 		dump_printf("WARNING: No sample_id_all support, falling back to unordered processing\n");
154 		tool->ordered_samples = false;
155 	}
156 
157 out:
158 	return self;
159 out_delete:
160 	perf_session__delete(self);
161 	return NULL;
162 }
163 
164 static void perf_session__delete_dead_threads(struct perf_session *session)
165 {
166 	machine__delete_dead_threads(&session->host_machine);
167 }
168 
169 static void perf_session__delete_threads(struct perf_session *session)
170 {
171 	machine__delete_threads(&session->host_machine);
172 }
173 
174 static void perf_session_env__delete(struct perf_session_env *env)
175 {
176 	free(env->hostname);
177 	free(env->os_release);
178 	free(env->version);
179 	free(env->arch);
180 	free(env->cpu_desc);
181 	free(env->cpuid);
182 
183 	free(env->cmdline);
184 	free(env->sibling_cores);
185 	free(env->sibling_threads);
186 	free(env->numa_nodes);
187 	free(env->pmu_mappings);
188 }
189 
190 void perf_session__delete(struct perf_session *self)
191 {
192 	perf_session__destroy_kernel_maps(self);
193 	perf_session__delete_dead_threads(self);
194 	perf_session__delete_threads(self);
195 	perf_session_env__delete(&self->header.env);
196 	machine__exit(&self->host_machine);
197 	close(self->fd);
198 	free(self);
199 	vdso__exit();
200 }
201 
202 static int process_event_synth_tracing_data_stub(union perf_event *event
203 						 __maybe_unused,
204 						 struct perf_session *session
205 						__maybe_unused)
206 {
207 	dump_printf(": unhandled!\n");
208 	return 0;
209 }
210 
211 static int process_event_synth_attr_stub(union perf_event *event __maybe_unused,
212 					 struct perf_evlist **pevlist
213 					 __maybe_unused)
214 {
215 	dump_printf(": unhandled!\n");
216 	return 0;
217 }
218 
219 static int process_event_sample_stub(struct perf_tool *tool __maybe_unused,
220 				     union perf_event *event __maybe_unused,
221 				     struct perf_sample *sample __maybe_unused,
222 				     struct perf_evsel *evsel __maybe_unused,
223 				     struct machine *machine __maybe_unused)
224 {
225 	dump_printf(": unhandled!\n");
226 	return 0;
227 }
228 
229 static int process_event_stub(struct perf_tool *tool __maybe_unused,
230 			      union perf_event *event __maybe_unused,
231 			      struct perf_sample *sample __maybe_unused,
232 			      struct machine *machine __maybe_unused)
233 {
234 	dump_printf(": unhandled!\n");
235 	return 0;
236 }
237 
238 static int process_finished_round_stub(struct perf_tool *tool __maybe_unused,
239 				       union perf_event *event __maybe_unused,
240 				       struct perf_session *perf_session
241 				       __maybe_unused)
242 {
243 	dump_printf(": unhandled!\n");
244 	return 0;
245 }
246 
247 static int process_event_type_stub(struct perf_tool *tool __maybe_unused,
248 				   union perf_event *event __maybe_unused)
249 {
250 	dump_printf(": unhandled!\n");
251 	return 0;
252 }
253 
254 static int process_finished_round(struct perf_tool *tool,
255 				  union perf_event *event,
256 				  struct perf_session *session);
257 
258 static void perf_tool__fill_defaults(struct perf_tool *tool)
259 {
260 	if (tool->sample == NULL)
261 		tool->sample = process_event_sample_stub;
262 	if (tool->mmap == NULL)
263 		tool->mmap = process_event_stub;
264 	if (tool->comm == NULL)
265 		tool->comm = process_event_stub;
266 	if (tool->fork == NULL)
267 		tool->fork = process_event_stub;
268 	if (tool->exit == NULL)
269 		tool->exit = process_event_stub;
270 	if (tool->lost == NULL)
271 		tool->lost = perf_event__process_lost;
272 	if (tool->read == NULL)
273 		tool->read = process_event_sample_stub;
274 	if (tool->throttle == NULL)
275 		tool->throttle = process_event_stub;
276 	if (tool->unthrottle == NULL)
277 		tool->unthrottle = process_event_stub;
278 	if (tool->attr == NULL)
279 		tool->attr = process_event_synth_attr_stub;
280 	if (tool->event_type == NULL)
281 		tool->event_type = process_event_type_stub;
282 	if (tool->tracing_data == NULL)
283 		tool->tracing_data = process_event_synth_tracing_data_stub;
284 	if (tool->build_id == NULL)
285 		tool->build_id = process_finished_round_stub;
286 	if (tool->finished_round == NULL) {
287 		if (tool->ordered_samples)
288 			tool->finished_round = process_finished_round;
289 		else
290 			tool->finished_round = process_finished_round_stub;
291 	}
292 }
293 
294 void mem_bswap_32(void *src, int byte_size)
295 {
296 	u32 *m = src;
297 	while (byte_size > 0) {
298 		*m = bswap_32(*m);
299 		byte_size -= sizeof(u32);
300 		++m;
301 	}
302 }
303 
304 void mem_bswap_64(void *src, int byte_size)
305 {
306 	u64 *m = src;
307 
308 	while (byte_size > 0) {
309 		*m = bswap_64(*m);
310 		byte_size -= sizeof(u64);
311 		++m;
312 	}
313 }
314 
315 static void swap_sample_id_all(union perf_event *event, void *data)
316 {
317 	void *end = (void *) event + event->header.size;
318 	int size = end - data;
319 
320 	BUG_ON(size % sizeof(u64));
321 	mem_bswap_64(data, size);
322 }
323 
324 static void perf_event__all64_swap(union perf_event *event,
325 				   bool sample_id_all __maybe_unused)
326 {
327 	struct perf_event_header *hdr = &event->header;
328 	mem_bswap_64(hdr + 1, event->header.size - sizeof(*hdr));
329 }
330 
331 static void perf_event__comm_swap(union perf_event *event, bool sample_id_all)
332 {
333 	event->comm.pid = bswap_32(event->comm.pid);
334 	event->comm.tid = bswap_32(event->comm.tid);
335 
336 	if (sample_id_all) {
337 		void *data = &event->comm.comm;
338 
339 		data += PERF_ALIGN(strlen(data) + 1, sizeof(u64));
340 		swap_sample_id_all(event, data);
341 	}
342 }
343 
344 static void perf_event__mmap_swap(union perf_event *event,
345 				  bool sample_id_all)
346 {
347 	event->mmap.pid	  = bswap_32(event->mmap.pid);
348 	event->mmap.tid	  = bswap_32(event->mmap.tid);
349 	event->mmap.start = bswap_64(event->mmap.start);
350 	event->mmap.len	  = bswap_64(event->mmap.len);
351 	event->mmap.pgoff = bswap_64(event->mmap.pgoff);
352 
353 	if (sample_id_all) {
354 		void *data = &event->mmap.filename;
355 
356 		data += PERF_ALIGN(strlen(data) + 1, sizeof(u64));
357 		swap_sample_id_all(event, data);
358 	}
359 }
360 
361 static void perf_event__task_swap(union perf_event *event, bool sample_id_all)
362 {
363 	event->fork.pid	 = bswap_32(event->fork.pid);
364 	event->fork.tid	 = bswap_32(event->fork.tid);
365 	event->fork.ppid = bswap_32(event->fork.ppid);
366 	event->fork.ptid = bswap_32(event->fork.ptid);
367 	event->fork.time = bswap_64(event->fork.time);
368 
369 	if (sample_id_all)
370 		swap_sample_id_all(event, &event->fork + 1);
371 }
372 
373 static void perf_event__read_swap(union perf_event *event, bool sample_id_all)
374 {
375 	event->read.pid		 = bswap_32(event->read.pid);
376 	event->read.tid		 = bswap_32(event->read.tid);
377 	event->read.value	 = bswap_64(event->read.value);
378 	event->read.time_enabled = bswap_64(event->read.time_enabled);
379 	event->read.time_running = bswap_64(event->read.time_running);
380 	event->read.id		 = bswap_64(event->read.id);
381 
382 	if (sample_id_all)
383 		swap_sample_id_all(event, &event->read + 1);
384 }
385 
386 static u8 revbyte(u8 b)
387 {
388 	int rev = (b >> 4) | ((b & 0xf) << 4);
389 	rev = ((rev & 0xcc) >> 2) | ((rev & 0x33) << 2);
390 	rev = ((rev & 0xaa) >> 1) | ((rev & 0x55) << 1);
391 	return (u8) rev;
392 }
393 
394 /*
395  * XXX this is hack in attempt to carry flags bitfield
396  * throught endian village. ABI says:
397  *
398  * Bit-fields are allocated from right to left (least to most significant)
399  * on little-endian implementations and from left to right (most to least
400  * significant) on big-endian implementations.
401  *
402  * The above seems to be byte specific, so we need to reverse each
403  * byte of the bitfield. 'Internet' also says this might be implementation
404  * specific and we probably need proper fix and carry perf_event_attr
405  * bitfield flags in separate data file FEAT_ section. Thought this seems
406  * to work for now.
407  */
408 static void swap_bitfield(u8 *p, unsigned len)
409 {
410 	unsigned i;
411 
412 	for (i = 0; i < len; i++) {
413 		*p = revbyte(*p);
414 		p++;
415 	}
416 }
417 
418 /* exported for swapping attributes in file header */
419 void perf_event__attr_swap(struct perf_event_attr *attr)
420 {
421 	attr->type		= bswap_32(attr->type);
422 	attr->size		= bswap_32(attr->size);
423 	attr->config		= bswap_64(attr->config);
424 	attr->sample_period	= bswap_64(attr->sample_period);
425 	attr->sample_type	= bswap_64(attr->sample_type);
426 	attr->read_format	= bswap_64(attr->read_format);
427 	attr->wakeup_events	= bswap_32(attr->wakeup_events);
428 	attr->bp_type		= bswap_32(attr->bp_type);
429 	attr->bp_addr		= bswap_64(attr->bp_addr);
430 	attr->bp_len		= bswap_64(attr->bp_len);
431 
432 	swap_bitfield((u8 *) (&attr->read_format + 1), sizeof(u64));
433 }
434 
435 static void perf_event__hdr_attr_swap(union perf_event *event,
436 				      bool sample_id_all __maybe_unused)
437 {
438 	size_t size;
439 
440 	perf_event__attr_swap(&event->attr.attr);
441 
442 	size = event->header.size;
443 	size -= (void *)&event->attr.id - (void *)event;
444 	mem_bswap_64(event->attr.id, size);
445 }
446 
447 static void perf_event__event_type_swap(union perf_event *event,
448 					bool sample_id_all __maybe_unused)
449 {
450 	event->event_type.event_type.event_id =
451 		bswap_64(event->event_type.event_type.event_id);
452 }
453 
454 static void perf_event__tracing_data_swap(union perf_event *event,
455 					  bool sample_id_all __maybe_unused)
456 {
457 	event->tracing_data.size = bswap_32(event->tracing_data.size);
458 }
459 
460 typedef void (*perf_event__swap_op)(union perf_event *event,
461 				    bool sample_id_all);
462 
463 static perf_event__swap_op perf_event__swap_ops[] = {
464 	[PERF_RECORD_MMAP]		  = perf_event__mmap_swap,
465 	[PERF_RECORD_COMM]		  = perf_event__comm_swap,
466 	[PERF_RECORD_FORK]		  = perf_event__task_swap,
467 	[PERF_RECORD_EXIT]		  = perf_event__task_swap,
468 	[PERF_RECORD_LOST]		  = perf_event__all64_swap,
469 	[PERF_RECORD_READ]		  = perf_event__read_swap,
470 	[PERF_RECORD_SAMPLE]		  = perf_event__all64_swap,
471 	[PERF_RECORD_HEADER_ATTR]	  = perf_event__hdr_attr_swap,
472 	[PERF_RECORD_HEADER_EVENT_TYPE]	  = perf_event__event_type_swap,
473 	[PERF_RECORD_HEADER_TRACING_DATA] = perf_event__tracing_data_swap,
474 	[PERF_RECORD_HEADER_BUILD_ID]	  = NULL,
475 	[PERF_RECORD_HEADER_MAX]	  = NULL,
476 };
477 
478 struct sample_queue {
479 	u64			timestamp;
480 	u64			file_offset;
481 	union perf_event	*event;
482 	struct list_head	list;
483 };
484 
485 static void perf_session_free_sample_buffers(struct perf_session *session)
486 {
487 	struct ordered_samples *os = &session->ordered_samples;
488 
489 	while (!list_empty(&os->to_free)) {
490 		struct sample_queue *sq;
491 
492 		sq = list_entry(os->to_free.next, struct sample_queue, list);
493 		list_del(&sq->list);
494 		free(sq);
495 	}
496 }
497 
498 static int perf_session_deliver_event(struct perf_session *session,
499 				      union perf_event *event,
500 				      struct perf_sample *sample,
501 				      struct perf_tool *tool,
502 				      u64 file_offset);
503 
504 static int flush_sample_queue(struct perf_session *s,
505 			       struct perf_tool *tool)
506 {
507 	struct ordered_samples *os = &s->ordered_samples;
508 	struct list_head *head = &os->samples;
509 	struct sample_queue *tmp, *iter;
510 	struct perf_sample sample;
511 	u64 limit = os->next_flush;
512 	u64 last_ts = os->last_sample ? os->last_sample->timestamp : 0ULL;
513 	unsigned idx = 0, progress_next = os->nr_samples / 16;
514 	int ret;
515 
516 	if (!tool->ordered_samples || !limit)
517 		return 0;
518 
519 	list_for_each_entry_safe(iter, tmp, head, list) {
520 		if (iter->timestamp > limit)
521 			break;
522 
523 		ret = perf_evlist__parse_sample(s->evlist, iter->event, &sample);
524 		if (ret)
525 			pr_err("Can't parse sample, err = %d\n", ret);
526 		else {
527 			ret = perf_session_deliver_event(s, iter->event, &sample, tool,
528 							 iter->file_offset);
529 			if (ret)
530 				return ret;
531 		}
532 
533 		os->last_flush = iter->timestamp;
534 		list_del(&iter->list);
535 		list_add(&iter->list, &os->sample_cache);
536 		if (++idx >= progress_next) {
537 			progress_next += os->nr_samples / 16;
538 			ui_progress__update(idx, os->nr_samples,
539 					    "Processing time ordered events...");
540 		}
541 	}
542 
543 	if (list_empty(head)) {
544 		os->last_sample = NULL;
545 	} else if (last_ts <= limit) {
546 		os->last_sample =
547 			list_entry(head->prev, struct sample_queue, list);
548 	}
549 
550 	os->nr_samples = 0;
551 
552 	return 0;
553 }
554 
555 /*
556  * When perf record finishes a pass on every buffers, it records this pseudo
557  * event.
558  * We record the max timestamp t found in the pass n.
559  * Assuming these timestamps are monotonic across cpus, we know that if
560  * a buffer still has events with timestamps below t, they will be all
561  * available and then read in the pass n + 1.
562  * Hence when we start to read the pass n + 2, we can safely flush every
563  * events with timestamps below t.
564  *
565  *    ============ PASS n =================
566  *       CPU 0         |   CPU 1
567  *                     |
568  *    cnt1 timestamps  |   cnt2 timestamps
569  *          1          |         2
570  *          2          |         3
571  *          -          |         4  <--- max recorded
572  *
573  *    ============ PASS n + 1 ==============
574  *       CPU 0         |   CPU 1
575  *                     |
576  *    cnt1 timestamps  |   cnt2 timestamps
577  *          3          |         5
578  *          4          |         6
579  *          5          |         7 <---- max recorded
580  *
581  *      Flush every events below timestamp 4
582  *
583  *    ============ PASS n + 2 ==============
584  *       CPU 0         |   CPU 1
585  *                     |
586  *    cnt1 timestamps  |   cnt2 timestamps
587  *          6          |         8
588  *          7          |         9
589  *          -          |         10
590  *
591  *      Flush every events below timestamp 7
592  *      etc...
593  */
594 static int process_finished_round(struct perf_tool *tool,
595 				  union perf_event *event __maybe_unused,
596 				  struct perf_session *session)
597 {
598 	int ret = flush_sample_queue(session, tool);
599 	if (!ret)
600 		session->ordered_samples.next_flush = session->ordered_samples.max_timestamp;
601 
602 	return ret;
603 }
604 
605 /* The queue is ordered by time */
606 static void __queue_event(struct sample_queue *new, struct perf_session *s)
607 {
608 	struct ordered_samples *os = &s->ordered_samples;
609 	struct sample_queue *sample = os->last_sample;
610 	u64 timestamp = new->timestamp;
611 	struct list_head *p;
612 
613 	++os->nr_samples;
614 	os->last_sample = new;
615 
616 	if (!sample) {
617 		list_add(&new->list, &os->samples);
618 		os->max_timestamp = timestamp;
619 		return;
620 	}
621 
622 	/*
623 	 * last_sample might point to some random place in the list as it's
624 	 * the last queued event. We expect that the new event is close to
625 	 * this.
626 	 */
627 	if (sample->timestamp <= timestamp) {
628 		while (sample->timestamp <= timestamp) {
629 			p = sample->list.next;
630 			if (p == &os->samples) {
631 				list_add_tail(&new->list, &os->samples);
632 				os->max_timestamp = timestamp;
633 				return;
634 			}
635 			sample = list_entry(p, struct sample_queue, list);
636 		}
637 		list_add_tail(&new->list, &sample->list);
638 	} else {
639 		while (sample->timestamp > timestamp) {
640 			p = sample->list.prev;
641 			if (p == &os->samples) {
642 				list_add(&new->list, &os->samples);
643 				return;
644 			}
645 			sample = list_entry(p, struct sample_queue, list);
646 		}
647 		list_add(&new->list, &sample->list);
648 	}
649 }
650 
651 #define MAX_SAMPLE_BUFFER	(64 * 1024 / sizeof(struct sample_queue))
652 
653 static int perf_session_queue_event(struct perf_session *s, union perf_event *event,
654 				    struct perf_sample *sample, u64 file_offset)
655 {
656 	struct ordered_samples *os = &s->ordered_samples;
657 	struct list_head *sc = &os->sample_cache;
658 	u64 timestamp = sample->time;
659 	struct sample_queue *new;
660 
661 	if (!timestamp || timestamp == ~0ULL)
662 		return -ETIME;
663 
664 	if (timestamp < s->ordered_samples.last_flush) {
665 		printf("Warning: Timestamp below last timeslice flush\n");
666 		return -EINVAL;
667 	}
668 
669 	if (!list_empty(sc)) {
670 		new = list_entry(sc->next, struct sample_queue, list);
671 		list_del(&new->list);
672 	} else if (os->sample_buffer) {
673 		new = os->sample_buffer + os->sample_buffer_idx;
674 		if (++os->sample_buffer_idx == MAX_SAMPLE_BUFFER)
675 			os->sample_buffer = NULL;
676 	} else {
677 		os->sample_buffer = malloc(MAX_SAMPLE_BUFFER * sizeof(*new));
678 		if (!os->sample_buffer)
679 			return -ENOMEM;
680 		list_add(&os->sample_buffer->list, &os->to_free);
681 		os->sample_buffer_idx = 2;
682 		new = os->sample_buffer + 1;
683 	}
684 
685 	new->timestamp = timestamp;
686 	new->file_offset = file_offset;
687 	new->event = event;
688 
689 	__queue_event(new, s);
690 
691 	return 0;
692 }
693 
694 static void callchain__printf(struct perf_sample *sample)
695 {
696 	unsigned int i;
697 
698 	printf("... chain: nr:%" PRIu64 "\n", sample->callchain->nr);
699 
700 	for (i = 0; i < sample->callchain->nr; i++)
701 		printf("..... %2d: %016" PRIx64 "\n",
702 		       i, sample->callchain->ips[i]);
703 }
704 
705 static void branch_stack__printf(struct perf_sample *sample)
706 {
707 	uint64_t i;
708 
709 	printf("... branch stack: nr:%" PRIu64 "\n", sample->branch_stack->nr);
710 
711 	for (i = 0; i < sample->branch_stack->nr; i++)
712 		printf("..... %2"PRIu64": %016" PRIx64 " -> %016" PRIx64 "\n",
713 			i, sample->branch_stack->entries[i].from,
714 			sample->branch_stack->entries[i].to);
715 }
716 
717 static void regs_dump__printf(u64 mask, u64 *regs)
718 {
719 	unsigned rid, i = 0;
720 
721 	for_each_set_bit(rid, (unsigned long *) &mask, sizeof(mask) * 8) {
722 		u64 val = regs[i++];
723 
724 		printf(".... %-5s 0x%" PRIx64 "\n",
725 		       perf_reg_name(rid), val);
726 	}
727 }
728 
729 static void regs_user__printf(struct perf_sample *sample, u64 mask)
730 {
731 	struct regs_dump *user_regs = &sample->user_regs;
732 
733 	if (user_regs->regs) {
734 		printf("... user regs: mask 0x%" PRIx64 "\n", mask);
735 		regs_dump__printf(mask, user_regs->regs);
736 	}
737 }
738 
739 static void stack_user__printf(struct stack_dump *dump)
740 {
741 	printf("... ustack: size %" PRIu64 ", offset 0x%x\n",
742 	       dump->size, dump->offset);
743 }
744 
745 static void perf_session__print_tstamp(struct perf_session *session,
746 				       union perf_event *event,
747 				       struct perf_sample *sample)
748 {
749 	u64 sample_type = perf_evlist__sample_type(session->evlist);
750 
751 	if (event->header.type != PERF_RECORD_SAMPLE &&
752 	    !perf_evlist__sample_id_all(session->evlist)) {
753 		fputs("-1 -1 ", stdout);
754 		return;
755 	}
756 
757 	if ((sample_type & PERF_SAMPLE_CPU))
758 		printf("%u ", sample->cpu);
759 
760 	if (sample_type & PERF_SAMPLE_TIME)
761 		printf("%" PRIu64 " ", sample->time);
762 }
763 
764 static void dump_event(struct perf_session *session, union perf_event *event,
765 		       u64 file_offset, struct perf_sample *sample)
766 {
767 	if (!dump_trace)
768 		return;
769 
770 	printf("\n%#" PRIx64 " [%#x]: event: %d\n",
771 	       file_offset, event->header.size, event->header.type);
772 
773 	trace_event(event);
774 
775 	if (sample)
776 		perf_session__print_tstamp(session, event, sample);
777 
778 	printf("%#" PRIx64 " [%#x]: PERF_RECORD_%s", file_offset,
779 	       event->header.size, perf_event__name(event->header.type));
780 }
781 
782 static void dump_sample(struct perf_evsel *evsel, union perf_event *event,
783 			struct perf_sample *sample)
784 {
785 	u64 sample_type;
786 
787 	if (!dump_trace)
788 		return;
789 
790 	printf("(IP, %d): %d/%d: %#" PRIx64 " period: %" PRIu64 " addr: %#" PRIx64 "\n",
791 	       event->header.misc, sample->pid, sample->tid, sample->ip,
792 	       sample->period, sample->addr);
793 
794 	sample_type = evsel->attr.sample_type;
795 
796 	if (sample_type & PERF_SAMPLE_CALLCHAIN)
797 		callchain__printf(sample);
798 
799 	if (sample_type & PERF_SAMPLE_BRANCH_STACK)
800 		branch_stack__printf(sample);
801 
802 	if (sample_type & PERF_SAMPLE_REGS_USER)
803 		regs_user__printf(sample, evsel->attr.sample_regs_user);
804 
805 	if (sample_type & PERF_SAMPLE_STACK_USER)
806 		stack_user__printf(&sample->user_stack);
807 }
808 
809 static struct machine *
810 	perf_session__find_machine_for_cpumode(struct perf_session *session,
811 					       union perf_event *event)
812 {
813 	const u8 cpumode = event->header.misc & PERF_RECORD_MISC_CPUMODE_MASK;
814 
815 	if (perf_guest &&
816 	    ((cpumode == PERF_RECORD_MISC_GUEST_KERNEL) ||
817 	     (cpumode == PERF_RECORD_MISC_GUEST_USER))) {
818 		u32 pid;
819 
820 		if (event->header.type == PERF_RECORD_MMAP)
821 			pid = event->mmap.pid;
822 		else
823 			pid = event->ip.pid;
824 
825 		return perf_session__findnew_machine(session, pid);
826 	}
827 
828 	return perf_session__find_host_machine(session);
829 }
830 
831 static int perf_session_deliver_event(struct perf_session *session,
832 				      union perf_event *event,
833 				      struct perf_sample *sample,
834 				      struct perf_tool *tool,
835 				      u64 file_offset)
836 {
837 	struct perf_evsel *evsel;
838 	struct machine *machine;
839 
840 	dump_event(session, event, file_offset, sample);
841 
842 	evsel = perf_evlist__id2evsel(session->evlist, sample->id);
843 	if (evsel != NULL && event->header.type != PERF_RECORD_SAMPLE) {
844 		/*
845 		 * XXX We're leaving PERF_RECORD_SAMPLE unnacounted here
846 		 * because the tools right now may apply filters, discarding
847 		 * some of the samples. For consistency, in the future we
848 		 * should have something like nr_filtered_samples and remove
849 		 * the sample->period from total_sample_period, etc, KISS for
850 		 * now tho.
851 		 *
852 		 * Also testing against NULL allows us to handle files without
853 		 * attr.sample_id_all and/or without PERF_SAMPLE_ID. In the
854 		 * future probably it'll be a good idea to restrict event
855 		 * processing via perf_session to files with both set.
856 		 */
857 		hists__inc_nr_events(&evsel->hists, event->header.type);
858 	}
859 
860 	machine = perf_session__find_machine_for_cpumode(session, event);
861 
862 	switch (event->header.type) {
863 	case PERF_RECORD_SAMPLE:
864 		dump_sample(evsel, event, sample);
865 		if (evsel == NULL) {
866 			++session->hists.stats.nr_unknown_id;
867 			return 0;
868 		}
869 		if (machine == NULL) {
870 			++session->hists.stats.nr_unprocessable_samples;
871 			return 0;
872 		}
873 		return tool->sample(tool, event, sample, evsel, machine);
874 	case PERF_RECORD_MMAP:
875 		return tool->mmap(tool, event, sample, machine);
876 	case PERF_RECORD_COMM:
877 		return tool->comm(tool, event, sample, machine);
878 	case PERF_RECORD_FORK:
879 		return tool->fork(tool, event, sample, machine);
880 	case PERF_RECORD_EXIT:
881 		return tool->exit(tool, event, sample, machine);
882 	case PERF_RECORD_LOST:
883 		if (tool->lost == perf_event__process_lost)
884 			session->hists.stats.total_lost += event->lost.lost;
885 		return tool->lost(tool, event, sample, machine);
886 	case PERF_RECORD_READ:
887 		return tool->read(tool, event, sample, evsel, machine);
888 	case PERF_RECORD_THROTTLE:
889 		return tool->throttle(tool, event, sample, machine);
890 	case PERF_RECORD_UNTHROTTLE:
891 		return tool->unthrottle(tool, event, sample, machine);
892 	default:
893 		++session->hists.stats.nr_unknown_events;
894 		return -1;
895 	}
896 }
897 
898 static int perf_session__preprocess_sample(struct perf_session *session,
899 					   union perf_event *event, struct perf_sample *sample)
900 {
901 	if (event->header.type != PERF_RECORD_SAMPLE ||
902 	    !(perf_evlist__sample_type(session->evlist) & PERF_SAMPLE_CALLCHAIN))
903 		return 0;
904 
905 	if (!ip_callchain__valid(sample->callchain, event)) {
906 		pr_debug("call-chain problem with event, skipping it.\n");
907 		++session->hists.stats.nr_invalid_chains;
908 		session->hists.stats.total_invalid_chains += sample->period;
909 		return -EINVAL;
910 	}
911 	return 0;
912 }
913 
914 static int perf_session__process_user_event(struct perf_session *session, union perf_event *event,
915 					    struct perf_tool *tool, u64 file_offset)
916 {
917 	int err;
918 
919 	dump_event(session, event, file_offset, NULL);
920 
921 	/* These events are processed right away */
922 	switch (event->header.type) {
923 	case PERF_RECORD_HEADER_ATTR:
924 		err = tool->attr(event, &session->evlist);
925 		if (err == 0)
926 			perf_session__set_id_hdr_size(session);
927 		return err;
928 	case PERF_RECORD_HEADER_EVENT_TYPE:
929 		return tool->event_type(tool, event);
930 	case PERF_RECORD_HEADER_TRACING_DATA:
931 		/* setup for reading amidst mmap */
932 		lseek(session->fd, file_offset, SEEK_SET);
933 		return tool->tracing_data(event, session);
934 	case PERF_RECORD_HEADER_BUILD_ID:
935 		return tool->build_id(tool, event, session);
936 	case PERF_RECORD_FINISHED_ROUND:
937 		return tool->finished_round(tool, event, session);
938 	default:
939 		return -EINVAL;
940 	}
941 }
942 
943 static void event_swap(union perf_event *event, bool sample_id_all)
944 {
945 	perf_event__swap_op swap;
946 
947 	swap = perf_event__swap_ops[event->header.type];
948 	if (swap)
949 		swap(event, sample_id_all);
950 }
951 
952 static int perf_session__process_event(struct perf_session *session,
953 				       union perf_event *event,
954 				       struct perf_tool *tool,
955 				       u64 file_offset)
956 {
957 	struct perf_sample sample;
958 	int ret;
959 
960 	if (session->header.needs_swap)
961 		event_swap(event, perf_evlist__sample_id_all(session->evlist));
962 
963 	if (event->header.type >= PERF_RECORD_HEADER_MAX)
964 		return -EINVAL;
965 
966 	hists__inc_nr_events(&session->hists, event->header.type);
967 
968 	if (event->header.type >= PERF_RECORD_USER_TYPE_START)
969 		return perf_session__process_user_event(session, event, tool, file_offset);
970 
971 	/*
972 	 * For all kernel events we get the sample data
973 	 */
974 	ret = perf_evlist__parse_sample(session->evlist, event, &sample);
975 	if (ret)
976 		return ret;
977 
978 	/* Preprocess sample records - precheck callchains */
979 	if (perf_session__preprocess_sample(session, event, &sample))
980 		return 0;
981 
982 	if (tool->ordered_samples) {
983 		ret = perf_session_queue_event(session, event, &sample,
984 					       file_offset);
985 		if (ret != -ETIME)
986 			return ret;
987 	}
988 
989 	return perf_session_deliver_event(session, event, &sample, tool,
990 					  file_offset);
991 }
992 
993 void perf_event_header__bswap(struct perf_event_header *self)
994 {
995 	self->type = bswap_32(self->type);
996 	self->misc = bswap_16(self->misc);
997 	self->size = bswap_16(self->size);
998 }
999 
1000 struct thread *perf_session__findnew(struct perf_session *session, pid_t pid)
1001 {
1002 	return machine__findnew_thread(&session->host_machine, pid);
1003 }
1004 
1005 static struct thread *perf_session__register_idle_thread(struct perf_session *self)
1006 {
1007 	struct thread *thread = perf_session__findnew(self, 0);
1008 
1009 	if (thread == NULL || thread__set_comm(thread, "swapper")) {
1010 		pr_err("problem inserting idle task.\n");
1011 		thread = NULL;
1012 	}
1013 
1014 	return thread;
1015 }
1016 
1017 static void perf_session__warn_about_errors(const struct perf_session *session,
1018 					    const struct perf_tool *tool)
1019 {
1020 	if (tool->lost == perf_event__process_lost &&
1021 	    session->hists.stats.nr_events[PERF_RECORD_LOST] != 0) {
1022 		ui__warning("Processed %d events and lost %d chunks!\n\n"
1023 			    "Check IO/CPU overload!\n\n",
1024 			    session->hists.stats.nr_events[0],
1025 			    session->hists.stats.nr_events[PERF_RECORD_LOST]);
1026 	}
1027 
1028 	if (session->hists.stats.nr_unknown_events != 0) {
1029 		ui__warning("Found %u unknown events!\n\n"
1030 			    "Is this an older tool processing a perf.data "
1031 			    "file generated by a more recent tool?\n\n"
1032 			    "If that is not the case, consider "
1033 			    "reporting to linux-kernel@vger.kernel.org.\n\n",
1034 			    session->hists.stats.nr_unknown_events);
1035 	}
1036 
1037 	if (session->hists.stats.nr_unknown_id != 0) {
1038 		ui__warning("%u samples with id not present in the header\n",
1039 			    session->hists.stats.nr_unknown_id);
1040 	}
1041 
1042  	if (session->hists.stats.nr_invalid_chains != 0) {
1043  		ui__warning("Found invalid callchains!\n\n"
1044  			    "%u out of %u events were discarded for this reason.\n\n"
1045  			    "Consider reporting to linux-kernel@vger.kernel.org.\n\n",
1046  			    session->hists.stats.nr_invalid_chains,
1047  			    session->hists.stats.nr_events[PERF_RECORD_SAMPLE]);
1048  	}
1049 
1050 	if (session->hists.stats.nr_unprocessable_samples != 0) {
1051 		ui__warning("%u unprocessable samples recorded.\n"
1052 			    "Do you have a KVM guest running and not using 'perf kvm'?\n",
1053 			    session->hists.stats.nr_unprocessable_samples);
1054 	}
1055 }
1056 
1057 #define session_done()	(*(volatile int *)(&session_done))
1058 volatile int session_done;
1059 
1060 static int __perf_session__process_pipe_events(struct perf_session *self,
1061 					       struct perf_tool *tool)
1062 {
1063 	union perf_event *event;
1064 	uint32_t size, cur_size = 0;
1065 	void *buf = NULL;
1066 	int skip = 0;
1067 	u64 head;
1068 	int err;
1069 	void *p;
1070 
1071 	perf_tool__fill_defaults(tool);
1072 
1073 	head = 0;
1074 	cur_size = sizeof(union perf_event);
1075 
1076 	buf = malloc(cur_size);
1077 	if (!buf)
1078 		return -errno;
1079 more:
1080 	event = buf;
1081 	err = readn(self->fd, event, sizeof(struct perf_event_header));
1082 	if (err <= 0) {
1083 		if (err == 0)
1084 			goto done;
1085 
1086 		pr_err("failed to read event header\n");
1087 		goto out_err;
1088 	}
1089 
1090 	if (self->header.needs_swap)
1091 		perf_event_header__bswap(&event->header);
1092 
1093 	size = event->header.size;
1094 	if (size == 0)
1095 		size = 8;
1096 
1097 	if (size > cur_size) {
1098 		void *new = realloc(buf, size);
1099 		if (!new) {
1100 			pr_err("failed to allocate memory to read event\n");
1101 			goto out_err;
1102 		}
1103 		buf = new;
1104 		cur_size = size;
1105 		event = buf;
1106 	}
1107 	p = event;
1108 	p += sizeof(struct perf_event_header);
1109 
1110 	if (size - sizeof(struct perf_event_header)) {
1111 		err = readn(self->fd, p, size - sizeof(struct perf_event_header));
1112 		if (err <= 0) {
1113 			if (err == 0) {
1114 				pr_err("unexpected end of event stream\n");
1115 				goto done;
1116 			}
1117 
1118 			pr_err("failed to read event data\n");
1119 			goto out_err;
1120 		}
1121 	}
1122 
1123 	if ((skip = perf_session__process_event(self, event, tool, head)) < 0) {
1124 		pr_err("%#" PRIx64 " [%#x]: failed to process type: %d\n",
1125 		       head, event->header.size, event->header.type);
1126 		err = -EINVAL;
1127 		goto out_err;
1128 	}
1129 
1130 	head += size;
1131 
1132 	if (skip > 0)
1133 		head += skip;
1134 
1135 	if (!session_done())
1136 		goto more;
1137 done:
1138 	err = 0;
1139 out_err:
1140 	free(buf);
1141 	perf_session__warn_about_errors(self, tool);
1142 	perf_session_free_sample_buffers(self);
1143 	return err;
1144 }
1145 
1146 static union perf_event *
1147 fetch_mmaped_event(struct perf_session *session,
1148 		   u64 head, size_t mmap_size, char *buf)
1149 {
1150 	union perf_event *event;
1151 
1152 	/*
1153 	 * Ensure we have enough space remaining to read
1154 	 * the size of the event in the headers.
1155 	 */
1156 	if (head + sizeof(event->header) > mmap_size)
1157 		return NULL;
1158 
1159 	event = (union perf_event *)(buf + head);
1160 
1161 	if (session->header.needs_swap)
1162 		perf_event_header__bswap(&event->header);
1163 
1164 	if (head + event->header.size > mmap_size)
1165 		return NULL;
1166 
1167 	return event;
1168 }
1169 
1170 /*
1171  * On 64bit we can mmap the data file in one go. No need for tiny mmap
1172  * slices. On 32bit we use 32MB.
1173  */
1174 #if BITS_PER_LONG == 64
1175 #define MMAP_SIZE ULLONG_MAX
1176 #define NUM_MMAPS 1
1177 #else
1178 #define MMAP_SIZE (32 * 1024 * 1024ULL)
1179 #define NUM_MMAPS 128
1180 #endif
1181 
1182 int __perf_session__process_events(struct perf_session *session,
1183 				   u64 data_offset, u64 data_size,
1184 				   u64 file_size, struct perf_tool *tool)
1185 {
1186 	u64 head, page_offset, file_offset, file_pos, progress_next;
1187 	int err, mmap_prot, mmap_flags, map_idx = 0;
1188 	size_t	mmap_size;
1189 	char *buf, *mmaps[NUM_MMAPS];
1190 	union perf_event *event;
1191 	uint32_t size;
1192 
1193 	perf_tool__fill_defaults(tool);
1194 
1195 	page_offset = page_size * (data_offset / page_size);
1196 	file_offset = page_offset;
1197 	head = data_offset - page_offset;
1198 
1199 	if (data_offset + data_size < file_size)
1200 		file_size = data_offset + data_size;
1201 
1202 	progress_next = file_size / 16;
1203 
1204 	mmap_size = MMAP_SIZE;
1205 	if (mmap_size > file_size)
1206 		mmap_size = file_size;
1207 
1208 	memset(mmaps, 0, sizeof(mmaps));
1209 
1210 	mmap_prot  = PROT_READ;
1211 	mmap_flags = MAP_SHARED;
1212 
1213 	if (session->header.needs_swap) {
1214 		mmap_prot  |= PROT_WRITE;
1215 		mmap_flags = MAP_PRIVATE;
1216 	}
1217 remap:
1218 	buf = mmap(NULL, mmap_size, mmap_prot, mmap_flags, session->fd,
1219 		   file_offset);
1220 	if (buf == MAP_FAILED) {
1221 		pr_err("failed to mmap file\n");
1222 		err = -errno;
1223 		goto out_err;
1224 	}
1225 	mmaps[map_idx] = buf;
1226 	map_idx = (map_idx + 1) & (ARRAY_SIZE(mmaps) - 1);
1227 	file_pos = file_offset + head;
1228 
1229 more:
1230 	event = fetch_mmaped_event(session, head, mmap_size, buf);
1231 	if (!event) {
1232 		if (mmaps[map_idx]) {
1233 			munmap(mmaps[map_idx], mmap_size);
1234 			mmaps[map_idx] = NULL;
1235 		}
1236 
1237 		page_offset = page_size * (head / page_size);
1238 		file_offset += page_offset;
1239 		head -= page_offset;
1240 		goto remap;
1241 	}
1242 
1243 	size = event->header.size;
1244 
1245 	if (size == 0 ||
1246 	    perf_session__process_event(session, event, tool, file_pos) < 0) {
1247 		pr_err("%#" PRIx64 " [%#x]: failed to process type: %d\n",
1248 		       file_offset + head, event->header.size,
1249 		       event->header.type);
1250 		err = -EINVAL;
1251 		goto out_err;
1252 	}
1253 
1254 	head += size;
1255 	file_pos += size;
1256 
1257 	if (file_pos >= progress_next) {
1258 		progress_next += file_size / 16;
1259 		ui_progress__update(file_pos, file_size,
1260 				    "Processing events...");
1261 	}
1262 
1263 	if (file_pos < file_size)
1264 		goto more;
1265 
1266 	err = 0;
1267 	/* do the final flush for ordered samples */
1268 	session->ordered_samples.next_flush = ULLONG_MAX;
1269 	err = flush_sample_queue(session, tool);
1270 out_err:
1271 	ui_progress__finish();
1272 	perf_session__warn_about_errors(session, tool);
1273 	perf_session_free_sample_buffers(session);
1274 	return err;
1275 }
1276 
1277 int perf_session__process_events(struct perf_session *self,
1278 				 struct perf_tool *tool)
1279 {
1280 	int err;
1281 
1282 	if (perf_session__register_idle_thread(self) == NULL)
1283 		return -ENOMEM;
1284 
1285 	if (!self->fd_pipe)
1286 		err = __perf_session__process_events(self,
1287 						     self->header.data_offset,
1288 						     self->header.data_size,
1289 						     self->size, tool);
1290 	else
1291 		err = __perf_session__process_pipe_events(self, tool);
1292 
1293 	return err;
1294 }
1295 
1296 bool perf_session__has_traces(struct perf_session *session, const char *msg)
1297 {
1298 	if (!(perf_evlist__sample_type(session->evlist) & PERF_SAMPLE_RAW)) {
1299 		pr_err("No trace sample to read. Did you call 'perf %s'?\n", msg);
1300 		return false;
1301 	}
1302 
1303 	return true;
1304 }
1305 
1306 int maps__set_kallsyms_ref_reloc_sym(struct map **maps,
1307 				     const char *symbol_name, u64 addr)
1308 {
1309 	char *bracket;
1310 	enum map_type i;
1311 	struct ref_reloc_sym *ref;
1312 
1313 	ref = zalloc(sizeof(struct ref_reloc_sym));
1314 	if (ref == NULL)
1315 		return -ENOMEM;
1316 
1317 	ref->name = strdup(symbol_name);
1318 	if (ref->name == NULL) {
1319 		free(ref);
1320 		return -ENOMEM;
1321 	}
1322 
1323 	bracket = strchr(ref->name, ']');
1324 	if (bracket)
1325 		*bracket = '\0';
1326 
1327 	ref->addr = addr;
1328 
1329 	for (i = 0; i < MAP__NR_TYPES; ++i) {
1330 		struct kmap *kmap = map__kmap(maps[i]);
1331 		kmap->ref_reloc_sym = ref;
1332 	}
1333 
1334 	return 0;
1335 }
1336 
1337 size_t perf_session__fprintf_dsos(struct perf_session *self, FILE *fp)
1338 {
1339 	return __dsos__fprintf(&self->host_machine.kernel_dsos, fp) +
1340 	       __dsos__fprintf(&self->host_machine.user_dsos, fp) +
1341 	       machines__fprintf_dsos(&self->machines, fp);
1342 }
1343 
1344 size_t perf_session__fprintf_dsos_buildid(struct perf_session *self, FILE *fp,
1345 					  bool (skip)(struct dso *dso, int parm), int parm)
1346 {
1347 	size_t ret = machine__fprintf_dsos_buildid(&self->host_machine, fp, skip, parm);
1348 	return ret + machines__fprintf_dsos_buildid(&self->machines, fp, skip, parm);
1349 }
1350 
1351 size_t perf_session__fprintf_nr_events(struct perf_session *session, FILE *fp)
1352 {
1353 	struct perf_evsel *pos;
1354 	size_t ret = fprintf(fp, "Aggregated stats:\n");
1355 
1356 	ret += events_stats__fprintf(&session->hists.stats, fp);
1357 
1358 	list_for_each_entry(pos, &session->evlist->entries, node) {
1359 		ret += fprintf(fp, "%s stats:\n", perf_evsel__name(pos));
1360 		ret += events_stats__fprintf(&pos->hists.stats, fp);
1361 	}
1362 
1363 	return ret;
1364 }
1365 
1366 size_t perf_session__fprintf(struct perf_session *session, FILE *fp)
1367 {
1368 	/*
1369 	 * FIXME: Here we have to actually print all the machines in this
1370 	 * session, not just the host...
1371 	 */
1372 	return machine__fprintf(&session->host_machine, fp);
1373 }
1374 
1375 void perf_session__remove_thread(struct perf_session *session,
1376 				 struct thread *th)
1377 {
1378 	/*
1379 	 * FIXME: This one makes no sense, we need to remove the thread from
1380 	 * the machine it belongs to, perf_session can have many machines, so
1381 	 * doing it always on ->host_machine is wrong.  Fix when auditing all
1382 	 * the 'perf kvm' code.
1383 	 */
1384 	machine__remove_thread(&session->host_machine, th);
1385 }
1386 
1387 struct perf_evsel *perf_session__find_first_evtype(struct perf_session *session,
1388 					      unsigned int type)
1389 {
1390 	struct perf_evsel *pos;
1391 
1392 	list_for_each_entry(pos, &session->evlist->entries, node) {
1393 		if (pos->attr.type == type)
1394 			return pos;
1395 	}
1396 	return NULL;
1397 }
1398 
1399 void perf_evsel__print_ip(struct perf_evsel *evsel, union perf_event *event,
1400 			  struct perf_sample *sample, struct machine *machine,
1401 			  int print_sym, int print_dso, int print_symoffset)
1402 {
1403 	struct addr_location al;
1404 	struct callchain_cursor_node *node;
1405 
1406 	if (perf_event__preprocess_sample(event, machine, &al, sample,
1407 					  NULL) < 0) {
1408 		error("problem processing %d event, skipping it.\n",
1409 			event->header.type);
1410 		return;
1411 	}
1412 
1413 	if (symbol_conf.use_callchain && sample->callchain) {
1414 
1415 
1416 		if (machine__resolve_callchain(machine, evsel, al.thread,
1417 					       sample, NULL) != 0) {
1418 			if (verbose)
1419 				error("Failed to resolve callchain. Skipping\n");
1420 			return;
1421 		}
1422 		callchain_cursor_commit(&callchain_cursor);
1423 
1424 		while (1) {
1425 			node = callchain_cursor_current(&callchain_cursor);
1426 			if (!node)
1427 				break;
1428 
1429 			printf("\t%16" PRIx64, node->ip);
1430 			if (print_sym) {
1431 				printf(" ");
1432 				symbol__fprintf_symname(node->sym, stdout);
1433 			}
1434 			if (print_dso) {
1435 				printf(" (");
1436 				map__fprintf_dsoname(node->map, stdout);
1437 				printf(")");
1438 			}
1439 			printf("\n");
1440 
1441 			callchain_cursor_advance(&callchain_cursor);
1442 		}
1443 
1444 	} else {
1445 		printf("%16" PRIx64, sample->ip);
1446 		if (print_sym) {
1447 			printf(" ");
1448 			if (print_symoffset)
1449 				symbol__fprintf_symname_offs(al.sym, &al,
1450 							     stdout);
1451 			else
1452 				symbol__fprintf_symname(al.sym, stdout);
1453 		}
1454 
1455 		if (print_dso) {
1456 			printf(" (");
1457 			map__fprintf_dsoname(al.map, stdout);
1458 			printf(")");
1459 		}
1460 	}
1461 }
1462 
1463 int perf_session__cpu_bitmap(struct perf_session *session,
1464 			     const char *cpu_list, unsigned long *cpu_bitmap)
1465 {
1466 	int i;
1467 	struct cpu_map *map;
1468 
1469 	for (i = 0; i < PERF_TYPE_MAX; ++i) {
1470 		struct perf_evsel *evsel;
1471 
1472 		evsel = perf_session__find_first_evtype(session, i);
1473 		if (!evsel)
1474 			continue;
1475 
1476 		if (!(evsel->attr.sample_type & PERF_SAMPLE_CPU)) {
1477 			pr_err("File does not contain CPU events. "
1478 			       "Remove -c option to proceed.\n");
1479 			return -1;
1480 		}
1481 	}
1482 
1483 	map = cpu_map__new(cpu_list);
1484 	if (map == NULL) {
1485 		pr_err("Invalid cpu_list\n");
1486 		return -1;
1487 	}
1488 
1489 	for (i = 0; i < map->nr; i++) {
1490 		int cpu = map->map[i];
1491 
1492 		if (cpu >= MAX_NR_CPUS) {
1493 			pr_err("Requested CPU %d too large. "
1494 			       "Consider raising MAX_NR_CPUS\n", cpu);
1495 			return -1;
1496 		}
1497 
1498 		set_bit(cpu, cpu_bitmap);
1499 	}
1500 
1501 	return 0;
1502 }
1503 
1504 void perf_session__fprintf_info(struct perf_session *session, FILE *fp,
1505 				bool full)
1506 {
1507 	struct stat st;
1508 	int ret;
1509 
1510 	if (session == NULL || fp == NULL)
1511 		return;
1512 
1513 	ret = fstat(session->fd, &st);
1514 	if (ret == -1)
1515 		return;
1516 
1517 	fprintf(fp, "# ========\n");
1518 	fprintf(fp, "# captured on: %s", ctime(&st.st_ctime));
1519 	perf_header__fprintf_info(session, fp, full);
1520 	fprintf(fp, "# ========\n#\n");
1521 }
1522 
1523 
1524 int __perf_session__set_tracepoints_handlers(struct perf_session *session,
1525 					     const struct perf_evsel_str_handler *assocs,
1526 					     size_t nr_assocs)
1527 {
1528 	struct perf_evlist *evlist = session->evlist;
1529 	struct event_format *format;
1530 	struct perf_evsel *evsel;
1531 	char *tracepoint, *name;
1532 	size_t i;
1533 	int err;
1534 
1535 	for (i = 0; i < nr_assocs; i++) {
1536 		err = -ENOMEM;
1537 		tracepoint = strdup(assocs[i].name);
1538 		if (tracepoint == NULL)
1539 			goto out;
1540 
1541 		err = -ENOENT;
1542 		name = strchr(tracepoint, ':');
1543 		if (name == NULL)
1544 			goto out_free;
1545 
1546 		*name++ = '\0';
1547 		format = pevent_find_event_by_name(session->pevent,
1548 						   tracepoint, name);
1549 		if (format == NULL) {
1550 			/*
1551 			 * Adding a handler for an event not in the session,
1552 			 * just ignore it.
1553 			 */
1554 			goto next;
1555 		}
1556 
1557 		evsel = perf_evlist__find_tracepoint_by_id(evlist, format->id);
1558 		if (evsel == NULL)
1559 			goto next;
1560 
1561 		err = -EEXIST;
1562 		if (evsel->handler.func != NULL)
1563 			goto out_free;
1564 		evsel->handler.func = assocs[i].handler;
1565 next:
1566 		free(tracepoint);
1567 	}
1568 
1569 	err = 0;
1570 out:
1571 	return err;
1572 
1573 out_free:
1574 	free(tracepoint);
1575 	goto out;
1576 }
1577