xref: /openbmc/linux/tools/perf/util/session.c (revision 089a49b6)
1 #include <linux/kernel.h>
2 #include <traceevent/event-parse.h>
3 
4 #include <byteswap.h>
5 #include <unistd.h>
6 #include <sys/types.h>
7 #include <sys/mman.h>
8 
9 #include "evlist.h"
10 #include "evsel.h"
11 #include "session.h"
12 #include "tool.h"
13 #include "sort.h"
14 #include "util.h"
15 #include "cpumap.h"
16 #include "perf_regs.h"
17 #include "vdso.h"
18 
19 static int perf_session__open(struct perf_session *self, bool force)
20 {
21 	struct stat input_stat;
22 
23 	if (!strcmp(self->filename, "-")) {
24 		self->fd_pipe = true;
25 		self->fd = STDIN_FILENO;
26 
27 		if (perf_session__read_header(self) < 0)
28 			pr_err("incompatible file format (rerun with -v to learn more)");
29 
30 		return 0;
31 	}
32 
33 	self->fd = open(self->filename, O_RDONLY);
34 	if (self->fd < 0) {
35 		int err = errno;
36 
37 		pr_err("failed to open %s: %s", self->filename, strerror(err));
38 		if (err == ENOENT && !strcmp(self->filename, "perf.data"))
39 			pr_err("  (try 'perf record' first)");
40 		pr_err("\n");
41 		return -errno;
42 	}
43 
44 	if (fstat(self->fd, &input_stat) < 0)
45 		goto out_close;
46 
47 	if (!force && input_stat.st_uid && (input_stat.st_uid != geteuid())) {
48 		pr_err("file %s not owned by current user or root\n",
49 		       self->filename);
50 		goto out_close;
51 	}
52 
53 	if (!input_stat.st_size) {
54 		pr_info("zero-sized file (%s), nothing to do!\n",
55 			self->filename);
56 		goto out_close;
57 	}
58 
59 	if (perf_session__read_header(self) < 0) {
60 		pr_err("incompatible file format (rerun with -v to learn more)");
61 		goto out_close;
62 	}
63 
64 	if (!perf_evlist__valid_sample_type(self->evlist)) {
65 		pr_err("non matching sample_type");
66 		goto out_close;
67 	}
68 
69 	if (!perf_evlist__valid_sample_id_all(self->evlist)) {
70 		pr_err("non matching sample_id_all");
71 		goto out_close;
72 	}
73 
74 	if (!perf_evlist__valid_read_format(self->evlist)) {
75 		pr_err("non matching read_format");
76 		goto out_close;
77 	}
78 
79 	self->size = input_stat.st_size;
80 	return 0;
81 
82 out_close:
83 	close(self->fd);
84 	self->fd = -1;
85 	return -1;
86 }
87 
88 void perf_session__set_id_hdr_size(struct perf_session *session)
89 {
90 	u16 id_hdr_size = perf_evlist__id_hdr_size(session->evlist);
91 
92 	machines__set_id_hdr_size(&session->machines, id_hdr_size);
93 }
94 
95 int perf_session__create_kernel_maps(struct perf_session *self)
96 {
97 	int ret = machine__create_kernel_maps(&self->machines.host);
98 
99 	if (ret >= 0)
100 		ret = machines__create_guest_kernel_maps(&self->machines);
101 	return ret;
102 }
103 
104 static void perf_session__destroy_kernel_maps(struct perf_session *self)
105 {
106 	machines__destroy_kernel_maps(&self->machines);
107 }
108 
109 struct perf_session *perf_session__new(const char *filename, int mode,
110 				       bool force, bool repipe,
111 				       struct perf_tool *tool)
112 {
113 	struct perf_session *self;
114 	struct stat st;
115 	size_t len;
116 
117 	if (!filename || !strlen(filename)) {
118 		if (!fstat(STDIN_FILENO, &st) && S_ISFIFO(st.st_mode))
119 			filename = "-";
120 		else
121 			filename = "perf.data";
122 	}
123 
124 	len = strlen(filename);
125 	self = zalloc(sizeof(*self) + len);
126 
127 	if (self == NULL)
128 		goto out;
129 
130 	memcpy(self->filename, filename, len);
131 	self->repipe = repipe;
132 	INIT_LIST_HEAD(&self->ordered_samples.samples);
133 	INIT_LIST_HEAD(&self->ordered_samples.sample_cache);
134 	INIT_LIST_HEAD(&self->ordered_samples.to_free);
135 	machines__init(&self->machines);
136 
137 	if (mode == O_RDONLY) {
138 		if (perf_session__open(self, force) < 0)
139 			goto out_delete;
140 		perf_session__set_id_hdr_size(self);
141 	} else if (mode == O_WRONLY) {
142 		/*
143 		 * In O_RDONLY mode this will be performed when reading the
144 		 * kernel MMAP event, in perf_event__process_mmap().
145 		 */
146 		if (perf_session__create_kernel_maps(self) < 0)
147 			goto out_delete;
148 	}
149 
150 	if (tool && tool->ordering_requires_timestamps &&
151 	    tool->ordered_samples && !perf_evlist__sample_id_all(self->evlist)) {
152 		dump_printf("WARNING: No sample_id_all support, falling back to unordered processing\n");
153 		tool->ordered_samples = false;
154 	}
155 
156 out:
157 	return self;
158 out_delete:
159 	perf_session__delete(self);
160 	return NULL;
161 }
162 
163 static void perf_session__delete_dead_threads(struct perf_session *session)
164 {
165 	machine__delete_dead_threads(&session->machines.host);
166 }
167 
168 static void perf_session__delete_threads(struct perf_session *session)
169 {
170 	machine__delete_threads(&session->machines.host);
171 }
172 
173 static void perf_session_env__delete(struct perf_session_env *env)
174 {
175 	free(env->hostname);
176 	free(env->os_release);
177 	free(env->version);
178 	free(env->arch);
179 	free(env->cpu_desc);
180 	free(env->cpuid);
181 
182 	free(env->cmdline);
183 	free(env->sibling_cores);
184 	free(env->sibling_threads);
185 	free(env->numa_nodes);
186 	free(env->pmu_mappings);
187 }
188 
189 void perf_session__delete(struct perf_session *self)
190 {
191 	perf_session__destroy_kernel_maps(self);
192 	perf_session__delete_dead_threads(self);
193 	perf_session__delete_threads(self);
194 	perf_session_env__delete(&self->header.env);
195 	machines__exit(&self->machines);
196 	close(self->fd);
197 	free(self);
198 	vdso__exit();
199 }
200 
201 static int process_event_synth_tracing_data_stub(struct perf_tool *tool
202 						 __maybe_unused,
203 						 union perf_event *event
204 						 __maybe_unused,
205 						 struct perf_session *session
206 						__maybe_unused)
207 {
208 	dump_printf(": unhandled!\n");
209 	return 0;
210 }
211 
212 static int process_event_synth_attr_stub(struct perf_tool *tool __maybe_unused,
213 					 union perf_event *event __maybe_unused,
214 					 struct perf_evlist **pevlist
215 					 __maybe_unused)
216 {
217 	dump_printf(": unhandled!\n");
218 	return 0;
219 }
220 
221 static int process_event_sample_stub(struct perf_tool *tool __maybe_unused,
222 				     union perf_event *event __maybe_unused,
223 				     struct perf_sample *sample __maybe_unused,
224 				     struct perf_evsel *evsel __maybe_unused,
225 				     struct machine *machine __maybe_unused)
226 {
227 	dump_printf(": unhandled!\n");
228 	return 0;
229 }
230 
231 static int process_event_stub(struct perf_tool *tool __maybe_unused,
232 			      union perf_event *event __maybe_unused,
233 			      struct perf_sample *sample __maybe_unused,
234 			      struct machine *machine __maybe_unused)
235 {
236 	dump_printf(": unhandled!\n");
237 	return 0;
238 }
239 
240 static int process_finished_round_stub(struct perf_tool *tool __maybe_unused,
241 				       union perf_event *event __maybe_unused,
242 				       struct perf_session *perf_session
243 				       __maybe_unused)
244 {
245 	dump_printf(": unhandled!\n");
246 	return 0;
247 }
248 
249 static int process_finished_round(struct perf_tool *tool,
250 				  union perf_event *event,
251 				  struct perf_session *session);
252 
253 void perf_tool__fill_defaults(struct perf_tool *tool)
254 {
255 	if (tool->sample == NULL)
256 		tool->sample = process_event_sample_stub;
257 	if (tool->mmap == NULL)
258 		tool->mmap = process_event_stub;
259 	if (tool->comm == NULL)
260 		tool->comm = process_event_stub;
261 	if (tool->fork == NULL)
262 		tool->fork = process_event_stub;
263 	if (tool->exit == NULL)
264 		tool->exit = process_event_stub;
265 	if (tool->lost == NULL)
266 		tool->lost = perf_event__process_lost;
267 	if (tool->read == NULL)
268 		tool->read = process_event_sample_stub;
269 	if (tool->throttle == NULL)
270 		tool->throttle = process_event_stub;
271 	if (tool->unthrottle == NULL)
272 		tool->unthrottle = process_event_stub;
273 	if (tool->attr == NULL)
274 		tool->attr = process_event_synth_attr_stub;
275 	if (tool->tracing_data == NULL)
276 		tool->tracing_data = process_event_synth_tracing_data_stub;
277 	if (tool->build_id == NULL)
278 		tool->build_id = process_finished_round_stub;
279 	if (tool->finished_round == NULL) {
280 		if (tool->ordered_samples)
281 			tool->finished_round = process_finished_round;
282 		else
283 			tool->finished_round = process_finished_round_stub;
284 	}
285 }
286 
287 void mem_bswap_32(void *src, int byte_size)
288 {
289 	u32 *m = src;
290 	while (byte_size > 0) {
291 		*m = bswap_32(*m);
292 		byte_size -= sizeof(u32);
293 		++m;
294 	}
295 }
296 
297 void mem_bswap_64(void *src, int byte_size)
298 {
299 	u64 *m = src;
300 
301 	while (byte_size > 0) {
302 		*m = bswap_64(*m);
303 		byte_size -= sizeof(u64);
304 		++m;
305 	}
306 }
307 
308 static void swap_sample_id_all(union perf_event *event, void *data)
309 {
310 	void *end = (void *) event + event->header.size;
311 	int size = end - data;
312 
313 	BUG_ON(size % sizeof(u64));
314 	mem_bswap_64(data, size);
315 }
316 
317 static void perf_event__all64_swap(union perf_event *event,
318 				   bool sample_id_all __maybe_unused)
319 {
320 	struct perf_event_header *hdr = &event->header;
321 	mem_bswap_64(hdr + 1, event->header.size - sizeof(*hdr));
322 }
323 
324 static void perf_event__comm_swap(union perf_event *event, bool sample_id_all)
325 {
326 	event->comm.pid = bswap_32(event->comm.pid);
327 	event->comm.tid = bswap_32(event->comm.tid);
328 
329 	if (sample_id_all) {
330 		void *data = &event->comm.comm;
331 
332 		data += PERF_ALIGN(strlen(data) + 1, sizeof(u64));
333 		swap_sample_id_all(event, data);
334 	}
335 }
336 
337 static void perf_event__mmap_swap(union perf_event *event,
338 				  bool sample_id_all)
339 {
340 	event->mmap.pid	  = bswap_32(event->mmap.pid);
341 	event->mmap.tid	  = bswap_32(event->mmap.tid);
342 	event->mmap.start = bswap_64(event->mmap.start);
343 	event->mmap.len	  = bswap_64(event->mmap.len);
344 	event->mmap.pgoff = bswap_64(event->mmap.pgoff);
345 
346 	if (sample_id_all) {
347 		void *data = &event->mmap.filename;
348 
349 		data += PERF_ALIGN(strlen(data) + 1, sizeof(u64));
350 		swap_sample_id_all(event, data);
351 	}
352 }
353 
354 static void perf_event__mmap2_swap(union perf_event *event,
355 				  bool sample_id_all)
356 {
357 	event->mmap2.pid   = bswap_32(event->mmap2.pid);
358 	event->mmap2.tid   = bswap_32(event->mmap2.tid);
359 	event->mmap2.start = bswap_64(event->mmap2.start);
360 	event->mmap2.len   = bswap_64(event->mmap2.len);
361 	event->mmap2.pgoff = bswap_64(event->mmap2.pgoff);
362 	event->mmap2.maj   = bswap_32(event->mmap2.maj);
363 	event->mmap2.min   = bswap_32(event->mmap2.min);
364 	event->mmap2.ino   = bswap_64(event->mmap2.ino);
365 
366 	if (sample_id_all) {
367 		void *data = &event->mmap2.filename;
368 
369 		data += PERF_ALIGN(strlen(data) + 1, sizeof(u64));
370 		swap_sample_id_all(event, data);
371 	}
372 }
373 static void perf_event__task_swap(union perf_event *event, bool sample_id_all)
374 {
375 	event->fork.pid	 = bswap_32(event->fork.pid);
376 	event->fork.tid	 = bswap_32(event->fork.tid);
377 	event->fork.ppid = bswap_32(event->fork.ppid);
378 	event->fork.ptid = bswap_32(event->fork.ptid);
379 	event->fork.time = bswap_64(event->fork.time);
380 
381 	if (sample_id_all)
382 		swap_sample_id_all(event, &event->fork + 1);
383 }
384 
385 static void perf_event__read_swap(union perf_event *event, bool sample_id_all)
386 {
387 	event->read.pid		 = bswap_32(event->read.pid);
388 	event->read.tid		 = bswap_32(event->read.tid);
389 	event->read.value	 = bswap_64(event->read.value);
390 	event->read.time_enabled = bswap_64(event->read.time_enabled);
391 	event->read.time_running = bswap_64(event->read.time_running);
392 	event->read.id		 = bswap_64(event->read.id);
393 
394 	if (sample_id_all)
395 		swap_sample_id_all(event, &event->read + 1);
396 }
397 
398 static u8 revbyte(u8 b)
399 {
400 	int rev = (b >> 4) | ((b & 0xf) << 4);
401 	rev = ((rev & 0xcc) >> 2) | ((rev & 0x33) << 2);
402 	rev = ((rev & 0xaa) >> 1) | ((rev & 0x55) << 1);
403 	return (u8) rev;
404 }
405 
406 /*
407  * XXX this is hack in attempt to carry flags bitfield
408  * throught endian village. ABI says:
409  *
410  * Bit-fields are allocated from right to left (least to most significant)
411  * on little-endian implementations and from left to right (most to least
412  * significant) on big-endian implementations.
413  *
414  * The above seems to be byte specific, so we need to reverse each
415  * byte of the bitfield. 'Internet' also says this might be implementation
416  * specific and we probably need proper fix and carry perf_event_attr
417  * bitfield flags in separate data file FEAT_ section. Thought this seems
418  * to work for now.
419  */
420 static void swap_bitfield(u8 *p, unsigned len)
421 {
422 	unsigned i;
423 
424 	for (i = 0; i < len; i++) {
425 		*p = revbyte(*p);
426 		p++;
427 	}
428 }
429 
430 /* exported for swapping attributes in file header */
431 void perf_event__attr_swap(struct perf_event_attr *attr)
432 {
433 	attr->type		= bswap_32(attr->type);
434 	attr->size		= bswap_32(attr->size);
435 	attr->config		= bswap_64(attr->config);
436 	attr->sample_period	= bswap_64(attr->sample_period);
437 	attr->sample_type	= bswap_64(attr->sample_type);
438 	attr->read_format	= bswap_64(attr->read_format);
439 	attr->wakeup_events	= bswap_32(attr->wakeup_events);
440 	attr->bp_type		= bswap_32(attr->bp_type);
441 	attr->bp_addr		= bswap_64(attr->bp_addr);
442 	attr->bp_len		= bswap_64(attr->bp_len);
443 
444 	swap_bitfield((u8 *) (&attr->read_format + 1), sizeof(u64));
445 }
446 
447 static void perf_event__hdr_attr_swap(union perf_event *event,
448 				      bool sample_id_all __maybe_unused)
449 {
450 	size_t size;
451 
452 	perf_event__attr_swap(&event->attr.attr);
453 
454 	size = event->header.size;
455 	size -= (void *)&event->attr.id - (void *)event;
456 	mem_bswap_64(event->attr.id, size);
457 }
458 
459 static void perf_event__event_type_swap(union perf_event *event,
460 					bool sample_id_all __maybe_unused)
461 {
462 	event->event_type.event_type.event_id =
463 		bswap_64(event->event_type.event_type.event_id);
464 }
465 
466 static void perf_event__tracing_data_swap(union perf_event *event,
467 					  bool sample_id_all __maybe_unused)
468 {
469 	event->tracing_data.size = bswap_32(event->tracing_data.size);
470 }
471 
472 typedef void (*perf_event__swap_op)(union perf_event *event,
473 				    bool sample_id_all);
474 
475 static perf_event__swap_op perf_event__swap_ops[] = {
476 	[PERF_RECORD_MMAP]		  = perf_event__mmap_swap,
477 	[PERF_RECORD_MMAP2]		  = perf_event__mmap2_swap,
478 	[PERF_RECORD_COMM]		  = perf_event__comm_swap,
479 	[PERF_RECORD_FORK]		  = perf_event__task_swap,
480 	[PERF_RECORD_EXIT]		  = perf_event__task_swap,
481 	[PERF_RECORD_LOST]		  = perf_event__all64_swap,
482 	[PERF_RECORD_READ]		  = perf_event__read_swap,
483 	[PERF_RECORD_SAMPLE]		  = perf_event__all64_swap,
484 	[PERF_RECORD_HEADER_ATTR]	  = perf_event__hdr_attr_swap,
485 	[PERF_RECORD_HEADER_EVENT_TYPE]	  = perf_event__event_type_swap,
486 	[PERF_RECORD_HEADER_TRACING_DATA] = perf_event__tracing_data_swap,
487 	[PERF_RECORD_HEADER_BUILD_ID]	  = NULL,
488 	[PERF_RECORD_HEADER_MAX]	  = NULL,
489 };
490 
491 struct sample_queue {
492 	u64			timestamp;
493 	u64			file_offset;
494 	union perf_event	*event;
495 	struct list_head	list;
496 };
497 
498 static void perf_session_free_sample_buffers(struct perf_session *session)
499 {
500 	struct ordered_samples *os = &session->ordered_samples;
501 
502 	while (!list_empty(&os->to_free)) {
503 		struct sample_queue *sq;
504 
505 		sq = list_entry(os->to_free.next, struct sample_queue, list);
506 		list_del(&sq->list);
507 		free(sq);
508 	}
509 }
510 
511 static int perf_session_deliver_event(struct perf_session *session,
512 				      union perf_event *event,
513 				      struct perf_sample *sample,
514 				      struct perf_tool *tool,
515 				      u64 file_offset);
516 
517 static int flush_sample_queue(struct perf_session *s,
518 		       struct perf_tool *tool)
519 {
520 	struct ordered_samples *os = &s->ordered_samples;
521 	struct list_head *head = &os->samples;
522 	struct sample_queue *tmp, *iter;
523 	struct perf_sample sample;
524 	u64 limit = os->next_flush;
525 	u64 last_ts = os->last_sample ? os->last_sample->timestamp : 0ULL;
526 	unsigned idx = 0, progress_next = os->nr_samples / 16;
527 	bool show_progress = limit == ULLONG_MAX;
528 	int ret;
529 
530 	if (!tool->ordered_samples || !limit)
531 		return 0;
532 
533 	list_for_each_entry_safe(iter, tmp, head, list) {
534 		if (session_done())
535 			return 0;
536 
537 		if (iter->timestamp > limit)
538 			break;
539 
540 		ret = perf_evlist__parse_sample(s->evlist, iter->event, &sample);
541 		if (ret)
542 			pr_err("Can't parse sample, err = %d\n", ret);
543 		else {
544 			ret = perf_session_deliver_event(s, iter->event, &sample, tool,
545 							 iter->file_offset);
546 			if (ret)
547 				return ret;
548 		}
549 
550 		os->last_flush = iter->timestamp;
551 		list_del(&iter->list);
552 		list_add(&iter->list, &os->sample_cache);
553 		if (show_progress && (++idx >= progress_next)) {
554 			progress_next += os->nr_samples / 16;
555 			ui_progress__update(idx, os->nr_samples,
556 					    "Processing time ordered events...");
557 		}
558 	}
559 
560 	if (list_empty(head)) {
561 		os->last_sample = NULL;
562 	} else if (last_ts <= limit) {
563 		os->last_sample =
564 			list_entry(head->prev, struct sample_queue, list);
565 	}
566 
567 	os->nr_samples = 0;
568 
569 	return 0;
570 }
571 
572 /*
573  * When perf record finishes a pass on every buffers, it records this pseudo
574  * event.
575  * We record the max timestamp t found in the pass n.
576  * Assuming these timestamps are monotonic across cpus, we know that if
577  * a buffer still has events with timestamps below t, they will be all
578  * available and then read in the pass n + 1.
579  * Hence when we start to read the pass n + 2, we can safely flush every
580  * events with timestamps below t.
581  *
582  *    ============ PASS n =================
583  *       CPU 0         |   CPU 1
584  *                     |
585  *    cnt1 timestamps  |   cnt2 timestamps
586  *          1          |         2
587  *          2          |         3
588  *          -          |         4  <--- max recorded
589  *
590  *    ============ PASS n + 1 ==============
591  *       CPU 0         |   CPU 1
592  *                     |
593  *    cnt1 timestamps  |   cnt2 timestamps
594  *          3          |         5
595  *          4          |         6
596  *          5          |         7 <---- max recorded
597  *
598  *      Flush every events below timestamp 4
599  *
600  *    ============ PASS n + 2 ==============
601  *       CPU 0         |   CPU 1
602  *                     |
603  *    cnt1 timestamps  |   cnt2 timestamps
604  *          6          |         8
605  *          7          |         9
606  *          -          |         10
607  *
608  *      Flush every events below timestamp 7
609  *      etc...
610  */
611 static int process_finished_round(struct perf_tool *tool,
612 				  union perf_event *event __maybe_unused,
613 				  struct perf_session *session)
614 {
615 	int ret = flush_sample_queue(session, tool);
616 	if (!ret)
617 		session->ordered_samples.next_flush = session->ordered_samples.max_timestamp;
618 
619 	return ret;
620 }
621 
622 /* The queue is ordered by time */
623 static void __queue_event(struct sample_queue *new, struct perf_session *s)
624 {
625 	struct ordered_samples *os = &s->ordered_samples;
626 	struct sample_queue *sample = os->last_sample;
627 	u64 timestamp = new->timestamp;
628 	struct list_head *p;
629 
630 	++os->nr_samples;
631 	os->last_sample = new;
632 
633 	if (!sample) {
634 		list_add(&new->list, &os->samples);
635 		os->max_timestamp = timestamp;
636 		return;
637 	}
638 
639 	/*
640 	 * last_sample might point to some random place in the list as it's
641 	 * the last queued event. We expect that the new event is close to
642 	 * this.
643 	 */
644 	if (sample->timestamp <= timestamp) {
645 		while (sample->timestamp <= timestamp) {
646 			p = sample->list.next;
647 			if (p == &os->samples) {
648 				list_add_tail(&new->list, &os->samples);
649 				os->max_timestamp = timestamp;
650 				return;
651 			}
652 			sample = list_entry(p, struct sample_queue, list);
653 		}
654 		list_add_tail(&new->list, &sample->list);
655 	} else {
656 		while (sample->timestamp > timestamp) {
657 			p = sample->list.prev;
658 			if (p == &os->samples) {
659 				list_add(&new->list, &os->samples);
660 				return;
661 			}
662 			sample = list_entry(p, struct sample_queue, list);
663 		}
664 		list_add(&new->list, &sample->list);
665 	}
666 }
667 
668 #define MAX_SAMPLE_BUFFER	(64 * 1024 / sizeof(struct sample_queue))
669 
670 int perf_session_queue_event(struct perf_session *s, union perf_event *event,
671 				    struct perf_sample *sample, u64 file_offset)
672 {
673 	struct ordered_samples *os = &s->ordered_samples;
674 	struct list_head *sc = &os->sample_cache;
675 	u64 timestamp = sample->time;
676 	struct sample_queue *new;
677 
678 	if (!timestamp || timestamp == ~0ULL)
679 		return -ETIME;
680 
681 	if (timestamp < s->ordered_samples.last_flush) {
682 		printf("Warning: Timestamp below last timeslice flush\n");
683 		return -EINVAL;
684 	}
685 
686 	if (!list_empty(sc)) {
687 		new = list_entry(sc->next, struct sample_queue, list);
688 		list_del(&new->list);
689 	} else if (os->sample_buffer) {
690 		new = os->sample_buffer + os->sample_buffer_idx;
691 		if (++os->sample_buffer_idx == MAX_SAMPLE_BUFFER)
692 			os->sample_buffer = NULL;
693 	} else {
694 		os->sample_buffer = malloc(MAX_SAMPLE_BUFFER * sizeof(*new));
695 		if (!os->sample_buffer)
696 			return -ENOMEM;
697 		list_add(&os->sample_buffer->list, &os->to_free);
698 		os->sample_buffer_idx = 2;
699 		new = os->sample_buffer + 1;
700 	}
701 
702 	new->timestamp = timestamp;
703 	new->file_offset = file_offset;
704 	new->event = event;
705 
706 	__queue_event(new, s);
707 
708 	return 0;
709 }
710 
711 static void callchain__printf(struct perf_sample *sample)
712 {
713 	unsigned int i;
714 
715 	printf("... chain: nr:%" PRIu64 "\n", sample->callchain->nr);
716 
717 	for (i = 0; i < sample->callchain->nr; i++)
718 		printf("..... %2d: %016" PRIx64 "\n",
719 		       i, sample->callchain->ips[i]);
720 }
721 
722 static void branch_stack__printf(struct perf_sample *sample)
723 {
724 	uint64_t i;
725 
726 	printf("... branch stack: nr:%" PRIu64 "\n", sample->branch_stack->nr);
727 
728 	for (i = 0; i < sample->branch_stack->nr; i++)
729 		printf("..... %2"PRIu64": %016" PRIx64 " -> %016" PRIx64 "\n",
730 			i, sample->branch_stack->entries[i].from,
731 			sample->branch_stack->entries[i].to);
732 }
733 
734 static void regs_dump__printf(u64 mask, u64 *regs)
735 {
736 	unsigned rid, i = 0;
737 
738 	for_each_set_bit(rid, (unsigned long *) &mask, sizeof(mask) * 8) {
739 		u64 val = regs[i++];
740 
741 		printf(".... %-5s 0x%" PRIx64 "\n",
742 		       perf_reg_name(rid), val);
743 	}
744 }
745 
746 static void regs_user__printf(struct perf_sample *sample, u64 mask)
747 {
748 	struct regs_dump *user_regs = &sample->user_regs;
749 
750 	if (user_regs->regs) {
751 		printf("... user regs: mask 0x%" PRIx64 "\n", mask);
752 		regs_dump__printf(mask, user_regs->regs);
753 	}
754 }
755 
756 static void stack_user__printf(struct stack_dump *dump)
757 {
758 	printf("... ustack: size %" PRIu64 ", offset 0x%x\n",
759 	       dump->size, dump->offset);
760 }
761 
762 static void perf_session__print_tstamp(struct perf_session *session,
763 				       union perf_event *event,
764 				       struct perf_sample *sample)
765 {
766 	u64 sample_type = __perf_evlist__combined_sample_type(session->evlist);
767 
768 	if (event->header.type != PERF_RECORD_SAMPLE &&
769 	    !perf_evlist__sample_id_all(session->evlist)) {
770 		fputs("-1 -1 ", stdout);
771 		return;
772 	}
773 
774 	if ((sample_type & PERF_SAMPLE_CPU))
775 		printf("%u ", sample->cpu);
776 
777 	if (sample_type & PERF_SAMPLE_TIME)
778 		printf("%" PRIu64 " ", sample->time);
779 }
780 
781 static void sample_read__printf(struct perf_sample *sample, u64 read_format)
782 {
783 	printf("... sample_read:\n");
784 
785 	if (read_format & PERF_FORMAT_TOTAL_TIME_ENABLED)
786 		printf("...... time enabled %016" PRIx64 "\n",
787 		       sample->read.time_enabled);
788 
789 	if (read_format & PERF_FORMAT_TOTAL_TIME_RUNNING)
790 		printf("...... time running %016" PRIx64 "\n",
791 		       sample->read.time_running);
792 
793 	if (read_format & PERF_FORMAT_GROUP) {
794 		u64 i;
795 
796 		printf(".... group nr %" PRIu64 "\n", sample->read.group.nr);
797 
798 		for (i = 0; i < sample->read.group.nr; i++) {
799 			struct sample_read_value *value;
800 
801 			value = &sample->read.group.values[i];
802 			printf("..... id %016" PRIx64
803 			       ", value %016" PRIx64 "\n",
804 			       value->id, value->value);
805 		}
806 	} else
807 		printf("..... id %016" PRIx64 ", value %016" PRIx64 "\n",
808 			sample->read.one.id, sample->read.one.value);
809 }
810 
811 static void dump_event(struct perf_session *session, union perf_event *event,
812 		       u64 file_offset, struct perf_sample *sample)
813 {
814 	if (!dump_trace)
815 		return;
816 
817 	printf("\n%#" PRIx64 " [%#x]: event: %d\n",
818 	       file_offset, event->header.size, event->header.type);
819 
820 	trace_event(event);
821 
822 	if (sample)
823 		perf_session__print_tstamp(session, event, sample);
824 
825 	printf("%#" PRIx64 " [%#x]: PERF_RECORD_%s", file_offset,
826 	       event->header.size, perf_event__name(event->header.type));
827 }
828 
829 static void dump_sample(struct perf_evsel *evsel, union perf_event *event,
830 			struct perf_sample *sample)
831 {
832 	u64 sample_type;
833 
834 	if (!dump_trace)
835 		return;
836 
837 	printf("(IP, %d): %d/%d: %#" PRIx64 " period: %" PRIu64 " addr: %#" PRIx64 "\n",
838 	       event->header.misc, sample->pid, sample->tid, sample->ip,
839 	       sample->period, sample->addr);
840 
841 	sample_type = evsel->attr.sample_type;
842 
843 	if (sample_type & PERF_SAMPLE_CALLCHAIN)
844 		callchain__printf(sample);
845 
846 	if (sample_type & PERF_SAMPLE_BRANCH_STACK)
847 		branch_stack__printf(sample);
848 
849 	if (sample_type & PERF_SAMPLE_REGS_USER)
850 		regs_user__printf(sample, evsel->attr.sample_regs_user);
851 
852 	if (sample_type & PERF_SAMPLE_STACK_USER)
853 		stack_user__printf(&sample->user_stack);
854 
855 	if (sample_type & PERF_SAMPLE_WEIGHT)
856 		printf("... weight: %" PRIu64 "\n", sample->weight);
857 
858 	if (sample_type & PERF_SAMPLE_DATA_SRC)
859 		printf(" . data_src: 0x%"PRIx64"\n", sample->data_src);
860 
861 	if (sample_type & PERF_SAMPLE_READ)
862 		sample_read__printf(sample, evsel->attr.read_format);
863 }
864 
865 static struct machine *
866 	perf_session__find_machine_for_cpumode(struct perf_session *session,
867 					       union perf_event *event,
868 					       struct perf_sample *sample)
869 {
870 	const u8 cpumode = event->header.misc & PERF_RECORD_MISC_CPUMODE_MASK;
871 
872 	if (perf_guest &&
873 	    ((cpumode == PERF_RECORD_MISC_GUEST_KERNEL) ||
874 	     (cpumode == PERF_RECORD_MISC_GUEST_USER))) {
875 		u32 pid;
876 
877 		if (event->header.type == PERF_RECORD_MMAP
878 		    || event->header.type == PERF_RECORD_MMAP2)
879 			pid = event->mmap.pid;
880 		else
881 			pid = sample->pid;
882 
883 		return perf_session__findnew_machine(session, pid);
884 	}
885 
886 	return &session->machines.host;
887 }
888 
889 static int deliver_sample_value(struct perf_session *session,
890 				struct perf_tool *tool,
891 				union perf_event *event,
892 				struct perf_sample *sample,
893 				struct sample_read_value *v,
894 				struct machine *machine)
895 {
896 	struct perf_sample_id *sid;
897 
898 	sid = perf_evlist__id2sid(session->evlist, v->id);
899 	if (sid) {
900 		sample->id     = v->id;
901 		sample->period = v->value - sid->period;
902 		sid->period    = v->value;
903 	}
904 
905 	if (!sid || sid->evsel == NULL) {
906 		++session->stats.nr_unknown_id;
907 		return 0;
908 	}
909 
910 	return tool->sample(tool, event, sample, sid->evsel, machine);
911 }
912 
913 static int deliver_sample_group(struct perf_session *session,
914 				struct perf_tool *tool,
915 				union  perf_event *event,
916 				struct perf_sample *sample,
917 				struct machine *machine)
918 {
919 	int ret = -EINVAL;
920 	u64 i;
921 
922 	for (i = 0; i < sample->read.group.nr; i++) {
923 		ret = deliver_sample_value(session, tool, event, sample,
924 					   &sample->read.group.values[i],
925 					   machine);
926 		if (ret)
927 			break;
928 	}
929 
930 	return ret;
931 }
932 
933 static int
934 perf_session__deliver_sample(struct perf_session *session,
935 			     struct perf_tool *tool,
936 			     union  perf_event *event,
937 			     struct perf_sample *sample,
938 			     struct perf_evsel *evsel,
939 			     struct machine *machine)
940 {
941 	/* We know evsel != NULL. */
942 	u64 sample_type = evsel->attr.sample_type;
943 	u64 read_format = evsel->attr.read_format;
944 
945 	/* Standard sample delievery. */
946 	if (!(sample_type & PERF_SAMPLE_READ))
947 		return tool->sample(tool, event, sample, evsel, machine);
948 
949 	/* For PERF_SAMPLE_READ we have either single or group mode. */
950 	if (read_format & PERF_FORMAT_GROUP)
951 		return deliver_sample_group(session, tool, event, sample,
952 					    machine);
953 	else
954 		return deliver_sample_value(session, tool, event, sample,
955 					    &sample->read.one, machine);
956 }
957 
958 static int perf_session_deliver_event(struct perf_session *session,
959 				      union perf_event *event,
960 				      struct perf_sample *sample,
961 				      struct perf_tool *tool,
962 				      u64 file_offset)
963 {
964 	struct perf_evsel *evsel;
965 	struct machine *machine;
966 
967 	dump_event(session, event, file_offset, sample);
968 
969 	evsel = perf_evlist__id2evsel(session->evlist, sample->id);
970 	if (evsel != NULL && event->header.type != PERF_RECORD_SAMPLE) {
971 		/*
972 		 * XXX We're leaving PERF_RECORD_SAMPLE unnacounted here
973 		 * because the tools right now may apply filters, discarding
974 		 * some of the samples. For consistency, in the future we
975 		 * should have something like nr_filtered_samples and remove
976 		 * the sample->period from total_sample_period, etc, KISS for
977 		 * now tho.
978 		 *
979 		 * Also testing against NULL allows us to handle files without
980 		 * attr.sample_id_all and/or without PERF_SAMPLE_ID. In the
981 		 * future probably it'll be a good idea to restrict event
982 		 * processing via perf_session to files with both set.
983 		 */
984 		hists__inc_nr_events(&evsel->hists, event->header.type);
985 	}
986 
987 	machine = perf_session__find_machine_for_cpumode(session, event,
988 							 sample);
989 
990 	switch (event->header.type) {
991 	case PERF_RECORD_SAMPLE:
992 		dump_sample(evsel, event, sample);
993 		if (evsel == NULL) {
994 			++session->stats.nr_unknown_id;
995 			return 0;
996 		}
997 		if (machine == NULL) {
998 			++session->stats.nr_unprocessable_samples;
999 			return 0;
1000 		}
1001 		return perf_session__deliver_sample(session, tool, event,
1002 						    sample, evsel, machine);
1003 	case PERF_RECORD_MMAP:
1004 		return tool->mmap(tool, event, sample, machine);
1005 	case PERF_RECORD_MMAP2:
1006 		return tool->mmap2(tool, event, sample, machine);
1007 	case PERF_RECORD_COMM:
1008 		return tool->comm(tool, event, sample, machine);
1009 	case PERF_RECORD_FORK:
1010 		return tool->fork(tool, event, sample, machine);
1011 	case PERF_RECORD_EXIT:
1012 		return tool->exit(tool, event, sample, machine);
1013 	case PERF_RECORD_LOST:
1014 		if (tool->lost == perf_event__process_lost)
1015 			session->stats.total_lost += event->lost.lost;
1016 		return tool->lost(tool, event, sample, machine);
1017 	case PERF_RECORD_READ:
1018 		return tool->read(tool, event, sample, evsel, machine);
1019 	case PERF_RECORD_THROTTLE:
1020 		return tool->throttle(tool, event, sample, machine);
1021 	case PERF_RECORD_UNTHROTTLE:
1022 		return tool->unthrottle(tool, event, sample, machine);
1023 	default:
1024 		++session->stats.nr_unknown_events;
1025 		return -1;
1026 	}
1027 }
1028 
1029 static int perf_session__process_user_event(struct perf_session *session, union perf_event *event,
1030 					    struct perf_tool *tool, u64 file_offset)
1031 {
1032 	int err;
1033 
1034 	dump_event(session, event, file_offset, NULL);
1035 
1036 	/* These events are processed right away */
1037 	switch (event->header.type) {
1038 	case PERF_RECORD_HEADER_ATTR:
1039 		err = tool->attr(tool, event, &session->evlist);
1040 		if (err == 0)
1041 			perf_session__set_id_hdr_size(session);
1042 		return err;
1043 	case PERF_RECORD_HEADER_TRACING_DATA:
1044 		/* setup for reading amidst mmap */
1045 		lseek(session->fd, file_offset, SEEK_SET);
1046 		return tool->tracing_data(tool, event, session);
1047 	case PERF_RECORD_HEADER_BUILD_ID:
1048 		return tool->build_id(tool, event, session);
1049 	case PERF_RECORD_FINISHED_ROUND:
1050 		return tool->finished_round(tool, event, session);
1051 	default:
1052 		return -EINVAL;
1053 	}
1054 }
1055 
1056 static void event_swap(union perf_event *event, bool sample_id_all)
1057 {
1058 	perf_event__swap_op swap;
1059 
1060 	swap = perf_event__swap_ops[event->header.type];
1061 	if (swap)
1062 		swap(event, sample_id_all);
1063 }
1064 
1065 static int perf_session__process_event(struct perf_session *session,
1066 				       union perf_event *event,
1067 				       struct perf_tool *tool,
1068 				       u64 file_offset)
1069 {
1070 	struct perf_sample sample;
1071 	int ret;
1072 
1073 	if (session->header.needs_swap)
1074 		event_swap(event, perf_evlist__sample_id_all(session->evlist));
1075 
1076 	if (event->header.type >= PERF_RECORD_HEADER_MAX)
1077 		return -EINVAL;
1078 
1079 	events_stats__inc(&session->stats, event->header.type);
1080 
1081 	if (event->header.type >= PERF_RECORD_USER_TYPE_START)
1082 		return perf_session__process_user_event(session, event, tool, file_offset);
1083 
1084 	/*
1085 	 * For all kernel events we get the sample data
1086 	 */
1087 	ret = perf_evlist__parse_sample(session->evlist, event, &sample);
1088 	if (ret)
1089 		return ret;
1090 
1091 	if (tool->ordered_samples) {
1092 		ret = perf_session_queue_event(session, event, &sample,
1093 					       file_offset);
1094 		if (ret != -ETIME)
1095 			return ret;
1096 	}
1097 
1098 	return perf_session_deliver_event(session, event, &sample, tool,
1099 					  file_offset);
1100 }
1101 
1102 void perf_event_header__bswap(struct perf_event_header *self)
1103 {
1104 	self->type = bswap_32(self->type);
1105 	self->misc = bswap_16(self->misc);
1106 	self->size = bswap_16(self->size);
1107 }
1108 
1109 struct thread *perf_session__findnew(struct perf_session *session, pid_t pid)
1110 {
1111 	return machine__findnew_thread(&session->machines.host, 0, pid);
1112 }
1113 
1114 static struct thread *perf_session__register_idle_thread(struct perf_session *self)
1115 {
1116 	struct thread *thread = perf_session__findnew(self, 0);
1117 
1118 	if (thread == NULL || thread__set_comm(thread, "swapper")) {
1119 		pr_err("problem inserting idle task.\n");
1120 		thread = NULL;
1121 	}
1122 
1123 	return thread;
1124 }
1125 
1126 static void perf_session__warn_about_errors(const struct perf_session *session,
1127 					    const struct perf_tool *tool)
1128 {
1129 	if (tool->lost == perf_event__process_lost &&
1130 	    session->stats.nr_events[PERF_RECORD_LOST] != 0) {
1131 		ui__warning("Processed %d events and lost %d chunks!\n\n"
1132 			    "Check IO/CPU overload!\n\n",
1133 			    session->stats.nr_events[0],
1134 			    session->stats.nr_events[PERF_RECORD_LOST]);
1135 	}
1136 
1137 	if (session->stats.nr_unknown_events != 0) {
1138 		ui__warning("Found %u unknown events!\n\n"
1139 			    "Is this an older tool processing a perf.data "
1140 			    "file generated by a more recent tool?\n\n"
1141 			    "If that is not the case, consider "
1142 			    "reporting to linux-kernel@vger.kernel.org.\n\n",
1143 			    session->stats.nr_unknown_events);
1144 	}
1145 
1146 	if (session->stats.nr_unknown_id != 0) {
1147 		ui__warning("%u samples with id not present in the header\n",
1148 			    session->stats.nr_unknown_id);
1149 	}
1150 
1151  	if (session->stats.nr_invalid_chains != 0) {
1152  		ui__warning("Found invalid callchains!\n\n"
1153  			    "%u out of %u events were discarded for this reason.\n\n"
1154  			    "Consider reporting to linux-kernel@vger.kernel.org.\n\n",
1155  			    session->stats.nr_invalid_chains,
1156  			    session->stats.nr_events[PERF_RECORD_SAMPLE]);
1157  	}
1158 
1159 	if (session->stats.nr_unprocessable_samples != 0) {
1160 		ui__warning("%u unprocessable samples recorded.\n"
1161 			    "Do you have a KVM guest running and not using 'perf kvm'?\n",
1162 			    session->stats.nr_unprocessable_samples);
1163 	}
1164 }
1165 
1166 volatile int session_done;
1167 
1168 static int __perf_session__process_pipe_events(struct perf_session *self,
1169 					       struct perf_tool *tool)
1170 {
1171 	union perf_event *event;
1172 	uint32_t size, cur_size = 0;
1173 	void *buf = NULL;
1174 	int skip = 0;
1175 	u64 head;
1176 	int err;
1177 	void *p;
1178 
1179 	perf_tool__fill_defaults(tool);
1180 
1181 	head = 0;
1182 	cur_size = sizeof(union perf_event);
1183 
1184 	buf = malloc(cur_size);
1185 	if (!buf)
1186 		return -errno;
1187 more:
1188 	event = buf;
1189 	err = readn(self->fd, event, sizeof(struct perf_event_header));
1190 	if (err <= 0) {
1191 		if (err == 0)
1192 			goto done;
1193 
1194 		pr_err("failed to read event header\n");
1195 		goto out_err;
1196 	}
1197 
1198 	if (self->header.needs_swap)
1199 		perf_event_header__bswap(&event->header);
1200 
1201 	size = event->header.size;
1202 	if (size < sizeof(struct perf_event_header)) {
1203 		pr_err("bad event header size\n");
1204 		goto out_err;
1205 	}
1206 
1207 	if (size > cur_size) {
1208 		void *new = realloc(buf, size);
1209 		if (!new) {
1210 			pr_err("failed to allocate memory to read event\n");
1211 			goto out_err;
1212 		}
1213 		buf = new;
1214 		cur_size = size;
1215 		event = buf;
1216 	}
1217 	p = event;
1218 	p += sizeof(struct perf_event_header);
1219 
1220 	if (size - sizeof(struct perf_event_header)) {
1221 		err = readn(self->fd, p, size - sizeof(struct perf_event_header));
1222 		if (err <= 0) {
1223 			if (err == 0) {
1224 				pr_err("unexpected end of event stream\n");
1225 				goto done;
1226 			}
1227 
1228 			pr_err("failed to read event data\n");
1229 			goto out_err;
1230 		}
1231 	}
1232 
1233 	if ((skip = perf_session__process_event(self, event, tool, head)) < 0) {
1234 		pr_err("%#" PRIx64 " [%#x]: failed to process type: %d\n",
1235 		       head, event->header.size, event->header.type);
1236 		err = -EINVAL;
1237 		goto out_err;
1238 	}
1239 
1240 	head += size;
1241 
1242 	if (skip > 0)
1243 		head += skip;
1244 
1245 	if (!session_done())
1246 		goto more;
1247 done:
1248 	err = 0;
1249 out_err:
1250 	free(buf);
1251 	perf_session__warn_about_errors(self, tool);
1252 	perf_session_free_sample_buffers(self);
1253 	return err;
1254 }
1255 
1256 static union perf_event *
1257 fetch_mmaped_event(struct perf_session *session,
1258 		   u64 head, size_t mmap_size, char *buf)
1259 {
1260 	union perf_event *event;
1261 
1262 	/*
1263 	 * Ensure we have enough space remaining to read
1264 	 * the size of the event in the headers.
1265 	 */
1266 	if (head + sizeof(event->header) > mmap_size)
1267 		return NULL;
1268 
1269 	event = (union perf_event *)(buf + head);
1270 
1271 	if (session->header.needs_swap)
1272 		perf_event_header__bswap(&event->header);
1273 
1274 	if (head + event->header.size > mmap_size) {
1275 		/* We're not fetching the event so swap back again */
1276 		if (session->header.needs_swap)
1277 			perf_event_header__bswap(&event->header);
1278 		return NULL;
1279 	}
1280 
1281 	return event;
1282 }
1283 
1284 /*
1285  * On 64bit we can mmap the data file in one go. No need for tiny mmap
1286  * slices. On 32bit we use 32MB.
1287  */
1288 #if BITS_PER_LONG == 64
1289 #define MMAP_SIZE ULLONG_MAX
1290 #define NUM_MMAPS 1
1291 #else
1292 #define MMAP_SIZE (32 * 1024 * 1024ULL)
1293 #define NUM_MMAPS 128
1294 #endif
1295 
1296 int __perf_session__process_events(struct perf_session *session,
1297 				   u64 data_offset, u64 data_size,
1298 				   u64 file_size, struct perf_tool *tool)
1299 {
1300 	u64 head, page_offset, file_offset, file_pos, progress_next;
1301 	int err, mmap_prot, mmap_flags, map_idx = 0;
1302 	size_t	mmap_size;
1303 	char *buf, *mmaps[NUM_MMAPS];
1304 	union perf_event *event;
1305 	uint32_t size;
1306 
1307 	perf_tool__fill_defaults(tool);
1308 
1309 	page_offset = page_size * (data_offset / page_size);
1310 	file_offset = page_offset;
1311 	head = data_offset - page_offset;
1312 
1313 	if (data_offset + data_size < file_size)
1314 		file_size = data_offset + data_size;
1315 
1316 	progress_next = file_size / 16;
1317 
1318 	mmap_size = MMAP_SIZE;
1319 	if (mmap_size > file_size)
1320 		mmap_size = file_size;
1321 
1322 	memset(mmaps, 0, sizeof(mmaps));
1323 
1324 	mmap_prot  = PROT_READ;
1325 	mmap_flags = MAP_SHARED;
1326 
1327 	if (session->header.needs_swap) {
1328 		mmap_prot  |= PROT_WRITE;
1329 		mmap_flags = MAP_PRIVATE;
1330 	}
1331 remap:
1332 	buf = mmap(NULL, mmap_size, mmap_prot, mmap_flags, session->fd,
1333 		   file_offset);
1334 	if (buf == MAP_FAILED) {
1335 		pr_err("failed to mmap file\n");
1336 		err = -errno;
1337 		goto out_err;
1338 	}
1339 	mmaps[map_idx] = buf;
1340 	map_idx = (map_idx + 1) & (ARRAY_SIZE(mmaps) - 1);
1341 	file_pos = file_offset + head;
1342 
1343 more:
1344 	event = fetch_mmaped_event(session, head, mmap_size, buf);
1345 	if (!event) {
1346 		if (mmaps[map_idx]) {
1347 			munmap(mmaps[map_idx], mmap_size);
1348 			mmaps[map_idx] = NULL;
1349 		}
1350 
1351 		page_offset = page_size * (head / page_size);
1352 		file_offset += page_offset;
1353 		head -= page_offset;
1354 		goto remap;
1355 	}
1356 
1357 	size = event->header.size;
1358 
1359 	if (size < sizeof(struct perf_event_header) ||
1360 	    perf_session__process_event(session, event, tool, file_pos) < 0) {
1361 		pr_err("%#" PRIx64 " [%#x]: failed to process type: %d\n",
1362 		       file_offset + head, event->header.size,
1363 		       event->header.type);
1364 		err = -EINVAL;
1365 		goto out_err;
1366 	}
1367 
1368 	head += size;
1369 	file_pos += size;
1370 
1371 	if (file_pos >= progress_next) {
1372 		progress_next += file_size / 16;
1373 		ui_progress__update(file_pos, file_size,
1374 				    "Processing events...");
1375 	}
1376 
1377 	err = 0;
1378 	if (session_done())
1379 		goto out_err;
1380 
1381 	if (file_pos < file_size)
1382 		goto more;
1383 
1384 	/* do the final flush for ordered samples */
1385 	session->ordered_samples.next_flush = ULLONG_MAX;
1386 	err = flush_sample_queue(session, tool);
1387 out_err:
1388 	ui_progress__finish();
1389 	perf_session__warn_about_errors(session, tool);
1390 	perf_session_free_sample_buffers(session);
1391 	return err;
1392 }
1393 
1394 int perf_session__process_events(struct perf_session *self,
1395 				 struct perf_tool *tool)
1396 {
1397 	int err;
1398 
1399 	if (perf_session__register_idle_thread(self) == NULL)
1400 		return -ENOMEM;
1401 
1402 	if (!self->fd_pipe)
1403 		err = __perf_session__process_events(self,
1404 						     self->header.data_offset,
1405 						     self->header.data_size,
1406 						     self->size, tool);
1407 	else
1408 		err = __perf_session__process_pipe_events(self, tool);
1409 
1410 	return err;
1411 }
1412 
1413 bool perf_session__has_traces(struct perf_session *session, const char *msg)
1414 {
1415 	struct perf_evsel *evsel;
1416 
1417 	list_for_each_entry(evsel, &session->evlist->entries, node) {
1418 		if (evsel->attr.type == PERF_TYPE_TRACEPOINT)
1419 			return true;
1420 	}
1421 
1422 	pr_err("No trace sample to read. Did you call 'perf %s'?\n", msg);
1423 	return false;
1424 }
1425 
1426 int maps__set_kallsyms_ref_reloc_sym(struct map **maps,
1427 				     const char *symbol_name, u64 addr)
1428 {
1429 	char *bracket;
1430 	enum map_type i;
1431 	struct ref_reloc_sym *ref;
1432 
1433 	ref = zalloc(sizeof(struct ref_reloc_sym));
1434 	if (ref == NULL)
1435 		return -ENOMEM;
1436 
1437 	ref->name = strdup(symbol_name);
1438 	if (ref->name == NULL) {
1439 		free(ref);
1440 		return -ENOMEM;
1441 	}
1442 
1443 	bracket = strchr(ref->name, ']');
1444 	if (bracket)
1445 		*bracket = '\0';
1446 
1447 	ref->addr = addr;
1448 
1449 	for (i = 0; i < MAP__NR_TYPES; ++i) {
1450 		struct kmap *kmap = map__kmap(maps[i]);
1451 		kmap->ref_reloc_sym = ref;
1452 	}
1453 
1454 	return 0;
1455 }
1456 
1457 size_t perf_session__fprintf_dsos(struct perf_session *self, FILE *fp)
1458 {
1459 	return machines__fprintf_dsos(&self->machines, fp);
1460 }
1461 
1462 size_t perf_session__fprintf_dsos_buildid(struct perf_session *self, FILE *fp,
1463 					  bool (skip)(struct dso *dso, int parm), int parm)
1464 {
1465 	return machines__fprintf_dsos_buildid(&self->machines, fp, skip, parm);
1466 }
1467 
1468 size_t perf_session__fprintf_nr_events(struct perf_session *session, FILE *fp)
1469 {
1470 	struct perf_evsel *pos;
1471 	size_t ret = fprintf(fp, "Aggregated stats:\n");
1472 
1473 	ret += events_stats__fprintf(&session->stats, fp);
1474 
1475 	list_for_each_entry(pos, &session->evlist->entries, node) {
1476 		ret += fprintf(fp, "%s stats:\n", perf_evsel__name(pos));
1477 		ret += events_stats__fprintf(&pos->hists.stats, fp);
1478 	}
1479 
1480 	return ret;
1481 }
1482 
1483 size_t perf_session__fprintf(struct perf_session *session, FILE *fp)
1484 {
1485 	/*
1486 	 * FIXME: Here we have to actually print all the machines in this
1487 	 * session, not just the host...
1488 	 */
1489 	return machine__fprintf(&session->machines.host, fp);
1490 }
1491 
1492 struct perf_evsel *perf_session__find_first_evtype(struct perf_session *session,
1493 					      unsigned int type)
1494 {
1495 	struct perf_evsel *pos;
1496 
1497 	list_for_each_entry(pos, &session->evlist->entries, node) {
1498 		if (pos->attr.type == type)
1499 			return pos;
1500 	}
1501 	return NULL;
1502 }
1503 
1504 void perf_evsel__print_ip(struct perf_evsel *evsel, union perf_event *event,
1505 			  struct perf_sample *sample, struct machine *machine,
1506 			  unsigned int print_opts, unsigned int stack_depth)
1507 {
1508 	struct addr_location al;
1509 	struct callchain_cursor_node *node;
1510 	int print_ip = print_opts & PRINT_IP_OPT_IP;
1511 	int print_sym = print_opts & PRINT_IP_OPT_SYM;
1512 	int print_dso = print_opts & PRINT_IP_OPT_DSO;
1513 	int print_symoffset = print_opts & PRINT_IP_OPT_SYMOFFSET;
1514 	int print_oneline = print_opts & PRINT_IP_OPT_ONELINE;
1515 	char s = print_oneline ? ' ' : '\t';
1516 
1517 	if (perf_event__preprocess_sample(event, machine, &al, sample) < 0) {
1518 		error("problem processing %d event, skipping it.\n",
1519 			event->header.type);
1520 		return;
1521 	}
1522 
1523 	if (symbol_conf.use_callchain && sample->callchain) {
1524 
1525 		if (machine__resolve_callchain(machine, evsel, al.thread,
1526 					       sample, NULL, NULL) != 0) {
1527 			if (verbose)
1528 				error("Failed to resolve callchain. Skipping\n");
1529 			return;
1530 		}
1531 		callchain_cursor_commit(&callchain_cursor);
1532 
1533 		while (stack_depth) {
1534 			node = callchain_cursor_current(&callchain_cursor);
1535 			if (!node)
1536 				break;
1537 
1538 			if (print_ip)
1539 				printf("%c%16" PRIx64, s, node->ip);
1540 
1541 			if (print_sym) {
1542 				printf(" ");
1543 				if (print_symoffset) {
1544 					al.addr = node->ip;
1545 					al.map  = node->map;
1546 					symbol__fprintf_symname_offs(node->sym, &al, stdout);
1547 				} else
1548 					symbol__fprintf_symname(node->sym, stdout);
1549 			}
1550 
1551 			if (print_dso) {
1552 				printf(" (");
1553 				map__fprintf_dsoname(node->map, stdout);
1554 				printf(")");
1555 			}
1556 
1557 			if (!print_oneline)
1558 				printf("\n");
1559 
1560 			callchain_cursor_advance(&callchain_cursor);
1561 
1562 			stack_depth--;
1563 		}
1564 
1565 	} else {
1566 		if (print_ip)
1567 			printf("%16" PRIx64, sample->ip);
1568 
1569 		if (print_sym) {
1570 			printf(" ");
1571 			if (print_symoffset)
1572 				symbol__fprintf_symname_offs(al.sym, &al,
1573 							     stdout);
1574 			else
1575 				symbol__fprintf_symname(al.sym, stdout);
1576 		}
1577 
1578 		if (print_dso) {
1579 			printf(" (");
1580 			map__fprintf_dsoname(al.map, stdout);
1581 			printf(")");
1582 		}
1583 	}
1584 }
1585 
1586 int perf_session__cpu_bitmap(struct perf_session *session,
1587 			     const char *cpu_list, unsigned long *cpu_bitmap)
1588 {
1589 	int i;
1590 	struct cpu_map *map;
1591 
1592 	for (i = 0; i < PERF_TYPE_MAX; ++i) {
1593 		struct perf_evsel *evsel;
1594 
1595 		evsel = perf_session__find_first_evtype(session, i);
1596 		if (!evsel)
1597 			continue;
1598 
1599 		if (!(evsel->attr.sample_type & PERF_SAMPLE_CPU)) {
1600 			pr_err("File does not contain CPU events. "
1601 			       "Remove -c option to proceed.\n");
1602 			return -1;
1603 		}
1604 	}
1605 
1606 	map = cpu_map__new(cpu_list);
1607 	if (map == NULL) {
1608 		pr_err("Invalid cpu_list\n");
1609 		return -1;
1610 	}
1611 
1612 	for (i = 0; i < map->nr; i++) {
1613 		int cpu = map->map[i];
1614 
1615 		if (cpu >= MAX_NR_CPUS) {
1616 			pr_err("Requested CPU %d too large. "
1617 			       "Consider raising MAX_NR_CPUS\n", cpu);
1618 			return -1;
1619 		}
1620 
1621 		set_bit(cpu, cpu_bitmap);
1622 	}
1623 
1624 	return 0;
1625 }
1626 
1627 void perf_session__fprintf_info(struct perf_session *session, FILE *fp,
1628 				bool full)
1629 {
1630 	struct stat st;
1631 	int ret;
1632 
1633 	if (session == NULL || fp == NULL)
1634 		return;
1635 
1636 	ret = fstat(session->fd, &st);
1637 	if (ret == -1)
1638 		return;
1639 
1640 	fprintf(fp, "# ========\n");
1641 	fprintf(fp, "# captured on: %s", ctime(&st.st_ctime));
1642 	perf_header__fprintf_info(session, fp, full);
1643 	fprintf(fp, "# ========\n#\n");
1644 }
1645 
1646 
1647 int __perf_session__set_tracepoints_handlers(struct perf_session *session,
1648 					     const struct perf_evsel_str_handler *assocs,
1649 					     size_t nr_assocs)
1650 {
1651 	struct perf_evsel *evsel;
1652 	size_t i;
1653 	int err;
1654 
1655 	for (i = 0; i < nr_assocs; i++) {
1656 		/*
1657 		 * Adding a handler for an event not in the session,
1658 		 * just ignore it.
1659 		 */
1660 		evsel = perf_evlist__find_tracepoint_by_name(session->evlist, assocs[i].name);
1661 		if (evsel == NULL)
1662 			continue;
1663 
1664 		err = -EEXIST;
1665 		if (evsel->handler.func != NULL)
1666 			goto out;
1667 		evsel->handler.func = assocs[i].handler;
1668 	}
1669 
1670 	err = 0;
1671 out:
1672 	return err;
1673 }
1674