1 // SPDX-License-Identifier: GPL-2.0 2 #include <errno.h> 3 #include <inttypes.h> 4 #include <linux/kernel.h> 5 #include <linux/zalloc.h> 6 #include <traceevent/event-parse.h> 7 #include <api/fs/fs.h> 8 9 #include <byteswap.h> 10 #include <unistd.h> 11 #include <sys/types.h> 12 #include <sys/mman.h> 13 #include <perf/cpumap.h> 14 15 #include "evlist.h" 16 #include "evsel.h" 17 #include "memswap.h" 18 #include "map.h" 19 #include "symbol.h" 20 #include "session.h" 21 #include "tool.h" 22 #include "sort.h" 23 #include "cpumap.h" 24 #include "perf_regs.h" 25 #include "asm/bug.h" 26 #include "auxtrace.h" 27 #include "thread.h" 28 #include "thread-stack.h" 29 #include "sample-raw.h" 30 #include "stat.h" 31 #include "arch/common.h" 32 33 #ifdef HAVE_ZSTD_SUPPORT 34 static int perf_session__process_compressed_event(struct perf_session *session, 35 union perf_event *event, u64 file_offset) 36 { 37 void *src; 38 size_t decomp_size, src_size; 39 u64 decomp_last_rem = 0; 40 size_t mmap_len, decomp_len = session->header.env.comp_mmap_len; 41 struct decomp *decomp, *decomp_last = session->decomp_last; 42 43 if (decomp_last) { 44 decomp_last_rem = decomp_last->size - decomp_last->head; 45 decomp_len += decomp_last_rem; 46 } 47 48 mmap_len = sizeof(struct decomp) + decomp_len; 49 decomp = mmap(NULL, mmap_len, PROT_READ|PROT_WRITE, 50 MAP_ANONYMOUS|MAP_PRIVATE, -1, 0); 51 if (decomp == MAP_FAILED) { 52 pr_err("Couldn't allocate memory for decompression\n"); 53 return -1; 54 } 55 56 decomp->file_pos = file_offset; 57 decomp->mmap_len = mmap_len; 58 decomp->head = 0; 59 60 if (decomp_last_rem) { 61 memcpy(decomp->data, &(decomp_last->data[decomp_last->head]), decomp_last_rem); 62 decomp->size = decomp_last_rem; 63 } 64 65 src = (void *)event + sizeof(struct compressed_event); 66 src_size = event->pack.header.size - sizeof(struct compressed_event); 67 68 decomp_size = zstd_decompress_stream(&(session->zstd_data), src, src_size, 69 &(decomp->data[decomp_last_rem]), decomp_len - decomp_last_rem); 70 if (!decomp_size) { 71 munmap(decomp, mmap_len); 72 pr_err("Couldn't decompress data\n"); 73 return -1; 74 } 75 76 decomp->size += decomp_size; 77 78 if (session->decomp == NULL) { 79 session->decomp = decomp; 80 session->decomp_last = decomp; 81 } else { 82 session->decomp_last->next = decomp; 83 session->decomp_last = decomp; 84 } 85 86 pr_debug("decomp (B): %ld to %ld\n", src_size, decomp_size); 87 88 return 0; 89 } 90 #else /* !HAVE_ZSTD_SUPPORT */ 91 #define perf_session__process_compressed_event perf_session__process_compressed_event_stub 92 #endif 93 94 static int perf_session__deliver_event(struct perf_session *session, 95 union perf_event *event, 96 struct perf_tool *tool, 97 u64 file_offset); 98 99 static int perf_session__open(struct perf_session *session) 100 { 101 struct perf_data *data = session->data; 102 103 if (perf_session__read_header(session) < 0) { 104 pr_err("incompatible file format (rerun with -v to learn more)\n"); 105 return -1; 106 } 107 108 if (perf_data__is_pipe(data)) 109 return 0; 110 111 if (perf_header__has_feat(&session->header, HEADER_STAT)) 112 return 0; 113 114 if (!perf_evlist__valid_sample_type(session->evlist)) { 115 pr_err("non matching sample_type\n"); 116 return -1; 117 } 118 119 if (!perf_evlist__valid_sample_id_all(session->evlist)) { 120 pr_err("non matching sample_id_all\n"); 121 return -1; 122 } 123 124 if (!perf_evlist__valid_read_format(session->evlist)) { 125 pr_err("non matching read_format\n"); 126 return -1; 127 } 128 129 return 0; 130 } 131 132 void perf_session__set_id_hdr_size(struct perf_session *session) 133 { 134 u16 id_hdr_size = perf_evlist__id_hdr_size(session->evlist); 135 136 machines__set_id_hdr_size(&session->machines, id_hdr_size); 137 } 138 139 int perf_session__create_kernel_maps(struct perf_session *session) 140 { 141 int ret = machine__create_kernel_maps(&session->machines.host); 142 143 if (ret >= 0) 144 ret = machines__create_guest_kernel_maps(&session->machines); 145 return ret; 146 } 147 148 static void perf_session__destroy_kernel_maps(struct perf_session *session) 149 { 150 machines__destroy_kernel_maps(&session->machines); 151 } 152 153 static bool perf_session__has_comm_exec(struct perf_session *session) 154 { 155 struct evsel *evsel; 156 157 evlist__for_each_entry(session->evlist, evsel) { 158 if (evsel->core.attr.comm_exec) 159 return true; 160 } 161 162 return false; 163 } 164 165 static void perf_session__set_comm_exec(struct perf_session *session) 166 { 167 bool comm_exec = perf_session__has_comm_exec(session); 168 169 machines__set_comm_exec(&session->machines, comm_exec); 170 } 171 172 static int ordered_events__deliver_event(struct ordered_events *oe, 173 struct ordered_event *event) 174 { 175 struct perf_session *session = container_of(oe, struct perf_session, 176 ordered_events); 177 178 return perf_session__deliver_event(session, event->event, 179 session->tool, event->file_offset); 180 } 181 182 struct perf_session *perf_session__new(struct perf_data *data, 183 bool repipe, struct perf_tool *tool) 184 { 185 struct perf_session *session = zalloc(sizeof(*session)); 186 187 if (!session) 188 goto out; 189 190 session->repipe = repipe; 191 session->tool = tool; 192 INIT_LIST_HEAD(&session->auxtrace_index); 193 machines__init(&session->machines); 194 ordered_events__init(&session->ordered_events, 195 ordered_events__deliver_event, NULL); 196 197 perf_env__init(&session->header.env); 198 if (data) { 199 if (perf_data__open(data)) 200 goto out_delete; 201 202 session->data = data; 203 204 if (perf_data__is_read(data)) { 205 if (perf_session__open(session) < 0) 206 goto out_delete; 207 208 /* 209 * set session attributes that are present in perf.data 210 * but not in pipe-mode. 211 */ 212 if (!data->is_pipe) { 213 perf_session__set_id_hdr_size(session); 214 perf_session__set_comm_exec(session); 215 } 216 217 perf_evlist__init_trace_event_sample_raw(session->evlist); 218 219 /* Open the directory data. */ 220 if (data->is_dir && perf_data__open_dir(data)) 221 goto out_delete; 222 } 223 } else { 224 session->machines.host.env = &perf_env; 225 } 226 227 session->machines.host.single_address_space = 228 perf_env__single_address_space(session->machines.host.env); 229 230 if (!data || perf_data__is_write(data)) { 231 /* 232 * In O_RDONLY mode this will be performed when reading the 233 * kernel MMAP event, in perf_event__process_mmap(). 234 */ 235 if (perf_session__create_kernel_maps(session) < 0) 236 pr_warning("Cannot read kernel map\n"); 237 } 238 239 /* 240 * In pipe-mode, evlist is empty until PERF_RECORD_HEADER_ATTR is 241 * processed, so perf_evlist__sample_id_all is not meaningful here. 242 */ 243 if ((!data || !data->is_pipe) && tool && tool->ordering_requires_timestamps && 244 tool->ordered_events && !perf_evlist__sample_id_all(session->evlist)) { 245 dump_printf("WARNING: No sample_id_all support, falling back to unordered processing\n"); 246 tool->ordered_events = false; 247 } 248 249 return session; 250 251 out_delete: 252 perf_session__delete(session); 253 out: 254 return NULL; 255 } 256 257 static void perf_session__delete_threads(struct perf_session *session) 258 { 259 machine__delete_threads(&session->machines.host); 260 } 261 262 static void perf_session__release_decomp_events(struct perf_session *session) 263 { 264 struct decomp *next, *decomp; 265 size_t mmap_len; 266 next = session->decomp; 267 do { 268 decomp = next; 269 if (decomp == NULL) 270 break; 271 next = decomp->next; 272 mmap_len = decomp->mmap_len; 273 munmap(decomp, mmap_len); 274 } while (1); 275 } 276 277 void perf_session__delete(struct perf_session *session) 278 { 279 if (session == NULL) 280 return; 281 auxtrace__free(session); 282 auxtrace_index__free(&session->auxtrace_index); 283 perf_session__destroy_kernel_maps(session); 284 perf_session__delete_threads(session); 285 perf_session__release_decomp_events(session); 286 perf_env__exit(&session->header.env); 287 machines__exit(&session->machines); 288 if (session->data) 289 perf_data__close(session->data); 290 free(session); 291 } 292 293 static int process_event_synth_tracing_data_stub(struct perf_session *session 294 __maybe_unused, 295 union perf_event *event 296 __maybe_unused) 297 { 298 dump_printf(": unhandled!\n"); 299 return 0; 300 } 301 302 static int process_event_synth_attr_stub(struct perf_tool *tool __maybe_unused, 303 union perf_event *event __maybe_unused, 304 struct evlist **pevlist 305 __maybe_unused) 306 { 307 dump_printf(": unhandled!\n"); 308 return 0; 309 } 310 311 static int process_event_synth_event_update_stub(struct perf_tool *tool __maybe_unused, 312 union perf_event *event __maybe_unused, 313 struct evlist **pevlist 314 __maybe_unused) 315 { 316 if (dump_trace) 317 perf_event__fprintf_event_update(event, stdout); 318 319 dump_printf(": unhandled!\n"); 320 return 0; 321 } 322 323 static int process_event_sample_stub(struct perf_tool *tool __maybe_unused, 324 union perf_event *event __maybe_unused, 325 struct perf_sample *sample __maybe_unused, 326 struct evsel *evsel __maybe_unused, 327 struct machine *machine __maybe_unused) 328 { 329 dump_printf(": unhandled!\n"); 330 return 0; 331 } 332 333 static int process_event_stub(struct perf_tool *tool __maybe_unused, 334 union perf_event *event __maybe_unused, 335 struct perf_sample *sample __maybe_unused, 336 struct machine *machine __maybe_unused) 337 { 338 dump_printf(": unhandled!\n"); 339 return 0; 340 } 341 342 static int process_finished_round_stub(struct perf_tool *tool __maybe_unused, 343 union perf_event *event __maybe_unused, 344 struct ordered_events *oe __maybe_unused) 345 { 346 dump_printf(": unhandled!\n"); 347 return 0; 348 } 349 350 static int process_finished_round(struct perf_tool *tool, 351 union perf_event *event, 352 struct ordered_events *oe); 353 354 static int skipn(int fd, off_t n) 355 { 356 char buf[4096]; 357 ssize_t ret; 358 359 while (n > 0) { 360 ret = read(fd, buf, min(n, (off_t)sizeof(buf))); 361 if (ret <= 0) 362 return ret; 363 n -= ret; 364 } 365 366 return 0; 367 } 368 369 static s64 process_event_auxtrace_stub(struct perf_session *session __maybe_unused, 370 union perf_event *event) 371 { 372 dump_printf(": unhandled!\n"); 373 if (perf_data__is_pipe(session->data)) 374 skipn(perf_data__fd(session->data), event->auxtrace.size); 375 return event->auxtrace.size; 376 } 377 378 static int process_event_op2_stub(struct perf_session *session __maybe_unused, 379 union perf_event *event __maybe_unused) 380 { 381 dump_printf(": unhandled!\n"); 382 return 0; 383 } 384 385 386 static 387 int process_event_thread_map_stub(struct perf_session *session __maybe_unused, 388 union perf_event *event __maybe_unused) 389 { 390 if (dump_trace) 391 perf_event__fprintf_thread_map(event, stdout); 392 393 dump_printf(": unhandled!\n"); 394 return 0; 395 } 396 397 static 398 int process_event_cpu_map_stub(struct perf_session *session __maybe_unused, 399 union perf_event *event __maybe_unused) 400 { 401 if (dump_trace) 402 perf_event__fprintf_cpu_map(event, stdout); 403 404 dump_printf(": unhandled!\n"); 405 return 0; 406 } 407 408 static 409 int process_event_stat_config_stub(struct perf_session *session __maybe_unused, 410 union perf_event *event __maybe_unused) 411 { 412 if (dump_trace) 413 perf_event__fprintf_stat_config(event, stdout); 414 415 dump_printf(": unhandled!\n"); 416 return 0; 417 } 418 419 static int process_stat_stub(struct perf_session *perf_session __maybe_unused, 420 union perf_event *event) 421 { 422 if (dump_trace) 423 perf_event__fprintf_stat(event, stdout); 424 425 dump_printf(": unhandled!\n"); 426 return 0; 427 } 428 429 static int process_stat_round_stub(struct perf_session *perf_session __maybe_unused, 430 union perf_event *event) 431 { 432 if (dump_trace) 433 perf_event__fprintf_stat_round(event, stdout); 434 435 dump_printf(": unhandled!\n"); 436 return 0; 437 } 438 439 static int perf_session__process_compressed_event_stub(struct perf_session *session __maybe_unused, 440 union perf_event *event __maybe_unused, 441 u64 file_offset __maybe_unused) 442 { 443 dump_printf(": unhandled!\n"); 444 return 0; 445 } 446 447 void perf_tool__fill_defaults(struct perf_tool *tool) 448 { 449 if (tool->sample == NULL) 450 tool->sample = process_event_sample_stub; 451 if (tool->mmap == NULL) 452 tool->mmap = process_event_stub; 453 if (tool->mmap2 == NULL) 454 tool->mmap2 = process_event_stub; 455 if (tool->comm == NULL) 456 tool->comm = process_event_stub; 457 if (tool->namespaces == NULL) 458 tool->namespaces = process_event_stub; 459 if (tool->fork == NULL) 460 tool->fork = process_event_stub; 461 if (tool->exit == NULL) 462 tool->exit = process_event_stub; 463 if (tool->lost == NULL) 464 tool->lost = perf_event__process_lost; 465 if (tool->lost_samples == NULL) 466 tool->lost_samples = perf_event__process_lost_samples; 467 if (tool->aux == NULL) 468 tool->aux = perf_event__process_aux; 469 if (tool->itrace_start == NULL) 470 tool->itrace_start = perf_event__process_itrace_start; 471 if (tool->context_switch == NULL) 472 tool->context_switch = perf_event__process_switch; 473 if (tool->ksymbol == NULL) 474 tool->ksymbol = perf_event__process_ksymbol; 475 if (tool->bpf_event == NULL) 476 tool->bpf_event = perf_event__process_bpf_event; 477 if (tool->read == NULL) 478 tool->read = process_event_sample_stub; 479 if (tool->throttle == NULL) 480 tool->throttle = process_event_stub; 481 if (tool->unthrottle == NULL) 482 tool->unthrottle = process_event_stub; 483 if (tool->attr == NULL) 484 tool->attr = process_event_synth_attr_stub; 485 if (tool->event_update == NULL) 486 tool->event_update = process_event_synth_event_update_stub; 487 if (tool->tracing_data == NULL) 488 tool->tracing_data = process_event_synth_tracing_data_stub; 489 if (tool->build_id == NULL) 490 tool->build_id = process_event_op2_stub; 491 if (tool->finished_round == NULL) { 492 if (tool->ordered_events) 493 tool->finished_round = process_finished_round; 494 else 495 tool->finished_round = process_finished_round_stub; 496 } 497 if (tool->id_index == NULL) 498 tool->id_index = process_event_op2_stub; 499 if (tool->auxtrace_info == NULL) 500 tool->auxtrace_info = process_event_op2_stub; 501 if (tool->auxtrace == NULL) 502 tool->auxtrace = process_event_auxtrace_stub; 503 if (tool->auxtrace_error == NULL) 504 tool->auxtrace_error = process_event_op2_stub; 505 if (tool->thread_map == NULL) 506 tool->thread_map = process_event_thread_map_stub; 507 if (tool->cpu_map == NULL) 508 tool->cpu_map = process_event_cpu_map_stub; 509 if (tool->stat_config == NULL) 510 tool->stat_config = process_event_stat_config_stub; 511 if (tool->stat == NULL) 512 tool->stat = process_stat_stub; 513 if (tool->stat_round == NULL) 514 tool->stat_round = process_stat_round_stub; 515 if (tool->time_conv == NULL) 516 tool->time_conv = process_event_op2_stub; 517 if (tool->feature == NULL) 518 tool->feature = process_event_op2_stub; 519 if (tool->compressed == NULL) 520 tool->compressed = perf_session__process_compressed_event; 521 } 522 523 static void swap_sample_id_all(union perf_event *event, void *data) 524 { 525 void *end = (void *) event + event->header.size; 526 int size = end - data; 527 528 BUG_ON(size % sizeof(u64)); 529 mem_bswap_64(data, size); 530 } 531 532 static void perf_event__all64_swap(union perf_event *event, 533 bool sample_id_all __maybe_unused) 534 { 535 struct perf_event_header *hdr = &event->header; 536 mem_bswap_64(hdr + 1, event->header.size - sizeof(*hdr)); 537 } 538 539 static void perf_event__comm_swap(union perf_event *event, bool sample_id_all) 540 { 541 event->comm.pid = bswap_32(event->comm.pid); 542 event->comm.tid = bswap_32(event->comm.tid); 543 544 if (sample_id_all) { 545 void *data = &event->comm.comm; 546 547 data += PERF_ALIGN(strlen(data) + 1, sizeof(u64)); 548 swap_sample_id_all(event, data); 549 } 550 } 551 552 static void perf_event__mmap_swap(union perf_event *event, 553 bool sample_id_all) 554 { 555 event->mmap.pid = bswap_32(event->mmap.pid); 556 event->mmap.tid = bswap_32(event->mmap.tid); 557 event->mmap.start = bswap_64(event->mmap.start); 558 event->mmap.len = bswap_64(event->mmap.len); 559 event->mmap.pgoff = bswap_64(event->mmap.pgoff); 560 561 if (sample_id_all) { 562 void *data = &event->mmap.filename; 563 564 data += PERF_ALIGN(strlen(data) + 1, sizeof(u64)); 565 swap_sample_id_all(event, data); 566 } 567 } 568 569 static void perf_event__mmap2_swap(union perf_event *event, 570 bool sample_id_all) 571 { 572 event->mmap2.pid = bswap_32(event->mmap2.pid); 573 event->mmap2.tid = bswap_32(event->mmap2.tid); 574 event->mmap2.start = bswap_64(event->mmap2.start); 575 event->mmap2.len = bswap_64(event->mmap2.len); 576 event->mmap2.pgoff = bswap_64(event->mmap2.pgoff); 577 event->mmap2.maj = bswap_32(event->mmap2.maj); 578 event->mmap2.min = bswap_32(event->mmap2.min); 579 event->mmap2.ino = bswap_64(event->mmap2.ino); 580 581 if (sample_id_all) { 582 void *data = &event->mmap2.filename; 583 584 data += PERF_ALIGN(strlen(data) + 1, sizeof(u64)); 585 swap_sample_id_all(event, data); 586 } 587 } 588 static void perf_event__task_swap(union perf_event *event, bool sample_id_all) 589 { 590 event->fork.pid = bswap_32(event->fork.pid); 591 event->fork.tid = bswap_32(event->fork.tid); 592 event->fork.ppid = bswap_32(event->fork.ppid); 593 event->fork.ptid = bswap_32(event->fork.ptid); 594 event->fork.time = bswap_64(event->fork.time); 595 596 if (sample_id_all) 597 swap_sample_id_all(event, &event->fork + 1); 598 } 599 600 static void perf_event__read_swap(union perf_event *event, bool sample_id_all) 601 { 602 event->read.pid = bswap_32(event->read.pid); 603 event->read.tid = bswap_32(event->read.tid); 604 event->read.value = bswap_64(event->read.value); 605 event->read.time_enabled = bswap_64(event->read.time_enabled); 606 event->read.time_running = bswap_64(event->read.time_running); 607 event->read.id = bswap_64(event->read.id); 608 609 if (sample_id_all) 610 swap_sample_id_all(event, &event->read + 1); 611 } 612 613 static void perf_event__aux_swap(union perf_event *event, bool sample_id_all) 614 { 615 event->aux.aux_offset = bswap_64(event->aux.aux_offset); 616 event->aux.aux_size = bswap_64(event->aux.aux_size); 617 event->aux.flags = bswap_64(event->aux.flags); 618 619 if (sample_id_all) 620 swap_sample_id_all(event, &event->aux + 1); 621 } 622 623 static void perf_event__itrace_start_swap(union perf_event *event, 624 bool sample_id_all) 625 { 626 event->itrace_start.pid = bswap_32(event->itrace_start.pid); 627 event->itrace_start.tid = bswap_32(event->itrace_start.tid); 628 629 if (sample_id_all) 630 swap_sample_id_all(event, &event->itrace_start + 1); 631 } 632 633 static void perf_event__switch_swap(union perf_event *event, bool sample_id_all) 634 { 635 if (event->header.type == PERF_RECORD_SWITCH_CPU_WIDE) { 636 event->context_switch.next_prev_pid = 637 bswap_32(event->context_switch.next_prev_pid); 638 event->context_switch.next_prev_tid = 639 bswap_32(event->context_switch.next_prev_tid); 640 } 641 642 if (sample_id_all) 643 swap_sample_id_all(event, &event->context_switch + 1); 644 } 645 646 static void perf_event__throttle_swap(union perf_event *event, 647 bool sample_id_all) 648 { 649 event->throttle.time = bswap_64(event->throttle.time); 650 event->throttle.id = bswap_64(event->throttle.id); 651 event->throttle.stream_id = bswap_64(event->throttle.stream_id); 652 653 if (sample_id_all) 654 swap_sample_id_all(event, &event->throttle + 1); 655 } 656 657 static void perf_event__namespaces_swap(union perf_event *event, 658 bool sample_id_all) 659 { 660 u64 i; 661 662 event->namespaces.pid = bswap_32(event->namespaces.pid); 663 event->namespaces.tid = bswap_32(event->namespaces.tid); 664 event->namespaces.nr_namespaces = bswap_64(event->namespaces.nr_namespaces); 665 666 for (i = 0; i < event->namespaces.nr_namespaces; i++) { 667 struct perf_ns_link_info *ns = &event->namespaces.link_info[i]; 668 669 ns->dev = bswap_64(ns->dev); 670 ns->ino = bswap_64(ns->ino); 671 } 672 673 if (sample_id_all) 674 swap_sample_id_all(event, &event->namespaces.link_info[i]); 675 } 676 677 static u8 revbyte(u8 b) 678 { 679 int rev = (b >> 4) | ((b & 0xf) << 4); 680 rev = ((rev & 0xcc) >> 2) | ((rev & 0x33) << 2); 681 rev = ((rev & 0xaa) >> 1) | ((rev & 0x55) << 1); 682 return (u8) rev; 683 } 684 685 /* 686 * XXX this is hack in attempt to carry flags bitfield 687 * through endian village. ABI says: 688 * 689 * Bit-fields are allocated from right to left (least to most significant) 690 * on little-endian implementations and from left to right (most to least 691 * significant) on big-endian implementations. 692 * 693 * The above seems to be byte specific, so we need to reverse each 694 * byte of the bitfield. 'Internet' also says this might be implementation 695 * specific and we probably need proper fix and carry perf_event_attr 696 * bitfield flags in separate data file FEAT_ section. Thought this seems 697 * to work for now. 698 */ 699 static void swap_bitfield(u8 *p, unsigned len) 700 { 701 unsigned i; 702 703 for (i = 0; i < len; i++) { 704 *p = revbyte(*p); 705 p++; 706 } 707 } 708 709 /* exported for swapping attributes in file header */ 710 void perf_event__attr_swap(struct perf_event_attr *attr) 711 { 712 attr->type = bswap_32(attr->type); 713 attr->size = bswap_32(attr->size); 714 715 #define bswap_safe(f, n) \ 716 (attr->size > (offsetof(struct perf_event_attr, f) + \ 717 sizeof(attr->f) * (n))) 718 #define bswap_field(f, sz) \ 719 do { \ 720 if (bswap_safe(f, 0)) \ 721 attr->f = bswap_##sz(attr->f); \ 722 } while(0) 723 #define bswap_field_16(f) bswap_field(f, 16) 724 #define bswap_field_32(f) bswap_field(f, 32) 725 #define bswap_field_64(f) bswap_field(f, 64) 726 727 bswap_field_64(config); 728 bswap_field_64(sample_period); 729 bswap_field_64(sample_type); 730 bswap_field_64(read_format); 731 bswap_field_32(wakeup_events); 732 bswap_field_32(bp_type); 733 bswap_field_64(bp_addr); 734 bswap_field_64(bp_len); 735 bswap_field_64(branch_sample_type); 736 bswap_field_64(sample_regs_user); 737 bswap_field_32(sample_stack_user); 738 bswap_field_32(aux_watermark); 739 bswap_field_16(sample_max_stack); 740 741 /* 742 * After read_format are bitfields. Check read_format because 743 * we are unable to use offsetof on bitfield. 744 */ 745 if (bswap_safe(read_format, 1)) 746 swap_bitfield((u8 *) (&attr->read_format + 1), 747 sizeof(u64)); 748 #undef bswap_field_64 749 #undef bswap_field_32 750 #undef bswap_field 751 #undef bswap_safe 752 } 753 754 static void perf_event__hdr_attr_swap(union perf_event *event, 755 bool sample_id_all __maybe_unused) 756 { 757 size_t size; 758 759 perf_event__attr_swap(&event->attr.attr); 760 761 size = event->header.size; 762 size -= (void *)&event->attr.id - (void *)event; 763 mem_bswap_64(event->attr.id, size); 764 } 765 766 static void perf_event__event_update_swap(union perf_event *event, 767 bool sample_id_all __maybe_unused) 768 { 769 event->event_update.type = bswap_64(event->event_update.type); 770 event->event_update.id = bswap_64(event->event_update.id); 771 } 772 773 static void perf_event__event_type_swap(union perf_event *event, 774 bool sample_id_all __maybe_unused) 775 { 776 event->event_type.event_type.event_id = 777 bswap_64(event->event_type.event_type.event_id); 778 } 779 780 static void perf_event__tracing_data_swap(union perf_event *event, 781 bool sample_id_all __maybe_unused) 782 { 783 event->tracing_data.size = bswap_32(event->tracing_data.size); 784 } 785 786 static void perf_event__auxtrace_info_swap(union perf_event *event, 787 bool sample_id_all __maybe_unused) 788 { 789 size_t size; 790 791 event->auxtrace_info.type = bswap_32(event->auxtrace_info.type); 792 793 size = event->header.size; 794 size -= (void *)&event->auxtrace_info.priv - (void *)event; 795 mem_bswap_64(event->auxtrace_info.priv, size); 796 } 797 798 static void perf_event__auxtrace_swap(union perf_event *event, 799 bool sample_id_all __maybe_unused) 800 { 801 event->auxtrace.size = bswap_64(event->auxtrace.size); 802 event->auxtrace.offset = bswap_64(event->auxtrace.offset); 803 event->auxtrace.reference = bswap_64(event->auxtrace.reference); 804 event->auxtrace.idx = bswap_32(event->auxtrace.idx); 805 event->auxtrace.tid = bswap_32(event->auxtrace.tid); 806 event->auxtrace.cpu = bswap_32(event->auxtrace.cpu); 807 } 808 809 static void perf_event__auxtrace_error_swap(union perf_event *event, 810 bool sample_id_all __maybe_unused) 811 { 812 event->auxtrace_error.type = bswap_32(event->auxtrace_error.type); 813 event->auxtrace_error.code = bswap_32(event->auxtrace_error.code); 814 event->auxtrace_error.cpu = bswap_32(event->auxtrace_error.cpu); 815 event->auxtrace_error.pid = bswap_32(event->auxtrace_error.pid); 816 event->auxtrace_error.tid = bswap_32(event->auxtrace_error.tid); 817 event->auxtrace_error.fmt = bswap_32(event->auxtrace_error.fmt); 818 event->auxtrace_error.ip = bswap_64(event->auxtrace_error.ip); 819 if (event->auxtrace_error.fmt) 820 event->auxtrace_error.time = bswap_64(event->auxtrace_error.time); 821 } 822 823 static void perf_event__thread_map_swap(union perf_event *event, 824 bool sample_id_all __maybe_unused) 825 { 826 unsigned i; 827 828 event->thread_map.nr = bswap_64(event->thread_map.nr); 829 830 for (i = 0; i < event->thread_map.nr; i++) 831 event->thread_map.entries[i].pid = bswap_64(event->thread_map.entries[i].pid); 832 } 833 834 static void perf_event__cpu_map_swap(union perf_event *event, 835 bool sample_id_all __maybe_unused) 836 { 837 struct cpu_map_data *data = &event->cpu_map.data; 838 struct cpu_map_entries *cpus; 839 struct cpu_map_mask *mask; 840 unsigned i; 841 842 data->type = bswap_64(data->type); 843 844 switch (data->type) { 845 case PERF_CPU_MAP__CPUS: 846 cpus = (struct cpu_map_entries *)data->data; 847 848 cpus->nr = bswap_16(cpus->nr); 849 850 for (i = 0; i < cpus->nr; i++) 851 cpus->cpu[i] = bswap_16(cpus->cpu[i]); 852 break; 853 case PERF_CPU_MAP__MASK: 854 mask = (struct cpu_map_mask *) data->data; 855 856 mask->nr = bswap_16(mask->nr); 857 mask->long_size = bswap_16(mask->long_size); 858 859 switch (mask->long_size) { 860 case 4: mem_bswap_32(&mask->mask, mask->nr); break; 861 case 8: mem_bswap_64(&mask->mask, mask->nr); break; 862 default: 863 pr_err("cpu_map swap: unsupported long size\n"); 864 } 865 default: 866 break; 867 } 868 } 869 870 static void perf_event__stat_config_swap(union perf_event *event, 871 bool sample_id_all __maybe_unused) 872 { 873 u64 size; 874 875 size = event->stat_config.nr * sizeof(event->stat_config.data[0]); 876 size += 1; /* nr item itself */ 877 mem_bswap_64(&event->stat_config.nr, size); 878 } 879 880 static void perf_event__stat_swap(union perf_event *event, 881 bool sample_id_all __maybe_unused) 882 { 883 event->stat.id = bswap_64(event->stat.id); 884 event->stat.thread = bswap_32(event->stat.thread); 885 event->stat.cpu = bswap_32(event->stat.cpu); 886 event->stat.val = bswap_64(event->stat.val); 887 event->stat.ena = bswap_64(event->stat.ena); 888 event->stat.run = bswap_64(event->stat.run); 889 } 890 891 static void perf_event__stat_round_swap(union perf_event *event, 892 bool sample_id_all __maybe_unused) 893 { 894 event->stat_round.type = bswap_64(event->stat_round.type); 895 event->stat_round.time = bswap_64(event->stat_round.time); 896 } 897 898 typedef void (*perf_event__swap_op)(union perf_event *event, 899 bool sample_id_all); 900 901 static perf_event__swap_op perf_event__swap_ops[] = { 902 [PERF_RECORD_MMAP] = perf_event__mmap_swap, 903 [PERF_RECORD_MMAP2] = perf_event__mmap2_swap, 904 [PERF_RECORD_COMM] = perf_event__comm_swap, 905 [PERF_RECORD_FORK] = perf_event__task_swap, 906 [PERF_RECORD_EXIT] = perf_event__task_swap, 907 [PERF_RECORD_LOST] = perf_event__all64_swap, 908 [PERF_RECORD_READ] = perf_event__read_swap, 909 [PERF_RECORD_THROTTLE] = perf_event__throttle_swap, 910 [PERF_RECORD_UNTHROTTLE] = perf_event__throttle_swap, 911 [PERF_RECORD_SAMPLE] = perf_event__all64_swap, 912 [PERF_RECORD_AUX] = perf_event__aux_swap, 913 [PERF_RECORD_ITRACE_START] = perf_event__itrace_start_swap, 914 [PERF_RECORD_LOST_SAMPLES] = perf_event__all64_swap, 915 [PERF_RECORD_SWITCH] = perf_event__switch_swap, 916 [PERF_RECORD_SWITCH_CPU_WIDE] = perf_event__switch_swap, 917 [PERF_RECORD_NAMESPACES] = perf_event__namespaces_swap, 918 [PERF_RECORD_HEADER_ATTR] = perf_event__hdr_attr_swap, 919 [PERF_RECORD_HEADER_EVENT_TYPE] = perf_event__event_type_swap, 920 [PERF_RECORD_HEADER_TRACING_DATA] = perf_event__tracing_data_swap, 921 [PERF_RECORD_HEADER_BUILD_ID] = NULL, 922 [PERF_RECORD_ID_INDEX] = perf_event__all64_swap, 923 [PERF_RECORD_AUXTRACE_INFO] = perf_event__auxtrace_info_swap, 924 [PERF_RECORD_AUXTRACE] = perf_event__auxtrace_swap, 925 [PERF_RECORD_AUXTRACE_ERROR] = perf_event__auxtrace_error_swap, 926 [PERF_RECORD_THREAD_MAP] = perf_event__thread_map_swap, 927 [PERF_RECORD_CPU_MAP] = perf_event__cpu_map_swap, 928 [PERF_RECORD_STAT_CONFIG] = perf_event__stat_config_swap, 929 [PERF_RECORD_STAT] = perf_event__stat_swap, 930 [PERF_RECORD_STAT_ROUND] = perf_event__stat_round_swap, 931 [PERF_RECORD_EVENT_UPDATE] = perf_event__event_update_swap, 932 [PERF_RECORD_TIME_CONV] = perf_event__all64_swap, 933 [PERF_RECORD_HEADER_MAX] = NULL, 934 }; 935 936 /* 937 * When perf record finishes a pass on every buffers, it records this pseudo 938 * event. 939 * We record the max timestamp t found in the pass n. 940 * Assuming these timestamps are monotonic across cpus, we know that if 941 * a buffer still has events with timestamps below t, they will be all 942 * available and then read in the pass n + 1. 943 * Hence when we start to read the pass n + 2, we can safely flush every 944 * events with timestamps below t. 945 * 946 * ============ PASS n ================= 947 * CPU 0 | CPU 1 948 * | 949 * cnt1 timestamps | cnt2 timestamps 950 * 1 | 2 951 * 2 | 3 952 * - | 4 <--- max recorded 953 * 954 * ============ PASS n + 1 ============== 955 * CPU 0 | CPU 1 956 * | 957 * cnt1 timestamps | cnt2 timestamps 958 * 3 | 5 959 * 4 | 6 960 * 5 | 7 <---- max recorded 961 * 962 * Flush every events below timestamp 4 963 * 964 * ============ PASS n + 2 ============== 965 * CPU 0 | CPU 1 966 * | 967 * cnt1 timestamps | cnt2 timestamps 968 * 6 | 8 969 * 7 | 9 970 * - | 10 971 * 972 * Flush every events below timestamp 7 973 * etc... 974 */ 975 static int process_finished_round(struct perf_tool *tool __maybe_unused, 976 union perf_event *event __maybe_unused, 977 struct ordered_events *oe) 978 { 979 if (dump_trace) 980 fprintf(stdout, "\n"); 981 return ordered_events__flush(oe, OE_FLUSH__ROUND); 982 } 983 984 int perf_session__queue_event(struct perf_session *s, union perf_event *event, 985 u64 timestamp, u64 file_offset) 986 { 987 return ordered_events__queue(&s->ordered_events, event, timestamp, file_offset); 988 } 989 990 static void callchain__lbr_callstack_printf(struct perf_sample *sample) 991 { 992 struct ip_callchain *callchain = sample->callchain; 993 struct branch_stack *lbr_stack = sample->branch_stack; 994 u64 kernel_callchain_nr = callchain->nr; 995 unsigned int i; 996 997 for (i = 0; i < kernel_callchain_nr; i++) { 998 if (callchain->ips[i] == PERF_CONTEXT_USER) 999 break; 1000 } 1001 1002 if ((i != kernel_callchain_nr) && lbr_stack->nr) { 1003 u64 total_nr; 1004 /* 1005 * LBR callstack can only get user call chain, 1006 * i is kernel call chain number, 1007 * 1 is PERF_CONTEXT_USER. 1008 * 1009 * The user call chain is stored in LBR registers. 1010 * LBR are pair registers. The caller is stored 1011 * in "from" register, while the callee is stored 1012 * in "to" register. 1013 * For example, there is a call stack 1014 * "A"->"B"->"C"->"D". 1015 * The LBR registers will recorde like 1016 * "C"->"D", "B"->"C", "A"->"B". 1017 * So only the first "to" register and all "from" 1018 * registers are needed to construct the whole stack. 1019 */ 1020 total_nr = i + 1 + lbr_stack->nr + 1; 1021 kernel_callchain_nr = i + 1; 1022 1023 printf("... LBR call chain: nr:%" PRIu64 "\n", total_nr); 1024 1025 for (i = 0; i < kernel_callchain_nr; i++) 1026 printf("..... %2d: %016" PRIx64 "\n", 1027 i, callchain->ips[i]); 1028 1029 printf("..... %2d: %016" PRIx64 "\n", 1030 (int)(kernel_callchain_nr), lbr_stack->entries[0].to); 1031 for (i = 0; i < lbr_stack->nr; i++) 1032 printf("..... %2d: %016" PRIx64 "\n", 1033 (int)(i + kernel_callchain_nr + 1), lbr_stack->entries[i].from); 1034 } 1035 } 1036 1037 static void callchain__printf(struct evsel *evsel, 1038 struct perf_sample *sample) 1039 { 1040 unsigned int i; 1041 struct ip_callchain *callchain = sample->callchain; 1042 1043 if (perf_evsel__has_branch_callstack(evsel)) 1044 callchain__lbr_callstack_printf(sample); 1045 1046 printf("... FP chain: nr:%" PRIu64 "\n", callchain->nr); 1047 1048 for (i = 0; i < callchain->nr; i++) 1049 printf("..... %2d: %016" PRIx64 "\n", 1050 i, callchain->ips[i]); 1051 } 1052 1053 static void branch_stack__printf(struct perf_sample *sample) 1054 { 1055 uint64_t i; 1056 1057 printf("... branch stack: nr:%" PRIu64 "\n", sample->branch_stack->nr); 1058 1059 for (i = 0; i < sample->branch_stack->nr; i++) { 1060 struct branch_entry *e = &sample->branch_stack->entries[i]; 1061 1062 printf("..... %2"PRIu64": %016" PRIx64 " -> %016" PRIx64 " %hu cycles %s%s%s%s %x\n", 1063 i, e->from, e->to, 1064 (unsigned short)e->flags.cycles, 1065 e->flags.mispred ? "M" : " ", 1066 e->flags.predicted ? "P" : " ", 1067 e->flags.abort ? "A" : " ", 1068 e->flags.in_tx ? "T" : " ", 1069 (unsigned)e->flags.reserved); 1070 } 1071 } 1072 1073 static void regs_dump__printf(u64 mask, u64 *regs) 1074 { 1075 unsigned rid, i = 0; 1076 1077 for_each_set_bit(rid, (unsigned long *) &mask, sizeof(mask) * 8) { 1078 u64 val = regs[i++]; 1079 1080 printf(".... %-5s 0x%" PRIx64 "\n", 1081 perf_reg_name(rid), val); 1082 } 1083 } 1084 1085 static const char *regs_abi[] = { 1086 [PERF_SAMPLE_REGS_ABI_NONE] = "none", 1087 [PERF_SAMPLE_REGS_ABI_32] = "32-bit", 1088 [PERF_SAMPLE_REGS_ABI_64] = "64-bit", 1089 }; 1090 1091 static inline const char *regs_dump_abi(struct regs_dump *d) 1092 { 1093 if (d->abi > PERF_SAMPLE_REGS_ABI_64) 1094 return "unknown"; 1095 1096 return regs_abi[d->abi]; 1097 } 1098 1099 static void regs__printf(const char *type, struct regs_dump *regs) 1100 { 1101 u64 mask = regs->mask; 1102 1103 printf("... %s regs: mask 0x%" PRIx64 " ABI %s\n", 1104 type, 1105 mask, 1106 regs_dump_abi(regs)); 1107 1108 regs_dump__printf(mask, regs->regs); 1109 } 1110 1111 static void regs_user__printf(struct perf_sample *sample) 1112 { 1113 struct regs_dump *user_regs = &sample->user_regs; 1114 1115 if (user_regs->regs) 1116 regs__printf("user", user_regs); 1117 } 1118 1119 static void regs_intr__printf(struct perf_sample *sample) 1120 { 1121 struct regs_dump *intr_regs = &sample->intr_regs; 1122 1123 if (intr_regs->regs) 1124 regs__printf("intr", intr_regs); 1125 } 1126 1127 static void stack_user__printf(struct stack_dump *dump) 1128 { 1129 printf("... ustack: size %" PRIu64 ", offset 0x%x\n", 1130 dump->size, dump->offset); 1131 } 1132 1133 static void perf_evlist__print_tstamp(struct evlist *evlist, 1134 union perf_event *event, 1135 struct perf_sample *sample) 1136 { 1137 u64 sample_type = __perf_evlist__combined_sample_type(evlist); 1138 1139 if (event->header.type != PERF_RECORD_SAMPLE && 1140 !perf_evlist__sample_id_all(evlist)) { 1141 fputs("-1 -1 ", stdout); 1142 return; 1143 } 1144 1145 if ((sample_type & PERF_SAMPLE_CPU)) 1146 printf("%u ", sample->cpu); 1147 1148 if (sample_type & PERF_SAMPLE_TIME) 1149 printf("%" PRIu64 " ", sample->time); 1150 } 1151 1152 static void sample_read__printf(struct perf_sample *sample, u64 read_format) 1153 { 1154 printf("... sample_read:\n"); 1155 1156 if (read_format & PERF_FORMAT_TOTAL_TIME_ENABLED) 1157 printf("...... time enabled %016" PRIx64 "\n", 1158 sample->read.time_enabled); 1159 1160 if (read_format & PERF_FORMAT_TOTAL_TIME_RUNNING) 1161 printf("...... time running %016" PRIx64 "\n", 1162 sample->read.time_running); 1163 1164 if (read_format & PERF_FORMAT_GROUP) { 1165 u64 i; 1166 1167 printf(".... group nr %" PRIu64 "\n", sample->read.group.nr); 1168 1169 for (i = 0; i < sample->read.group.nr; i++) { 1170 struct sample_read_value *value; 1171 1172 value = &sample->read.group.values[i]; 1173 printf("..... id %016" PRIx64 1174 ", value %016" PRIx64 "\n", 1175 value->id, value->value); 1176 } 1177 } else 1178 printf("..... id %016" PRIx64 ", value %016" PRIx64 "\n", 1179 sample->read.one.id, sample->read.one.value); 1180 } 1181 1182 static void dump_event(struct evlist *evlist, union perf_event *event, 1183 u64 file_offset, struct perf_sample *sample) 1184 { 1185 if (!dump_trace) 1186 return; 1187 1188 printf("\n%#" PRIx64 " [%#x]: event: %d\n", 1189 file_offset, event->header.size, event->header.type); 1190 1191 trace_event(event); 1192 if (event->header.type == PERF_RECORD_SAMPLE && evlist->trace_event_sample_raw) 1193 evlist->trace_event_sample_raw(evlist, event, sample); 1194 1195 if (sample) 1196 perf_evlist__print_tstamp(evlist, event, sample); 1197 1198 printf("%#" PRIx64 " [%#x]: PERF_RECORD_%s", file_offset, 1199 event->header.size, perf_event__name(event->header.type)); 1200 } 1201 1202 static void dump_sample(struct evsel *evsel, union perf_event *event, 1203 struct perf_sample *sample) 1204 { 1205 u64 sample_type; 1206 1207 if (!dump_trace) 1208 return; 1209 1210 printf("(IP, 0x%x): %d/%d: %#" PRIx64 " period: %" PRIu64 " addr: %#" PRIx64 "\n", 1211 event->header.misc, sample->pid, sample->tid, sample->ip, 1212 sample->period, sample->addr); 1213 1214 sample_type = evsel->core.attr.sample_type; 1215 1216 if (evsel__has_callchain(evsel)) 1217 callchain__printf(evsel, sample); 1218 1219 if ((sample_type & PERF_SAMPLE_BRANCH_STACK) && !perf_evsel__has_branch_callstack(evsel)) 1220 branch_stack__printf(sample); 1221 1222 if (sample_type & PERF_SAMPLE_REGS_USER) 1223 regs_user__printf(sample); 1224 1225 if (sample_type & PERF_SAMPLE_REGS_INTR) 1226 regs_intr__printf(sample); 1227 1228 if (sample_type & PERF_SAMPLE_STACK_USER) 1229 stack_user__printf(&sample->user_stack); 1230 1231 if (sample_type & PERF_SAMPLE_WEIGHT) 1232 printf("... weight: %" PRIu64 "\n", sample->weight); 1233 1234 if (sample_type & PERF_SAMPLE_DATA_SRC) 1235 printf(" . data_src: 0x%"PRIx64"\n", sample->data_src); 1236 1237 if (sample_type & PERF_SAMPLE_PHYS_ADDR) 1238 printf(" .. phys_addr: 0x%"PRIx64"\n", sample->phys_addr); 1239 1240 if (sample_type & PERF_SAMPLE_TRANSACTION) 1241 printf("... transaction: %" PRIx64 "\n", sample->transaction); 1242 1243 if (sample_type & PERF_SAMPLE_READ) 1244 sample_read__printf(sample, evsel->core.attr.read_format); 1245 } 1246 1247 static void dump_read(struct evsel *evsel, union perf_event *event) 1248 { 1249 struct read_event *read_event = &event->read; 1250 u64 read_format; 1251 1252 if (!dump_trace) 1253 return; 1254 1255 printf(": %d %d %s %" PRIu64 "\n", event->read.pid, event->read.tid, 1256 perf_evsel__name(evsel), 1257 event->read.value); 1258 1259 if (!evsel) 1260 return; 1261 1262 read_format = evsel->core.attr.read_format; 1263 1264 if (read_format & PERF_FORMAT_TOTAL_TIME_ENABLED) 1265 printf("... time enabled : %" PRIu64 "\n", read_event->time_enabled); 1266 1267 if (read_format & PERF_FORMAT_TOTAL_TIME_RUNNING) 1268 printf("... time running : %" PRIu64 "\n", read_event->time_running); 1269 1270 if (read_format & PERF_FORMAT_ID) 1271 printf("... id : %" PRIu64 "\n", read_event->id); 1272 } 1273 1274 static struct machine *machines__find_for_cpumode(struct machines *machines, 1275 union perf_event *event, 1276 struct perf_sample *sample) 1277 { 1278 struct machine *machine; 1279 1280 if (perf_guest && 1281 ((sample->cpumode == PERF_RECORD_MISC_GUEST_KERNEL) || 1282 (sample->cpumode == PERF_RECORD_MISC_GUEST_USER))) { 1283 u32 pid; 1284 1285 if (event->header.type == PERF_RECORD_MMAP 1286 || event->header.type == PERF_RECORD_MMAP2) 1287 pid = event->mmap.pid; 1288 else 1289 pid = sample->pid; 1290 1291 machine = machines__find(machines, pid); 1292 if (!machine) 1293 machine = machines__findnew(machines, DEFAULT_GUEST_KERNEL_ID); 1294 return machine; 1295 } 1296 1297 return &machines->host; 1298 } 1299 1300 static int deliver_sample_value(struct evlist *evlist, 1301 struct perf_tool *tool, 1302 union perf_event *event, 1303 struct perf_sample *sample, 1304 struct sample_read_value *v, 1305 struct machine *machine) 1306 { 1307 struct perf_sample_id *sid = perf_evlist__id2sid(evlist, v->id); 1308 1309 if (sid) { 1310 sample->id = v->id; 1311 sample->period = v->value - sid->period; 1312 sid->period = v->value; 1313 } 1314 1315 if (!sid || sid->evsel == NULL) { 1316 ++evlist->stats.nr_unknown_id; 1317 return 0; 1318 } 1319 1320 /* 1321 * There's no reason to deliver sample 1322 * for zero period, bail out. 1323 */ 1324 if (!sample->period) 1325 return 0; 1326 1327 return tool->sample(tool, event, sample, sid->evsel, machine); 1328 } 1329 1330 static int deliver_sample_group(struct evlist *evlist, 1331 struct perf_tool *tool, 1332 union perf_event *event, 1333 struct perf_sample *sample, 1334 struct machine *machine) 1335 { 1336 int ret = -EINVAL; 1337 u64 i; 1338 1339 for (i = 0; i < sample->read.group.nr; i++) { 1340 ret = deliver_sample_value(evlist, tool, event, sample, 1341 &sample->read.group.values[i], 1342 machine); 1343 if (ret) 1344 break; 1345 } 1346 1347 return ret; 1348 } 1349 1350 static int 1351 perf_evlist__deliver_sample(struct evlist *evlist, 1352 struct perf_tool *tool, 1353 union perf_event *event, 1354 struct perf_sample *sample, 1355 struct evsel *evsel, 1356 struct machine *machine) 1357 { 1358 /* We know evsel != NULL. */ 1359 u64 sample_type = evsel->core.attr.sample_type; 1360 u64 read_format = evsel->core.attr.read_format; 1361 1362 /* Standard sample delivery. */ 1363 if (!(sample_type & PERF_SAMPLE_READ)) 1364 return tool->sample(tool, event, sample, evsel, machine); 1365 1366 /* For PERF_SAMPLE_READ we have either single or group mode. */ 1367 if (read_format & PERF_FORMAT_GROUP) 1368 return deliver_sample_group(evlist, tool, event, sample, 1369 machine); 1370 else 1371 return deliver_sample_value(evlist, tool, event, sample, 1372 &sample->read.one, machine); 1373 } 1374 1375 static int machines__deliver_event(struct machines *machines, 1376 struct evlist *evlist, 1377 union perf_event *event, 1378 struct perf_sample *sample, 1379 struct perf_tool *tool, u64 file_offset) 1380 { 1381 struct evsel *evsel; 1382 struct machine *machine; 1383 1384 dump_event(evlist, event, file_offset, sample); 1385 1386 evsel = perf_evlist__id2evsel(evlist, sample->id); 1387 1388 machine = machines__find_for_cpumode(machines, event, sample); 1389 1390 switch (event->header.type) { 1391 case PERF_RECORD_SAMPLE: 1392 if (evsel == NULL) { 1393 ++evlist->stats.nr_unknown_id; 1394 return 0; 1395 } 1396 dump_sample(evsel, event, sample); 1397 if (machine == NULL) { 1398 ++evlist->stats.nr_unprocessable_samples; 1399 return 0; 1400 } 1401 return perf_evlist__deliver_sample(evlist, tool, event, sample, evsel, machine); 1402 case PERF_RECORD_MMAP: 1403 return tool->mmap(tool, event, sample, machine); 1404 case PERF_RECORD_MMAP2: 1405 if (event->header.misc & PERF_RECORD_MISC_PROC_MAP_PARSE_TIMEOUT) 1406 ++evlist->stats.nr_proc_map_timeout; 1407 return tool->mmap2(tool, event, sample, machine); 1408 case PERF_RECORD_COMM: 1409 return tool->comm(tool, event, sample, machine); 1410 case PERF_RECORD_NAMESPACES: 1411 return tool->namespaces(tool, event, sample, machine); 1412 case PERF_RECORD_FORK: 1413 return tool->fork(tool, event, sample, machine); 1414 case PERF_RECORD_EXIT: 1415 return tool->exit(tool, event, sample, machine); 1416 case PERF_RECORD_LOST: 1417 if (tool->lost == perf_event__process_lost) 1418 evlist->stats.total_lost += event->lost.lost; 1419 return tool->lost(tool, event, sample, machine); 1420 case PERF_RECORD_LOST_SAMPLES: 1421 if (tool->lost_samples == perf_event__process_lost_samples) 1422 evlist->stats.total_lost_samples += event->lost_samples.lost; 1423 return tool->lost_samples(tool, event, sample, machine); 1424 case PERF_RECORD_READ: 1425 dump_read(evsel, event); 1426 return tool->read(tool, event, sample, evsel, machine); 1427 case PERF_RECORD_THROTTLE: 1428 return tool->throttle(tool, event, sample, machine); 1429 case PERF_RECORD_UNTHROTTLE: 1430 return tool->unthrottle(tool, event, sample, machine); 1431 case PERF_RECORD_AUX: 1432 if (tool->aux == perf_event__process_aux) { 1433 if (event->aux.flags & PERF_AUX_FLAG_TRUNCATED) 1434 evlist->stats.total_aux_lost += 1; 1435 if (event->aux.flags & PERF_AUX_FLAG_PARTIAL) 1436 evlist->stats.total_aux_partial += 1; 1437 } 1438 return tool->aux(tool, event, sample, machine); 1439 case PERF_RECORD_ITRACE_START: 1440 return tool->itrace_start(tool, event, sample, machine); 1441 case PERF_RECORD_SWITCH: 1442 case PERF_RECORD_SWITCH_CPU_WIDE: 1443 return tool->context_switch(tool, event, sample, machine); 1444 case PERF_RECORD_KSYMBOL: 1445 return tool->ksymbol(tool, event, sample, machine); 1446 case PERF_RECORD_BPF_EVENT: 1447 return tool->bpf_event(tool, event, sample, machine); 1448 default: 1449 ++evlist->stats.nr_unknown_events; 1450 return -1; 1451 } 1452 } 1453 1454 static int perf_session__deliver_event(struct perf_session *session, 1455 union perf_event *event, 1456 struct perf_tool *tool, 1457 u64 file_offset) 1458 { 1459 struct perf_sample sample; 1460 int ret; 1461 1462 ret = perf_evlist__parse_sample(session->evlist, event, &sample); 1463 if (ret) { 1464 pr_err("Can't parse sample, err = %d\n", ret); 1465 return ret; 1466 } 1467 1468 ret = auxtrace__process_event(session, event, &sample, tool); 1469 if (ret < 0) 1470 return ret; 1471 if (ret > 0) 1472 return 0; 1473 1474 return machines__deliver_event(&session->machines, session->evlist, 1475 event, &sample, tool, file_offset); 1476 } 1477 1478 static s64 perf_session__process_user_event(struct perf_session *session, 1479 union perf_event *event, 1480 u64 file_offset) 1481 { 1482 struct ordered_events *oe = &session->ordered_events; 1483 struct perf_tool *tool = session->tool; 1484 struct perf_sample sample = { .time = 0, }; 1485 int fd = perf_data__fd(session->data); 1486 int err; 1487 1488 if (event->header.type != PERF_RECORD_COMPRESSED || 1489 tool->compressed == perf_session__process_compressed_event_stub) 1490 dump_event(session->evlist, event, file_offset, &sample); 1491 1492 /* These events are processed right away */ 1493 switch (event->header.type) { 1494 case PERF_RECORD_HEADER_ATTR: 1495 err = tool->attr(tool, event, &session->evlist); 1496 if (err == 0) { 1497 perf_session__set_id_hdr_size(session); 1498 perf_session__set_comm_exec(session); 1499 } 1500 return err; 1501 case PERF_RECORD_EVENT_UPDATE: 1502 return tool->event_update(tool, event, &session->evlist); 1503 case PERF_RECORD_HEADER_EVENT_TYPE: 1504 /* 1505 * Depreceated, but we need to handle it for sake 1506 * of old data files create in pipe mode. 1507 */ 1508 return 0; 1509 case PERF_RECORD_HEADER_TRACING_DATA: 1510 /* setup for reading amidst mmap */ 1511 lseek(fd, file_offset, SEEK_SET); 1512 return tool->tracing_data(session, event); 1513 case PERF_RECORD_HEADER_BUILD_ID: 1514 return tool->build_id(session, event); 1515 case PERF_RECORD_FINISHED_ROUND: 1516 return tool->finished_round(tool, event, oe); 1517 case PERF_RECORD_ID_INDEX: 1518 return tool->id_index(session, event); 1519 case PERF_RECORD_AUXTRACE_INFO: 1520 return tool->auxtrace_info(session, event); 1521 case PERF_RECORD_AUXTRACE: 1522 /* setup for reading amidst mmap */ 1523 lseek(fd, file_offset + event->header.size, SEEK_SET); 1524 return tool->auxtrace(session, event); 1525 case PERF_RECORD_AUXTRACE_ERROR: 1526 perf_session__auxtrace_error_inc(session, event); 1527 return tool->auxtrace_error(session, event); 1528 case PERF_RECORD_THREAD_MAP: 1529 return tool->thread_map(session, event); 1530 case PERF_RECORD_CPU_MAP: 1531 return tool->cpu_map(session, event); 1532 case PERF_RECORD_STAT_CONFIG: 1533 return tool->stat_config(session, event); 1534 case PERF_RECORD_STAT: 1535 return tool->stat(session, event); 1536 case PERF_RECORD_STAT_ROUND: 1537 return tool->stat_round(session, event); 1538 case PERF_RECORD_TIME_CONV: 1539 session->time_conv = event->time_conv; 1540 return tool->time_conv(session, event); 1541 case PERF_RECORD_HEADER_FEATURE: 1542 return tool->feature(session, event); 1543 case PERF_RECORD_COMPRESSED: 1544 err = tool->compressed(session, event, file_offset); 1545 if (err) 1546 dump_event(session->evlist, event, file_offset, &sample); 1547 return err; 1548 default: 1549 return -EINVAL; 1550 } 1551 } 1552 1553 int perf_session__deliver_synth_event(struct perf_session *session, 1554 union perf_event *event, 1555 struct perf_sample *sample) 1556 { 1557 struct evlist *evlist = session->evlist; 1558 struct perf_tool *tool = session->tool; 1559 1560 events_stats__inc(&evlist->stats, event->header.type); 1561 1562 if (event->header.type >= PERF_RECORD_USER_TYPE_START) 1563 return perf_session__process_user_event(session, event, 0); 1564 1565 return machines__deliver_event(&session->machines, evlist, event, sample, tool, 0); 1566 } 1567 1568 static void event_swap(union perf_event *event, bool sample_id_all) 1569 { 1570 perf_event__swap_op swap; 1571 1572 swap = perf_event__swap_ops[event->header.type]; 1573 if (swap) 1574 swap(event, sample_id_all); 1575 } 1576 1577 int perf_session__peek_event(struct perf_session *session, off_t file_offset, 1578 void *buf, size_t buf_sz, 1579 union perf_event **event_ptr, 1580 struct perf_sample *sample) 1581 { 1582 union perf_event *event; 1583 size_t hdr_sz, rest; 1584 int fd; 1585 1586 if (session->one_mmap && !session->header.needs_swap) { 1587 event = file_offset - session->one_mmap_offset + 1588 session->one_mmap_addr; 1589 goto out_parse_sample; 1590 } 1591 1592 if (perf_data__is_pipe(session->data)) 1593 return -1; 1594 1595 fd = perf_data__fd(session->data); 1596 hdr_sz = sizeof(struct perf_event_header); 1597 1598 if (buf_sz < hdr_sz) 1599 return -1; 1600 1601 if (lseek(fd, file_offset, SEEK_SET) == (off_t)-1 || 1602 readn(fd, buf, hdr_sz) != (ssize_t)hdr_sz) 1603 return -1; 1604 1605 event = (union perf_event *)buf; 1606 1607 if (session->header.needs_swap) 1608 perf_event_header__bswap(&event->header); 1609 1610 if (event->header.size < hdr_sz || event->header.size > buf_sz) 1611 return -1; 1612 1613 rest = event->header.size - hdr_sz; 1614 1615 if (readn(fd, buf, rest) != (ssize_t)rest) 1616 return -1; 1617 1618 if (session->header.needs_swap) 1619 event_swap(event, perf_evlist__sample_id_all(session->evlist)); 1620 1621 out_parse_sample: 1622 1623 if (sample && event->header.type < PERF_RECORD_USER_TYPE_START && 1624 perf_evlist__parse_sample(session->evlist, event, sample)) 1625 return -1; 1626 1627 *event_ptr = event; 1628 1629 return 0; 1630 } 1631 1632 static s64 perf_session__process_event(struct perf_session *session, 1633 union perf_event *event, u64 file_offset) 1634 { 1635 struct evlist *evlist = session->evlist; 1636 struct perf_tool *tool = session->tool; 1637 int ret; 1638 1639 if (session->header.needs_swap) 1640 event_swap(event, perf_evlist__sample_id_all(evlist)); 1641 1642 if (event->header.type >= PERF_RECORD_HEADER_MAX) 1643 return -EINVAL; 1644 1645 events_stats__inc(&evlist->stats, event->header.type); 1646 1647 if (event->header.type >= PERF_RECORD_USER_TYPE_START) 1648 return perf_session__process_user_event(session, event, file_offset); 1649 1650 if (tool->ordered_events) { 1651 u64 timestamp = -1ULL; 1652 1653 ret = perf_evlist__parse_sample_timestamp(evlist, event, ×tamp); 1654 if (ret && ret != -1) 1655 return ret; 1656 1657 ret = perf_session__queue_event(session, event, timestamp, file_offset); 1658 if (ret != -ETIME) 1659 return ret; 1660 } 1661 1662 return perf_session__deliver_event(session, event, tool, file_offset); 1663 } 1664 1665 void perf_event_header__bswap(struct perf_event_header *hdr) 1666 { 1667 hdr->type = bswap_32(hdr->type); 1668 hdr->misc = bswap_16(hdr->misc); 1669 hdr->size = bswap_16(hdr->size); 1670 } 1671 1672 struct thread *perf_session__findnew(struct perf_session *session, pid_t pid) 1673 { 1674 return machine__findnew_thread(&session->machines.host, -1, pid); 1675 } 1676 1677 /* 1678 * Threads are identified by pid and tid, and the idle task has pid == tid == 0. 1679 * So here a single thread is created for that, but actually there is a separate 1680 * idle task per cpu, so there should be one 'struct thread' per cpu, but there 1681 * is only 1. That causes problems for some tools, requiring workarounds. For 1682 * example get_idle_thread() in builtin-sched.c, or thread_stack__per_cpu(). 1683 */ 1684 int perf_session__register_idle_thread(struct perf_session *session) 1685 { 1686 struct thread *thread; 1687 int err = 0; 1688 1689 thread = machine__findnew_thread(&session->machines.host, 0, 0); 1690 if (thread == NULL || thread__set_comm(thread, "swapper", 0)) { 1691 pr_err("problem inserting idle task.\n"); 1692 err = -1; 1693 } 1694 1695 if (thread == NULL || thread__set_namespaces(thread, 0, NULL)) { 1696 pr_err("problem inserting idle task.\n"); 1697 err = -1; 1698 } 1699 1700 /* machine__findnew_thread() got the thread, so put it */ 1701 thread__put(thread); 1702 return err; 1703 } 1704 1705 static void 1706 perf_session__warn_order(const struct perf_session *session) 1707 { 1708 const struct ordered_events *oe = &session->ordered_events; 1709 struct evsel *evsel; 1710 bool should_warn = true; 1711 1712 evlist__for_each_entry(session->evlist, evsel) { 1713 if (evsel->core.attr.write_backward) 1714 should_warn = false; 1715 } 1716 1717 if (!should_warn) 1718 return; 1719 if (oe->nr_unordered_events != 0) 1720 ui__warning("%u out of order events recorded.\n", oe->nr_unordered_events); 1721 } 1722 1723 static void perf_session__warn_about_errors(const struct perf_session *session) 1724 { 1725 const struct events_stats *stats = &session->evlist->stats; 1726 1727 if (session->tool->lost == perf_event__process_lost && 1728 stats->nr_events[PERF_RECORD_LOST] != 0) { 1729 ui__warning("Processed %d events and lost %d chunks!\n\n" 1730 "Check IO/CPU overload!\n\n", 1731 stats->nr_events[0], 1732 stats->nr_events[PERF_RECORD_LOST]); 1733 } 1734 1735 if (session->tool->lost_samples == perf_event__process_lost_samples) { 1736 double drop_rate; 1737 1738 drop_rate = (double)stats->total_lost_samples / 1739 (double) (stats->nr_events[PERF_RECORD_SAMPLE] + stats->total_lost_samples); 1740 if (drop_rate > 0.05) { 1741 ui__warning("Processed %" PRIu64 " samples and lost %3.2f%%!\n\n", 1742 stats->nr_events[PERF_RECORD_SAMPLE] + stats->total_lost_samples, 1743 drop_rate * 100.0); 1744 } 1745 } 1746 1747 if (session->tool->aux == perf_event__process_aux && 1748 stats->total_aux_lost != 0) { 1749 ui__warning("AUX data lost %" PRIu64 " times out of %u!\n\n", 1750 stats->total_aux_lost, 1751 stats->nr_events[PERF_RECORD_AUX]); 1752 } 1753 1754 if (session->tool->aux == perf_event__process_aux && 1755 stats->total_aux_partial != 0) { 1756 bool vmm_exclusive = false; 1757 1758 (void)sysfs__read_bool("module/kvm_intel/parameters/vmm_exclusive", 1759 &vmm_exclusive); 1760 1761 ui__warning("AUX data had gaps in it %" PRIu64 " times out of %u!\n\n" 1762 "Are you running a KVM guest in the background?%s\n\n", 1763 stats->total_aux_partial, 1764 stats->nr_events[PERF_RECORD_AUX], 1765 vmm_exclusive ? 1766 "\nReloading kvm_intel module with vmm_exclusive=0\n" 1767 "will reduce the gaps to only guest's timeslices." : 1768 ""); 1769 } 1770 1771 if (stats->nr_unknown_events != 0) { 1772 ui__warning("Found %u unknown events!\n\n" 1773 "Is this an older tool processing a perf.data " 1774 "file generated by a more recent tool?\n\n" 1775 "If that is not the case, consider " 1776 "reporting to linux-kernel@vger.kernel.org.\n\n", 1777 stats->nr_unknown_events); 1778 } 1779 1780 if (stats->nr_unknown_id != 0) { 1781 ui__warning("%u samples with id not present in the header\n", 1782 stats->nr_unknown_id); 1783 } 1784 1785 if (stats->nr_invalid_chains != 0) { 1786 ui__warning("Found invalid callchains!\n\n" 1787 "%u out of %u events were discarded for this reason.\n\n" 1788 "Consider reporting to linux-kernel@vger.kernel.org.\n\n", 1789 stats->nr_invalid_chains, 1790 stats->nr_events[PERF_RECORD_SAMPLE]); 1791 } 1792 1793 if (stats->nr_unprocessable_samples != 0) { 1794 ui__warning("%u unprocessable samples recorded.\n" 1795 "Do you have a KVM guest running and not using 'perf kvm'?\n", 1796 stats->nr_unprocessable_samples); 1797 } 1798 1799 perf_session__warn_order(session); 1800 1801 events_stats__auxtrace_error_warn(stats); 1802 1803 if (stats->nr_proc_map_timeout != 0) { 1804 ui__warning("%d map information files for pre-existing threads were\n" 1805 "not processed, if there are samples for addresses they\n" 1806 "will not be resolved, you may find out which are these\n" 1807 "threads by running with -v and redirecting the output\n" 1808 "to a file.\n" 1809 "The time limit to process proc map is too short?\n" 1810 "Increase it by --proc-map-timeout\n", 1811 stats->nr_proc_map_timeout); 1812 } 1813 } 1814 1815 static int perf_session__flush_thread_stack(struct thread *thread, 1816 void *p __maybe_unused) 1817 { 1818 return thread_stack__flush(thread); 1819 } 1820 1821 static int perf_session__flush_thread_stacks(struct perf_session *session) 1822 { 1823 return machines__for_each_thread(&session->machines, 1824 perf_session__flush_thread_stack, 1825 NULL); 1826 } 1827 1828 volatile int session_done; 1829 1830 static int __perf_session__process_decomp_events(struct perf_session *session); 1831 1832 static int __perf_session__process_pipe_events(struct perf_session *session) 1833 { 1834 struct ordered_events *oe = &session->ordered_events; 1835 struct perf_tool *tool = session->tool; 1836 int fd = perf_data__fd(session->data); 1837 union perf_event *event; 1838 uint32_t size, cur_size = 0; 1839 void *buf = NULL; 1840 s64 skip = 0; 1841 u64 head; 1842 ssize_t err; 1843 void *p; 1844 1845 perf_tool__fill_defaults(tool); 1846 1847 head = 0; 1848 cur_size = sizeof(union perf_event); 1849 1850 buf = malloc(cur_size); 1851 if (!buf) 1852 return -errno; 1853 ordered_events__set_copy_on_queue(oe, true); 1854 more: 1855 event = buf; 1856 err = readn(fd, event, sizeof(struct perf_event_header)); 1857 if (err <= 0) { 1858 if (err == 0) 1859 goto done; 1860 1861 pr_err("failed to read event header\n"); 1862 goto out_err; 1863 } 1864 1865 if (session->header.needs_swap) 1866 perf_event_header__bswap(&event->header); 1867 1868 size = event->header.size; 1869 if (size < sizeof(struct perf_event_header)) { 1870 pr_err("bad event header size\n"); 1871 goto out_err; 1872 } 1873 1874 if (size > cur_size) { 1875 void *new = realloc(buf, size); 1876 if (!new) { 1877 pr_err("failed to allocate memory to read event\n"); 1878 goto out_err; 1879 } 1880 buf = new; 1881 cur_size = size; 1882 event = buf; 1883 } 1884 p = event; 1885 p += sizeof(struct perf_event_header); 1886 1887 if (size - sizeof(struct perf_event_header)) { 1888 err = readn(fd, p, size - sizeof(struct perf_event_header)); 1889 if (err <= 0) { 1890 if (err == 0) { 1891 pr_err("unexpected end of event stream\n"); 1892 goto done; 1893 } 1894 1895 pr_err("failed to read event data\n"); 1896 goto out_err; 1897 } 1898 } 1899 1900 if ((skip = perf_session__process_event(session, event, head)) < 0) { 1901 pr_err("%#" PRIx64 " [%#x]: failed to process type: %d\n", 1902 head, event->header.size, event->header.type); 1903 err = -EINVAL; 1904 goto out_err; 1905 } 1906 1907 head += size; 1908 1909 if (skip > 0) 1910 head += skip; 1911 1912 err = __perf_session__process_decomp_events(session); 1913 if (err) 1914 goto out_err; 1915 1916 if (!session_done()) 1917 goto more; 1918 done: 1919 /* do the final flush for ordered samples */ 1920 err = ordered_events__flush(oe, OE_FLUSH__FINAL); 1921 if (err) 1922 goto out_err; 1923 err = auxtrace__flush_events(session, tool); 1924 if (err) 1925 goto out_err; 1926 err = perf_session__flush_thread_stacks(session); 1927 out_err: 1928 free(buf); 1929 if (!tool->no_warn) 1930 perf_session__warn_about_errors(session); 1931 ordered_events__free(&session->ordered_events); 1932 auxtrace__free_events(session); 1933 return err; 1934 } 1935 1936 static union perf_event * 1937 fetch_mmaped_event(struct perf_session *session, 1938 u64 head, size_t mmap_size, char *buf) 1939 { 1940 union perf_event *event; 1941 1942 /* 1943 * Ensure we have enough space remaining to read 1944 * the size of the event in the headers. 1945 */ 1946 if (head + sizeof(event->header) > mmap_size) 1947 return NULL; 1948 1949 event = (union perf_event *)(buf + head); 1950 1951 if (session->header.needs_swap) 1952 perf_event_header__bswap(&event->header); 1953 1954 if (head + event->header.size > mmap_size) { 1955 /* We're not fetching the event so swap back again */ 1956 if (session->header.needs_swap) 1957 perf_event_header__bswap(&event->header); 1958 return NULL; 1959 } 1960 1961 return event; 1962 } 1963 1964 static int __perf_session__process_decomp_events(struct perf_session *session) 1965 { 1966 s64 skip; 1967 u64 size, file_pos = 0; 1968 struct decomp *decomp = session->decomp_last; 1969 1970 if (!decomp) 1971 return 0; 1972 1973 while (decomp->head < decomp->size && !session_done()) { 1974 union perf_event *event = fetch_mmaped_event(session, decomp->head, decomp->size, decomp->data); 1975 1976 if (!event) 1977 break; 1978 1979 size = event->header.size; 1980 1981 if (size < sizeof(struct perf_event_header) || 1982 (skip = perf_session__process_event(session, event, file_pos)) < 0) { 1983 pr_err("%#" PRIx64 " [%#x]: failed to process type: %d\n", 1984 decomp->file_pos + decomp->head, event->header.size, event->header.type); 1985 return -EINVAL; 1986 } 1987 1988 if (skip) 1989 size += skip; 1990 1991 decomp->head += size; 1992 } 1993 1994 return 0; 1995 } 1996 1997 /* 1998 * On 64bit we can mmap the data file in one go. No need for tiny mmap 1999 * slices. On 32bit we use 32MB. 2000 */ 2001 #if BITS_PER_LONG == 64 2002 #define MMAP_SIZE ULLONG_MAX 2003 #define NUM_MMAPS 1 2004 #else 2005 #define MMAP_SIZE (32 * 1024 * 1024ULL) 2006 #define NUM_MMAPS 128 2007 #endif 2008 2009 struct reader; 2010 2011 typedef s64 (*reader_cb_t)(struct perf_session *session, 2012 union perf_event *event, 2013 u64 file_offset); 2014 2015 struct reader { 2016 int fd; 2017 u64 data_size; 2018 u64 data_offset; 2019 reader_cb_t process; 2020 }; 2021 2022 static int 2023 reader__process_events(struct reader *rd, struct perf_session *session, 2024 struct ui_progress *prog) 2025 { 2026 u64 data_size = rd->data_size; 2027 u64 head, page_offset, file_offset, file_pos, size; 2028 int err = 0, mmap_prot, mmap_flags, map_idx = 0; 2029 size_t mmap_size; 2030 char *buf, *mmaps[NUM_MMAPS]; 2031 union perf_event *event; 2032 s64 skip; 2033 2034 page_offset = page_size * (rd->data_offset / page_size); 2035 file_offset = page_offset; 2036 head = rd->data_offset - page_offset; 2037 2038 ui_progress__init_size(prog, data_size, "Processing events..."); 2039 2040 data_size += rd->data_offset; 2041 2042 mmap_size = MMAP_SIZE; 2043 if (mmap_size > data_size) { 2044 mmap_size = data_size; 2045 session->one_mmap = true; 2046 } 2047 2048 memset(mmaps, 0, sizeof(mmaps)); 2049 2050 mmap_prot = PROT_READ; 2051 mmap_flags = MAP_SHARED; 2052 2053 if (session->header.needs_swap) { 2054 mmap_prot |= PROT_WRITE; 2055 mmap_flags = MAP_PRIVATE; 2056 } 2057 remap: 2058 buf = mmap(NULL, mmap_size, mmap_prot, mmap_flags, rd->fd, 2059 file_offset); 2060 if (buf == MAP_FAILED) { 2061 pr_err("failed to mmap file\n"); 2062 err = -errno; 2063 goto out; 2064 } 2065 mmaps[map_idx] = buf; 2066 map_idx = (map_idx + 1) & (ARRAY_SIZE(mmaps) - 1); 2067 file_pos = file_offset + head; 2068 if (session->one_mmap) { 2069 session->one_mmap_addr = buf; 2070 session->one_mmap_offset = file_offset; 2071 } 2072 2073 more: 2074 event = fetch_mmaped_event(session, head, mmap_size, buf); 2075 if (!event) { 2076 if (mmaps[map_idx]) { 2077 munmap(mmaps[map_idx], mmap_size); 2078 mmaps[map_idx] = NULL; 2079 } 2080 2081 page_offset = page_size * (head / page_size); 2082 file_offset += page_offset; 2083 head -= page_offset; 2084 goto remap; 2085 } 2086 2087 size = event->header.size; 2088 2089 skip = -EINVAL; 2090 2091 if (size < sizeof(struct perf_event_header) || 2092 (skip = rd->process(session, event, file_pos)) < 0) { 2093 pr_err("%#" PRIx64 " [%#x]: failed to process type: %d [%s]\n", 2094 file_offset + head, event->header.size, 2095 event->header.type, strerror(-skip)); 2096 err = skip; 2097 goto out; 2098 } 2099 2100 if (skip) 2101 size += skip; 2102 2103 head += size; 2104 file_pos += size; 2105 2106 err = __perf_session__process_decomp_events(session); 2107 if (err) 2108 goto out; 2109 2110 ui_progress__update(prog, size); 2111 2112 if (session_done()) 2113 goto out; 2114 2115 if (file_pos < data_size) 2116 goto more; 2117 2118 out: 2119 return err; 2120 } 2121 2122 static s64 process_simple(struct perf_session *session, 2123 union perf_event *event, 2124 u64 file_offset) 2125 { 2126 return perf_session__process_event(session, event, file_offset); 2127 } 2128 2129 static int __perf_session__process_events(struct perf_session *session) 2130 { 2131 struct reader rd = { 2132 .fd = perf_data__fd(session->data), 2133 .data_size = session->header.data_size, 2134 .data_offset = session->header.data_offset, 2135 .process = process_simple, 2136 }; 2137 struct ordered_events *oe = &session->ordered_events; 2138 struct perf_tool *tool = session->tool; 2139 struct ui_progress prog; 2140 int err; 2141 2142 perf_tool__fill_defaults(tool); 2143 2144 if (rd.data_size == 0) 2145 return -1; 2146 2147 ui_progress__init_size(&prog, rd.data_size, "Processing events..."); 2148 2149 err = reader__process_events(&rd, session, &prog); 2150 if (err) 2151 goto out_err; 2152 /* do the final flush for ordered samples */ 2153 err = ordered_events__flush(oe, OE_FLUSH__FINAL); 2154 if (err) 2155 goto out_err; 2156 err = auxtrace__flush_events(session, tool); 2157 if (err) 2158 goto out_err; 2159 err = perf_session__flush_thread_stacks(session); 2160 out_err: 2161 ui_progress__finish(); 2162 if (!tool->no_warn) 2163 perf_session__warn_about_errors(session); 2164 /* 2165 * We may switching perf.data output, make ordered_events 2166 * reusable. 2167 */ 2168 ordered_events__reinit(&session->ordered_events); 2169 auxtrace__free_events(session); 2170 session->one_mmap = false; 2171 return err; 2172 } 2173 2174 int perf_session__process_events(struct perf_session *session) 2175 { 2176 if (perf_session__register_idle_thread(session) < 0) 2177 return -ENOMEM; 2178 2179 if (perf_data__is_pipe(session->data)) 2180 return __perf_session__process_pipe_events(session); 2181 2182 return __perf_session__process_events(session); 2183 } 2184 2185 bool perf_session__has_traces(struct perf_session *session, const char *msg) 2186 { 2187 struct evsel *evsel; 2188 2189 evlist__for_each_entry(session->evlist, evsel) { 2190 if (evsel->core.attr.type == PERF_TYPE_TRACEPOINT) 2191 return true; 2192 } 2193 2194 pr_err("No trace sample to read. Did you call 'perf %s'?\n", msg); 2195 return false; 2196 } 2197 2198 int map__set_kallsyms_ref_reloc_sym(struct map *map, const char *symbol_name, u64 addr) 2199 { 2200 char *bracket; 2201 struct ref_reloc_sym *ref; 2202 struct kmap *kmap; 2203 2204 ref = zalloc(sizeof(struct ref_reloc_sym)); 2205 if (ref == NULL) 2206 return -ENOMEM; 2207 2208 ref->name = strdup(symbol_name); 2209 if (ref->name == NULL) { 2210 free(ref); 2211 return -ENOMEM; 2212 } 2213 2214 bracket = strchr(ref->name, ']'); 2215 if (bracket) 2216 *bracket = '\0'; 2217 2218 ref->addr = addr; 2219 2220 kmap = map__kmap(map); 2221 if (kmap) 2222 kmap->ref_reloc_sym = ref; 2223 2224 return 0; 2225 } 2226 2227 size_t perf_session__fprintf_dsos(struct perf_session *session, FILE *fp) 2228 { 2229 return machines__fprintf_dsos(&session->machines, fp); 2230 } 2231 2232 size_t perf_session__fprintf_dsos_buildid(struct perf_session *session, FILE *fp, 2233 bool (skip)(struct dso *dso, int parm), int parm) 2234 { 2235 return machines__fprintf_dsos_buildid(&session->machines, fp, skip, parm); 2236 } 2237 2238 size_t perf_session__fprintf_nr_events(struct perf_session *session, FILE *fp) 2239 { 2240 size_t ret; 2241 const char *msg = ""; 2242 2243 if (perf_header__has_feat(&session->header, HEADER_AUXTRACE)) 2244 msg = " (excludes AUX area (e.g. instruction trace) decoded / synthesized events)"; 2245 2246 ret = fprintf(fp, "\nAggregated stats:%s\n", msg); 2247 2248 ret += events_stats__fprintf(&session->evlist->stats, fp); 2249 return ret; 2250 } 2251 2252 size_t perf_session__fprintf(struct perf_session *session, FILE *fp) 2253 { 2254 /* 2255 * FIXME: Here we have to actually print all the machines in this 2256 * session, not just the host... 2257 */ 2258 return machine__fprintf(&session->machines.host, fp); 2259 } 2260 2261 struct evsel *perf_session__find_first_evtype(struct perf_session *session, 2262 unsigned int type) 2263 { 2264 struct evsel *pos; 2265 2266 evlist__for_each_entry(session->evlist, pos) { 2267 if (pos->core.attr.type == type) 2268 return pos; 2269 } 2270 return NULL; 2271 } 2272 2273 int perf_session__cpu_bitmap(struct perf_session *session, 2274 const char *cpu_list, unsigned long *cpu_bitmap) 2275 { 2276 int i, err = -1; 2277 struct perf_cpu_map *map; 2278 2279 for (i = 0; i < PERF_TYPE_MAX; ++i) { 2280 struct evsel *evsel; 2281 2282 evsel = perf_session__find_first_evtype(session, i); 2283 if (!evsel) 2284 continue; 2285 2286 if (!(evsel->core.attr.sample_type & PERF_SAMPLE_CPU)) { 2287 pr_err("File does not contain CPU events. " 2288 "Remove -C option to proceed.\n"); 2289 return -1; 2290 } 2291 } 2292 2293 map = perf_cpu_map__new(cpu_list); 2294 if (map == NULL) { 2295 pr_err("Invalid cpu_list\n"); 2296 return -1; 2297 } 2298 2299 for (i = 0; i < map->nr; i++) { 2300 int cpu = map->map[i]; 2301 2302 if (cpu >= MAX_NR_CPUS) { 2303 pr_err("Requested CPU %d too large. " 2304 "Consider raising MAX_NR_CPUS\n", cpu); 2305 goto out_delete_map; 2306 } 2307 2308 set_bit(cpu, cpu_bitmap); 2309 } 2310 2311 err = 0; 2312 2313 out_delete_map: 2314 perf_cpu_map__put(map); 2315 return err; 2316 } 2317 2318 void perf_session__fprintf_info(struct perf_session *session, FILE *fp, 2319 bool full) 2320 { 2321 if (session == NULL || fp == NULL) 2322 return; 2323 2324 fprintf(fp, "# ========\n"); 2325 perf_header__fprintf_info(session, fp, full); 2326 fprintf(fp, "# ========\n#\n"); 2327 } 2328 2329 2330 int __perf_session__set_tracepoints_handlers(struct perf_session *session, 2331 const struct evsel_str_handler *assocs, 2332 size_t nr_assocs) 2333 { 2334 struct evsel *evsel; 2335 size_t i; 2336 int err; 2337 2338 for (i = 0; i < nr_assocs; i++) { 2339 /* 2340 * Adding a handler for an event not in the session, 2341 * just ignore it. 2342 */ 2343 evsel = perf_evlist__find_tracepoint_by_name(session->evlist, assocs[i].name); 2344 if (evsel == NULL) 2345 continue; 2346 2347 err = -EEXIST; 2348 if (evsel->handler != NULL) 2349 goto out; 2350 evsel->handler = assocs[i].handler; 2351 } 2352 2353 err = 0; 2354 out: 2355 return err; 2356 } 2357 2358 int perf_event__process_id_index(struct perf_session *session, 2359 union perf_event *event) 2360 { 2361 struct evlist *evlist = session->evlist; 2362 struct id_index_event *ie = &event->id_index; 2363 size_t i, nr, max_nr; 2364 2365 max_nr = (ie->header.size - sizeof(struct id_index_event)) / 2366 sizeof(struct id_index_entry); 2367 nr = ie->nr; 2368 if (nr > max_nr) 2369 return -EINVAL; 2370 2371 if (dump_trace) 2372 fprintf(stdout, " nr: %zu\n", nr); 2373 2374 for (i = 0; i < nr; i++) { 2375 struct id_index_entry *e = &ie->entries[i]; 2376 struct perf_sample_id *sid; 2377 2378 if (dump_trace) { 2379 fprintf(stdout, " ... id: %"PRIu64, e->id); 2380 fprintf(stdout, " idx: %"PRIu64, e->idx); 2381 fprintf(stdout, " cpu: %"PRId64, e->cpu); 2382 fprintf(stdout, " tid: %"PRId64"\n", e->tid); 2383 } 2384 2385 sid = perf_evlist__id2sid(evlist, e->id); 2386 if (!sid) 2387 return -ENOENT; 2388 sid->idx = e->idx; 2389 sid->cpu = e->cpu; 2390 sid->tid = e->tid; 2391 } 2392 return 0; 2393 } 2394 2395 int perf_event__synthesize_id_index(struct perf_tool *tool, 2396 perf_event__handler_t process, 2397 struct evlist *evlist, 2398 struct machine *machine) 2399 { 2400 union perf_event *ev; 2401 struct evsel *evsel; 2402 size_t nr = 0, i = 0, sz, max_nr, n; 2403 int err; 2404 2405 pr_debug2("Synthesizing id index\n"); 2406 2407 max_nr = (UINT16_MAX - sizeof(struct id_index_event)) / 2408 sizeof(struct id_index_entry); 2409 2410 evlist__for_each_entry(evlist, evsel) 2411 nr += evsel->ids; 2412 2413 n = nr > max_nr ? max_nr : nr; 2414 sz = sizeof(struct id_index_event) + n * sizeof(struct id_index_entry); 2415 ev = zalloc(sz); 2416 if (!ev) 2417 return -ENOMEM; 2418 2419 ev->id_index.header.type = PERF_RECORD_ID_INDEX; 2420 ev->id_index.header.size = sz; 2421 ev->id_index.nr = n; 2422 2423 evlist__for_each_entry(evlist, evsel) { 2424 u32 j; 2425 2426 for (j = 0; j < evsel->ids; j++) { 2427 struct id_index_entry *e; 2428 struct perf_sample_id *sid; 2429 2430 if (i >= n) { 2431 err = process(tool, ev, NULL, machine); 2432 if (err) 2433 goto out_err; 2434 nr -= n; 2435 i = 0; 2436 } 2437 2438 e = &ev->id_index.entries[i++]; 2439 2440 e->id = evsel->id[j]; 2441 2442 sid = perf_evlist__id2sid(evlist, e->id); 2443 if (!sid) { 2444 free(ev); 2445 return -ENOENT; 2446 } 2447 2448 e->idx = sid->idx; 2449 e->cpu = sid->cpu; 2450 e->tid = sid->tid; 2451 } 2452 } 2453 2454 sz = sizeof(struct id_index_event) + nr * sizeof(struct id_index_entry); 2455 ev->id_index.header.size = sz; 2456 ev->id_index.nr = nr; 2457 2458 err = process(tool, ev, NULL, machine); 2459 out_err: 2460 free(ev); 2461 2462 return err; 2463 } 2464