1 #include <linux/kernel.h> 2 #include <traceevent/event-parse.h> 3 4 #include <byteswap.h> 5 #include <unistd.h> 6 #include <sys/types.h> 7 #include <sys/mman.h> 8 9 #include "evlist.h" 10 #include "evsel.h" 11 #include "session.h" 12 #include "tool.h" 13 #include "sort.h" 14 #include "util.h" 15 #include "cpumap.h" 16 #include "perf_regs.h" 17 #include "asm/bug.h" 18 #include "auxtrace.h" 19 #include "thread-stack.h" 20 #include "stat.h" 21 22 static int perf_session__deliver_event(struct perf_session *session, 23 union perf_event *event, 24 struct perf_sample *sample, 25 struct perf_tool *tool, 26 u64 file_offset); 27 28 static int perf_session__open(struct perf_session *session) 29 { 30 struct perf_data_file *file = session->file; 31 32 if (perf_session__read_header(session) < 0) { 33 pr_err("incompatible file format (rerun with -v to learn more)\n"); 34 return -1; 35 } 36 37 if (perf_data_file__is_pipe(file)) 38 return 0; 39 40 if (perf_header__has_feat(&session->header, HEADER_STAT)) 41 return 0; 42 43 if (!perf_evlist__valid_sample_type(session->evlist)) { 44 pr_err("non matching sample_type\n"); 45 return -1; 46 } 47 48 if (!perf_evlist__valid_sample_id_all(session->evlist)) { 49 pr_err("non matching sample_id_all\n"); 50 return -1; 51 } 52 53 if (!perf_evlist__valid_read_format(session->evlist)) { 54 pr_err("non matching read_format\n"); 55 return -1; 56 } 57 58 return 0; 59 } 60 61 void perf_session__set_id_hdr_size(struct perf_session *session) 62 { 63 u16 id_hdr_size = perf_evlist__id_hdr_size(session->evlist); 64 65 machines__set_id_hdr_size(&session->machines, id_hdr_size); 66 } 67 68 int perf_session__create_kernel_maps(struct perf_session *session) 69 { 70 int ret = machine__create_kernel_maps(&session->machines.host); 71 72 if (ret >= 0) 73 ret = machines__create_guest_kernel_maps(&session->machines); 74 return ret; 75 } 76 77 static void perf_session__destroy_kernel_maps(struct perf_session *session) 78 { 79 machines__destroy_kernel_maps(&session->machines); 80 } 81 82 static bool perf_session__has_comm_exec(struct perf_session *session) 83 { 84 struct perf_evsel *evsel; 85 86 evlist__for_each(session->evlist, evsel) { 87 if (evsel->attr.comm_exec) 88 return true; 89 } 90 91 return false; 92 } 93 94 static void perf_session__set_comm_exec(struct perf_session *session) 95 { 96 bool comm_exec = perf_session__has_comm_exec(session); 97 98 machines__set_comm_exec(&session->machines, comm_exec); 99 } 100 101 static int ordered_events__deliver_event(struct ordered_events *oe, 102 struct ordered_event *event) 103 { 104 struct perf_sample sample; 105 struct perf_session *session = container_of(oe, struct perf_session, 106 ordered_events); 107 int ret = perf_evlist__parse_sample(session->evlist, event->event, &sample); 108 109 if (ret) { 110 pr_err("Can't parse sample, err = %d\n", ret); 111 return ret; 112 } 113 114 return perf_session__deliver_event(session, event->event, &sample, 115 session->tool, event->file_offset); 116 } 117 118 struct perf_session *perf_session__new(struct perf_data_file *file, 119 bool repipe, struct perf_tool *tool) 120 { 121 struct perf_session *session = zalloc(sizeof(*session)); 122 123 if (!session) 124 goto out; 125 126 session->repipe = repipe; 127 session->tool = tool; 128 INIT_LIST_HEAD(&session->auxtrace_index); 129 machines__init(&session->machines); 130 ordered_events__init(&session->ordered_events, ordered_events__deliver_event); 131 132 if (file) { 133 if (perf_data_file__open(file)) 134 goto out_delete; 135 136 session->file = file; 137 138 if (perf_data_file__is_read(file)) { 139 if (perf_session__open(session) < 0) 140 goto out_close; 141 142 perf_session__set_id_hdr_size(session); 143 perf_session__set_comm_exec(session); 144 } 145 } else { 146 session->machines.host.env = &perf_env; 147 } 148 149 if (!file || perf_data_file__is_write(file)) { 150 /* 151 * In O_RDONLY mode this will be performed when reading the 152 * kernel MMAP event, in perf_event__process_mmap(). 153 */ 154 if (perf_session__create_kernel_maps(session) < 0) 155 pr_warning("Cannot read kernel map\n"); 156 } 157 158 if (tool && tool->ordering_requires_timestamps && 159 tool->ordered_events && !perf_evlist__sample_id_all(session->evlist)) { 160 dump_printf("WARNING: No sample_id_all support, falling back to unordered processing\n"); 161 tool->ordered_events = false; 162 } 163 164 return session; 165 166 out_close: 167 perf_data_file__close(file); 168 out_delete: 169 perf_session__delete(session); 170 out: 171 return NULL; 172 } 173 174 static void perf_session__delete_threads(struct perf_session *session) 175 { 176 machine__delete_threads(&session->machines.host); 177 } 178 179 void perf_session__delete(struct perf_session *session) 180 { 181 auxtrace__free(session); 182 auxtrace_index__free(&session->auxtrace_index); 183 perf_session__destroy_kernel_maps(session); 184 perf_session__delete_threads(session); 185 perf_env__exit(&session->header.env); 186 machines__exit(&session->machines); 187 if (session->file) 188 perf_data_file__close(session->file); 189 free(session); 190 } 191 192 static int process_event_synth_tracing_data_stub(struct perf_tool *tool 193 __maybe_unused, 194 union perf_event *event 195 __maybe_unused, 196 struct perf_session *session 197 __maybe_unused) 198 { 199 dump_printf(": unhandled!\n"); 200 return 0; 201 } 202 203 static int process_event_synth_attr_stub(struct perf_tool *tool __maybe_unused, 204 union perf_event *event __maybe_unused, 205 struct perf_evlist **pevlist 206 __maybe_unused) 207 { 208 dump_printf(": unhandled!\n"); 209 return 0; 210 } 211 212 static int process_event_synth_event_update_stub(struct perf_tool *tool __maybe_unused, 213 union perf_event *event __maybe_unused, 214 struct perf_evlist **pevlist 215 __maybe_unused) 216 { 217 if (dump_trace) 218 perf_event__fprintf_event_update(event, stdout); 219 220 dump_printf(": unhandled!\n"); 221 return 0; 222 } 223 224 static int process_event_sample_stub(struct perf_tool *tool __maybe_unused, 225 union perf_event *event __maybe_unused, 226 struct perf_sample *sample __maybe_unused, 227 struct perf_evsel *evsel __maybe_unused, 228 struct machine *machine __maybe_unused) 229 { 230 dump_printf(": unhandled!\n"); 231 return 0; 232 } 233 234 static int process_event_stub(struct perf_tool *tool __maybe_unused, 235 union perf_event *event __maybe_unused, 236 struct perf_sample *sample __maybe_unused, 237 struct machine *machine __maybe_unused) 238 { 239 dump_printf(": unhandled!\n"); 240 return 0; 241 } 242 243 static int process_finished_round_stub(struct perf_tool *tool __maybe_unused, 244 union perf_event *event __maybe_unused, 245 struct ordered_events *oe __maybe_unused) 246 { 247 dump_printf(": unhandled!\n"); 248 return 0; 249 } 250 251 static int process_finished_round(struct perf_tool *tool, 252 union perf_event *event, 253 struct ordered_events *oe); 254 255 static int skipn(int fd, off_t n) 256 { 257 char buf[4096]; 258 ssize_t ret; 259 260 while (n > 0) { 261 ret = read(fd, buf, min(n, (off_t)sizeof(buf))); 262 if (ret <= 0) 263 return ret; 264 n -= ret; 265 } 266 267 return 0; 268 } 269 270 static s64 process_event_auxtrace_stub(struct perf_tool *tool __maybe_unused, 271 union perf_event *event, 272 struct perf_session *session 273 __maybe_unused) 274 { 275 dump_printf(": unhandled!\n"); 276 if (perf_data_file__is_pipe(session->file)) 277 skipn(perf_data_file__fd(session->file), event->auxtrace.size); 278 return event->auxtrace.size; 279 } 280 281 static int process_event_op2_stub(struct perf_tool *tool __maybe_unused, 282 union perf_event *event __maybe_unused, 283 struct perf_session *session __maybe_unused) 284 { 285 dump_printf(": unhandled!\n"); 286 return 0; 287 } 288 289 290 static 291 int process_event_thread_map_stub(struct perf_tool *tool __maybe_unused, 292 union perf_event *event __maybe_unused, 293 struct perf_session *session __maybe_unused) 294 { 295 if (dump_trace) 296 perf_event__fprintf_thread_map(event, stdout); 297 298 dump_printf(": unhandled!\n"); 299 return 0; 300 } 301 302 static 303 int process_event_cpu_map_stub(struct perf_tool *tool __maybe_unused, 304 union perf_event *event __maybe_unused, 305 struct perf_session *session __maybe_unused) 306 { 307 if (dump_trace) 308 perf_event__fprintf_cpu_map(event, stdout); 309 310 dump_printf(": unhandled!\n"); 311 return 0; 312 } 313 314 static 315 int process_event_stat_config_stub(struct perf_tool *tool __maybe_unused, 316 union perf_event *event __maybe_unused, 317 struct perf_session *session __maybe_unused) 318 { 319 if (dump_trace) 320 perf_event__fprintf_stat_config(event, stdout); 321 322 dump_printf(": unhandled!\n"); 323 return 0; 324 } 325 326 static int process_stat_stub(struct perf_tool *tool __maybe_unused, 327 union perf_event *event __maybe_unused, 328 struct perf_session *perf_session 329 __maybe_unused) 330 { 331 if (dump_trace) 332 perf_event__fprintf_stat(event, stdout); 333 334 dump_printf(": unhandled!\n"); 335 return 0; 336 } 337 338 static int process_stat_round_stub(struct perf_tool *tool __maybe_unused, 339 union perf_event *event __maybe_unused, 340 struct perf_session *perf_session 341 __maybe_unused) 342 { 343 if (dump_trace) 344 perf_event__fprintf_stat_round(event, stdout); 345 346 dump_printf(": unhandled!\n"); 347 return 0; 348 } 349 350 void perf_tool__fill_defaults(struct perf_tool *tool) 351 { 352 if (tool->sample == NULL) 353 tool->sample = process_event_sample_stub; 354 if (tool->mmap == NULL) 355 tool->mmap = process_event_stub; 356 if (tool->mmap2 == NULL) 357 tool->mmap2 = process_event_stub; 358 if (tool->comm == NULL) 359 tool->comm = process_event_stub; 360 if (tool->fork == NULL) 361 tool->fork = process_event_stub; 362 if (tool->exit == NULL) 363 tool->exit = process_event_stub; 364 if (tool->lost == NULL) 365 tool->lost = perf_event__process_lost; 366 if (tool->lost_samples == NULL) 367 tool->lost_samples = perf_event__process_lost_samples; 368 if (tool->aux == NULL) 369 tool->aux = perf_event__process_aux; 370 if (tool->itrace_start == NULL) 371 tool->itrace_start = perf_event__process_itrace_start; 372 if (tool->context_switch == NULL) 373 tool->context_switch = perf_event__process_switch; 374 if (tool->read == NULL) 375 tool->read = process_event_sample_stub; 376 if (tool->throttle == NULL) 377 tool->throttle = process_event_stub; 378 if (tool->unthrottle == NULL) 379 tool->unthrottle = process_event_stub; 380 if (tool->attr == NULL) 381 tool->attr = process_event_synth_attr_stub; 382 if (tool->event_update == NULL) 383 tool->event_update = process_event_synth_event_update_stub; 384 if (tool->tracing_data == NULL) 385 tool->tracing_data = process_event_synth_tracing_data_stub; 386 if (tool->build_id == NULL) 387 tool->build_id = process_event_op2_stub; 388 if (tool->finished_round == NULL) { 389 if (tool->ordered_events) 390 tool->finished_round = process_finished_round; 391 else 392 tool->finished_round = process_finished_round_stub; 393 } 394 if (tool->id_index == NULL) 395 tool->id_index = process_event_op2_stub; 396 if (tool->auxtrace_info == NULL) 397 tool->auxtrace_info = process_event_op2_stub; 398 if (tool->auxtrace == NULL) 399 tool->auxtrace = process_event_auxtrace_stub; 400 if (tool->auxtrace_error == NULL) 401 tool->auxtrace_error = process_event_op2_stub; 402 if (tool->thread_map == NULL) 403 tool->thread_map = process_event_thread_map_stub; 404 if (tool->cpu_map == NULL) 405 tool->cpu_map = process_event_cpu_map_stub; 406 if (tool->stat_config == NULL) 407 tool->stat_config = process_event_stat_config_stub; 408 if (tool->stat == NULL) 409 tool->stat = process_stat_stub; 410 if (tool->stat_round == NULL) 411 tool->stat_round = process_stat_round_stub; 412 if (tool->time_conv == NULL) 413 tool->time_conv = process_event_op2_stub; 414 } 415 416 static void swap_sample_id_all(union perf_event *event, void *data) 417 { 418 void *end = (void *) event + event->header.size; 419 int size = end - data; 420 421 BUG_ON(size % sizeof(u64)); 422 mem_bswap_64(data, size); 423 } 424 425 static void perf_event__all64_swap(union perf_event *event, 426 bool sample_id_all __maybe_unused) 427 { 428 struct perf_event_header *hdr = &event->header; 429 mem_bswap_64(hdr + 1, event->header.size - sizeof(*hdr)); 430 } 431 432 static void perf_event__comm_swap(union perf_event *event, bool sample_id_all) 433 { 434 event->comm.pid = bswap_32(event->comm.pid); 435 event->comm.tid = bswap_32(event->comm.tid); 436 437 if (sample_id_all) { 438 void *data = &event->comm.comm; 439 440 data += PERF_ALIGN(strlen(data) + 1, sizeof(u64)); 441 swap_sample_id_all(event, data); 442 } 443 } 444 445 static void perf_event__mmap_swap(union perf_event *event, 446 bool sample_id_all) 447 { 448 event->mmap.pid = bswap_32(event->mmap.pid); 449 event->mmap.tid = bswap_32(event->mmap.tid); 450 event->mmap.start = bswap_64(event->mmap.start); 451 event->mmap.len = bswap_64(event->mmap.len); 452 event->mmap.pgoff = bswap_64(event->mmap.pgoff); 453 454 if (sample_id_all) { 455 void *data = &event->mmap.filename; 456 457 data += PERF_ALIGN(strlen(data) + 1, sizeof(u64)); 458 swap_sample_id_all(event, data); 459 } 460 } 461 462 static void perf_event__mmap2_swap(union perf_event *event, 463 bool sample_id_all) 464 { 465 event->mmap2.pid = bswap_32(event->mmap2.pid); 466 event->mmap2.tid = bswap_32(event->mmap2.tid); 467 event->mmap2.start = bswap_64(event->mmap2.start); 468 event->mmap2.len = bswap_64(event->mmap2.len); 469 event->mmap2.pgoff = bswap_64(event->mmap2.pgoff); 470 event->mmap2.maj = bswap_32(event->mmap2.maj); 471 event->mmap2.min = bswap_32(event->mmap2.min); 472 event->mmap2.ino = bswap_64(event->mmap2.ino); 473 474 if (sample_id_all) { 475 void *data = &event->mmap2.filename; 476 477 data += PERF_ALIGN(strlen(data) + 1, sizeof(u64)); 478 swap_sample_id_all(event, data); 479 } 480 } 481 static void perf_event__task_swap(union perf_event *event, bool sample_id_all) 482 { 483 event->fork.pid = bswap_32(event->fork.pid); 484 event->fork.tid = bswap_32(event->fork.tid); 485 event->fork.ppid = bswap_32(event->fork.ppid); 486 event->fork.ptid = bswap_32(event->fork.ptid); 487 event->fork.time = bswap_64(event->fork.time); 488 489 if (sample_id_all) 490 swap_sample_id_all(event, &event->fork + 1); 491 } 492 493 static void perf_event__read_swap(union perf_event *event, bool sample_id_all) 494 { 495 event->read.pid = bswap_32(event->read.pid); 496 event->read.tid = bswap_32(event->read.tid); 497 event->read.value = bswap_64(event->read.value); 498 event->read.time_enabled = bswap_64(event->read.time_enabled); 499 event->read.time_running = bswap_64(event->read.time_running); 500 event->read.id = bswap_64(event->read.id); 501 502 if (sample_id_all) 503 swap_sample_id_all(event, &event->read + 1); 504 } 505 506 static void perf_event__aux_swap(union perf_event *event, bool sample_id_all) 507 { 508 event->aux.aux_offset = bswap_64(event->aux.aux_offset); 509 event->aux.aux_size = bswap_64(event->aux.aux_size); 510 event->aux.flags = bswap_64(event->aux.flags); 511 512 if (sample_id_all) 513 swap_sample_id_all(event, &event->aux + 1); 514 } 515 516 static void perf_event__itrace_start_swap(union perf_event *event, 517 bool sample_id_all) 518 { 519 event->itrace_start.pid = bswap_32(event->itrace_start.pid); 520 event->itrace_start.tid = bswap_32(event->itrace_start.tid); 521 522 if (sample_id_all) 523 swap_sample_id_all(event, &event->itrace_start + 1); 524 } 525 526 static void perf_event__switch_swap(union perf_event *event, bool sample_id_all) 527 { 528 if (event->header.type == PERF_RECORD_SWITCH_CPU_WIDE) { 529 event->context_switch.next_prev_pid = 530 bswap_32(event->context_switch.next_prev_pid); 531 event->context_switch.next_prev_tid = 532 bswap_32(event->context_switch.next_prev_tid); 533 } 534 535 if (sample_id_all) 536 swap_sample_id_all(event, &event->context_switch + 1); 537 } 538 539 static void perf_event__throttle_swap(union perf_event *event, 540 bool sample_id_all) 541 { 542 event->throttle.time = bswap_64(event->throttle.time); 543 event->throttle.id = bswap_64(event->throttle.id); 544 event->throttle.stream_id = bswap_64(event->throttle.stream_id); 545 546 if (sample_id_all) 547 swap_sample_id_all(event, &event->throttle + 1); 548 } 549 550 static u8 revbyte(u8 b) 551 { 552 int rev = (b >> 4) | ((b & 0xf) << 4); 553 rev = ((rev & 0xcc) >> 2) | ((rev & 0x33) << 2); 554 rev = ((rev & 0xaa) >> 1) | ((rev & 0x55) << 1); 555 return (u8) rev; 556 } 557 558 /* 559 * XXX this is hack in attempt to carry flags bitfield 560 * throught endian village. ABI says: 561 * 562 * Bit-fields are allocated from right to left (least to most significant) 563 * on little-endian implementations and from left to right (most to least 564 * significant) on big-endian implementations. 565 * 566 * The above seems to be byte specific, so we need to reverse each 567 * byte of the bitfield. 'Internet' also says this might be implementation 568 * specific and we probably need proper fix and carry perf_event_attr 569 * bitfield flags in separate data file FEAT_ section. Thought this seems 570 * to work for now. 571 */ 572 static void swap_bitfield(u8 *p, unsigned len) 573 { 574 unsigned i; 575 576 for (i = 0; i < len; i++) { 577 *p = revbyte(*p); 578 p++; 579 } 580 } 581 582 /* exported for swapping attributes in file header */ 583 void perf_event__attr_swap(struct perf_event_attr *attr) 584 { 585 attr->type = bswap_32(attr->type); 586 attr->size = bswap_32(attr->size); 587 588 #define bswap_safe(f, n) \ 589 (attr->size > (offsetof(struct perf_event_attr, f) + \ 590 sizeof(attr->f) * (n))) 591 #define bswap_field(f, sz) \ 592 do { \ 593 if (bswap_safe(f, 0)) \ 594 attr->f = bswap_##sz(attr->f); \ 595 } while(0) 596 #define bswap_field_16(f) bswap_field(f, 16) 597 #define bswap_field_32(f) bswap_field(f, 32) 598 #define bswap_field_64(f) bswap_field(f, 64) 599 600 bswap_field_64(config); 601 bswap_field_64(sample_period); 602 bswap_field_64(sample_type); 603 bswap_field_64(read_format); 604 bswap_field_32(wakeup_events); 605 bswap_field_32(bp_type); 606 bswap_field_64(bp_addr); 607 bswap_field_64(bp_len); 608 bswap_field_64(branch_sample_type); 609 bswap_field_64(sample_regs_user); 610 bswap_field_32(sample_stack_user); 611 bswap_field_32(aux_watermark); 612 bswap_field_16(sample_max_stack); 613 614 /* 615 * After read_format are bitfields. Check read_format because 616 * we are unable to use offsetof on bitfield. 617 */ 618 if (bswap_safe(read_format, 1)) 619 swap_bitfield((u8 *) (&attr->read_format + 1), 620 sizeof(u64)); 621 #undef bswap_field_64 622 #undef bswap_field_32 623 #undef bswap_field 624 #undef bswap_safe 625 } 626 627 static void perf_event__hdr_attr_swap(union perf_event *event, 628 bool sample_id_all __maybe_unused) 629 { 630 size_t size; 631 632 perf_event__attr_swap(&event->attr.attr); 633 634 size = event->header.size; 635 size -= (void *)&event->attr.id - (void *)event; 636 mem_bswap_64(event->attr.id, size); 637 } 638 639 static void perf_event__event_update_swap(union perf_event *event, 640 bool sample_id_all __maybe_unused) 641 { 642 event->event_update.type = bswap_64(event->event_update.type); 643 event->event_update.id = bswap_64(event->event_update.id); 644 } 645 646 static void perf_event__event_type_swap(union perf_event *event, 647 bool sample_id_all __maybe_unused) 648 { 649 event->event_type.event_type.event_id = 650 bswap_64(event->event_type.event_type.event_id); 651 } 652 653 static void perf_event__tracing_data_swap(union perf_event *event, 654 bool sample_id_all __maybe_unused) 655 { 656 event->tracing_data.size = bswap_32(event->tracing_data.size); 657 } 658 659 static void perf_event__auxtrace_info_swap(union perf_event *event, 660 bool sample_id_all __maybe_unused) 661 { 662 size_t size; 663 664 event->auxtrace_info.type = bswap_32(event->auxtrace_info.type); 665 666 size = event->header.size; 667 size -= (void *)&event->auxtrace_info.priv - (void *)event; 668 mem_bswap_64(event->auxtrace_info.priv, size); 669 } 670 671 static void perf_event__auxtrace_swap(union perf_event *event, 672 bool sample_id_all __maybe_unused) 673 { 674 event->auxtrace.size = bswap_64(event->auxtrace.size); 675 event->auxtrace.offset = bswap_64(event->auxtrace.offset); 676 event->auxtrace.reference = bswap_64(event->auxtrace.reference); 677 event->auxtrace.idx = bswap_32(event->auxtrace.idx); 678 event->auxtrace.tid = bswap_32(event->auxtrace.tid); 679 event->auxtrace.cpu = bswap_32(event->auxtrace.cpu); 680 } 681 682 static void perf_event__auxtrace_error_swap(union perf_event *event, 683 bool sample_id_all __maybe_unused) 684 { 685 event->auxtrace_error.type = bswap_32(event->auxtrace_error.type); 686 event->auxtrace_error.code = bswap_32(event->auxtrace_error.code); 687 event->auxtrace_error.cpu = bswap_32(event->auxtrace_error.cpu); 688 event->auxtrace_error.pid = bswap_32(event->auxtrace_error.pid); 689 event->auxtrace_error.tid = bswap_32(event->auxtrace_error.tid); 690 event->auxtrace_error.ip = bswap_64(event->auxtrace_error.ip); 691 } 692 693 static void perf_event__thread_map_swap(union perf_event *event, 694 bool sample_id_all __maybe_unused) 695 { 696 unsigned i; 697 698 event->thread_map.nr = bswap_64(event->thread_map.nr); 699 700 for (i = 0; i < event->thread_map.nr; i++) 701 event->thread_map.entries[i].pid = bswap_64(event->thread_map.entries[i].pid); 702 } 703 704 static void perf_event__cpu_map_swap(union perf_event *event, 705 bool sample_id_all __maybe_unused) 706 { 707 struct cpu_map_data *data = &event->cpu_map.data; 708 struct cpu_map_entries *cpus; 709 struct cpu_map_mask *mask; 710 unsigned i; 711 712 data->type = bswap_64(data->type); 713 714 switch (data->type) { 715 case PERF_CPU_MAP__CPUS: 716 cpus = (struct cpu_map_entries *)data->data; 717 718 cpus->nr = bswap_16(cpus->nr); 719 720 for (i = 0; i < cpus->nr; i++) 721 cpus->cpu[i] = bswap_16(cpus->cpu[i]); 722 break; 723 case PERF_CPU_MAP__MASK: 724 mask = (struct cpu_map_mask *) data->data; 725 726 mask->nr = bswap_16(mask->nr); 727 mask->long_size = bswap_16(mask->long_size); 728 729 switch (mask->long_size) { 730 case 4: mem_bswap_32(&mask->mask, mask->nr); break; 731 case 8: mem_bswap_64(&mask->mask, mask->nr); break; 732 default: 733 pr_err("cpu_map swap: unsupported long size\n"); 734 } 735 default: 736 break; 737 } 738 } 739 740 static void perf_event__stat_config_swap(union perf_event *event, 741 bool sample_id_all __maybe_unused) 742 { 743 u64 size; 744 745 size = event->stat_config.nr * sizeof(event->stat_config.data[0]); 746 size += 1; /* nr item itself */ 747 mem_bswap_64(&event->stat_config.nr, size); 748 } 749 750 static void perf_event__stat_swap(union perf_event *event, 751 bool sample_id_all __maybe_unused) 752 { 753 event->stat.id = bswap_64(event->stat.id); 754 event->stat.thread = bswap_32(event->stat.thread); 755 event->stat.cpu = bswap_32(event->stat.cpu); 756 event->stat.val = bswap_64(event->stat.val); 757 event->stat.ena = bswap_64(event->stat.ena); 758 event->stat.run = bswap_64(event->stat.run); 759 } 760 761 static void perf_event__stat_round_swap(union perf_event *event, 762 bool sample_id_all __maybe_unused) 763 { 764 event->stat_round.type = bswap_64(event->stat_round.type); 765 event->stat_round.time = bswap_64(event->stat_round.time); 766 } 767 768 typedef void (*perf_event__swap_op)(union perf_event *event, 769 bool sample_id_all); 770 771 static perf_event__swap_op perf_event__swap_ops[] = { 772 [PERF_RECORD_MMAP] = perf_event__mmap_swap, 773 [PERF_RECORD_MMAP2] = perf_event__mmap2_swap, 774 [PERF_RECORD_COMM] = perf_event__comm_swap, 775 [PERF_RECORD_FORK] = perf_event__task_swap, 776 [PERF_RECORD_EXIT] = perf_event__task_swap, 777 [PERF_RECORD_LOST] = perf_event__all64_swap, 778 [PERF_RECORD_READ] = perf_event__read_swap, 779 [PERF_RECORD_THROTTLE] = perf_event__throttle_swap, 780 [PERF_RECORD_UNTHROTTLE] = perf_event__throttle_swap, 781 [PERF_RECORD_SAMPLE] = perf_event__all64_swap, 782 [PERF_RECORD_AUX] = perf_event__aux_swap, 783 [PERF_RECORD_ITRACE_START] = perf_event__itrace_start_swap, 784 [PERF_RECORD_LOST_SAMPLES] = perf_event__all64_swap, 785 [PERF_RECORD_SWITCH] = perf_event__switch_swap, 786 [PERF_RECORD_SWITCH_CPU_WIDE] = perf_event__switch_swap, 787 [PERF_RECORD_HEADER_ATTR] = perf_event__hdr_attr_swap, 788 [PERF_RECORD_HEADER_EVENT_TYPE] = perf_event__event_type_swap, 789 [PERF_RECORD_HEADER_TRACING_DATA] = perf_event__tracing_data_swap, 790 [PERF_RECORD_HEADER_BUILD_ID] = NULL, 791 [PERF_RECORD_ID_INDEX] = perf_event__all64_swap, 792 [PERF_RECORD_AUXTRACE_INFO] = perf_event__auxtrace_info_swap, 793 [PERF_RECORD_AUXTRACE] = perf_event__auxtrace_swap, 794 [PERF_RECORD_AUXTRACE_ERROR] = perf_event__auxtrace_error_swap, 795 [PERF_RECORD_THREAD_MAP] = perf_event__thread_map_swap, 796 [PERF_RECORD_CPU_MAP] = perf_event__cpu_map_swap, 797 [PERF_RECORD_STAT_CONFIG] = perf_event__stat_config_swap, 798 [PERF_RECORD_STAT] = perf_event__stat_swap, 799 [PERF_RECORD_STAT_ROUND] = perf_event__stat_round_swap, 800 [PERF_RECORD_EVENT_UPDATE] = perf_event__event_update_swap, 801 [PERF_RECORD_TIME_CONV] = perf_event__all64_swap, 802 [PERF_RECORD_HEADER_MAX] = NULL, 803 }; 804 805 /* 806 * When perf record finishes a pass on every buffers, it records this pseudo 807 * event. 808 * We record the max timestamp t found in the pass n. 809 * Assuming these timestamps are monotonic across cpus, we know that if 810 * a buffer still has events with timestamps below t, they will be all 811 * available and then read in the pass n + 1. 812 * Hence when we start to read the pass n + 2, we can safely flush every 813 * events with timestamps below t. 814 * 815 * ============ PASS n ================= 816 * CPU 0 | CPU 1 817 * | 818 * cnt1 timestamps | cnt2 timestamps 819 * 1 | 2 820 * 2 | 3 821 * - | 4 <--- max recorded 822 * 823 * ============ PASS n + 1 ============== 824 * CPU 0 | CPU 1 825 * | 826 * cnt1 timestamps | cnt2 timestamps 827 * 3 | 5 828 * 4 | 6 829 * 5 | 7 <---- max recorded 830 * 831 * Flush every events below timestamp 4 832 * 833 * ============ PASS n + 2 ============== 834 * CPU 0 | CPU 1 835 * | 836 * cnt1 timestamps | cnt2 timestamps 837 * 6 | 8 838 * 7 | 9 839 * - | 10 840 * 841 * Flush every events below timestamp 7 842 * etc... 843 */ 844 static int process_finished_round(struct perf_tool *tool __maybe_unused, 845 union perf_event *event __maybe_unused, 846 struct ordered_events *oe) 847 { 848 if (dump_trace) 849 fprintf(stdout, "\n"); 850 return ordered_events__flush(oe, OE_FLUSH__ROUND); 851 } 852 853 int perf_session__queue_event(struct perf_session *s, union perf_event *event, 854 struct perf_sample *sample, u64 file_offset) 855 { 856 return ordered_events__queue(&s->ordered_events, event, sample, file_offset); 857 } 858 859 static void callchain__lbr_callstack_printf(struct perf_sample *sample) 860 { 861 struct ip_callchain *callchain = sample->callchain; 862 struct branch_stack *lbr_stack = sample->branch_stack; 863 u64 kernel_callchain_nr = callchain->nr; 864 unsigned int i; 865 866 for (i = 0; i < kernel_callchain_nr; i++) { 867 if (callchain->ips[i] == PERF_CONTEXT_USER) 868 break; 869 } 870 871 if ((i != kernel_callchain_nr) && lbr_stack->nr) { 872 u64 total_nr; 873 /* 874 * LBR callstack can only get user call chain, 875 * i is kernel call chain number, 876 * 1 is PERF_CONTEXT_USER. 877 * 878 * The user call chain is stored in LBR registers. 879 * LBR are pair registers. The caller is stored 880 * in "from" register, while the callee is stored 881 * in "to" register. 882 * For example, there is a call stack 883 * "A"->"B"->"C"->"D". 884 * The LBR registers will recorde like 885 * "C"->"D", "B"->"C", "A"->"B". 886 * So only the first "to" register and all "from" 887 * registers are needed to construct the whole stack. 888 */ 889 total_nr = i + 1 + lbr_stack->nr + 1; 890 kernel_callchain_nr = i + 1; 891 892 printf("... LBR call chain: nr:%" PRIu64 "\n", total_nr); 893 894 for (i = 0; i < kernel_callchain_nr; i++) 895 printf("..... %2d: %016" PRIx64 "\n", 896 i, callchain->ips[i]); 897 898 printf("..... %2d: %016" PRIx64 "\n", 899 (int)(kernel_callchain_nr), lbr_stack->entries[0].to); 900 for (i = 0; i < lbr_stack->nr; i++) 901 printf("..... %2d: %016" PRIx64 "\n", 902 (int)(i + kernel_callchain_nr + 1), lbr_stack->entries[i].from); 903 } 904 } 905 906 static void callchain__printf(struct perf_evsel *evsel, 907 struct perf_sample *sample) 908 { 909 unsigned int i; 910 struct ip_callchain *callchain = sample->callchain; 911 912 if (perf_evsel__has_branch_callstack(evsel)) 913 callchain__lbr_callstack_printf(sample); 914 915 printf("... FP chain: nr:%" PRIu64 "\n", callchain->nr); 916 917 for (i = 0; i < callchain->nr; i++) 918 printf("..... %2d: %016" PRIx64 "\n", 919 i, callchain->ips[i]); 920 } 921 922 static void branch_stack__printf(struct perf_sample *sample) 923 { 924 uint64_t i; 925 926 printf("... branch stack: nr:%" PRIu64 "\n", sample->branch_stack->nr); 927 928 for (i = 0; i < sample->branch_stack->nr; i++) { 929 struct branch_entry *e = &sample->branch_stack->entries[i]; 930 931 printf("..... %2"PRIu64": %016" PRIx64 " -> %016" PRIx64 " %hu cycles %s%s%s%s %x\n", 932 i, e->from, e->to, 933 e->flags.cycles, 934 e->flags.mispred ? "M" : " ", 935 e->flags.predicted ? "P" : " ", 936 e->flags.abort ? "A" : " ", 937 e->flags.in_tx ? "T" : " ", 938 (unsigned)e->flags.reserved); 939 } 940 } 941 942 static void regs_dump__printf(u64 mask, u64 *regs) 943 { 944 unsigned rid, i = 0; 945 946 for_each_set_bit(rid, (unsigned long *) &mask, sizeof(mask) * 8) { 947 u64 val = regs[i++]; 948 949 printf(".... %-5s 0x%" PRIx64 "\n", 950 perf_reg_name(rid), val); 951 } 952 } 953 954 static const char *regs_abi[] = { 955 [PERF_SAMPLE_REGS_ABI_NONE] = "none", 956 [PERF_SAMPLE_REGS_ABI_32] = "32-bit", 957 [PERF_SAMPLE_REGS_ABI_64] = "64-bit", 958 }; 959 960 static inline const char *regs_dump_abi(struct regs_dump *d) 961 { 962 if (d->abi > PERF_SAMPLE_REGS_ABI_64) 963 return "unknown"; 964 965 return regs_abi[d->abi]; 966 } 967 968 static void regs__printf(const char *type, struct regs_dump *regs) 969 { 970 u64 mask = regs->mask; 971 972 printf("... %s regs: mask 0x%" PRIx64 " ABI %s\n", 973 type, 974 mask, 975 regs_dump_abi(regs)); 976 977 regs_dump__printf(mask, regs->regs); 978 } 979 980 static void regs_user__printf(struct perf_sample *sample) 981 { 982 struct regs_dump *user_regs = &sample->user_regs; 983 984 if (user_regs->regs) 985 regs__printf("user", user_regs); 986 } 987 988 static void regs_intr__printf(struct perf_sample *sample) 989 { 990 struct regs_dump *intr_regs = &sample->intr_regs; 991 992 if (intr_regs->regs) 993 regs__printf("intr", intr_regs); 994 } 995 996 static void stack_user__printf(struct stack_dump *dump) 997 { 998 printf("... ustack: size %" PRIu64 ", offset 0x%x\n", 999 dump->size, dump->offset); 1000 } 1001 1002 static void perf_evlist__print_tstamp(struct perf_evlist *evlist, 1003 union perf_event *event, 1004 struct perf_sample *sample) 1005 { 1006 u64 sample_type = __perf_evlist__combined_sample_type(evlist); 1007 1008 if (event->header.type != PERF_RECORD_SAMPLE && 1009 !perf_evlist__sample_id_all(evlist)) { 1010 fputs("-1 -1 ", stdout); 1011 return; 1012 } 1013 1014 if ((sample_type & PERF_SAMPLE_CPU)) 1015 printf("%u ", sample->cpu); 1016 1017 if (sample_type & PERF_SAMPLE_TIME) 1018 printf("%" PRIu64 " ", sample->time); 1019 } 1020 1021 static void sample_read__printf(struct perf_sample *sample, u64 read_format) 1022 { 1023 printf("... sample_read:\n"); 1024 1025 if (read_format & PERF_FORMAT_TOTAL_TIME_ENABLED) 1026 printf("...... time enabled %016" PRIx64 "\n", 1027 sample->read.time_enabled); 1028 1029 if (read_format & PERF_FORMAT_TOTAL_TIME_RUNNING) 1030 printf("...... time running %016" PRIx64 "\n", 1031 sample->read.time_running); 1032 1033 if (read_format & PERF_FORMAT_GROUP) { 1034 u64 i; 1035 1036 printf(".... group nr %" PRIu64 "\n", sample->read.group.nr); 1037 1038 for (i = 0; i < sample->read.group.nr; i++) { 1039 struct sample_read_value *value; 1040 1041 value = &sample->read.group.values[i]; 1042 printf("..... id %016" PRIx64 1043 ", value %016" PRIx64 "\n", 1044 value->id, value->value); 1045 } 1046 } else 1047 printf("..... id %016" PRIx64 ", value %016" PRIx64 "\n", 1048 sample->read.one.id, sample->read.one.value); 1049 } 1050 1051 static void dump_event(struct perf_evlist *evlist, union perf_event *event, 1052 u64 file_offset, struct perf_sample *sample) 1053 { 1054 if (!dump_trace) 1055 return; 1056 1057 printf("\n%#" PRIx64 " [%#x]: event: %d\n", 1058 file_offset, event->header.size, event->header.type); 1059 1060 trace_event(event); 1061 1062 if (sample) 1063 perf_evlist__print_tstamp(evlist, event, sample); 1064 1065 printf("%#" PRIx64 " [%#x]: PERF_RECORD_%s", file_offset, 1066 event->header.size, perf_event__name(event->header.type)); 1067 } 1068 1069 static void dump_sample(struct perf_evsel *evsel, union perf_event *event, 1070 struct perf_sample *sample) 1071 { 1072 u64 sample_type; 1073 1074 if (!dump_trace) 1075 return; 1076 1077 printf("(IP, 0x%x): %d/%d: %#" PRIx64 " period: %" PRIu64 " addr: %#" PRIx64 "\n", 1078 event->header.misc, sample->pid, sample->tid, sample->ip, 1079 sample->period, sample->addr); 1080 1081 sample_type = evsel->attr.sample_type; 1082 1083 if (sample_type & PERF_SAMPLE_CALLCHAIN) 1084 callchain__printf(evsel, sample); 1085 1086 if ((sample_type & PERF_SAMPLE_BRANCH_STACK) && !perf_evsel__has_branch_callstack(evsel)) 1087 branch_stack__printf(sample); 1088 1089 if (sample_type & PERF_SAMPLE_REGS_USER) 1090 regs_user__printf(sample); 1091 1092 if (sample_type & PERF_SAMPLE_REGS_INTR) 1093 regs_intr__printf(sample); 1094 1095 if (sample_type & PERF_SAMPLE_STACK_USER) 1096 stack_user__printf(&sample->user_stack); 1097 1098 if (sample_type & PERF_SAMPLE_WEIGHT) 1099 printf("... weight: %" PRIu64 "\n", sample->weight); 1100 1101 if (sample_type & PERF_SAMPLE_DATA_SRC) 1102 printf(" . data_src: 0x%"PRIx64"\n", sample->data_src); 1103 1104 if (sample_type & PERF_SAMPLE_TRANSACTION) 1105 printf("... transaction: %" PRIx64 "\n", sample->transaction); 1106 1107 if (sample_type & PERF_SAMPLE_READ) 1108 sample_read__printf(sample, evsel->attr.read_format); 1109 } 1110 1111 static struct machine *machines__find_for_cpumode(struct machines *machines, 1112 union perf_event *event, 1113 struct perf_sample *sample) 1114 { 1115 struct machine *machine; 1116 1117 if (perf_guest && 1118 ((sample->cpumode == PERF_RECORD_MISC_GUEST_KERNEL) || 1119 (sample->cpumode == PERF_RECORD_MISC_GUEST_USER))) { 1120 u32 pid; 1121 1122 if (event->header.type == PERF_RECORD_MMAP 1123 || event->header.type == PERF_RECORD_MMAP2) 1124 pid = event->mmap.pid; 1125 else 1126 pid = sample->pid; 1127 1128 machine = machines__find(machines, pid); 1129 if (!machine) 1130 machine = machines__findnew(machines, DEFAULT_GUEST_KERNEL_ID); 1131 return machine; 1132 } 1133 1134 return &machines->host; 1135 } 1136 1137 static int deliver_sample_value(struct perf_evlist *evlist, 1138 struct perf_tool *tool, 1139 union perf_event *event, 1140 struct perf_sample *sample, 1141 struct sample_read_value *v, 1142 struct machine *machine) 1143 { 1144 struct perf_sample_id *sid = perf_evlist__id2sid(evlist, v->id); 1145 1146 if (sid) { 1147 sample->id = v->id; 1148 sample->period = v->value - sid->period; 1149 sid->period = v->value; 1150 } 1151 1152 if (!sid || sid->evsel == NULL) { 1153 ++evlist->stats.nr_unknown_id; 1154 return 0; 1155 } 1156 1157 return tool->sample(tool, event, sample, sid->evsel, machine); 1158 } 1159 1160 static int deliver_sample_group(struct perf_evlist *evlist, 1161 struct perf_tool *tool, 1162 union perf_event *event, 1163 struct perf_sample *sample, 1164 struct machine *machine) 1165 { 1166 int ret = -EINVAL; 1167 u64 i; 1168 1169 for (i = 0; i < sample->read.group.nr; i++) { 1170 ret = deliver_sample_value(evlist, tool, event, sample, 1171 &sample->read.group.values[i], 1172 machine); 1173 if (ret) 1174 break; 1175 } 1176 1177 return ret; 1178 } 1179 1180 static int 1181 perf_evlist__deliver_sample(struct perf_evlist *evlist, 1182 struct perf_tool *tool, 1183 union perf_event *event, 1184 struct perf_sample *sample, 1185 struct perf_evsel *evsel, 1186 struct machine *machine) 1187 { 1188 /* We know evsel != NULL. */ 1189 u64 sample_type = evsel->attr.sample_type; 1190 u64 read_format = evsel->attr.read_format; 1191 1192 /* Standard sample delievery. */ 1193 if (!(sample_type & PERF_SAMPLE_READ)) 1194 return tool->sample(tool, event, sample, evsel, machine); 1195 1196 /* For PERF_SAMPLE_READ we have either single or group mode. */ 1197 if (read_format & PERF_FORMAT_GROUP) 1198 return deliver_sample_group(evlist, tool, event, sample, 1199 machine); 1200 else 1201 return deliver_sample_value(evlist, tool, event, sample, 1202 &sample->read.one, machine); 1203 } 1204 1205 static int machines__deliver_event(struct machines *machines, 1206 struct perf_evlist *evlist, 1207 union perf_event *event, 1208 struct perf_sample *sample, 1209 struct perf_tool *tool, u64 file_offset) 1210 { 1211 struct perf_evsel *evsel; 1212 struct machine *machine; 1213 1214 dump_event(evlist, event, file_offset, sample); 1215 1216 evsel = perf_evlist__id2evsel(evlist, sample->id); 1217 1218 machine = machines__find_for_cpumode(machines, event, sample); 1219 1220 switch (event->header.type) { 1221 case PERF_RECORD_SAMPLE: 1222 if (evsel == NULL) { 1223 ++evlist->stats.nr_unknown_id; 1224 return 0; 1225 } 1226 dump_sample(evsel, event, sample); 1227 if (machine == NULL) { 1228 ++evlist->stats.nr_unprocessable_samples; 1229 return 0; 1230 } 1231 return perf_evlist__deliver_sample(evlist, tool, event, sample, evsel, machine); 1232 case PERF_RECORD_MMAP: 1233 return tool->mmap(tool, event, sample, machine); 1234 case PERF_RECORD_MMAP2: 1235 if (event->header.misc & PERF_RECORD_MISC_PROC_MAP_PARSE_TIMEOUT) 1236 ++evlist->stats.nr_proc_map_timeout; 1237 return tool->mmap2(tool, event, sample, machine); 1238 case PERF_RECORD_COMM: 1239 return tool->comm(tool, event, sample, machine); 1240 case PERF_RECORD_FORK: 1241 return tool->fork(tool, event, sample, machine); 1242 case PERF_RECORD_EXIT: 1243 return tool->exit(tool, event, sample, machine); 1244 case PERF_RECORD_LOST: 1245 if (tool->lost == perf_event__process_lost) 1246 evlist->stats.total_lost += event->lost.lost; 1247 return tool->lost(tool, event, sample, machine); 1248 case PERF_RECORD_LOST_SAMPLES: 1249 if (tool->lost_samples == perf_event__process_lost_samples) 1250 evlist->stats.total_lost_samples += event->lost_samples.lost; 1251 return tool->lost_samples(tool, event, sample, machine); 1252 case PERF_RECORD_READ: 1253 return tool->read(tool, event, sample, evsel, machine); 1254 case PERF_RECORD_THROTTLE: 1255 return tool->throttle(tool, event, sample, machine); 1256 case PERF_RECORD_UNTHROTTLE: 1257 return tool->unthrottle(tool, event, sample, machine); 1258 case PERF_RECORD_AUX: 1259 if (tool->aux == perf_event__process_aux && 1260 (event->aux.flags & PERF_AUX_FLAG_TRUNCATED)) 1261 evlist->stats.total_aux_lost += 1; 1262 return tool->aux(tool, event, sample, machine); 1263 case PERF_RECORD_ITRACE_START: 1264 return tool->itrace_start(tool, event, sample, machine); 1265 case PERF_RECORD_SWITCH: 1266 case PERF_RECORD_SWITCH_CPU_WIDE: 1267 return tool->context_switch(tool, event, sample, machine); 1268 default: 1269 ++evlist->stats.nr_unknown_events; 1270 return -1; 1271 } 1272 } 1273 1274 static int perf_session__deliver_event(struct perf_session *session, 1275 union perf_event *event, 1276 struct perf_sample *sample, 1277 struct perf_tool *tool, 1278 u64 file_offset) 1279 { 1280 int ret; 1281 1282 ret = auxtrace__process_event(session, event, sample, tool); 1283 if (ret < 0) 1284 return ret; 1285 if (ret > 0) 1286 return 0; 1287 1288 return machines__deliver_event(&session->machines, session->evlist, 1289 event, sample, tool, file_offset); 1290 } 1291 1292 static s64 perf_session__process_user_event(struct perf_session *session, 1293 union perf_event *event, 1294 u64 file_offset) 1295 { 1296 struct ordered_events *oe = &session->ordered_events; 1297 struct perf_tool *tool = session->tool; 1298 int fd = perf_data_file__fd(session->file); 1299 int err; 1300 1301 dump_event(session->evlist, event, file_offset, NULL); 1302 1303 /* These events are processed right away */ 1304 switch (event->header.type) { 1305 case PERF_RECORD_HEADER_ATTR: 1306 err = tool->attr(tool, event, &session->evlist); 1307 if (err == 0) { 1308 perf_session__set_id_hdr_size(session); 1309 perf_session__set_comm_exec(session); 1310 } 1311 return err; 1312 case PERF_RECORD_EVENT_UPDATE: 1313 return tool->event_update(tool, event, &session->evlist); 1314 case PERF_RECORD_HEADER_EVENT_TYPE: 1315 /* 1316 * Depreceated, but we need to handle it for sake 1317 * of old data files create in pipe mode. 1318 */ 1319 return 0; 1320 case PERF_RECORD_HEADER_TRACING_DATA: 1321 /* setup for reading amidst mmap */ 1322 lseek(fd, file_offset, SEEK_SET); 1323 return tool->tracing_data(tool, event, session); 1324 case PERF_RECORD_HEADER_BUILD_ID: 1325 return tool->build_id(tool, event, session); 1326 case PERF_RECORD_FINISHED_ROUND: 1327 return tool->finished_round(tool, event, oe); 1328 case PERF_RECORD_ID_INDEX: 1329 return tool->id_index(tool, event, session); 1330 case PERF_RECORD_AUXTRACE_INFO: 1331 return tool->auxtrace_info(tool, event, session); 1332 case PERF_RECORD_AUXTRACE: 1333 /* setup for reading amidst mmap */ 1334 lseek(fd, file_offset + event->header.size, SEEK_SET); 1335 return tool->auxtrace(tool, event, session); 1336 case PERF_RECORD_AUXTRACE_ERROR: 1337 perf_session__auxtrace_error_inc(session, event); 1338 return tool->auxtrace_error(tool, event, session); 1339 case PERF_RECORD_THREAD_MAP: 1340 return tool->thread_map(tool, event, session); 1341 case PERF_RECORD_CPU_MAP: 1342 return tool->cpu_map(tool, event, session); 1343 case PERF_RECORD_STAT_CONFIG: 1344 return tool->stat_config(tool, event, session); 1345 case PERF_RECORD_STAT: 1346 return tool->stat(tool, event, session); 1347 case PERF_RECORD_STAT_ROUND: 1348 return tool->stat_round(tool, event, session); 1349 case PERF_RECORD_TIME_CONV: 1350 session->time_conv = event->time_conv; 1351 return tool->time_conv(tool, event, session); 1352 default: 1353 return -EINVAL; 1354 } 1355 } 1356 1357 int perf_session__deliver_synth_event(struct perf_session *session, 1358 union perf_event *event, 1359 struct perf_sample *sample) 1360 { 1361 struct perf_evlist *evlist = session->evlist; 1362 struct perf_tool *tool = session->tool; 1363 1364 events_stats__inc(&evlist->stats, event->header.type); 1365 1366 if (event->header.type >= PERF_RECORD_USER_TYPE_START) 1367 return perf_session__process_user_event(session, event, 0); 1368 1369 return machines__deliver_event(&session->machines, evlist, event, sample, tool, 0); 1370 } 1371 1372 static void event_swap(union perf_event *event, bool sample_id_all) 1373 { 1374 perf_event__swap_op swap; 1375 1376 swap = perf_event__swap_ops[event->header.type]; 1377 if (swap) 1378 swap(event, sample_id_all); 1379 } 1380 1381 int perf_session__peek_event(struct perf_session *session, off_t file_offset, 1382 void *buf, size_t buf_sz, 1383 union perf_event **event_ptr, 1384 struct perf_sample *sample) 1385 { 1386 union perf_event *event; 1387 size_t hdr_sz, rest; 1388 int fd; 1389 1390 if (session->one_mmap && !session->header.needs_swap) { 1391 event = file_offset - session->one_mmap_offset + 1392 session->one_mmap_addr; 1393 goto out_parse_sample; 1394 } 1395 1396 if (perf_data_file__is_pipe(session->file)) 1397 return -1; 1398 1399 fd = perf_data_file__fd(session->file); 1400 hdr_sz = sizeof(struct perf_event_header); 1401 1402 if (buf_sz < hdr_sz) 1403 return -1; 1404 1405 if (lseek(fd, file_offset, SEEK_SET) == (off_t)-1 || 1406 readn(fd, buf, hdr_sz) != (ssize_t)hdr_sz) 1407 return -1; 1408 1409 event = (union perf_event *)buf; 1410 1411 if (session->header.needs_swap) 1412 perf_event_header__bswap(&event->header); 1413 1414 if (event->header.size < hdr_sz || event->header.size > buf_sz) 1415 return -1; 1416 1417 rest = event->header.size - hdr_sz; 1418 1419 if (readn(fd, buf, rest) != (ssize_t)rest) 1420 return -1; 1421 1422 if (session->header.needs_swap) 1423 event_swap(event, perf_evlist__sample_id_all(session->evlist)); 1424 1425 out_parse_sample: 1426 1427 if (sample && event->header.type < PERF_RECORD_USER_TYPE_START && 1428 perf_evlist__parse_sample(session->evlist, event, sample)) 1429 return -1; 1430 1431 *event_ptr = event; 1432 1433 return 0; 1434 } 1435 1436 static s64 perf_session__process_event(struct perf_session *session, 1437 union perf_event *event, u64 file_offset) 1438 { 1439 struct perf_evlist *evlist = session->evlist; 1440 struct perf_tool *tool = session->tool; 1441 struct perf_sample sample; 1442 int ret; 1443 1444 if (session->header.needs_swap) 1445 event_swap(event, perf_evlist__sample_id_all(evlist)); 1446 1447 if (event->header.type >= PERF_RECORD_HEADER_MAX) 1448 return -EINVAL; 1449 1450 events_stats__inc(&evlist->stats, event->header.type); 1451 1452 if (event->header.type >= PERF_RECORD_USER_TYPE_START) 1453 return perf_session__process_user_event(session, event, file_offset); 1454 1455 /* 1456 * For all kernel events we get the sample data 1457 */ 1458 ret = perf_evlist__parse_sample(evlist, event, &sample); 1459 if (ret) 1460 return ret; 1461 1462 if (tool->ordered_events) { 1463 ret = perf_session__queue_event(session, event, &sample, file_offset); 1464 if (ret != -ETIME) 1465 return ret; 1466 } 1467 1468 return perf_session__deliver_event(session, event, &sample, tool, 1469 file_offset); 1470 } 1471 1472 void perf_event_header__bswap(struct perf_event_header *hdr) 1473 { 1474 hdr->type = bswap_32(hdr->type); 1475 hdr->misc = bswap_16(hdr->misc); 1476 hdr->size = bswap_16(hdr->size); 1477 } 1478 1479 struct thread *perf_session__findnew(struct perf_session *session, pid_t pid) 1480 { 1481 return machine__findnew_thread(&session->machines.host, -1, pid); 1482 } 1483 1484 int perf_session__register_idle_thread(struct perf_session *session) 1485 { 1486 struct thread *thread; 1487 int err = 0; 1488 1489 thread = machine__findnew_thread(&session->machines.host, 0, 0); 1490 if (thread == NULL || thread__set_comm(thread, "swapper", 0)) { 1491 pr_err("problem inserting idle task.\n"); 1492 err = -1; 1493 } 1494 1495 /* machine__findnew_thread() got the thread, so put it */ 1496 thread__put(thread); 1497 return err; 1498 } 1499 1500 static void perf_session__warn_about_errors(const struct perf_session *session) 1501 { 1502 const struct events_stats *stats = &session->evlist->stats; 1503 const struct ordered_events *oe = &session->ordered_events; 1504 1505 if (session->tool->lost == perf_event__process_lost && 1506 stats->nr_events[PERF_RECORD_LOST] != 0) { 1507 ui__warning("Processed %d events and lost %d chunks!\n\n" 1508 "Check IO/CPU overload!\n\n", 1509 stats->nr_events[0], 1510 stats->nr_events[PERF_RECORD_LOST]); 1511 } 1512 1513 if (session->tool->lost_samples == perf_event__process_lost_samples) { 1514 double drop_rate; 1515 1516 drop_rate = (double)stats->total_lost_samples / 1517 (double) (stats->nr_events[PERF_RECORD_SAMPLE] + stats->total_lost_samples); 1518 if (drop_rate > 0.05) { 1519 ui__warning("Processed %" PRIu64 " samples and lost %3.2f%% samples!\n\n", 1520 stats->nr_events[PERF_RECORD_SAMPLE] + stats->total_lost_samples, 1521 drop_rate * 100.0); 1522 } 1523 } 1524 1525 if (session->tool->aux == perf_event__process_aux && 1526 stats->total_aux_lost != 0) { 1527 ui__warning("AUX data lost %" PRIu64 " times out of %u!\n\n", 1528 stats->total_aux_lost, 1529 stats->nr_events[PERF_RECORD_AUX]); 1530 } 1531 1532 if (stats->nr_unknown_events != 0) { 1533 ui__warning("Found %u unknown events!\n\n" 1534 "Is this an older tool processing a perf.data " 1535 "file generated by a more recent tool?\n\n" 1536 "If that is not the case, consider " 1537 "reporting to linux-kernel@vger.kernel.org.\n\n", 1538 stats->nr_unknown_events); 1539 } 1540 1541 if (stats->nr_unknown_id != 0) { 1542 ui__warning("%u samples with id not present in the header\n", 1543 stats->nr_unknown_id); 1544 } 1545 1546 if (stats->nr_invalid_chains != 0) { 1547 ui__warning("Found invalid callchains!\n\n" 1548 "%u out of %u events were discarded for this reason.\n\n" 1549 "Consider reporting to linux-kernel@vger.kernel.org.\n\n", 1550 stats->nr_invalid_chains, 1551 stats->nr_events[PERF_RECORD_SAMPLE]); 1552 } 1553 1554 if (stats->nr_unprocessable_samples != 0) { 1555 ui__warning("%u unprocessable samples recorded.\n" 1556 "Do you have a KVM guest running and not using 'perf kvm'?\n", 1557 stats->nr_unprocessable_samples); 1558 } 1559 1560 if (oe->nr_unordered_events != 0) 1561 ui__warning("%u out of order events recorded.\n", oe->nr_unordered_events); 1562 1563 events_stats__auxtrace_error_warn(stats); 1564 1565 if (stats->nr_proc_map_timeout != 0) { 1566 ui__warning("%d map information files for pre-existing threads were\n" 1567 "not processed, if there are samples for addresses they\n" 1568 "will not be resolved, you may find out which are these\n" 1569 "threads by running with -v and redirecting the output\n" 1570 "to a file.\n" 1571 "The time limit to process proc map is too short?\n" 1572 "Increase it by --proc-map-timeout\n", 1573 stats->nr_proc_map_timeout); 1574 } 1575 } 1576 1577 static int perf_session__flush_thread_stack(struct thread *thread, 1578 void *p __maybe_unused) 1579 { 1580 return thread_stack__flush(thread); 1581 } 1582 1583 static int perf_session__flush_thread_stacks(struct perf_session *session) 1584 { 1585 return machines__for_each_thread(&session->machines, 1586 perf_session__flush_thread_stack, 1587 NULL); 1588 } 1589 1590 volatile int session_done; 1591 1592 static int __perf_session__process_pipe_events(struct perf_session *session) 1593 { 1594 struct ordered_events *oe = &session->ordered_events; 1595 struct perf_tool *tool = session->tool; 1596 int fd = perf_data_file__fd(session->file); 1597 union perf_event *event; 1598 uint32_t size, cur_size = 0; 1599 void *buf = NULL; 1600 s64 skip = 0; 1601 u64 head; 1602 ssize_t err; 1603 void *p; 1604 1605 perf_tool__fill_defaults(tool); 1606 1607 head = 0; 1608 cur_size = sizeof(union perf_event); 1609 1610 buf = malloc(cur_size); 1611 if (!buf) 1612 return -errno; 1613 more: 1614 event = buf; 1615 err = readn(fd, event, sizeof(struct perf_event_header)); 1616 if (err <= 0) { 1617 if (err == 0) 1618 goto done; 1619 1620 pr_err("failed to read event header\n"); 1621 goto out_err; 1622 } 1623 1624 if (session->header.needs_swap) 1625 perf_event_header__bswap(&event->header); 1626 1627 size = event->header.size; 1628 if (size < sizeof(struct perf_event_header)) { 1629 pr_err("bad event header size\n"); 1630 goto out_err; 1631 } 1632 1633 if (size > cur_size) { 1634 void *new = realloc(buf, size); 1635 if (!new) { 1636 pr_err("failed to allocate memory to read event\n"); 1637 goto out_err; 1638 } 1639 buf = new; 1640 cur_size = size; 1641 event = buf; 1642 } 1643 p = event; 1644 p += sizeof(struct perf_event_header); 1645 1646 if (size - sizeof(struct perf_event_header)) { 1647 err = readn(fd, p, size - sizeof(struct perf_event_header)); 1648 if (err <= 0) { 1649 if (err == 0) { 1650 pr_err("unexpected end of event stream\n"); 1651 goto done; 1652 } 1653 1654 pr_err("failed to read event data\n"); 1655 goto out_err; 1656 } 1657 } 1658 1659 if ((skip = perf_session__process_event(session, event, head)) < 0) { 1660 pr_err("%#" PRIx64 " [%#x]: failed to process type: %d\n", 1661 head, event->header.size, event->header.type); 1662 err = -EINVAL; 1663 goto out_err; 1664 } 1665 1666 head += size; 1667 1668 if (skip > 0) 1669 head += skip; 1670 1671 if (!session_done()) 1672 goto more; 1673 done: 1674 /* do the final flush for ordered samples */ 1675 err = ordered_events__flush(oe, OE_FLUSH__FINAL); 1676 if (err) 1677 goto out_err; 1678 err = auxtrace__flush_events(session, tool); 1679 if (err) 1680 goto out_err; 1681 err = perf_session__flush_thread_stacks(session); 1682 out_err: 1683 free(buf); 1684 perf_session__warn_about_errors(session); 1685 ordered_events__free(&session->ordered_events); 1686 auxtrace__free_events(session); 1687 return err; 1688 } 1689 1690 static union perf_event * 1691 fetch_mmaped_event(struct perf_session *session, 1692 u64 head, size_t mmap_size, char *buf) 1693 { 1694 union perf_event *event; 1695 1696 /* 1697 * Ensure we have enough space remaining to read 1698 * the size of the event in the headers. 1699 */ 1700 if (head + sizeof(event->header) > mmap_size) 1701 return NULL; 1702 1703 event = (union perf_event *)(buf + head); 1704 1705 if (session->header.needs_swap) 1706 perf_event_header__bswap(&event->header); 1707 1708 if (head + event->header.size > mmap_size) { 1709 /* We're not fetching the event so swap back again */ 1710 if (session->header.needs_swap) 1711 perf_event_header__bswap(&event->header); 1712 return NULL; 1713 } 1714 1715 return event; 1716 } 1717 1718 /* 1719 * On 64bit we can mmap the data file in one go. No need for tiny mmap 1720 * slices. On 32bit we use 32MB. 1721 */ 1722 #if BITS_PER_LONG == 64 1723 #define MMAP_SIZE ULLONG_MAX 1724 #define NUM_MMAPS 1 1725 #else 1726 #define MMAP_SIZE (32 * 1024 * 1024ULL) 1727 #define NUM_MMAPS 128 1728 #endif 1729 1730 static int __perf_session__process_events(struct perf_session *session, 1731 u64 data_offset, u64 data_size, 1732 u64 file_size) 1733 { 1734 struct ordered_events *oe = &session->ordered_events; 1735 struct perf_tool *tool = session->tool; 1736 int fd = perf_data_file__fd(session->file); 1737 u64 head, page_offset, file_offset, file_pos, size; 1738 int err, mmap_prot, mmap_flags, map_idx = 0; 1739 size_t mmap_size; 1740 char *buf, *mmaps[NUM_MMAPS]; 1741 union perf_event *event; 1742 struct ui_progress prog; 1743 s64 skip; 1744 1745 perf_tool__fill_defaults(tool); 1746 1747 page_offset = page_size * (data_offset / page_size); 1748 file_offset = page_offset; 1749 head = data_offset - page_offset; 1750 1751 if (data_size == 0) 1752 goto out; 1753 1754 if (data_offset + data_size < file_size) 1755 file_size = data_offset + data_size; 1756 1757 ui_progress__init(&prog, file_size, "Processing events..."); 1758 1759 mmap_size = MMAP_SIZE; 1760 if (mmap_size > file_size) { 1761 mmap_size = file_size; 1762 session->one_mmap = true; 1763 } 1764 1765 memset(mmaps, 0, sizeof(mmaps)); 1766 1767 mmap_prot = PROT_READ; 1768 mmap_flags = MAP_SHARED; 1769 1770 if (session->header.needs_swap) { 1771 mmap_prot |= PROT_WRITE; 1772 mmap_flags = MAP_PRIVATE; 1773 } 1774 remap: 1775 buf = mmap(NULL, mmap_size, mmap_prot, mmap_flags, fd, 1776 file_offset); 1777 if (buf == MAP_FAILED) { 1778 pr_err("failed to mmap file\n"); 1779 err = -errno; 1780 goto out_err; 1781 } 1782 mmaps[map_idx] = buf; 1783 map_idx = (map_idx + 1) & (ARRAY_SIZE(mmaps) - 1); 1784 file_pos = file_offset + head; 1785 if (session->one_mmap) { 1786 session->one_mmap_addr = buf; 1787 session->one_mmap_offset = file_offset; 1788 } 1789 1790 more: 1791 event = fetch_mmaped_event(session, head, mmap_size, buf); 1792 if (!event) { 1793 if (mmaps[map_idx]) { 1794 munmap(mmaps[map_idx], mmap_size); 1795 mmaps[map_idx] = NULL; 1796 } 1797 1798 page_offset = page_size * (head / page_size); 1799 file_offset += page_offset; 1800 head -= page_offset; 1801 goto remap; 1802 } 1803 1804 size = event->header.size; 1805 1806 if (size < sizeof(struct perf_event_header) || 1807 (skip = perf_session__process_event(session, event, file_pos)) < 0) { 1808 pr_err("%#" PRIx64 " [%#x]: failed to process type: %d\n", 1809 file_offset + head, event->header.size, 1810 event->header.type); 1811 err = -EINVAL; 1812 goto out_err; 1813 } 1814 1815 if (skip) 1816 size += skip; 1817 1818 head += size; 1819 file_pos += size; 1820 1821 ui_progress__update(&prog, size); 1822 1823 if (session_done()) 1824 goto out; 1825 1826 if (file_pos < file_size) 1827 goto more; 1828 1829 out: 1830 /* do the final flush for ordered samples */ 1831 err = ordered_events__flush(oe, OE_FLUSH__FINAL); 1832 if (err) 1833 goto out_err; 1834 err = auxtrace__flush_events(session, tool); 1835 if (err) 1836 goto out_err; 1837 err = perf_session__flush_thread_stacks(session); 1838 out_err: 1839 ui_progress__finish(); 1840 perf_session__warn_about_errors(session); 1841 /* 1842 * We may switching perf.data output, make ordered_events 1843 * reusable. 1844 */ 1845 ordered_events__reinit(&session->ordered_events); 1846 auxtrace__free_events(session); 1847 session->one_mmap = false; 1848 return err; 1849 } 1850 1851 int perf_session__process_events(struct perf_session *session) 1852 { 1853 u64 size = perf_data_file__size(session->file); 1854 int err; 1855 1856 if (perf_session__register_idle_thread(session) < 0) 1857 return -ENOMEM; 1858 1859 if (!perf_data_file__is_pipe(session->file)) 1860 err = __perf_session__process_events(session, 1861 session->header.data_offset, 1862 session->header.data_size, size); 1863 else 1864 err = __perf_session__process_pipe_events(session); 1865 1866 return err; 1867 } 1868 1869 bool perf_session__has_traces(struct perf_session *session, const char *msg) 1870 { 1871 struct perf_evsel *evsel; 1872 1873 evlist__for_each(session->evlist, evsel) { 1874 if (evsel->attr.type == PERF_TYPE_TRACEPOINT) 1875 return true; 1876 } 1877 1878 pr_err("No trace sample to read. Did you call 'perf %s'?\n", msg); 1879 return false; 1880 } 1881 1882 int maps__set_kallsyms_ref_reloc_sym(struct map **maps, 1883 const char *symbol_name, u64 addr) 1884 { 1885 char *bracket; 1886 enum map_type i; 1887 struct ref_reloc_sym *ref; 1888 1889 ref = zalloc(sizeof(struct ref_reloc_sym)); 1890 if (ref == NULL) 1891 return -ENOMEM; 1892 1893 ref->name = strdup(symbol_name); 1894 if (ref->name == NULL) { 1895 free(ref); 1896 return -ENOMEM; 1897 } 1898 1899 bracket = strchr(ref->name, ']'); 1900 if (bracket) 1901 *bracket = '\0'; 1902 1903 ref->addr = addr; 1904 1905 for (i = 0; i < MAP__NR_TYPES; ++i) { 1906 struct kmap *kmap = map__kmap(maps[i]); 1907 1908 if (!kmap) 1909 continue; 1910 kmap->ref_reloc_sym = ref; 1911 } 1912 1913 return 0; 1914 } 1915 1916 size_t perf_session__fprintf_dsos(struct perf_session *session, FILE *fp) 1917 { 1918 return machines__fprintf_dsos(&session->machines, fp); 1919 } 1920 1921 size_t perf_session__fprintf_dsos_buildid(struct perf_session *session, FILE *fp, 1922 bool (skip)(struct dso *dso, int parm), int parm) 1923 { 1924 return machines__fprintf_dsos_buildid(&session->machines, fp, skip, parm); 1925 } 1926 1927 size_t perf_session__fprintf_nr_events(struct perf_session *session, FILE *fp) 1928 { 1929 size_t ret; 1930 const char *msg = ""; 1931 1932 if (perf_header__has_feat(&session->header, HEADER_AUXTRACE)) 1933 msg = " (excludes AUX area (e.g. instruction trace) decoded / synthesized events)"; 1934 1935 ret = fprintf(fp, "\nAggregated stats:%s\n", msg); 1936 1937 ret += events_stats__fprintf(&session->evlist->stats, fp); 1938 return ret; 1939 } 1940 1941 size_t perf_session__fprintf(struct perf_session *session, FILE *fp) 1942 { 1943 /* 1944 * FIXME: Here we have to actually print all the machines in this 1945 * session, not just the host... 1946 */ 1947 return machine__fprintf(&session->machines.host, fp); 1948 } 1949 1950 struct perf_evsel *perf_session__find_first_evtype(struct perf_session *session, 1951 unsigned int type) 1952 { 1953 struct perf_evsel *pos; 1954 1955 evlist__for_each(session->evlist, pos) { 1956 if (pos->attr.type == type) 1957 return pos; 1958 } 1959 return NULL; 1960 } 1961 1962 int perf_session__cpu_bitmap(struct perf_session *session, 1963 const char *cpu_list, unsigned long *cpu_bitmap) 1964 { 1965 int i, err = -1; 1966 struct cpu_map *map; 1967 1968 for (i = 0; i < PERF_TYPE_MAX; ++i) { 1969 struct perf_evsel *evsel; 1970 1971 evsel = perf_session__find_first_evtype(session, i); 1972 if (!evsel) 1973 continue; 1974 1975 if (!(evsel->attr.sample_type & PERF_SAMPLE_CPU)) { 1976 pr_err("File does not contain CPU events. " 1977 "Remove -c option to proceed.\n"); 1978 return -1; 1979 } 1980 } 1981 1982 map = cpu_map__new(cpu_list); 1983 if (map == NULL) { 1984 pr_err("Invalid cpu_list\n"); 1985 return -1; 1986 } 1987 1988 for (i = 0; i < map->nr; i++) { 1989 int cpu = map->map[i]; 1990 1991 if (cpu >= MAX_NR_CPUS) { 1992 pr_err("Requested CPU %d too large. " 1993 "Consider raising MAX_NR_CPUS\n", cpu); 1994 goto out_delete_map; 1995 } 1996 1997 set_bit(cpu, cpu_bitmap); 1998 } 1999 2000 err = 0; 2001 2002 out_delete_map: 2003 cpu_map__put(map); 2004 return err; 2005 } 2006 2007 void perf_session__fprintf_info(struct perf_session *session, FILE *fp, 2008 bool full) 2009 { 2010 struct stat st; 2011 int fd, ret; 2012 2013 if (session == NULL || fp == NULL) 2014 return; 2015 2016 fd = perf_data_file__fd(session->file); 2017 2018 ret = fstat(fd, &st); 2019 if (ret == -1) 2020 return; 2021 2022 fprintf(fp, "# ========\n"); 2023 fprintf(fp, "# captured on: %s", ctime(&st.st_ctime)); 2024 perf_header__fprintf_info(session, fp, full); 2025 fprintf(fp, "# ========\n#\n"); 2026 } 2027 2028 2029 int __perf_session__set_tracepoints_handlers(struct perf_session *session, 2030 const struct perf_evsel_str_handler *assocs, 2031 size_t nr_assocs) 2032 { 2033 struct perf_evsel *evsel; 2034 size_t i; 2035 int err; 2036 2037 for (i = 0; i < nr_assocs; i++) { 2038 /* 2039 * Adding a handler for an event not in the session, 2040 * just ignore it. 2041 */ 2042 evsel = perf_evlist__find_tracepoint_by_name(session->evlist, assocs[i].name); 2043 if (evsel == NULL) 2044 continue; 2045 2046 err = -EEXIST; 2047 if (evsel->handler != NULL) 2048 goto out; 2049 evsel->handler = assocs[i].handler; 2050 } 2051 2052 err = 0; 2053 out: 2054 return err; 2055 } 2056 2057 int perf_event__process_id_index(struct perf_tool *tool __maybe_unused, 2058 union perf_event *event, 2059 struct perf_session *session) 2060 { 2061 struct perf_evlist *evlist = session->evlist; 2062 struct id_index_event *ie = &event->id_index; 2063 size_t i, nr, max_nr; 2064 2065 max_nr = (ie->header.size - sizeof(struct id_index_event)) / 2066 sizeof(struct id_index_entry); 2067 nr = ie->nr; 2068 if (nr > max_nr) 2069 return -EINVAL; 2070 2071 if (dump_trace) 2072 fprintf(stdout, " nr: %zu\n", nr); 2073 2074 for (i = 0; i < nr; i++) { 2075 struct id_index_entry *e = &ie->entries[i]; 2076 struct perf_sample_id *sid; 2077 2078 if (dump_trace) { 2079 fprintf(stdout, " ... id: %"PRIu64, e->id); 2080 fprintf(stdout, " idx: %"PRIu64, e->idx); 2081 fprintf(stdout, " cpu: %"PRId64, e->cpu); 2082 fprintf(stdout, " tid: %"PRId64"\n", e->tid); 2083 } 2084 2085 sid = perf_evlist__id2sid(evlist, e->id); 2086 if (!sid) 2087 return -ENOENT; 2088 sid->idx = e->idx; 2089 sid->cpu = e->cpu; 2090 sid->tid = e->tid; 2091 } 2092 return 0; 2093 } 2094 2095 int perf_event__synthesize_id_index(struct perf_tool *tool, 2096 perf_event__handler_t process, 2097 struct perf_evlist *evlist, 2098 struct machine *machine) 2099 { 2100 union perf_event *ev; 2101 struct perf_evsel *evsel; 2102 size_t nr = 0, i = 0, sz, max_nr, n; 2103 int err; 2104 2105 pr_debug2("Synthesizing id index\n"); 2106 2107 max_nr = (UINT16_MAX - sizeof(struct id_index_event)) / 2108 sizeof(struct id_index_entry); 2109 2110 evlist__for_each(evlist, evsel) 2111 nr += evsel->ids; 2112 2113 n = nr > max_nr ? max_nr : nr; 2114 sz = sizeof(struct id_index_event) + n * sizeof(struct id_index_entry); 2115 ev = zalloc(sz); 2116 if (!ev) 2117 return -ENOMEM; 2118 2119 ev->id_index.header.type = PERF_RECORD_ID_INDEX; 2120 ev->id_index.header.size = sz; 2121 ev->id_index.nr = n; 2122 2123 evlist__for_each(evlist, evsel) { 2124 u32 j; 2125 2126 for (j = 0; j < evsel->ids; j++) { 2127 struct id_index_entry *e; 2128 struct perf_sample_id *sid; 2129 2130 if (i >= n) { 2131 err = process(tool, ev, NULL, machine); 2132 if (err) 2133 goto out_err; 2134 nr -= n; 2135 i = 0; 2136 } 2137 2138 e = &ev->id_index.entries[i++]; 2139 2140 e->id = evsel->id[j]; 2141 2142 sid = perf_evlist__id2sid(evlist, e->id); 2143 if (!sid) { 2144 free(ev); 2145 return -ENOENT; 2146 } 2147 2148 e->idx = sid->idx; 2149 e->cpu = sid->cpu; 2150 e->tid = sid->tid; 2151 } 2152 } 2153 2154 sz = sizeof(struct id_index_event) + nr * sizeof(struct id_index_entry); 2155 ev->id_index.header.size = sz; 2156 ev->id_index.nr = nr; 2157 2158 err = process(tool, ev, NULL, machine); 2159 out_err: 2160 free(ev); 2161 2162 return err; 2163 } 2164