1 /*
2  * intel_pt_decoder.c: Intel Processor Trace support
3  * Copyright (c) 2013-2014, Intel Corporation.
4  *
5  * This program is free software; you can redistribute it and/or modify it
6  * under the terms and conditions of the GNU General Public License,
7  * version 2, as published by the Free Software Foundation.
8  *
9  * This program is distributed in the hope it will be useful, but WITHOUT
10  * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
11  * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License for
12  * more details.
13  *
14  */
15 
16 #ifndef _GNU_SOURCE
17 #define _GNU_SOURCE
18 #endif
19 #include <stdlib.h>
20 #include <stdbool.h>
21 #include <string.h>
22 #include <errno.h>
23 #include <stdint.h>
24 #include <inttypes.h>
25 
26 #include "../cache.h"
27 #include "../util.h"
28 
29 #include "intel-pt-insn-decoder.h"
30 #include "intel-pt-pkt-decoder.h"
31 #include "intel-pt-decoder.h"
32 #include "intel-pt-log.h"
33 
34 #define INTEL_PT_BLK_SIZE 1024
35 
36 #define BIT63 (((uint64_t)1 << 63))
37 
38 #define INTEL_PT_RETURN 1
39 
40 /* Maximum number of loops with no packets consumed i.e. stuck in a loop */
41 #define INTEL_PT_MAX_LOOPS 10000
42 
43 struct intel_pt_blk {
44 	struct intel_pt_blk *prev;
45 	uint64_t ip[INTEL_PT_BLK_SIZE];
46 };
47 
48 struct intel_pt_stack {
49 	struct intel_pt_blk *blk;
50 	struct intel_pt_blk *spare;
51 	int pos;
52 };
53 
54 enum intel_pt_pkt_state {
55 	INTEL_PT_STATE_NO_PSB,
56 	INTEL_PT_STATE_NO_IP,
57 	INTEL_PT_STATE_ERR_RESYNC,
58 	INTEL_PT_STATE_IN_SYNC,
59 	INTEL_PT_STATE_TNT,
60 	INTEL_PT_STATE_TIP,
61 	INTEL_PT_STATE_TIP_PGD,
62 	INTEL_PT_STATE_FUP,
63 	INTEL_PT_STATE_FUP_NO_TIP,
64 };
65 
66 #ifdef INTEL_PT_STRICT
67 #define INTEL_PT_STATE_ERR1	INTEL_PT_STATE_NO_PSB
68 #define INTEL_PT_STATE_ERR2	INTEL_PT_STATE_NO_PSB
69 #define INTEL_PT_STATE_ERR3	INTEL_PT_STATE_NO_PSB
70 #define INTEL_PT_STATE_ERR4	INTEL_PT_STATE_NO_PSB
71 #else
72 #define INTEL_PT_STATE_ERR1	(decoder->pkt_state)
73 #define INTEL_PT_STATE_ERR2	INTEL_PT_STATE_NO_IP
74 #define INTEL_PT_STATE_ERR3	INTEL_PT_STATE_ERR_RESYNC
75 #define INTEL_PT_STATE_ERR4	INTEL_PT_STATE_IN_SYNC
76 #endif
77 
78 struct intel_pt_decoder {
79 	int (*get_trace)(struct intel_pt_buffer *buffer, void *data);
80 	int (*walk_insn)(struct intel_pt_insn *intel_pt_insn,
81 			 uint64_t *insn_cnt_ptr, uint64_t *ip, uint64_t to_ip,
82 			 uint64_t max_insn_cnt, void *data);
83 	bool (*pgd_ip)(uint64_t ip, void *data);
84 	void *data;
85 	struct intel_pt_state state;
86 	const unsigned char *buf;
87 	size_t len;
88 	bool return_compression;
89 	bool mtc_insn;
90 	bool pge;
91 	bool have_tma;
92 	bool have_cyc;
93 	bool fixup_last_mtc;
94 	uint64_t pos;
95 	uint64_t last_ip;
96 	uint64_t ip;
97 	uint64_t cr3;
98 	uint64_t timestamp;
99 	uint64_t tsc_timestamp;
100 	uint64_t ref_timestamp;
101 	uint64_t ret_addr;
102 	uint64_t ctc_timestamp;
103 	uint64_t ctc_delta;
104 	uint64_t cycle_cnt;
105 	uint64_t cyc_ref_timestamp;
106 	uint32_t last_mtc;
107 	uint32_t tsc_ctc_ratio_n;
108 	uint32_t tsc_ctc_ratio_d;
109 	uint32_t tsc_ctc_mult;
110 	uint32_t tsc_slip;
111 	uint32_t ctc_rem_mask;
112 	int mtc_shift;
113 	struct intel_pt_stack stack;
114 	enum intel_pt_pkt_state pkt_state;
115 	struct intel_pt_pkt packet;
116 	struct intel_pt_pkt tnt;
117 	int pkt_step;
118 	int pkt_len;
119 	int last_packet_type;
120 	unsigned int cbr;
121 	unsigned int max_non_turbo_ratio;
122 	double max_non_turbo_ratio_fp;
123 	double cbr_cyc_to_tsc;
124 	double calc_cyc_to_tsc;
125 	bool have_calc_cyc_to_tsc;
126 	int exec_mode;
127 	unsigned int insn_bytes;
128 	uint64_t period;
129 	enum intel_pt_period_type period_type;
130 	uint64_t tot_insn_cnt;
131 	uint64_t period_insn_cnt;
132 	uint64_t period_mask;
133 	uint64_t period_ticks;
134 	uint64_t last_masked_timestamp;
135 	bool continuous_period;
136 	bool overflow;
137 	bool set_fup_tx_flags;
138 	unsigned int fup_tx_flags;
139 	unsigned int tx_flags;
140 	uint64_t timestamp_insn_cnt;
141 	uint64_t stuck_ip;
142 	int no_progress;
143 	int stuck_ip_prd;
144 	int stuck_ip_cnt;
145 	const unsigned char *next_buf;
146 	size_t next_len;
147 	unsigned char temp_buf[INTEL_PT_PKT_MAX_SZ];
148 };
149 
150 static uint64_t intel_pt_lower_power_of_2(uint64_t x)
151 {
152 	int i;
153 
154 	for (i = 0; x != 1; i++)
155 		x >>= 1;
156 
157 	return x << i;
158 }
159 
160 static void intel_pt_setup_period(struct intel_pt_decoder *decoder)
161 {
162 	if (decoder->period_type == INTEL_PT_PERIOD_TICKS) {
163 		uint64_t period;
164 
165 		period = intel_pt_lower_power_of_2(decoder->period);
166 		decoder->period_mask  = ~(period - 1);
167 		decoder->period_ticks = period;
168 	}
169 }
170 
171 static uint64_t multdiv(uint64_t t, uint32_t n, uint32_t d)
172 {
173 	if (!d)
174 		return 0;
175 	return (t / d) * n + ((t % d) * n) / d;
176 }
177 
178 struct intel_pt_decoder *intel_pt_decoder_new(struct intel_pt_params *params)
179 {
180 	struct intel_pt_decoder *decoder;
181 
182 	if (!params->get_trace || !params->walk_insn)
183 		return NULL;
184 
185 	decoder = zalloc(sizeof(struct intel_pt_decoder));
186 	if (!decoder)
187 		return NULL;
188 
189 	decoder->get_trace          = params->get_trace;
190 	decoder->walk_insn          = params->walk_insn;
191 	decoder->pgd_ip             = params->pgd_ip;
192 	decoder->data               = params->data;
193 	decoder->return_compression = params->return_compression;
194 
195 	decoder->period             = params->period;
196 	decoder->period_type        = params->period_type;
197 
198 	decoder->max_non_turbo_ratio    = params->max_non_turbo_ratio;
199 	decoder->max_non_turbo_ratio_fp = params->max_non_turbo_ratio;
200 
201 	intel_pt_setup_period(decoder);
202 
203 	decoder->mtc_shift = params->mtc_period;
204 	decoder->ctc_rem_mask = (1 << decoder->mtc_shift) - 1;
205 
206 	decoder->tsc_ctc_ratio_n = params->tsc_ctc_ratio_n;
207 	decoder->tsc_ctc_ratio_d = params->tsc_ctc_ratio_d;
208 
209 	if (!decoder->tsc_ctc_ratio_n)
210 		decoder->tsc_ctc_ratio_d = 0;
211 
212 	if (decoder->tsc_ctc_ratio_d) {
213 		if (!(decoder->tsc_ctc_ratio_n % decoder->tsc_ctc_ratio_d))
214 			decoder->tsc_ctc_mult = decoder->tsc_ctc_ratio_n /
215 						decoder->tsc_ctc_ratio_d;
216 
217 		/*
218 		 * Allow for timestamps appearing to backwards because a TSC
219 		 * packet has slipped past a MTC packet, so allow 2 MTC ticks
220 		 * or ...
221 		 */
222 		decoder->tsc_slip = multdiv(2 << decoder->mtc_shift,
223 					decoder->tsc_ctc_ratio_n,
224 					decoder->tsc_ctc_ratio_d);
225 	}
226 	/* ... or 0x100 paranoia */
227 	if (decoder->tsc_slip < 0x100)
228 		decoder->tsc_slip = 0x100;
229 
230 	intel_pt_log("timestamp: mtc_shift %u\n", decoder->mtc_shift);
231 	intel_pt_log("timestamp: tsc_ctc_ratio_n %u\n", decoder->tsc_ctc_ratio_n);
232 	intel_pt_log("timestamp: tsc_ctc_ratio_d %u\n", decoder->tsc_ctc_ratio_d);
233 	intel_pt_log("timestamp: tsc_ctc_mult %u\n", decoder->tsc_ctc_mult);
234 	intel_pt_log("timestamp: tsc_slip %#x\n", decoder->tsc_slip);
235 
236 	return decoder;
237 }
238 
239 static void intel_pt_pop_blk(struct intel_pt_stack *stack)
240 {
241 	struct intel_pt_blk *blk = stack->blk;
242 
243 	stack->blk = blk->prev;
244 	if (!stack->spare)
245 		stack->spare = blk;
246 	else
247 		free(blk);
248 }
249 
250 static uint64_t intel_pt_pop(struct intel_pt_stack *stack)
251 {
252 	if (!stack->pos) {
253 		if (!stack->blk)
254 			return 0;
255 		intel_pt_pop_blk(stack);
256 		if (!stack->blk)
257 			return 0;
258 		stack->pos = INTEL_PT_BLK_SIZE;
259 	}
260 	return stack->blk->ip[--stack->pos];
261 }
262 
263 static int intel_pt_alloc_blk(struct intel_pt_stack *stack)
264 {
265 	struct intel_pt_blk *blk;
266 
267 	if (stack->spare) {
268 		blk = stack->spare;
269 		stack->spare = NULL;
270 	} else {
271 		blk = malloc(sizeof(struct intel_pt_blk));
272 		if (!blk)
273 			return -ENOMEM;
274 	}
275 
276 	blk->prev = stack->blk;
277 	stack->blk = blk;
278 	stack->pos = 0;
279 	return 0;
280 }
281 
282 static int intel_pt_push(struct intel_pt_stack *stack, uint64_t ip)
283 {
284 	int err;
285 
286 	if (!stack->blk || stack->pos == INTEL_PT_BLK_SIZE) {
287 		err = intel_pt_alloc_blk(stack);
288 		if (err)
289 			return err;
290 	}
291 
292 	stack->blk->ip[stack->pos++] = ip;
293 	return 0;
294 }
295 
296 static void intel_pt_clear_stack(struct intel_pt_stack *stack)
297 {
298 	while (stack->blk)
299 		intel_pt_pop_blk(stack);
300 	stack->pos = 0;
301 }
302 
303 static void intel_pt_free_stack(struct intel_pt_stack *stack)
304 {
305 	intel_pt_clear_stack(stack);
306 	zfree(&stack->blk);
307 	zfree(&stack->spare);
308 }
309 
310 void intel_pt_decoder_free(struct intel_pt_decoder *decoder)
311 {
312 	intel_pt_free_stack(&decoder->stack);
313 	free(decoder);
314 }
315 
316 static int intel_pt_ext_err(int code)
317 {
318 	switch (code) {
319 	case -ENOMEM:
320 		return INTEL_PT_ERR_NOMEM;
321 	case -ENOSYS:
322 		return INTEL_PT_ERR_INTERN;
323 	case -EBADMSG:
324 		return INTEL_PT_ERR_BADPKT;
325 	case -ENODATA:
326 		return INTEL_PT_ERR_NODATA;
327 	case -EILSEQ:
328 		return INTEL_PT_ERR_NOINSN;
329 	case -ENOENT:
330 		return INTEL_PT_ERR_MISMAT;
331 	case -EOVERFLOW:
332 		return INTEL_PT_ERR_OVR;
333 	case -ENOSPC:
334 		return INTEL_PT_ERR_LOST;
335 	case -ELOOP:
336 		return INTEL_PT_ERR_NELOOP;
337 	default:
338 		return INTEL_PT_ERR_UNK;
339 	}
340 }
341 
342 static const char *intel_pt_err_msgs[] = {
343 	[INTEL_PT_ERR_NOMEM]  = "Memory allocation failed",
344 	[INTEL_PT_ERR_INTERN] = "Internal error",
345 	[INTEL_PT_ERR_BADPKT] = "Bad packet",
346 	[INTEL_PT_ERR_NODATA] = "No more data",
347 	[INTEL_PT_ERR_NOINSN] = "Failed to get instruction",
348 	[INTEL_PT_ERR_MISMAT] = "Trace doesn't match instruction",
349 	[INTEL_PT_ERR_OVR]    = "Overflow packet",
350 	[INTEL_PT_ERR_LOST]   = "Lost trace data",
351 	[INTEL_PT_ERR_UNK]    = "Unknown error!",
352 	[INTEL_PT_ERR_NELOOP] = "Never-ending loop",
353 };
354 
355 int intel_pt__strerror(int code, char *buf, size_t buflen)
356 {
357 	if (code < 1 || code >= INTEL_PT_ERR_MAX)
358 		code = INTEL_PT_ERR_UNK;
359 	strlcpy(buf, intel_pt_err_msgs[code], buflen);
360 	return 0;
361 }
362 
363 static uint64_t intel_pt_calc_ip(const struct intel_pt_pkt *packet,
364 				 uint64_t last_ip)
365 {
366 	uint64_t ip;
367 
368 	switch (packet->count) {
369 	case 1:
370 		ip = (last_ip & (uint64_t)0xffffffffffff0000ULL) |
371 		     packet->payload;
372 		break;
373 	case 2:
374 		ip = (last_ip & (uint64_t)0xffffffff00000000ULL) |
375 		     packet->payload;
376 		break;
377 	case 3:
378 		ip = packet->payload;
379 		/* Sign-extend 6-byte ip */
380 		if (ip & (uint64_t)0x800000000000ULL)
381 			ip |= (uint64_t)0xffff000000000000ULL;
382 		break;
383 	case 4:
384 		ip = (last_ip & (uint64_t)0xffff000000000000ULL) |
385 		     packet->payload;
386 		break;
387 	case 6:
388 		ip = packet->payload;
389 		break;
390 	default:
391 		return 0;
392 	}
393 
394 	return ip;
395 }
396 
397 static inline void intel_pt_set_last_ip(struct intel_pt_decoder *decoder)
398 {
399 	decoder->last_ip = intel_pt_calc_ip(&decoder->packet, decoder->last_ip);
400 }
401 
402 static inline void intel_pt_set_ip(struct intel_pt_decoder *decoder)
403 {
404 	intel_pt_set_last_ip(decoder);
405 	decoder->ip = decoder->last_ip;
406 }
407 
408 static void intel_pt_decoder_log_packet(struct intel_pt_decoder *decoder)
409 {
410 	intel_pt_log_packet(&decoder->packet, decoder->pkt_len, decoder->pos,
411 			    decoder->buf);
412 }
413 
414 static int intel_pt_bug(struct intel_pt_decoder *decoder)
415 {
416 	intel_pt_log("ERROR: Internal error\n");
417 	decoder->pkt_state = INTEL_PT_STATE_NO_PSB;
418 	return -ENOSYS;
419 }
420 
421 static inline void intel_pt_clear_tx_flags(struct intel_pt_decoder *decoder)
422 {
423 	decoder->tx_flags = 0;
424 }
425 
426 static inline void intel_pt_update_in_tx(struct intel_pt_decoder *decoder)
427 {
428 	decoder->tx_flags = decoder->packet.payload & INTEL_PT_IN_TX;
429 }
430 
431 static int intel_pt_bad_packet(struct intel_pt_decoder *decoder)
432 {
433 	intel_pt_clear_tx_flags(decoder);
434 	decoder->have_tma = false;
435 	decoder->pkt_len = 1;
436 	decoder->pkt_step = 1;
437 	intel_pt_decoder_log_packet(decoder);
438 	if (decoder->pkt_state != INTEL_PT_STATE_NO_PSB) {
439 		intel_pt_log("ERROR: Bad packet\n");
440 		decoder->pkt_state = INTEL_PT_STATE_ERR1;
441 	}
442 	return -EBADMSG;
443 }
444 
445 static int intel_pt_get_data(struct intel_pt_decoder *decoder)
446 {
447 	struct intel_pt_buffer buffer = { .buf = 0, };
448 	int ret;
449 
450 	decoder->pkt_step = 0;
451 
452 	intel_pt_log("Getting more data\n");
453 	ret = decoder->get_trace(&buffer, decoder->data);
454 	if (ret)
455 		return ret;
456 	decoder->buf = buffer.buf;
457 	decoder->len = buffer.len;
458 	if (!decoder->len) {
459 		intel_pt_log("No more data\n");
460 		return -ENODATA;
461 	}
462 	if (!buffer.consecutive) {
463 		decoder->ip = 0;
464 		decoder->pkt_state = INTEL_PT_STATE_NO_PSB;
465 		decoder->ref_timestamp = buffer.ref_timestamp;
466 		decoder->timestamp = 0;
467 		decoder->have_tma = false;
468 		decoder->state.trace_nr = buffer.trace_nr;
469 		intel_pt_log("Reference timestamp 0x%" PRIx64 "\n",
470 			     decoder->ref_timestamp);
471 		return -ENOLINK;
472 	}
473 
474 	return 0;
475 }
476 
477 static int intel_pt_get_next_data(struct intel_pt_decoder *decoder)
478 {
479 	if (!decoder->next_buf)
480 		return intel_pt_get_data(decoder);
481 
482 	decoder->buf = decoder->next_buf;
483 	decoder->len = decoder->next_len;
484 	decoder->next_buf = 0;
485 	decoder->next_len = 0;
486 	return 0;
487 }
488 
489 static int intel_pt_get_split_packet(struct intel_pt_decoder *decoder)
490 {
491 	unsigned char *buf = decoder->temp_buf;
492 	size_t old_len, len, n;
493 	int ret;
494 
495 	old_len = decoder->len;
496 	len = decoder->len;
497 	memcpy(buf, decoder->buf, len);
498 
499 	ret = intel_pt_get_data(decoder);
500 	if (ret) {
501 		decoder->pos += old_len;
502 		return ret < 0 ? ret : -EINVAL;
503 	}
504 
505 	n = INTEL_PT_PKT_MAX_SZ - len;
506 	if (n > decoder->len)
507 		n = decoder->len;
508 	memcpy(buf + len, decoder->buf, n);
509 	len += n;
510 
511 	ret = intel_pt_get_packet(buf, len, &decoder->packet);
512 	if (ret < (int)old_len) {
513 		decoder->next_buf = decoder->buf;
514 		decoder->next_len = decoder->len;
515 		decoder->buf = buf;
516 		decoder->len = old_len;
517 		return intel_pt_bad_packet(decoder);
518 	}
519 
520 	decoder->next_buf = decoder->buf + (ret - old_len);
521 	decoder->next_len = decoder->len - (ret - old_len);
522 
523 	decoder->buf = buf;
524 	decoder->len = ret;
525 
526 	return ret;
527 }
528 
529 struct intel_pt_pkt_info {
530 	struct intel_pt_decoder	  *decoder;
531 	struct intel_pt_pkt       packet;
532 	uint64_t                  pos;
533 	int                       pkt_len;
534 	int                       last_packet_type;
535 	void                      *data;
536 };
537 
538 typedef int (*intel_pt_pkt_cb_t)(struct intel_pt_pkt_info *pkt_info);
539 
540 /* Lookahead packets in current buffer */
541 static int intel_pt_pkt_lookahead(struct intel_pt_decoder *decoder,
542 				  intel_pt_pkt_cb_t cb, void *data)
543 {
544 	struct intel_pt_pkt_info pkt_info;
545 	const unsigned char *buf = decoder->buf;
546 	size_t len = decoder->len;
547 	int ret;
548 
549 	pkt_info.decoder          = decoder;
550 	pkt_info.pos              = decoder->pos;
551 	pkt_info.pkt_len          = decoder->pkt_step;
552 	pkt_info.last_packet_type = decoder->last_packet_type;
553 	pkt_info.data             = data;
554 
555 	while (1) {
556 		do {
557 			pkt_info.pos += pkt_info.pkt_len;
558 			buf          += pkt_info.pkt_len;
559 			len          -= pkt_info.pkt_len;
560 
561 			if (!len)
562 				return INTEL_PT_NEED_MORE_BYTES;
563 
564 			ret = intel_pt_get_packet(buf, len, &pkt_info.packet);
565 			if (!ret)
566 				return INTEL_PT_NEED_MORE_BYTES;
567 			if (ret < 0)
568 				return ret;
569 
570 			pkt_info.pkt_len = ret;
571 		} while (pkt_info.packet.type == INTEL_PT_PAD);
572 
573 		ret = cb(&pkt_info);
574 		if (ret)
575 			return 0;
576 
577 		pkt_info.last_packet_type = pkt_info.packet.type;
578 	}
579 }
580 
581 struct intel_pt_calc_cyc_to_tsc_info {
582 	uint64_t        cycle_cnt;
583 	unsigned int    cbr;
584 	uint32_t        last_mtc;
585 	uint64_t        ctc_timestamp;
586 	uint64_t        ctc_delta;
587 	uint64_t        tsc_timestamp;
588 	uint64_t        timestamp;
589 	bool            have_tma;
590 	bool            fixup_last_mtc;
591 	bool            from_mtc;
592 	double          cbr_cyc_to_tsc;
593 };
594 
595 /*
596  * MTC provides a 8-bit slice of CTC but the TMA packet only provides the lower
597  * 16 bits of CTC. If mtc_shift > 8 then some of the MTC bits are not in the CTC
598  * provided by the TMA packet. Fix-up the last_mtc calculated from the TMA
599  * packet by copying the missing bits from the current MTC assuming the least
600  * difference between the two, and that the current MTC comes after last_mtc.
601  */
602 static void intel_pt_fixup_last_mtc(uint32_t mtc, int mtc_shift,
603 				    uint32_t *last_mtc)
604 {
605 	uint32_t first_missing_bit = 1U << (16 - mtc_shift);
606 	uint32_t mask = ~(first_missing_bit - 1);
607 
608 	*last_mtc |= mtc & mask;
609 	if (*last_mtc >= mtc) {
610 		*last_mtc -= first_missing_bit;
611 		*last_mtc &= 0xff;
612 	}
613 }
614 
615 static int intel_pt_calc_cyc_cb(struct intel_pt_pkt_info *pkt_info)
616 {
617 	struct intel_pt_decoder *decoder = pkt_info->decoder;
618 	struct intel_pt_calc_cyc_to_tsc_info *data = pkt_info->data;
619 	uint64_t timestamp;
620 	double cyc_to_tsc;
621 	unsigned int cbr;
622 	uint32_t mtc, mtc_delta, ctc, fc, ctc_rem;
623 
624 	switch (pkt_info->packet.type) {
625 	case INTEL_PT_TNT:
626 	case INTEL_PT_TIP_PGE:
627 	case INTEL_PT_TIP:
628 	case INTEL_PT_FUP:
629 	case INTEL_PT_PSB:
630 	case INTEL_PT_PIP:
631 	case INTEL_PT_MODE_EXEC:
632 	case INTEL_PT_MODE_TSX:
633 	case INTEL_PT_PSBEND:
634 	case INTEL_PT_PAD:
635 	case INTEL_PT_VMCS:
636 	case INTEL_PT_MNT:
637 		return 0;
638 
639 	case INTEL_PT_MTC:
640 		if (!data->have_tma)
641 			return 0;
642 
643 		mtc = pkt_info->packet.payload;
644 		if (decoder->mtc_shift > 8 && data->fixup_last_mtc) {
645 			data->fixup_last_mtc = false;
646 			intel_pt_fixup_last_mtc(mtc, decoder->mtc_shift,
647 						&data->last_mtc);
648 		}
649 		if (mtc > data->last_mtc)
650 			mtc_delta = mtc - data->last_mtc;
651 		else
652 			mtc_delta = mtc + 256 - data->last_mtc;
653 		data->ctc_delta += mtc_delta << decoder->mtc_shift;
654 		data->last_mtc = mtc;
655 
656 		if (decoder->tsc_ctc_mult) {
657 			timestamp = data->ctc_timestamp +
658 				data->ctc_delta * decoder->tsc_ctc_mult;
659 		} else {
660 			timestamp = data->ctc_timestamp +
661 				multdiv(data->ctc_delta,
662 					decoder->tsc_ctc_ratio_n,
663 					decoder->tsc_ctc_ratio_d);
664 		}
665 
666 		if (timestamp < data->timestamp)
667 			return 1;
668 
669 		if (pkt_info->last_packet_type != INTEL_PT_CYC) {
670 			data->timestamp = timestamp;
671 			return 0;
672 		}
673 
674 		break;
675 
676 	case INTEL_PT_TSC:
677 		timestamp = pkt_info->packet.payload |
678 			    (data->timestamp & (0xffULL << 56));
679 		if (data->from_mtc && timestamp < data->timestamp &&
680 		    data->timestamp - timestamp < decoder->tsc_slip)
681 			return 1;
682 		if (timestamp < data->timestamp)
683 			timestamp += (1ULL << 56);
684 		if (pkt_info->last_packet_type != INTEL_PT_CYC) {
685 			if (data->from_mtc)
686 				return 1;
687 			data->tsc_timestamp = timestamp;
688 			data->timestamp = timestamp;
689 			return 0;
690 		}
691 		break;
692 
693 	case INTEL_PT_TMA:
694 		if (data->from_mtc)
695 			return 1;
696 
697 		if (!decoder->tsc_ctc_ratio_d)
698 			return 0;
699 
700 		ctc = pkt_info->packet.payload;
701 		fc = pkt_info->packet.count;
702 		ctc_rem = ctc & decoder->ctc_rem_mask;
703 
704 		data->last_mtc = (ctc >> decoder->mtc_shift) & 0xff;
705 
706 		data->ctc_timestamp = data->tsc_timestamp - fc;
707 		if (decoder->tsc_ctc_mult) {
708 			data->ctc_timestamp -= ctc_rem * decoder->tsc_ctc_mult;
709 		} else {
710 			data->ctc_timestamp -=
711 				multdiv(ctc_rem, decoder->tsc_ctc_ratio_n,
712 					decoder->tsc_ctc_ratio_d);
713 		}
714 
715 		data->ctc_delta = 0;
716 		data->have_tma = true;
717 		data->fixup_last_mtc = true;
718 
719 		return 0;
720 
721 	case INTEL_PT_CYC:
722 		data->cycle_cnt += pkt_info->packet.payload;
723 		return 0;
724 
725 	case INTEL_PT_CBR:
726 		cbr = pkt_info->packet.payload;
727 		if (data->cbr && data->cbr != cbr)
728 			return 1;
729 		data->cbr = cbr;
730 		data->cbr_cyc_to_tsc = decoder->max_non_turbo_ratio_fp / cbr;
731 		return 0;
732 
733 	case INTEL_PT_TIP_PGD:
734 	case INTEL_PT_TRACESTOP:
735 	case INTEL_PT_OVF:
736 	case INTEL_PT_BAD: /* Does not happen */
737 	default:
738 		return 1;
739 	}
740 
741 	if (!data->cbr && decoder->cbr) {
742 		data->cbr = decoder->cbr;
743 		data->cbr_cyc_to_tsc = decoder->cbr_cyc_to_tsc;
744 	}
745 
746 	if (!data->cycle_cnt)
747 		return 1;
748 
749 	cyc_to_tsc = (double)(timestamp - decoder->timestamp) / data->cycle_cnt;
750 
751 	if (data->cbr && cyc_to_tsc > data->cbr_cyc_to_tsc &&
752 	    cyc_to_tsc / data->cbr_cyc_to_tsc > 1.25) {
753 		intel_pt_log("Timestamp: calculated %g TSC ticks per cycle too big (c.f. CBR-based value %g), pos " x64_fmt "\n",
754 			     cyc_to_tsc, data->cbr_cyc_to_tsc, pkt_info->pos);
755 		return 1;
756 	}
757 
758 	decoder->calc_cyc_to_tsc = cyc_to_tsc;
759 	decoder->have_calc_cyc_to_tsc = true;
760 
761 	if (data->cbr) {
762 		intel_pt_log("Timestamp: calculated %g TSC ticks per cycle c.f. CBR-based value %g, pos " x64_fmt "\n",
763 			     cyc_to_tsc, data->cbr_cyc_to_tsc, pkt_info->pos);
764 	} else {
765 		intel_pt_log("Timestamp: calculated %g TSC ticks per cycle c.f. unknown CBR-based value, pos " x64_fmt "\n",
766 			     cyc_to_tsc, pkt_info->pos);
767 	}
768 
769 	return 1;
770 }
771 
772 static void intel_pt_calc_cyc_to_tsc(struct intel_pt_decoder *decoder,
773 				     bool from_mtc)
774 {
775 	struct intel_pt_calc_cyc_to_tsc_info data = {
776 		.cycle_cnt      = 0,
777 		.cbr            = 0,
778 		.last_mtc       = decoder->last_mtc,
779 		.ctc_timestamp  = decoder->ctc_timestamp,
780 		.ctc_delta      = decoder->ctc_delta,
781 		.tsc_timestamp  = decoder->tsc_timestamp,
782 		.timestamp      = decoder->timestamp,
783 		.have_tma       = decoder->have_tma,
784 		.fixup_last_mtc = decoder->fixup_last_mtc,
785 		.from_mtc       = from_mtc,
786 		.cbr_cyc_to_tsc = 0,
787 	};
788 
789 	intel_pt_pkt_lookahead(decoder, intel_pt_calc_cyc_cb, &data);
790 }
791 
792 static int intel_pt_get_next_packet(struct intel_pt_decoder *decoder)
793 {
794 	int ret;
795 
796 	decoder->last_packet_type = decoder->packet.type;
797 
798 	do {
799 		decoder->pos += decoder->pkt_step;
800 		decoder->buf += decoder->pkt_step;
801 		decoder->len -= decoder->pkt_step;
802 
803 		if (!decoder->len) {
804 			ret = intel_pt_get_next_data(decoder);
805 			if (ret)
806 				return ret;
807 		}
808 
809 		ret = intel_pt_get_packet(decoder->buf, decoder->len,
810 					  &decoder->packet);
811 		if (ret == INTEL_PT_NEED_MORE_BYTES &&
812 		    decoder->len < INTEL_PT_PKT_MAX_SZ && !decoder->next_buf) {
813 			ret = intel_pt_get_split_packet(decoder);
814 			if (ret < 0)
815 				return ret;
816 		}
817 		if (ret <= 0)
818 			return intel_pt_bad_packet(decoder);
819 
820 		decoder->pkt_len = ret;
821 		decoder->pkt_step = ret;
822 		intel_pt_decoder_log_packet(decoder);
823 	} while (decoder->packet.type == INTEL_PT_PAD);
824 
825 	return 0;
826 }
827 
828 static uint64_t intel_pt_next_period(struct intel_pt_decoder *decoder)
829 {
830 	uint64_t timestamp, masked_timestamp;
831 
832 	timestamp = decoder->timestamp + decoder->timestamp_insn_cnt;
833 	masked_timestamp = timestamp & decoder->period_mask;
834 	if (decoder->continuous_period) {
835 		if (masked_timestamp != decoder->last_masked_timestamp)
836 			return 1;
837 	} else {
838 		timestamp += 1;
839 		masked_timestamp = timestamp & decoder->period_mask;
840 		if (masked_timestamp != decoder->last_masked_timestamp) {
841 			decoder->last_masked_timestamp = masked_timestamp;
842 			decoder->continuous_period = true;
843 		}
844 	}
845 	return decoder->period_ticks - (timestamp - masked_timestamp);
846 }
847 
848 static uint64_t intel_pt_next_sample(struct intel_pt_decoder *decoder)
849 {
850 	switch (decoder->period_type) {
851 	case INTEL_PT_PERIOD_INSTRUCTIONS:
852 		return decoder->period - decoder->period_insn_cnt;
853 	case INTEL_PT_PERIOD_TICKS:
854 		return intel_pt_next_period(decoder);
855 	case INTEL_PT_PERIOD_NONE:
856 	case INTEL_PT_PERIOD_MTC:
857 	default:
858 		return 0;
859 	}
860 }
861 
862 static void intel_pt_sample_insn(struct intel_pt_decoder *decoder)
863 {
864 	uint64_t timestamp, masked_timestamp;
865 
866 	switch (decoder->period_type) {
867 	case INTEL_PT_PERIOD_INSTRUCTIONS:
868 		decoder->period_insn_cnt = 0;
869 		break;
870 	case INTEL_PT_PERIOD_TICKS:
871 		timestamp = decoder->timestamp + decoder->timestamp_insn_cnt;
872 		masked_timestamp = timestamp & decoder->period_mask;
873 		decoder->last_masked_timestamp = masked_timestamp;
874 		break;
875 	case INTEL_PT_PERIOD_NONE:
876 	case INTEL_PT_PERIOD_MTC:
877 	default:
878 		break;
879 	}
880 
881 	decoder->state.type |= INTEL_PT_INSTRUCTION;
882 }
883 
884 static int intel_pt_walk_insn(struct intel_pt_decoder *decoder,
885 			      struct intel_pt_insn *intel_pt_insn, uint64_t ip)
886 {
887 	uint64_t max_insn_cnt, insn_cnt = 0;
888 	int err;
889 
890 	if (!decoder->mtc_insn)
891 		decoder->mtc_insn = true;
892 
893 	max_insn_cnt = intel_pt_next_sample(decoder);
894 
895 	err = decoder->walk_insn(intel_pt_insn, &insn_cnt, &decoder->ip, ip,
896 				 max_insn_cnt, decoder->data);
897 
898 	decoder->tot_insn_cnt += insn_cnt;
899 	decoder->timestamp_insn_cnt += insn_cnt;
900 	decoder->period_insn_cnt += insn_cnt;
901 
902 	if (err) {
903 		decoder->no_progress = 0;
904 		decoder->pkt_state = INTEL_PT_STATE_ERR2;
905 		intel_pt_log_at("ERROR: Failed to get instruction",
906 				decoder->ip);
907 		if (err == -ENOENT)
908 			return -ENOLINK;
909 		return -EILSEQ;
910 	}
911 
912 	if (ip && decoder->ip == ip) {
913 		err = -EAGAIN;
914 		goto out;
915 	}
916 
917 	if (max_insn_cnt && insn_cnt >= max_insn_cnt)
918 		intel_pt_sample_insn(decoder);
919 
920 	if (intel_pt_insn->branch == INTEL_PT_BR_NO_BRANCH) {
921 		decoder->state.type = INTEL_PT_INSTRUCTION;
922 		decoder->state.from_ip = decoder->ip;
923 		decoder->state.to_ip = 0;
924 		decoder->ip += intel_pt_insn->length;
925 		err = INTEL_PT_RETURN;
926 		goto out;
927 	}
928 
929 	if (intel_pt_insn->op == INTEL_PT_OP_CALL) {
930 		/* Zero-length calls are excluded */
931 		if (intel_pt_insn->branch != INTEL_PT_BR_UNCONDITIONAL ||
932 		    intel_pt_insn->rel) {
933 			err = intel_pt_push(&decoder->stack, decoder->ip +
934 					    intel_pt_insn->length);
935 			if (err)
936 				goto out;
937 		}
938 	} else if (intel_pt_insn->op == INTEL_PT_OP_RET) {
939 		decoder->ret_addr = intel_pt_pop(&decoder->stack);
940 	}
941 
942 	if (intel_pt_insn->branch == INTEL_PT_BR_UNCONDITIONAL) {
943 		int cnt = decoder->no_progress++;
944 
945 		decoder->state.from_ip = decoder->ip;
946 		decoder->ip += intel_pt_insn->length +
947 				intel_pt_insn->rel;
948 		decoder->state.to_ip = decoder->ip;
949 		err = INTEL_PT_RETURN;
950 
951 		/*
952 		 * Check for being stuck in a loop.  This can happen if a
953 		 * decoder error results in the decoder erroneously setting the
954 		 * ip to an address that is itself in an infinite loop that
955 		 * consumes no packets.  When that happens, there must be an
956 		 * unconditional branch.
957 		 */
958 		if (cnt) {
959 			if (cnt == 1) {
960 				decoder->stuck_ip = decoder->state.to_ip;
961 				decoder->stuck_ip_prd = 1;
962 				decoder->stuck_ip_cnt = 1;
963 			} else if (cnt > INTEL_PT_MAX_LOOPS ||
964 				   decoder->state.to_ip == decoder->stuck_ip) {
965 				intel_pt_log_at("ERROR: Never-ending loop",
966 						decoder->state.to_ip);
967 				decoder->pkt_state = INTEL_PT_STATE_ERR_RESYNC;
968 				err = -ELOOP;
969 				goto out;
970 			} else if (!--decoder->stuck_ip_cnt) {
971 				decoder->stuck_ip_prd += 1;
972 				decoder->stuck_ip_cnt = decoder->stuck_ip_prd;
973 				decoder->stuck_ip = decoder->state.to_ip;
974 			}
975 		}
976 		goto out_no_progress;
977 	}
978 out:
979 	decoder->no_progress = 0;
980 out_no_progress:
981 	decoder->state.insn_op = intel_pt_insn->op;
982 	decoder->state.insn_len = intel_pt_insn->length;
983 	memcpy(decoder->state.insn, intel_pt_insn->buf,
984 	       INTEL_PT_INSN_BUF_SZ);
985 
986 	if (decoder->tx_flags & INTEL_PT_IN_TX)
987 		decoder->state.flags |= INTEL_PT_IN_TX;
988 
989 	return err;
990 }
991 
992 static int intel_pt_walk_fup(struct intel_pt_decoder *decoder)
993 {
994 	struct intel_pt_insn intel_pt_insn;
995 	uint64_t ip;
996 	int err;
997 
998 	ip = decoder->last_ip;
999 
1000 	while (1) {
1001 		err = intel_pt_walk_insn(decoder, &intel_pt_insn, ip);
1002 		if (err == INTEL_PT_RETURN)
1003 			return 0;
1004 		if (err == -EAGAIN) {
1005 			if (decoder->set_fup_tx_flags) {
1006 				decoder->set_fup_tx_flags = false;
1007 				decoder->tx_flags = decoder->fup_tx_flags;
1008 				decoder->state.type = INTEL_PT_TRANSACTION;
1009 				decoder->state.from_ip = decoder->ip;
1010 				decoder->state.to_ip = 0;
1011 				decoder->state.flags = decoder->fup_tx_flags;
1012 				return 0;
1013 			}
1014 			return err;
1015 		}
1016 		decoder->set_fup_tx_flags = false;
1017 		if (err)
1018 			return err;
1019 
1020 		if (intel_pt_insn.branch == INTEL_PT_BR_INDIRECT) {
1021 			intel_pt_log_at("ERROR: Unexpected indirect branch",
1022 					decoder->ip);
1023 			decoder->pkt_state = INTEL_PT_STATE_ERR_RESYNC;
1024 			return -ENOENT;
1025 		}
1026 
1027 		if (intel_pt_insn.branch == INTEL_PT_BR_CONDITIONAL) {
1028 			intel_pt_log_at("ERROR: Unexpected conditional branch",
1029 					decoder->ip);
1030 			decoder->pkt_state = INTEL_PT_STATE_ERR_RESYNC;
1031 			return -ENOENT;
1032 		}
1033 
1034 		intel_pt_bug(decoder);
1035 	}
1036 }
1037 
1038 static int intel_pt_walk_tip(struct intel_pt_decoder *decoder)
1039 {
1040 	struct intel_pt_insn intel_pt_insn;
1041 	int err;
1042 
1043 	err = intel_pt_walk_insn(decoder, &intel_pt_insn, 0);
1044 	if (err == INTEL_PT_RETURN &&
1045 	    decoder->pgd_ip &&
1046 	    decoder->pkt_state == INTEL_PT_STATE_TIP_PGD &&
1047 	    (decoder->state.type & INTEL_PT_BRANCH) &&
1048 	    decoder->pgd_ip(decoder->state.to_ip, decoder->data)) {
1049 		/* Unconditional branch leaving filter region */
1050 		decoder->no_progress = 0;
1051 		decoder->pge = false;
1052 		decoder->continuous_period = false;
1053 		decoder->pkt_state = INTEL_PT_STATE_IN_SYNC;
1054 		decoder->state.to_ip = 0;
1055 		return 0;
1056 	}
1057 	if (err == INTEL_PT_RETURN)
1058 		return 0;
1059 	if (err)
1060 		return err;
1061 
1062 	if (intel_pt_insn.branch == INTEL_PT_BR_INDIRECT) {
1063 		if (decoder->pkt_state == INTEL_PT_STATE_TIP_PGD) {
1064 			decoder->pge = false;
1065 			decoder->continuous_period = false;
1066 			decoder->pkt_state = INTEL_PT_STATE_IN_SYNC;
1067 			decoder->state.from_ip = decoder->ip;
1068 			decoder->state.to_ip = 0;
1069 			if (decoder->packet.count != 0)
1070 				decoder->ip = decoder->last_ip;
1071 		} else {
1072 			decoder->pkt_state = INTEL_PT_STATE_IN_SYNC;
1073 			decoder->state.from_ip = decoder->ip;
1074 			if (decoder->packet.count == 0) {
1075 				decoder->state.to_ip = 0;
1076 			} else {
1077 				decoder->state.to_ip = decoder->last_ip;
1078 				decoder->ip = decoder->last_ip;
1079 			}
1080 		}
1081 		return 0;
1082 	}
1083 
1084 	if (intel_pt_insn.branch == INTEL_PT_BR_CONDITIONAL) {
1085 		uint64_t to_ip = decoder->ip + intel_pt_insn.length +
1086 				 intel_pt_insn.rel;
1087 
1088 		if (decoder->pgd_ip &&
1089 		    decoder->pkt_state == INTEL_PT_STATE_TIP_PGD &&
1090 		    decoder->pgd_ip(to_ip, decoder->data)) {
1091 			/* Conditional branch leaving filter region */
1092 			decoder->pge = false;
1093 			decoder->continuous_period = false;
1094 			decoder->pkt_state = INTEL_PT_STATE_IN_SYNC;
1095 			decoder->ip = to_ip;
1096 			decoder->state.from_ip = decoder->ip;
1097 			decoder->state.to_ip = 0;
1098 			return 0;
1099 		}
1100 		intel_pt_log_at("ERROR: Conditional branch when expecting indirect branch",
1101 				decoder->ip);
1102 		decoder->pkt_state = INTEL_PT_STATE_ERR_RESYNC;
1103 		return -ENOENT;
1104 	}
1105 
1106 	return intel_pt_bug(decoder);
1107 }
1108 
1109 static int intel_pt_walk_tnt(struct intel_pt_decoder *decoder)
1110 {
1111 	struct intel_pt_insn intel_pt_insn;
1112 	int err;
1113 
1114 	while (1) {
1115 		err = intel_pt_walk_insn(decoder, &intel_pt_insn, 0);
1116 		if (err == INTEL_PT_RETURN)
1117 			return 0;
1118 		if (err)
1119 			return err;
1120 
1121 		if (intel_pt_insn.op == INTEL_PT_OP_RET) {
1122 			if (!decoder->return_compression) {
1123 				intel_pt_log_at("ERROR: RET when expecting conditional branch",
1124 						decoder->ip);
1125 				decoder->pkt_state = INTEL_PT_STATE_ERR3;
1126 				return -ENOENT;
1127 			}
1128 			if (!decoder->ret_addr) {
1129 				intel_pt_log_at("ERROR: Bad RET compression (stack empty)",
1130 						decoder->ip);
1131 				decoder->pkt_state = INTEL_PT_STATE_ERR3;
1132 				return -ENOENT;
1133 			}
1134 			if (!(decoder->tnt.payload & BIT63)) {
1135 				intel_pt_log_at("ERROR: Bad RET compression (TNT=N)",
1136 						decoder->ip);
1137 				decoder->pkt_state = INTEL_PT_STATE_ERR3;
1138 				return -ENOENT;
1139 			}
1140 			decoder->tnt.count -= 1;
1141 			if (!decoder->tnt.count)
1142 				decoder->pkt_state = INTEL_PT_STATE_IN_SYNC;
1143 			decoder->tnt.payload <<= 1;
1144 			decoder->state.from_ip = decoder->ip;
1145 			decoder->ip = decoder->ret_addr;
1146 			decoder->state.to_ip = decoder->ip;
1147 			return 0;
1148 		}
1149 
1150 		if (intel_pt_insn.branch == INTEL_PT_BR_INDIRECT) {
1151 			/* Handle deferred TIPs */
1152 			err = intel_pt_get_next_packet(decoder);
1153 			if (err)
1154 				return err;
1155 			if (decoder->packet.type != INTEL_PT_TIP ||
1156 			    decoder->packet.count == 0) {
1157 				intel_pt_log_at("ERROR: Missing deferred TIP for indirect branch",
1158 						decoder->ip);
1159 				decoder->pkt_state = INTEL_PT_STATE_ERR3;
1160 				decoder->pkt_step = 0;
1161 				return -ENOENT;
1162 			}
1163 			intel_pt_set_last_ip(decoder);
1164 			decoder->state.from_ip = decoder->ip;
1165 			decoder->state.to_ip = decoder->last_ip;
1166 			decoder->ip = decoder->last_ip;
1167 			return 0;
1168 		}
1169 
1170 		if (intel_pt_insn.branch == INTEL_PT_BR_CONDITIONAL) {
1171 			decoder->tnt.count -= 1;
1172 			if (!decoder->tnt.count)
1173 				decoder->pkt_state = INTEL_PT_STATE_IN_SYNC;
1174 			if (decoder->tnt.payload & BIT63) {
1175 				decoder->tnt.payload <<= 1;
1176 				decoder->state.from_ip = decoder->ip;
1177 				decoder->ip += intel_pt_insn.length +
1178 					       intel_pt_insn.rel;
1179 				decoder->state.to_ip = decoder->ip;
1180 				return 0;
1181 			}
1182 			/* Instruction sample for a non-taken branch */
1183 			if (decoder->state.type & INTEL_PT_INSTRUCTION) {
1184 				decoder->tnt.payload <<= 1;
1185 				decoder->state.type = INTEL_PT_INSTRUCTION;
1186 				decoder->state.from_ip = decoder->ip;
1187 				decoder->state.to_ip = 0;
1188 				decoder->ip += intel_pt_insn.length;
1189 				return 0;
1190 			}
1191 			decoder->ip += intel_pt_insn.length;
1192 			if (!decoder->tnt.count)
1193 				return -EAGAIN;
1194 			decoder->tnt.payload <<= 1;
1195 			continue;
1196 		}
1197 
1198 		return intel_pt_bug(decoder);
1199 	}
1200 }
1201 
1202 static int intel_pt_mode_tsx(struct intel_pt_decoder *decoder, bool *no_tip)
1203 {
1204 	unsigned int fup_tx_flags;
1205 	int err;
1206 
1207 	fup_tx_flags = decoder->packet.payload &
1208 		       (INTEL_PT_IN_TX | INTEL_PT_ABORT_TX);
1209 	err = intel_pt_get_next_packet(decoder);
1210 	if (err)
1211 		return err;
1212 	if (decoder->packet.type == INTEL_PT_FUP) {
1213 		decoder->fup_tx_flags = fup_tx_flags;
1214 		decoder->set_fup_tx_flags = true;
1215 		if (!(decoder->fup_tx_flags & INTEL_PT_ABORT_TX))
1216 			*no_tip = true;
1217 	} else {
1218 		intel_pt_log_at("ERROR: Missing FUP after MODE.TSX",
1219 				decoder->pos);
1220 		intel_pt_update_in_tx(decoder);
1221 	}
1222 	return 0;
1223 }
1224 
1225 static void intel_pt_calc_tsc_timestamp(struct intel_pt_decoder *decoder)
1226 {
1227 	uint64_t timestamp;
1228 
1229 	decoder->have_tma = false;
1230 
1231 	if (decoder->ref_timestamp) {
1232 		timestamp = decoder->packet.payload |
1233 			    (decoder->ref_timestamp & (0xffULL << 56));
1234 		if (timestamp < decoder->ref_timestamp) {
1235 			if (decoder->ref_timestamp - timestamp > (1ULL << 55))
1236 				timestamp += (1ULL << 56);
1237 		} else {
1238 			if (timestamp - decoder->ref_timestamp > (1ULL << 55))
1239 				timestamp -= (1ULL << 56);
1240 		}
1241 		decoder->tsc_timestamp = timestamp;
1242 		decoder->timestamp = timestamp;
1243 		decoder->ref_timestamp = 0;
1244 		decoder->timestamp_insn_cnt = 0;
1245 	} else if (decoder->timestamp) {
1246 		timestamp = decoder->packet.payload |
1247 			    (decoder->timestamp & (0xffULL << 56));
1248 		decoder->tsc_timestamp = timestamp;
1249 		if (timestamp < decoder->timestamp &&
1250 		    decoder->timestamp - timestamp < decoder->tsc_slip) {
1251 			intel_pt_log_to("Suppressing backwards timestamp",
1252 					timestamp);
1253 			timestamp = decoder->timestamp;
1254 		}
1255 		if (timestamp < decoder->timestamp) {
1256 			intel_pt_log_to("Wraparound timestamp", timestamp);
1257 			timestamp += (1ULL << 56);
1258 			decoder->tsc_timestamp = timestamp;
1259 		}
1260 		decoder->timestamp = timestamp;
1261 		decoder->timestamp_insn_cnt = 0;
1262 	}
1263 
1264 	if (decoder->last_packet_type == INTEL_PT_CYC) {
1265 		decoder->cyc_ref_timestamp = decoder->timestamp;
1266 		decoder->cycle_cnt = 0;
1267 		decoder->have_calc_cyc_to_tsc = false;
1268 		intel_pt_calc_cyc_to_tsc(decoder, false);
1269 	}
1270 
1271 	intel_pt_log_to("Setting timestamp", decoder->timestamp);
1272 }
1273 
1274 static int intel_pt_overflow(struct intel_pt_decoder *decoder)
1275 {
1276 	intel_pt_log("ERROR: Buffer overflow\n");
1277 	intel_pt_clear_tx_flags(decoder);
1278 	decoder->have_tma = false;
1279 	decoder->cbr = 0;
1280 	decoder->pkt_state = INTEL_PT_STATE_ERR_RESYNC;
1281 	decoder->overflow = true;
1282 	return -EOVERFLOW;
1283 }
1284 
1285 static void intel_pt_calc_tma(struct intel_pt_decoder *decoder)
1286 {
1287 	uint32_t ctc = decoder->packet.payload;
1288 	uint32_t fc = decoder->packet.count;
1289 	uint32_t ctc_rem = ctc & decoder->ctc_rem_mask;
1290 
1291 	if (!decoder->tsc_ctc_ratio_d)
1292 		return;
1293 
1294 	decoder->last_mtc = (ctc >> decoder->mtc_shift) & 0xff;
1295 	decoder->ctc_timestamp = decoder->tsc_timestamp - fc;
1296 	if (decoder->tsc_ctc_mult) {
1297 		decoder->ctc_timestamp -= ctc_rem * decoder->tsc_ctc_mult;
1298 	} else {
1299 		decoder->ctc_timestamp -= multdiv(ctc_rem,
1300 						  decoder->tsc_ctc_ratio_n,
1301 						  decoder->tsc_ctc_ratio_d);
1302 	}
1303 	decoder->ctc_delta = 0;
1304 	decoder->have_tma = true;
1305 	decoder->fixup_last_mtc = true;
1306 	intel_pt_log("CTC timestamp " x64_fmt " last MTC %#x  CTC rem %#x\n",
1307 		     decoder->ctc_timestamp, decoder->last_mtc, ctc_rem);
1308 }
1309 
1310 static void intel_pt_calc_mtc_timestamp(struct intel_pt_decoder *decoder)
1311 {
1312 	uint64_t timestamp;
1313 	uint32_t mtc, mtc_delta;
1314 
1315 	if (!decoder->have_tma)
1316 		return;
1317 
1318 	mtc = decoder->packet.payload;
1319 
1320 	if (decoder->mtc_shift > 8 && decoder->fixup_last_mtc) {
1321 		decoder->fixup_last_mtc = false;
1322 		intel_pt_fixup_last_mtc(mtc, decoder->mtc_shift,
1323 					&decoder->last_mtc);
1324 	}
1325 
1326 	if (mtc > decoder->last_mtc)
1327 		mtc_delta = mtc - decoder->last_mtc;
1328 	else
1329 		mtc_delta = mtc + 256 - decoder->last_mtc;
1330 
1331 	decoder->ctc_delta += mtc_delta << decoder->mtc_shift;
1332 
1333 	if (decoder->tsc_ctc_mult) {
1334 		timestamp = decoder->ctc_timestamp +
1335 			    decoder->ctc_delta * decoder->tsc_ctc_mult;
1336 	} else {
1337 		timestamp = decoder->ctc_timestamp +
1338 			    multdiv(decoder->ctc_delta,
1339 				    decoder->tsc_ctc_ratio_n,
1340 				    decoder->tsc_ctc_ratio_d);
1341 	}
1342 
1343 	if (timestamp < decoder->timestamp)
1344 		intel_pt_log("Suppressing MTC timestamp " x64_fmt " less than current timestamp " x64_fmt "\n",
1345 			     timestamp, decoder->timestamp);
1346 	else
1347 		decoder->timestamp = timestamp;
1348 
1349 	decoder->timestamp_insn_cnt = 0;
1350 	decoder->last_mtc = mtc;
1351 
1352 	if (decoder->last_packet_type == INTEL_PT_CYC) {
1353 		decoder->cyc_ref_timestamp = decoder->timestamp;
1354 		decoder->cycle_cnt = 0;
1355 		decoder->have_calc_cyc_to_tsc = false;
1356 		intel_pt_calc_cyc_to_tsc(decoder, true);
1357 	}
1358 }
1359 
1360 static void intel_pt_calc_cbr(struct intel_pt_decoder *decoder)
1361 {
1362 	unsigned int cbr = decoder->packet.payload;
1363 
1364 	if (decoder->cbr == cbr)
1365 		return;
1366 
1367 	decoder->cbr = cbr;
1368 	decoder->cbr_cyc_to_tsc = decoder->max_non_turbo_ratio_fp / cbr;
1369 }
1370 
1371 static void intel_pt_calc_cyc_timestamp(struct intel_pt_decoder *decoder)
1372 {
1373 	uint64_t timestamp = decoder->cyc_ref_timestamp;
1374 
1375 	decoder->have_cyc = true;
1376 
1377 	decoder->cycle_cnt += decoder->packet.payload;
1378 
1379 	if (!decoder->cyc_ref_timestamp)
1380 		return;
1381 
1382 	if (decoder->have_calc_cyc_to_tsc)
1383 		timestamp += decoder->cycle_cnt * decoder->calc_cyc_to_tsc;
1384 	else if (decoder->cbr)
1385 		timestamp += decoder->cycle_cnt * decoder->cbr_cyc_to_tsc;
1386 	else
1387 		return;
1388 
1389 	if (timestamp < decoder->timestamp)
1390 		intel_pt_log("Suppressing CYC timestamp " x64_fmt " less than current timestamp " x64_fmt "\n",
1391 			     timestamp, decoder->timestamp);
1392 	else
1393 		decoder->timestamp = timestamp;
1394 
1395 	decoder->timestamp_insn_cnt = 0;
1396 }
1397 
1398 /* Walk PSB+ packets when already in sync. */
1399 static int intel_pt_walk_psbend(struct intel_pt_decoder *decoder)
1400 {
1401 	int err;
1402 
1403 	while (1) {
1404 		err = intel_pt_get_next_packet(decoder);
1405 		if (err)
1406 			return err;
1407 
1408 		switch (decoder->packet.type) {
1409 		case INTEL_PT_PSBEND:
1410 			return 0;
1411 
1412 		case INTEL_PT_TIP_PGD:
1413 		case INTEL_PT_TIP_PGE:
1414 		case INTEL_PT_TIP:
1415 		case INTEL_PT_TNT:
1416 		case INTEL_PT_TRACESTOP:
1417 		case INTEL_PT_BAD:
1418 		case INTEL_PT_PSB:
1419 			decoder->have_tma = false;
1420 			intel_pt_log("ERROR: Unexpected packet\n");
1421 			return -EAGAIN;
1422 
1423 		case INTEL_PT_OVF:
1424 			return intel_pt_overflow(decoder);
1425 
1426 		case INTEL_PT_TSC:
1427 			intel_pt_calc_tsc_timestamp(decoder);
1428 			break;
1429 
1430 		case INTEL_PT_TMA:
1431 			intel_pt_calc_tma(decoder);
1432 			break;
1433 
1434 		case INTEL_PT_CBR:
1435 			intel_pt_calc_cbr(decoder);
1436 			break;
1437 
1438 		case INTEL_PT_MODE_EXEC:
1439 			decoder->exec_mode = decoder->packet.payload;
1440 			break;
1441 
1442 		case INTEL_PT_PIP:
1443 			decoder->cr3 = decoder->packet.payload & (BIT63 - 1);
1444 			break;
1445 
1446 		case INTEL_PT_FUP:
1447 			decoder->pge = true;
1448 			intel_pt_set_last_ip(decoder);
1449 			break;
1450 
1451 		case INTEL_PT_MODE_TSX:
1452 			intel_pt_update_in_tx(decoder);
1453 			break;
1454 
1455 		case INTEL_PT_MTC:
1456 			intel_pt_calc_mtc_timestamp(decoder);
1457 			if (decoder->period_type == INTEL_PT_PERIOD_MTC)
1458 				decoder->state.type |= INTEL_PT_INSTRUCTION;
1459 			break;
1460 
1461 		case INTEL_PT_CYC:
1462 		case INTEL_PT_VMCS:
1463 		case INTEL_PT_MNT:
1464 		case INTEL_PT_PAD:
1465 		default:
1466 			break;
1467 		}
1468 	}
1469 }
1470 
1471 static int intel_pt_walk_fup_tip(struct intel_pt_decoder *decoder)
1472 {
1473 	int err;
1474 
1475 	if (decoder->tx_flags & INTEL_PT_ABORT_TX) {
1476 		decoder->tx_flags = 0;
1477 		decoder->state.flags &= ~INTEL_PT_IN_TX;
1478 		decoder->state.flags |= INTEL_PT_ABORT_TX;
1479 	} else {
1480 		decoder->state.flags |= INTEL_PT_ASYNC;
1481 	}
1482 
1483 	while (1) {
1484 		err = intel_pt_get_next_packet(decoder);
1485 		if (err)
1486 			return err;
1487 
1488 		switch (decoder->packet.type) {
1489 		case INTEL_PT_TNT:
1490 		case INTEL_PT_FUP:
1491 		case INTEL_PT_TRACESTOP:
1492 		case INTEL_PT_PSB:
1493 		case INTEL_PT_TSC:
1494 		case INTEL_PT_TMA:
1495 		case INTEL_PT_CBR:
1496 		case INTEL_PT_MODE_TSX:
1497 		case INTEL_PT_BAD:
1498 		case INTEL_PT_PSBEND:
1499 			intel_pt_log("ERROR: Missing TIP after FUP\n");
1500 			decoder->pkt_state = INTEL_PT_STATE_ERR3;
1501 			return -ENOENT;
1502 
1503 		case INTEL_PT_OVF:
1504 			return intel_pt_overflow(decoder);
1505 
1506 		case INTEL_PT_TIP_PGD:
1507 			decoder->state.from_ip = decoder->ip;
1508 			decoder->state.to_ip = 0;
1509 			if (decoder->packet.count != 0) {
1510 				intel_pt_set_ip(decoder);
1511 				intel_pt_log("Omitting PGD ip " x64_fmt "\n",
1512 					     decoder->ip);
1513 			}
1514 			decoder->pge = false;
1515 			decoder->continuous_period = false;
1516 			return 0;
1517 
1518 		case INTEL_PT_TIP_PGE:
1519 			decoder->pge = true;
1520 			intel_pt_log("Omitting PGE ip " x64_fmt "\n",
1521 				     decoder->ip);
1522 			decoder->state.from_ip = 0;
1523 			if (decoder->packet.count == 0) {
1524 				decoder->state.to_ip = 0;
1525 			} else {
1526 				intel_pt_set_ip(decoder);
1527 				decoder->state.to_ip = decoder->ip;
1528 			}
1529 			return 0;
1530 
1531 		case INTEL_PT_TIP:
1532 			decoder->state.from_ip = decoder->ip;
1533 			if (decoder->packet.count == 0) {
1534 				decoder->state.to_ip = 0;
1535 			} else {
1536 				intel_pt_set_ip(decoder);
1537 				decoder->state.to_ip = decoder->ip;
1538 			}
1539 			return 0;
1540 
1541 		case INTEL_PT_PIP:
1542 			decoder->cr3 = decoder->packet.payload & (BIT63 - 1);
1543 			break;
1544 
1545 		case INTEL_PT_MTC:
1546 			intel_pt_calc_mtc_timestamp(decoder);
1547 			if (decoder->period_type == INTEL_PT_PERIOD_MTC)
1548 				decoder->state.type |= INTEL_PT_INSTRUCTION;
1549 			break;
1550 
1551 		case INTEL_PT_CYC:
1552 			intel_pt_calc_cyc_timestamp(decoder);
1553 			break;
1554 
1555 		case INTEL_PT_MODE_EXEC:
1556 			decoder->exec_mode = decoder->packet.payload;
1557 			break;
1558 
1559 		case INTEL_PT_VMCS:
1560 		case INTEL_PT_MNT:
1561 		case INTEL_PT_PAD:
1562 			break;
1563 
1564 		default:
1565 			return intel_pt_bug(decoder);
1566 		}
1567 	}
1568 }
1569 
1570 static int intel_pt_walk_trace(struct intel_pt_decoder *decoder)
1571 {
1572 	bool no_tip = false;
1573 	int err;
1574 
1575 	while (1) {
1576 		err = intel_pt_get_next_packet(decoder);
1577 		if (err)
1578 			return err;
1579 next:
1580 		switch (decoder->packet.type) {
1581 		case INTEL_PT_TNT:
1582 			if (!decoder->packet.count)
1583 				break;
1584 			decoder->tnt = decoder->packet;
1585 			decoder->pkt_state = INTEL_PT_STATE_TNT;
1586 			err = intel_pt_walk_tnt(decoder);
1587 			if (err == -EAGAIN)
1588 				break;
1589 			return err;
1590 
1591 		case INTEL_PT_TIP_PGD:
1592 			if (decoder->packet.count != 0)
1593 				intel_pt_set_last_ip(decoder);
1594 			decoder->pkt_state = INTEL_PT_STATE_TIP_PGD;
1595 			return intel_pt_walk_tip(decoder);
1596 
1597 		case INTEL_PT_TIP_PGE: {
1598 			decoder->pge = true;
1599 			if (decoder->packet.count == 0) {
1600 				intel_pt_log_at("Skipping zero TIP.PGE",
1601 						decoder->pos);
1602 				break;
1603 			}
1604 			intel_pt_set_ip(decoder);
1605 			decoder->state.from_ip = 0;
1606 			decoder->state.to_ip = decoder->ip;
1607 			return 0;
1608 		}
1609 
1610 		case INTEL_PT_OVF:
1611 			return intel_pt_overflow(decoder);
1612 
1613 		case INTEL_PT_TIP:
1614 			if (decoder->packet.count != 0)
1615 				intel_pt_set_last_ip(decoder);
1616 			decoder->pkt_state = INTEL_PT_STATE_TIP;
1617 			return intel_pt_walk_tip(decoder);
1618 
1619 		case INTEL_PT_FUP:
1620 			if (decoder->packet.count == 0) {
1621 				intel_pt_log_at("Skipping zero FUP",
1622 						decoder->pos);
1623 				no_tip = false;
1624 				break;
1625 			}
1626 			intel_pt_set_last_ip(decoder);
1627 			err = intel_pt_walk_fup(decoder);
1628 			if (err != -EAGAIN) {
1629 				if (err)
1630 					return err;
1631 				if (no_tip)
1632 					decoder->pkt_state =
1633 						INTEL_PT_STATE_FUP_NO_TIP;
1634 				else
1635 					decoder->pkt_state = INTEL_PT_STATE_FUP;
1636 				return 0;
1637 			}
1638 			if (no_tip) {
1639 				no_tip = false;
1640 				break;
1641 			}
1642 			return intel_pt_walk_fup_tip(decoder);
1643 
1644 		case INTEL_PT_TRACESTOP:
1645 			decoder->pge = false;
1646 			decoder->continuous_period = false;
1647 			intel_pt_clear_tx_flags(decoder);
1648 			decoder->have_tma = false;
1649 			break;
1650 
1651 		case INTEL_PT_PSB:
1652 			intel_pt_clear_stack(&decoder->stack);
1653 			err = intel_pt_walk_psbend(decoder);
1654 			if (err == -EAGAIN)
1655 				goto next;
1656 			if (err)
1657 				return err;
1658 			break;
1659 
1660 		case INTEL_PT_PIP:
1661 			decoder->cr3 = decoder->packet.payload & (BIT63 - 1);
1662 			break;
1663 
1664 		case INTEL_PT_MTC:
1665 			intel_pt_calc_mtc_timestamp(decoder);
1666 			if (decoder->period_type != INTEL_PT_PERIOD_MTC)
1667 				break;
1668 			/*
1669 			 * Ensure that there has been an instruction since the
1670 			 * last MTC.
1671 			 */
1672 			if (!decoder->mtc_insn)
1673 				break;
1674 			decoder->mtc_insn = false;
1675 			/* Ensure that there is a timestamp */
1676 			if (!decoder->timestamp)
1677 				break;
1678 			decoder->state.type = INTEL_PT_INSTRUCTION;
1679 			decoder->state.from_ip = decoder->ip;
1680 			decoder->state.to_ip = 0;
1681 			decoder->mtc_insn = false;
1682 			return 0;
1683 
1684 		case INTEL_PT_TSC:
1685 			intel_pt_calc_tsc_timestamp(decoder);
1686 			break;
1687 
1688 		case INTEL_PT_TMA:
1689 			intel_pt_calc_tma(decoder);
1690 			break;
1691 
1692 		case INTEL_PT_CYC:
1693 			intel_pt_calc_cyc_timestamp(decoder);
1694 			break;
1695 
1696 		case INTEL_PT_CBR:
1697 			intel_pt_calc_cbr(decoder);
1698 			break;
1699 
1700 		case INTEL_PT_MODE_EXEC:
1701 			decoder->exec_mode = decoder->packet.payload;
1702 			break;
1703 
1704 		case INTEL_PT_MODE_TSX:
1705 			/* MODE_TSX need not be followed by FUP */
1706 			if (!decoder->pge) {
1707 				intel_pt_update_in_tx(decoder);
1708 				break;
1709 			}
1710 			err = intel_pt_mode_tsx(decoder, &no_tip);
1711 			if (err)
1712 				return err;
1713 			goto next;
1714 
1715 		case INTEL_PT_BAD: /* Does not happen */
1716 			return intel_pt_bug(decoder);
1717 
1718 		case INTEL_PT_PSBEND:
1719 		case INTEL_PT_VMCS:
1720 		case INTEL_PT_MNT:
1721 		case INTEL_PT_PAD:
1722 			break;
1723 
1724 		default:
1725 			return intel_pt_bug(decoder);
1726 		}
1727 	}
1728 }
1729 
1730 static inline bool intel_pt_have_ip(struct intel_pt_decoder *decoder)
1731 {
1732 	return decoder->last_ip || decoder->packet.count == 0 ||
1733 	       decoder->packet.count == 3 || decoder->packet.count == 6;
1734 }
1735 
1736 /* Walk PSB+ packets to get in sync. */
1737 static int intel_pt_walk_psb(struct intel_pt_decoder *decoder)
1738 {
1739 	int err;
1740 
1741 	while (1) {
1742 		err = intel_pt_get_next_packet(decoder);
1743 		if (err)
1744 			return err;
1745 
1746 		switch (decoder->packet.type) {
1747 		case INTEL_PT_TIP_PGD:
1748 			decoder->continuous_period = false;
1749 		case INTEL_PT_TIP_PGE:
1750 		case INTEL_PT_TIP:
1751 			intel_pt_log("ERROR: Unexpected packet\n");
1752 			return -ENOENT;
1753 
1754 		case INTEL_PT_FUP:
1755 			decoder->pge = true;
1756 			if (intel_pt_have_ip(decoder)) {
1757 				uint64_t current_ip = decoder->ip;
1758 
1759 				intel_pt_set_ip(decoder);
1760 				if (current_ip)
1761 					intel_pt_log_to("Setting IP",
1762 							decoder->ip);
1763 			}
1764 			break;
1765 
1766 		case INTEL_PT_MTC:
1767 			intel_pt_calc_mtc_timestamp(decoder);
1768 			break;
1769 
1770 		case INTEL_PT_TSC:
1771 			intel_pt_calc_tsc_timestamp(decoder);
1772 			break;
1773 
1774 		case INTEL_PT_TMA:
1775 			intel_pt_calc_tma(decoder);
1776 			break;
1777 
1778 		case INTEL_PT_CYC:
1779 			intel_pt_calc_cyc_timestamp(decoder);
1780 			break;
1781 
1782 		case INTEL_PT_CBR:
1783 			intel_pt_calc_cbr(decoder);
1784 			break;
1785 
1786 		case INTEL_PT_PIP:
1787 			decoder->cr3 = decoder->packet.payload & (BIT63 - 1);
1788 			break;
1789 
1790 		case INTEL_PT_MODE_EXEC:
1791 			decoder->exec_mode = decoder->packet.payload;
1792 			break;
1793 
1794 		case INTEL_PT_MODE_TSX:
1795 			intel_pt_update_in_tx(decoder);
1796 			break;
1797 
1798 		case INTEL_PT_TRACESTOP:
1799 			decoder->pge = false;
1800 			decoder->continuous_period = false;
1801 			intel_pt_clear_tx_flags(decoder);
1802 		case INTEL_PT_TNT:
1803 			decoder->have_tma = false;
1804 			intel_pt_log("ERROR: Unexpected packet\n");
1805 			if (decoder->ip)
1806 				decoder->pkt_state = INTEL_PT_STATE_ERR4;
1807 			else
1808 				decoder->pkt_state = INTEL_PT_STATE_ERR3;
1809 			return -ENOENT;
1810 
1811 		case INTEL_PT_BAD: /* Does not happen */
1812 			return intel_pt_bug(decoder);
1813 
1814 		case INTEL_PT_OVF:
1815 			return intel_pt_overflow(decoder);
1816 
1817 		case INTEL_PT_PSBEND:
1818 			return 0;
1819 
1820 		case INTEL_PT_PSB:
1821 		case INTEL_PT_VMCS:
1822 		case INTEL_PT_MNT:
1823 		case INTEL_PT_PAD:
1824 		default:
1825 			break;
1826 		}
1827 	}
1828 }
1829 
1830 static int intel_pt_walk_to_ip(struct intel_pt_decoder *decoder)
1831 {
1832 	int err;
1833 
1834 	while (1) {
1835 		err = intel_pt_get_next_packet(decoder);
1836 		if (err)
1837 			return err;
1838 
1839 		switch (decoder->packet.type) {
1840 		case INTEL_PT_TIP_PGD:
1841 			decoder->continuous_period = false;
1842 		case INTEL_PT_TIP_PGE:
1843 		case INTEL_PT_TIP:
1844 			decoder->pge = decoder->packet.type != INTEL_PT_TIP_PGD;
1845 			if (intel_pt_have_ip(decoder))
1846 				intel_pt_set_ip(decoder);
1847 			if (decoder->ip)
1848 				return 0;
1849 			break;
1850 
1851 		case INTEL_PT_FUP:
1852 			if (decoder->overflow) {
1853 				if (intel_pt_have_ip(decoder))
1854 					intel_pt_set_ip(decoder);
1855 				if (decoder->ip)
1856 					return 0;
1857 			}
1858 			if (decoder->packet.count)
1859 				intel_pt_set_last_ip(decoder);
1860 			break;
1861 
1862 		case INTEL_PT_MTC:
1863 			intel_pt_calc_mtc_timestamp(decoder);
1864 			break;
1865 
1866 		case INTEL_PT_TSC:
1867 			intel_pt_calc_tsc_timestamp(decoder);
1868 			break;
1869 
1870 		case INTEL_PT_TMA:
1871 			intel_pt_calc_tma(decoder);
1872 			break;
1873 
1874 		case INTEL_PT_CYC:
1875 			intel_pt_calc_cyc_timestamp(decoder);
1876 			break;
1877 
1878 		case INTEL_PT_CBR:
1879 			intel_pt_calc_cbr(decoder);
1880 			break;
1881 
1882 		case INTEL_PT_PIP:
1883 			decoder->cr3 = decoder->packet.payload & (BIT63 - 1);
1884 			break;
1885 
1886 		case INTEL_PT_MODE_EXEC:
1887 			decoder->exec_mode = decoder->packet.payload;
1888 			break;
1889 
1890 		case INTEL_PT_MODE_TSX:
1891 			intel_pt_update_in_tx(decoder);
1892 			break;
1893 
1894 		case INTEL_PT_OVF:
1895 			return intel_pt_overflow(decoder);
1896 
1897 		case INTEL_PT_BAD: /* Does not happen */
1898 			return intel_pt_bug(decoder);
1899 
1900 		case INTEL_PT_TRACESTOP:
1901 			decoder->pge = false;
1902 			decoder->continuous_period = false;
1903 			intel_pt_clear_tx_flags(decoder);
1904 			decoder->have_tma = false;
1905 			break;
1906 
1907 		case INTEL_PT_PSB:
1908 			err = intel_pt_walk_psb(decoder);
1909 			if (err)
1910 				return err;
1911 			if (decoder->ip) {
1912 				/* Do not have a sample */
1913 				decoder->state.type = 0;
1914 				return 0;
1915 			}
1916 			break;
1917 
1918 		case INTEL_PT_TNT:
1919 		case INTEL_PT_PSBEND:
1920 		case INTEL_PT_VMCS:
1921 		case INTEL_PT_MNT:
1922 		case INTEL_PT_PAD:
1923 		default:
1924 			break;
1925 		}
1926 	}
1927 }
1928 
1929 static int intel_pt_sync_ip(struct intel_pt_decoder *decoder)
1930 {
1931 	int err;
1932 
1933 	intel_pt_log("Scanning for full IP\n");
1934 	err = intel_pt_walk_to_ip(decoder);
1935 	if (err)
1936 		return err;
1937 
1938 	decoder->pkt_state = INTEL_PT_STATE_IN_SYNC;
1939 	decoder->overflow = false;
1940 
1941 	decoder->state.from_ip = 0;
1942 	decoder->state.to_ip = decoder->ip;
1943 	intel_pt_log_to("Setting IP", decoder->ip);
1944 
1945 	return 0;
1946 }
1947 
1948 static int intel_pt_part_psb(struct intel_pt_decoder *decoder)
1949 {
1950 	const unsigned char *end = decoder->buf + decoder->len;
1951 	size_t i;
1952 
1953 	for (i = INTEL_PT_PSB_LEN - 1; i; i--) {
1954 		if (i > decoder->len)
1955 			continue;
1956 		if (!memcmp(end - i, INTEL_PT_PSB_STR, i))
1957 			return i;
1958 	}
1959 	return 0;
1960 }
1961 
1962 static int intel_pt_rest_psb(struct intel_pt_decoder *decoder, int part_psb)
1963 {
1964 	size_t rest_psb = INTEL_PT_PSB_LEN - part_psb;
1965 	const char *psb = INTEL_PT_PSB_STR;
1966 
1967 	if (rest_psb > decoder->len ||
1968 	    memcmp(decoder->buf, psb + part_psb, rest_psb))
1969 		return 0;
1970 
1971 	return rest_psb;
1972 }
1973 
1974 static int intel_pt_get_split_psb(struct intel_pt_decoder *decoder,
1975 				  int part_psb)
1976 {
1977 	int rest_psb, ret;
1978 
1979 	decoder->pos += decoder->len;
1980 	decoder->len = 0;
1981 
1982 	ret = intel_pt_get_next_data(decoder);
1983 	if (ret)
1984 		return ret;
1985 
1986 	rest_psb = intel_pt_rest_psb(decoder, part_psb);
1987 	if (!rest_psb)
1988 		return 0;
1989 
1990 	decoder->pos -= part_psb;
1991 	decoder->next_buf = decoder->buf + rest_psb;
1992 	decoder->next_len = decoder->len - rest_psb;
1993 	memcpy(decoder->temp_buf, INTEL_PT_PSB_STR, INTEL_PT_PSB_LEN);
1994 	decoder->buf = decoder->temp_buf;
1995 	decoder->len = INTEL_PT_PSB_LEN;
1996 
1997 	return 0;
1998 }
1999 
2000 static int intel_pt_scan_for_psb(struct intel_pt_decoder *decoder)
2001 {
2002 	unsigned char *next;
2003 	int ret;
2004 
2005 	intel_pt_log("Scanning for PSB\n");
2006 	while (1) {
2007 		if (!decoder->len) {
2008 			ret = intel_pt_get_next_data(decoder);
2009 			if (ret)
2010 				return ret;
2011 		}
2012 
2013 		next = memmem(decoder->buf, decoder->len, INTEL_PT_PSB_STR,
2014 			      INTEL_PT_PSB_LEN);
2015 		if (!next) {
2016 			int part_psb;
2017 
2018 			part_psb = intel_pt_part_psb(decoder);
2019 			if (part_psb) {
2020 				ret = intel_pt_get_split_psb(decoder, part_psb);
2021 				if (ret)
2022 					return ret;
2023 			} else {
2024 				decoder->pos += decoder->len;
2025 				decoder->len = 0;
2026 			}
2027 			continue;
2028 		}
2029 
2030 		decoder->pkt_step = next - decoder->buf;
2031 		return intel_pt_get_next_packet(decoder);
2032 	}
2033 }
2034 
2035 static int intel_pt_sync(struct intel_pt_decoder *decoder)
2036 {
2037 	int err;
2038 
2039 	decoder->pge = false;
2040 	decoder->continuous_period = false;
2041 	decoder->last_ip = 0;
2042 	decoder->ip = 0;
2043 	intel_pt_clear_stack(&decoder->stack);
2044 
2045 	err = intel_pt_scan_for_psb(decoder);
2046 	if (err)
2047 		return err;
2048 
2049 	decoder->pkt_state = INTEL_PT_STATE_NO_IP;
2050 
2051 	err = intel_pt_walk_psb(decoder);
2052 	if (err)
2053 		return err;
2054 
2055 	if (decoder->ip) {
2056 		decoder->state.type = 0; /* Do not have a sample */
2057 		decoder->pkt_state = INTEL_PT_STATE_IN_SYNC;
2058 	} else {
2059 		return intel_pt_sync_ip(decoder);
2060 	}
2061 
2062 	return 0;
2063 }
2064 
2065 static uint64_t intel_pt_est_timestamp(struct intel_pt_decoder *decoder)
2066 {
2067 	uint64_t est = decoder->timestamp_insn_cnt << 1;
2068 
2069 	if (!decoder->cbr || !decoder->max_non_turbo_ratio)
2070 		goto out;
2071 
2072 	est *= decoder->max_non_turbo_ratio;
2073 	est /= decoder->cbr;
2074 out:
2075 	return decoder->timestamp + est;
2076 }
2077 
2078 const struct intel_pt_state *intel_pt_decode(struct intel_pt_decoder *decoder)
2079 {
2080 	int err;
2081 
2082 	do {
2083 		decoder->state.type = INTEL_PT_BRANCH;
2084 		decoder->state.flags = 0;
2085 
2086 		switch (decoder->pkt_state) {
2087 		case INTEL_PT_STATE_NO_PSB:
2088 			err = intel_pt_sync(decoder);
2089 			break;
2090 		case INTEL_PT_STATE_NO_IP:
2091 			decoder->last_ip = 0;
2092 			/* Fall through */
2093 		case INTEL_PT_STATE_ERR_RESYNC:
2094 			err = intel_pt_sync_ip(decoder);
2095 			break;
2096 		case INTEL_PT_STATE_IN_SYNC:
2097 			err = intel_pt_walk_trace(decoder);
2098 			break;
2099 		case INTEL_PT_STATE_TNT:
2100 			err = intel_pt_walk_tnt(decoder);
2101 			if (err == -EAGAIN)
2102 				err = intel_pt_walk_trace(decoder);
2103 			break;
2104 		case INTEL_PT_STATE_TIP:
2105 		case INTEL_PT_STATE_TIP_PGD:
2106 			err = intel_pt_walk_tip(decoder);
2107 			break;
2108 		case INTEL_PT_STATE_FUP:
2109 			decoder->pkt_state = INTEL_PT_STATE_IN_SYNC;
2110 			err = intel_pt_walk_fup(decoder);
2111 			if (err == -EAGAIN)
2112 				err = intel_pt_walk_fup_tip(decoder);
2113 			else if (!err)
2114 				decoder->pkt_state = INTEL_PT_STATE_FUP;
2115 			break;
2116 		case INTEL_PT_STATE_FUP_NO_TIP:
2117 			decoder->pkt_state = INTEL_PT_STATE_IN_SYNC;
2118 			err = intel_pt_walk_fup(decoder);
2119 			if (err == -EAGAIN)
2120 				err = intel_pt_walk_trace(decoder);
2121 			break;
2122 		default:
2123 			err = intel_pt_bug(decoder);
2124 			break;
2125 		}
2126 	} while (err == -ENOLINK);
2127 
2128 	decoder->state.err = err ? intel_pt_ext_err(err) : 0;
2129 	decoder->state.timestamp = decoder->timestamp;
2130 	decoder->state.est_timestamp = intel_pt_est_timestamp(decoder);
2131 	decoder->state.cr3 = decoder->cr3;
2132 	decoder->state.tot_insn_cnt = decoder->tot_insn_cnt;
2133 
2134 	if (err)
2135 		decoder->state.from_ip = decoder->ip;
2136 
2137 	return &decoder->state;
2138 }
2139 
2140 static bool intel_pt_at_psb(unsigned char *buf, size_t len)
2141 {
2142 	if (len < INTEL_PT_PSB_LEN)
2143 		return false;
2144 	return memmem(buf, INTEL_PT_PSB_LEN, INTEL_PT_PSB_STR,
2145 		      INTEL_PT_PSB_LEN);
2146 }
2147 
2148 /**
2149  * intel_pt_next_psb - move buffer pointer to the start of the next PSB packet.
2150  * @buf: pointer to buffer pointer
2151  * @len: size of buffer
2152  *
2153  * Updates the buffer pointer to point to the start of the next PSB packet if
2154  * there is one, otherwise the buffer pointer is unchanged.  If @buf is updated,
2155  * @len is adjusted accordingly.
2156  *
2157  * Return: %true if a PSB packet is found, %false otherwise.
2158  */
2159 static bool intel_pt_next_psb(unsigned char **buf, size_t *len)
2160 {
2161 	unsigned char *next;
2162 
2163 	next = memmem(*buf, *len, INTEL_PT_PSB_STR, INTEL_PT_PSB_LEN);
2164 	if (next) {
2165 		*len -= next - *buf;
2166 		*buf = next;
2167 		return true;
2168 	}
2169 	return false;
2170 }
2171 
2172 /**
2173  * intel_pt_step_psb - move buffer pointer to the start of the following PSB
2174  *                     packet.
2175  * @buf: pointer to buffer pointer
2176  * @len: size of buffer
2177  *
2178  * Updates the buffer pointer to point to the start of the following PSB packet
2179  * (skipping the PSB at @buf itself) if there is one, otherwise the buffer
2180  * pointer is unchanged.  If @buf is updated, @len is adjusted accordingly.
2181  *
2182  * Return: %true if a PSB packet is found, %false otherwise.
2183  */
2184 static bool intel_pt_step_psb(unsigned char **buf, size_t *len)
2185 {
2186 	unsigned char *next;
2187 
2188 	if (!*len)
2189 		return false;
2190 
2191 	next = memmem(*buf + 1, *len - 1, INTEL_PT_PSB_STR, INTEL_PT_PSB_LEN);
2192 	if (next) {
2193 		*len -= next - *buf;
2194 		*buf = next;
2195 		return true;
2196 	}
2197 	return false;
2198 }
2199 
2200 /**
2201  * intel_pt_last_psb - find the last PSB packet in a buffer.
2202  * @buf: buffer
2203  * @len: size of buffer
2204  *
2205  * This function finds the last PSB in a buffer.
2206  *
2207  * Return: A pointer to the last PSB in @buf if found, %NULL otherwise.
2208  */
2209 static unsigned char *intel_pt_last_psb(unsigned char *buf, size_t len)
2210 {
2211 	const char *n = INTEL_PT_PSB_STR;
2212 	unsigned char *p;
2213 	size_t k;
2214 
2215 	if (len < INTEL_PT_PSB_LEN)
2216 		return NULL;
2217 
2218 	k = len - INTEL_PT_PSB_LEN + 1;
2219 	while (1) {
2220 		p = memrchr(buf, n[0], k);
2221 		if (!p)
2222 			return NULL;
2223 		if (!memcmp(p + 1, n + 1, INTEL_PT_PSB_LEN - 1))
2224 			return p;
2225 		k = p - buf;
2226 		if (!k)
2227 			return NULL;
2228 	}
2229 }
2230 
2231 /**
2232  * intel_pt_next_tsc - find and return next TSC.
2233  * @buf: buffer
2234  * @len: size of buffer
2235  * @tsc: TSC value returned
2236  *
2237  * Find a TSC packet in @buf and return the TSC value.  This function assumes
2238  * that @buf starts at a PSB and that PSB+ will contain TSC and so stops if a
2239  * PSBEND packet is found.
2240  *
2241  * Return: %true if TSC is found, false otherwise.
2242  */
2243 static bool intel_pt_next_tsc(unsigned char *buf, size_t len, uint64_t *tsc)
2244 {
2245 	struct intel_pt_pkt packet;
2246 	int ret;
2247 
2248 	while (len) {
2249 		ret = intel_pt_get_packet(buf, len, &packet);
2250 		if (ret <= 0)
2251 			return false;
2252 		if (packet.type == INTEL_PT_TSC) {
2253 			*tsc = packet.payload;
2254 			return true;
2255 		}
2256 		if (packet.type == INTEL_PT_PSBEND)
2257 			return false;
2258 		buf += ret;
2259 		len -= ret;
2260 	}
2261 	return false;
2262 }
2263 
2264 /**
2265  * intel_pt_tsc_cmp - compare 7-byte TSCs.
2266  * @tsc1: first TSC to compare
2267  * @tsc2: second TSC to compare
2268  *
2269  * This function compares 7-byte TSC values allowing for the possibility that
2270  * TSC wrapped around.  Generally it is not possible to know if TSC has wrapped
2271  * around so for that purpose this function assumes the absolute difference is
2272  * less than half the maximum difference.
2273  *
2274  * Return: %-1 if @tsc1 is before @tsc2, %0 if @tsc1 == @tsc2, %1 if @tsc1 is
2275  * after @tsc2.
2276  */
2277 static int intel_pt_tsc_cmp(uint64_t tsc1, uint64_t tsc2)
2278 {
2279 	const uint64_t halfway = (1ULL << 55);
2280 
2281 	if (tsc1 == tsc2)
2282 		return 0;
2283 
2284 	if (tsc1 < tsc2) {
2285 		if (tsc2 - tsc1 < halfway)
2286 			return -1;
2287 		else
2288 			return 1;
2289 	} else {
2290 		if (tsc1 - tsc2 < halfway)
2291 			return 1;
2292 		else
2293 			return -1;
2294 	}
2295 }
2296 
2297 /**
2298  * intel_pt_find_overlap_tsc - determine start of non-overlapped trace data
2299  *                             using TSC.
2300  * @buf_a: first buffer
2301  * @len_a: size of first buffer
2302  * @buf_b: second buffer
2303  * @len_b: size of second buffer
2304  *
2305  * If the trace contains TSC we can look at the last TSC of @buf_a and the
2306  * first TSC of @buf_b in order to determine if the buffers overlap, and then
2307  * walk forward in @buf_b until a later TSC is found.  A precondition is that
2308  * @buf_a and @buf_b are positioned at a PSB.
2309  *
2310  * Return: A pointer into @buf_b from where non-overlapped data starts, or
2311  * @buf_b + @len_b if there is no non-overlapped data.
2312  */
2313 static unsigned char *intel_pt_find_overlap_tsc(unsigned char *buf_a,
2314 						size_t len_a,
2315 						unsigned char *buf_b,
2316 						size_t len_b)
2317 {
2318 	uint64_t tsc_a, tsc_b;
2319 	unsigned char *p;
2320 	size_t len;
2321 
2322 	p = intel_pt_last_psb(buf_a, len_a);
2323 	if (!p)
2324 		return buf_b; /* No PSB in buf_a => no overlap */
2325 
2326 	len = len_a - (p - buf_a);
2327 	if (!intel_pt_next_tsc(p, len, &tsc_a)) {
2328 		/* The last PSB+ in buf_a is incomplete, so go back one more */
2329 		len_a -= len;
2330 		p = intel_pt_last_psb(buf_a, len_a);
2331 		if (!p)
2332 			return buf_b; /* No full PSB+ => assume no overlap */
2333 		len = len_a - (p - buf_a);
2334 		if (!intel_pt_next_tsc(p, len, &tsc_a))
2335 			return buf_b; /* No TSC in buf_a => assume no overlap */
2336 	}
2337 
2338 	while (1) {
2339 		/* Ignore PSB+ with no TSC */
2340 		if (intel_pt_next_tsc(buf_b, len_b, &tsc_b) &&
2341 		    intel_pt_tsc_cmp(tsc_a, tsc_b) < 0)
2342 			return buf_b; /* tsc_a < tsc_b => no overlap */
2343 
2344 		if (!intel_pt_step_psb(&buf_b, &len_b))
2345 			return buf_b + len_b; /* No PSB in buf_b => no data */
2346 	}
2347 }
2348 
2349 /**
2350  * intel_pt_find_overlap - determine start of non-overlapped trace data.
2351  * @buf_a: first buffer
2352  * @len_a: size of first buffer
2353  * @buf_b: second buffer
2354  * @len_b: size of second buffer
2355  * @have_tsc: can use TSC packets to detect overlap
2356  *
2357  * When trace samples or snapshots are recorded there is the possibility that
2358  * the data overlaps.  Note that, for the purposes of decoding, data is only
2359  * useful if it begins with a PSB packet.
2360  *
2361  * Return: A pointer into @buf_b from where non-overlapped data starts, or
2362  * @buf_b + @len_b if there is no non-overlapped data.
2363  */
2364 unsigned char *intel_pt_find_overlap(unsigned char *buf_a, size_t len_a,
2365 				     unsigned char *buf_b, size_t len_b,
2366 				     bool have_tsc)
2367 {
2368 	unsigned char *found;
2369 
2370 	/* Buffer 'b' must start at PSB so throw away everything before that */
2371 	if (!intel_pt_next_psb(&buf_b, &len_b))
2372 		return buf_b + len_b; /* No PSB */
2373 
2374 	if (!intel_pt_next_psb(&buf_a, &len_a))
2375 		return buf_b; /* No overlap */
2376 
2377 	if (have_tsc) {
2378 		found = intel_pt_find_overlap_tsc(buf_a, len_a, buf_b, len_b);
2379 		if (found)
2380 			return found;
2381 	}
2382 
2383 	/*
2384 	 * Buffer 'b' cannot end within buffer 'a' so, for comparison purposes,
2385 	 * we can ignore the first part of buffer 'a'.
2386 	 */
2387 	while (len_b < len_a) {
2388 		if (!intel_pt_step_psb(&buf_a, &len_a))
2389 			return buf_b; /* No overlap */
2390 	}
2391 
2392 	/* Now len_b >= len_a */
2393 	if (len_b > len_a) {
2394 		/* The leftover buffer 'b' must start at a PSB */
2395 		while (!intel_pt_at_psb(buf_b + len_a, len_b - len_a)) {
2396 			if (!intel_pt_step_psb(&buf_a, &len_a))
2397 				return buf_b; /* No overlap */
2398 		}
2399 	}
2400 
2401 	while (1) {
2402 		/* Potential overlap so check the bytes */
2403 		found = memmem(buf_a, len_a, buf_b, len_a);
2404 		if (found)
2405 			return buf_b + len_a;
2406 
2407 		/* Try again at next PSB in buffer 'a' */
2408 		if (!intel_pt_step_psb(&buf_a, &len_a))
2409 			return buf_b; /* No overlap */
2410 
2411 		/* The leftover buffer 'b' must start at a PSB */
2412 		while (!intel_pt_at_psb(buf_b + len_a, len_b - len_a)) {
2413 			if (!intel_pt_step_psb(&buf_a, &len_a))
2414 				return buf_b; /* No overlap */
2415 		}
2416 	}
2417 }
2418