// SPDX-License-Identifier: GPL-2.0
/*
 * arm_spe_decoder.c: ARM SPE support
 */
5a54ca194STan Xiaojun
6a54ca194STan Xiaojun #ifndef _GNU_SOURCE
7a54ca194STan Xiaojun #define _GNU_SOURCE
8a54ca194STan Xiaojun #endif
9a54ca194STan Xiaojun #include <errno.h>
10a54ca194STan Xiaojun #include <inttypes.h>
11a54ca194STan Xiaojun #include <stdbool.h>
12a54ca194STan Xiaojun #include <string.h>
13a54ca194STan Xiaojun #include <stdint.h>
14a54ca194STan Xiaojun #include <stdlib.h>
15c185f1cdSLeo Yan #include <linux/bitops.h>
16a54ca194STan Xiaojun #include <linux/compiler.h>
17a54ca194STan Xiaojun #include <linux/zalloc.h>
18a54ca194STan Xiaojun
19a54ca194STan Xiaojun #include "../auxtrace.h"
20a54ca194STan Xiaojun #include "../debug.h"
21a54ca194STan Xiaojun #include "../util.h"
22a54ca194STan Xiaojun
23a54ca194STan Xiaojun #include "arm-spe-decoder.h"
24a54ca194STan Xiaojun
/*
 * Turn the payload of an address packet into the address value that is
 * stored in the record.
 *
 * @index:   address packet header index (one of SPE_ADDR_PKT_HDR_INDEX_*)
 * @payload: raw 64-bit packet payload
 *
 * Returns the fixed-up address.  For an index that is not handled here the
 * payload is returned untouched and a warning is printed the first time
 * that index is seen.
 */
static u64 arm_spe_calc_ip(int index, u64 payload)
{
	/* One bit per unsupported index that has already been warned about. */
	static u32 warned_idx;
	const u64 top_byte = 0xffULL << SPE_ADDR_PKT_ADDR_BYTE7_SHIFT;
	u64 ns, el, byte6;

	/* Instruction virtual address or Branch target address */
	if (index == SPE_ADDR_PKT_HDR_INDEX_INS ||
	    index == SPE_ADDR_PKT_HDR_INDEX_BRANCH) {
		/* Read the NS and EL fields before the top byte is dropped. */
		ns = SPE_ADDR_PKT_GET_NS(payload);
		el = SPE_ADDR_PKT_GET_EL(payload);

		/* Clean highest byte */
		payload = SPE_ADDR_PKT_ADDR_GET_BYTES_0_6(payload);

		/* Fill highest byte for EL1 or EL2 (VHE) mode */
		if (ns && (el == SPE_ADDR_PKT_EL1 || el == SPE_ADDR_PKT_EL2))
			payload |= top_byte;

		return payload;
	}

	/* Data access virtual address */
	if (index == SPE_ADDR_PKT_HDR_INDEX_DATA_VIRT) {
		/* Clean tags */
		payload = SPE_ADDR_PKT_ADDR_GET_BYTES_0_6(payload);

		/*
		 * Armv8 ARM (ARM DDI 0487F.c), chapter "D10.2.1 Address
		 * packet" defines the data virtual address payload format:
		 * the top byte (bits [63:56]) is the top-byte tag, so the
		 * address value can only be taken from bits [55:0].
		 *
		 * According to Documentation/arch/arm64/memory.rst, a
		 * specific pattern in bits [55:52] marks a kernel space
		 * address.  When bits [55:52] are 0xf the top byte is filled
		 * with 0xff, which lets the perf tool resolve the DSO symbol
		 * for the data address correctly.
		 */
		byte6 = SPE_ADDR_PKT_ADDR_GET_BYTE_6(payload);
		if ((byte6 & 0xf0ULL) == 0xf0ULL)
			payload |= top_byte;

		return payload;
	}

	/* Data access physical address: only clean the highest byte */
	if (index == SPE_ADDR_PKT_HDR_INDEX_DATA_PHYS)
		return SPE_ADDR_PKT_ADDR_GET_BYTES_0_6(payload);

	/* Anything else is unsupported: warn once per index, keep payload. */
	if (!(warned_idx & BIT(index))) {
		warned_idx |= BIT(index);
		pr_warning("ignoring unsupported address packet index: 0x%x\n", index);
	}

	return payload;
}
80a54ca194STan Xiaojun
arm_spe_decoder_new(struct arm_spe_params * params)81a54ca194STan Xiaojun struct arm_spe_decoder *arm_spe_decoder_new(struct arm_spe_params *params)
82a54ca194STan Xiaojun {
83a54ca194STan Xiaojun struct arm_spe_decoder *decoder;
84a54ca194STan Xiaojun
85a54ca194STan Xiaojun if (!params->get_trace)
86a54ca194STan Xiaojun return NULL;
87a54ca194STan Xiaojun
88a54ca194STan Xiaojun decoder = zalloc(sizeof(struct arm_spe_decoder));
89a54ca194STan Xiaojun if (!decoder)
90a54ca194STan Xiaojun return NULL;
91a54ca194STan Xiaojun
92a54ca194STan Xiaojun decoder->get_trace = params->get_trace;
93a54ca194STan Xiaojun decoder->data = params->data;
94a54ca194STan Xiaojun
95a54ca194STan Xiaojun return decoder;
96a54ca194STan Xiaojun }
97a54ca194STan Xiaojun
/*
 * Release a decoder.  Only the decoder structure itself is freed; nothing
 * it points to is released here.
 */
void arm_spe_decoder_free(struct arm_spe_decoder *decoder)
{
	free(decoder);
}
102a54ca194STan Xiaojun
arm_spe_get_data(struct arm_spe_decoder * decoder)103a54ca194STan Xiaojun static int arm_spe_get_data(struct arm_spe_decoder *decoder)
104a54ca194STan Xiaojun {
105a54ca194STan Xiaojun struct arm_spe_buffer buffer = { .buf = 0, };
106a54ca194STan Xiaojun int ret;
107a54ca194STan Xiaojun
108a54ca194STan Xiaojun pr_debug("Getting more data\n");
109a54ca194STan Xiaojun ret = decoder->get_trace(&buffer, decoder->data);
110a54ca194STan Xiaojun if (ret < 0)
111a54ca194STan Xiaojun return ret;
112a54ca194STan Xiaojun
113a54ca194STan Xiaojun decoder->buf = buffer.buf;
114a54ca194STan Xiaojun decoder->len = buffer.len;
115a54ca194STan Xiaojun
116a54ca194STan Xiaojun if (!decoder->len)
117a54ca194STan Xiaojun pr_debug("No more data\n");
118a54ca194STan Xiaojun
119a54ca194STan Xiaojun return decoder->len;
120a54ca194STan Xiaojun }
121a54ca194STan Xiaojun
arm_spe_get_next_packet(struct arm_spe_decoder * decoder)122a54ca194STan Xiaojun static int arm_spe_get_next_packet(struct arm_spe_decoder *decoder)
123a54ca194STan Xiaojun {
124a54ca194STan Xiaojun int ret;
125a54ca194STan Xiaojun
126a54ca194STan Xiaojun do {
127a54ca194STan Xiaojun if (!decoder->len) {
128a54ca194STan Xiaojun ret = arm_spe_get_data(decoder);
129a54ca194STan Xiaojun
130a54ca194STan Xiaojun /* Failed to read out trace data */
131a54ca194STan Xiaojun if (ret <= 0)
132a54ca194STan Xiaojun return ret;
133a54ca194STan Xiaojun }
134a54ca194STan Xiaojun
135a54ca194STan Xiaojun ret = arm_spe_get_packet(decoder->buf, decoder->len,
136a54ca194STan Xiaojun &decoder->packet);
137a54ca194STan Xiaojun if (ret <= 0) {
138a54ca194STan Xiaojun /* Move forward for 1 byte */
139a54ca194STan Xiaojun decoder->buf += 1;
140a54ca194STan Xiaojun decoder->len -= 1;
141a54ca194STan Xiaojun return -EBADMSG;
142a54ca194STan Xiaojun }
143a54ca194STan Xiaojun
144a54ca194STan Xiaojun decoder->buf += ret;
145a54ca194STan Xiaojun decoder->len -= ret;
146a54ca194STan Xiaojun } while (decoder->packet.type == ARM_SPE_PAD);
147a54ca194STan Xiaojun
148a54ca194STan Xiaojun return 1;
149a54ca194STan Xiaojun }
150a54ca194STan Xiaojun
arm_spe_read_record(struct arm_spe_decoder * decoder)151a54ca194STan Xiaojun static int arm_spe_read_record(struct arm_spe_decoder *decoder)
152a54ca194STan Xiaojun {
153a54ca194STan Xiaojun int err;
154a54ca194STan Xiaojun int idx;
155a54ca194STan Xiaojun u64 payload, ip;
156a54ca194STan Xiaojun
157a54ca194STan Xiaojun memset(&decoder->record, 0x0, sizeof(decoder->record));
158169de64fSGerman Gomez decoder->record.context_id = (u64)-1;
159a54ca194STan Xiaojun
160a54ca194STan Xiaojun while (1) {
161a54ca194STan Xiaojun err = arm_spe_get_next_packet(decoder);
162a54ca194STan Xiaojun if (err <= 0)
163a54ca194STan Xiaojun return err;
164a54ca194STan Xiaojun
165a54ca194STan Xiaojun idx = decoder->packet.index;
166a54ca194STan Xiaojun payload = decoder->packet.payload;
167a54ca194STan Xiaojun
168a54ca194STan Xiaojun switch (decoder->packet.type) {
169a54ca194STan Xiaojun case ARM_SPE_TIMESTAMP:
170a54ca194STan Xiaojun decoder->record.timestamp = payload;
171a54ca194STan Xiaojun return 1;
172a54ca194STan Xiaojun case ARM_SPE_END:
173a54ca194STan Xiaojun return 1;
174a54ca194STan Xiaojun case ARM_SPE_ADDRESS:
175a54ca194STan Xiaojun ip = arm_spe_calc_ip(idx, payload);
176a54ca194STan Xiaojun if (idx == SPE_ADDR_PKT_HDR_INDEX_INS)
177a54ca194STan Xiaojun decoder->record.from_ip = ip;
178a54ca194STan Xiaojun else if (idx == SPE_ADDR_PKT_HDR_INDEX_BRANCH)
179a54ca194STan Xiaojun decoder->record.to_ip = ip;
180265cfb95SLeo Yan else if (idx == SPE_ADDR_PKT_HDR_INDEX_DATA_VIRT)
181265cfb95SLeo Yan decoder->record.virt_addr = ip;
182265cfb95SLeo Yan else if (idx == SPE_ADDR_PKT_HDR_INDEX_DATA_PHYS)
183265cfb95SLeo Yan decoder->record.phys_addr = ip;
184a54ca194STan Xiaojun break;
185a54ca194STan Xiaojun case ARM_SPE_COUNTER:
186b0fde9c6SNamhyung Kim if (idx == SPE_CNT_PKT_HDR_INDEX_TOTAL_LAT)
187b0fde9c6SNamhyung Kim decoder->record.latency = payload;
188a54ca194STan Xiaojun break;
189a54ca194STan Xiaojun case ARM_SPE_CONTEXT:
190169de64fSGerman Gomez decoder->record.context_id = payload;
191a54ca194STan Xiaojun break;
192a54ca194STan Xiaojun case ARM_SPE_OP_TYPE:
193*0066015aSGerman Gomez switch (idx) {
194*0066015aSGerman Gomez case SPE_OP_PKT_HDR_CLASS_LD_ST_ATOMIC:
195*0066015aSGerman Gomez decoder->record.op |= ARM_SPE_OP_LDST;
196*0066015aSGerman Gomez if (payload & SPE_OP_PKT_ST)
197*0066015aSGerman Gomez decoder->record.op |= ARM_SPE_OP_ST;
19897ae666aSLeo Yan else
199*0066015aSGerman Gomez decoder->record.op |= ARM_SPE_OP_LD;
200*0066015aSGerman Gomez if (SPE_OP_PKT_IS_LDST_SVE(payload))
201*0066015aSGerman Gomez decoder->record.op |= ARM_SPE_OP_SVE_LDST;
202*0066015aSGerman Gomez break;
203*0066015aSGerman Gomez case SPE_OP_PKT_HDR_CLASS_OTHER:
204*0066015aSGerman Gomez decoder->record.op |= ARM_SPE_OP_OTHER;
205*0066015aSGerman Gomez if (SPE_OP_PKT_IS_OTHER_SVE_OP(payload))
206*0066015aSGerman Gomez decoder->record.op |= ARM_SPE_OP_SVE_OTHER;
207*0066015aSGerman Gomez break;
208*0066015aSGerman Gomez case SPE_OP_PKT_HDR_CLASS_BR_ERET:
209*0066015aSGerman Gomez decoder->record.op |= ARM_SPE_OP_BRANCH_ERET;
210*0066015aSGerman Gomez break;
211*0066015aSGerman Gomez default:
212*0066015aSGerman Gomez pr_err("Get packet error!\n");
213*0066015aSGerman Gomez return -1;
21497ae666aSLeo Yan }
215a54ca194STan Xiaojun break;
216a54ca194STan Xiaojun case ARM_SPE_EVENTS:
217a54ca194STan Xiaojun if (payload & BIT(EV_L1D_REFILL))
218a54ca194STan Xiaojun decoder->record.type |= ARM_SPE_L1D_MISS;
219a54ca194STan Xiaojun
220a54ca194STan Xiaojun if (payload & BIT(EV_L1D_ACCESS))
221a54ca194STan Xiaojun decoder->record.type |= ARM_SPE_L1D_ACCESS;
222a54ca194STan Xiaojun
223a54ca194STan Xiaojun if (payload & BIT(EV_TLB_WALK))
224a54ca194STan Xiaojun decoder->record.type |= ARM_SPE_TLB_MISS;
225a54ca194STan Xiaojun
226a54ca194STan Xiaojun if (payload & BIT(EV_TLB_ACCESS))
227a54ca194STan Xiaojun decoder->record.type |= ARM_SPE_TLB_ACCESS;
228a54ca194STan Xiaojun
2294d0f4ca2SLeo Yan if (payload & BIT(EV_LLC_MISS))
230a54ca194STan Xiaojun decoder->record.type |= ARM_SPE_LLC_MISS;
231a54ca194STan Xiaojun
2324d0f4ca2SLeo Yan if (payload & BIT(EV_LLC_ACCESS))
233a54ca194STan Xiaojun decoder->record.type |= ARM_SPE_LLC_ACCESS;
234a54ca194STan Xiaojun
2354d0f4ca2SLeo Yan if (payload & BIT(EV_REMOTE_ACCESS))
236a54ca194STan Xiaojun decoder->record.type |= ARM_SPE_REMOTE_ACCESS;
237a54ca194STan Xiaojun
238a54ca194STan Xiaojun if (payload & BIT(EV_MISPRED))
239a54ca194STan Xiaojun decoder->record.type |= ARM_SPE_BRANCH_MISS;
240a54ca194STan Xiaojun
241*0066015aSGerman Gomez if (payload & BIT(EV_PARTIAL_PREDICATE))
242*0066015aSGerman Gomez decoder->record.type |= ARM_SPE_SVE_PARTIAL_PRED;
243*0066015aSGerman Gomez
244*0066015aSGerman Gomez if (payload & BIT(EV_EMPTY_PREDICATE))
245*0066015aSGerman Gomez decoder->record.type |= ARM_SPE_SVE_EMPTY_PRED;
246*0066015aSGerman Gomez
247a54ca194STan Xiaojun break;
248a54ca194STan Xiaojun case ARM_SPE_DATA_SOURCE:
2494e6430cbSAli Saidi decoder->record.source = payload;
250a54ca194STan Xiaojun break;
251a54ca194STan Xiaojun case ARM_SPE_BAD:
252a54ca194STan Xiaojun break;
253a54ca194STan Xiaojun case ARM_SPE_PAD:
254a54ca194STan Xiaojun break;
255a54ca194STan Xiaojun default:
256a54ca194STan Xiaojun pr_err("Get packet error!\n");
257a54ca194STan Xiaojun return -1;
258a54ca194STan Xiaojun }
259a54ca194STan Xiaojun }
260a54ca194STan Xiaojun
261a54ca194STan Xiaojun return 0;
262a54ca194STan Xiaojun }
263a54ca194STan Xiaojun
/*
 * Public entry point: decode the next record into decoder->record.
 *
 * Returns whatever arm_spe_read_record() returns.
 */
int arm_spe_decode(struct arm_spe_decoder *decoder)
{
	int ret = arm_spe_read_record(decoder);

	return ret;
}
268