1 // SPDX-License-Identifier: GPL-2.0-only 2 /* 3 * Copyright (C) 2020-2023 Intel Corporation 4 */ 5 6 #include <linux/circ_buf.h> 7 #include <linux/highmem.h> 8 9 #include "ivpu_drv.h" 10 #include "ivpu_hw_37xx_reg.h" 11 #include "ivpu_hw_reg_io.h" 12 #include "ivpu_mmu.h" 13 #include "ivpu_mmu_context.h" 14 #include "ivpu_pm.h" 15 16 #define IVPU_MMU_IDR0_REF 0x080f3e0f 17 #define IVPU_MMU_IDR0_REF_SIMICS 0x080f3e1f 18 #define IVPU_MMU_IDR1_REF 0x0e739d18 19 #define IVPU_MMU_IDR3_REF 0x0000003c 20 #define IVPU_MMU_IDR5_REF 0x00040070 21 #define IVPU_MMU_IDR5_REF_SIMICS 0x00000075 22 #define IVPU_MMU_IDR5_REF_FPGA 0x00800075 23 24 #define IVPU_MMU_CDTAB_ENT_SIZE 64 25 #define IVPU_MMU_CDTAB_ENT_COUNT_LOG2 8 /* 256 entries */ 26 #define IVPU_MMU_CDTAB_ENT_COUNT ((u32)1 << IVPU_MMU_CDTAB_ENT_COUNT_LOG2) 27 28 #define IVPU_MMU_STREAM_ID0 0 29 #define IVPU_MMU_STREAM_ID3 3 30 31 #define IVPU_MMU_STRTAB_ENT_SIZE 64 32 #define IVPU_MMU_STRTAB_ENT_COUNT 4 33 #define IVPU_MMU_STRTAB_CFG_LOG2SIZE 2 34 #define IVPU_MMU_STRTAB_CFG IVPU_MMU_STRTAB_CFG_LOG2SIZE 35 36 #define IVPU_MMU_Q_COUNT_LOG2 4 /* 16 entries */ 37 #define IVPU_MMU_Q_COUNT ((u32)1 << IVPU_MMU_Q_COUNT_LOG2) 38 #define IVPU_MMU_Q_WRAP_BIT (IVPU_MMU_Q_COUNT << 1) 39 #define IVPU_MMU_Q_WRAP_MASK (IVPU_MMU_Q_WRAP_BIT - 1) 40 #define IVPU_MMU_Q_IDX_MASK (IVPU_MMU_Q_COUNT - 1) 41 #define IVPU_MMU_Q_IDX(val) ((val) & IVPU_MMU_Q_IDX_MASK) 42 43 #define IVPU_MMU_CMDQ_CMD_SIZE 16 44 #define IVPU_MMU_CMDQ_SIZE (IVPU_MMU_Q_COUNT * IVPU_MMU_CMDQ_CMD_SIZE) 45 46 #define IVPU_MMU_EVTQ_CMD_SIZE 32 47 #define IVPU_MMU_EVTQ_SIZE (IVPU_MMU_Q_COUNT * IVPU_MMU_EVTQ_CMD_SIZE) 48 49 #define IVPU_MMU_CMD_OPCODE GENMASK(7, 0) 50 51 #define IVPU_MMU_CMD_SYNC_0_CS GENMASK(13, 12) 52 #define IVPU_MMU_CMD_SYNC_0_MSH GENMASK(23, 22) 53 #define IVPU_MMU_CMD_SYNC_0_MSI_ATTR GENMASK(27, 24) 54 #define IVPU_MMU_CMD_SYNC_0_MSI_ATTR GENMASK(27, 24) 55 #define IVPU_MMU_CMD_SYNC_0_MSI_DATA GENMASK(63, 32) 56 57 #define IVPU_MMU_CMD_CFGI_0_SSEC BIT(10) 58 #define IVPU_MMU_CMD_CFGI_0_SSV BIT(11) 59 #define IVPU_MMU_CMD_CFGI_0_SSID GENMASK(31, 12) 60 #define IVPU_MMU_CMD_CFGI_0_SID GENMASK(63, 32) 61 #define IVPU_MMU_CMD_CFGI_1_RANGE GENMASK(4, 0) 62 63 #define IVPU_MMU_CMD_TLBI_0_ASID GENMASK(63, 48) 64 #define IVPU_MMU_CMD_TLBI_0_VMID GENMASK(47, 32) 65 66 #define CMD_PREFETCH_CFG 0x1 67 #define CMD_CFGI_STE 0x3 68 #define CMD_CFGI_ALL 0x4 69 #define CMD_CFGI_CD 0x5 70 #define CMD_CFGI_CD_ALL 0x6 71 #define CMD_TLBI_NH_ASID 0x11 72 #define CMD_TLBI_EL2_ALL 0x20 73 #define CMD_TLBI_NSNH_ALL 0x30 74 #define CMD_SYNC 0x46 75 76 #define IVPU_MMU_EVT_F_UUT 0x01 77 #define IVPU_MMU_EVT_C_BAD_STREAMID 0x02 78 #define IVPU_MMU_EVT_F_STE_FETCH 0x03 79 #define IVPU_MMU_EVT_C_BAD_STE 0x04 80 #define IVPU_MMU_EVT_F_BAD_ATS_TREQ 0x05 81 #define IVPU_MMU_EVT_F_STREAM_DISABLED 0x06 82 #define IVPU_MMU_EVT_F_TRANSL_FORBIDDEN 0x07 83 #define IVPU_MMU_EVT_C_BAD_SUBSTREAMID 0x08 84 #define IVPU_MMU_EVT_F_CD_FETCH 0x09 85 #define IVPU_MMU_EVT_C_BAD_CD 0x0a 86 #define IVPU_MMU_EVT_F_WALK_EABT 0x0b 87 #define IVPU_MMU_EVT_F_TRANSLATION 0x10 88 #define IVPU_MMU_EVT_F_ADDR_SIZE 0x11 89 #define IVPU_MMU_EVT_F_ACCESS 0x12 90 #define IVPU_MMU_EVT_F_PERMISSION 0x13 91 #define IVPU_MMU_EVT_F_TLB_CONFLICT 0x20 92 #define IVPU_MMU_EVT_F_CFG_CONFLICT 0x21 93 #define IVPU_MMU_EVT_E_PAGE_REQUEST 0x24 94 #define IVPU_MMU_EVT_F_VMS_FETCH 0x25 95 96 #define IVPU_MMU_EVT_OP_MASK GENMASK_ULL(7, 0) 97 #define IVPU_MMU_EVT_SSID_MASK GENMASK_ULL(31, 12) 98 99 #define IVPU_MMU_Q_BASE_RWA BIT(62) 100 #define IVPU_MMU_Q_BASE_ADDR_MASK GENMASK_ULL(51, 5) 101 #define IVPU_MMU_STRTAB_BASE_RA BIT(62) 102 #define IVPU_MMU_STRTAB_BASE_ADDR_MASK GENMASK_ULL(51, 6) 103 104 #define IVPU_MMU_IRQ_EVTQ_EN BIT(2) 105 #define IVPU_MMU_IRQ_GERROR_EN BIT(0) 106 107 #define IVPU_MMU_CR0_ATSCHK BIT(4) 108 #define IVPU_MMU_CR0_CMDQEN BIT(3) 109 #define IVPU_MMU_CR0_EVTQEN BIT(2) 110 #define IVPU_MMU_CR0_PRIQEN BIT(1) 111 #define IVPU_MMU_CR0_SMMUEN BIT(0) 112 113 #define IVPU_MMU_CR1_TABLE_SH GENMASK(11, 10) 114 #define IVPU_MMU_CR1_TABLE_OC GENMASK(9, 8) 115 #define IVPU_MMU_CR1_TABLE_IC GENMASK(7, 6) 116 #define IVPU_MMU_CR1_QUEUE_SH GENMASK(5, 4) 117 #define IVPU_MMU_CR1_QUEUE_OC GENMASK(3, 2) 118 #define IVPU_MMU_CR1_QUEUE_IC GENMASK(1, 0) 119 #define IVPU_MMU_CACHE_NC 0 120 #define IVPU_MMU_CACHE_WB 1 121 #define IVPU_MMU_CACHE_WT 2 122 #define IVPU_MMU_SH_NSH 0 123 #define IVPU_MMU_SH_OSH 2 124 #define IVPU_MMU_SH_ISH 3 125 126 #define IVPU_MMU_CMDQ_OP GENMASK_ULL(7, 0) 127 128 #define IVPU_MMU_CD_0_TCR_T0SZ GENMASK_ULL(5, 0) 129 #define IVPU_MMU_CD_0_TCR_TG0 GENMASK_ULL(7, 6) 130 #define IVPU_MMU_CD_0_TCR_IRGN0 GENMASK_ULL(9, 8) 131 #define IVPU_MMU_CD_0_TCR_ORGN0 GENMASK_ULL(11, 10) 132 #define IVPU_MMU_CD_0_TCR_SH0 GENMASK_ULL(13, 12) 133 #define IVPU_MMU_CD_0_TCR_EPD0 BIT_ULL(14) 134 #define IVPU_MMU_CD_0_TCR_EPD1 BIT_ULL(30) 135 #define IVPU_MMU_CD_0_ENDI BIT(15) 136 #define IVPU_MMU_CD_0_V BIT(31) 137 #define IVPU_MMU_CD_0_TCR_IPS GENMASK_ULL(34, 32) 138 #define IVPU_MMU_CD_0_TCR_TBI0 BIT_ULL(38) 139 #define IVPU_MMU_CD_0_AA64 BIT(41) 140 #define IVPU_MMU_CD_0_S BIT(44) 141 #define IVPU_MMU_CD_0_R BIT(45) 142 #define IVPU_MMU_CD_0_A BIT(46) 143 #define IVPU_MMU_CD_0_ASET BIT(47) 144 #define IVPU_MMU_CD_0_ASID GENMASK_ULL(63, 48) 145 146 #define IVPU_MMU_T0SZ_48BIT 16 147 #define IVPU_MMU_T0SZ_38BIT 26 148 149 #define IVPU_MMU_IPS_48BIT 5 150 #define IVPU_MMU_IPS_44BIT 4 151 #define IVPU_MMU_IPS_42BIT 3 152 #define IVPU_MMU_IPS_40BIT 2 153 #define IVPU_MMU_IPS_36BIT 1 154 #define IVPU_MMU_IPS_32BIT 0 155 156 #define IVPU_MMU_CD_1_TTB0_MASK GENMASK_ULL(51, 4) 157 158 #define IVPU_MMU_STE_0_S1CDMAX GENMASK_ULL(63, 59) 159 #define IVPU_MMU_STE_0_S1FMT GENMASK_ULL(5, 4) 160 #define IVPU_MMU_STE_0_S1FMT_LINEAR 0 161 #define IVPU_MMU_STE_DWORDS 8 162 #define IVPU_MMU_STE_0_CFG_S1_TRANS 5 163 #define IVPU_MMU_STE_0_CFG GENMASK_ULL(3, 1) 164 #define IVPU_MMU_STE_0_S1CTXPTR_MASK GENMASK_ULL(51, 6) 165 #define IVPU_MMU_STE_0_V BIT(0) 166 167 #define IVPU_MMU_STE_1_STRW_NSEL1 0ul 168 #define IVPU_MMU_STE_1_CONT GENMASK_ULL(16, 13) 169 #define IVPU_MMU_STE_1_STRW GENMASK_ULL(31, 30) 170 #define IVPU_MMU_STE_1_PRIVCFG GENMASK_ULL(49, 48) 171 #define IVPU_MMU_STE_1_PRIVCFG_UNPRIV 2ul 172 #define IVPU_MMU_STE_1_INSTCFG GENMASK_ULL(51, 50) 173 #define IVPU_MMU_STE_1_INSTCFG_DATA 2ul 174 #define IVPU_MMU_STE_1_MEV BIT(19) 175 #define IVPU_MMU_STE_1_S1STALLD BIT(27) 176 #define IVPU_MMU_STE_1_S1C_CACHE_NC 0ul 177 #define IVPU_MMU_STE_1_S1C_CACHE_WBRA 1ul 178 #define IVPU_MMU_STE_1_S1C_CACHE_WT 2ul 179 #define IVPU_MMU_STE_1_S1C_CACHE_WB 3ul 180 #define IVPU_MMU_STE_1_S1CIR GENMASK_ULL(3, 2) 181 #define IVPU_MMU_STE_1_S1COR GENMASK_ULL(5, 4) 182 #define IVPU_MMU_STE_1_S1CSH GENMASK_ULL(7, 6) 183 #define IVPU_MMU_STE_1_S1DSS GENMASK_ULL(1, 0) 184 #define IVPU_MMU_STE_1_S1DSS_TERMINATE 0x0 185 186 #define IVPU_MMU_REG_TIMEOUT_US (10 * USEC_PER_MSEC) 187 #define IVPU_MMU_QUEUE_TIMEOUT_US (100 * USEC_PER_MSEC) 188 189 #define IVPU_MMU_GERROR_ERR_MASK ((REG_FLD(VPU_37XX_HOST_MMU_GERROR, CMDQ)) | \ 190 (REG_FLD(VPU_37XX_HOST_MMU_GERROR, EVTQ_ABT)) | \ 191 (REG_FLD(VPU_37XX_HOST_MMU_GERROR, PRIQ_ABT)) | \ 192 (REG_FLD(VPU_37XX_HOST_MMU_GERROR, MSI_CMDQ_ABT)) | \ 193 (REG_FLD(VPU_37XX_HOST_MMU_GERROR, MSI_EVTQ_ABT)) | \ 194 (REG_FLD(VPU_37XX_HOST_MMU_GERROR, MSI_PRIQ_ABT)) | \ 195 (REG_FLD(VPU_37XX_HOST_MMU_GERROR, MSI_ABT))) 196 197 static char *ivpu_mmu_event_to_str(u32 cmd) 198 { 199 switch (cmd) { 200 case IVPU_MMU_EVT_F_UUT: 201 return "Unsupported Upstream Transaction"; 202 case IVPU_MMU_EVT_C_BAD_STREAMID: 203 return "Transaction StreamID out of range"; 204 case IVPU_MMU_EVT_F_STE_FETCH: 205 return "Fetch of STE caused external abort"; 206 case IVPU_MMU_EVT_C_BAD_STE: 207 return "Used STE invalid"; 208 case IVPU_MMU_EVT_F_BAD_ATS_TREQ: 209 return "Address Request disallowed for a StreamID"; 210 case IVPU_MMU_EVT_F_STREAM_DISABLED: 211 return "Transaction marks non-substream disabled"; 212 case IVPU_MMU_EVT_F_TRANSL_FORBIDDEN: 213 return "MMU bypass is disallowed for this StreamID"; 214 case IVPU_MMU_EVT_C_BAD_SUBSTREAMID: 215 return "Invalid StreamID"; 216 case IVPU_MMU_EVT_F_CD_FETCH: 217 return "Fetch of CD caused external abort"; 218 case IVPU_MMU_EVT_C_BAD_CD: 219 return "Fetched CD invalid"; 220 case IVPU_MMU_EVT_F_WALK_EABT: 221 return " An external abort occurred fetching a TLB"; 222 case IVPU_MMU_EVT_F_TRANSLATION: 223 return "Translation fault"; 224 case IVPU_MMU_EVT_F_ADDR_SIZE: 225 return " Output address caused address size fault"; 226 case IVPU_MMU_EVT_F_ACCESS: 227 return "Access flag fault"; 228 case IVPU_MMU_EVT_F_PERMISSION: 229 return "Permission fault occurred on page access"; 230 case IVPU_MMU_EVT_F_TLB_CONFLICT: 231 return "A TLB conflict"; 232 case IVPU_MMU_EVT_F_CFG_CONFLICT: 233 return "A configuration cache conflict"; 234 case IVPU_MMU_EVT_E_PAGE_REQUEST: 235 return "Page request hint from a client device"; 236 case IVPU_MMU_EVT_F_VMS_FETCH: 237 return "Fetch of VMS caused external abort"; 238 default: 239 return "Unknown CMDQ command"; 240 } 241 } 242 243 static void ivpu_mmu_config_check(struct ivpu_device *vdev) 244 { 245 u32 val_ref; 246 u32 val; 247 248 if (ivpu_is_simics(vdev)) 249 val_ref = IVPU_MMU_IDR0_REF_SIMICS; 250 else 251 val_ref = IVPU_MMU_IDR0_REF; 252 253 val = REGV_RD32(VPU_37XX_HOST_MMU_IDR0); 254 if (val != val_ref) 255 ivpu_dbg(vdev, MMU, "IDR0 0x%x != IDR0_REF 0x%x\n", val, val_ref); 256 257 val = REGV_RD32(VPU_37XX_HOST_MMU_IDR1); 258 if (val != IVPU_MMU_IDR1_REF) 259 ivpu_dbg(vdev, MMU, "IDR1 0x%x != IDR1_REF 0x%x\n", val, IVPU_MMU_IDR1_REF); 260 261 val = REGV_RD32(VPU_37XX_HOST_MMU_IDR3); 262 if (val != IVPU_MMU_IDR3_REF) 263 ivpu_dbg(vdev, MMU, "IDR3 0x%x != IDR3_REF 0x%x\n", val, IVPU_MMU_IDR3_REF); 264 265 if (ivpu_is_simics(vdev)) 266 val_ref = IVPU_MMU_IDR5_REF_SIMICS; 267 else if (ivpu_is_fpga(vdev)) 268 val_ref = IVPU_MMU_IDR5_REF_FPGA; 269 else 270 val_ref = IVPU_MMU_IDR5_REF; 271 272 val = REGV_RD32(VPU_37XX_HOST_MMU_IDR5); 273 if (val != val_ref) 274 ivpu_dbg(vdev, MMU, "IDR5 0x%x != IDR5_REF 0x%x\n", val, val_ref); 275 } 276 277 static int ivpu_mmu_cdtab_alloc(struct ivpu_device *vdev) 278 { 279 struct ivpu_mmu_info *mmu = vdev->mmu; 280 struct ivpu_mmu_cdtab *cdtab = &mmu->cdtab; 281 size_t size = IVPU_MMU_CDTAB_ENT_COUNT * IVPU_MMU_CDTAB_ENT_SIZE; 282 283 cdtab->base = dmam_alloc_coherent(vdev->drm.dev, size, &cdtab->dma, GFP_KERNEL); 284 if (!cdtab->base) 285 return -ENOMEM; 286 287 ivpu_dbg(vdev, MMU, "CDTAB alloc: dma=%pad size=%zu\n", &cdtab->dma, size); 288 289 return 0; 290 } 291 292 static int ivpu_mmu_strtab_alloc(struct ivpu_device *vdev) 293 { 294 struct ivpu_mmu_info *mmu = vdev->mmu; 295 struct ivpu_mmu_strtab *strtab = &mmu->strtab; 296 size_t size = IVPU_MMU_STRTAB_ENT_COUNT * IVPU_MMU_STRTAB_ENT_SIZE; 297 298 strtab->base = dmam_alloc_coherent(vdev->drm.dev, size, &strtab->dma, GFP_KERNEL); 299 if (!strtab->base) 300 return -ENOMEM; 301 302 strtab->base_cfg = IVPU_MMU_STRTAB_CFG; 303 strtab->dma_q = IVPU_MMU_STRTAB_BASE_RA; 304 strtab->dma_q |= strtab->dma & IVPU_MMU_STRTAB_BASE_ADDR_MASK; 305 306 ivpu_dbg(vdev, MMU, "STRTAB alloc: dma=%pad dma_q=%pad size=%zu\n", 307 &strtab->dma, &strtab->dma_q, size); 308 309 return 0; 310 } 311 312 static int ivpu_mmu_cmdq_alloc(struct ivpu_device *vdev) 313 { 314 struct ivpu_mmu_info *mmu = vdev->mmu; 315 struct ivpu_mmu_queue *q = &mmu->cmdq; 316 317 q->base = dmam_alloc_coherent(vdev->drm.dev, IVPU_MMU_CMDQ_SIZE, &q->dma, GFP_KERNEL); 318 if (!q->base) 319 return -ENOMEM; 320 321 q->dma_q = IVPU_MMU_Q_BASE_RWA; 322 q->dma_q |= q->dma & IVPU_MMU_Q_BASE_ADDR_MASK; 323 q->dma_q |= IVPU_MMU_Q_COUNT_LOG2; 324 325 ivpu_dbg(vdev, MMU, "CMDQ alloc: dma=%pad dma_q=%pad size=%u\n", 326 &q->dma, &q->dma_q, IVPU_MMU_CMDQ_SIZE); 327 328 return 0; 329 } 330 331 static int ivpu_mmu_evtq_alloc(struct ivpu_device *vdev) 332 { 333 struct ivpu_mmu_info *mmu = vdev->mmu; 334 struct ivpu_mmu_queue *q = &mmu->evtq; 335 336 q->base = dmam_alloc_coherent(vdev->drm.dev, IVPU_MMU_EVTQ_SIZE, &q->dma, GFP_KERNEL); 337 if (!q->base) 338 return -ENOMEM; 339 340 q->dma_q = IVPU_MMU_Q_BASE_RWA; 341 q->dma_q |= q->dma & IVPU_MMU_Q_BASE_ADDR_MASK; 342 q->dma_q |= IVPU_MMU_Q_COUNT_LOG2; 343 344 ivpu_dbg(vdev, MMU, "EVTQ alloc: dma=%pad dma_q=%pad size=%u\n", 345 &q->dma, &q->dma_q, IVPU_MMU_EVTQ_SIZE); 346 347 return 0; 348 } 349 350 static int ivpu_mmu_structs_alloc(struct ivpu_device *vdev) 351 { 352 int ret; 353 354 ret = ivpu_mmu_cdtab_alloc(vdev); 355 if (ret) { 356 ivpu_err(vdev, "Failed to allocate cdtab: %d\n", ret); 357 return ret; 358 } 359 360 ret = ivpu_mmu_strtab_alloc(vdev); 361 if (ret) { 362 ivpu_err(vdev, "Failed to allocate strtab: %d\n", ret); 363 return ret; 364 } 365 366 ret = ivpu_mmu_cmdq_alloc(vdev); 367 if (ret) { 368 ivpu_err(vdev, "Failed to allocate cmdq: %d\n", ret); 369 return ret; 370 } 371 372 ret = ivpu_mmu_evtq_alloc(vdev); 373 if (ret) 374 ivpu_err(vdev, "Failed to allocate evtq: %d\n", ret); 375 376 return ret; 377 } 378 379 static int ivpu_mmu_reg_write(struct ivpu_device *vdev, u32 reg, u32 val) 380 { 381 u32 reg_ack = reg + 4; /* ACK register is 4B after base register */ 382 u32 val_ack; 383 int ret; 384 385 REGV_WR32(reg, val); 386 387 ret = REGV_POLL(reg_ack, val_ack, (val == val_ack), IVPU_MMU_REG_TIMEOUT_US); 388 if (ret) 389 ivpu_err(vdev, "Failed to write register 0x%x\n", reg); 390 391 return ret; 392 } 393 394 static int ivpu_mmu_irqs_setup(struct ivpu_device *vdev) 395 { 396 u32 irq_ctrl = IVPU_MMU_IRQ_EVTQ_EN | IVPU_MMU_IRQ_GERROR_EN; 397 int ret; 398 399 ret = ivpu_mmu_reg_write(vdev, VPU_37XX_HOST_MMU_IRQ_CTRL, 0); 400 if (ret) 401 return ret; 402 403 return ivpu_mmu_reg_write(vdev, VPU_37XX_HOST_MMU_IRQ_CTRL, irq_ctrl); 404 } 405 406 static int ivpu_mmu_cmdq_wait_for_cons(struct ivpu_device *vdev) 407 { 408 struct ivpu_mmu_queue *cmdq = &vdev->mmu->cmdq; 409 410 return REGV_POLL(VPU_37XX_HOST_MMU_CMDQ_CONS, cmdq->cons, (cmdq->prod == cmdq->cons), 411 IVPU_MMU_QUEUE_TIMEOUT_US); 412 } 413 414 static int ivpu_mmu_cmdq_cmd_write(struct ivpu_device *vdev, const char *name, u64 data0, u64 data1) 415 { 416 struct ivpu_mmu_queue *q = &vdev->mmu->cmdq; 417 u64 *queue_buffer = q->base; 418 int idx = IVPU_MMU_Q_IDX(q->prod) * (IVPU_MMU_CMDQ_CMD_SIZE / sizeof(*queue_buffer)); 419 420 if (!CIRC_SPACE(IVPU_MMU_Q_IDX(q->prod), IVPU_MMU_Q_IDX(q->cons), IVPU_MMU_Q_COUNT)) { 421 ivpu_err(vdev, "Failed to write MMU CMD %s\n", name); 422 return -EBUSY; 423 } 424 425 queue_buffer[idx] = data0; 426 queue_buffer[idx + 1] = data1; 427 q->prod = (q->prod + 1) & IVPU_MMU_Q_WRAP_MASK; 428 429 ivpu_dbg(vdev, MMU, "CMD write: %s data: 0x%llx 0x%llx\n", name, data0, data1); 430 431 return 0; 432 } 433 434 static int ivpu_mmu_cmdq_sync(struct ivpu_device *vdev) 435 { 436 struct ivpu_mmu_queue *q = &vdev->mmu->cmdq; 437 u64 val; 438 int ret; 439 440 val = FIELD_PREP(IVPU_MMU_CMD_OPCODE, CMD_SYNC) | 441 FIELD_PREP(IVPU_MMU_CMD_SYNC_0_CS, 0x2) | 442 FIELD_PREP(IVPU_MMU_CMD_SYNC_0_MSH, 0x3) | 443 FIELD_PREP(IVPU_MMU_CMD_SYNC_0_MSI_ATTR, 0xf); 444 445 ret = ivpu_mmu_cmdq_cmd_write(vdev, "SYNC", val, 0); 446 if (ret) 447 return ret; 448 449 clflush_cache_range(q->base, IVPU_MMU_CMDQ_SIZE); 450 REGV_WR32(VPU_37XX_HOST_MMU_CMDQ_PROD, q->prod); 451 452 ret = ivpu_mmu_cmdq_wait_for_cons(vdev); 453 if (ret) 454 ivpu_err(vdev, "Timed out waiting for consumer: %d\n", ret); 455 456 return ret; 457 } 458 459 static int ivpu_mmu_cmdq_write_cfgi_all(struct ivpu_device *vdev) 460 { 461 u64 data0 = FIELD_PREP(IVPU_MMU_CMD_OPCODE, CMD_CFGI_ALL); 462 u64 data1 = FIELD_PREP(IVPU_MMU_CMD_CFGI_1_RANGE, 0x1f); 463 464 return ivpu_mmu_cmdq_cmd_write(vdev, "CFGI_ALL", data0, data1); 465 } 466 467 static int ivpu_mmu_cmdq_write_tlbi_nh_asid(struct ivpu_device *vdev, u16 ssid) 468 { 469 u64 val = FIELD_PREP(IVPU_MMU_CMD_OPCODE, CMD_TLBI_NH_ASID) | 470 FIELD_PREP(IVPU_MMU_CMD_TLBI_0_ASID, ssid); 471 472 return ivpu_mmu_cmdq_cmd_write(vdev, "TLBI_NH_ASID", val, 0); 473 } 474 475 static int ivpu_mmu_cmdq_write_tlbi_nsnh_all(struct ivpu_device *vdev) 476 { 477 u64 val = FIELD_PREP(IVPU_MMU_CMD_OPCODE, CMD_TLBI_NSNH_ALL); 478 479 return ivpu_mmu_cmdq_cmd_write(vdev, "TLBI_NSNH_ALL", val, 0); 480 } 481 482 static int ivpu_mmu_reset(struct ivpu_device *vdev) 483 { 484 struct ivpu_mmu_info *mmu = vdev->mmu; 485 u32 val; 486 int ret; 487 488 memset(mmu->cmdq.base, 0, IVPU_MMU_CMDQ_SIZE); 489 clflush_cache_range(mmu->cmdq.base, IVPU_MMU_CMDQ_SIZE); 490 mmu->cmdq.prod = 0; 491 mmu->cmdq.cons = 0; 492 493 memset(mmu->evtq.base, 0, IVPU_MMU_EVTQ_SIZE); 494 mmu->evtq.prod = 0; 495 mmu->evtq.cons = 0; 496 497 ret = ivpu_mmu_reg_write(vdev, VPU_37XX_HOST_MMU_CR0, 0); 498 if (ret) 499 return ret; 500 501 val = FIELD_PREP(IVPU_MMU_CR1_TABLE_SH, IVPU_MMU_SH_ISH) | 502 FIELD_PREP(IVPU_MMU_CR1_TABLE_OC, IVPU_MMU_CACHE_WB) | 503 FIELD_PREP(IVPU_MMU_CR1_TABLE_IC, IVPU_MMU_CACHE_WB) | 504 FIELD_PREP(IVPU_MMU_CR1_QUEUE_SH, IVPU_MMU_SH_ISH) | 505 FIELD_PREP(IVPU_MMU_CR1_QUEUE_OC, IVPU_MMU_CACHE_WB) | 506 FIELD_PREP(IVPU_MMU_CR1_QUEUE_IC, IVPU_MMU_CACHE_WB); 507 REGV_WR32(VPU_37XX_HOST_MMU_CR1, val); 508 509 REGV_WR64(VPU_37XX_HOST_MMU_STRTAB_BASE, mmu->strtab.dma_q); 510 REGV_WR32(VPU_37XX_HOST_MMU_STRTAB_BASE_CFG, mmu->strtab.base_cfg); 511 512 REGV_WR64(VPU_37XX_HOST_MMU_CMDQ_BASE, mmu->cmdq.dma_q); 513 REGV_WR32(VPU_37XX_HOST_MMU_CMDQ_PROD, 0); 514 REGV_WR32(VPU_37XX_HOST_MMU_CMDQ_CONS, 0); 515 516 val = IVPU_MMU_CR0_CMDQEN; 517 ret = ivpu_mmu_reg_write(vdev, VPU_37XX_HOST_MMU_CR0, val); 518 if (ret) 519 return ret; 520 521 ret = ivpu_mmu_cmdq_write_cfgi_all(vdev); 522 if (ret) 523 return ret; 524 525 ret = ivpu_mmu_cmdq_write_tlbi_nsnh_all(vdev); 526 if (ret) 527 return ret; 528 529 ret = ivpu_mmu_cmdq_sync(vdev); 530 if (ret) 531 return ret; 532 533 REGV_WR64(VPU_37XX_HOST_MMU_EVTQ_BASE, mmu->evtq.dma_q); 534 REGV_WR32(VPU_37XX_HOST_MMU_EVTQ_PROD_SEC, 0); 535 REGV_WR32(VPU_37XX_HOST_MMU_EVTQ_CONS_SEC, 0); 536 537 val |= IVPU_MMU_CR0_EVTQEN; 538 ret = ivpu_mmu_reg_write(vdev, VPU_37XX_HOST_MMU_CR0, val); 539 if (ret) 540 return ret; 541 542 val |= IVPU_MMU_CR0_ATSCHK; 543 ret = ivpu_mmu_reg_write(vdev, VPU_37XX_HOST_MMU_CR0, val); 544 if (ret) 545 return ret; 546 547 ret = ivpu_mmu_irqs_setup(vdev); 548 if (ret) 549 return ret; 550 551 val |= IVPU_MMU_CR0_SMMUEN; 552 return ivpu_mmu_reg_write(vdev, VPU_37XX_HOST_MMU_CR0, val); 553 } 554 555 static void ivpu_mmu_strtab_link_cd(struct ivpu_device *vdev, u32 sid) 556 { 557 struct ivpu_mmu_info *mmu = vdev->mmu; 558 struct ivpu_mmu_strtab *strtab = &mmu->strtab; 559 struct ivpu_mmu_cdtab *cdtab = &mmu->cdtab; 560 u64 *entry = strtab->base + (sid * IVPU_MMU_STRTAB_ENT_SIZE); 561 u64 str[2]; 562 563 str[0] = FIELD_PREP(IVPU_MMU_STE_0_CFG, IVPU_MMU_STE_0_CFG_S1_TRANS) | 564 FIELD_PREP(IVPU_MMU_STE_0_S1CDMAX, IVPU_MMU_CDTAB_ENT_COUNT_LOG2) | 565 FIELD_PREP(IVPU_MMU_STE_0_S1FMT, IVPU_MMU_STE_0_S1FMT_LINEAR) | 566 IVPU_MMU_STE_0_V | 567 (cdtab->dma & IVPU_MMU_STE_0_S1CTXPTR_MASK); 568 569 str[1] = FIELD_PREP(IVPU_MMU_STE_1_S1DSS, IVPU_MMU_STE_1_S1DSS_TERMINATE) | 570 FIELD_PREP(IVPU_MMU_STE_1_S1CIR, IVPU_MMU_STE_1_S1C_CACHE_NC) | 571 FIELD_PREP(IVPU_MMU_STE_1_S1COR, IVPU_MMU_STE_1_S1C_CACHE_NC) | 572 FIELD_PREP(IVPU_MMU_STE_1_S1CSH, IVPU_MMU_SH_NSH) | 573 FIELD_PREP(IVPU_MMU_STE_1_PRIVCFG, IVPU_MMU_STE_1_PRIVCFG_UNPRIV) | 574 FIELD_PREP(IVPU_MMU_STE_1_INSTCFG, IVPU_MMU_STE_1_INSTCFG_DATA) | 575 FIELD_PREP(IVPU_MMU_STE_1_STRW, IVPU_MMU_STE_1_STRW_NSEL1) | 576 FIELD_PREP(IVPU_MMU_STE_1_CONT, IVPU_MMU_STRTAB_CFG_LOG2SIZE) | 577 IVPU_MMU_STE_1_MEV | 578 IVPU_MMU_STE_1_S1STALLD; 579 580 WRITE_ONCE(entry[1], str[1]); 581 WRITE_ONCE(entry[0], str[0]); 582 583 clflush_cache_range(entry, IVPU_MMU_STRTAB_ENT_SIZE); 584 585 ivpu_dbg(vdev, MMU, "STRTAB write entry (SSID=%u): 0x%llx, 0x%llx\n", sid, str[0], str[1]); 586 } 587 588 static int ivpu_mmu_strtab_init(struct ivpu_device *vdev) 589 { 590 ivpu_mmu_strtab_link_cd(vdev, IVPU_MMU_STREAM_ID0); 591 ivpu_mmu_strtab_link_cd(vdev, IVPU_MMU_STREAM_ID3); 592 593 return 0; 594 } 595 596 int ivpu_mmu_invalidate_tlb(struct ivpu_device *vdev, u16 ssid) 597 { 598 struct ivpu_mmu_info *mmu = vdev->mmu; 599 int ret = 0; 600 601 mutex_lock(&mmu->lock); 602 if (!mmu->on) 603 goto unlock; 604 605 ret = ivpu_mmu_cmdq_write_tlbi_nh_asid(vdev, ssid); 606 if (ret) 607 goto unlock; 608 609 ret = ivpu_mmu_cmdq_sync(vdev); 610 unlock: 611 mutex_unlock(&mmu->lock); 612 return ret; 613 } 614 615 static int ivpu_mmu_cd_add(struct ivpu_device *vdev, u32 ssid, u64 cd_dma) 616 { 617 struct ivpu_mmu_info *mmu = vdev->mmu; 618 struct ivpu_mmu_cdtab *cdtab = &mmu->cdtab; 619 u64 *entry; 620 u64 cd[4]; 621 int ret = 0; 622 623 if (ssid > IVPU_MMU_CDTAB_ENT_COUNT) 624 return -EINVAL; 625 626 entry = cdtab->base + (ssid * IVPU_MMU_CDTAB_ENT_SIZE); 627 628 if (cd_dma != 0) { 629 cd[0] = FIELD_PREP(IVPU_MMU_CD_0_TCR_T0SZ, IVPU_MMU_T0SZ_48BIT) | 630 FIELD_PREP(IVPU_MMU_CD_0_TCR_TG0, 0) | 631 FIELD_PREP(IVPU_MMU_CD_0_TCR_IRGN0, 0) | 632 FIELD_PREP(IVPU_MMU_CD_0_TCR_ORGN0, 0) | 633 FIELD_PREP(IVPU_MMU_CD_0_TCR_SH0, 0) | 634 FIELD_PREP(IVPU_MMU_CD_0_TCR_IPS, IVPU_MMU_IPS_48BIT) | 635 FIELD_PREP(IVPU_MMU_CD_0_ASID, ssid) | 636 IVPU_MMU_CD_0_TCR_EPD1 | 637 IVPU_MMU_CD_0_AA64 | 638 IVPU_MMU_CD_0_R | 639 IVPU_MMU_CD_0_ASET | 640 IVPU_MMU_CD_0_V; 641 cd[1] = cd_dma & IVPU_MMU_CD_1_TTB0_MASK; 642 cd[2] = 0; 643 cd[3] = 0x0000000000007444; 644 645 /* For global context generate memory fault on VPU */ 646 if (ssid == IVPU_GLOBAL_CONTEXT_MMU_SSID) 647 cd[0] |= IVPU_MMU_CD_0_A; 648 } else { 649 memset(cd, 0, sizeof(cd)); 650 } 651 652 WRITE_ONCE(entry[1], cd[1]); 653 WRITE_ONCE(entry[2], cd[2]); 654 WRITE_ONCE(entry[3], cd[3]); 655 WRITE_ONCE(entry[0], cd[0]); 656 657 clflush_cache_range(entry, IVPU_MMU_CDTAB_ENT_SIZE); 658 659 ivpu_dbg(vdev, MMU, "CDTAB %s entry (SSID=%u, dma=%pad): 0x%llx, 0x%llx, 0x%llx, 0x%llx\n", 660 cd_dma ? "write" : "clear", ssid, &cd_dma, cd[0], cd[1], cd[2], cd[3]); 661 662 mutex_lock(&mmu->lock); 663 if (!mmu->on) 664 goto unlock; 665 666 ret = ivpu_mmu_cmdq_write_cfgi_all(vdev); 667 if (ret) 668 goto unlock; 669 670 ret = ivpu_mmu_cmdq_sync(vdev); 671 unlock: 672 mutex_unlock(&mmu->lock); 673 return ret; 674 } 675 676 static int ivpu_mmu_cd_add_gbl(struct ivpu_device *vdev) 677 { 678 int ret; 679 680 ret = ivpu_mmu_cd_add(vdev, 0, vdev->gctx.pgtable.pgd_dma); 681 if (ret) 682 ivpu_err(vdev, "Failed to add global CD entry: %d\n", ret); 683 684 return ret; 685 } 686 687 static int ivpu_mmu_cd_add_user(struct ivpu_device *vdev, u32 ssid, dma_addr_t cd_dma) 688 { 689 int ret; 690 691 if (ssid == 0) { 692 ivpu_err(vdev, "Invalid SSID: %u\n", ssid); 693 return -EINVAL; 694 } 695 696 ret = ivpu_mmu_cd_add(vdev, ssid, cd_dma); 697 if (ret) 698 ivpu_err(vdev, "Failed to add CD entry SSID=%u: %d\n", ssid, ret); 699 700 return ret; 701 } 702 703 int ivpu_mmu_init(struct ivpu_device *vdev) 704 { 705 struct ivpu_mmu_info *mmu = vdev->mmu; 706 int ret; 707 708 ivpu_dbg(vdev, MMU, "Init..\n"); 709 710 drmm_mutex_init(&vdev->drm, &mmu->lock); 711 ivpu_mmu_config_check(vdev); 712 713 ret = ivpu_mmu_structs_alloc(vdev); 714 if (ret) 715 return ret; 716 717 ret = ivpu_mmu_strtab_init(vdev); 718 if (ret) { 719 ivpu_err(vdev, "Failed to initialize strtab: %d\n", ret); 720 return ret; 721 } 722 723 ret = ivpu_mmu_cd_add_gbl(vdev); 724 if (ret) { 725 ivpu_err(vdev, "Failed to initialize strtab: %d\n", ret); 726 return ret; 727 } 728 729 ret = ivpu_mmu_enable(vdev); 730 if (ret) { 731 ivpu_err(vdev, "Failed to resume MMU: %d\n", ret); 732 return ret; 733 } 734 735 ivpu_dbg(vdev, MMU, "Init done\n"); 736 737 return 0; 738 } 739 740 int ivpu_mmu_enable(struct ivpu_device *vdev) 741 { 742 struct ivpu_mmu_info *mmu = vdev->mmu; 743 int ret; 744 745 mutex_lock(&mmu->lock); 746 747 mmu->on = true; 748 749 ret = ivpu_mmu_reset(vdev); 750 if (ret) { 751 ivpu_err(vdev, "Failed to reset MMU: %d\n", ret); 752 goto err; 753 } 754 755 ret = ivpu_mmu_cmdq_write_cfgi_all(vdev); 756 if (ret) 757 goto err; 758 759 ret = ivpu_mmu_cmdq_write_tlbi_nsnh_all(vdev); 760 if (ret) 761 goto err; 762 763 ret = ivpu_mmu_cmdq_sync(vdev); 764 if (ret) 765 goto err; 766 767 mutex_unlock(&mmu->lock); 768 769 return 0; 770 err: 771 mmu->on = false; 772 mutex_unlock(&mmu->lock); 773 return ret; 774 } 775 776 void ivpu_mmu_disable(struct ivpu_device *vdev) 777 { 778 struct ivpu_mmu_info *mmu = vdev->mmu; 779 780 mutex_lock(&mmu->lock); 781 mmu->on = false; 782 mutex_unlock(&mmu->lock); 783 } 784 785 static void ivpu_mmu_dump_event(struct ivpu_device *vdev, u32 *event) 786 { 787 u32 ssid = FIELD_GET(IVPU_MMU_EVT_SSID_MASK, event[0]); 788 u32 op = FIELD_GET(IVPU_MMU_EVT_OP_MASK, event[0]); 789 u64 fetch_addr = ((u64)event[7]) << 32 | event[6]; 790 u64 in_addr = ((u64)event[5]) << 32 | event[4]; 791 u32 sid = event[1]; 792 793 ivpu_err(vdev, "MMU EVTQ: 0x%x (%s) SSID: %d SID: %d, e[2] %08x, e[3] %08x, in addr: 0x%llx, fetch addr: 0x%llx\n", 794 op, ivpu_mmu_event_to_str(op), ssid, sid, event[2], event[3], in_addr, fetch_addr); 795 } 796 797 static u32 *ivpu_mmu_get_event(struct ivpu_device *vdev) 798 { 799 struct ivpu_mmu_queue *evtq = &vdev->mmu->evtq; 800 u32 idx = IVPU_MMU_Q_IDX(evtq->cons); 801 u32 *evt = evtq->base + (idx * IVPU_MMU_EVTQ_CMD_SIZE); 802 803 evtq->prod = REGV_RD32(VPU_37XX_HOST_MMU_EVTQ_PROD_SEC); 804 if (!CIRC_CNT(IVPU_MMU_Q_IDX(evtq->prod), IVPU_MMU_Q_IDX(evtq->cons), IVPU_MMU_Q_COUNT)) 805 return NULL; 806 807 evtq->cons = (evtq->cons + 1) & IVPU_MMU_Q_WRAP_MASK; 808 REGV_WR32(VPU_37XX_HOST_MMU_EVTQ_CONS_SEC, evtq->cons); 809 810 return evt; 811 } 812 813 void ivpu_mmu_irq_evtq_handler(struct ivpu_device *vdev) 814 { 815 bool schedule_recovery = false; 816 u32 *event; 817 u32 ssid; 818 819 ivpu_dbg(vdev, IRQ, "MMU event queue\n"); 820 821 while ((event = ivpu_mmu_get_event(vdev)) != NULL) { 822 ivpu_mmu_dump_event(vdev, event); 823 824 ssid = FIELD_GET(IVPU_MMU_EVT_SSID_MASK, event[0]); 825 if (ssid == IVPU_GLOBAL_CONTEXT_MMU_SSID) 826 schedule_recovery = true; 827 else 828 ivpu_mmu_user_context_mark_invalid(vdev, ssid); 829 } 830 831 if (schedule_recovery) 832 ivpu_pm_schedule_recovery(vdev); 833 } 834 835 void ivpu_mmu_irq_gerr_handler(struct ivpu_device *vdev) 836 { 837 u32 gerror_val, gerrorn_val, active; 838 839 ivpu_dbg(vdev, IRQ, "MMU error\n"); 840 841 gerror_val = REGV_RD32(VPU_37XX_HOST_MMU_GERROR); 842 gerrorn_val = REGV_RD32(VPU_37XX_HOST_MMU_GERRORN); 843 844 active = gerror_val ^ gerrorn_val; 845 if (!(active & IVPU_MMU_GERROR_ERR_MASK)) 846 return; 847 848 if (REG_TEST_FLD(VPU_37XX_HOST_MMU_GERROR, MSI_ABT, active)) 849 ivpu_warn_ratelimited(vdev, "MMU MSI ABT write aborted\n"); 850 851 if (REG_TEST_FLD(VPU_37XX_HOST_MMU_GERROR, MSI_PRIQ_ABT, active)) 852 ivpu_warn_ratelimited(vdev, "MMU PRIQ MSI ABT write aborted\n"); 853 854 if (REG_TEST_FLD(VPU_37XX_HOST_MMU_GERROR, MSI_EVTQ_ABT, active)) 855 ivpu_warn_ratelimited(vdev, "MMU EVTQ MSI ABT write aborted\n"); 856 857 if (REG_TEST_FLD(VPU_37XX_HOST_MMU_GERROR, MSI_CMDQ_ABT, active)) 858 ivpu_warn_ratelimited(vdev, "MMU CMDQ MSI ABT write aborted\n"); 859 860 if (REG_TEST_FLD(VPU_37XX_HOST_MMU_GERROR, PRIQ_ABT, active)) 861 ivpu_err_ratelimited(vdev, "MMU PRIQ write aborted\n"); 862 863 if (REG_TEST_FLD(VPU_37XX_HOST_MMU_GERROR, EVTQ_ABT, active)) 864 ivpu_err_ratelimited(vdev, "MMU EVTQ write aborted\n"); 865 866 if (REG_TEST_FLD(VPU_37XX_HOST_MMU_GERROR, CMDQ, active)) 867 ivpu_err_ratelimited(vdev, "MMU CMDQ write aborted\n"); 868 869 REGV_WR32(VPU_37XX_HOST_MMU_GERRORN, gerror_val); 870 } 871 872 int ivpu_mmu_set_pgtable(struct ivpu_device *vdev, int ssid, struct ivpu_mmu_pgtable *pgtable) 873 { 874 return ivpu_mmu_cd_add_user(vdev, ssid, pgtable->pgd_dma); 875 } 876 877 void ivpu_mmu_clear_pgtable(struct ivpu_device *vdev, int ssid) 878 { 879 ivpu_mmu_cd_add_user(vdev, ssid, 0); /* 0 will clear CD entry */ 880 } 881