1 /* 2 * Copyright 2014 IBM Corp. 3 * 4 * This program is free software; you can redistribute it and/or 5 * modify it under the terms of the GNU General Public License 6 * as published by the Free Software Foundation; either version 7 * 2 of the License, or (at your option) any later version. 8 */ 9 10 #include <linux/spinlock.h> 11 #include <linux/sched.h> 12 #include <linux/slab.h> 13 #include <linux/sched.h> 14 #include <linux/mutex.h> 15 #include <linux/mm.h> 16 #include <linux/uaccess.h> 17 #include <asm/synch.h> 18 #include <misc/cxl.h> 19 20 #include "cxl.h" 21 22 static int afu_control(struct cxl_afu *afu, u64 command, 23 u64 result, u64 mask, bool enabled) 24 { 25 u64 AFU_Cntl = cxl_p2n_read(afu, CXL_AFU_Cntl_An); 26 unsigned long timeout = jiffies + (HZ * CXL_TIMEOUT); 27 28 spin_lock(&afu->afu_cntl_lock); 29 pr_devel("AFU command starting: %llx\n", command); 30 31 cxl_p2n_write(afu, CXL_AFU_Cntl_An, AFU_Cntl | command); 32 33 AFU_Cntl = cxl_p2n_read(afu, CXL_AFU_Cntl_An); 34 while ((AFU_Cntl & mask) != result) { 35 if (time_after_eq(jiffies, timeout)) { 36 dev_warn(&afu->dev, "WARNING: AFU control timed out!\n"); 37 spin_unlock(&afu->afu_cntl_lock); 38 return -EBUSY; 39 } 40 pr_devel_ratelimited("AFU control... (0x%.16llx)\n", 41 AFU_Cntl | command); 42 cpu_relax(); 43 AFU_Cntl = cxl_p2n_read(afu, CXL_AFU_Cntl_An); 44 }; 45 pr_devel("AFU command complete: %llx\n", command); 46 afu->enabled = enabled; 47 spin_unlock(&afu->afu_cntl_lock); 48 49 return 0; 50 } 51 52 static int afu_enable(struct cxl_afu *afu) 53 { 54 pr_devel("AFU enable request\n"); 55 56 return afu_control(afu, CXL_AFU_Cntl_An_E, 57 CXL_AFU_Cntl_An_ES_Enabled, 58 CXL_AFU_Cntl_An_ES_MASK, true); 59 } 60 61 int cxl_afu_disable(struct cxl_afu *afu) 62 { 63 pr_devel("AFU disable request\n"); 64 65 return afu_control(afu, 0, CXL_AFU_Cntl_An_ES_Disabled, 66 CXL_AFU_Cntl_An_ES_MASK, false); 67 } 68 69 /* This will disable as well as reset */ 70 int cxl_afu_reset(struct cxl_afu *afu) 71 { 72 pr_devel("AFU reset request\n"); 73 74 return afu_control(afu, CXL_AFU_Cntl_An_RA, 75 CXL_AFU_Cntl_An_RS_Complete | CXL_AFU_Cntl_An_ES_Disabled, 76 CXL_AFU_Cntl_An_RS_MASK | CXL_AFU_Cntl_An_ES_MASK, 77 false); 78 } 79 80 static int afu_check_and_enable(struct cxl_afu *afu) 81 { 82 if (afu->enabled) 83 return 0; 84 return afu_enable(afu); 85 } 86 87 int cxl_psl_purge(struct cxl_afu *afu) 88 { 89 u64 PSL_CNTL = cxl_p1n_read(afu, CXL_PSL_SCNTL_An); 90 u64 AFU_Cntl = cxl_p2n_read(afu, CXL_AFU_Cntl_An); 91 u64 dsisr, dar; 92 u64 start, end; 93 unsigned long timeout = jiffies + (HZ * CXL_TIMEOUT); 94 95 pr_devel("PSL purge request\n"); 96 97 if ((AFU_Cntl & CXL_AFU_Cntl_An_ES_MASK) != CXL_AFU_Cntl_An_ES_Disabled) { 98 WARN(1, "psl_purge request while AFU not disabled!\n"); 99 cxl_afu_disable(afu); 100 } 101 102 cxl_p1n_write(afu, CXL_PSL_SCNTL_An, 103 PSL_CNTL | CXL_PSL_SCNTL_An_Pc); 104 start = local_clock(); 105 PSL_CNTL = cxl_p1n_read(afu, CXL_PSL_SCNTL_An); 106 while ((PSL_CNTL & CXL_PSL_SCNTL_An_Ps_MASK) 107 == CXL_PSL_SCNTL_An_Ps_Pending) { 108 if (time_after_eq(jiffies, timeout)) { 109 dev_warn(&afu->dev, "WARNING: PSL Purge timed out!\n"); 110 return -EBUSY; 111 } 112 dsisr = cxl_p2n_read(afu, CXL_PSL_DSISR_An); 113 pr_devel_ratelimited("PSL purging... PSL_CNTL: 0x%.16llx PSL_DSISR: 0x%.16llx\n", PSL_CNTL, dsisr); 114 if (dsisr & CXL_PSL_DSISR_TRANS) { 115 dar = cxl_p2n_read(afu, CXL_PSL_DAR_An); 116 dev_notice(&afu->dev, "PSL purge terminating pending translation, DSISR: 0x%.16llx, DAR: 0x%.16llx\n", dsisr, dar); 117 cxl_p2n_write(afu, CXL_PSL_TFC_An, CXL_PSL_TFC_An_AE); 118 } else if (dsisr) { 119 dev_notice(&afu->dev, "PSL purge acknowledging pending non-translation fault, DSISR: 0x%.16llx\n", dsisr); 120 cxl_p2n_write(afu, CXL_PSL_TFC_An, CXL_PSL_TFC_An_A); 121 } else { 122 cpu_relax(); 123 } 124 PSL_CNTL = cxl_p1n_read(afu, CXL_PSL_SCNTL_An); 125 }; 126 end = local_clock(); 127 pr_devel("PSL purged in %lld ns\n", end - start); 128 129 cxl_p1n_write(afu, CXL_PSL_SCNTL_An, 130 PSL_CNTL & ~CXL_PSL_SCNTL_An_Pc); 131 return 0; 132 } 133 134 static int spa_max_procs(int spa_size) 135 { 136 /* 137 * From the CAIA: 138 * end_of_SPA_area = SPA_Base + ((n+4) * 128) + (( ((n*8) + 127) >> 7) * 128) + 255 139 * Most of that junk is really just an overly-complicated way of saying 140 * the last 256 bytes are __aligned(128), so it's really: 141 * end_of_SPA_area = end_of_PSL_queue_area + __aligned(128) 255 142 * and 143 * end_of_PSL_queue_area = SPA_Base + ((n+4) * 128) + (n*8) - 1 144 * so 145 * sizeof(SPA) = ((n+4) * 128) + (n*8) + __aligned(128) 256 146 * Ignore the alignment (which is safe in this case as long as we are 147 * careful with our rounding) and solve for n: 148 */ 149 return ((spa_size / 8) - 96) / 17; 150 } 151 152 static int alloc_spa(struct cxl_afu *afu) 153 { 154 u64 spap; 155 156 /* Work out how many pages to allocate */ 157 afu->spa_order = 0; 158 do { 159 afu->spa_order++; 160 afu->spa_size = (1 << afu->spa_order) * PAGE_SIZE; 161 afu->spa_max_procs = spa_max_procs(afu->spa_size); 162 } while (afu->spa_max_procs < afu->num_procs); 163 164 WARN_ON(afu->spa_size > 0x100000); /* Max size supported by the hardware */ 165 166 if (!(afu->spa = (struct cxl_process_element *) 167 __get_free_pages(GFP_KERNEL | __GFP_ZERO, afu->spa_order))) { 168 pr_err("cxl_alloc_spa: Unable to allocate scheduled process area\n"); 169 return -ENOMEM; 170 } 171 pr_devel("spa pages: %i afu->spa_max_procs: %i afu->num_procs: %i\n", 172 1<<afu->spa_order, afu->spa_max_procs, afu->num_procs); 173 174 afu->sw_command_status = (__be64 *)((char *)afu->spa + 175 ((afu->spa_max_procs + 3) * 128)); 176 177 spap = virt_to_phys(afu->spa) & CXL_PSL_SPAP_Addr; 178 spap |= ((afu->spa_size >> (12 - CXL_PSL_SPAP_Size_Shift)) - 1) & CXL_PSL_SPAP_Size; 179 spap |= CXL_PSL_SPAP_V; 180 pr_devel("cxl: SPA allocated at 0x%p. Max processes: %i, sw_command_status: 0x%p CXL_PSL_SPAP_An=0x%016llx\n", afu->spa, afu->spa_max_procs, afu->sw_command_status, spap); 181 cxl_p1n_write(afu, CXL_PSL_SPAP_An, spap); 182 183 return 0; 184 } 185 186 static void release_spa(struct cxl_afu *afu) 187 { 188 free_pages((unsigned long) afu->spa, afu->spa_order); 189 } 190 191 int cxl_tlb_slb_invalidate(struct cxl *adapter) 192 { 193 unsigned long timeout = jiffies + (HZ * CXL_TIMEOUT); 194 195 pr_devel("CXL adapter wide TLBIA & SLBIA\n"); 196 197 cxl_p1_write(adapter, CXL_PSL_AFUSEL, CXL_PSL_AFUSEL_A); 198 199 cxl_p1_write(adapter, CXL_PSL_TLBIA, CXL_TLB_SLB_IQ_ALL); 200 while (cxl_p1_read(adapter, CXL_PSL_TLBIA) & CXL_TLB_SLB_P) { 201 if (time_after_eq(jiffies, timeout)) { 202 dev_warn(&adapter->dev, "WARNING: CXL adapter wide TLBIA timed out!\n"); 203 return -EBUSY; 204 } 205 cpu_relax(); 206 } 207 208 cxl_p1_write(adapter, CXL_PSL_SLBIA, CXL_TLB_SLB_IQ_ALL); 209 while (cxl_p1_read(adapter, CXL_PSL_SLBIA) & CXL_TLB_SLB_P) { 210 if (time_after_eq(jiffies, timeout)) { 211 dev_warn(&adapter->dev, "WARNING: CXL adapter wide SLBIA timed out!\n"); 212 return -EBUSY; 213 } 214 cpu_relax(); 215 } 216 return 0; 217 } 218 219 int cxl_afu_slbia(struct cxl_afu *afu) 220 { 221 unsigned long timeout = jiffies + (HZ * CXL_TIMEOUT); 222 223 pr_devel("cxl_afu_slbia issuing SLBIA command\n"); 224 cxl_p2n_write(afu, CXL_SLBIA_An, CXL_TLB_SLB_IQ_ALL); 225 while (cxl_p2n_read(afu, CXL_SLBIA_An) & CXL_TLB_SLB_P) { 226 if (time_after_eq(jiffies, timeout)) { 227 dev_warn(&afu->dev, "WARNING: CXL AFU SLBIA timed out!\n"); 228 return -EBUSY; 229 } 230 cpu_relax(); 231 } 232 return 0; 233 } 234 235 static int cxl_write_sstp(struct cxl_afu *afu, u64 sstp0, u64 sstp1) 236 { 237 int rc; 238 239 /* 1. Disable SSTP by writing 0 to SSTP1[V] */ 240 cxl_p2n_write(afu, CXL_SSTP1_An, 0); 241 242 /* 2. Invalidate all SLB entries */ 243 if ((rc = cxl_afu_slbia(afu))) 244 return rc; 245 246 /* 3. Set SSTP0_An */ 247 cxl_p2n_write(afu, CXL_SSTP0_An, sstp0); 248 249 /* 4. Set SSTP1_An */ 250 cxl_p2n_write(afu, CXL_SSTP1_An, sstp1); 251 252 return 0; 253 } 254 255 /* Using per slice version may improve performance here. (ie. SLBIA_An) */ 256 static void slb_invalid(struct cxl_context *ctx) 257 { 258 struct cxl *adapter = ctx->afu->adapter; 259 u64 slbia; 260 261 WARN_ON(!mutex_is_locked(&ctx->afu->spa_mutex)); 262 263 cxl_p1_write(adapter, CXL_PSL_LBISEL, 264 ((u64)be32_to_cpu(ctx->elem->common.pid) << 32) | 265 be32_to_cpu(ctx->elem->lpid)); 266 cxl_p1_write(adapter, CXL_PSL_SLBIA, CXL_TLB_SLB_IQ_LPIDPID); 267 268 while (1) { 269 slbia = cxl_p1_read(adapter, CXL_PSL_SLBIA); 270 if (!(slbia & CXL_TLB_SLB_P)) 271 break; 272 cpu_relax(); 273 } 274 } 275 276 static int do_process_element_cmd(struct cxl_context *ctx, 277 u64 cmd, u64 pe_state) 278 { 279 u64 state; 280 281 WARN_ON(!ctx->afu->enabled); 282 283 ctx->elem->software_state = cpu_to_be32(pe_state); 284 smp_wmb(); 285 *(ctx->afu->sw_command_status) = cpu_to_be64(cmd | 0 | ctx->pe); 286 smp_mb(); 287 cxl_p1n_write(ctx->afu, CXL_PSL_LLCMD_An, cmd | ctx->pe); 288 while (1) { 289 state = be64_to_cpup(ctx->afu->sw_command_status); 290 if (state == ~0ULL) { 291 pr_err("cxl: Error adding process element to AFU\n"); 292 return -1; 293 } 294 if ((state & (CXL_SPA_SW_CMD_MASK | CXL_SPA_SW_STATE_MASK | CXL_SPA_SW_LINK_MASK)) == 295 (cmd | (cmd >> 16) | ctx->pe)) 296 break; 297 /* 298 * The command won't finish in the PSL if there are 299 * outstanding DSIs. Hence we need to yield here in 300 * case there are outstanding DSIs that we need to 301 * service. Tuning possiblity: we could wait for a 302 * while before sched 303 */ 304 schedule(); 305 306 } 307 return 0; 308 } 309 310 static int add_process_element(struct cxl_context *ctx) 311 { 312 int rc = 0; 313 314 mutex_lock(&ctx->afu->spa_mutex); 315 pr_devel("%s Adding pe: %i started\n", __func__, ctx->pe); 316 if (!(rc = do_process_element_cmd(ctx, CXL_SPA_SW_CMD_ADD, CXL_PE_SOFTWARE_STATE_V))) 317 ctx->pe_inserted = true; 318 pr_devel("%s Adding pe: %i finished\n", __func__, ctx->pe); 319 mutex_unlock(&ctx->afu->spa_mutex); 320 return rc; 321 } 322 323 static int terminate_process_element(struct cxl_context *ctx) 324 { 325 int rc = 0; 326 327 /* fast path terminate if it's already invalid */ 328 if (!(ctx->elem->software_state & cpu_to_be32(CXL_PE_SOFTWARE_STATE_V))) 329 return rc; 330 331 mutex_lock(&ctx->afu->spa_mutex); 332 pr_devel("%s Terminate pe: %i started\n", __func__, ctx->pe); 333 rc = do_process_element_cmd(ctx, CXL_SPA_SW_CMD_TERMINATE, 334 CXL_PE_SOFTWARE_STATE_V | CXL_PE_SOFTWARE_STATE_T); 335 ctx->elem->software_state = 0; /* Remove Valid bit */ 336 pr_devel("%s Terminate pe: %i finished\n", __func__, ctx->pe); 337 mutex_unlock(&ctx->afu->spa_mutex); 338 return rc; 339 } 340 341 static int remove_process_element(struct cxl_context *ctx) 342 { 343 int rc = 0; 344 345 mutex_lock(&ctx->afu->spa_mutex); 346 pr_devel("%s Remove pe: %i started\n", __func__, ctx->pe); 347 if (!(rc = do_process_element_cmd(ctx, CXL_SPA_SW_CMD_REMOVE, 0))) 348 ctx->pe_inserted = false; 349 slb_invalid(ctx); 350 pr_devel("%s Remove pe: %i finished\n", __func__, ctx->pe); 351 mutex_unlock(&ctx->afu->spa_mutex); 352 353 return rc; 354 } 355 356 357 static void assign_psn_space(struct cxl_context *ctx) 358 { 359 if (!ctx->afu->pp_size || ctx->master) { 360 ctx->psn_phys = ctx->afu->psn_phys; 361 ctx->psn_size = ctx->afu->adapter->ps_size; 362 } else { 363 ctx->psn_phys = ctx->afu->psn_phys + 364 (ctx->afu->pp_offset + ctx->afu->pp_size * ctx->pe); 365 ctx->psn_size = ctx->afu->pp_size; 366 } 367 } 368 369 static int activate_afu_directed(struct cxl_afu *afu) 370 { 371 int rc; 372 373 dev_info(&afu->dev, "Activating AFU directed mode\n"); 374 375 if (alloc_spa(afu)) 376 return -ENOMEM; 377 378 cxl_p1n_write(afu, CXL_PSL_SCNTL_An, CXL_PSL_SCNTL_An_PM_AFU); 379 cxl_p1n_write(afu, CXL_PSL_AMOR_An, 0xFFFFFFFFFFFFFFFFULL); 380 cxl_p1n_write(afu, CXL_PSL_ID_An, CXL_PSL_ID_An_F | CXL_PSL_ID_An_L); 381 382 afu->current_mode = CXL_MODE_DIRECTED; 383 afu->num_procs = afu->max_procs_virtualised; 384 385 if ((rc = cxl_chardev_m_afu_add(afu))) 386 return rc; 387 388 if ((rc = cxl_sysfs_afu_m_add(afu))) 389 goto err; 390 391 if ((rc = cxl_chardev_s_afu_add(afu))) 392 goto err1; 393 394 return 0; 395 err1: 396 cxl_sysfs_afu_m_remove(afu); 397 err: 398 cxl_chardev_afu_remove(afu); 399 return rc; 400 } 401 402 #ifdef CONFIG_CPU_LITTLE_ENDIAN 403 #define set_endian(sr) ((sr) |= CXL_PSL_SR_An_LE) 404 #else 405 #define set_endian(sr) ((sr) &= ~(CXL_PSL_SR_An_LE)) 406 #endif 407 408 static int attach_afu_directed(struct cxl_context *ctx, u64 wed, u64 amr) 409 { 410 u64 sr; 411 int r, result; 412 413 assign_psn_space(ctx); 414 415 ctx->elem->ctxtime = 0; /* disable */ 416 ctx->elem->lpid = cpu_to_be32(mfspr(SPRN_LPID)); 417 ctx->elem->haurp = 0; /* disable */ 418 ctx->elem->sdr = cpu_to_be64(mfspr(SPRN_SDR1)); 419 420 sr = 0; 421 if (ctx->master) 422 sr |= CXL_PSL_SR_An_MP; 423 if (mfspr(SPRN_LPCR) & LPCR_TC) 424 sr |= CXL_PSL_SR_An_TC; 425 /* HV=0, PR=1, R=1 for userspace 426 * For kernel contexts: this would need to change 427 */ 428 sr |= CXL_PSL_SR_An_PR | CXL_PSL_SR_An_R; 429 set_endian(sr); 430 sr &= ~(CXL_PSL_SR_An_HV); 431 if (!test_tsk_thread_flag(current, TIF_32BIT)) 432 sr |= CXL_PSL_SR_An_SF; 433 ctx->elem->common.pid = cpu_to_be32(current->pid); 434 ctx->elem->common.tid = 0; 435 ctx->elem->sr = cpu_to_be64(sr); 436 437 ctx->elem->common.csrp = 0; /* disable */ 438 ctx->elem->common.aurp0 = 0; /* disable */ 439 ctx->elem->common.aurp1 = 0; /* disable */ 440 441 cxl_prefault(ctx, wed); 442 443 ctx->elem->common.sstp0 = cpu_to_be64(ctx->sstp0); 444 ctx->elem->common.sstp1 = cpu_to_be64(ctx->sstp1); 445 446 for (r = 0; r < CXL_IRQ_RANGES; r++) { 447 ctx->elem->ivte_offsets[r] = cpu_to_be16(ctx->irqs.offset[r]); 448 ctx->elem->ivte_ranges[r] = cpu_to_be16(ctx->irqs.range[r]); 449 } 450 451 ctx->elem->common.amr = cpu_to_be64(amr); 452 ctx->elem->common.wed = cpu_to_be64(wed); 453 454 /* first guy needs to enable */ 455 if ((result = afu_check_and_enable(ctx->afu))) 456 return result; 457 458 add_process_element(ctx); 459 460 return 0; 461 } 462 463 static int deactivate_afu_directed(struct cxl_afu *afu) 464 { 465 dev_info(&afu->dev, "Deactivating AFU directed mode\n"); 466 467 afu->current_mode = 0; 468 afu->num_procs = 0; 469 470 cxl_sysfs_afu_m_remove(afu); 471 cxl_chardev_afu_remove(afu); 472 473 cxl_afu_reset(afu); 474 cxl_afu_disable(afu); 475 cxl_psl_purge(afu); 476 477 release_spa(afu); 478 479 return 0; 480 } 481 482 static int activate_dedicated_process(struct cxl_afu *afu) 483 { 484 dev_info(&afu->dev, "Activating dedicated process mode\n"); 485 486 cxl_p1n_write(afu, CXL_PSL_SCNTL_An, CXL_PSL_SCNTL_An_PM_Process); 487 488 cxl_p1n_write(afu, CXL_PSL_CtxTime_An, 0); /* disable */ 489 cxl_p1n_write(afu, CXL_PSL_SPAP_An, 0); /* disable */ 490 cxl_p1n_write(afu, CXL_PSL_AMOR_An, 0xFFFFFFFFFFFFFFFFULL); 491 cxl_p1n_write(afu, CXL_PSL_LPID_An, mfspr(SPRN_LPID)); 492 cxl_p1n_write(afu, CXL_HAURP_An, 0); /* disable */ 493 cxl_p1n_write(afu, CXL_PSL_SDR_An, mfspr(SPRN_SDR1)); 494 495 cxl_p2n_write(afu, CXL_CSRP_An, 0); /* disable */ 496 cxl_p2n_write(afu, CXL_AURP0_An, 0); /* disable */ 497 cxl_p2n_write(afu, CXL_AURP1_An, 0); /* disable */ 498 499 afu->current_mode = CXL_MODE_DEDICATED; 500 afu->num_procs = 1; 501 502 return cxl_chardev_d_afu_add(afu); 503 } 504 505 static int attach_dedicated(struct cxl_context *ctx, u64 wed, u64 amr) 506 { 507 struct cxl_afu *afu = ctx->afu; 508 u64 sr; 509 int rc; 510 511 sr = 0; 512 set_endian(sr); 513 if (ctx->master) 514 sr |= CXL_PSL_SR_An_MP; 515 if (mfspr(SPRN_LPCR) & LPCR_TC) 516 sr |= CXL_PSL_SR_An_TC; 517 sr |= CXL_PSL_SR_An_PR | CXL_PSL_SR_An_R; 518 if (!test_tsk_thread_flag(current, TIF_32BIT)) 519 sr |= CXL_PSL_SR_An_SF; 520 cxl_p2n_write(afu, CXL_PSL_PID_TID_An, (u64)current->pid << 32); 521 cxl_p1n_write(afu, CXL_PSL_SR_An, sr); 522 523 if ((rc = cxl_write_sstp(afu, ctx->sstp0, ctx->sstp1))) 524 return rc; 525 526 cxl_prefault(ctx, wed); 527 528 cxl_p1n_write(afu, CXL_PSL_IVTE_Offset_An, 529 (((u64)ctx->irqs.offset[0] & 0xffff) << 48) | 530 (((u64)ctx->irqs.offset[1] & 0xffff) << 32) | 531 (((u64)ctx->irqs.offset[2] & 0xffff) << 16) | 532 ((u64)ctx->irqs.offset[3] & 0xffff)); 533 cxl_p1n_write(afu, CXL_PSL_IVTE_Limit_An, (u64) 534 (((u64)ctx->irqs.range[0] & 0xffff) << 48) | 535 (((u64)ctx->irqs.range[1] & 0xffff) << 32) | 536 (((u64)ctx->irqs.range[2] & 0xffff) << 16) | 537 ((u64)ctx->irqs.range[3] & 0xffff)); 538 539 cxl_p2n_write(afu, CXL_PSL_AMR_An, amr); 540 541 /* master only context for dedicated */ 542 assign_psn_space(ctx); 543 544 if ((rc = cxl_afu_reset(afu))) 545 return rc; 546 547 cxl_p2n_write(afu, CXL_PSL_WED_An, wed); 548 549 return afu_enable(afu); 550 } 551 552 static int deactivate_dedicated_process(struct cxl_afu *afu) 553 { 554 dev_info(&afu->dev, "Deactivating dedicated process mode\n"); 555 556 afu->current_mode = 0; 557 afu->num_procs = 0; 558 559 cxl_chardev_afu_remove(afu); 560 561 return 0; 562 } 563 564 int _cxl_afu_deactivate_mode(struct cxl_afu *afu, int mode) 565 { 566 if (mode == CXL_MODE_DIRECTED) 567 return deactivate_afu_directed(afu); 568 if (mode == CXL_MODE_DEDICATED) 569 return deactivate_dedicated_process(afu); 570 return 0; 571 } 572 573 int cxl_afu_deactivate_mode(struct cxl_afu *afu) 574 { 575 return _cxl_afu_deactivate_mode(afu, afu->current_mode); 576 } 577 578 int cxl_afu_activate_mode(struct cxl_afu *afu, int mode) 579 { 580 if (!mode) 581 return 0; 582 if (!(mode & afu->modes_supported)) 583 return -EINVAL; 584 585 if (mode == CXL_MODE_DIRECTED) 586 return activate_afu_directed(afu); 587 if (mode == CXL_MODE_DEDICATED) 588 return activate_dedicated_process(afu); 589 590 return -EINVAL; 591 } 592 593 int cxl_attach_process(struct cxl_context *ctx, bool kernel, u64 wed, u64 amr) 594 { 595 ctx->kernel = kernel; 596 if (ctx->afu->current_mode == CXL_MODE_DIRECTED) 597 return attach_afu_directed(ctx, wed, amr); 598 599 if (ctx->afu->current_mode == CXL_MODE_DEDICATED) 600 return attach_dedicated(ctx, wed, amr); 601 602 return -EINVAL; 603 } 604 605 static inline int detach_process_native_dedicated(struct cxl_context *ctx) 606 { 607 cxl_afu_reset(ctx->afu); 608 cxl_afu_disable(ctx->afu); 609 cxl_psl_purge(ctx->afu); 610 return 0; 611 } 612 613 /* 614 * TODO: handle case when this is called inside a rcu_read_lock() which may 615 * happen when we unbind the driver (ie. cxl_context_detach_all()) . Terminate 616 * & remove use a mutex lock and schedule which will not good with lock held. 617 * May need to write do_process_element_cmd() that handles outstanding page 618 * faults synchronously. 619 */ 620 static inline int detach_process_native_afu_directed(struct cxl_context *ctx) 621 { 622 if (!ctx->pe_inserted) 623 return 0; 624 if (terminate_process_element(ctx)) 625 return -1; 626 if (remove_process_element(ctx)) 627 return -1; 628 629 return 0; 630 } 631 632 int cxl_detach_process(struct cxl_context *ctx) 633 { 634 if (ctx->afu->current_mode == CXL_MODE_DEDICATED) 635 return detach_process_native_dedicated(ctx); 636 637 return detach_process_native_afu_directed(ctx); 638 } 639 640 int cxl_get_irq(struct cxl_context *ctx, struct cxl_irq_info *info) 641 { 642 u64 pidtid; 643 644 info->dsisr = cxl_p2n_read(ctx->afu, CXL_PSL_DSISR_An); 645 info->dar = cxl_p2n_read(ctx->afu, CXL_PSL_DAR_An); 646 info->dsr = cxl_p2n_read(ctx->afu, CXL_PSL_DSR_An); 647 pidtid = cxl_p2n_read(ctx->afu, CXL_PSL_PID_TID_An); 648 info->pid = pidtid >> 32; 649 info->tid = pidtid & 0xffffffff; 650 info->afu_err = cxl_p2n_read(ctx->afu, CXL_AFU_ERR_An); 651 info->errstat = cxl_p2n_read(ctx->afu, CXL_PSL_ErrStat_An); 652 653 return 0; 654 } 655 656 static void recover_psl_err(struct cxl_afu *afu, u64 errstat) 657 { 658 u64 dsisr; 659 660 pr_devel("RECOVERING FROM PSL ERROR... (0x%.16llx)\n", errstat); 661 662 /* Clear PSL_DSISR[PE] */ 663 dsisr = cxl_p2n_read(afu, CXL_PSL_DSISR_An); 664 cxl_p2n_write(afu, CXL_PSL_DSISR_An, dsisr & ~CXL_PSL_DSISR_An_PE); 665 666 /* Write 1s to clear error status bits */ 667 cxl_p2n_write(afu, CXL_PSL_ErrStat_An, errstat); 668 } 669 670 int cxl_ack_irq(struct cxl_context *ctx, u64 tfc, u64 psl_reset_mask) 671 { 672 if (tfc) 673 cxl_p2n_write(ctx->afu, CXL_PSL_TFC_An, tfc); 674 if (psl_reset_mask) 675 recover_psl_err(ctx->afu, psl_reset_mask); 676 677 return 0; 678 } 679 680 int cxl_check_error(struct cxl_afu *afu) 681 { 682 return (cxl_p1n_read(afu, CXL_PSL_SCNTL_An) == ~0ULL); 683 } 684