// SPDX-License-Identifier: MIT
/*
 * Copyright © 2019 Intel Corporation
 */

#include "gem/i915_gem_context.h"
#include "gem/i915_gem_pm.h"

#include "i915_drv.h"
#include "i915_trace.h"

#include "intel_context.h"
#include "intel_engine.h"
#include "intel_engine_pm.h"
#include "intel_ring.h"

/* Slab cache backing every struct intel_context allocated in this file. */
static struct kmem_cache *slab_ce;

/*
 * Allocate a zero-filled intel_context from slab_ce.
 *
 * Returns the new object, or NULL if the allocation fails (the caller,
 * intel_context_create(), checks for NULL).
 */
static struct intel_context *intel_context_alloc(void)
{
	return kmem_cache_zalloc(slab_ce, GFP_KERNEL);
}

/*
 * RCU callback queued by intel_context_free(): recover the context from its
 * embedded rcu_head, emit the free tracepoint and hand the memory back to
 * slab_ce.
 */
static void rcu_context_free(struct rcu_head *rcu)
{
	struct intel_context *ce = container_of(rcu, typeof(*ce), rcu);

	trace_intel_context_free(ce);
	kmem_cache_free(slab_ce, ce);
}

/*
 * Release the memory of @ce. The actual free is deferred through call_rcu()
 * and performed by rcu_context_free().
 */
void intel_context_free(struct intel_context *ce)
{
	call_rcu(&ce->rcu, rcu_context_free);
}

/*
 * Allocate a context and initialise it for @engine via intel_context_init().
 *
 * Returns the new context, or ERR_PTR(-ENOMEM) if the allocation fails.
 */
struct intel_context *
intel_context_create(struct intel_engine_cs *engine)
{
	struct intel_context *ce;

	ce = intel_context_alloc();
	if (!ce)
		return ERR_PTR(-ENOMEM);

	intel_context_init(ce, engine);
	trace_intel_context_create(ce);
	return ce;
}

/*
 * Run the backend ce->ops->alloc() hook once for @ce.
 *
 * The whole check-and-allocate sequence is serialised by ce->pin_mutex and
 * CONTEXT_ALLOC_BIT records that the hook has already succeeded, so later
 * calls return 0 without calling it again.
 *
 * Returns 0 on success (or if already allocated), -EINTR if taking the mutex
 * was interrupted, -EIO if the context is banned, or the error returned by
 * ce->ops->alloc().
 */
int intel_context_alloc_state(struct intel_context *ce)
{
	int err = 0;

	/* Any failure to take the mutex is reported as -EINTR */
	if (mutex_lock_interruptible(&ce->pin_mutex))
		return -EINTR;

	if (!test_bit(CONTEXT_ALLOC_BIT, &ce->flags)) {
		/* Do not allocate backing state for a banned context */
		if (intel_context_is_banned(ce)) {
			err = -EIO;
			goto unlock;
		}

		err = ce->ops->alloc(ce);
		if (unlikely(err))
			goto unlock;

		/* Only mark as allocated once the hook has succeeded */
		set_bit(CONTEXT_ALLOC_BIT, &ce->flags);
	}

unlock:
	mutex_unlock(&ce->pin_mutex);
	return err;
}

/*
 * Take a reference on ce->active for a new pin and, except for barrier
 * contexts and engines using GuC submission, preallocate the barrier
 * tracking nodes for ce->engine.
 *
 * Returns 0 on success. If the preallocation fails, the reference taken
 * here is dropped again and the error is returned.
 */
static int intel_context_active_acquire(struct intel_context *ce)
{
	int err;

	__i915_active_acquire(&ce->active);

	/* These contexts do not get barrier nodes preallocated */
	if (intel_context_is_barrier(ce) || intel_engine_uses_guc(ce->engine))
		return 0;

	/* Preallocate tracking nodes */
	err = i915_active_acquire_preallocate_barrier(&ce->active,
						      ce->engine);
	if (err)
		i915_active_release(&ce->active);

	return err;
}

/*
 * Counterpart of intel_context_active_acquire(): hand over the barrier nodes
 * and drop the reference on ce->active.
 */
static void intel_context_active_release(struct intel_context *ce)
{
	/* Nodes preallocated in intel_context_active_acquire() */
	i915_active_acquire_barrier(&ce->active);
	i915_active_release(&ce->active);
}

/*
 * Pin the context state @vma into the GGTT under @ww and keep it active.
 *
 * The pin uses i915_ggtt_pin_bias() as an offset bias together with
 * PIN_HIGH. On success the vma is marked unshrinkable and its object dirty.
 *
 * Returns 0 on success or a negative error code; on failure the vma is left
 * unpinned.
 */
static int __context_pin_state(struct i915_vma *vma, struct i915_gem_ww_ctx *ww)
{
	unsigned int bias = i915_ggtt_pin_bias(vma) | PIN_OFFSET_BIAS;
	int err;

	err = i915_ggtt_pin(vma, ww, 0, bias | PIN_HIGH);
	if (err)
		return err;

	err = i915_active_acquire(&vma->active);
	if (err)
		goto err_unpin;

	/*
	 * And mark it as a globally pinned object to let the shrinker know
	 * it cannot reclaim the object until we release it.
	 */
	i915_vma_make_unshrinkable(vma);
	vma->obj->mm.dirty = true;

	return 0;

err_unpin:
	i915_vma_unpin(vma);
	return err;
}

/*
 * Undo __context_pin_state(): make the vma shrinkable again, drop the
 * reference on its activity tracker and release the pin.
 */
static void __context_unpin_state(struct i915_vma *vma)
{
	i915_vma_make_shrinkable(vma);
	i915_active_release(&vma->active);
	__i915_vma_unpin(vma);
}

/*
 * Pin @ring under @ww and acquire the activity tracker of its vma.
 *
 * Returns 0 on success or a negative error code; on failure the ring is
 * left unpinned.
 */
static int __ring_active(struct intel_ring *ring,
			 struct i915_gem_ww_ctx *ww)
{
	int err;

	err = intel_ring_pin(ring, ww);
	if (err)
		return err;

	err = i915_active_acquire(&ring->vma->active);
	if (err)
		goto err_pin;

	return 0;

err_pin:
	intel_ring_unpin(ring);
	return err;
}

/* Undo __ring_active(): release the vma activity tracker, then unpin. */
static void __ring_retire(struct intel_ring *ring)
{
	i915_active_release(&ring->vma->active);
	intel_ring_unpin(ring);
}

/*
 * Pin the resources a context needs, in order: ring, timeline and, if the
 * context has one, its state vma.
 *
 * Returns 0 on success. On failure everything pinned so far is released in
 * reverse order and the error is returned.
 */
static int intel_context_pre_pin(struct intel_context *ce,
				 struct i915_gem_ww_ctx *ww)
{
	int err;

	CE_TRACE(ce, "active\n");

	err = __ring_active(ce->ring, ww);
	if (err)
		return err;

	err = intel_timeline_pin(ce->timeline, ww);
	if (err)
		goto err_ring;

	/* Contexts without a state object have nothing more to pin */
	if (!ce->state)
		return 0;

	err = __context_pin_state(ce->state, ww);
	if (err)
		goto err_timeline;


	return 0;

err_timeline:
	intel_timeline_unpin(ce->timeline);
err_ring:
	__ring_retire(ce->ring);
	return err;
}

/*
 * Undo intel_context_pre_pin(): release state (if any), timeline and ring,
 * i.e. the reverse of the order in which they were pinned.
 */
static void intel_context_post_unpin(struct intel_context *ce)
{
	if (ce->state)
		__context_unpin_state(ce->state);

	intel_timeline_unpin(ce->timeline);
	__ring_retire(ce->ring);
}

/*
 * Pin @ce using the caller's ww context.
 *
 * Backend state is allocated first if CONTEXT_ALLOC_BIT is not yet set.
 * The timeline HWSP, ring and state objects are then locked under @ww and
 * pinned, ce->active is acquired and the backend pre_pin() hook is run, all
 * before ce->pin_mutex is taken. Under the mutex, ce->pin_count is either
 * bumped (already pinned) or the first pin is performed through
 * intel_context_active_acquire() and ce->ops->pin().
 *
 * Note that the unwind labels at the end are also executed on success: the
 * references taken before the mutex are temporary and always dropped here.
 *
 * Returns 0 on success or a negative error code. Errors from the object
 * locks (such as -EDEADLK, which __intel_context_do_pin() handles by backing
 * off and retrying) are passed straight back to the caller.
 */
int __intel_context_do_pin_ww(struct intel_context *ce,
			      struct i915_gem_ww_ctx *ww)
{
	/* Set once this call performed the first pin via ce->ops->pin() */
	bool handoff = false;
	void *vaddr;
	int err = 0;

	if (unlikely(!test_bit(CONTEXT_ALLOC_BIT, &ce->flags))) {
		err = intel_context_alloc_state(ce);
		if (err)
			return err;
	}

	/*
	 * We always pin the context/ring/timeline here, to ensure a pin
	 * refcount for __intel_context_active(), which prevents a lock
	 * inversion of ce->pin_mutex vs dma_resv_lock().
	 */

	/* Each step below only runs if all previous ones succeeded */
	err = i915_gem_object_lock(ce->timeline->hwsp_ggtt->obj, ww);
	if (!err && ce->ring->vma->obj)
		err = i915_gem_object_lock(ce->ring->vma->obj, ww);
	if (!err && ce->state)
		err = i915_gem_object_lock(ce->state->obj, ww);
	if (!err)
		err = intel_context_pre_pin(ce, ww);
	if (err)
		return err;

	err = i915_active_acquire(&ce->active);
	if (err)
		goto err_ctx_unpin;

	/* vaddr is filled in by pre_pin() and handed to pin() below */
	err = ce->ops->pre_pin(ce, ww, &vaddr);
	if (err)
		goto err_release;

	err = mutex_lock_interruptible(&ce->pin_mutex);
	if (err)
		goto err_post_unpin;

	intel_engine_pm_might_get(ce->engine);

	if (unlikely(intel_context_is_closed(ce))) {
		err = -ENOENT;
		goto err_unlock;
	}

	/*
	 * atomic_add_unless() increments pin_count only if it is non-zero;
	 * a zero count means this is the first pin and must be set up here.
	 */
	if (likely(!atomic_add_unless(&ce->pin_count, 1, 0))) {
		err = intel_context_active_acquire(ce);
		if (unlikely(err))
			goto err_unlock;

		err = ce->ops->pin(ce, vaddr);
		if (err) {
			intel_context_active_release(ce);
			goto err_unlock;
		}

		CE_TRACE(ce, "pin ring:{start:%08x, head:%04x, tail:%04x}\n",
			 i915_ggtt_offset(ce->ring->vma),
			 ce->ring->head, ce->ring->tail);

		/* The pre_pin() state now belongs to the pinned context */
		handoff = true;
		smp_mb__before_atomic(); /* flush pin before it is visible */
		atomic_inc(&ce->pin_count);
	}

	GEM_BUG_ON(!intel_context_is_pinned(ce)); /* no overflow! */

	trace_intel_context_do_pin(ce);

	/* Success falls through the unwind labels as well */
err_unlock:
	mutex_unlock(&ce->pin_mutex);
err_post_unpin:
	/* Skipped only when pin() above took over the pre_pin() state */
	if (!handoff)
		ce->ops->post_unpin(ce);
err_release:
	i915_active_release(&ce->active);
err_ctx_unpin:
	intel_context_post_unpin(ce);

	/*
	 * Unlock the hwsp_ggtt object since it's shared.
	 * In principle we can unlock all the global state locked above
	 * since it's pinned and doesn't need fencing, and will
	 * thus remain resident until it is explicitly unpinned.
	 */
	i915_gem_ww_unlock_single(ce->timeline->hwsp_ggtt->obj);

	return err;
}

/*
 * Pin @ce using a locally managed ww context.
 *
 * Wraps __intel_context_do_pin_ww(): on -EDEADLK the ww context is backed
 * off and, if the backoff succeeds, the pin is retried.
 *
 * Returns 0 on success or a negative error code.
 */
int __intel_context_do_pin(struct intel_context *ce)
{
	struct i915_gem_ww_ctx ww;
	int err;

	i915_gem_ww_ctx_init(&ww, true);
retry:
	err = __intel_context_do_pin_ww(ce, &ww);
	if (err == -EDEADLK) {
		err = i915_gem_ww_ctx_backoff(&ww);
		if (!err)
			goto retry;
	}
	i915_gem_ww_ctx_fini(&ww);
	return err;
}

/*
 * Drop @sub pins from @ce. Nothing else happens unless this brings
 * ce->pin_count to zero, in which case the backend unpin() and post_unpin()
 * hooks are run and the reference on ce->active is released.
 */
void __intel_context_do_unpin(struct intel_context *ce, int sub)
{
	/* Only the caller that drops the count to zero does the teardown */
	if (!atomic_sub_and_test(sub, &ce->pin_count))
		return;

	CE_TRACE(ce, "unpin\n");
	ce->ops->unpin(ce);
	ce->ops->post_unpin(ce);

	/*
	 * Once released, we may asynchronously drop the active reference.
	 * As that may be the only reference keeping the context alive,
	 * take an extra now so that it is not freed before we finish
	 * dereferencing it.
	 */
	intel_context_get(ce);
	intel_context_active_release(ce);
	trace_intel_context_do_unpin(ce);
	intel_context_put(ce);
}

/*
 * Retire callback of ce->active (registered in intel_context_init()).
 *
 * Logs the context runtime, sets CONTEXT_VALID_BIT, releases the
 * ring/timeline/state pins and drops a context reference.
 */
static void __intel_context_retire(struct i915_active *active)
{
	struct intel_context *ce = container_of(active, typeof(*ce), active);

	CE_TRACE(ce, "retire runtime: { total:%lluns, avg:%lluns }\n",
		 intel_context_get_total_runtime_ns(ce),
		 intel_context_get_avg_runtime_ns(ce));

	set_bit(CONTEXT_VALID_BIT, &ce->flags);
	intel_context_post_unpin(ce);
	/* Presumably pairs with the get in __intel_context_active() */
	intel_context_put(ce);
}

/*
 * Activation callback of ce->active (registered in intel_context_init()).
 *
 * Takes a context reference and an additional pin on the ring, timeline
 * and (if present) state, mirroring what intel_context_post_unpin() later
 * releases from __intel_context_retire(). Always returns 0.
 */
static int __intel_context_active(struct i915_active *active)
{
	struct intel_context *ce = container_of(active, typeof(*ce), active);

	intel_context_get(ce);

	/* everything should already be activated by intel_context_pre_pin() */
	GEM_WARN_ON(!i915_active_acquire_if_busy(&ce->ring->vma->active));
	__intel_ring_pin(ce->ring);

	__intel_timeline_pin(ce->timeline);

	if (ce->state) {
		GEM_WARN_ON(!i915_active_acquire_if_busy(&ce->state->active));
		__i915_vma_pin(ce->state);
		i915_vma_make_unshrinkable(ce->state);
	}

	return 0;
}

/*
 * Notify callback for ce->guc_state.blocked that does nothing: it returns
 * NOTIFY_DONE for every state.
 */
static int __i915_sw_fence_call
sw_fence_dummy_notify(struct i915_sw_fence *sf, enum i915_sw_fence_notify state)
{
	return NOTIFY_DONE;
}

/*
 * Initialise the already allocated context @ce for use on @engine.
 *
 * Sets up the reference count, copies the engine's context ops and sseu,
 * takes a reference on the GT's address space, and initialises the locks,
 * lists, GuC state and activity tracker embedded in the context. The ring
 * is left NULL with a default ring_size of SZ_4K.
 *
 * @engine must have context ops and its GT must have a vm (GEM_BUG_ON).
 */
void
intel_context_init(struct intel_context *ce, struct intel_engine_cs *engine)
{
	GEM_BUG_ON(!engine->cops);
	GEM_BUG_ON(!engine->gt->vm);

	kref_init(&ce->ref);

	ce->engine = engine;
	ce->ops = engine->cops;
	ce->sseu = engine->sseu;
	ce->ring = NULL;
	ce->ring_size = SZ_4K;

	ewma_runtime_init(&ce->runtime.avg);

	/* Reference dropped by i915_vm_put() in intel_context_fini() */
	ce->vm = i915_vm_get(engine->gt->vm);

	/* NB ce->signal_link/lock is used under RCU */
	spin_lock_init(&ce->signal_lock);
	INIT_LIST_HEAD(&ce->signals);

	mutex_init(&ce->pin_mutex);

	spin_lock_init(&ce->guc_state.lock);
	INIT_LIST_HEAD(&ce->guc_state.fences);
	INIT_LIST_HEAD(&ce->guc_state.requests);

	ce->guc_id.id = GUC_INVALID_LRC_ID;
	INIT_LIST_HEAD(&ce->guc_id.link);

	INIT_LIST_HEAD(&ce->destroyed_link);

	INIT_LIST_HEAD(&ce->parallel.child_list);

	/*
	 * Initialize fence to be complete as this is expected to be complete
	 * unless there is a pending schedule disable outstanding.
	 */
	i915_sw_fence_init(&ce->guc_state.blocked,
			   sw_fence_dummy_notify);
	i915_sw_fence_commit(&ce->guc_state.blocked);

	i915_active_init(&ce->active,
			 __intel_context_active, __intel_context_retire, 0);
}

/*
 * Tear down what intel_context_init() set up: drop the timeline (if any)
 * and vm references, put every child of a parent context, and finalise the
 * pin mutex, activity tracker and GuC blocked fence. The memory of @ce
 * itself is not freed here.
 */
void intel_context_fini(struct intel_context *ce)
{
	struct intel_context *child, *next;

	if (ce->timeline)
		intel_timeline_put(ce->timeline);
	i915_vm_put(ce->vm);

	/* Need to put the creation ref for the children */
	if (intel_context_is_parent(ce))
		for_each_child_safe(ce, child, next)
			intel_context_put(child);

	mutex_destroy(&ce->pin_mutex);
	i915_active_fini(&ce->active);
	i915_sw_fence_fini(&ce->guc_state.blocked);
}

/* Module teardown: destroy the intel_context slab cache. */
void i915_context_module_exit(void)
{
	kmem_cache_destroy(slab_ce);
}

/*
 * Module setup: create the intel_context slab cache.
 *
 * Returns 0 on success or -ENOMEM if the cache cannot be created.
 */
int __init i915_context_module_init(void)
{
	slab_ce = KMEM_CACHE(intel_context, SLAB_HWCACHE_ALIGN);
	if (!slab_ce)
		return -ENOMEM;

	return 0;
}

/*
 * Enter hook: take an engine power-management reference, then enter the
 * context's timeline.
 */
void intel_context_enter_engine(struct intel_context *ce)
{
	intel_engine_pm_get(ce->engine);
	intel_timeline_enter(ce->timeline);
}

/*
 * Exit hook: the reverse of intel_context_enter_engine() - exit the
 * timeline, then drop the engine power-management reference.
 */
void intel_context_exit_engine(struct intel_context *ce)
{
	intel_timeline_exit(ce->timeline);
	intel_engine_pm_put(ce->engine);
}

/*
 * Prepare @rq, a request on a different context, to modify @ce.
 *
 * If @rq does not run on @ce's timeline, it is ordered after that
 * timeline's last request. @rq is then added to ce->active so that the
 * context stays pinned until the request is retired.
 *
 * @rq must not belong to @ce and ce->active must not be idle (GEM_BUG_ON).
 *
 * Returns 0 on success or a negative error code.
 */
int intel_context_prepare_remote_request(struct intel_context *ce,
					 struct i915_request *rq)
{
	struct intel_timeline *tl = ce->timeline;
	int err;

	/* Only suitable for use in remotely modifying this context */
	GEM_BUG_ON(rq->context == ce);

	if (rcu_access_pointer(rq->timeline) != tl) { /* timeline sharing! */
		/* Queue this switch after current activity by this context. */
		err = i915_active_fence_set(&tl->last_request, rq);
		if (err)
			return err;
	}

	/*
	 * Guarantee context image and the timeline remains pinned until the
	 * modifying request is retired by setting the ce activity tracker.
	 *
	 * But we only need to take one pin on the account of it. Or in other
	 * words transfer the pinned ce object to tracked active request.
	 */
	GEM_BUG_ON(i915_active_is_idle(&ce->active));
	return i915_active_add_request(&ce->active, rq);
}

/*
 * Create a request on @ce.
 *
 * The context is pinned (retrying after a ww backoff on -EDEADLK) only for
 * the duration of i915_request_create() and unpinned again straight after.
 *
 * Returns the new request or an ERR_PTR() on failure.
 */
struct i915_request *intel_context_create_request(struct intel_context *ce)
{
	struct i915_gem_ww_ctx ww;
	struct i915_request *rq;
	int err;

	i915_gem_ww_ctx_init(&ww, true);
retry:
	err = intel_context_pin_ww(ce, &ww);
	if (!err) {
		rq = i915_request_create(ce);
		intel_context_unpin(ce);
	} else if (err == -EDEADLK) {
		err = i915_gem_ww_ctx_backoff(&ww);
		if (!err)
			goto retry;
		rq = ERR_PTR(err);
	} else {
		rq = ERR_PTR(err);
	}

	i915_gem_ww_ctx_fini(&ww);

	if (IS_ERR(rq))
		return rq;

	/*
	 * timeline->mutex should be the inner lock, but is used as outer lock.
	 * Hack around this to shut up lockdep in selftests..
	 */
	lockdep_unpin_lock(&ce->timeline->mutex, rq->cookie);
	mutex_release(&ce->timeline->mutex.dep_map, _RET_IP_);
	mutex_acquire(&ce->timeline->mutex.dep_map, SINGLE_DEPTH_NESTING, 0, _RET_IP_);
	rq->cookie = lockdep_pin_lock(&ce->timeline->mutex);

	return rq;
}

/*
 * Find an incomplete request belonging to @ce (GuC submission only).
 *
 * The parent's guc_state.requests list is walked from the tail under
 * guc_state.lock. Requests of other contexts are skipped and the walk stops
 * at the first completed request of @ce, so the result is the last
 * incomplete request of @ce seen before that point.
 *
 * Returns that request, or NULL if none was found.
 *
 * NOTE(review): no reference is taken on the returned request and the lock
 * is dropped before returning - confirm callers guarantee its lifetime.
 */
struct i915_request *intel_context_find_active_request(struct intel_context *ce)
{
	struct intel_context *parent = intel_context_to_parent(ce);
	struct i915_request *rq, *active = NULL;
	unsigned long flags;

	GEM_BUG_ON(!intel_engine_uses_guc(ce->engine));

	/*
	 * We search the parent list to find an active request on the submitted
	 * context. The parent list contains the requests for all the contexts
	 * in the relationship so we have to do a compare of each request's
	 * context.
	 */
	spin_lock_irqsave(&parent->guc_state.lock, flags);
	list_for_each_entry_reverse(rq, &parent->guc_state.requests,
				    sched.link) {
		if (rq->context != ce)
			continue;
		if (i915_request_completed(rq))
			break;

		active = rq;
	}
	spin_unlock_irqrestore(&parent->guc_state.lock, flags);

	return active;
}

/*
 * Link @child to @parent as part of a parallel (parent/child) relationship:
 * bump the parent's child count, append the child to the parent's
 * child_list and record the parent in the child.
 *
 * Neither context may be pinned, @parent must be on a GuC engine and must
 * not itself be a child, and @child must not already be a child or a parent
 * (all enforced with GEM_BUG_ON).
 *
 * NOTE(review): the pre-increment child count is stored in
 * parent->parallel.child_index, not in the child - confirm this is the
 * intended field.
 */
void intel_context_bind_parent_child(struct intel_context *parent,
				     struct intel_context *child)
{
	/*
	 * Callers responsibility to validate that this function is used
	 * correctly but we use GEM_BUG_ON here to ensure that they do.
	 */
	GEM_BUG_ON(!intel_engine_uses_guc(parent->engine));
	GEM_BUG_ON(intel_context_is_pinned(parent));
	GEM_BUG_ON(intel_context_is_child(parent));
	GEM_BUG_ON(intel_context_is_pinned(child));
	GEM_BUG_ON(intel_context_is_child(child));
	GEM_BUG_ON(intel_context_is_parent(child));

	parent->parallel.child_index = parent->parallel.number_children++;
	list_add_tail(&child->parallel.child_link,
		      &parent->parallel.child_list);
	child->parallel.parent = parent;
}

/* Selftests are built into this translation unit when enabled */
#if IS_ENABLED(CONFIG_DRM_I915_SELFTEST)
#include "selftest_context.c"
#endif