1 /* 2 * Copyright 2017 Advanced Micro Devices, Inc. 3 * 4 * Permission is hereby granted, free of charge, to any person obtaining a 5 * copy of this software and associated documentation files (the "Software"), 6 * to deal in the Software without restriction, including without limitation 7 * the rights to use, copy, modify, merge, publish, distribute, sublicense, 8 * and/or sell copies of the Software, and to permit persons to whom the 9 * Software is furnished to do so, subject to the following conditions: 10 * 11 * The above copyright notice and this permission notice shall be included in 12 * all copies or substantial portions of the Software. 13 * 14 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 15 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 16 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL 17 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR 18 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, 19 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR 20 * OTHER DEALINGS IN THE SOFTWARE. 21 * 22 */ 23 24 #if !defined(_AMDGPU_TRACE_H) || defined(TRACE_HEADER_MULTI_READ) 25 #define _AMDGPU_TRACE_H_ 26 27 #include <linux/stringify.h> 28 #include <linux/types.h> 29 #include <linux/tracepoint.h> 30 31 #undef TRACE_SYSTEM 32 #define TRACE_SYSTEM amdgpu 33 #define TRACE_INCLUDE_FILE amdgpu_trace 34 35 #define AMDGPU_JOB_GET_TIMELINE_NAME(job) \ 36 job->base.s_fence->finished.ops->get_timeline_name(&job->base.s_fence->finished) 37 38 TRACE_EVENT(amdgpu_mm_rreg, 39 TP_PROTO(unsigned did, uint32_t reg, uint32_t value), 40 TP_ARGS(did, reg, value), 41 TP_STRUCT__entry( 42 __field(unsigned, did) 43 __field(uint32_t, reg) 44 __field(uint32_t, value) 45 ), 46 TP_fast_assign( 47 __entry->did = did; 48 __entry->reg = reg; 49 __entry->value = value; 50 ), 51 TP_printk("0x%04lx, 0x%08lx, 0x%08lx", 52 (unsigned long)__entry->did, 53 (unsigned long)__entry->reg, 54 (unsigned long)__entry->value) 55 ); 56 57 TRACE_EVENT(amdgpu_mm_wreg, 58 TP_PROTO(unsigned did, uint32_t reg, uint32_t value), 59 TP_ARGS(did, reg, value), 60 TP_STRUCT__entry( 61 __field(unsigned, did) 62 __field(uint32_t, reg) 63 __field(uint32_t, value) 64 ), 65 TP_fast_assign( 66 __entry->did = did; 67 __entry->reg = reg; 68 __entry->value = value; 69 ), 70 TP_printk("0x%04lx, 0x%08lx, 0x%08lx", 71 (unsigned long)__entry->did, 72 (unsigned long)__entry->reg, 73 (unsigned long)__entry->value) 74 ); 75 76 TRACE_EVENT(amdgpu_iv, 77 TP_PROTO(unsigned ih, struct amdgpu_iv_entry *iv), 78 TP_ARGS(ih, iv), 79 TP_STRUCT__entry( 80 __field(unsigned, ih) 81 __field(unsigned, client_id) 82 __field(unsigned, src_id) 83 __field(unsigned, ring_id) 84 __field(unsigned, vmid) 85 __field(unsigned, vmid_src) 86 __field(uint64_t, timestamp) 87 __field(unsigned, timestamp_src) 88 __field(unsigned, pasid) 89 __array(unsigned, src_data, 4) 90 ), 91 TP_fast_assign( 92 __entry->ih = ih; 93 __entry->client_id = iv->client_id; 94 __entry->src_id = iv->src_id; 95 __entry->ring_id = iv->ring_id; 96 __entry->vmid = iv->vmid; 97 __entry->vmid_src = iv->vmid_src; 98 __entry->timestamp = iv->timestamp; 99 __entry->timestamp_src = iv->timestamp_src; 100 __entry->pasid = iv->pasid; 101 __entry->src_data[0] = iv->src_data[0]; 102 __entry->src_data[1] = iv->src_data[1]; 103 __entry->src_data[2] = iv->src_data[2]; 104 __entry->src_data[3] = iv->src_data[3]; 105 ), 106 TP_printk("ih:%u client_id:%u src_id:%u ring:%u vmid:%u " 107 "timestamp: %llu pasid:%u src_data: %08x %08x %08x %08x", 108 __entry->ih, __entry->client_id, __entry->src_id, 109 __entry->ring_id, __entry->vmid, 110 __entry->timestamp, __entry->pasid, 111 __entry->src_data[0], __entry->src_data[1], 112 __entry->src_data[2], __entry->src_data[3]) 113 ); 114 115 116 TRACE_EVENT(amdgpu_bo_create, 117 TP_PROTO(struct amdgpu_bo *bo), 118 TP_ARGS(bo), 119 TP_STRUCT__entry( 120 __field(struct amdgpu_bo *, bo) 121 __field(u32, pages) 122 __field(u32, type) 123 __field(u32, prefer) 124 __field(u32, allow) 125 __field(u32, visible) 126 ), 127 128 TP_fast_assign( 129 __entry->bo = bo; 130 __entry->pages = bo->tbo.num_pages; 131 __entry->type = bo->tbo.mem.mem_type; 132 __entry->prefer = bo->preferred_domains; 133 __entry->allow = bo->allowed_domains; 134 __entry->visible = bo->flags; 135 ), 136 137 TP_printk("bo=%p, pages=%u, type=%d, preferred=%d, allowed=%d, visible=%d", 138 __entry->bo, __entry->pages, __entry->type, 139 __entry->prefer, __entry->allow, __entry->visible) 140 ); 141 142 TRACE_EVENT(amdgpu_cs, 143 TP_PROTO(struct amdgpu_cs_parser *p, int i), 144 TP_ARGS(p, i), 145 TP_STRUCT__entry( 146 __field(struct amdgpu_bo_list *, bo_list) 147 __field(u32, ring) 148 __field(u32, dw) 149 __field(u32, fences) 150 ), 151 152 TP_fast_assign( 153 __entry->bo_list = p->bo_list; 154 __entry->ring = to_amdgpu_ring(p->entity->rq->sched)->idx; 155 __entry->dw = p->job->ibs[i].length_dw; 156 __entry->fences = amdgpu_fence_count_emitted( 157 to_amdgpu_ring(p->entity->rq->sched)); 158 ), 159 TP_printk("bo_list=%p, ring=%u, dw=%u, fences=%u", 160 __entry->bo_list, __entry->ring, __entry->dw, 161 __entry->fences) 162 ); 163 164 TRACE_EVENT(amdgpu_cs_ioctl, 165 TP_PROTO(struct amdgpu_job *job), 166 TP_ARGS(job), 167 TP_STRUCT__entry( 168 __field(uint64_t, sched_job_id) 169 __string(timeline, AMDGPU_JOB_GET_TIMELINE_NAME(job)) 170 __field(unsigned int, context) 171 __field(unsigned int, seqno) 172 __field(struct dma_fence *, fence) 173 __string(ring, to_amdgpu_ring(job->base.sched)->name) 174 __field(u32, num_ibs) 175 ), 176 177 TP_fast_assign( 178 __entry->sched_job_id = job->base.id; 179 __assign_str(timeline, AMDGPU_JOB_GET_TIMELINE_NAME(job)) 180 __entry->context = job->base.s_fence->finished.context; 181 __entry->seqno = job->base.s_fence->finished.seqno; 182 __assign_str(ring, to_amdgpu_ring(job->base.sched)->name) 183 __entry->num_ibs = job->num_ibs; 184 ), 185 TP_printk("sched_job=%llu, timeline=%s, context=%u, seqno=%u, ring_name=%s, num_ibs=%u", 186 __entry->sched_job_id, __get_str(timeline), __entry->context, 187 __entry->seqno, __get_str(ring), __entry->num_ibs) 188 ); 189 190 TRACE_EVENT(amdgpu_sched_run_job, 191 TP_PROTO(struct amdgpu_job *job), 192 TP_ARGS(job), 193 TP_STRUCT__entry( 194 __field(uint64_t, sched_job_id) 195 __string(timeline, AMDGPU_JOB_GET_TIMELINE_NAME(job)) 196 __field(unsigned int, context) 197 __field(unsigned int, seqno) 198 __string(ring, to_amdgpu_ring(job->base.sched)->name) 199 __field(u32, num_ibs) 200 ), 201 202 TP_fast_assign( 203 __entry->sched_job_id = job->base.id; 204 __assign_str(timeline, AMDGPU_JOB_GET_TIMELINE_NAME(job)) 205 __entry->context = job->base.s_fence->finished.context; 206 __entry->seqno = job->base.s_fence->finished.seqno; 207 __assign_str(ring, to_amdgpu_ring(job->base.sched)->name) 208 __entry->num_ibs = job->num_ibs; 209 ), 210 TP_printk("sched_job=%llu, timeline=%s, context=%u, seqno=%u, ring_name=%s, num_ibs=%u", 211 __entry->sched_job_id, __get_str(timeline), __entry->context, 212 __entry->seqno, __get_str(ring), __entry->num_ibs) 213 ); 214 215 216 TRACE_EVENT(amdgpu_vm_grab_id, 217 TP_PROTO(struct amdgpu_vm *vm, struct amdgpu_ring *ring, 218 struct amdgpu_job *job), 219 TP_ARGS(vm, ring, job), 220 TP_STRUCT__entry( 221 __field(u32, pasid) 222 __string(ring, ring->name) 223 __field(u32, ring) 224 __field(u32, vmid) 225 __field(u32, vm_hub) 226 __field(u64, pd_addr) 227 __field(u32, needs_flush) 228 ), 229 230 TP_fast_assign( 231 __entry->pasid = vm->pasid; 232 __assign_str(ring, ring->name) 233 __entry->vmid = job->vmid; 234 __entry->vm_hub = ring->funcs->vmhub, 235 __entry->pd_addr = job->vm_pd_addr; 236 __entry->needs_flush = job->vm_needs_flush; 237 ), 238 TP_printk("pasid=%d, ring=%s, id=%u, hub=%u, pd_addr=%010Lx needs_flush=%u", 239 __entry->pasid, __get_str(ring), __entry->vmid, 240 __entry->vm_hub, __entry->pd_addr, __entry->needs_flush) 241 ); 242 243 TRACE_EVENT(amdgpu_vm_bo_map, 244 TP_PROTO(struct amdgpu_bo_va *bo_va, 245 struct amdgpu_bo_va_mapping *mapping), 246 TP_ARGS(bo_va, mapping), 247 TP_STRUCT__entry( 248 __field(struct amdgpu_bo *, bo) 249 __field(long, start) 250 __field(long, last) 251 __field(u64, offset) 252 __field(u64, flags) 253 ), 254 255 TP_fast_assign( 256 __entry->bo = bo_va ? bo_va->base.bo : NULL; 257 __entry->start = mapping->start; 258 __entry->last = mapping->last; 259 __entry->offset = mapping->offset; 260 __entry->flags = mapping->flags; 261 ), 262 TP_printk("bo=%p, start=%lx, last=%lx, offset=%010llx, flags=%llx", 263 __entry->bo, __entry->start, __entry->last, 264 __entry->offset, __entry->flags) 265 ); 266 267 TRACE_EVENT(amdgpu_vm_bo_unmap, 268 TP_PROTO(struct amdgpu_bo_va *bo_va, 269 struct amdgpu_bo_va_mapping *mapping), 270 TP_ARGS(bo_va, mapping), 271 TP_STRUCT__entry( 272 __field(struct amdgpu_bo *, bo) 273 __field(long, start) 274 __field(long, last) 275 __field(u64, offset) 276 __field(u64, flags) 277 ), 278 279 TP_fast_assign( 280 __entry->bo = bo_va ? bo_va->base.bo : NULL; 281 __entry->start = mapping->start; 282 __entry->last = mapping->last; 283 __entry->offset = mapping->offset; 284 __entry->flags = mapping->flags; 285 ), 286 TP_printk("bo=%p, start=%lx, last=%lx, offset=%010llx, flags=%llx", 287 __entry->bo, __entry->start, __entry->last, 288 __entry->offset, __entry->flags) 289 ); 290 291 DECLARE_EVENT_CLASS(amdgpu_vm_mapping, 292 TP_PROTO(struct amdgpu_bo_va_mapping *mapping), 293 TP_ARGS(mapping), 294 TP_STRUCT__entry( 295 __field(u64, soffset) 296 __field(u64, eoffset) 297 __field(u64, flags) 298 ), 299 300 TP_fast_assign( 301 __entry->soffset = mapping->start; 302 __entry->eoffset = mapping->last + 1; 303 __entry->flags = mapping->flags; 304 ), 305 TP_printk("soffs=%010llx, eoffs=%010llx, flags=%llx", 306 __entry->soffset, __entry->eoffset, __entry->flags) 307 ); 308 309 DEFINE_EVENT(amdgpu_vm_mapping, amdgpu_vm_bo_update, 310 TP_PROTO(struct amdgpu_bo_va_mapping *mapping), 311 TP_ARGS(mapping) 312 ); 313 314 DEFINE_EVENT(amdgpu_vm_mapping, amdgpu_vm_bo_mapping, 315 TP_PROTO(struct amdgpu_bo_va_mapping *mapping), 316 TP_ARGS(mapping) 317 ); 318 319 DEFINE_EVENT(amdgpu_vm_mapping, amdgpu_vm_bo_cs, 320 TP_PROTO(struct amdgpu_bo_va_mapping *mapping), 321 TP_ARGS(mapping) 322 ); 323 324 TRACE_EVENT(amdgpu_vm_set_ptes, 325 TP_PROTO(uint64_t pe, uint64_t addr, unsigned count, 326 uint32_t incr, uint64_t flags, bool direct), 327 TP_ARGS(pe, addr, count, incr, flags, direct), 328 TP_STRUCT__entry( 329 __field(u64, pe) 330 __field(u64, addr) 331 __field(u32, count) 332 __field(u32, incr) 333 __field(u64, flags) 334 __field(bool, direct) 335 ), 336 337 TP_fast_assign( 338 __entry->pe = pe; 339 __entry->addr = addr; 340 __entry->count = count; 341 __entry->incr = incr; 342 __entry->flags = flags; 343 __entry->direct = direct; 344 ), 345 TP_printk("pe=%010Lx, addr=%010Lx, incr=%u, flags=%llx, count=%u, " 346 "direct=%d", __entry->pe, __entry->addr, __entry->incr, 347 __entry->flags, __entry->count, __entry->direct) 348 ); 349 350 TRACE_EVENT(amdgpu_vm_copy_ptes, 351 TP_PROTO(uint64_t pe, uint64_t src, unsigned count, bool direct), 352 TP_ARGS(pe, src, count, direct), 353 TP_STRUCT__entry( 354 __field(u64, pe) 355 __field(u64, src) 356 __field(u32, count) 357 __field(bool, direct) 358 ), 359 360 TP_fast_assign( 361 __entry->pe = pe; 362 __entry->src = src; 363 __entry->count = count; 364 __entry->direct = direct; 365 ), 366 TP_printk("pe=%010Lx, src=%010Lx, count=%u, direct=%d", 367 __entry->pe, __entry->src, __entry->count, 368 __entry->direct) 369 ); 370 371 TRACE_EVENT(amdgpu_vm_flush, 372 TP_PROTO(struct amdgpu_ring *ring, unsigned vmid, 373 uint64_t pd_addr), 374 TP_ARGS(ring, vmid, pd_addr), 375 TP_STRUCT__entry( 376 __string(ring, ring->name) 377 __field(u32, vmid) 378 __field(u32, vm_hub) 379 __field(u64, pd_addr) 380 ), 381 382 TP_fast_assign( 383 __assign_str(ring, ring->name) 384 __entry->vmid = vmid; 385 __entry->vm_hub = ring->funcs->vmhub; 386 __entry->pd_addr = pd_addr; 387 ), 388 TP_printk("ring=%s, id=%u, hub=%u, pd_addr=%010Lx", 389 __get_str(ring), __entry->vmid, 390 __entry->vm_hub,__entry->pd_addr) 391 ); 392 393 DECLARE_EVENT_CLASS(amdgpu_pasid, 394 TP_PROTO(unsigned pasid), 395 TP_ARGS(pasid), 396 TP_STRUCT__entry( 397 __field(unsigned, pasid) 398 ), 399 TP_fast_assign( 400 __entry->pasid = pasid; 401 ), 402 TP_printk("pasid=%u", __entry->pasid) 403 ); 404 405 DEFINE_EVENT(amdgpu_pasid, amdgpu_pasid_allocated, 406 TP_PROTO(unsigned pasid), 407 TP_ARGS(pasid) 408 ); 409 410 DEFINE_EVENT(amdgpu_pasid, amdgpu_pasid_freed, 411 TP_PROTO(unsigned pasid), 412 TP_ARGS(pasid) 413 ); 414 415 TRACE_EVENT(amdgpu_bo_list_set, 416 TP_PROTO(struct amdgpu_bo_list *list, struct amdgpu_bo *bo), 417 TP_ARGS(list, bo), 418 TP_STRUCT__entry( 419 __field(struct amdgpu_bo_list *, list) 420 __field(struct amdgpu_bo *, bo) 421 __field(u64, bo_size) 422 ), 423 424 TP_fast_assign( 425 __entry->list = list; 426 __entry->bo = bo; 427 __entry->bo_size = amdgpu_bo_size(bo); 428 ), 429 TP_printk("list=%p, bo=%p, bo_size=%Ld", 430 __entry->list, 431 __entry->bo, 432 __entry->bo_size) 433 ); 434 435 TRACE_EVENT(amdgpu_cs_bo_status, 436 TP_PROTO(uint64_t total_bo, uint64_t total_size), 437 TP_ARGS(total_bo, total_size), 438 TP_STRUCT__entry( 439 __field(u64, total_bo) 440 __field(u64, total_size) 441 ), 442 443 TP_fast_assign( 444 __entry->total_bo = total_bo; 445 __entry->total_size = total_size; 446 ), 447 TP_printk("total_bo_size=%Ld, total_bo_count=%Ld", 448 __entry->total_bo, __entry->total_size) 449 ); 450 451 TRACE_EVENT(amdgpu_bo_move, 452 TP_PROTO(struct amdgpu_bo* bo, uint32_t new_placement, uint32_t old_placement), 453 TP_ARGS(bo, new_placement, old_placement), 454 TP_STRUCT__entry( 455 __field(struct amdgpu_bo *, bo) 456 __field(u64, bo_size) 457 __field(u32, new_placement) 458 __field(u32, old_placement) 459 ), 460 461 TP_fast_assign( 462 __entry->bo = bo; 463 __entry->bo_size = amdgpu_bo_size(bo); 464 __entry->new_placement = new_placement; 465 __entry->old_placement = old_placement; 466 ), 467 TP_printk("bo=%p, from=%d, to=%d, size=%Ld", 468 __entry->bo, __entry->old_placement, 469 __entry->new_placement, __entry->bo_size) 470 ); 471 472 TRACE_EVENT(amdgpu_ib_pipe_sync, 473 TP_PROTO(struct amdgpu_job *sched_job, struct dma_fence *fence), 474 TP_ARGS(sched_job, fence), 475 TP_STRUCT__entry( 476 __string(ring, sched_job->base.sched->name) 477 __field(uint64_t, id) 478 __field(struct dma_fence *, fence) 479 __field(uint64_t, ctx) 480 __field(unsigned, seqno) 481 ), 482 483 TP_fast_assign( 484 __assign_str(ring, sched_job->base.sched->name) 485 __entry->id = sched_job->base.id; 486 __entry->fence = fence; 487 __entry->ctx = fence->context; 488 __entry->seqno = fence->seqno; 489 ), 490 TP_printk("job ring=%s, id=%llu, need pipe sync to fence=%p, context=%llu, seq=%u", 491 __get_str(ring), __entry->id, 492 __entry->fence, __entry->ctx, 493 __entry->seqno) 494 ); 495 496 #undef AMDGPU_JOB_GET_TIMELINE_NAME 497 #endif 498 499 /* This part must be outside protection */ 500 #undef TRACE_INCLUDE_PATH 501 #define TRACE_INCLUDE_PATH ../../drivers/gpu/drm/amd/amdgpu 502 #include <trace/define_trace.h> 503