1 /* 2 * Copyright 2008 Advanced Micro Devices, Inc. 3 * Copyright 2008 Red Hat Inc. 4 * Copyright 2009 Jerome Glisse. 5 * 6 * Permission is hereby granted, free of charge, to any person obtaining a 7 * copy of this software and associated documentation files (the "Software"), 8 * to deal in the Software without restriction, including without limitation 9 * the rights to use, copy, modify, merge, publish, distribute, sublicense, 10 * and/or sell copies of the Software, and to permit persons to whom the 11 * Software is furnished to do so, subject to the following conditions: 12 * 13 * The above copyright notice and this permission notice shall be included in 14 * all copies or substantial portions of the Software. 15 * 16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL 19 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR 20 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, 21 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR 22 * OTHER DEALINGS IN THE SOFTWARE. 23 * 24 */ 25 26 #include <linux/kthread.h> 27 #include <linux/pci.h> 28 #include <linux/uaccess.h> 29 #include <linux/pm_runtime.h> 30 31 #include "amdgpu.h" 32 #include "amdgpu_pm.h" 33 #include "amdgpu_dm_debugfs.h" 34 #include "amdgpu_ras.h" 35 #include "amdgpu_rap.h" 36 #include "amdgpu_securedisplay.h" 37 #include "amdgpu_fw_attestation.h" 38 #include "amdgpu_umr.h" 39 40 #include "amdgpu_reset.h" 41 #include "amdgpu_psp_ta.h" 42 43 #if defined(CONFIG_DEBUG_FS) 44 45 /** 46 * amdgpu_debugfs_process_reg_op - Handle MMIO register reads/writes 47 * 48 * @read: True if reading 49 * @f: open file handle 50 * @buf: User buffer to write/read to 51 * @size: Number of bytes to write/read 52 * @pos: Offset to seek to 53 * 54 * This debugfs entry has special meaning on the offset being sought. 55 * Various bits have different meanings: 56 * 57 * Bit 62: Indicates a GRBM bank switch is needed 58 * Bit 61: Indicates a SRBM bank switch is needed (implies bit 62 is 59 * zero) 60 * Bits 24..33: The SE or ME selector if needed 61 * Bits 34..43: The SH (or SA) or PIPE selector if needed 62 * Bits 44..53: The INSTANCE (or CU/WGP) or QUEUE selector if needed 63 * 64 * Bit 23: Indicates that the PM power gating lock should be held 65 * This is necessary to read registers that might be 66 * unreliable during a power gating transistion. 67 * 68 * The lower bits are the BYTE offset of the register to read. This 69 * allows reading multiple registers in a single call and having 70 * the returned size reflect that. 71 */ 72 static int amdgpu_debugfs_process_reg_op(bool read, struct file *f, 73 char __user *buf, size_t size, loff_t *pos) 74 { 75 struct amdgpu_device *adev = file_inode(f)->i_private; 76 ssize_t result = 0; 77 int r; 78 bool pm_pg_lock, use_bank, use_ring; 79 unsigned instance_bank, sh_bank, se_bank, me, pipe, queue, vmid; 80 81 pm_pg_lock = use_bank = use_ring = false; 82 instance_bank = sh_bank = se_bank = me = pipe = queue = vmid = 0; 83 84 if (size & 0x3 || *pos & 0x3 || 85 ((*pos & (1ULL << 62)) && (*pos & (1ULL << 61)))) 86 return -EINVAL; 87 88 /* are we reading registers for which a PG lock is necessary? */ 89 pm_pg_lock = (*pos >> 23) & 1; 90 91 if (*pos & (1ULL << 62)) { 92 se_bank = (*pos & GENMASK_ULL(33, 24)) >> 24; 93 sh_bank = (*pos & GENMASK_ULL(43, 34)) >> 34; 94 instance_bank = (*pos & GENMASK_ULL(53, 44)) >> 44; 95 96 if (se_bank == 0x3FF) 97 se_bank = 0xFFFFFFFF; 98 if (sh_bank == 0x3FF) 99 sh_bank = 0xFFFFFFFF; 100 if (instance_bank == 0x3FF) 101 instance_bank = 0xFFFFFFFF; 102 use_bank = true; 103 } else if (*pos & (1ULL << 61)) { 104 105 me = (*pos & GENMASK_ULL(33, 24)) >> 24; 106 pipe = (*pos & GENMASK_ULL(43, 34)) >> 34; 107 queue = (*pos & GENMASK_ULL(53, 44)) >> 44; 108 vmid = (*pos & GENMASK_ULL(58, 54)) >> 54; 109 110 use_ring = true; 111 } else { 112 use_bank = use_ring = false; 113 } 114 115 *pos &= (1UL << 22) - 1; 116 117 r = pm_runtime_get_sync(adev_to_drm(adev)->dev); 118 if (r < 0) { 119 pm_runtime_put_autosuspend(adev_to_drm(adev)->dev); 120 return r; 121 } 122 123 r = amdgpu_virt_enable_access_debugfs(adev); 124 if (r < 0) { 125 pm_runtime_put_autosuspend(adev_to_drm(adev)->dev); 126 return r; 127 } 128 129 if (use_bank) { 130 if ((sh_bank != 0xFFFFFFFF && sh_bank >= adev->gfx.config.max_sh_per_se) || 131 (se_bank != 0xFFFFFFFF && se_bank >= adev->gfx.config.max_shader_engines)) { 132 pm_runtime_mark_last_busy(adev_to_drm(adev)->dev); 133 pm_runtime_put_autosuspend(adev_to_drm(adev)->dev); 134 amdgpu_virt_disable_access_debugfs(adev); 135 return -EINVAL; 136 } 137 mutex_lock(&adev->grbm_idx_mutex); 138 amdgpu_gfx_select_se_sh(adev, se_bank, 139 sh_bank, instance_bank); 140 } else if (use_ring) { 141 mutex_lock(&adev->srbm_mutex); 142 amdgpu_gfx_select_me_pipe_q(adev, me, pipe, queue, vmid); 143 } 144 145 if (pm_pg_lock) 146 mutex_lock(&adev->pm.mutex); 147 148 while (size) { 149 uint32_t value; 150 151 if (read) { 152 value = RREG32(*pos >> 2); 153 r = put_user(value, (uint32_t *)buf); 154 } else { 155 r = get_user(value, (uint32_t *)buf); 156 if (!r) 157 amdgpu_mm_wreg_mmio_rlc(adev, *pos >> 2, value); 158 } 159 if (r) { 160 result = r; 161 goto end; 162 } 163 164 result += 4; 165 buf += 4; 166 *pos += 4; 167 size -= 4; 168 } 169 170 end: 171 if (use_bank) { 172 amdgpu_gfx_select_se_sh(adev, 0xffffffff, 0xffffffff, 0xffffffff); 173 mutex_unlock(&adev->grbm_idx_mutex); 174 } else if (use_ring) { 175 amdgpu_gfx_select_me_pipe_q(adev, 0, 0, 0, 0); 176 mutex_unlock(&adev->srbm_mutex); 177 } 178 179 if (pm_pg_lock) 180 mutex_unlock(&adev->pm.mutex); 181 182 pm_runtime_mark_last_busy(adev_to_drm(adev)->dev); 183 pm_runtime_put_autosuspend(adev_to_drm(adev)->dev); 184 185 amdgpu_virt_disable_access_debugfs(adev); 186 return result; 187 } 188 189 /* 190 * amdgpu_debugfs_regs_read - Callback for reading MMIO registers 191 */ 192 static ssize_t amdgpu_debugfs_regs_read(struct file *f, char __user *buf, 193 size_t size, loff_t *pos) 194 { 195 return amdgpu_debugfs_process_reg_op(true, f, buf, size, pos); 196 } 197 198 /* 199 * amdgpu_debugfs_regs_write - Callback for writing MMIO registers 200 */ 201 static ssize_t amdgpu_debugfs_regs_write(struct file *f, const char __user *buf, 202 size_t size, loff_t *pos) 203 { 204 return amdgpu_debugfs_process_reg_op(false, f, (char __user *)buf, size, pos); 205 } 206 207 static int amdgpu_debugfs_regs2_open(struct inode *inode, struct file *file) 208 { 209 struct amdgpu_debugfs_regs2_data *rd; 210 211 rd = kzalloc(sizeof *rd, GFP_KERNEL); 212 if (!rd) 213 return -ENOMEM; 214 rd->adev = file_inode(file)->i_private; 215 file->private_data = rd; 216 mutex_init(&rd->lock); 217 218 return 0; 219 } 220 221 static int amdgpu_debugfs_regs2_release(struct inode *inode, struct file *file) 222 { 223 struct amdgpu_debugfs_regs2_data *rd = file->private_data; 224 mutex_destroy(&rd->lock); 225 kfree(file->private_data); 226 return 0; 227 } 228 229 static ssize_t amdgpu_debugfs_regs2_op(struct file *f, char __user *buf, u32 offset, size_t size, int write_en) 230 { 231 struct amdgpu_debugfs_regs2_data *rd = f->private_data; 232 struct amdgpu_device *adev = rd->adev; 233 ssize_t result = 0; 234 int r; 235 uint32_t value; 236 237 if (size & 0x3 || offset & 0x3) 238 return -EINVAL; 239 240 r = pm_runtime_get_sync(adev_to_drm(adev)->dev); 241 if (r < 0) { 242 pm_runtime_put_autosuspend(adev_to_drm(adev)->dev); 243 return r; 244 } 245 246 r = amdgpu_virt_enable_access_debugfs(adev); 247 if (r < 0) { 248 pm_runtime_put_autosuspend(adev_to_drm(adev)->dev); 249 return r; 250 } 251 252 mutex_lock(&rd->lock); 253 254 if (rd->id.use_grbm) { 255 if ((rd->id.grbm.sh != 0xFFFFFFFF && rd->id.grbm.sh >= adev->gfx.config.max_sh_per_se) || 256 (rd->id.grbm.se != 0xFFFFFFFF && rd->id.grbm.se >= adev->gfx.config.max_shader_engines)) { 257 pm_runtime_mark_last_busy(adev_to_drm(adev)->dev); 258 pm_runtime_put_autosuspend(adev_to_drm(adev)->dev); 259 amdgpu_virt_disable_access_debugfs(adev); 260 mutex_unlock(&rd->lock); 261 return -EINVAL; 262 } 263 mutex_lock(&adev->grbm_idx_mutex); 264 amdgpu_gfx_select_se_sh(adev, rd->id.grbm.se, 265 rd->id.grbm.sh, 266 rd->id.grbm.instance); 267 } 268 269 if (rd->id.use_srbm) { 270 mutex_lock(&adev->srbm_mutex); 271 amdgpu_gfx_select_me_pipe_q(adev, rd->id.srbm.me, rd->id.srbm.pipe, 272 rd->id.srbm.queue, rd->id.srbm.vmid); 273 } 274 275 if (rd->id.pg_lock) 276 mutex_lock(&adev->pm.mutex); 277 278 while (size) { 279 if (!write_en) { 280 value = RREG32(offset >> 2); 281 r = put_user(value, (uint32_t *)buf); 282 } else { 283 r = get_user(value, (uint32_t *)buf); 284 if (!r) 285 amdgpu_mm_wreg_mmio_rlc(adev, offset >> 2, value); 286 } 287 if (r) { 288 result = r; 289 goto end; 290 } 291 offset += 4; 292 size -= 4; 293 result += 4; 294 buf += 4; 295 } 296 end: 297 if (rd->id.use_grbm) { 298 amdgpu_gfx_select_se_sh(adev, 0xffffffff, 0xffffffff, 0xffffffff); 299 mutex_unlock(&adev->grbm_idx_mutex); 300 } 301 302 if (rd->id.use_srbm) { 303 amdgpu_gfx_select_me_pipe_q(adev, 0, 0, 0, 0); 304 mutex_unlock(&adev->srbm_mutex); 305 } 306 307 if (rd->id.pg_lock) 308 mutex_unlock(&adev->pm.mutex); 309 310 mutex_unlock(&rd->lock); 311 312 pm_runtime_mark_last_busy(adev_to_drm(adev)->dev); 313 pm_runtime_put_autosuspend(adev_to_drm(adev)->dev); 314 315 amdgpu_virt_disable_access_debugfs(adev); 316 return result; 317 } 318 319 static long amdgpu_debugfs_regs2_ioctl(struct file *f, unsigned int cmd, unsigned long data) 320 { 321 struct amdgpu_debugfs_regs2_data *rd = f->private_data; 322 int r; 323 324 switch (cmd) { 325 case AMDGPU_DEBUGFS_REGS2_IOC_SET_STATE: 326 mutex_lock(&rd->lock); 327 r = copy_from_user(&rd->id, (struct amdgpu_debugfs_regs2_iocdata *)data, sizeof rd->id); 328 mutex_unlock(&rd->lock); 329 return r ? -EINVAL : 0; 330 default: 331 return -EINVAL; 332 } 333 return 0; 334 } 335 336 static ssize_t amdgpu_debugfs_regs2_read(struct file *f, char __user *buf, size_t size, loff_t *pos) 337 { 338 return amdgpu_debugfs_regs2_op(f, buf, *pos, size, 0); 339 } 340 341 static ssize_t amdgpu_debugfs_regs2_write(struct file *f, const char __user *buf, size_t size, loff_t *pos) 342 { 343 return amdgpu_debugfs_regs2_op(f, (char __user *)buf, *pos, size, 1); 344 } 345 346 347 /** 348 * amdgpu_debugfs_regs_pcie_read - Read from a PCIE register 349 * 350 * @f: open file handle 351 * @buf: User buffer to store read data in 352 * @size: Number of bytes to read 353 * @pos: Offset to seek to 354 * 355 * The lower bits are the BYTE offset of the register to read. This 356 * allows reading multiple registers in a single call and having 357 * the returned size reflect that. 358 */ 359 static ssize_t amdgpu_debugfs_regs_pcie_read(struct file *f, char __user *buf, 360 size_t size, loff_t *pos) 361 { 362 struct amdgpu_device *adev = file_inode(f)->i_private; 363 ssize_t result = 0; 364 int r; 365 366 if (size & 0x3 || *pos & 0x3) 367 return -EINVAL; 368 369 r = pm_runtime_get_sync(adev_to_drm(adev)->dev); 370 if (r < 0) { 371 pm_runtime_put_autosuspend(adev_to_drm(adev)->dev); 372 return r; 373 } 374 375 r = amdgpu_virt_enable_access_debugfs(adev); 376 if (r < 0) { 377 pm_runtime_put_autosuspend(adev_to_drm(adev)->dev); 378 return r; 379 } 380 381 while (size) { 382 uint32_t value; 383 384 value = RREG32_PCIE(*pos); 385 r = put_user(value, (uint32_t *)buf); 386 if (r) 387 goto out; 388 389 result += 4; 390 buf += 4; 391 *pos += 4; 392 size -= 4; 393 } 394 395 r = result; 396 out: 397 pm_runtime_mark_last_busy(adev_to_drm(adev)->dev); 398 pm_runtime_put_autosuspend(adev_to_drm(adev)->dev); 399 amdgpu_virt_disable_access_debugfs(adev); 400 return r; 401 } 402 403 /** 404 * amdgpu_debugfs_regs_pcie_write - Write to a PCIE register 405 * 406 * @f: open file handle 407 * @buf: User buffer to write data from 408 * @size: Number of bytes to write 409 * @pos: Offset to seek to 410 * 411 * The lower bits are the BYTE offset of the register to write. This 412 * allows writing multiple registers in a single call and having 413 * the returned size reflect that. 414 */ 415 static ssize_t amdgpu_debugfs_regs_pcie_write(struct file *f, const char __user *buf, 416 size_t size, loff_t *pos) 417 { 418 struct amdgpu_device *adev = file_inode(f)->i_private; 419 ssize_t result = 0; 420 int r; 421 422 if (size & 0x3 || *pos & 0x3) 423 return -EINVAL; 424 425 r = pm_runtime_get_sync(adev_to_drm(adev)->dev); 426 if (r < 0) { 427 pm_runtime_put_autosuspend(adev_to_drm(adev)->dev); 428 return r; 429 } 430 431 r = amdgpu_virt_enable_access_debugfs(adev); 432 if (r < 0) { 433 pm_runtime_put_autosuspend(adev_to_drm(adev)->dev); 434 return r; 435 } 436 437 while (size) { 438 uint32_t value; 439 440 r = get_user(value, (uint32_t *)buf); 441 if (r) 442 goto out; 443 444 WREG32_PCIE(*pos, value); 445 446 result += 4; 447 buf += 4; 448 *pos += 4; 449 size -= 4; 450 } 451 452 r = result; 453 out: 454 pm_runtime_mark_last_busy(adev_to_drm(adev)->dev); 455 pm_runtime_put_autosuspend(adev_to_drm(adev)->dev); 456 amdgpu_virt_disable_access_debugfs(adev); 457 return r; 458 } 459 460 /** 461 * amdgpu_debugfs_regs_didt_read - Read from a DIDT register 462 * 463 * @f: open file handle 464 * @buf: User buffer to store read data in 465 * @size: Number of bytes to read 466 * @pos: Offset to seek to 467 * 468 * The lower bits are the BYTE offset of the register to read. This 469 * allows reading multiple registers in a single call and having 470 * the returned size reflect that. 471 */ 472 static ssize_t amdgpu_debugfs_regs_didt_read(struct file *f, char __user *buf, 473 size_t size, loff_t *pos) 474 { 475 struct amdgpu_device *adev = file_inode(f)->i_private; 476 ssize_t result = 0; 477 int r; 478 479 if (size & 0x3 || *pos & 0x3) 480 return -EINVAL; 481 482 r = pm_runtime_get_sync(adev_to_drm(adev)->dev); 483 if (r < 0) { 484 pm_runtime_put_autosuspend(adev_to_drm(adev)->dev); 485 return r; 486 } 487 488 r = amdgpu_virt_enable_access_debugfs(adev); 489 if (r < 0) { 490 pm_runtime_put_autosuspend(adev_to_drm(adev)->dev); 491 return r; 492 } 493 494 while (size) { 495 uint32_t value; 496 497 value = RREG32_DIDT(*pos >> 2); 498 r = put_user(value, (uint32_t *)buf); 499 if (r) 500 goto out; 501 502 result += 4; 503 buf += 4; 504 *pos += 4; 505 size -= 4; 506 } 507 508 r = result; 509 out: 510 pm_runtime_mark_last_busy(adev_to_drm(adev)->dev); 511 pm_runtime_put_autosuspend(adev_to_drm(adev)->dev); 512 amdgpu_virt_disable_access_debugfs(adev); 513 return r; 514 } 515 516 /** 517 * amdgpu_debugfs_regs_didt_write - Write to a DIDT register 518 * 519 * @f: open file handle 520 * @buf: User buffer to write data from 521 * @size: Number of bytes to write 522 * @pos: Offset to seek to 523 * 524 * The lower bits are the BYTE offset of the register to write. This 525 * allows writing multiple registers in a single call and having 526 * the returned size reflect that. 527 */ 528 static ssize_t amdgpu_debugfs_regs_didt_write(struct file *f, const char __user *buf, 529 size_t size, loff_t *pos) 530 { 531 struct amdgpu_device *adev = file_inode(f)->i_private; 532 ssize_t result = 0; 533 int r; 534 535 if (size & 0x3 || *pos & 0x3) 536 return -EINVAL; 537 538 r = pm_runtime_get_sync(adev_to_drm(adev)->dev); 539 if (r < 0) { 540 pm_runtime_put_autosuspend(adev_to_drm(adev)->dev); 541 return r; 542 } 543 544 r = amdgpu_virt_enable_access_debugfs(adev); 545 if (r < 0) { 546 pm_runtime_put_autosuspend(adev_to_drm(adev)->dev); 547 return r; 548 } 549 550 while (size) { 551 uint32_t value; 552 553 r = get_user(value, (uint32_t *)buf); 554 if (r) 555 goto out; 556 557 WREG32_DIDT(*pos >> 2, value); 558 559 result += 4; 560 buf += 4; 561 *pos += 4; 562 size -= 4; 563 } 564 565 r = result; 566 out: 567 pm_runtime_mark_last_busy(adev_to_drm(adev)->dev); 568 pm_runtime_put_autosuspend(adev_to_drm(adev)->dev); 569 amdgpu_virt_disable_access_debugfs(adev); 570 return r; 571 } 572 573 /** 574 * amdgpu_debugfs_regs_smc_read - Read from a SMC register 575 * 576 * @f: open file handle 577 * @buf: User buffer to store read data in 578 * @size: Number of bytes to read 579 * @pos: Offset to seek to 580 * 581 * The lower bits are the BYTE offset of the register to read. This 582 * allows reading multiple registers in a single call and having 583 * the returned size reflect that. 584 */ 585 static ssize_t amdgpu_debugfs_regs_smc_read(struct file *f, char __user *buf, 586 size_t size, loff_t *pos) 587 { 588 struct amdgpu_device *adev = file_inode(f)->i_private; 589 ssize_t result = 0; 590 int r; 591 592 if (size & 0x3 || *pos & 0x3) 593 return -EINVAL; 594 595 r = pm_runtime_get_sync(adev_to_drm(adev)->dev); 596 if (r < 0) { 597 pm_runtime_put_autosuspend(adev_to_drm(adev)->dev); 598 return r; 599 } 600 601 r = amdgpu_virt_enable_access_debugfs(adev); 602 if (r < 0) { 603 pm_runtime_put_autosuspend(adev_to_drm(adev)->dev); 604 return r; 605 } 606 607 while (size) { 608 uint32_t value; 609 610 value = RREG32_SMC(*pos); 611 r = put_user(value, (uint32_t *)buf); 612 if (r) 613 goto out; 614 615 result += 4; 616 buf += 4; 617 *pos += 4; 618 size -= 4; 619 } 620 621 r = result; 622 out: 623 pm_runtime_mark_last_busy(adev_to_drm(adev)->dev); 624 pm_runtime_put_autosuspend(adev_to_drm(adev)->dev); 625 amdgpu_virt_disable_access_debugfs(adev); 626 return r; 627 } 628 629 /** 630 * amdgpu_debugfs_regs_smc_write - Write to a SMC register 631 * 632 * @f: open file handle 633 * @buf: User buffer to write data from 634 * @size: Number of bytes to write 635 * @pos: Offset to seek to 636 * 637 * The lower bits are the BYTE offset of the register to write. This 638 * allows writing multiple registers in a single call and having 639 * the returned size reflect that. 640 */ 641 static ssize_t amdgpu_debugfs_regs_smc_write(struct file *f, const char __user *buf, 642 size_t size, loff_t *pos) 643 { 644 struct amdgpu_device *adev = file_inode(f)->i_private; 645 ssize_t result = 0; 646 int r; 647 648 if (size & 0x3 || *pos & 0x3) 649 return -EINVAL; 650 651 r = pm_runtime_get_sync(adev_to_drm(adev)->dev); 652 if (r < 0) { 653 pm_runtime_put_autosuspend(adev_to_drm(adev)->dev); 654 return r; 655 } 656 657 r = amdgpu_virt_enable_access_debugfs(adev); 658 if (r < 0) { 659 pm_runtime_put_autosuspend(adev_to_drm(adev)->dev); 660 return r; 661 } 662 663 while (size) { 664 uint32_t value; 665 666 r = get_user(value, (uint32_t *)buf); 667 if (r) 668 goto out; 669 670 WREG32_SMC(*pos, value); 671 672 result += 4; 673 buf += 4; 674 *pos += 4; 675 size -= 4; 676 } 677 678 r = result; 679 out: 680 pm_runtime_mark_last_busy(adev_to_drm(adev)->dev); 681 pm_runtime_put_autosuspend(adev_to_drm(adev)->dev); 682 amdgpu_virt_disable_access_debugfs(adev); 683 return r; 684 } 685 686 /** 687 * amdgpu_debugfs_gca_config_read - Read from gfx config data 688 * 689 * @f: open file handle 690 * @buf: User buffer to store read data in 691 * @size: Number of bytes to read 692 * @pos: Offset to seek to 693 * 694 * This file is used to access configuration data in a somewhat 695 * stable fashion. The format is a series of DWORDs with the first 696 * indicating which revision it is. New content is appended to the 697 * end so that older software can still read the data. 698 */ 699 700 static ssize_t amdgpu_debugfs_gca_config_read(struct file *f, char __user *buf, 701 size_t size, loff_t *pos) 702 { 703 struct amdgpu_device *adev = file_inode(f)->i_private; 704 ssize_t result = 0; 705 int r; 706 uint32_t *config, no_regs = 0; 707 708 if (size & 0x3 || *pos & 0x3) 709 return -EINVAL; 710 711 config = kmalloc_array(256, sizeof(*config), GFP_KERNEL); 712 if (!config) 713 return -ENOMEM; 714 715 /* version, increment each time something is added */ 716 config[no_regs++] = 5; 717 config[no_regs++] = adev->gfx.config.max_shader_engines; 718 config[no_regs++] = adev->gfx.config.max_tile_pipes; 719 config[no_regs++] = adev->gfx.config.max_cu_per_sh; 720 config[no_regs++] = adev->gfx.config.max_sh_per_se; 721 config[no_regs++] = adev->gfx.config.max_backends_per_se; 722 config[no_regs++] = adev->gfx.config.max_texture_channel_caches; 723 config[no_regs++] = adev->gfx.config.max_gprs; 724 config[no_regs++] = adev->gfx.config.max_gs_threads; 725 config[no_regs++] = adev->gfx.config.max_hw_contexts; 726 config[no_regs++] = adev->gfx.config.sc_prim_fifo_size_frontend; 727 config[no_regs++] = adev->gfx.config.sc_prim_fifo_size_backend; 728 config[no_regs++] = adev->gfx.config.sc_hiz_tile_fifo_size; 729 config[no_regs++] = adev->gfx.config.sc_earlyz_tile_fifo_size; 730 config[no_regs++] = adev->gfx.config.num_tile_pipes; 731 config[no_regs++] = adev->gfx.config.backend_enable_mask; 732 config[no_regs++] = adev->gfx.config.mem_max_burst_length_bytes; 733 config[no_regs++] = adev->gfx.config.mem_row_size_in_kb; 734 config[no_regs++] = adev->gfx.config.shader_engine_tile_size; 735 config[no_regs++] = adev->gfx.config.num_gpus; 736 config[no_regs++] = adev->gfx.config.multi_gpu_tile_size; 737 config[no_regs++] = adev->gfx.config.mc_arb_ramcfg; 738 config[no_regs++] = adev->gfx.config.gb_addr_config; 739 config[no_regs++] = adev->gfx.config.num_rbs; 740 741 /* rev==1 */ 742 config[no_regs++] = adev->rev_id; 743 config[no_regs++] = lower_32_bits(adev->pg_flags); 744 config[no_regs++] = lower_32_bits(adev->cg_flags); 745 746 /* rev==2 */ 747 config[no_regs++] = adev->family; 748 config[no_regs++] = adev->external_rev_id; 749 750 /* rev==3 */ 751 config[no_regs++] = adev->pdev->device; 752 config[no_regs++] = adev->pdev->revision; 753 config[no_regs++] = adev->pdev->subsystem_device; 754 config[no_regs++] = adev->pdev->subsystem_vendor; 755 756 /* rev==4 APU flag */ 757 config[no_regs++] = adev->flags & AMD_IS_APU ? 1 : 0; 758 759 /* rev==5 PG/CG flag upper 32bit */ 760 config[no_regs++] = upper_32_bits(adev->pg_flags); 761 config[no_regs++] = upper_32_bits(adev->cg_flags); 762 763 while (size && (*pos < no_regs * 4)) { 764 uint32_t value; 765 766 value = config[*pos >> 2]; 767 r = put_user(value, (uint32_t *)buf); 768 if (r) { 769 kfree(config); 770 return r; 771 } 772 773 result += 4; 774 buf += 4; 775 *pos += 4; 776 size -= 4; 777 } 778 779 kfree(config); 780 return result; 781 } 782 783 /** 784 * amdgpu_debugfs_sensor_read - Read from the powerplay sensors 785 * 786 * @f: open file handle 787 * @buf: User buffer to store read data in 788 * @size: Number of bytes to read 789 * @pos: Offset to seek to 790 * 791 * The offset is treated as the BYTE address of one of the sensors 792 * enumerated in amd/include/kgd_pp_interface.h under the 793 * 'amd_pp_sensors' enumeration. For instance to read the UVD VCLK 794 * you would use the offset 3 * 4 = 12. 795 */ 796 static ssize_t amdgpu_debugfs_sensor_read(struct file *f, char __user *buf, 797 size_t size, loff_t *pos) 798 { 799 struct amdgpu_device *adev = file_inode(f)->i_private; 800 int idx, x, outsize, r, valuesize; 801 uint32_t values[16]; 802 803 if (size & 3 || *pos & 0x3) 804 return -EINVAL; 805 806 if (!adev->pm.dpm_enabled) 807 return -EINVAL; 808 809 /* convert offset to sensor number */ 810 idx = *pos >> 2; 811 812 valuesize = sizeof(values); 813 814 r = pm_runtime_get_sync(adev_to_drm(adev)->dev); 815 if (r < 0) { 816 pm_runtime_put_autosuspend(adev_to_drm(adev)->dev); 817 return r; 818 } 819 820 r = amdgpu_virt_enable_access_debugfs(adev); 821 if (r < 0) { 822 pm_runtime_put_autosuspend(adev_to_drm(adev)->dev); 823 return r; 824 } 825 826 r = amdgpu_dpm_read_sensor(adev, idx, &values[0], &valuesize); 827 828 pm_runtime_mark_last_busy(adev_to_drm(adev)->dev); 829 pm_runtime_put_autosuspend(adev_to_drm(adev)->dev); 830 831 if (r) { 832 amdgpu_virt_disable_access_debugfs(adev); 833 return r; 834 } 835 836 if (size > valuesize) { 837 amdgpu_virt_disable_access_debugfs(adev); 838 return -EINVAL; 839 } 840 841 outsize = 0; 842 x = 0; 843 if (!r) { 844 while (size) { 845 r = put_user(values[x++], (int32_t *)buf); 846 buf += 4; 847 size -= 4; 848 outsize += 4; 849 } 850 } 851 852 amdgpu_virt_disable_access_debugfs(adev); 853 return !r ? outsize : r; 854 } 855 856 /** amdgpu_debugfs_wave_read - Read WAVE STATUS data 857 * 858 * @f: open file handle 859 * @buf: User buffer to store read data in 860 * @size: Number of bytes to read 861 * @pos: Offset to seek to 862 * 863 * The offset being sought changes which wave that the status data 864 * will be returned for. The bits are used as follows: 865 * 866 * Bits 0..6: Byte offset into data 867 * Bits 7..14: SE selector 868 * Bits 15..22: SH/SA selector 869 * Bits 23..30: CU/{WGP+SIMD} selector 870 * Bits 31..36: WAVE ID selector 871 * Bits 37..44: SIMD ID selector 872 * 873 * The returned data begins with one DWORD of version information 874 * Followed by WAVE STATUS registers relevant to the GFX IP version 875 * being used. See gfx_v8_0_read_wave_data() for an example output. 876 */ 877 static ssize_t amdgpu_debugfs_wave_read(struct file *f, char __user *buf, 878 size_t size, loff_t *pos) 879 { 880 struct amdgpu_device *adev = f->f_inode->i_private; 881 int r, x; 882 ssize_t result = 0; 883 uint32_t offset, se, sh, cu, wave, simd, data[32]; 884 885 if (size & 3 || *pos & 3) 886 return -EINVAL; 887 888 /* decode offset */ 889 offset = (*pos & GENMASK_ULL(6, 0)); 890 se = (*pos & GENMASK_ULL(14, 7)) >> 7; 891 sh = (*pos & GENMASK_ULL(22, 15)) >> 15; 892 cu = (*pos & GENMASK_ULL(30, 23)) >> 23; 893 wave = (*pos & GENMASK_ULL(36, 31)) >> 31; 894 simd = (*pos & GENMASK_ULL(44, 37)) >> 37; 895 896 r = pm_runtime_get_sync(adev_to_drm(adev)->dev); 897 if (r < 0) { 898 pm_runtime_put_autosuspend(adev_to_drm(adev)->dev); 899 return r; 900 } 901 902 r = amdgpu_virt_enable_access_debugfs(adev); 903 if (r < 0) { 904 pm_runtime_put_autosuspend(adev_to_drm(adev)->dev); 905 return r; 906 } 907 908 /* switch to the specific se/sh/cu */ 909 mutex_lock(&adev->grbm_idx_mutex); 910 amdgpu_gfx_select_se_sh(adev, se, sh, cu); 911 912 x = 0; 913 if (adev->gfx.funcs->read_wave_data) 914 adev->gfx.funcs->read_wave_data(adev, simd, wave, data, &x); 915 916 amdgpu_gfx_select_se_sh(adev, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF); 917 mutex_unlock(&adev->grbm_idx_mutex); 918 919 pm_runtime_mark_last_busy(adev_to_drm(adev)->dev); 920 pm_runtime_put_autosuspend(adev_to_drm(adev)->dev); 921 922 if (!x) { 923 amdgpu_virt_disable_access_debugfs(adev); 924 return -EINVAL; 925 } 926 927 while (size && (offset < x * 4)) { 928 uint32_t value; 929 930 value = data[offset >> 2]; 931 r = put_user(value, (uint32_t *)buf); 932 if (r) { 933 amdgpu_virt_disable_access_debugfs(adev); 934 return r; 935 } 936 937 result += 4; 938 buf += 4; 939 offset += 4; 940 size -= 4; 941 } 942 943 amdgpu_virt_disable_access_debugfs(adev); 944 return result; 945 } 946 947 /** amdgpu_debugfs_gpr_read - Read wave gprs 948 * 949 * @f: open file handle 950 * @buf: User buffer to store read data in 951 * @size: Number of bytes to read 952 * @pos: Offset to seek to 953 * 954 * The offset being sought changes which wave that the status data 955 * will be returned for. The bits are used as follows: 956 * 957 * Bits 0..11: Byte offset into data 958 * Bits 12..19: SE selector 959 * Bits 20..27: SH/SA selector 960 * Bits 28..35: CU/{WGP+SIMD} selector 961 * Bits 36..43: WAVE ID selector 962 * Bits 37..44: SIMD ID selector 963 * Bits 52..59: Thread selector 964 * Bits 60..61: Bank selector (VGPR=0,SGPR=1) 965 * 966 * The return data comes from the SGPR or VGPR register bank for 967 * the selected operational unit. 968 */ 969 static ssize_t amdgpu_debugfs_gpr_read(struct file *f, char __user *buf, 970 size_t size, loff_t *pos) 971 { 972 struct amdgpu_device *adev = f->f_inode->i_private; 973 int r; 974 ssize_t result = 0; 975 uint32_t offset, se, sh, cu, wave, simd, thread, bank, *data; 976 977 if (size > 4096 || size & 3 || *pos & 3) 978 return -EINVAL; 979 980 /* decode offset */ 981 offset = (*pos & GENMASK_ULL(11, 0)) >> 2; 982 se = (*pos & GENMASK_ULL(19, 12)) >> 12; 983 sh = (*pos & GENMASK_ULL(27, 20)) >> 20; 984 cu = (*pos & GENMASK_ULL(35, 28)) >> 28; 985 wave = (*pos & GENMASK_ULL(43, 36)) >> 36; 986 simd = (*pos & GENMASK_ULL(51, 44)) >> 44; 987 thread = (*pos & GENMASK_ULL(59, 52)) >> 52; 988 bank = (*pos & GENMASK_ULL(61, 60)) >> 60; 989 990 data = kcalloc(1024, sizeof(*data), GFP_KERNEL); 991 if (!data) 992 return -ENOMEM; 993 994 r = pm_runtime_get_sync(adev_to_drm(adev)->dev); 995 if (r < 0) 996 goto err; 997 998 r = amdgpu_virt_enable_access_debugfs(adev); 999 if (r < 0) 1000 goto err; 1001 1002 /* switch to the specific se/sh/cu */ 1003 mutex_lock(&adev->grbm_idx_mutex); 1004 amdgpu_gfx_select_se_sh(adev, se, sh, cu); 1005 1006 if (bank == 0) { 1007 if (adev->gfx.funcs->read_wave_vgprs) 1008 adev->gfx.funcs->read_wave_vgprs(adev, simd, wave, thread, offset, size>>2, data); 1009 } else { 1010 if (adev->gfx.funcs->read_wave_sgprs) 1011 adev->gfx.funcs->read_wave_sgprs(adev, simd, wave, offset, size>>2, data); 1012 } 1013 1014 amdgpu_gfx_select_se_sh(adev, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF); 1015 mutex_unlock(&adev->grbm_idx_mutex); 1016 1017 pm_runtime_mark_last_busy(adev_to_drm(adev)->dev); 1018 pm_runtime_put_autosuspend(adev_to_drm(adev)->dev); 1019 1020 while (size) { 1021 uint32_t value; 1022 1023 value = data[result >> 2]; 1024 r = put_user(value, (uint32_t *)buf); 1025 if (r) { 1026 amdgpu_virt_disable_access_debugfs(adev); 1027 goto err; 1028 } 1029 1030 result += 4; 1031 buf += 4; 1032 size -= 4; 1033 } 1034 1035 kfree(data); 1036 amdgpu_virt_disable_access_debugfs(adev); 1037 return result; 1038 1039 err: 1040 pm_runtime_put_autosuspend(adev_to_drm(adev)->dev); 1041 kfree(data); 1042 return r; 1043 } 1044 1045 /** 1046 * amdgpu_debugfs_gfxoff_write - Enable/disable GFXOFF 1047 * 1048 * @f: open file handle 1049 * @buf: User buffer to write data from 1050 * @size: Number of bytes to write 1051 * @pos: Offset to seek to 1052 * 1053 * Write a 32-bit zero to disable or a 32-bit non-zero to enable 1054 */ 1055 static ssize_t amdgpu_debugfs_gfxoff_write(struct file *f, const char __user *buf, 1056 size_t size, loff_t *pos) 1057 { 1058 struct amdgpu_device *adev = file_inode(f)->i_private; 1059 ssize_t result = 0; 1060 int r; 1061 1062 if (size & 0x3 || *pos & 0x3) 1063 return -EINVAL; 1064 1065 r = pm_runtime_get_sync(adev_to_drm(adev)->dev); 1066 if (r < 0) { 1067 pm_runtime_put_autosuspend(adev_to_drm(adev)->dev); 1068 return r; 1069 } 1070 1071 while (size) { 1072 uint32_t value; 1073 1074 r = get_user(value, (uint32_t *)buf); 1075 if (r) 1076 goto out; 1077 1078 amdgpu_gfx_off_ctrl(adev, value ? true : false); 1079 1080 result += 4; 1081 buf += 4; 1082 *pos += 4; 1083 size -= 4; 1084 } 1085 1086 r = result; 1087 out: 1088 pm_runtime_mark_last_busy(adev_to_drm(adev)->dev); 1089 pm_runtime_put_autosuspend(adev_to_drm(adev)->dev); 1090 1091 return r; 1092 } 1093 1094 1095 /** 1096 * amdgpu_debugfs_gfxoff_read - read gfxoff status 1097 * 1098 * @f: open file handle 1099 * @buf: User buffer to store read data in 1100 * @size: Number of bytes to read 1101 * @pos: Offset to seek to 1102 */ 1103 static ssize_t amdgpu_debugfs_gfxoff_read(struct file *f, char __user *buf, 1104 size_t size, loff_t *pos) 1105 { 1106 struct amdgpu_device *adev = file_inode(f)->i_private; 1107 ssize_t result = 0; 1108 int r; 1109 1110 if (size & 0x3 || *pos & 0x3) 1111 return -EINVAL; 1112 1113 r = pm_runtime_get_sync(adev_to_drm(adev)->dev); 1114 if (r < 0) { 1115 pm_runtime_put_autosuspend(adev_to_drm(adev)->dev); 1116 return r; 1117 } 1118 1119 while (size) { 1120 u32 value = adev->gfx.gfx_off_state; 1121 1122 r = put_user(value, (u32 *)buf); 1123 if (r) 1124 goto out; 1125 1126 result += 4; 1127 buf += 4; 1128 *pos += 4; 1129 size -= 4; 1130 } 1131 1132 r = result; 1133 out: 1134 pm_runtime_mark_last_busy(adev_to_drm(adev)->dev); 1135 pm_runtime_put_autosuspend(adev_to_drm(adev)->dev); 1136 1137 return r; 1138 } 1139 1140 static ssize_t amdgpu_debugfs_gfxoff_status_read(struct file *f, char __user *buf, 1141 size_t size, loff_t *pos) 1142 { 1143 struct amdgpu_device *adev = file_inode(f)->i_private; 1144 ssize_t result = 0; 1145 int r; 1146 1147 if (size & 0x3 || *pos & 0x3) 1148 return -EINVAL; 1149 1150 r = pm_runtime_get_sync(adev_to_drm(adev)->dev); 1151 if (r < 0) { 1152 pm_runtime_put_autosuspend(adev_to_drm(adev)->dev); 1153 return r; 1154 } 1155 1156 while (size) { 1157 u32 value; 1158 1159 r = amdgpu_get_gfx_off_status(adev, &value); 1160 if (r) 1161 goto out; 1162 1163 r = put_user(value, (u32 *)buf); 1164 if (r) 1165 goto out; 1166 1167 result += 4; 1168 buf += 4; 1169 *pos += 4; 1170 size -= 4; 1171 } 1172 1173 r = result; 1174 out: 1175 pm_runtime_mark_last_busy(adev_to_drm(adev)->dev); 1176 pm_runtime_put_autosuspend(adev_to_drm(adev)->dev); 1177 1178 return r; 1179 } 1180 1181 static const struct file_operations amdgpu_debugfs_regs2_fops = { 1182 .owner = THIS_MODULE, 1183 .unlocked_ioctl = amdgpu_debugfs_regs2_ioctl, 1184 .read = amdgpu_debugfs_regs2_read, 1185 .write = amdgpu_debugfs_regs2_write, 1186 .open = amdgpu_debugfs_regs2_open, 1187 .release = amdgpu_debugfs_regs2_release, 1188 .llseek = default_llseek 1189 }; 1190 1191 static const struct file_operations amdgpu_debugfs_regs_fops = { 1192 .owner = THIS_MODULE, 1193 .read = amdgpu_debugfs_regs_read, 1194 .write = amdgpu_debugfs_regs_write, 1195 .llseek = default_llseek 1196 }; 1197 static const struct file_operations amdgpu_debugfs_regs_didt_fops = { 1198 .owner = THIS_MODULE, 1199 .read = amdgpu_debugfs_regs_didt_read, 1200 .write = amdgpu_debugfs_regs_didt_write, 1201 .llseek = default_llseek 1202 }; 1203 static const struct file_operations amdgpu_debugfs_regs_pcie_fops = { 1204 .owner = THIS_MODULE, 1205 .read = amdgpu_debugfs_regs_pcie_read, 1206 .write = amdgpu_debugfs_regs_pcie_write, 1207 .llseek = default_llseek 1208 }; 1209 static const struct file_operations amdgpu_debugfs_regs_smc_fops = { 1210 .owner = THIS_MODULE, 1211 .read = amdgpu_debugfs_regs_smc_read, 1212 .write = amdgpu_debugfs_regs_smc_write, 1213 .llseek = default_llseek 1214 }; 1215 1216 static const struct file_operations amdgpu_debugfs_gca_config_fops = { 1217 .owner = THIS_MODULE, 1218 .read = amdgpu_debugfs_gca_config_read, 1219 .llseek = default_llseek 1220 }; 1221 1222 static const struct file_operations amdgpu_debugfs_sensors_fops = { 1223 .owner = THIS_MODULE, 1224 .read = amdgpu_debugfs_sensor_read, 1225 .llseek = default_llseek 1226 }; 1227 1228 static const struct file_operations amdgpu_debugfs_wave_fops = { 1229 .owner = THIS_MODULE, 1230 .read = amdgpu_debugfs_wave_read, 1231 .llseek = default_llseek 1232 }; 1233 static const struct file_operations amdgpu_debugfs_gpr_fops = { 1234 .owner = THIS_MODULE, 1235 .read = amdgpu_debugfs_gpr_read, 1236 .llseek = default_llseek 1237 }; 1238 1239 static const struct file_operations amdgpu_debugfs_gfxoff_fops = { 1240 .owner = THIS_MODULE, 1241 .read = amdgpu_debugfs_gfxoff_read, 1242 .write = amdgpu_debugfs_gfxoff_write, 1243 .llseek = default_llseek 1244 }; 1245 1246 static const struct file_operations amdgpu_debugfs_gfxoff_status_fops = { 1247 .owner = THIS_MODULE, 1248 .read = amdgpu_debugfs_gfxoff_status_read, 1249 .llseek = default_llseek 1250 }; 1251 1252 static const struct file_operations *debugfs_regs[] = { 1253 &amdgpu_debugfs_regs_fops, 1254 &amdgpu_debugfs_regs2_fops, 1255 &amdgpu_debugfs_regs_didt_fops, 1256 &amdgpu_debugfs_regs_pcie_fops, 1257 &amdgpu_debugfs_regs_smc_fops, 1258 &amdgpu_debugfs_gca_config_fops, 1259 &amdgpu_debugfs_sensors_fops, 1260 &amdgpu_debugfs_wave_fops, 1261 &amdgpu_debugfs_gpr_fops, 1262 &amdgpu_debugfs_gfxoff_fops, 1263 &amdgpu_debugfs_gfxoff_status_fops, 1264 }; 1265 1266 static const char *debugfs_regs_names[] = { 1267 "amdgpu_regs", 1268 "amdgpu_regs2", 1269 "amdgpu_regs_didt", 1270 "amdgpu_regs_pcie", 1271 "amdgpu_regs_smc", 1272 "amdgpu_gca_config", 1273 "amdgpu_sensors", 1274 "amdgpu_wave", 1275 "amdgpu_gpr", 1276 "amdgpu_gfxoff", 1277 "amdgpu_gfxoff_status", 1278 }; 1279 1280 /** 1281 * amdgpu_debugfs_regs_init - Initialize debugfs entries that provide 1282 * register access. 1283 * 1284 * @adev: The device to attach the debugfs entries to 1285 */ 1286 int amdgpu_debugfs_regs_init(struct amdgpu_device *adev) 1287 { 1288 struct drm_minor *minor = adev_to_drm(adev)->primary; 1289 struct dentry *ent, *root = minor->debugfs_root; 1290 unsigned int i; 1291 1292 for (i = 0; i < ARRAY_SIZE(debugfs_regs); i++) { 1293 ent = debugfs_create_file(debugfs_regs_names[i], 1294 S_IFREG | S_IRUGO, root, 1295 adev, debugfs_regs[i]); 1296 if (!i && !IS_ERR_OR_NULL(ent)) 1297 i_size_write(ent->d_inode, adev->rmmio_size); 1298 } 1299 1300 return 0; 1301 } 1302 1303 static int amdgpu_debugfs_test_ib_show(struct seq_file *m, void *unused) 1304 { 1305 struct amdgpu_device *adev = (struct amdgpu_device *)m->private; 1306 struct drm_device *dev = adev_to_drm(adev); 1307 int r = 0, i; 1308 1309 r = pm_runtime_get_sync(dev->dev); 1310 if (r < 0) { 1311 pm_runtime_put_autosuspend(dev->dev); 1312 return r; 1313 } 1314 1315 /* Avoid accidently unparking the sched thread during GPU reset */ 1316 r = down_write_killable(&adev->reset_domain->sem); 1317 if (r) 1318 return r; 1319 1320 /* hold on the scheduler */ 1321 for (i = 0; i < AMDGPU_MAX_RINGS; i++) { 1322 struct amdgpu_ring *ring = adev->rings[i]; 1323 1324 if (!ring || !ring->sched.thread) 1325 continue; 1326 kthread_park(ring->sched.thread); 1327 } 1328 1329 seq_printf(m, "run ib test:\n"); 1330 r = amdgpu_ib_ring_tests(adev); 1331 if (r) 1332 seq_printf(m, "ib ring tests failed (%d).\n", r); 1333 else 1334 seq_printf(m, "ib ring tests passed.\n"); 1335 1336 /* go on the scheduler */ 1337 for (i = 0; i < AMDGPU_MAX_RINGS; i++) { 1338 struct amdgpu_ring *ring = adev->rings[i]; 1339 1340 if (!ring || !ring->sched.thread) 1341 continue; 1342 kthread_unpark(ring->sched.thread); 1343 } 1344 1345 up_write(&adev->reset_domain->sem); 1346 1347 pm_runtime_mark_last_busy(dev->dev); 1348 pm_runtime_put_autosuspend(dev->dev); 1349 1350 return 0; 1351 } 1352 1353 static int amdgpu_debugfs_evict_vram(void *data, u64 *val) 1354 { 1355 struct amdgpu_device *adev = (struct amdgpu_device *)data; 1356 struct drm_device *dev = adev_to_drm(adev); 1357 int r; 1358 1359 r = pm_runtime_get_sync(dev->dev); 1360 if (r < 0) { 1361 pm_runtime_put_autosuspend(dev->dev); 1362 return r; 1363 } 1364 1365 *val = amdgpu_ttm_evict_resources(adev, TTM_PL_VRAM); 1366 1367 pm_runtime_mark_last_busy(dev->dev); 1368 pm_runtime_put_autosuspend(dev->dev); 1369 1370 return 0; 1371 } 1372 1373 1374 static int amdgpu_debugfs_evict_gtt(void *data, u64 *val) 1375 { 1376 struct amdgpu_device *adev = (struct amdgpu_device *)data; 1377 struct drm_device *dev = adev_to_drm(adev); 1378 int r; 1379 1380 r = pm_runtime_get_sync(dev->dev); 1381 if (r < 0) { 1382 pm_runtime_put_autosuspend(dev->dev); 1383 return r; 1384 } 1385 1386 *val = amdgpu_ttm_evict_resources(adev, TTM_PL_TT); 1387 1388 pm_runtime_mark_last_busy(dev->dev); 1389 pm_runtime_put_autosuspend(dev->dev); 1390 1391 return 0; 1392 } 1393 1394 static int amdgpu_debugfs_benchmark(void *data, u64 val) 1395 { 1396 struct amdgpu_device *adev = (struct amdgpu_device *)data; 1397 struct drm_device *dev = adev_to_drm(adev); 1398 int r; 1399 1400 r = pm_runtime_get_sync(dev->dev); 1401 if (r < 0) { 1402 pm_runtime_put_autosuspend(dev->dev); 1403 return r; 1404 } 1405 1406 r = amdgpu_benchmark(adev, val); 1407 1408 pm_runtime_mark_last_busy(dev->dev); 1409 pm_runtime_put_autosuspend(dev->dev); 1410 1411 return r; 1412 } 1413 1414 static int amdgpu_debugfs_vm_info_show(struct seq_file *m, void *unused) 1415 { 1416 struct amdgpu_device *adev = (struct amdgpu_device *)m->private; 1417 struct drm_device *dev = adev_to_drm(adev); 1418 struct drm_file *file; 1419 int r; 1420 1421 r = mutex_lock_interruptible(&dev->filelist_mutex); 1422 if (r) 1423 return r; 1424 1425 list_for_each_entry(file, &dev->filelist, lhead) { 1426 struct amdgpu_fpriv *fpriv = file->driver_priv; 1427 struct amdgpu_vm *vm = &fpriv->vm; 1428 1429 seq_printf(m, "pid:%d\tProcess:%s ----------\n", 1430 vm->task_info.pid, vm->task_info.process_name); 1431 r = amdgpu_bo_reserve(vm->root.bo, true); 1432 if (r) 1433 break; 1434 amdgpu_debugfs_vm_bo_info(vm, m); 1435 amdgpu_bo_unreserve(vm->root.bo); 1436 } 1437 1438 mutex_unlock(&dev->filelist_mutex); 1439 1440 return r; 1441 } 1442 1443 DEFINE_SHOW_ATTRIBUTE(amdgpu_debugfs_test_ib); 1444 DEFINE_SHOW_ATTRIBUTE(amdgpu_debugfs_vm_info); 1445 DEFINE_DEBUGFS_ATTRIBUTE(amdgpu_evict_vram_fops, amdgpu_debugfs_evict_vram, 1446 NULL, "%lld\n"); 1447 DEFINE_DEBUGFS_ATTRIBUTE(amdgpu_evict_gtt_fops, amdgpu_debugfs_evict_gtt, 1448 NULL, "%lld\n"); 1449 DEFINE_DEBUGFS_ATTRIBUTE(amdgpu_benchmark_fops, NULL, amdgpu_debugfs_benchmark, 1450 "%lld\n"); 1451 1452 static void amdgpu_ib_preempt_fences_swap(struct amdgpu_ring *ring, 1453 struct dma_fence **fences) 1454 { 1455 struct amdgpu_fence_driver *drv = &ring->fence_drv; 1456 uint32_t sync_seq, last_seq; 1457 1458 last_seq = atomic_read(&ring->fence_drv.last_seq); 1459 sync_seq = ring->fence_drv.sync_seq; 1460 1461 last_seq &= drv->num_fences_mask; 1462 sync_seq &= drv->num_fences_mask; 1463 1464 do { 1465 struct dma_fence *fence, **ptr; 1466 1467 ++last_seq; 1468 last_seq &= drv->num_fences_mask; 1469 ptr = &drv->fences[last_seq]; 1470 1471 fence = rcu_dereference_protected(*ptr, 1); 1472 RCU_INIT_POINTER(*ptr, NULL); 1473 1474 if (!fence) 1475 continue; 1476 1477 fences[last_seq] = fence; 1478 1479 } while (last_seq != sync_seq); 1480 } 1481 1482 static void amdgpu_ib_preempt_signal_fences(struct dma_fence **fences, 1483 int length) 1484 { 1485 int i; 1486 struct dma_fence *fence; 1487 1488 for (i = 0; i < length; i++) { 1489 fence = fences[i]; 1490 if (!fence) 1491 continue; 1492 dma_fence_signal(fence); 1493 dma_fence_put(fence); 1494 } 1495 } 1496 1497 static void amdgpu_ib_preempt_job_recovery(struct drm_gpu_scheduler *sched) 1498 { 1499 struct drm_sched_job *s_job; 1500 struct dma_fence *fence; 1501 1502 spin_lock(&sched->job_list_lock); 1503 list_for_each_entry(s_job, &sched->pending_list, list) { 1504 fence = sched->ops->run_job(s_job); 1505 dma_fence_put(fence); 1506 } 1507 spin_unlock(&sched->job_list_lock); 1508 } 1509 1510 static void amdgpu_ib_preempt_mark_partial_job(struct amdgpu_ring *ring) 1511 { 1512 struct amdgpu_job *job; 1513 struct drm_sched_job *s_job, *tmp; 1514 uint32_t preempt_seq; 1515 struct dma_fence *fence, **ptr; 1516 struct amdgpu_fence_driver *drv = &ring->fence_drv; 1517 struct drm_gpu_scheduler *sched = &ring->sched; 1518 bool preempted = true; 1519 1520 if (ring->funcs->type != AMDGPU_RING_TYPE_GFX) 1521 return; 1522 1523 preempt_seq = le32_to_cpu(*(drv->cpu_addr + 2)); 1524 if (preempt_seq <= atomic_read(&drv->last_seq)) { 1525 preempted = false; 1526 goto no_preempt; 1527 } 1528 1529 preempt_seq &= drv->num_fences_mask; 1530 ptr = &drv->fences[preempt_seq]; 1531 fence = rcu_dereference_protected(*ptr, 1); 1532 1533 no_preempt: 1534 spin_lock(&sched->job_list_lock); 1535 list_for_each_entry_safe(s_job, tmp, &sched->pending_list, list) { 1536 if (dma_fence_is_signaled(&s_job->s_fence->finished)) { 1537 /* remove job from ring_mirror_list */ 1538 list_del_init(&s_job->list); 1539 sched->ops->free_job(s_job); 1540 continue; 1541 } 1542 job = to_amdgpu_job(s_job); 1543 if (preempted && (&job->hw_fence) == fence) 1544 /* mark the job as preempted */ 1545 job->preemption_status |= AMDGPU_IB_PREEMPTED; 1546 } 1547 spin_unlock(&sched->job_list_lock); 1548 } 1549 1550 static int amdgpu_debugfs_ib_preempt(void *data, u64 val) 1551 { 1552 int r, resched, length; 1553 struct amdgpu_ring *ring; 1554 struct dma_fence **fences = NULL; 1555 struct amdgpu_device *adev = (struct amdgpu_device *)data; 1556 1557 if (val >= AMDGPU_MAX_RINGS) 1558 return -EINVAL; 1559 1560 ring = adev->rings[val]; 1561 1562 if (!ring || !ring->funcs->preempt_ib || !ring->sched.thread) 1563 return -EINVAL; 1564 1565 /* the last preemption failed */ 1566 if (ring->trail_seq != le32_to_cpu(*ring->trail_fence_cpu_addr)) 1567 return -EBUSY; 1568 1569 length = ring->fence_drv.num_fences_mask + 1; 1570 fences = kcalloc(length, sizeof(void *), GFP_KERNEL); 1571 if (!fences) 1572 return -ENOMEM; 1573 1574 /* Avoid accidently unparking the sched thread during GPU reset */ 1575 r = down_read_killable(&adev->reset_domain->sem); 1576 if (r) 1577 goto pro_end; 1578 1579 /* stop the scheduler */ 1580 kthread_park(ring->sched.thread); 1581 1582 resched = ttm_bo_lock_delayed_workqueue(&adev->mman.bdev); 1583 1584 /* preempt the IB */ 1585 r = amdgpu_ring_preempt_ib(ring); 1586 if (r) { 1587 DRM_WARN("failed to preempt ring %d\n", ring->idx); 1588 goto failure; 1589 } 1590 1591 amdgpu_fence_process(ring); 1592 1593 if (atomic_read(&ring->fence_drv.last_seq) != 1594 ring->fence_drv.sync_seq) { 1595 DRM_INFO("ring %d was preempted\n", ring->idx); 1596 1597 amdgpu_ib_preempt_mark_partial_job(ring); 1598 1599 /* swap out the old fences */ 1600 amdgpu_ib_preempt_fences_swap(ring, fences); 1601 1602 amdgpu_fence_driver_force_completion(ring); 1603 1604 /* resubmit unfinished jobs */ 1605 amdgpu_ib_preempt_job_recovery(&ring->sched); 1606 1607 /* wait for jobs finished */ 1608 amdgpu_fence_wait_empty(ring); 1609 1610 /* signal the old fences */ 1611 amdgpu_ib_preempt_signal_fences(fences, length); 1612 } 1613 1614 failure: 1615 /* restart the scheduler */ 1616 kthread_unpark(ring->sched.thread); 1617 1618 up_read(&adev->reset_domain->sem); 1619 1620 ttm_bo_unlock_delayed_workqueue(&adev->mman.bdev, resched); 1621 1622 pro_end: 1623 kfree(fences); 1624 1625 return r; 1626 } 1627 1628 static int amdgpu_debugfs_sclk_set(void *data, u64 val) 1629 { 1630 int ret = 0; 1631 uint32_t max_freq, min_freq; 1632 struct amdgpu_device *adev = (struct amdgpu_device *)data; 1633 1634 if (amdgpu_sriov_vf(adev) && !amdgpu_sriov_is_pp_one_vf(adev)) 1635 return -EINVAL; 1636 1637 ret = pm_runtime_get_sync(adev_to_drm(adev)->dev); 1638 if (ret < 0) { 1639 pm_runtime_put_autosuspend(adev_to_drm(adev)->dev); 1640 return ret; 1641 } 1642 1643 ret = amdgpu_dpm_get_dpm_freq_range(adev, PP_SCLK, &min_freq, &max_freq); 1644 if (ret == -EOPNOTSUPP) { 1645 ret = 0; 1646 goto out; 1647 } 1648 if (ret || val > max_freq || val < min_freq) { 1649 ret = -EINVAL; 1650 goto out; 1651 } 1652 1653 ret = amdgpu_dpm_set_soft_freq_range(adev, PP_SCLK, (uint32_t)val, (uint32_t)val); 1654 if (ret) 1655 ret = -EINVAL; 1656 1657 out: 1658 pm_runtime_mark_last_busy(adev_to_drm(adev)->dev); 1659 pm_runtime_put_autosuspend(adev_to_drm(adev)->dev); 1660 1661 return ret; 1662 } 1663 1664 DEFINE_DEBUGFS_ATTRIBUTE(fops_ib_preempt, NULL, 1665 amdgpu_debugfs_ib_preempt, "%llu\n"); 1666 1667 DEFINE_DEBUGFS_ATTRIBUTE(fops_sclk_set, NULL, 1668 amdgpu_debugfs_sclk_set, "%llu\n"); 1669 1670 static ssize_t amdgpu_reset_dump_register_list_read(struct file *f, 1671 char __user *buf, size_t size, loff_t *pos) 1672 { 1673 struct amdgpu_device *adev = (struct amdgpu_device *)file_inode(f)->i_private; 1674 char reg_offset[12]; 1675 int i, ret, len = 0; 1676 1677 if (*pos) 1678 return 0; 1679 1680 memset(reg_offset, 0, 12); 1681 ret = down_read_killable(&adev->reset_domain->sem); 1682 if (ret) 1683 return ret; 1684 1685 for (i = 0; i < adev->num_regs; i++) { 1686 sprintf(reg_offset, "0x%x\n", adev->reset_dump_reg_list[i]); 1687 up_read(&adev->reset_domain->sem); 1688 if (copy_to_user(buf + len, reg_offset, strlen(reg_offset))) 1689 return -EFAULT; 1690 1691 len += strlen(reg_offset); 1692 ret = down_read_killable(&adev->reset_domain->sem); 1693 if (ret) 1694 return ret; 1695 } 1696 1697 up_read(&adev->reset_domain->sem); 1698 *pos += len; 1699 1700 return len; 1701 } 1702 1703 static ssize_t amdgpu_reset_dump_register_list_write(struct file *f, 1704 const char __user *buf, size_t size, loff_t *pos) 1705 { 1706 struct amdgpu_device *adev = (struct amdgpu_device *)file_inode(f)->i_private; 1707 char reg_offset[11]; 1708 uint32_t *new = NULL, *tmp = NULL; 1709 int ret, i = 0, len = 0; 1710 1711 do { 1712 memset(reg_offset, 0, 11); 1713 if (copy_from_user(reg_offset, buf + len, 1714 min(10, ((int)size-len)))) { 1715 ret = -EFAULT; 1716 goto error_free; 1717 } 1718 1719 new = krealloc_array(tmp, i + 1, sizeof(uint32_t), GFP_KERNEL); 1720 if (!new) { 1721 ret = -ENOMEM; 1722 goto error_free; 1723 } 1724 tmp = new; 1725 if (sscanf(reg_offset, "%X %n", &tmp[i], &ret) != 1) { 1726 ret = -EINVAL; 1727 goto error_free; 1728 } 1729 1730 len += ret; 1731 i++; 1732 } while (len < size); 1733 1734 new = kmalloc_array(i, sizeof(uint32_t), GFP_KERNEL); 1735 if (!new) { 1736 ret = -ENOMEM; 1737 goto error_free; 1738 } 1739 ret = down_write_killable(&adev->reset_domain->sem); 1740 if (ret) 1741 goto error_free; 1742 1743 swap(adev->reset_dump_reg_list, tmp); 1744 swap(adev->reset_dump_reg_value, new); 1745 adev->num_regs = i; 1746 up_write(&adev->reset_domain->sem); 1747 ret = size; 1748 1749 error_free: 1750 if (tmp != new) 1751 kfree(tmp); 1752 kfree(new); 1753 return ret; 1754 } 1755 1756 static const struct file_operations amdgpu_reset_dump_register_list = { 1757 .owner = THIS_MODULE, 1758 .read = amdgpu_reset_dump_register_list_read, 1759 .write = amdgpu_reset_dump_register_list_write, 1760 .llseek = default_llseek 1761 }; 1762 1763 int amdgpu_debugfs_init(struct amdgpu_device *adev) 1764 { 1765 struct dentry *root = adev_to_drm(adev)->primary->debugfs_root; 1766 struct dentry *ent; 1767 int r, i; 1768 1769 if (!debugfs_initialized()) 1770 return 0; 1771 1772 debugfs_create_x32("amdgpu_smu_debug", 0600, root, 1773 &adev->pm.smu_debug_mask); 1774 1775 ent = debugfs_create_file("amdgpu_preempt_ib", 0600, root, adev, 1776 &fops_ib_preempt); 1777 if (IS_ERR(ent)) { 1778 DRM_ERROR("unable to create amdgpu_preempt_ib debugsfs file\n"); 1779 return PTR_ERR(ent); 1780 } 1781 1782 ent = debugfs_create_file("amdgpu_force_sclk", 0200, root, adev, 1783 &fops_sclk_set); 1784 if (IS_ERR(ent)) { 1785 DRM_ERROR("unable to create amdgpu_set_sclk debugsfs file\n"); 1786 return PTR_ERR(ent); 1787 } 1788 1789 /* Register debugfs entries for amdgpu_ttm */ 1790 amdgpu_ttm_debugfs_init(adev); 1791 amdgpu_debugfs_pm_init(adev); 1792 amdgpu_debugfs_sa_init(adev); 1793 amdgpu_debugfs_fence_init(adev); 1794 amdgpu_debugfs_gem_init(adev); 1795 1796 r = amdgpu_debugfs_regs_init(adev); 1797 if (r) 1798 DRM_ERROR("registering register debugfs failed (%d).\n", r); 1799 1800 amdgpu_debugfs_firmware_init(adev); 1801 amdgpu_ta_if_debugfs_init(adev); 1802 1803 #if defined(CONFIG_DRM_AMD_DC) 1804 if (amdgpu_device_has_dc_support(adev)) 1805 dtn_debugfs_init(adev); 1806 #endif 1807 1808 for (i = 0; i < AMDGPU_MAX_RINGS; ++i) { 1809 struct amdgpu_ring *ring = adev->rings[i]; 1810 1811 if (!ring) 1812 continue; 1813 1814 amdgpu_debugfs_ring_init(adev, ring); 1815 } 1816 1817 for ( i = 0; i < adev->vcn.num_vcn_inst; i++) { 1818 if (!amdgpu_vcnfw_log) 1819 break; 1820 1821 if (adev->vcn.harvest_config & (1 << i)) 1822 continue; 1823 1824 amdgpu_debugfs_vcn_fwlog_init(adev, i, &adev->vcn.inst[i]); 1825 } 1826 1827 amdgpu_ras_debugfs_create_all(adev); 1828 amdgpu_rap_debugfs_init(adev); 1829 amdgpu_securedisplay_debugfs_init(adev); 1830 amdgpu_fw_attestation_debugfs_init(adev); 1831 1832 debugfs_create_file("amdgpu_evict_vram", 0444, root, adev, 1833 &amdgpu_evict_vram_fops); 1834 debugfs_create_file("amdgpu_evict_gtt", 0444, root, adev, 1835 &amdgpu_evict_gtt_fops); 1836 debugfs_create_file("amdgpu_test_ib", 0444, root, adev, 1837 &amdgpu_debugfs_test_ib_fops); 1838 debugfs_create_file("amdgpu_vm_info", 0444, root, adev, 1839 &amdgpu_debugfs_vm_info_fops); 1840 debugfs_create_file("amdgpu_benchmark", 0200, root, adev, 1841 &amdgpu_benchmark_fops); 1842 debugfs_create_file("amdgpu_reset_dump_register_list", 0644, root, adev, 1843 &amdgpu_reset_dump_register_list); 1844 1845 adev->debugfs_vbios_blob.data = adev->bios; 1846 adev->debugfs_vbios_blob.size = adev->bios_size; 1847 debugfs_create_blob("amdgpu_vbios", 0444, root, 1848 &adev->debugfs_vbios_blob); 1849 1850 adev->debugfs_discovery_blob.data = adev->mman.discovery_bin; 1851 adev->debugfs_discovery_blob.size = adev->mman.discovery_tmr_size; 1852 debugfs_create_blob("amdgpu_discovery", 0444, root, 1853 &adev->debugfs_discovery_blob); 1854 1855 return 0; 1856 } 1857 1858 #else 1859 int amdgpu_debugfs_init(struct amdgpu_device *adev) 1860 { 1861 return 0; 1862 } 1863 int amdgpu_debugfs_regs_init(struct amdgpu_device *adev) 1864 { 1865 return 0; 1866 } 1867 #endif 1868