/*
 * Copyright 2023 Advanced Micro Devices, Inc.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
 * OTHER DEALINGS IN THE SOFTWARE.
 */
220ab2d753SJonathan Kim 
230ab2d753SJonathan Kim #ifndef KFD_DEBUG_EVENTS_H_INCLUDED
240ab2d753SJonathan Kim #define KFD_DEBUG_EVENTS_H_INCLUDED
250ab2d753SJonathan Kim 
260ab2d753SJonathan Kim #include "kfd_priv.h"
270ab2d753SJonathan Kim 
28455227c4SJonathan Kim void kfd_dbg_trap_deactivate(struct kfd_process *target, bool unwind, int unwind_count);
29455227c4SJonathan Kim int kfd_dbg_trap_activate(struct kfd_process *target);
305bc20c22SJonathan Kim int kfd_dbg_ev_query_debug_event(struct kfd_process *process,
315bc20c22SJonathan Kim 			unsigned int *queue_id,
325bc20c22SJonathan Kim 			unsigned int *gpu_id,
335bc20c22SJonathan Kim 			uint64_t exception_clear_mask,
345bc20c22SJonathan Kim 			uint64_t *event_status);
3512fb1ad7SJonathan Kim bool kfd_set_dbg_ev_from_interrupt(struct kfd_node *dev,
3612fb1ad7SJonathan Kim 				   unsigned int pasid,
3712fb1ad7SJonathan Kim 				   uint32_t doorbell_id,
3812fb1ad7SJonathan Kim 				   uint64_t trap_mask,
3912fb1ad7SJonathan Kim 				   void *exception_data,
4012fb1ad7SJonathan Kim 				   size_t exception_data_size);
4144b87bb0SJonathan Kim bool kfd_dbg_ev_raise(uint64_t event_mask,
4244b87bb0SJonathan Kim 			struct kfd_process *process, struct kfd_node *dev,
4344b87bb0SJonathan Kim 			unsigned int source_id, bool use_worker,
4444b87bb0SJonathan Kim 			void *exception_data,
4544b87bb0SJonathan Kim 			size_t exception_data_size);
460ab2d753SJonathan Kim int kfd_dbg_trap_disable(struct kfd_process *target);
470ab2d753SJonathan Kim int kfd_dbg_trap_enable(struct kfd_process *target, uint32_t fd,
480ab2d753SJonathan Kim 			void __user *runtime_info,
490ab2d753SJonathan Kim 			uint32_t *runtime_info_size);
50101827e1SJonathan Kim int kfd_dbg_trap_set_wave_launch_override(struct kfd_process *target,
51101827e1SJonathan Kim 					uint32_t trap_override,
52101827e1SJonathan Kim 					uint32_t trap_mask_bits,
53101827e1SJonathan Kim 					uint32_t trap_mask_request,
54101827e1SJonathan Kim 					uint32_t *trap_mask_prev,
55101827e1SJonathan Kim 					uint32_t *trap_mask_supported);
56aea1b473SJonathan Kim int kfd_dbg_trap_set_wave_launch_mode(struct kfd_process *target,
57aea1b473SJonathan Kim 					uint8_t wave_launch_mode);
58e0f85f46SJonathan Kim int kfd_dbg_trap_clear_dev_address_watch(struct kfd_process_device *pdd,
59e0f85f46SJonathan Kim 					uint32_t watch_id);
60e0f85f46SJonathan Kim int kfd_dbg_trap_set_dev_address_watch(struct kfd_process_device *pdd,
61e0f85f46SJonathan Kim 					uint64_t watch_address,
62e0f85f46SJonathan Kim 					uint32_t watch_address_mask,
63e0f85f46SJonathan Kim 					uint32_t *watch_id,
64e0f85f46SJonathan Kim 					uint32_t watch_mode);
65103d5f08SJonathan Kim int kfd_dbg_trap_set_flags(struct kfd_process *target, uint32_t *flags);
662b36de97SJonathan Kim int kfd_dbg_trap_query_exception_info(struct kfd_process *target,
672b36de97SJonathan Kim 		uint32_t source_id,
682b36de97SJonathan Kim 		uint32_t exception_code,
692b36de97SJonathan Kim 		bool clear_exception,
702b36de97SJonathan Kim 		void __user *info,
712b36de97SJonathan Kim 		uint32_t *info_size);
72c2d2588cSJonathan Kim int kfd_dbg_send_exception_to_runtime(struct kfd_process *p,
73c2d2588cSJonathan Kim 					unsigned int dev_id,
74c2d2588cSJonathan Kim 					unsigned int queue_id,
75c2d2588cSJonathan Kim 					uint64_t error_reason);
76c2d2588cSJonathan Kim 
/*
 * Return true when the device's GC IP version is exactly 9.4.2 or 9.4.3,
 * or is 11.0.0 or newer; false for every other version.
 */
static inline bool kfd_dbg_is_per_vmid_supported(struct kfd_node *dev)
{
	if (KFD_GC_VERSION(dev) == IP_VERSION(9, 4, 2))
		return true;

	if (KFD_GC_VERSION(dev) == IP_VERSION(9, 4, 3))
		return true;

	/* Anything from GC 11.0.0 upwards also qualifies. */
	return KFD_GC_VERSION(dev) >= IP_VERSION(11, 0, 0);
}
830de4ec9aSJonathan Kim 
8444b87bb0SJonathan Kim void debug_event_write_work_handler(struct work_struct *work);
8512976e6aSJonathan Kim int kfd_dbg_trap_device_snapshot(struct kfd_process *target,
8612976e6aSJonathan Kim 		uint64_t exception_clear_mask,
8712976e6aSJonathan Kim 		void __user *user_info,
8812976e6aSJonathan Kim 		uint32_t *number_of_device_infos,
8912976e6aSJonathan Kim 		uint32_t *entry_size);
9044b87bb0SJonathan Kim 
91e90bf919SJonathan Kim void kfd_dbg_set_enabled_debug_exception_mask(struct kfd_process *target,
92e90bf919SJonathan Kim 					uint64_t exception_set_mask);
/*
 * Chips that lack RLC restore support for the debug registers keep GFX off
 * temporarily disabled for the entire debug session whenever GFX off is
 * enabled.  See disable_on_trap_action_entry and enable_on_trap_action_exit
 * for details.
 *
 * Only GC 10.1.10 and GC 10.1.1 are reported as lacking that support; every
 * other GC version returns true.
 */
static inline bool kfd_dbg_is_rlc_restore_supported(struct kfd_node *dev)
{
	return KFD_GC_VERSION(dev) != IP_VERSION(10, 1, 10) &&
	       KFD_GC_VERSION(dev) != IP_VERSION(10, 1, 1);
}
10321889582SJonathan Kim 
/*
 * Return true only when the device's GC IP version lies in the closed range
 * [11.0.0, 11.0.3].  The workaround itself is implemented elsewhere; this
 * helper only identifies the affected versions.
 */
static inline bool kfd_dbg_has_cwsr_workaround(struct kfd_node *dev)
{
	/* Below the affected range. */
	if (KFD_GC_VERSION(dev) < IP_VERSION(11, 0, 0))
		return false;

	return KFD_GC_VERSION(dev) <= IP_VERSION(11, 0, 3);
}
109cef600e1SJonathan Kim 
kfd_dbg_has_gws_support(struct kfd_node * dev)11021889582SJonathan Kim static inline bool kfd_dbg_has_gws_support(struct kfd_node *dev)
11121889582SJonathan Kim {
11221889582SJonathan Kim 	if ((KFD_GC_VERSION(dev) == IP_VERSION(9, 0, 1)
11321889582SJonathan Kim 			&& dev->kfd->mec2_fw_version < 0x81b6) ||
11421889582SJonathan Kim 		(KFD_GC_VERSION(dev) >= IP_VERSION(9, 1, 0)
11521889582SJonathan Kim 			&& KFD_GC_VERSION(dev) <= IP_VERSION(9, 2, 2)
11621889582SJonathan Kim 			&& dev->kfd->mec2_fw_version < 0x1b6) ||
11721889582SJonathan Kim 		(KFD_GC_VERSION(dev) == IP_VERSION(9, 4, 0)
11821889582SJonathan Kim 			&& dev->kfd->mec2_fw_version < 0x1b6) ||
11921889582SJonathan Kim 		(KFD_GC_VERSION(dev) == IP_VERSION(9, 4, 1)
12021889582SJonathan Kim 			&& dev->kfd->mec2_fw_version < 0x30) ||
12121889582SJonathan Kim 		(KFD_GC_VERSION(dev) >= IP_VERSION(11, 0, 0) &&
12221889582SJonathan Kim 			KFD_GC_VERSION(dev) < IP_VERSION(12, 0, 0)))
12321889582SJonathan Kim 		return false;
12421889582SJonathan Kim 
12521889582SJonathan Kim 	/* Assume debugging and cooperative launch supported otherwise. */
12621889582SJonathan Kim 	return true;
12721889582SJonathan Kim }
128455227c4SJonathan Kim 
/*
 * NOTE(review): going by the name, this sets the MES debug mode for the
 * given process device; the effect of sq_trap_en is defined by the
 * implementation -- confirm there.
 */
int kfd_dbg_set_mes_debug_mode(struct kfd_process_device *pdd,
			       bool sq_trap_en);
130*fc7f1d96SJonathan Kim 
kfd_dbg_has_ttmps_always_setup(struct kfd_node * dev)131*fc7f1d96SJonathan Kim static inline bool kfd_dbg_has_ttmps_always_setup(struct kfd_node *dev)
132*fc7f1d96SJonathan Kim {
133*fc7f1d96SJonathan Kim 	return (KFD_GC_VERSION(dev) < IP_VERSION(11, 0, 0) &&
134*fc7f1d96SJonathan Kim 			KFD_GC_VERSION(dev) != IP_VERSION(9, 4, 2)) ||
135*fc7f1d96SJonathan Kim 	       (KFD_GC_VERSION(dev) >= IP_VERSION(11, 0, 0) &&
136*fc7f1d96SJonathan Kim 			KFD_GC_VERSION(dev) < IP_VERSION(12, 0, 0) &&
137*fc7f1d96SJonathan Kim 			(dev->adev->mes.sched_version & AMDGPU_MES_VERSION_MASK) >= 70);
138*fc7f1d96SJonathan Kim }
1390ab2d753SJonathan Kim #endif
140