1 | /* |
2 | * Copyright 2014 Advanced Micro Devices, Inc. |
3 | * |
4 | * Permission is hereby granted, free of charge, to any person obtaining a |
5 | * copy of this software and associated documentation files (the "Software"), |
6 | * to deal in the Software without restriction, including without limitation |
7 | * the rights to use, copy, modify, merge, publish, distribute, sublicense, |
8 | * and/or sell copies of the Software, and to permit persons to whom the |
9 | * Software is furnished to do so, subject to the following conditions: |
10 | * |
11 | * The above copyright notice and this permission notice shall be included in |
12 | * all copies or substantial portions of the Software. |
13 | * |
14 | * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR |
15 | * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, |
16 | * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL |
17 | * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR |
18 | * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, |
19 | * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR |
20 | * OTHER DEALINGS IN THE SOFTWARE. |
21 | * |
22 | */ |
23 | |
24 | #ifndef KFD_DBGMGR_H_ |
25 | #define KFD_DBGMGR_H_ |
26 | |
27 | #include "kfd_priv.h" |
28 | |
29 | /* must align with hsakmttypes definition */ |
30 | #pragma pack(push, 4) |
31 | |
32 | enum HSA_DBG_WAVEOP { |
33 | HSA_DBG_WAVEOP_HALT = 1, /* Halts a wavefront */ |
34 | HSA_DBG_WAVEOP_RESUME = 2, /* Resumes a wavefront */ |
35 | HSA_DBG_WAVEOP_KILL = 3, /* Kills a wavefront */ |
36 | HSA_DBG_WAVEOP_DEBUG = 4, /* Causes wavefront to enter dbg mode */ |
37 | HSA_DBG_WAVEOP_TRAP = 5, /* Causes wavefront to take a trap */ |
38 | HSA_DBG_NUM_WAVEOP = 5, |
39 | HSA_DBG_MAX_WAVEOP = 0xFFFFFFFF |
40 | }; |
41 | |
42 | enum HSA_DBG_WAVEMODE { |
43 | /* send command to a single wave */ |
44 | HSA_DBG_WAVEMODE_SINGLE = 0, |
45 | /* |
46 | * Broadcast to all wavefronts of all processes is not |
47 | * supported for HSA user mode |
48 | */ |
49 | |
50 | /* send to waves within current process */ |
51 | HSA_DBG_WAVEMODE_BROADCAST_PROCESS = 2, |
52 | /* send to waves within current process on CU */ |
53 | HSA_DBG_WAVEMODE_BROADCAST_PROCESS_CU = 3, |
54 | HSA_DBG_NUM_WAVEMODE = 3, |
55 | HSA_DBG_MAX_WAVEMODE = 0xFFFFFFFF |
56 | }; |
57 | |
58 | enum HSA_DBG_WAVEMSG_TYPE { |
59 | HSA_DBG_WAVEMSG_AUTO = 0, |
60 | HSA_DBG_WAVEMSG_USER = 1, |
61 | HSA_DBG_WAVEMSG_ERROR = 2, |
62 | HSA_DBG_NUM_WAVEMSG, |
63 | HSA_DBG_MAX_WAVEMSG = 0xFFFFFFFF |
64 | }; |
65 | |
66 | enum HSA_DBG_WATCH_MODE { |
67 | HSA_DBG_WATCH_READ = 0, /* Read operations only */ |
68 | HSA_DBG_WATCH_NONREAD = 1, /* Write or Atomic operations only */ |
69 | HSA_DBG_WATCH_ATOMIC = 2, /* Atomic Operations only */ |
70 | HSA_DBG_WATCH_ALL = 3, /* Read, Write or Atomic operations */ |
71 | HSA_DBG_WATCH_NUM, |
72 | HSA_DBG_WATCH_SIZE = 0xFFFFFFFF |
73 | }; |
74 | |
75 | /* This structure is hardware specific and may change in the future */ |
76 | struct HsaDbgWaveMsgAMDGen2 { |
77 | union { |
78 | struct ui32 { |
79 | uint32_t UserData:8; /* user data */ |
80 | uint32_t ShaderArray:1; /* Shader array */ |
81 | uint32_t Priv:1; /* Privileged */ |
82 | uint32_t Reserved0:4; /* Reserved, should be 0 */ |
83 | uint32_t WaveId:4; /* wave id */ |
84 | uint32_t SIMD:2; /* SIMD id */ |
85 | uint32_t HSACU:4; /* Compute unit */ |
86 | uint32_t ShaderEngine:2;/* Shader engine */ |
87 | uint32_t MessageType:2; /* see HSA_DBG_WAVEMSG_TYPE */ |
88 | uint32_t Reserved1:4; /* Reserved, should be 0 */ |
89 | } ui32; |
90 | uint32_t Value; |
91 | }; |
92 | uint32_t Reserved2; |
93 | }; |
94 | |
95 | union HsaDbgWaveMessageAMD { |
96 | struct HsaDbgWaveMsgAMDGen2 WaveMsgInfoGen2; |
97 | /* for future HsaDbgWaveMsgAMDGen3; */ |
98 | }; |
99 | |
100 | struct HsaDbgWaveMessage { |
101 | void *MemoryVA; /* ptr to associated host-accessible data */ |
102 | union HsaDbgWaveMessageAMD DbgWaveMsg; |
103 | }; |
104 | |
105 | /* |
106 | * TODO: This definitions to be MOVED to kfd_event, once it is implemented. |
107 | * |
108 | * HSA sync primitive, Event and HW Exception notification API definitions. |
109 | * The API functions allow the runtime to define a so-called sync-primitive, |
110 | * a SW object combining a user-mode provided "syncvar" and a scheduler event |
111 | * that can be signaled through a defined GPU interrupt. A syncvar is |
112 | * a process virtual memory location of a certain size that can be accessed |
113 | * by CPU and GPU shader code within the process to set and query the content |
114 | * within that memory. The definition of the content is determined by the HSA |
115 | * runtime and potentially GPU shader code interfacing with the HSA runtime. |
116 | * The syncvar values may be commonly written through an PM4 WRITE_DATA packet |
117 | * in the user mode instruction stream. The OS scheduler event is typically |
118 | * associated and signaled by an interrupt issued by the GPU, but other HSA |
119 | * system interrupt conditions from other HW (e.g. IOMMUv2) may be surfaced |
120 | * by the KFD by this mechanism, too. |
121 | */ |
122 | |
123 | /* these are the new definitions for events */ |
124 | enum HSA_EVENTTYPE { |
125 | HSA_EVENTTYPE_SIGNAL = 0, /* user-mode generated GPU signal */ |
126 | HSA_EVENTTYPE_NODECHANGE = 1, /* HSA node change (attach/detach) */ |
127 | HSA_EVENTTYPE_DEVICESTATECHANGE = 2, /* HSA device state change |
128 | * (start/stop) |
129 | */ |
130 | HSA_EVENTTYPE_HW_EXCEPTION = 3, /* GPU shader exception event */ |
131 | HSA_EVENTTYPE_SYSTEM_EVENT = 4, /* GPU SYSCALL with parameter info */ |
132 | HSA_EVENTTYPE_DEBUG_EVENT = 5, /* GPU signal for debugging */ |
133 | HSA_EVENTTYPE_PROFILE_EVENT = 6,/* GPU signal for profiling */ |
134 | HSA_EVENTTYPE_QUEUE_EVENT = 7, /* GPU signal queue idle state |
135 | * (EOP pm4) |
136 | */ |
137 | /* ... */ |
138 | HSA_EVENTTYPE_MAXID, |
139 | HSA_EVENTTYPE_TYPE_SIZE = 0xFFFFFFFF |
140 | }; |
141 | |
142 | /* Sub-definitions for various event types: Syncvar */ |
143 | struct HsaSyncVar { |
144 | union SyncVar { |
145 | void *UserData; /* pointer to user mode data */ |
146 | uint64_t UserDataPtrValue; /* 64bit compatibility of value */ |
147 | } SyncVar; |
148 | uint64_t SyncVarSize; |
149 | }; |
150 | |
151 | /* Sub-definitions for various event types: NodeChange */ |
152 | |
153 | enum HSA_EVENTTYPE_NODECHANGE_FLAGS { |
154 | HSA_EVENTTYPE_NODECHANGE_ADD = 0, |
155 | HSA_EVENTTYPE_NODECHANGE_REMOVE = 1, |
156 | HSA_EVENTTYPE_NODECHANGE_SIZE = 0xFFFFFFFF |
157 | }; |
158 | |
159 | struct HsaNodeChange { |
160 | /* HSA node added/removed on the platform */ |
161 | enum HSA_EVENTTYPE_NODECHANGE_FLAGS Flags; |
162 | }; |
163 | |
164 | /* Sub-definitions for various event types: DeviceStateChange */ |
165 | enum HSA_EVENTTYPE_DEVICESTATECHANGE_FLAGS { |
166 | /* device started (and available) */ |
167 | HSA_EVENTTYPE_DEVICESTATUSCHANGE_START = 0, |
168 | /* device stopped (i.e. unavailable) */ |
169 | HSA_EVENTTYPE_DEVICESTATUSCHANGE_STOP = 1, |
170 | HSA_EVENTTYPE_DEVICESTATUSCHANGE_SIZE = 0xFFFFFFFF |
171 | }; |
172 | |
173 | enum HSA_DEVICE { |
174 | HSA_DEVICE_CPU = 0, |
175 | HSA_DEVICE_GPU = 1, |
176 | MAX_HSA_DEVICE = 2 |
177 | }; |
178 | |
179 | struct HsaDeviceStateChange { |
180 | uint32_t NodeId; /* F-NUMA node that contains the device */ |
181 | enum HSA_DEVICE Device; /* device type: GPU or CPU */ |
182 | enum HSA_EVENTTYPE_DEVICESTATECHANGE_FLAGS Flags; /* event flags */ |
183 | }; |
184 | |
185 | struct HsaEventData { |
186 | enum HSA_EVENTTYPE EventType; /* event type */ |
187 | union EventData { |
188 | /* |
189 | * return data associated with HSA_EVENTTYPE_SIGNAL |
190 | * and other events |
191 | */ |
192 | struct HsaSyncVar SyncVar; |
193 | |
194 | /* data associated with HSA_EVENTTYPE_NODE_CHANGE */ |
195 | struct HsaNodeChange NodeChangeState; |
196 | |
197 | /* data associated with HSA_EVENTTYPE_DEVICE_STATE_CHANGE */ |
198 | struct HsaDeviceStateChange DeviceState; |
199 | } EventData; |
200 | |
201 | /* the following data entries are internal to the KFD & thunk itself */ |
202 | |
203 | /* internal thunk store for Event data (OsEventHandle) */ |
204 | uint64_t HWData1; |
205 | /* internal thunk store for Event data (HWAddress) */ |
206 | uint64_t HWData2; |
207 | /* internal thunk store for Event data (HWData) */ |
208 | uint32_t HWData3; |
209 | }; |
210 | |
211 | struct HsaEventDescriptor { |
212 | /* event type to allocate */ |
213 | enum HSA_EVENTTYPE EventType; |
214 | /* H-NUMA node containing GPU device that is event source */ |
215 | uint32_t NodeId; |
216 | /* pointer to user mode syncvar data, syncvar->UserDataPtrValue |
217 | * may be NULL |
218 | */ |
219 | struct HsaSyncVar SyncVar; |
220 | }; |
221 | |
222 | struct HsaEvent { |
223 | uint32_t EventId; |
224 | struct HsaEventData EventData; |
225 | }; |
226 | |
227 | #pragma pack(pop) |
228 | |
229 | enum DBGDEV_TYPE { |
230 | DBGDEV_TYPE_ILLEGAL = 0, |
231 | DBGDEV_TYPE_NODIQ = 1, |
232 | DBGDEV_TYPE_DIQ = 2, |
233 | DBGDEV_TYPE_TEST = 3 |
234 | }; |
235 | |
236 | struct dbg_address_watch_info { |
237 | struct kfd_process *process; |
238 | enum HSA_DBG_WATCH_MODE *watch_mode; |
239 | uint64_t *watch_address; |
240 | uint64_t *watch_mask; |
241 | struct HsaEvent *watch_event; |
242 | uint32_t num_watch_points; |
243 | }; |
244 | |
245 | struct dbg_wave_control_info { |
246 | struct kfd_process *process; |
247 | uint32_t trapId; |
248 | enum HSA_DBG_WAVEOP operand; |
249 | enum HSA_DBG_WAVEMODE mode; |
250 | struct HsaDbgWaveMessage dbgWave_msg; |
251 | }; |
252 | |
253 | struct kfd_dbgdev { |
254 | |
255 | /* The device that owns this data. */ |
256 | struct kfd_dev *dev; |
257 | |
258 | /* kernel queue for DIQ */ |
259 | struct kernel_queue *kq; |
260 | |
261 | /* a pointer to the pqm of the calling process */ |
262 | struct process_queue_manager *pqm; |
263 | |
264 | /* type of debug device ( DIQ, non DIQ, etc. ) */ |
265 | enum DBGDEV_TYPE type; |
266 | |
267 | /* virtualized function pointers to device dbg */ |
268 | int (*dbgdev_register)(struct kfd_dbgdev *dbgdev); |
269 | int (*dbgdev_unregister)(struct kfd_dbgdev *dbgdev); |
270 | int (*dbgdev_address_watch)(struct kfd_dbgdev *dbgdev, |
271 | struct dbg_address_watch_info *adw_info); |
272 | int (*dbgdev_wave_control)(struct kfd_dbgdev *dbgdev, |
273 | struct dbg_wave_control_info *wac_info); |
274 | |
275 | }; |
276 | |
277 | struct kfd_dbgmgr { |
278 | unsigned int pasid; |
279 | struct kfd_dev *dev; |
280 | struct kfd_dbgdev *dbgdev; |
281 | }; |
282 | |
283 | /* prototypes for debug manager functions */ |
284 | struct mutex *kfd_get_dbgmgr_mutex(void); |
285 | void kfd_dbgmgr_destroy(struct kfd_dbgmgr *pmgr); |
286 | bool kfd_dbgmgr_create(struct kfd_dbgmgr **ppmgr, struct kfd_dev *pdev); |
287 | long kfd_dbgmgr_register(struct kfd_dbgmgr *pmgr, struct kfd_process *p); |
288 | long kfd_dbgmgr_unregister(struct kfd_dbgmgr *pmgr, struct kfd_process *p); |
289 | long kfd_dbgmgr_wave_control(struct kfd_dbgmgr *pmgr, |
290 | struct dbg_wave_control_info *wac_info); |
291 | long kfd_dbgmgr_address_watch(struct kfd_dbgmgr *pmgr, |
292 | struct dbg_address_watch_info *adw_info); |
293 | #endif /* KFD_DBGMGR_H_ */ |
294 | |