xref: /linux/drivers/gpu/drm/xe/xe_debugfs.c (revision 1b5d39e6672fdee158c3306f5cb2df8975c77e5a)
1 // SPDX-License-Identifier: MIT
2 /*
3  * Copyright © 2022 Intel Corporation
4  */
5 
6 #include "xe_debugfs.h"
7 
8 #include <linux/debugfs.h>
9 #include <linux/fault-inject.h>
10 #include <linux/string_helpers.h>
11 
12 #include <drm/drm_debugfs.h>
13 
14 #include "regs/xe_pmt.h"
15 #include "xe_bo.h"
16 #include "xe_device.h"
17 #include "xe_force_wake.h"
18 #include "xe_gt_debugfs.h"
19 #include "xe_gt_printk.h"
20 #include "xe_guc_ads.h"
21 #include "xe_mmio.h"
22 #include "xe_pm.h"
23 #include "xe_psmi.h"
24 #include "xe_pxp_debugfs.h"
25 #include "xe_sriov.h"
26 #include "xe_sriov_pf_debugfs.h"
27 #include "xe_sriov_vf.h"
28 #include "xe_step.h"
29 #include "xe_tile_debugfs.h"
30 #include "xe_vsec.h"
31 #include "xe_wa.h"
32 
33 #ifdef CONFIG_DRM_XE_DEBUG
34 #include "xe_bo_evict.h"
35 #include "xe_migrate.h"
36 #include "xe_vm.h"
37 #endif
38 
39 DECLARE_FAULT_ATTR(gt_reset_failure);
40 DECLARE_FAULT_ATTR(inject_csc_hw_error);
41 
42 static void read_residency_counter(struct xe_device *xe, struct xe_mmio *mmio,
43 				   u32 offset, const char *name, struct drm_printer *p)
44 {
45 	u64 residency = 0;
46 	int ret;
47 
48 	ret = xe_pmt_telem_read(to_pci_dev(xe->drm.dev),
49 				xe_mmio_read32(mmio, PUNIT_TELEMETRY_GUID),
50 				&residency, offset, sizeof(residency));
51 	if (ret != sizeof(residency)) {
52 		drm_warn(&xe->drm, "%s counter failed to read, ret %d\n", name, ret);
53 		return;
54 	}
55 
56 	drm_printf(p, "%s : %llu\n", name, residency);
57 }
58 
59 static struct xe_device *node_to_xe(struct drm_info_node *node)
60 {
61 	return to_xe_device(node->minor->dev);
62 }
63 
64 static int info(struct seq_file *m, void *data)
65 {
66 	struct xe_device *xe = node_to_xe(m->private);
67 	struct drm_printer p = drm_seq_file_printer(m);
68 	struct xe_gt *gt;
69 	u8 id;
70 
71 	guard(xe_pm_runtime)(xe);
72 
73 	drm_printf(&p, "graphics_verx100 %d\n", xe->info.graphics_verx100);
74 	drm_printf(&p, "media_verx100 %d\n", xe->info.media_verx100);
75 	drm_printf(&p, "stepping G:%s M:%s B:%s\n",
76 		   xe_step_name(xe->info.step.graphics),
77 		   xe_step_name(xe->info.step.media),
78 		   xe_step_name(xe->info.step.basedie));
79 	drm_printf(&p, "is_dgfx %s\n", str_yes_no(xe->info.is_dgfx));
80 	drm_printf(&p, "platform %d\n", xe->info.platform);
81 	drm_printf(&p, "subplatform %d\n",
82 		   xe->info.subplatform > XE_SUBPLATFORM_NONE ? xe->info.subplatform : 0);
83 	drm_printf(&p, "devid 0x%x\n", xe->info.devid);
84 	drm_printf(&p, "revid %d\n", xe->info.revid);
85 	drm_printf(&p, "tile_count %d\n", xe->info.tile_count);
86 	drm_printf(&p, "vm_max_level %d\n", xe->info.vm_max_level);
87 	drm_printf(&p, "force_execlist %s\n", str_yes_no(xe->info.force_execlist));
88 	drm_printf(&p, "has_flat_ccs %s\n", str_yes_no(xe->info.has_flat_ccs));
89 	drm_printf(&p, "has_usm %s\n", str_yes_no(xe->info.has_usm));
90 	drm_printf(&p, "skip_guc_pc %s\n", str_yes_no(xe->info.skip_guc_pc));
91 	for_each_gt(gt, xe, id) {
92 		drm_printf(&p, "gt%d force wake %d\n", id,
93 			   xe_force_wake_ref(gt_to_fw(gt), XE_FW_GT));
94 		drm_printf(&p, "gt%d engine_mask 0x%llx\n", id,
95 			   gt->info.engine_mask);
96 		drm_printf(&p, "gt%d multi_queue_engine_class_mask 0x%x\n", id,
97 			   gt->info.multi_queue_engine_class_mask);
98 	}
99 
100 	return 0;
101 }
102 
103 static int sriov_info(struct seq_file *m, void *data)
104 {
105 	struct xe_device *xe = node_to_xe(m->private);
106 	struct drm_printer p = drm_seq_file_printer(m);
107 
108 	xe_sriov_print_info(xe, &p);
109 	return 0;
110 }
111 
112 static int workarounds(struct xe_device *xe, struct drm_printer *p)
113 {
114 	guard(xe_pm_runtime)(xe);
115 	xe_wa_device_dump(xe, p);
116 
117 	return 0;
118 }
119 
120 static int workaround_info(struct seq_file *m, void *data)
121 {
122 	struct xe_device *xe = node_to_xe(m->private);
123 	struct drm_printer p = drm_seq_file_printer(m);
124 
125 	workarounds(xe, &p);
126 	return 0;
127 }
128 
129 static int dgfx_pkg_residencies_show(struct seq_file *m, void *data)
130 {
131 	struct xe_device *xe;
132 	struct xe_mmio *mmio;
133 	struct drm_printer p;
134 
135 	xe = node_to_xe(m->private);
136 	p = drm_seq_file_printer(m);
137 	guard(xe_pm_runtime)(xe);
138 	mmio = xe_root_tile_mmio(xe);
139 	static const struct {
140 		u32 offset;
141 		const char *name;
142 	} residencies[] = {
143 		{BMG_G2_RESIDENCY_OFFSET, "Package G2"},
144 		{BMG_G6_RESIDENCY_OFFSET, "Package G6"},
145 		{BMG_G7_RESIDENCY_OFFSET, "Package G7"},
146 		{BMG_G8_RESIDENCY_OFFSET, "Package G8"},
147 		{BMG_G10_RESIDENCY_OFFSET, "Package G10"},
148 		{BMG_MODS_RESIDENCY_OFFSET, "Package ModS"}
149 	};
150 
151 	for (int i = 0; i < ARRAY_SIZE(residencies); i++)
152 		read_residency_counter(xe, mmio, residencies[i].offset, residencies[i].name, &p);
153 
154 	return 0;
155 }
156 
157 static int dgfx_pcie_link_residencies_show(struct seq_file *m, void *data)
158 {
159 	struct xe_device *xe;
160 	struct xe_mmio *mmio;
161 	struct drm_printer p;
162 
163 	xe = node_to_xe(m->private);
164 	p = drm_seq_file_printer(m);
165 	guard(xe_pm_runtime)(xe);
166 	mmio = xe_root_tile_mmio(xe);
167 
168 	static const struct {
169 		u32 offset;
170 		const char *name;
171 	} residencies[] = {
172 		{BMG_PCIE_LINK_L0_RESIDENCY_OFFSET, "PCIE LINK L0 RESIDENCY"},
173 		{BMG_PCIE_LINK_L1_RESIDENCY_OFFSET, "PCIE LINK L1 RESIDENCY"},
174 		{BMG_PCIE_LINK_L1_2_RESIDENCY_OFFSET, "PCIE LINK L1.2 RESIDENCY"}
175 	};
176 
177 	for (int i = 0; i < ARRAY_SIZE(residencies); i++)
178 		read_residency_counter(xe, mmio, residencies[i].offset, residencies[i].name, &p);
179 
180 	return 0;
181 }
182 
183 static const struct drm_info_list debugfs_list[] = {
184 	{"info", info, 0},
185 	{ .name = "sriov_info", .show = sriov_info, },
186 	{ .name = "workarounds", .show = workaround_info, },
187 };
188 
189 static const struct drm_info_list debugfs_residencies[] = {
190 	{ .name = "dgfx_pkg_residencies", .show = dgfx_pkg_residencies_show, },
191 	{ .name = "dgfx_pcie_link_residencies", .show = dgfx_pcie_link_residencies_show, },
192 };
193 
194 static int forcewake_open(struct inode *inode, struct file *file)
195 {
196 	struct xe_device *xe = inode->i_private;
197 	struct xe_gt *gt;
198 	u8 id, last_gt;
199 	unsigned int fw_ref;
200 
201 	xe_pm_runtime_get(xe);
202 	for_each_gt(gt, xe, id) {
203 		last_gt = id;
204 
205 		fw_ref = xe_force_wake_get(gt_to_fw(gt), XE_FORCEWAKE_ALL);
206 		if (!xe_force_wake_ref_has_domain(fw_ref, XE_FORCEWAKE_ALL))
207 			goto err_fw_get;
208 	}
209 
210 	return 0;
211 
212 err_fw_get:
213 	for_each_gt(gt, xe, id) {
214 		if (id < last_gt)
215 			xe_force_wake_put(gt_to_fw(gt), XE_FORCEWAKE_ALL);
216 		else if (id == last_gt)
217 			xe_force_wake_put(gt_to_fw(gt), fw_ref);
218 		else
219 			break;
220 	}
221 
222 	xe_pm_runtime_put(xe);
223 	return -ETIMEDOUT;
224 }
225 
226 static int forcewake_release(struct inode *inode, struct file *file)
227 {
228 	struct xe_device *xe = inode->i_private;
229 	struct xe_gt *gt;
230 	u8 id;
231 
232 	for_each_gt(gt, xe, id)
233 		xe_force_wake_put(gt_to_fw(gt), XE_FORCEWAKE_ALL);
234 	xe_pm_runtime_put(xe);
235 
236 	return 0;
237 }
238 
239 static const struct file_operations forcewake_all_fops = {
240 	.owner = THIS_MODULE,
241 	.open = forcewake_open,
242 	.release = forcewake_release,
243 };
244 
245 static ssize_t wedged_mode_show(struct file *f, char __user *ubuf,
246 				size_t size, loff_t *pos)
247 {
248 	struct xe_device *xe = file_inode(f)->i_private;
249 	char buf[32];
250 	int len = 0;
251 
252 	len = scnprintf(buf, sizeof(buf), "%d\n", xe->wedged.mode);
253 
254 	return simple_read_from_buffer(ubuf, size, pos, buf, len);
255 }
256 
257 static ssize_t wedged_mode_set(struct file *f, const char __user *ubuf,
258 			       size_t size, loff_t *pos)
259 {
260 	struct xe_device *xe = file_inode(f)->i_private;
261 	struct xe_gt *gt;
262 	u32 wedged_mode;
263 	ssize_t ret;
264 	u8 id;
265 
266 	ret = kstrtouint_from_user(ubuf, size, 0, &wedged_mode);
267 	if (ret)
268 		return ret;
269 
270 	if (wedged_mode > 2)
271 		return -EINVAL;
272 
273 	if (xe->wedged.mode == wedged_mode)
274 		return size;
275 
276 	xe->wedged.mode = wedged_mode;
277 
278 	guard(xe_pm_runtime)(xe);
279 	for_each_gt(gt, xe, id) {
280 		ret = xe_guc_ads_scheduler_policy_toggle_reset(&gt->uc.guc.ads);
281 		if (ret) {
282 			xe_gt_err(gt, "Failed to update GuC ADS scheduler policy. GuC may still cause engine reset even with wedged_mode=2\n");
283 			return -EIO;
284 		}
285 	}
286 
287 	return size;
288 }
289 
290 static const struct file_operations wedged_mode_fops = {
291 	.owner = THIS_MODULE,
292 	.read = wedged_mode_show,
293 	.write = wedged_mode_set,
294 };
295 
296 static ssize_t atomic_svm_timeslice_ms_show(struct file *f, char __user *ubuf,
297 					    size_t size, loff_t *pos)
298 {
299 	struct xe_device *xe = file_inode(f)->i_private;
300 	char buf[32];
301 	int len = 0;
302 
303 	len = scnprintf(buf, sizeof(buf), "%d\n", xe->atomic_svm_timeslice_ms);
304 
305 	return simple_read_from_buffer(ubuf, size, pos, buf, len);
306 }
307 
308 static ssize_t atomic_svm_timeslice_ms_set(struct file *f,
309 					   const char __user *ubuf,
310 					   size_t size, loff_t *pos)
311 {
312 	struct xe_device *xe = file_inode(f)->i_private;
313 	u32 atomic_svm_timeslice_ms;
314 	ssize_t ret;
315 
316 	ret = kstrtouint_from_user(ubuf, size, 0, &atomic_svm_timeslice_ms);
317 	if (ret)
318 		return ret;
319 
320 	xe->atomic_svm_timeslice_ms = atomic_svm_timeslice_ms;
321 
322 	return size;
323 }
324 
325 static const struct file_operations atomic_svm_timeslice_ms_fops = {
326 	.owner = THIS_MODULE,
327 	.read = atomic_svm_timeslice_ms_show,
328 	.write = atomic_svm_timeslice_ms_set,
329 };
330 
331 static ssize_t disable_late_binding_show(struct file *f, char __user *ubuf,
332 					 size_t size, loff_t *pos)
333 {
334 	struct xe_device *xe = file_inode(f)->i_private;
335 	struct xe_late_bind *late_bind = &xe->late_bind;
336 	char buf[32];
337 	int len;
338 
339 	len = scnprintf(buf, sizeof(buf), "%d\n", late_bind->disable);
340 
341 	return simple_read_from_buffer(ubuf, size, pos, buf, len);
342 }
343 
344 static ssize_t disable_late_binding_set(struct file *f, const char __user *ubuf,
345 					size_t size, loff_t *pos)
346 {
347 	struct xe_device *xe = file_inode(f)->i_private;
348 	struct xe_late_bind *late_bind = &xe->late_bind;
349 	bool val;
350 	int ret;
351 
352 	ret = kstrtobool_from_user(ubuf, size, &val);
353 	if (ret)
354 		return ret;
355 
356 	late_bind->disable = val;
357 	return size;
358 }
359 
360 static const struct file_operations disable_late_binding_fops = {
361 	.owner = THIS_MODULE,
362 	.read = disable_late_binding_show,
363 	.write = disable_late_binding_set,
364 };
365 
366 void xe_debugfs_register(struct xe_device *xe)
367 {
368 	struct ttm_device *bdev = &xe->ttm;
369 	struct drm_minor *minor = xe->drm.primary;
370 	struct dentry *root = minor->debugfs_root;
371 	struct ttm_resource_manager *man;
372 	struct xe_tile *tile;
373 	struct xe_gt *gt;
374 	u8 tile_id;
375 	u8 id;
376 
377 	drm_debugfs_create_files(debugfs_list,
378 				 ARRAY_SIZE(debugfs_list),
379 				 root, minor);
380 
381 	if (xe->info.platform == XE_BATTLEMAGE && !IS_SRIOV_VF(xe)) {
382 		drm_debugfs_create_files(debugfs_residencies,
383 					 ARRAY_SIZE(debugfs_residencies),
384 					 root, minor);
385 		fault_create_debugfs_attr("inject_csc_hw_error", root,
386 					  &inject_csc_hw_error);
387 	}
388 
389 	debugfs_create_file("forcewake_all", 0400, root, xe,
390 			    &forcewake_all_fops);
391 
392 	debugfs_create_file("wedged_mode", 0600, root, xe,
393 			    &wedged_mode_fops);
394 
395 	debugfs_create_file("atomic_svm_timeslice_ms", 0600, root, xe,
396 			    &atomic_svm_timeslice_ms_fops);
397 
398 	debugfs_create_file("disable_late_binding", 0600, root, xe,
399 			    &disable_late_binding_fops);
400 
401 	man = ttm_manager_type(bdev, XE_PL_TT);
402 	ttm_resource_manager_create_debugfs(man, root, "gtt_mm");
403 
404 	man = ttm_manager_type(bdev, XE_PL_STOLEN);
405 	if (man)
406 		ttm_resource_manager_create_debugfs(man, root, "stolen_mm");
407 
408 	for_each_tile(tile, xe, tile_id)
409 		xe_tile_debugfs_register(tile);
410 
411 	for_each_gt(gt, xe, id)
412 		xe_gt_debugfs_register(gt);
413 
414 	xe_pxp_debugfs_register(xe->pxp);
415 
416 	xe_psmi_debugfs_register(xe);
417 
418 	fault_create_debugfs_attr("fail_gt_reset", root, &gt_reset_failure);
419 
420 	if (IS_SRIOV_PF(xe))
421 		xe_sriov_pf_debugfs_register(xe, root);
422 	else if (IS_SRIOV_VF(xe))
423 		xe_sriov_vf_debugfs_register(xe, root);
424 }
425