xref: /linux/drivers/gpu/drm/amd/pm/amdgpu_pm.c (revision c532de5a67a70f8533d495f8f2aaa9a0491c3ad0)
1 /*
2  * Copyright 2017 Advanced Micro Devices, Inc.
3  *
4  * Permission is hereby granted, free of charge, to any person obtaining a
5  * copy of this software and associated documentation files (the "Software"),
6  * to deal in the Software without restriction, including without limitation
7  * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8  * and/or sell copies of the Software, and to permit persons to whom the
9  * Software is furnished to do so, subject to the following conditions:
10  *
11  * The above copyright notice and this permission notice shall be included in
12  * all copies or substantial portions of the Software.
13  *
14  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
15  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
16  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
17  * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
18  * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
19  * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
20  * OTHER DEALINGS IN THE SOFTWARE.
21  *
22  * Authors: Rafał Miłecki <zajec5@gmail.com>
23  *          Alex Deucher <alexdeucher@gmail.com>
24  */
25 
26 #include "amdgpu.h"
27 #include "amdgpu_drv.h"
28 #include "amdgpu_pm.h"
29 #include "amdgpu_dpm.h"
30 #include "atom.h"
31 #include <linux/pci.h>
32 #include <linux/hwmon.h>
33 #include <linux/hwmon-sysfs.h>
34 #include <linux/nospec.h>
35 #include <linux/pm_runtime.h>
36 #include <asm/processor.h>
37 
38 #define MAX_NUM_OF_FEATURES_PER_SUBSET		8
39 #define MAX_NUM_OF_SUBSETS			8
40 
41 #define DEVICE_ATTR_IS(_name)		(attr_id == device_attr_id__##_name)
42 
43 struct od_attribute {
44 	struct kobj_attribute	attribute;
45 	struct list_head	entry;
46 };
47 
48 struct od_kobj {
49 	struct kobject		kobj;
50 	struct list_head	entry;
51 	struct list_head	attribute;
52 	void			*priv;
53 };
54 
55 struct od_feature_ops {
56 	umode_t (*is_visible)(struct amdgpu_device *adev);
57 	ssize_t (*show)(struct kobject *kobj, struct kobj_attribute *attr,
58 			char *buf);
59 	ssize_t (*store)(struct kobject *kobj, struct kobj_attribute *attr,
60 			 const char *buf, size_t count);
61 };
62 
63 struct od_feature_item {
64 	const char		*name;
65 	struct od_feature_ops	ops;
66 };
67 
68 struct od_feature_container {
69 	char				*name;
70 	struct od_feature_ops		ops;
71 	struct od_feature_item		sub_feature[MAX_NUM_OF_FEATURES_PER_SUBSET];
72 };
73 
74 struct od_feature_set {
75 	struct od_feature_container	containers[MAX_NUM_OF_SUBSETS];
76 };
77 
78 static const struct hwmon_temp_label {
79 	enum PP_HWMON_TEMP channel;
80 	const char *label;
81 } temp_label[] = {
82 	{PP_TEMP_EDGE, "edge"},
83 	{PP_TEMP_JUNCTION, "junction"},
84 	{PP_TEMP_MEM, "mem"},
85 };
86 
87 const char * const amdgpu_pp_profile_name[] = {
88 	"BOOTUP_DEFAULT",
89 	"3D_FULL_SCREEN",
90 	"POWER_SAVING",
91 	"VIDEO",
92 	"VR",
93 	"COMPUTE",
94 	"CUSTOM",
95 	"WINDOW_3D",
96 	"CAPPED",
97 	"UNCAPPED",
98 };
99 
100 /**
101  * DOC: power_dpm_state
102  *
103  * The power_dpm_state file is a legacy interface and is only provided for
104  * backwards compatibility. The amdgpu driver provides a sysfs API for adjusting
105  * certain power related parameters.  The file power_dpm_state is used for this.
106  * It accepts the following arguments:
107  *
108  * - battery
109  *
110  * - balanced
111  *
112  * - performance
113  *
114  * battery
115  *
116  * On older GPUs, the vbios provided a special power state for battery
117  * operation.  Selecting battery switched to this state.  This is no
118  * longer provided on newer GPUs so the option does nothing in that case.
119  *
120  * balanced
121  *
122  * On older GPUs, the vbios provided a special power state for balanced
123  * operation.  Selecting balanced switched to this state.  This is no
124  * longer provided on newer GPUs so the option does nothing in that case.
125  *
126  * performance
127  *
128  * On older GPUs, the vbios provided a special power state for performance
129  * operation.  Selecting performance switched to this state.  This is no
130  * longer provided on newer GPUs so the option does nothing in that case.
131  *
132  */
133 
134 static ssize_t amdgpu_get_power_dpm_state(struct device *dev,
135 					  struct device_attribute *attr,
136 					  char *buf)
137 {
138 	struct drm_device *ddev = dev_get_drvdata(dev);
139 	struct amdgpu_device *adev = drm_to_adev(ddev);
140 	enum amd_pm_state_type pm;
141 	int ret;
142 
143 	if (amdgpu_in_reset(adev))
144 		return -EPERM;
145 	if (adev->in_suspend && !adev->in_runpm)
146 		return -EPERM;
147 
148 	ret = pm_runtime_get_sync(ddev->dev);
149 	if (ret < 0) {
150 		pm_runtime_put_autosuspend(ddev->dev);
151 		return ret;
152 	}
153 
154 	amdgpu_dpm_get_current_power_state(adev, &pm);
155 
156 	pm_runtime_mark_last_busy(ddev->dev);
157 	pm_runtime_put_autosuspend(ddev->dev);
158 
159 	return sysfs_emit(buf, "%s\n",
160 			  (pm == POWER_STATE_TYPE_BATTERY) ? "battery" :
161 			  (pm == POWER_STATE_TYPE_BALANCED) ? "balanced" : "performance");
162 }
163 
164 static ssize_t amdgpu_set_power_dpm_state(struct device *dev,
165 					  struct device_attribute *attr,
166 					  const char *buf,
167 					  size_t count)
168 {
169 	struct drm_device *ddev = dev_get_drvdata(dev);
170 	struct amdgpu_device *adev = drm_to_adev(ddev);
171 	enum amd_pm_state_type  state;
172 	int ret;
173 
174 	if (amdgpu_in_reset(adev))
175 		return -EPERM;
176 	if (adev->in_suspend && !adev->in_runpm)
177 		return -EPERM;
178 
179 	if (strncmp("battery", buf, strlen("battery")) == 0)
180 		state = POWER_STATE_TYPE_BATTERY;
181 	else if (strncmp("balanced", buf, strlen("balanced")) == 0)
182 		state = POWER_STATE_TYPE_BALANCED;
183 	else if (strncmp("performance", buf, strlen("performance")) == 0)
184 		state = POWER_STATE_TYPE_PERFORMANCE;
185 	else
186 		return -EINVAL;
187 
188 	ret = pm_runtime_get_sync(ddev->dev);
189 	if (ret < 0) {
190 		pm_runtime_put_autosuspend(ddev->dev);
191 		return ret;
192 	}
193 
194 	amdgpu_dpm_set_power_state(adev, state);
195 
196 	pm_runtime_mark_last_busy(ddev->dev);
197 	pm_runtime_put_autosuspend(ddev->dev);
198 
199 	return count;
200 }
201 
202 
203 /**
204  * DOC: power_dpm_force_performance_level
205  *
206  * The amdgpu driver provides a sysfs API for adjusting certain power
207  * related parameters.  The file power_dpm_force_performance_level is
208  * used for this.  It accepts the following arguments:
209  *
210  * - auto
211  *
212  * - low
213  *
214  * - high
215  *
216  * - manual
217  *
218  * - profile_standard
219  *
220  * - profile_min_sclk
221  *
222  * - profile_min_mclk
223  *
224  * - profile_peak
225  *
226  * auto
227  *
228  * When auto is selected, the driver will attempt to dynamically select
229  * the optimal power profile for current conditions in the driver.
230  *
231  * low
232  *
233  * When low is selected, the clocks are forced to the lowest power state.
234  *
235  * high
236  *
237  * When high is selected, the clocks are forced to the highest power state.
238  *
239  * manual
240  *
241  * When manual is selected, the user can manually adjust which power states
242  * are enabled for each clock domain via the sysfs pp_dpm_mclk, pp_dpm_sclk,
243  * and pp_dpm_pcie files and adjust the power state transition heuristics
244  * via the pp_power_profile_mode sysfs file.
245  *
246  * profile_standard
247  * profile_min_sclk
248  * profile_min_mclk
249  * profile_peak
250  *
251  * When the profiling modes are selected, clock and power gating are
252  * disabled and the clocks are set for different profiling cases. This
253  * mode is recommended for profiling specific work loads where you do
254  * not want clock or power gating for clock fluctuation to interfere
255  * with your results. profile_standard sets the clocks to a fixed clock
256  * level which varies from asic to asic.  profile_min_sclk forces the sclk
257  * to the lowest level.  profile_min_mclk forces the mclk to the lowest level.
258  * profile_peak sets all clocks (mclk, sclk, pcie) to the highest levels.
259  *
260  */
261 
262 static ssize_t amdgpu_get_power_dpm_force_performance_level(struct device *dev,
263 							    struct device_attribute *attr,
264 							    char *buf)
265 {
266 	struct drm_device *ddev = dev_get_drvdata(dev);
267 	struct amdgpu_device *adev = drm_to_adev(ddev);
268 	enum amd_dpm_forced_level level = 0xff;
269 	int ret;
270 
271 	if (amdgpu_in_reset(adev))
272 		return -EPERM;
273 	if (adev->in_suspend && !adev->in_runpm)
274 		return -EPERM;
275 
276 	ret = pm_runtime_get_sync(ddev->dev);
277 	if (ret < 0) {
278 		pm_runtime_put_autosuspend(ddev->dev);
279 		return ret;
280 	}
281 
282 	level = amdgpu_dpm_get_performance_level(adev);
283 
284 	pm_runtime_mark_last_busy(ddev->dev);
285 	pm_runtime_put_autosuspend(ddev->dev);
286 
287 	return sysfs_emit(buf, "%s\n",
288 			  (level == AMD_DPM_FORCED_LEVEL_AUTO) ? "auto" :
289 			  (level == AMD_DPM_FORCED_LEVEL_LOW) ? "low" :
290 			  (level == AMD_DPM_FORCED_LEVEL_HIGH) ? "high" :
291 			  (level == AMD_DPM_FORCED_LEVEL_MANUAL) ? "manual" :
292 			  (level == AMD_DPM_FORCED_LEVEL_PROFILE_STANDARD) ? "profile_standard" :
293 			  (level == AMD_DPM_FORCED_LEVEL_PROFILE_MIN_SCLK) ? "profile_min_sclk" :
294 			  (level == AMD_DPM_FORCED_LEVEL_PROFILE_MIN_MCLK) ? "profile_min_mclk" :
295 			  (level == AMD_DPM_FORCED_LEVEL_PROFILE_PEAK) ? "profile_peak" :
296 			  (level == AMD_DPM_FORCED_LEVEL_PERF_DETERMINISM) ? "perf_determinism" :
297 			  "unknown");
298 }
299 
300 static ssize_t amdgpu_set_power_dpm_force_performance_level(struct device *dev,
301 							    struct device_attribute *attr,
302 							    const char *buf,
303 							    size_t count)
304 {
305 	struct drm_device *ddev = dev_get_drvdata(dev);
306 	struct amdgpu_device *adev = drm_to_adev(ddev);
307 	enum amd_dpm_forced_level level;
308 	int ret = 0;
309 
310 	if (amdgpu_in_reset(adev))
311 		return -EPERM;
312 	if (adev->in_suspend && !adev->in_runpm)
313 		return -EPERM;
314 
315 	if (strncmp("low", buf, strlen("low")) == 0) {
316 		level = AMD_DPM_FORCED_LEVEL_LOW;
317 	} else if (strncmp("high", buf, strlen("high")) == 0) {
318 		level = AMD_DPM_FORCED_LEVEL_HIGH;
319 	} else if (strncmp("auto", buf, strlen("auto")) == 0) {
320 		level = AMD_DPM_FORCED_LEVEL_AUTO;
321 	} else if (strncmp("manual", buf, strlen("manual")) == 0) {
322 		level = AMD_DPM_FORCED_LEVEL_MANUAL;
323 	} else if (strncmp("profile_exit", buf, strlen("profile_exit")) == 0) {
324 		level = AMD_DPM_FORCED_LEVEL_PROFILE_EXIT;
325 	} else if (strncmp("profile_standard", buf, strlen("profile_standard")) == 0) {
326 		level = AMD_DPM_FORCED_LEVEL_PROFILE_STANDARD;
327 	} else if (strncmp("profile_min_sclk", buf, strlen("profile_min_sclk")) == 0) {
328 		level = AMD_DPM_FORCED_LEVEL_PROFILE_MIN_SCLK;
329 	} else if (strncmp("profile_min_mclk", buf, strlen("profile_min_mclk")) == 0) {
330 		level = AMD_DPM_FORCED_LEVEL_PROFILE_MIN_MCLK;
331 	} else if (strncmp("profile_peak", buf, strlen("profile_peak")) == 0) {
332 		level = AMD_DPM_FORCED_LEVEL_PROFILE_PEAK;
333 	} else if (strncmp("perf_determinism", buf, strlen("perf_determinism")) == 0) {
334 		level = AMD_DPM_FORCED_LEVEL_PERF_DETERMINISM;
335 	}  else {
336 		return -EINVAL;
337 	}
338 
339 	ret = pm_runtime_get_sync(ddev->dev);
340 	if (ret < 0) {
341 		pm_runtime_put_autosuspend(ddev->dev);
342 		return ret;
343 	}
344 
345 	mutex_lock(&adev->pm.stable_pstate_ctx_lock);
346 	if (amdgpu_dpm_force_performance_level(adev, level)) {
347 		pm_runtime_mark_last_busy(ddev->dev);
348 		pm_runtime_put_autosuspend(ddev->dev);
349 		mutex_unlock(&adev->pm.stable_pstate_ctx_lock);
350 		return -EINVAL;
351 	}
352 	/* override whatever a user ctx may have set */
353 	adev->pm.stable_pstate_ctx = NULL;
354 	mutex_unlock(&adev->pm.stable_pstate_ctx_lock);
355 
356 	pm_runtime_mark_last_busy(ddev->dev);
357 	pm_runtime_put_autosuspend(ddev->dev);
358 
359 	return count;
360 }
361 
362 static ssize_t amdgpu_get_pp_num_states(struct device *dev,
363 		struct device_attribute *attr,
364 		char *buf)
365 {
366 	struct drm_device *ddev = dev_get_drvdata(dev);
367 	struct amdgpu_device *adev = drm_to_adev(ddev);
368 	struct pp_states_info data;
369 	uint32_t i;
370 	int buf_len, ret;
371 
372 	if (amdgpu_in_reset(adev))
373 		return -EPERM;
374 	if (adev->in_suspend && !adev->in_runpm)
375 		return -EPERM;
376 
377 	ret = pm_runtime_get_sync(ddev->dev);
378 	if (ret < 0) {
379 		pm_runtime_put_autosuspend(ddev->dev);
380 		return ret;
381 	}
382 
383 	if (amdgpu_dpm_get_pp_num_states(adev, &data))
384 		memset(&data, 0, sizeof(data));
385 
386 	pm_runtime_mark_last_busy(ddev->dev);
387 	pm_runtime_put_autosuspend(ddev->dev);
388 
389 	buf_len = sysfs_emit(buf, "states: %d\n", data.nums);
390 	for (i = 0; i < data.nums; i++)
391 		buf_len += sysfs_emit_at(buf, buf_len, "%d %s\n", i,
392 				(data.states[i] == POWER_STATE_TYPE_INTERNAL_BOOT) ? "boot" :
393 				(data.states[i] == POWER_STATE_TYPE_BATTERY) ? "battery" :
394 				(data.states[i] == POWER_STATE_TYPE_BALANCED) ? "balanced" :
395 				(data.states[i] == POWER_STATE_TYPE_PERFORMANCE) ? "performance" : "default");
396 
397 	return buf_len;
398 }
399 
400 static ssize_t amdgpu_get_pp_cur_state(struct device *dev,
401 		struct device_attribute *attr,
402 		char *buf)
403 {
404 	struct drm_device *ddev = dev_get_drvdata(dev);
405 	struct amdgpu_device *adev = drm_to_adev(ddev);
406 	struct pp_states_info data = {0};
407 	enum amd_pm_state_type pm = 0;
408 	int i = 0, ret = 0;
409 
410 	if (amdgpu_in_reset(adev))
411 		return -EPERM;
412 	if (adev->in_suspend && !adev->in_runpm)
413 		return -EPERM;
414 
415 	ret = pm_runtime_get_sync(ddev->dev);
416 	if (ret < 0) {
417 		pm_runtime_put_autosuspend(ddev->dev);
418 		return ret;
419 	}
420 
421 	amdgpu_dpm_get_current_power_state(adev, &pm);
422 
423 	ret = amdgpu_dpm_get_pp_num_states(adev, &data);
424 
425 	pm_runtime_mark_last_busy(ddev->dev);
426 	pm_runtime_put_autosuspend(ddev->dev);
427 
428 	if (ret)
429 		return ret;
430 
431 	for (i = 0; i < data.nums; i++) {
432 		if (pm == data.states[i])
433 			break;
434 	}
435 
436 	if (i == data.nums)
437 		i = -EINVAL;
438 
439 	return sysfs_emit(buf, "%d\n", i);
440 }
441 
442 static ssize_t amdgpu_get_pp_force_state(struct device *dev,
443 		struct device_attribute *attr,
444 		char *buf)
445 {
446 	struct drm_device *ddev = dev_get_drvdata(dev);
447 	struct amdgpu_device *adev = drm_to_adev(ddev);
448 
449 	if (amdgpu_in_reset(adev))
450 		return -EPERM;
451 	if (adev->in_suspend && !adev->in_runpm)
452 		return -EPERM;
453 
454 	if (adev->pm.pp_force_state_enabled)
455 		return amdgpu_get_pp_cur_state(dev, attr, buf);
456 	else
457 		return sysfs_emit(buf, "\n");
458 }
459 
460 static ssize_t amdgpu_set_pp_force_state(struct device *dev,
461 		struct device_attribute *attr,
462 		const char *buf,
463 		size_t count)
464 {
465 	struct drm_device *ddev = dev_get_drvdata(dev);
466 	struct amdgpu_device *adev = drm_to_adev(ddev);
467 	enum amd_pm_state_type state = 0;
468 	struct pp_states_info data;
469 	unsigned long idx;
470 	int ret;
471 
472 	if (amdgpu_in_reset(adev))
473 		return -EPERM;
474 	if (adev->in_suspend && !adev->in_runpm)
475 		return -EPERM;
476 
477 	adev->pm.pp_force_state_enabled = false;
478 
479 	if (strlen(buf) == 1)
480 		return count;
481 
482 	ret = kstrtoul(buf, 0, &idx);
483 	if (ret || idx >= ARRAY_SIZE(data.states))
484 		return -EINVAL;
485 
486 	idx = array_index_nospec(idx, ARRAY_SIZE(data.states));
487 
488 	ret = pm_runtime_get_sync(ddev->dev);
489 	if (ret < 0) {
490 		pm_runtime_put_autosuspend(ddev->dev);
491 		return ret;
492 	}
493 
494 	ret = amdgpu_dpm_get_pp_num_states(adev, &data);
495 	if (ret)
496 		goto err_out;
497 
498 	state = data.states[idx];
499 
500 	/* only set user selected power states */
501 	if (state != POWER_STATE_TYPE_INTERNAL_BOOT &&
502 	    state != POWER_STATE_TYPE_DEFAULT) {
503 		ret = amdgpu_dpm_dispatch_task(adev,
504 				AMD_PP_TASK_ENABLE_USER_STATE, &state);
505 		if (ret)
506 			goto err_out;
507 
508 		adev->pm.pp_force_state_enabled = true;
509 	}
510 
511 	pm_runtime_mark_last_busy(ddev->dev);
512 	pm_runtime_put_autosuspend(ddev->dev);
513 
514 	return count;
515 
516 err_out:
517 	pm_runtime_mark_last_busy(ddev->dev);
518 	pm_runtime_put_autosuspend(ddev->dev);
519 	return ret;
520 }
521 
522 /**
523  * DOC: pp_table
524  *
525  * The amdgpu driver provides a sysfs API for uploading new powerplay
526  * tables.  The file pp_table is used for this.  Reading the file
527  * will dump the current power play table.  Writing to the file
528  * will attempt to upload a new powerplay table and re-initialize
529  * powerplay using that new table.
530  *
531  */
532 
533 static ssize_t amdgpu_get_pp_table(struct device *dev,
534 		struct device_attribute *attr,
535 		char *buf)
536 {
537 	struct drm_device *ddev = dev_get_drvdata(dev);
538 	struct amdgpu_device *adev = drm_to_adev(ddev);
539 	char *table = NULL;
540 	int size, ret;
541 
542 	if (amdgpu_in_reset(adev))
543 		return -EPERM;
544 	if (adev->in_suspend && !adev->in_runpm)
545 		return -EPERM;
546 
547 	ret = pm_runtime_get_sync(ddev->dev);
548 	if (ret < 0) {
549 		pm_runtime_put_autosuspend(ddev->dev);
550 		return ret;
551 	}
552 
553 	size = amdgpu_dpm_get_pp_table(adev, &table);
554 
555 	pm_runtime_mark_last_busy(ddev->dev);
556 	pm_runtime_put_autosuspend(ddev->dev);
557 
558 	if (size <= 0)
559 		return size;
560 
561 	if (size >= PAGE_SIZE)
562 		size = PAGE_SIZE - 1;
563 
564 	memcpy(buf, table, size);
565 
566 	return size;
567 }
568 
569 static ssize_t amdgpu_set_pp_table(struct device *dev,
570 		struct device_attribute *attr,
571 		const char *buf,
572 		size_t count)
573 {
574 	struct drm_device *ddev = dev_get_drvdata(dev);
575 	struct amdgpu_device *adev = drm_to_adev(ddev);
576 	int ret = 0;
577 
578 	if (amdgpu_in_reset(adev))
579 		return -EPERM;
580 	if (adev->in_suspend && !adev->in_runpm)
581 		return -EPERM;
582 
583 	ret = pm_runtime_get_sync(ddev->dev);
584 	if (ret < 0) {
585 		pm_runtime_put_autosuspend(ddev->dev);
586 		return ret;
587 	}
588 
589 	ret = amdgpu_dpm_set_pp_table(adev, buf, count);
590 
591 	pm_runtime_mark_last_busy(ddev->dev);
592 	pm_runtime_put_autosuspend(ddev->dev);
593 
594 	if (ret)
595 		return ret;
596 
597 	return count;
598 }
599 
600 /**
601  * DOC: pp_od_clk_voltage
602  *
603  * The amdgpu driver provides a sysfs API for adjusting the clocks and voltages
604  * in each power level within a power state.  The pp_od_clk_voltage is used for
605  * this.
606  *
607  * Note that the actual memory controller clock rate are exposed, not
608  * the effective memory clock of the DRAMs. To translate it, use the
609  * following formula:
610  *
611  * Clock conversion (Mhz):
612  *
613  * HBM: effective_memory_clock = memory_controller_clock * 1
614  *
615  * G5: effective_memory_clock = memory_controller_clock * 1
616  *
617  * G6: effective_memory_clock = memory_controller_clock * 2
618  *
619  * DRAM data rate (MT/s):
620  *
621  * HBM: effective_memory_clock * 2 = data_rate
622  *
623  * G5: effective_memory_clock * 4 = data_rate
624  *
625  * G6: effective_memory_clock * 8 = data_rate
626  *
627  * Bandwidth (MB/s):
628  *
629  * data_rate * vram_bit_width / 8 = memory_bandwidth
630  *
631  * Some examples:
632  *
633  * G5 on RX460:
634  *
635  * memory_controller_clock = 1750 Mhz
636  *
637  * effective_memory_clock = 1750 Mhz * 1 = 1750 Mhz
638  *
639  * data rate = 1750 * 4 = 7000 MT/s
640  *
641  * memory_bandwidth = 7000 * 128 bits / 8 = 112000 MB/s
642  *
643  * G6 on RX5700:
644  *
645  * memory_controller_clock = 875 Mhz
646  *
647  * effective_memory_clock = 875 Mhz * 2 = 1750 Mhz
648  *
649  * data rate = 1750 * 8 = 14000 MT/s
650  *
651  * memory_bandwidth = 14000 * 256 bits / 8 = 448000 MB/s
652  *
653  * < For Vega10 and previous ASICs >
654  *
655  * Reading the file will display:
656  *
657  * - a list of engine clock levels and voltages labeled OD_SCLK
658  *
659  * - a list of memory clock levels and voltages labeled OD_MCLK
660  *
661  * - a list of valid ranges for sclk, mclk, and voltage labeled OD_RANGE
662  *
663  * To manually adjust these settings, first select manual using
664  * power_dpm_force_performance_level. Enter a new value for each
665  * level by writing a string that contains "s/m level clock voltage" to
666  * the file.  E.g., "s 1 500 820" will update sclk level 1 to be 500 MHz
667  * at 820 mV; "m 0 350 810" will update mclk level 0 to be 350 MHz at
668  * 810 mV.  When you have edited all of the states as needed, write
669  * "c" (commit) to the file to commit your changes.  If you want to reset to the
670  * default power levels, write "r" (reset) to the file to reset them.
671  *
672  *
673  * < For Vega20 and newer ASICs >
674  *
675  * Reading the file will display:
676  *
677  * - minimum and maximum engine clock labeled OD_SCLK
678  *
679  * - minimum(not available for Vega20 and Navi1x) and maximum memory
680  *   clock labeled OD_MCLK
681  *
682  * - three <frequency, voltage> points labeled OD_VDDC_CURVE.
683  *   They can be used to calibrate the sclk voltage curve. This is
684  *   available for Vega20 and NV1X.
685  *
686  * - voltage offset(in mV) applied on target voltage calculation.
687  *   This is available for Sienna Cichlid, Navy Flounder, Dimgrey
688  *   Cavefish and some later SMU13 ASICs. For these ASICs, the target
689  *   voltage calculation can be illustrated by "voltage = voltage
690  *   calculated from v/f curve + overdrive vddgfx offset"
691  *
692  * - a list of valid ranges for sclk, mclk, voltage curve points
693  *   or voltage offset labeled OD_RANGE
694  *
695  * < For APUs >
696  *
697  * Reading the file will display:
698  *
699  * - minimum and maximum engine clock labeled OD_SCLK
700  *
701  * - a list of valid ranges for sclk labeled OD_RANGE
702  *
703  * < For VanGogh >
704  *
705  * Reading the file will display:
706  *
707  * - minimum and maximum engine clock labeled OD_SCLK
708  * - minimum and maximum core clocks labeled OD_CCLK
709  *
710  * - a list of valid ranges for sclk and cclk labeled OD_RANGE
711  *
712  * To manually adjust these settings:
713  *
714  * - First select manual using power_dpm_force_performance_level
715  *
716  * - For clock frequency setting, enter a new value by writing a
717  *   string that contains "s/m index clock" to the file. The index
718  *   should be 0 if to set minimum clock. And 1 if to set maximum
719  *   clock. E.g., "s 0 500" will update minimum sclk to be 500 MHz.
720  *   "m 1 800" will update maximum mclk to be 800Mhz. For core
721  *   clocks on VanGogh, the string contains "p core index clock".
722  *   E.g., "p 2 0 800" would set the minimum core clock on core
723  *   2 to 800Mhz.
724  *
725  *   For sclk voltage curve supported by Vega20 and NV1X, enter the new
726  *   values by writing a string that contains "vc point clock voltage"
727  *   to the file. The points are indexed by 0, 1 and 2. E.g., "vc 0 300
728  *   600" will update point1 with clock set as 300Mhz and voltage as 600mV.
729  *   "vc 2 1000 1000" will update point3 with clock set as 1000Mhz and
730  *   voltage 1000mV.
731  *
732  *   For voltage offset supported by Sienna Cichlid, Navy Flounder, Dimgrey
733  *   Cavefish and some later SMU13 ASICs, enter the new value by writing a
734  *   string that contains "vo offset". E.g., "vo -10" will update the extra
735  *   voltage offset applied to the whole v/f curve line as -10mv.
736  *
737  * - When you have edited all of the states as needed, write "c" (commit)
738  *   to the file to commit your changes
739  *
740  * - If you want to reset to the default power levels, write "r" (reset)
741  *   to the file to reset them
742  *
743  */
744 
745 static ssize_t amdgpu_set_pp_od_clk_voltage(struct device *dev,
746 		struct device_attribute *attr,
747 		const char *buf,
748 		size_t count)
749 {
750 	struct drm_device *ddev = dev_get_drvdata(dev);
751 	struct amdgpu_device *adev = drm_to_adev(ddev);
752 	int ret;
753 	uint32_t parameter_size = 0;
754 	long parameter[64];
755 	char buf_cpy[128];
756 	char *tmp_str;
757 	char *sub_str;
758 	const char delimiter[3] = {' ', '\n', '\0'};
759 	uint32_t type;
760 
761 	if (amdgpu_in_reset(adev))
762 		return -EPERM;
763 	if (adev->in_suspend && !adev->in_runpm)
764 		return -EPERM;
765 
766 	if (count > 127 || count == 0)
767 		return -EINVAL;
768 
769 	if (*buf == 's')
770 		type = PP_OD_EDIT_SCLK_VDDC_TABLE;
771 	else if (*buf == 'p')
772 		type = PP_OD_EDIT_CCLK_VDDC_TABLE;
773 	else if (*buf == 'm')
774 		type = PP_OD_EDIT_MCLK_VDDC_TABLE;
775 	else if (*buf == 'r')
776 		type = PP_OD_RESTORE_DEFAULT_TABLE;
777 	else if (*buf == 'c')
778 		type = PP_OD_COMMIT_DPM_TABLE;
779 	else if (!strncmp(buf, "vc", 2))
780 		type = PP_OD_EDIT_VDDC_CURVE;
781 	else if (!strncmp(buf, "vo", 2))
782 		type = PP_OD_EDIT_VDDGFX_OFFSET;
783 	else
784 		return -EINVAL;
785 
786 	memcpy(buf_cpy, buf, count);
787 	buf_cpy[count] = 0;
788 
789 	tmp_str = buf_cpy;
790 
791 	if ((type == PP_OD_EDIT_VDDC_CURVE) ||
792 	     (type == PP_OD_EDIT_VDDGFX_OFFSET))
793 		tmp_str++;
794 	while (isspace(*++tmp_str));
795 
796 	while ((sub_str = strsep(&tmp_str, delimiter)) != NULL) {
797 		if (strlen(sub_str) == 0)
798 			continue;
799 		ret = kstrtol(sub_str, 0, &parameter[parameter_size]);
800 		if (ret)
801 			return -EINVAL;
802 		parameter_size++;
803 
804 		if (!tmp_str)
805 			break;
806 
807 		while (isspace(*tmp_str))
808 			tmp_str++;
809 	}
810 
811 	ret = pm_runtime_get_sync(ddev->dev);
812 	if (ret < 0) {
813 		pm_runtime_put_autosuspend(ddev->dev);
814 		return ret;
815 	}
816 
817 	if (amdgpu_dpm_set_fine_grain_clk_vol(adev,
818 					      type,
819 					      parameter,
820 					      parameter_size))
821 		goto err_out;
822 
823 	if (amdgpu_dpm_odn_edit_dpm_table(adev, type,
824 					  parameter, parameter_size))
825 		goto err_out;
826 
827 	if (type == PP_OD_COMMIT_DPM_TABLE) {
828 		if (amdgpu_dpm_dispatch_task(adev,
829 					     AMD_PP_TASK_READJUST_POWER_STATE,
830 					     NULL))
831 			goto err_out;
832 	}
833 
834 	pm_runtime_mark_last_busy(ddev->dev);
835 	pm_runtime_put_autosuspend(ddev->dev);
836 
837 	return count;
838 
839 err_out:
840 	pm_runtime_mark_last_busy(ddev->dev);
841 	pm_runtime_put_autosuspend(ddev->dev);
842 	return -EINVAL;
843 }
844 
845 static ssize_t amdgpu_get_pp_od_clk_voltage(struct device *dev,
846 		struct device_attribute *attr,
847 		char *buf)
848 {
849 	struct drm_device *ddev = dev_get_drvdata(dev);
850 	struct amdgpu_device *adev = drm_to_adev(ddev);
851 	int size = 0;
852 	int ret;
853 	enum pp_clock_type od_clocks[6] = {
854 		OD_SCLK,
855 		OD_MCLK,
856 		OD_VDDC_CURVE,
857 		OD_RANGE,
858 		OD_VDDGFX_OFFSET,
859 		OD_CCLK,
860 	};
861 	uint clk_index;
862 
863 	if (amdgpu_in_reset(adev))
864 		return -EPERM;
865 	if (adev->in_suspend && !adev->in_runpm)
866 		return -EPERM;
867 
868 	ret = pm_runtime_get_sync(ddev->dev);
869 	if (ret < 0) {
870 		pm_runtime_put_autosuspend(ddev->dev);
871 		return ret;
872 	}
873 
874 	for (clk_index = 0 ; clk_index < 6 ; clk_index++) {
875 		ret = amdgpu_dpm_emit_clock_levels(adev, od_clocks[clk_index], buf, &size);
876 		if (ret)
877 			break;
878 	}
879 	if (ret == -ENOENT) {
880 		size = amdgpu_dpm_print_clock_levels(adev, OD_SCLK, buf);
881 		size += amdgpu_dpm_print_clock_levels(adev, OD_MCLK, buf + size);
882 		size += amdgpu_dpm_print_clock_levels(adev, OD_VDDC_CURVE, buf + size);
883 		size += amdgpu_dpm_print_clock_levels(adev, OD_VDDGFX_OFFSET, buf + size);
884 		size += amdgpu_dpm_print_clock_levels(adev, OD_RANGE, buf + size);
885 		size += amdgpu_dpm_print_clock_levels(adev, OD_CCLK, buf + size);
886 	}
887 
888 	if (size == 0)
889 		size = sysfs_emit(buf, "\n");
890 
891 	pm_runtime_mark_last_busy(ddev->dev);
892 	pm_runtime_put_autosuspend(ddev->dev);
893 
894 	return size;
895 }
896 
897 /**
898  * DOC: pp_features
899  *
900  * The amdgpu driver provides a sysfs API for adjusting what powerplay
901  * features to be enabled. The file pp_features is used for this. And
902  * this is only available for Vega10 and later dGPUs.
903  *
904  * Reading back the file will show you the followings:
905  * - Current ppfeature masks
906  * - List of the all supported powerplay features with their naming,
907  *   bitmasks and enablement status('Y'/'N' means "enabled"/"disabled").
908  *
909  * To manually enable or disable a specific feature, just set or clear
910  * the corresponding bit from original ppfeature masks and input the
911  * new ppfeature masks.
912  */
913 static ssize_t amdgpu_set_pp_features(struct device *dev,
914 				      struct device_attribute *attr,
915 				      const char *buf,
916 				      size_t count)
917 {
918 	struct drm_device *ddev = dev_get_drvdata(dev);
919 	struct amdgpu_device *adev = drm_to_adev(ddev);
920 	uint64_t featuremask;
921 	int ret;
922 
923 	if (amdgpu_in_reset(adev))
924 		return -EPERM;
925 	if (adev->in_suspend && !adev->in_runpm)
926 		return -EPERM;
927 
928 	ret = kstrtou64(buf, 0, &featuremask);
929 	if (ret)
930 		return -EINVAL;
931 
932 	ret = pm_runtime_get_sync(ddev->dev);
933 	if (ret < 0) {
934 		pm_runtime_put_autosuspend(ddev->dev);
935 		return ret;
936 	}
937 
938 	ret = amdgpu_dpm_set_ppfeature_status(adev, featuremask);
939 
940 	pm_runtime_mark_last_busy(ddev->dev);
941 	pm_runtime_put_autosuspend(ddev->dev);
942 
943 	if (ret)
944 		return -EINVAL;
945 
946 	return count;
947 }
948 
949 static ssize_t amdgpu_get_pp_features(struct device *dev,
950 				      struct device_attribute *attr,
951 				      char *buf)
952 {
953 	struct drm_device *ddev = dev_get_drvdata(dev);
954 	struct amdgpu_device *adev = drm_to_adev(ddev);
955 	ssize_t size;
956 	int ret;
957 
958 	if (amdgpu_in_reset(adev))
959 		return -EPERM;
960 	if (adev->in_suspend && !adev->in_runpm)
961 		return -EPERM;
962 
963 	ret = pm_runtime_get_sync(ddev->dev);
964 	if (ret < 0) {
965 		pm_runtime_put_autosuspend(ddev->dev);
966 		return ret;
967 	}
968 
969 	size = amdgpu_dpm_get_ppfeature_status(adev, buf);
970 	if (size <= 0)
971 		size = sysfs_emit(buf, "\n");
972 
973 	pm_runtime_mark_last_busy(ddev->dev);
974 	pm_runtime_put_autosuspend(ddev->dev);
975 
976 	return size;
977 }
978 
979 /**
980  * DOC: pp_dpm_sclk pp_dpm_mclk pp_dpm_socclk pp_dpm_fclk pp_dpm_dcefclk pp_dpm_pcie
981  *
982  * The amdgpu driver provides a sysfs API for adjusting what power levels
983  * are enabled for a given power state.  The files pp_dpm_sclk, pp_dpm_mclk,
984  * pp_dpm_socclk, pp_dpm_fclk, pp_dpm_dcefclk and pp_dpm_pcie are used for
985  * this.
986  *
987  * pp_dpm_socclk and pp_dpm_dcefclk interfaces are only available for
988  * Vega10 and later ASICs.
989  * pp_dpm_fclk interface is only available for Vega20 and later ASICs.
990  *
991  * Reading back the files will show you the available power levels within
992  * the power state and the clock information for those levels. If deep sleep is
993  * applied to a clock, the level will be denoted by a special level 'S:'
994  * E.g., ::
995  *
996  *  S: 19Mhz *
997  *  0: 615Mhz
998  *  1: 800Mhz
999  *  2: 888Mhz
1000  *  3: 1000Mhz
1001  *
1002  *
1003  * To manually adjust these states, first select manual using
1004  * power_dpm_force_performance_level.
1005  * Secondly, enter a new value for each level by inputing a string that
1006  * contains " echo xx xx xx > pp_dpm_sclk/mclk/pcie"
1007  * E.g.,
1008  *
1009  * .. code-block:: bash
1010  *
1011  *	echo "4 5 6" > pp_dpm_sclk
1012  *
1013  * will enable sclk levels 4, 5, and 6.
1014  *
1015  * NOTE: change to the dcefclk max dpm level is not supported now
1016  */
1017 
1018 static ssize_t amdgpu_get_pp_dpm_clock(struct device *dev,
1019 		enum pp_clock_type type,
1020 		char *buf)
1021 {
1022 	struct drm_device *ddev = dev_get_drvdata(dev);
1023 	struct amdgpu_device *adev = drm_to_adev(ddev);
1024 	int size = 0;
1025 	int ret = 0;
1026 
1027 	if (amdgpu_in_reset(adev))
1028 		return -EPERM;
1029 	if (adev->in_suspend && !adev->in_runpm)
1030 		return -EPERM;
1031 
1032 	ret = pm_runtime_get_sync(ddev->dev);
1033 	if (ret < 0) {
1034 		pm_runtime_put_autosuspend(ddev->dev);
1035 		return ret;
1036 	}
1037 
1038 	ret = amdgpu_dpm_emit_clock_levels(adev, type, buf, &size);
1039 	if (ret == -ENOENT)
1040 		size = amdgpu_dpm_print_clock_levels(adev, type, buf);
1041 
1042 	if (size == 0)
1043 		size = sysfs_emit(buf, "\n");
1044 
1045 	pm_runtime_mark_last_busy(ddev->dev);
1046 	pm_runtime_put_autosuspend(ddev->dev);
1047 
1048 	return size;
1049 }
1050 
1051 /*
1052  * Worst case: 32 bits individually specified, in octal at 12 characters
1053  * per line (+1 for \n).
1054  */
1055 #define AMDGPU_MASK_BUF_MAX	(32 * 13)
1056 
1057 static ssize_t amdgpu_read_mask(const char *buf, size_t count, uint32_t *mask)
1058 {
1059 	int ret;
1060 	unsigned long level;
1061 	char *sub_str = NULL;
1062 	char *tmp;
1063 	char buf_cpy[AMDGPU_MASK_BUF_MAX + 1];
1064 	const char delimiter[3] = {' ', '\n', '\0'};
1065 	size_t bytes;
1066 
1067 	*mask = 0;
1068 
1069 	bytes = min(count, sizeof(buf_cpy) - 1);
1070 	memcpy(buf_cpy, buf, bytes);
1071 	buf_cpy[bytes] = '\0';
1072 	tmp = buf_cpy;
1073 	while ((sub_str = strsep(&tmp, delimiter)) != NULL) {
1074 		if (strlen(sub_str)) {
1075 			ret = kstrtoul(sub_str, 0, &level);
1076 			if (ret || level > 31)
1077 				return -EINVAL;
1078 			*mask |= 1 << level;
1079 		} else
1080 			break;
1081 	}
1082 
1083 	return 0;
1084 }
1085 
1086 static ssize_t amdgpu_set_pp_dpm_clock(struct device *dev,
1087 		enum pp_clock_type type,
1088 		const char *buf,
1089 		size_t count)
1090 {
1091 	struct drm_device *ddev = dev_get_drvdata(dev);
1092 	struct amdgpu_device *adev = drm_to_adev(ddev);
1093 	int ret;
1094 	uint32_t mask = 0;
1095 
1096 	if (amdgpu_in_reset(adev))
1097 		return -EPERM;
1098 	if (adev->in_suspend && !adev->in_runpm)
1099 		return -EPERM;
1100 
1101 	ret = amdgpu_read_mask(buf, count, &mask);
1102 	if (ret)
1103 		return ret;
1104 
1105 	ret = pm_runtime_get_sync(ddev->dev);
1106 	if (ret < 0) {
1107 		pm_runtime_put_autosuspend(ddev->dev);
1108 		return ret;
1109 	}
1110 
1111 	ret = amdgpu_dpm_force_clock_level(adev, type, mask);
1112 
1113 	pm_runtime_mark_last_busy(ddev->dev);
1114 	pm_runtime_put_autosuspend(ddev->dev);
1115 
1116 	if (ret)
1117 		return -EINVAL;
1118 
1119 	return count;
1120 }
1121 
1122 static ssize_t amdgpu_get_pp_dpm_sclk(struct device *dev,
1123 		struct device_attribute *attr,
1124 		char *buf)
1125 {
1126 	return amdgpu_get_pp_dpm_clock(dev, PP_SCLK, buf);
1127 }
1128 
1129 static ssize_t amdgpu_set_pp_dpm_sclk(struct device *dev,
1130 		struct device_attribute *attr,
1131 		const char *buf,
1132 		size_t count)
1133 {
1134 	return amdgpu_set_pp_dpm_clock(dev, PP_SCLK, buf, count);
1135 }
1136 
1137 static ssize_t amdgpu_get_pp_dpm_mclk(struct device *dev,
1138 		struct device_attribute *attr,
1139 		char *buf)
1140 {
1141 	return amdgpu_get_pp_dpm_clock(dev, PP_MCLK, buf);
1142 }
1143 
1144 static ssize_t amdgpu_set_pp_dpm_mclk(struct device *dev,
1145 		struct device_attribute *attr,
1146 		const char *buf,
1147 		size_t count)
1148 {
1149 	return amdgpu_set_pp_dpm_clock(dev, PP_MCLK, buf, count);
1150 }
1151 
1152 static ssize_t amdgpu_get_pp_dpm_socclk(struct device *dev,
1153 		struct device_attribute *attr,
1154 		char *buf)
1155 {
1156 	return amdgpu_get_pp_dpm_clock(dev, PP_SOCCLK, buf);
1157 }
1158 
1159 static ssize_t amdgpu_set_pp_dpm_socclk(struct device *dev,
1160 		struct device_attribute *attr,
1161 		const char *buf,
1162 		size_t count)
1163 {
1164 	return amdgpu_set_pp_dpm_clock(dev, PP_SOCCLK, buf, count);
1165 }
1166 
1167 static ssize_t amdgpu_get_pp_dpm_fclk(struct device *dev,
1168 		struct device_attribute *attr,
1169 		char *buf)
1170 {
1171 	return amdgpu_get_pp_dpm_clock(dev, PP_FCLK, buf);
1172 }
1173 
1174 static ssize_t amdgpu_set_pp_dpm_fclk(struct device *dev,
1175 		struct device_attribute *attr,
1176 		const char *buf,
1177 		size_t count)
1178 {
1179 	return amdgpu_set_pp_dpm_clock(dev, PP_FCLK, buf, count);
1180 }
1181 
1182 static ssize_t amdgpu_get_pp_dpm_vclk(struct device *dev,
1183 		struct device_attribute *attr,
1184 		char *buf)
1185 {
1186 	return amdgpu_get_pp_dpm_clock(dev, PP_VCLK, buf);
1187 }
1188 
1189 static ssize_t amdgpu_set_pp_dpm_vclk(struct device *dev,
1190 		struct device_attribute *attr,
1191 		const char *buf,
1192 		size_t count)
1193 {
1194 	return amdgpu_set_pp_dpm_clock(dev, PP_VCLK, buf, count);
1195 }
1196 
1197 static ssize_t amdgpu_get_pp_dpm_vclk1(struct device *dev,
1198 		struct device_attribute *attr,
1199 		char *buf)
1200 {
1201 	return amdgpu_get_pp_dpm_clock(dev, PP_VCLK1, buf);
1202 }
1203 
1204 static ssize_t amdgpu_set_pp_dpm_vclk1(struct device *dev,
1205 		struct device_attribute *attr,
1206 		const char *buf,
1207 		size_t count)
1208 {
1209 	return amdgpu_set_pp_dpm_clock(dev, PP_VCLK1, buf, count);
1210 }
1211 
1212 static ssize_t amdgpu_get_pp_dpm_dclk(struct device *dev,
1213 		struct device_attribute *attr,
1214 		char *buf)
1215 {
1216 	return amdgpu_get_pp_dpm_clock(dev, PP_DCLK, buf);
1217 }
1218 
1219 static ssize_t amdgpu_set_pp_dpm_dclk(struct device *dev,
1220 		struct device_attribute *attr,
1221 		const char *buf,
1222 		size_t count)
1223 {
1224 	return amdgpu_set_pp_dpm_clock(dev, PP_DCLK, buf, count);
1225 }
1226 
1227 static ssize_t amdgpu_get_pp_dpm_dclk1(struct device *dev,
1228 		struct device_attribute *attr,
1229 		char *buf)
1230 {
1231 	return amdgpu_get_pp_dpm_clock(dev, PP_DCLK1, buf);
1232 }
1233 
1234 static ssize_t amdgpu_set_pp_dpm_dclk1(struct device *dev,
1235 		struct device_attribute *attr,
1236 		const char *buf,
1237 		size_t count)
1238 {
1239 	return amdgpu_set_pp_dpm_clock(dev, PP_DCLK1, buf, count);
1240 }
1241 
1242 static ssize_t amdgpu_get_pp_dpm_dcefclk(struct device *dev,
1243 		struct device_attribute *attr,
1244 		char *buf)
1245 {
1246 	return amdgpu_get_pp_dpm_clock(dev, PP_DCEFCLK, buf);
1247 }
1248 
1249 static ssize_t amdgpu_set_pp_dpm_dcefclk(struct device *dev,
1250 		struct device_attribute *attr,
1251 		const char *buf,
1252 		size_t count)
1253 {
1254 	return amdgpu_set_pp_dpm_clock(dev, PP_DCEFCLK, buf, count);
1255 }
1256 
1257 static ssize_t amdgpu_get_pp_dpm_pcie(struct device *dev,
1258 		struct device_attribute *attr,
1259 		char *buf)
1260 {
1261 	return amdgpu_get_pp_dpm_clock(dev, PP_PCIE, buf);
1262 }
1263 
1264 static ssize_t amdgpu_set_pp_dpm_pcie(struct device *dev,
1265 		struct device_attribute *attr,
1266 		const char *buf,
1267 		size_t count)
1268 {
1269 	return amdgpu_set_pp_dpm_clock(dev, PP_PCIE, buf, count);
1270 }
1271 
1272 static ssize_t amdgpu_get_pp_sclk_od(struct device *dev,
1273 		struct device_attribute *attr,
1274 		char *buf)
1275 {
1276 	struct drm_device *ddev = dev_get_drvdata(dev);
1277 	struct amdgpu_device *adev = drm_to_adev(ddev);
1278 	uint32_t value = 0;
1279 	int ret;
1280 
1281 	if (amdgpu_in_reset(adev))
1282 		return -EPERM;
1283 	if (adev->in_suspend && !adev->in_runpm)
1284 		return -EPERM;
1285 
1286 	ret = pm_runtime_get_sync(ddev->dev);
1287 	if (ret < 0) {
1288 		pm_runtime_put_autosuspend(ddev->dev);
1289 		return ret;
1290 	}
1291 
1292 	value = amdgpu_dpm_get_sclk_od(adev);
1293 
1294 	pm_runtime_mark_last_busy(ddev->dev);
1295 	pm_runtime_put_autosuspend(ddev->dev);
1296 
1297 	return sysfs_emit(buf, "%d\n", value);
1298 }
1299 
1300 static ssize_t amdgpu_set_pp_sclk_od(struct device *dev,
1301 		struct device_attribute *attr,
1302 		const char *buf,
1303 		size_t count)
1304 {
1305 	struct drm_device *ddev = dev_get_drvdata(dev);
1306 	struct amdgpu_device *adev = drm_to_adev(ddev);
1307 	int ret;
1308 	long int value;
1309 
1310 	if (amdgpu_in_reset(adev))
1311 		return -EPERM;
1312 	if (adev->in_suspend && !adev->in_runpm)
1313 		return -EPERM;
1314 
1315 	ret = kstrtol(buf, 0, &value);
1316 
1317 	if (ret)
1318 		return -EINVAL;
1319 
1320 	ret = pm_runtime_get_sync(ddev->dev);
1321 	if (ret < 0) {
1322 		pm_runtime_put_autosuspend(ddev->dev);
1323 		return ret;
1324 	}
1325 
1326 	amdgpu_dpm_set_sclk_od(adev, (uint32_t)value);
1327 
1328 	pm_runtime_mark_last_busy(ddev->dev);
1329 	pm_runtime_put_autosuspend(ddev->dev);
1330 
1331 	return count;
1332 }
1333 
1334 static ssize_t amdgpu_get_pp_mclk_od(struct device *dev,
1335 		struct device_attribute *attr,
1336 		char *buf)
1337 {
1338 	struct drm_device *ddev = dev_get_drvdata(dev);
1339 	struct amdgpu_device *adev = drm_to_adev(ddev);
1340 	uint32_t value = 0;
1341 	int ret;
1342 
1343 	if (amdgpu_in_reset(adev))
1344 		return -EPERM;
1345 	if (adev->in_suspend && !adev->in_runpm)
1346 		return -EPERM;
1347 
1348 	ret = pm_runtime_get_sync(ddev->dev);
1349 	if (ret < 0) {
1350 		pm_runtime_put_autosuspend(ddev->dev);
1351 		return ret;
1352 	}
1353 
1354 	value = amdgpu_dpm_get_mclk_od(adev);
1355 
1356 	pm_runtime_mark_last_busy(ddev->dev);
1357 	pm_runtime_put_autosuspend(ddev->dev);
1358 
1359 	return sysfs_emit(buf, "%d\n", value);
1360 }
1361 
1362 static ssize_t amdgpu_set_pp_mclk_od(struct device *dev,
1363 		struct device_attribute *attr,
1364 		const char *buf,
1365 		size_t count)
1366 {
1367 	struct drm_device *ddev = dev_get_drvdata(dev);
1368 	struct amdgpu_device *adev = drm_to_adev(ddev);
1369 	int ret;
1370 	long int value;
1371 
1372 	if (amdgpu_in_reset(adev))
1373 		return -EPERM;
1374 	if (adev->in_suspend && !adev->in_runpm)
1375 		return -EPERM;
1376 
1377 	ret = kstrtol(buf, 0, &value);
1378 
1379 	if (ret)
1380 		return -EINVAL;
1381 
1382 	ret = pm_runtime_get_sync(ddev->dev);
1383 	if (ret < 0) {
1384 		pm_runtime_put_autosuspend(ddev->dev);
1385 		return ret;
1386 	}
1387 
1388 	amdgpu_dpm_set_mclk_od(adev, (uint32_t)value);
1389 
1390 	pm_runtime_mark_last_busy(ddev->dev);
1391 	pm_runtime_put_autosuspend(ddev->dev);
1392 
1393 	return count;
1394 }
1395 
1396 /**
1397  * DOC: pp_power_profile_mode
1398  *
1399  * The amdgpu driver provides a sysfs API for adjusting the heuristics
1400  * related to switching between power levels in a power state.  The file
1401  * pp_power_profile_mode is used for this.
1402  *
1403  * Reading this file outputs a list of all of the predefined power profiles
1404  * and the relevant heuristics settings for that profile.
1405  *
1406  * To select a profile or create a custom profile, first select manual using
1407  * power_dpm_force_performance_level.  Writing the number of a predefined
1408  * profile to pp_power_profile_mode will enable those heuristics.  To
1409  * create a custom set of heuristics, write a string of numbers to the file
1410  * starting with the number of the custom profile along with a setting
1411  * for each heuristic parameter.  Due to differences across asic families
1412  * the heuristic parameters vary from family to family.
1413  *
1414  */
1415 
1416 static ssize_t amdgpu_get_pp_power_profile_mode(struct device *dev,
1417 		struct device_attribute *attr,
1418 		char *buf)
1419 {
1420 	struct drm_device *ddev = dev_get_drvdata(dev);
1421 	struct amdgpu_device *adev = drm_to_adev(ddev);
1422 	ssize_t size;
1423 	int ret;
1424 
1425 	if (amdgpu_in_reset(adev))
1426 		return -EPERM;
1427 	if (adev->in_suspend && !adev->in_runpm)
1428 		return -EPERM;
1429 
1430 	ret = pm_runtime_get_sync(ddev->dev);
1431 	if (ret < 0) {
1432 		pm_runtime_put_autosuspend(ddev->dev);
1433 		return ret;
1434 	}
1435 
1436 	size = amdgpu_dpm_get_power_profile_mode(adev, buf);
1437 	if (size <= 0)
1438 		size = sysfs_emit(buf, "\n");
1439 
1440 	pm_runtime_mark_last_busy(ddev->dev);
1441 	pm_runtime_put_autosuspend(ddev->dev);
1442 
1443 	return size;
1444 }
1445 
1446 
1447 static ssize_t amdgpu_set_pp_power_profile_mode(struct device *dev,
1448 		struct device_attribute *attr,
1449 		const char *buf,
1450 		size_t count)
1451 {
1452 	int ret;
1453 	struct drm_device *ddev = dev_get_drvdata(dev);
1454 	struct amdgpu_device *adev = drm_to_adev(ddev);
1455 	uint32_t parameter_size = 0;
1456 	long parameter[64];
1457 	char *sub_str, buf_cpy[128];
1458 	char *tmp_str;
1459 	uint32_t i = 0;
1460 	char tmp[2];
1461 	long int profile_mode = 0;
1462 	const char delimiter[3] = {' ', '\n', '\0'};
1463 
1464 	if (amdgpu_in_reset(adev))
1465 		return -EPERM;
1466 	if (adev->in_suspend && !adev->in_runpm)
1467 		return -EPERM;
1468 
1469 	tmp[0] = *(buf);
1470 	tmp[1] = '\0';
1471 	ret = kstrtol(tmp, 0, &profile_mode);
1472 	if (ret)
1473 		return -EINVAL;
1474 
1475 	if (profile_mode == PP_SMC_POWER_PROFILE_CUSTOM) {
1476 		if (count < 2 || count > 127)
1477 			return -EINVAL;
1478 		while (isspace(*++buf))
1479 			i++;
1480 		memcpy(buf_cpy, buf, count-i);
1481 		tmp_str = buf_cpy;
1482 		while ((sub_str = strsep(&tmp_str, delimiter)) != NULL) {
1483 			if (strlen(sub_str) == 0)
1484 				continue;
1485 			ret = kstrtol(sub_str, 0, &parameter[parameter_size]);
1486 			if (ret)
1487 				return -EINVAL;
1488 			parameter_size++;
1489 			while (isspace(*tmp_str))
1490 				tmp_str++;
1491 		}
1492 	}
1493 	parameter[parameter_size] = profile_mode;
1494 
1495 	ret = pm_runtime_get_sync(ddev->dev);
1496 	if (ret < 0) {
1497 		pm_runtime_put_autosuspend(ddev->dev);
1498 		return ret;
1499 	}
1500 
1501 	ret = amdgpu_dpm_set_power_profile_mode(adev, parameter, parameter_size);
1502 
1503 	pm_runtime_mark_last_busy(ddev->dev);
1504 	pm_runtime_put_autosuspend(ddev->dev);
1505 
1506 	if (!ret)
1507 		return count;
1508 
1509 	return -EINVAL;
1510 }
1511 
1512 static int amdgpu_hwmon_get_sensor_generic(struct amdgpu_device *adev,
1513 					   enum amd_pp_sensors sensor,
1514 					   void *query)
1515 {
1516 	int r, size = sizeof(uint32_t);
1517 
1518 	if (amdgpu_in_reset(adev))
1519 		return -EPERM;
1520 	if (adev->in_suspend && !adev->in_runpm)
1521 		return -EPERM;
1522 
1523 	r = pm_runtime_get_sync(adev_to_drm(adev)->dev);
1524 	if (r < 0) {
1525 		pm_runtime_put_autosuspend(adev_to_drm(adev)->dev);
1526 		return r;
1527 	}
1528 
1529 	/* get the sensor value */
1530 	r = amdgpu_dpm_read_sensor(adev, sensor, query, &size);
1531 
1532 	pm_runtime_mark_last_busy(adev_to_drm(adev)->dev);
1533 	pm_runtime_put_autosuspend(adev_to_drm(adev)->dev);
1534 
1535 	return r;
1536 }
1537 
1538 /**
1539  * DOC: gpu_busy_percent
1540  *
1541  * The amdgpu driver provides a sysfs API for reading how busy the GPU
1542  * is as a percentage.  The file gpu_busy_percent is used for this.
1543  * The SMU firmware computes a percentage of load based on the
1544  * aggregate activity level in the IP cores.
1545  */
1546 static ssize_t amdgpu_get_gpu_busy_percent(struct device *dev,
1547 					   struct device_attribute *attr,
1548 					   char *buf)
1549 {
1550 	struct drm_device *ddev = dev_get_drvdata(dev);
1551 	struct amdgpu_device *adev = drm_to_adev(ddev);
1552 	unsigned int value;
1553 	int r;
1554 
1555 	r = amdgpu_hwmon_get_sensor_generic(adev, AMDGPU_PP_SENSOR_GPU_LOAD, &value);
1556 	if (r)
1557 		return r;
1558 
1559 	return sysfs_emit(buf, "%d\n", value);
1560 }
1561 
1562 /**
1563  * DOC: mem_busy_percent
1564  *
1565  * The amdgpu driver provides a sysfs API for reading how busy the VRAM
1566  * is as a percentage.  The file mem_busy_percent is used for this.
1567  * The SMU firmware computes a percentage of load based on the
1568  * aggregate activity level in the IP cores.
1569  */
1570 static ssize_t amdgpu_get_mem_busy_percent(struct device *dev,
1571 					   struct device_attribute *attr,
1572 					   char *buf)
1573 {
1574 	struct drm_device *ddev = dev_get_drvdata(dev);
1575 	struct amdgpu_device *adev = drm_to_adev(ddev);
1576 	unsigned int value;
1577 	int r;
1578 
1579 	r = amdgpu_hwmon_get_sensor_generic(adev, AMDGPU_PP_SENSOR_MEM_LOAD, &value);
1580 	if (r)
1581 		return r;
1582 
1583 	return sysfs_emit(buf, "%d\n", value);
1584 }
1585 
1586 /**
1587  * DOC: vcn_busy_percent
1588  *
1589  * The amdgpu driver provides a sysfs API for reading how busy the VCN
1590  * is as a percentage.  The file vcn_busy_percent is used for this.
1591  * The SMU firmware computes a percentage of load based on the
1592  * aggregate activity level in the IP cores.
1593  */
1594 static ssize_t amdgpu_get_vcn_busy_percent(struct device *dev,
1595 						  struct device_attribute *attr,
1596 						  char *buf)
1597 {
1598 	struct drm_device *ddev = dev_get_drvdata(dev);
1599 	struct amdgpu_device *adev = drm_to_adev(ddev);
1600 	unsigned int value;
1601 	int r;
1602 
1603 	r = amdgpu_hwmon_get_sensor_generic(adev, AMDGPU_PP_SENSOR_VCN_LOAD, &value);
1604 	if (r)
1605 		return r;
1606 
1607 	return sysfs_emit(buf, "%d\n", value);
1608 }
1609 
1610 /**
1611  * DOC: pcie_bw
1612  *
1613  * The amdgpu driver provides a sysfs API for estimating how much data
1614  * has been received and sent by the GPU in the last second through PCIe.
1615  * The file pcie_bw is used for this.
1616  * The Perf counters count the number of received and sent messages and return
1617  * those values, as well as the maximum payload size of a PCIe packet (mps).
1618  * Note that it is not possible to easily and quickly obtain the size of each
1619  * packet transmitted, so we output the max payload size (mps) to allow for
1620  * quick estimation of the PCIe bandwidth usage
1621  */
1622 static ssize_t amdgpu_get_pcie_bw(struct device *dev,
1623 		struct device_attribute *attr,
1624 		char *buf)
1625 {
1626 	struct drm_device *ddev = dev_get_drvdata(dev);
1627 	struct amdgpu_device *adev = drm_to_adev(ddev);
1628 	uint64_t count0 = 0, count1 = 0;
1629 	int ret;
1630 
1631 	if (amdgpu_in_reset(adev))
1632 		return -EPERM;
1633 	if (adev->in_suspend && !adev->in_runpm)
1634 		return -EPERM;
1635 
1636 	if (adev->flags & AMD_IS_APU)
1637 		return -ENODATA;
1638 
1639 	if (!adev->asic_funcs->get_pcie_usage)
1640 		return -ENODATA;
1641 
1642 	ret = pm_runtime_get_sync(ddev->dev);
1643 	if (ret < 0) {
1644 		pm_runtime_put_autosuspend(ddev->dev);
1645 		return ret;
1646 	}
1647 
1648 	amdgpu_asic_get_pcie_usage(adev, &count0, &count1);
1649 
1650 	pm_runtime_mark_last_busy(ddev->dev);
1651 	pm_runtime_put_autosuspend(ddev->dev);
1652 
1653 	return sysfs_emit(buf, "%llu %llu %i\n",
1654 			  count0, count1, pcie_get_mps(adev->pdev));
1655 }
1656 
1657 /**
1658  * DOC: unique_id
1659  *
1660  * The amdgpu driver provides a sysfs API for providing a unique ID for the GPU
1661  * The file unique_id is used for this.
1662  * This will provide a Unique ID that will persist from machine to machine
1663  *
1664  * NOTE: This will only work for GFX9 and newer. This file will be absent
1665  * on unsupported ASICs (GFX8 and older)
1666  */
1667 static ssize_t amdgpu_get_unique_id(struct device *dev,
1668 		struct device_attribute *attr,
1669 		char *buf)
1670 {
1671 	struct drm_device *ddev = dev_get_drvdata(dev);
1672 	struct amdgpu_device *adev = drm_to_adev(ddev);
1673 
1674 	if (amdgpu_in_reset(adev))
1675 		return -EPERM;
1676 	if (adev->in_suspend && !adev->in_runpm)
1677 		return -EPERM;
1678 
1679 	if (adev->unique_id)
1680 		return sysfs_emit(buf, "%016llx\n", adev->unique_id);
1681 
1682 	return 0;
1683 }
1684 
1685 /**
1686  * DOC: thermal_throttling_logging
1687  *
1688  * Thermal throttling pulls down the clock frequency and thus the performance.
1689  * It's an useful mechanism to protect the chip from overheating. Since it
1690  * impacts performance, the user controls whether it is enabled and if so,
1691  * the log frequency.
1692  *
1693  * Reading back the file shows you the status(enabled or disabled) and
1694  * the interval(in seconds) between each thermal logging.
1695  *
1696  * Writing an integer to the file, sets a new logging interval, in seconds.
1697  * The value should be between 1 and 3600. If the value is less than 1,
1698  * thermal logging is disabled. Values greater than 3600 are ignored.
1699  */
1700 static ssize_t amdgpu_get_thermal_throttling_logging(struct device *dev,
1701 						     struct device_attribute *attr,
1702 						     char *buf)
1703 {
1704 	struct drm_device *ddev = dev_get_drvdata(dev);
1705 	struct amdgpu_device *adev = drm_to_adev(ddev);
1706 
1707 	return sysfs_emit(buf, "%s: thermal throttling logging %s, with interval %d seconds\n",
1708 			  adev_to_drm(adev)->unique,
1709 			  atomic_read(&adev->throttling_logging_enabled) ? "enabled" : "disabled",
1710 			  adev->throttling_logging_rs.interval / HZ + 1);
1711 }
1712 
1713 static ssize_t amdgpu_set_thermal_throttling_logging(struct device *dev,
1714 						     struct device_attribute *attr,
1715 						     const char *buf,
1716 						     size_t count)
1717 {
1718 	struct drm_device *ddev = dev_get_drvdata(dev);
1719 	struct amdgpu_device *adev = drm_to_adev(ddev);
1720 	long throttling_logging_interval;
1721 	unsigned long flags;
1722 	int ret = 0;
1723 
1724 	ret = kstrtol(buf, 0, &throttling_logging_interval);
1725 	if (ret)
1726 		return ret;
1727 
1728 	if (throttling_logging_interval > 3600)
1729 		return -EINVAL;
1730 
1731 	if (throttling_logging_interval > 0) {
1732 		raw_spin_lock_irqsave(&adev->throttling_logging_rs.lock, flags);
1733 		/*
1734 		 * Reset the ratelimit timer internals.
1735 		 * This can effectively restart the timer.
1736 		 */
1737 		adev->throttling_logging_rs.interval =
1738 			(throttling_logging_interval - 1) * HZ;
1739 		adev->throttling_logging_rs.begin = 0;
1740 		adev->throttling_logging_rs.printed = 0;
1741 		adev->throttling_logging_rs.missed = 0;
1742 		raw_spin_unlock_irqrestore(&adev->throttling_logging_rs.lock, flags);
1743 
1744 		atomic_set(&adev->throttling_logging_enabled, 1);
1745 	} else {
1746 		atomic_set(&adev->throttling_logging_enabled, 0);
1747 	}
1748 
1749 	return count;
1750 }
1751 
1752 /**
1753  * DOC: apu_thermal_cap
1754  *
1755  * The amdgpu driver provides a sysfs API for retrieving/updating thermal
1756  * limit temperature in millidegrees Celsius
1757  *
1758  * Reading back the file shows you core limit value
1759  *
1760  * Writing an integer to the file, sets a new thermal limit. The value
1761  * should be between 0 and 100. If the value is less than 0 or greater
1762  * than 100, then the write request will be ignored.
1763  */
1764 static ssize_t amdgpu_get_apu_thermal_cap(struct device *dev,
1765 					 struct device_attribute *attr,
1766 					 char *buf)
1767 {
1768 	int ret, size;
1769 	u32 limit;
1770 	struct drm_device *ddev = dev_get_drvdata(dev);
1771 	struct amdgpu_device *adev = drm_to_adev(ddev);
1772 
1773 	ret = pm_runtime_get_sync(ddev->dev);
1774 	if (ret < 0) {
1775 		pm_runtime_put_autosuspend(ddev->dev);
1776 		return ret;
1777 	}
1778 
1779 	ret = amdgpu_dpm_get_apu_thermal_limit(adev, &limit);
1780 	if (!ret)
1781 		size = sysfs_emit(buf, "%u\n", limit);
1782 	else
1783 		size = sysfs_emit(buf, "failed to get thermal limit\n");
1784 
1785 	pm_runtime_mark_last_busy(ddev->dev);
1786 	pm_runtime_put_autosuspend(ddev->dev);
1787 
1788 	return size;
1789 }
1790 
1791 static ssize_t amdgpu_set_apu_thermal_cap(struct device *dev,
1792 					 struct device_attribute *attr,
1793 					 const char *buf,
1794 					 size_t count)
1795 {
1796 	int ret;
1797 	u32 value;
1798 	struct drm_device *ddev = dev_get_drvdata(dev);
1799 	struct amdgpu_device *adev = drm_to_adev(ddev);
1800 
1801 	ret = kstrtou32(buf, 10, &value);
1802 	if (ret)
1803 		return ret;
1804 
1805 	if (value > 100) {
1806 		dev_err(dev, "Invalid argument !\n");
1807 		return -EINVAL;
1808 	}
1809 
1810 	ret = pm_runtime_get_sync(ddev->dev);
1811 	if (ret < 0) {
1812 		pm_runtime_put_autosuspend(ddev->dev);
1813 		return ret;
1814 	}
1815 
1816 	ret = amdgpu_dpm_set_apu_thermal_limit(adev, value);
1817 	if (ret) {
1818 		dev_err(dev, "failed to update thermal limit\n");
1819 		return ret;
1820 	}
1821 
1822 	pm_runtime_mark_last_busy(ddev->dev);
1823 	pm_runtime_put_autosuspend(ddev->dev);
1824 
1825 	return count;
1826 }
1827 
1828 static int amdgpu_pm_metrics_attr_update(struct amdgpu_device *adev,
1829 					 struct amdgpu_device_attr *attr,
1830 					 uint32_t mask,
1831 					 enum amdgpu_device_attr_states *states)
1832 {
1833 	if (amdgpu_dpm_get_pm_metrics(adev, NULL, 0) == -EOPNOTSUPP)
1834 		*states = ATTR_STATE_UNSUPPORTED;
1835 
1836 	return 0;
1837 }
1838 
1839 static ssize_t amdgpu_get_pm_metrics(struct device *dev,
1840 				     struct device_attribute *attr, char *buf)
1841 {
1842 	struct drm_device *ddev = dev_get_drvdata(dev);
1843 	struct amdgpu_device *adev = drm_to_adev(ddev);
1844 	ssize_t size = 0;
1845 	int ret;
1846 
1847 	if (amdgpu_in_reset(adev))
1848 		return -EPERM;
1849 	if (adev->in_suspend && !adev->in_runpm)
1850 		return -EPERM;
1851 
1852 	ret = pm_runtime_get_sync(ddev->dev);
1853 	if (ret < 0) {
1854 		pm_runtime_put_autosuspend(ddev->dev);
1855 		return ret;
1856 	}
1857 
1858 	size = amdgpu_dpm_get_pm_metrics(adev, buf, PAGE_SIZE);
1859 
1860 	pm_runtime_mark_last_busy(ddev->dev);
1861 	pm_runtime_put_autosuspend(ddev->dev);
1862 
1863 	return size;
1864 }
1865 
1866 /**
1867  * DOC: gpu_metrics
1868  *
1869  * The amdgpu driver provides a sysfs API for retrieving current gpu
1870  * metrics data. The file gpu_metrics is used for this. Reading the
1871  * file will dump all the current gpu metrics data.
1872  *
1873  * These data include temperature, frequency, engines utilization,
1874  * power consume, throttler status, fan speed and cpu core statistics(
1875  * available for APU only). That's it will give a snapshot of all sensors
1876  * at the same time.
1877  */
1878 static ssize_t amdgpu_get_gpu_metrics(struct device *dev,
1879 				      struct device_attribute *attr,
1880 				      char *buf)
1881 {
1882 	struct drm_device *ddev = dev_get_drvdata(dev);
1883 	struct amdgpu_device *adev = drm_to_adev(ddev);
1884 	void *gpu_metrics;
1885 	ssize_t size = 0;
1886 	int ret;
1887 
1888 	if (amdgpu_in_reset(adev))
1889 		return -EPERM;
1890 	if (adev->in_suspend && !adev->in_runpm)
1891 		return -EPERM;
1892 
1893 	ret = pm_runtime_get_sync(ddev->dev);
1894 	if (ret < 0) {
1895 		pm_runtime_put_autosuspend(ddev->dev);
1896 		return ret;
1897 	}
1898 
1899 	size = amdgpu_dpm_get_gpu_metrics(adev, &gpu_metrics);
1900 	if (size <= 0)
1901 		goto out;
1902 
1903 	if (size >= PAGE_SIZE)
1904 		size = PAGE_SIZE - 1;
1905 
1906 	memcpy(buf, gpu_metrics, size);
1907 
1908 out:
1909 	pm_runtime_mark_last_busy(ddev->dev);
1910 	pm_runtime_put_autosuspend(ddev->dev);
1911 
1912 	return size;
1913 }
1914 
1915 static int amdgpu_show_powershift_percent(struct device *dev,
1916 					char *buf, enum amd_pp_sensors sensor)
1917 {
1918 	struct drm_device *ddev = dev_get_drvdata(dev);
1919 	struct amdgpu_device *adev = drm_to_adev(ddev);
1920 	uint32_t ss_power;
1921 	int r = 0, i;
1922 
1923 	r = amdgpu_hwmon_get_sensor_generic(adev, sensor, (void *)&ss_power);
1924 	if (r == -EOPNOTSUPP) {
1925 		/* sensor not available on dGPU, try to read from APU */
1926 		adev = NULL;
1927 		mutex_lock(&mgpu_info.mutex);
1928 		for (i = 0; i < mgpu_info.num_gpu; i++) {
1929 			if (mgpu_info.gpu_ins[i].adev->flags & AMD_IS_APU) {
1930 				adev = mgpu_info.gpu_ins[i].adev;
1931 				break;
1932 			}
1933 		}
1934 		mutex_unlock(&mgpu_info.mutex);
1935 		if (adev)
1936 			r = amdgpu_hwmon_get_sensor_generic(adev, sensor, (void *)&ss_power);
1937 	}
1938 
1939 	if (r)
1940 		return r;
1941 
1942 	return sysfs_emit(buf, "%u%%\n", ss_power);
1943 }
1944 
1945 /**
1946  * DOC: smartshift_apu_power
1947  *
1948  * The amdgpu driver provides a sysfs API for reporting APU power
1949  * shift in percentage if platform supports smartshift. Value 0 means that
1950  * there is no powershift and values between [1-100] means that the power
1951  * is shifted to APU, the percentage of boost is with respect to APU power
1952  * limit on the platform.
1953  */
1954 
1955 static ssize_t amdgpu_get_smartshift_apu_power(struct device *dev, struct device_attribute *attr,
1956 					       char *buf)
1957 {
1958 	return amdgpu_show_powershift_percent(dev, buf, AMDGPU_PP_SENSOR_SS_APU_SHARE);
1959 }
1960 
1961 /**
1962  * DOC: smartshift_dgpu_power
1963  *
1964  * The amdgpu driver provides a sysfs API for reporting dGPU power
1965  * shift in percentage if platform supports smartshift. Value 0 means that
1966  * there is no powershift and values between [1-100] means that the power is
1967  * shifted to dGPU, the percentage of boost is with respect to dGPU power
1968  * limit on the platform.
1969  */
1970 
1971 static ssize_t amdgpu_get_smartshift_dgpu_power(struct device *dev, struct device_attribute *attr,
1972 						char *buf)
1973 {
1974 	return amdgpu_show_powershift_percent(dev, buf, AMDGPU_PP_SENSOR_SS_DGPU_SHARE);
1975 }
1976 
1977 /**
1978  * DOC: smartshift_bias
1979  *
1980  * The amdgpu driver provides a sysfs API for reporting the
1981  * smartshift(SS2.0) bias level. The value ranges from -100 to 100
1982  * and the default is 0. -100 sets maximum preference to APU
1983  * and 100 sets max perference to dGPU.
1984  */
1985 
1986 static ssize_t amdgpu_get_smartshift_bias(struct device *dev,
1987 					  struct device_attribute *attr,
1988 					  char *buf)
1989 {
1990 	int r = 0;
1991 
1992 	r = sysfs_emit(buf, "%d\n", amdgpu_smartshift_bias);
1993 
1994 	return r;
1995 }
1996 
1997 static ssize_t amdgpu_set_smartshift_bias(struct device *dev,
1998 					  struct device_attribute *attr,
1999 					  const char *buf, size_t count)
2000 {
2001 	struct drm_device *ddev = dev_get_drvdata(dev);
2002 	struct amdgpu_device *adev = drm_to_adev(ddev);
2003 	int r = 0;
2004 	int bias = 0;
2005 
2006 	if (amdgpu_in_reset(adev))
2007 		return -EPERM;
2008 	if (adev->in_suspend && !adev->in_runpm)
2009 		return -EPERM;
2010 
2011 	r = pm_runtime_get_sync(ddev->dev);
2012 	if (r < 0) {
2013 		pm_runtime_put_autosuspend(ddev->dev);
2014 		return r;
2015 	}
2016 
2017 	r = kstrtoint(buf, 10, &bias);
2018 	if (r)
2019 		goto out;
2020 
2021 	if (bias > AMDGPU_SMARTSHIFT_MAX_BIAS)
2022 		bias = AMDGPU_SMARTSHIFT_MAX_BIAS;
2023 	else if (bias < AMDGPU_SMARTSHIFT_MIN_BIAS)
2024 		bias = AMDGPU_SMARTSHIFT_MIN_BIAS;
2025 
2026 	amdgpu_smartshift_bias = bias;
2027 	r = count;
2028 
2029 	/* TODO: update bias level with SMU message */
2030 
2031 out:
2032 	pm_runtime_mark_last_busy(ddev->dev);
2033 	pm_runtime_put_autosuspend(ddev->dev);
2034 	return r;
2035 }
2036 
2037 static int ss_power_attr_update(struct amdgpu_device *adev, struct amdgpu_device_attr *attr,
2038 				uint32_t mask, enum amdgpu_device_attr_states *states)
2039 {
2040 	if (!amdgpu_device_supports_smart_shift(adev_to_drm(adev)))
2041 		*states = ATTR_STATE_UNSUPPORTED;
2042 
2043 	return 0;
2044 }
2045 
2046 static int ss_bias_attr_update(struct amdgpu_device *adev, struct amdgpu_device_attr *attr,
2047 			       uint32_t mask, enum amdgpu_device_attr_states *states)
2048 {
2049 	uint32_t ss_power;
2050 
2051 	if (!amdgpu_device_supports_smart_shift(adev_to_drm(adev)))
2052 		*states = ATTR_STATE_UNSUPPORTED;
2053 	else if (amdgpu_hwmon_get_sensor_generic(adev, AMDGPU_PP_SENSOR_SS_APU_SHARE,
2054 		 (void *)&ss_power))
2055 		*states = ATTR_STATE_UNSUPPORTED;
2056 	else if (amdgpu_hwmon_get_sensor_generic(adev, AMDGPU_PP_SENSOR_SS_DGPU_SHARE,
2057 		 (void *)&ss_power))
2058 		*states = ATTR_STATE_UNSUPPORTED;
2059 
2060 	return 0;
2061 }
2062 
2063 static int pp_od_clk_voltage_attr_update(struct amdgpu_device *adev, struct amdgpu_device_attr *attr,
2064 					 uint32_t mask, enum amdgpu_device_attr_states *states)
2065 {
2066 	uint32_t gc_ver = amdgpu_ip_version(adev, GC_HWIP, 0);
2067 
2068 	*states = ATTR_STATE_SUPPORTED;
2069 
2070 	if (!amdgpu_dpm_is_overdrive_supported(adev)) {
2071 		*states = ATTR_STATE_UNSUPPORTED;
2072 		return 0;
2073 	}
2074 
2075 	/* Enable pp_od_clk_voltage node for gc 9.4.3 SRIOV/BM support */
2076 	if (gc_ver == IP_VERSION(9, 4, 3) ||
2077 	    gc_ver == IP_VERSION(9, 4, 4)) {
2078 		if (amdgpu_sriov_vf(adev) && !amdgpu_sriov_is_pp_one_vf(adev))
2079 			*states = ATTR_STATE_UNSUPPORTED;
2080 		return 0;
2081 	}
2082 
2083 	if (!(attr->flags & mask))
2084 		*states = ATTR_STATE_UNSUPPORTED;
2085 
2086 	return 0;
2087 }
2088 
2089 static int pp_dpm_dcefclk_attr_update(struct amdgpu_device *adev, struct amdgpu_device_attr *attr,
2090 				      uint32_t mask, enum amdgpu_device_attr_states *states)
2091 {
2092 	struct device_attribute *dev_attr = &attr->dev_attr;
2093 	uint32_t gc_ver;
2094 
2095 	*states = ATTR_STATE_SUPPORTED;
2096 
2097 	if (!(attr->flags & mask)) {
2098 		*states = ATTR_STATE_UNSUPPORTED;
2099 		return 0;
2100 	}
2101 
2102 	gc_ver = amdgpu_ip_version(adev, GC_HWIP, 0);
2103 	/* dcefclk node is not available on gfx 11.0.3 sriov */
2104 	if ((gc_ver == IP_VERSION(11, 0, 3) && amdgpu_sriov_is_pp_one_vf(adev)) ||
2105 	    gc_ver < IP_VERSION(9, 0, 0) ||
2106 	    !amdgpu_device_has_display_hardware(adev))
2107 		*states = ATTR_STATE_UNSUPPORTED;
2108 
2109 	/* SMU MP1 does not support dcefclk level setting,
2110 	 * setting should not be allowed from VF if not in one VF mode.
2111 	 */
2112 	if (gc_ver >= IP_VERSION(10, 0, 0) ||
2113 	    (amdgpu_sriov_vf(adev) && !amdgpu_sriov_is_pp_one_vf(adev))) {
2114 		dev_attr->attr.mode &= ~S_IWUGO;
2115 		dev_attr->store = NULL;
2116 	}
2117 
2118 	return 0;
2119 }
2120 
2121 static int pp_dpm_clk_default_attr_update(struct amdgpu_device *adev, struct amdgpu_device_attr *attr,
2122 					  uint32_t mask, enum amdgpu_device_attr_states *states)
2123 {
2124 	struct device_attribute *dev_attr = &attr->dev_attr;
2125 	enum amdgpu_device_attr_id attr_id = attr->attr_id;
2126 	uint32_t mp1_ver = amdgpu_ip_version(adev, MP1_HWIP, 0);
2127 	uint32_t gc_ver = amdgpu_ip_version(adev, GC_HWIP, 0);
2128 
2129 	*states = ATTR_STATE_SUPPORTED;
2130 
2131 	if (!(attr->flags & mask)) {
2132 		*states = ATTR_STATE_UNSUPPORTED;
2133 		return 0;
2134 	}
2135 
2136 	if (DEVICE_ATTR_IS(pp_dpm_socclk)) {
2137 		if (gc_ver < IP_VERSION(9, 0, 0))
2138 			*states = ATTR_STATE_UNSUPPORTED;
2139 	} else if (DEVICE_ATTR_IS(pp_dpm_fclk)) {
2140 		if (mp1_ver < IP_VERSION(10, 0, 0))
2141 			*states = ATTR_STATE_UNSUPPORTED;
2142 	} else if (DEVICE_ATTR_IS(pp_dpm_vclk)) {
2143 		if (!(gc_ver == IP_VERSION(10, 3, 1) ||
2144 		      gc_ver == IP_VERSION(10, 3, 3) ||
2145 		      gc_ver == IP_VERSION(10, 3, 6) ||
2146 		      gc_ver == IP_VERSION(10, 3, 7) ||
2147 		      gc_ver == IP_VERSION(10, 3, 0) ||
2148 		      gc_ver == IP_VERSION(10, 1, 2) ||
2149 		      gc_ver == IP_VERSION(11, 0, 0) ||
2150 		      gc_ver == IP_VERSION(11, 0, 1) ||
2151 		      gc_ver == IP_VERSION(11, 0, 4) ||
2152 		      gc_ver == IP_VERSION(11, 5, 0) ||
2153 		      gc_ver == IP_VERSION(11, 0, 2) ||
2154 		      gc_ver == IP_VERSION(11, 0, 3) ||
2155 		      gc_ver == IP_VERSION(9, 4, 3) ||
2156 		      gc_ver == IP_VERSION(9, 4, 4)))
2157 			*states = ATTR_STATE_UNSUPPORTED;
2158 	} else if (DEVICE_ATTR_IS(pp_dpm_vclk1)) {
2159 		if (!((gc_ver == IP_VERSION(10, 3, 1) ||
2160 		       gc_ver == IP_VERSION(10, 3, 0) ||
2161 		       gc_ver == IP_VERSION(11, 0, 2) ||
2162 		       gc_ver == IP_VERSION(11, 0, 3)) && adev->vcn.num_vcn_inst >= 2))
2163 			*states = ATTR_STATE_UNSUPPORTED;
2164 	} else if (DEVICE_ATTR_IS(pp_dpm_dclk)) {
2165 		if (!(gc_ver == IP_VERSION(10, 3, 1) ||
2166 		      gc_ver == IP_VERSION(10, 3, 3) ||
2167 		      gc_ver == IP_VERSION(10, 3, 6) ||
2168 		      gc_ver == IP_VERSION(10, 3, 7) ||
2169 		      gc_ver == IP_VERSION(10, 3, 0) ||
2170 		      gc_ver == IP_VERSION(10, 1, 2) ||
2171 		      gc_ver == IP_VERSION(11, 0, 0) ||
2172 		      gc_ver == IP_VERSION(11, 0, 1) ||
2173 		      gc_ver == IP_VERSION(11, 0, 4) ||
2174 		      gc_ver == IP_VERSION(11, 5, 0) ||
2175 		      gc_ver == IP_VERSION(11, 0, 2) ||
2176 		      gc_ver == IP_VERSION(11, 0, 3) ||
2177 		      gc_ver == IP_VERSION(9, 4, 3) ||
2178 		      gc_ver == IP_VERSION(9, 4, 4)))
2179 			*states = ATTR_STATE_UNSUPPORTED;
2180 	} else if (DEVICE_ATTR_IS(pp_dpm_dclk1)) {
2181 		if (!((gc_ver == IP_VERSION(10, 3, 1) ||
2182 		       gc_ver == IP_VERSION(10, 3, 0) ||
2183 		       gc_ver == IP_VERSION(11, 0, 2) ||
2184 		       gc_ver == IP_VERSION(11, 0, 3)) && adev->vcn.num_vcn_inst >= 2))
2185 			*states = ATTR_STATE_UNSUPPORTED;
2186 	} else if (DEVICE_ATTR_IS(pp_dpm_pcie)) {
2187 		if (gc_ver == IP_VERSION(9, 4, 2) ||
2188 		    gc_ver == IP_VERSION(9, 4, 3) ||
2189 		    gc_ver == IP_VERSION(9, 4, 4))
2190 			*states = ATTR_STATE_UNSUPPORTED;
2191 	}
2192 
2193 	switch (gc_ver) {
2194 	case IP_VERSION(9, 4, 1):
2195 	case IP_VERSION(9, 4, 2):
2196 		/* the Mi series card does not support standalone mclk/socclk/fclk level setting */
2197 		if (DEVICE_ATTR_IS(pp_dpm_mclk) ||
2198 		    DEVICE_ATTR_IS(pp_dpm_socclk) ||
2199 		    DEVICE_ATTR_IS(pp_dpm_fclk)) {
2200 			dev_attr->attr.mode &= ~S_IWUGO;
2201 			dev_attr->store = NULL;
2202 		}
2203 		break;
2204 	default:
2205 		break;
2206 	}
2207 
2208 	/* setting should not be allowed from VF if not in one VF mode */
2209 	if (amdgpu_sriov_vf(adev) && amdgpu_sriov_is_pp_one_vf(adev)) {
2210 		dev_attr->attr.mode &= ~S_IWUGO;
2211 		dev_attr->store = NULL;
2212 	}
2213 
2214 	return 0;
2215 }
2216 
2217 /* pm policy attributes */
2218 struct amdgpu_pm_policy_attr {
2219 	struct device_attribute dev_attr;
2220 	enum pp_pm_policy id;
2221 };
2222 
2223 /**
2224  * DOC: pm_policy
2225  *
2226  * Certain SOCs can support different power policies to optimize application
2227  * performance. However, this policy is provided only at SOC level and not at a
2228  * per-process level. This is useful especially when entire SOC is utilized for
2229  * dedicated workload.
2230  *
2231  * The amdgpu driver provides a sysfs API for selecting the policy. Presently,
2232  * only two types of policies are supported through this interface.
2233  *
2234  *  Pstate Policy Selection - This is to select different Pstate profiles which
2235  *  decides clock/throttling preferences.
2236  *
2237  *  XGMI PLPD Policy Selection - When multiple devices are connected over XGMI,
2238  *  this helps to select policy to be applied for per link power down.
2239  *
2240  * The list of available policies and policy levels vary between SOCs. They can
2241  * be viewed under pm_policy node directory. If SOC doesn't support any policy,
2242  * this node won't be available. The different policies supported will be
2243  * available as separate nodes under pm_policy.
2244  *
2245  *	cat /sys/bus/pci/devices/.../pm_policy/<policy_type>
2246  *
2247  * Reading the policy file shows the different levels supported. The level which
2248  * is applied presently is denoted by * (asterisk). E.g.,
2249  *
2250  * .. code-block:: console
2251  *
2252  *	cat /sys/bus/pci/devices/.../pm_policy/soc_pstate
2253  *	0 : soc_pstate_default
2254  *	1 : soc_pstate_0
2255  *	2 : soc_pstate_1*
2256  *	3 : soc_pstate_2
2257  *
2258  *	cat /sys/bus/pci/devices/.../pm_policy/xgmi_plpd
2259  *	0 : plpd_disallow
2260  *	1 : plpd_default
2261  *	2 : plpd_optimized*
2262  *
2263  * To apply a specific policy
2264  *
2265  * "echo  <level> > /sys/bus/pci/devices/.../pm_policy/<policy_type>"
2266  *
2267  * For the levels listed in the example above, to select "plpd_optimized" for
2268  * XGMI and "soc_pstate_2" for soc pstate policy -
2269  *
2270  * .. code-block:: console
2271  *
2272  *	echo "2" > /sys/bus/pci/devices/.../pm_policy/xgmi_plpd
2273  *	echo "3" > /sys/bus/pci/devices/.../pm_policy/soc_pstate
2274  *
2275  */
2276 static ssize_t amdgpu_get_pm_policy_attr(struct device *dev,
2277 					 struct device_attribute *attr,
2278 					 char *buf)
2279 {
2280 	struct drm_device *ddev = dev_get_drvdata(dev);
2281 	struct amdgpu_device *adev = drm_to_adev(ddev);
2282 	struct amdgpu_pm_policy_attr *policy_attr;
2283 
2284 	policy_attr =
2285 		container_of(attr, struct amdgpu_pm_policy_attr, dev_attr);
2286 
2287 	if (amdgpu_in_reset(adev))
2288 		return -EPERM;
2289 	if (adev->in_suspend && !adev->in_runpm)
2290 		return -EPERM;
2291 
2292 	return amdgpu_dpm_get_pm_policy_info(adev, policy_attr->id, buf);
2293 }
2294 
2295 static ssize_t amdgpu_set_pm_policy_attr(struct device *dev,
2296 					 struct device_attribute *attr,
2297 					 const char *buf, size_t count)
2298 {
2299 	struct drm_device *ddev = dev_get_drvdata(dev);
2300 	struct amdgpu_device *adev = drm_to_adev(ddev);
2301 	struct amdgpu_pm_policy_attr *policy_attr;
2302 	int ret, num_params = 0;
2303 	char delimiter[] = " \n\t";
2304 	char tmp_buf[128];
2305 	char *tmp, *param;
2306 	long val;
2307 
2308 	if (amdgpu_in_reset(adev))
2309 		return -EPERM;
2310 	if (adev->in_suspend && !adev->in_runpm)
2311 		return -EPERM;
2312 
2313 	count = min(count, sizeof(tmp_buf));
2314 	memcpy(tmp_buf, buf, count);
2315 	tmp_buf[count - 1] = '\0';
2316 	tmp = tmp_buf;
2317 
2318 	tmp = skip_spaces(tmp);
2319 	while ((param = strsep(&tmp, delimiter))) {
2320 		if (!strlen(param)) {
2321 			tmp = skip_spaces(tmp);
2322 			continue;
2323 		}
2324 		ret = kstrtol(param, 0, &val);
2325 		if (ret)
2326 			return -EINVAL;
2327 		num_params++;
2328 		if (num_params > 1)
2329 			return -EINVAL;
2330 	}
2331 
2332 	if (num_params != 1)
2333 		return -EINVAL;
2334 
2335 	policy_attr =
2336 		container_of(attr, struct amdgpu_pm_policy_attr, dev_attr);
2337 
2338 	ret = pm_runtime_get_sync(ddev->dev);
2339 	if (ret < 0) {
2340 		pm_runtime_put_autosuspend(ddev->dev);
2341 		return ret;
2342 	}
2343 
2344 	ret = amdgpu_dpm_set_pm_policy(adev, policy_attr->id, val);
2345 
2346 	pm_runtime_mark_last_busy(ddev->dev);
2347 	pm_runtime_put_autosuspend(ddev->dev);
2348 
2349 	if (ret)
2350 		return ret;
2351 
2352 	return count;
2353 }
2354 
2355 #define AMDGPU_PM_POLICY_ATTR(_name, _id)                                  \
2356 	static struct amdgpu_pm_policy_attr pm_policy_attr_##_name = {     \
2357 		.dev_attr = __ATTR(_name, 0644, amdgpu_get_pm_policy_attr, \
2358 				   amdgpu_set_pm_policy_attr),             \
2359 		.id = PP_PM_POLICY_##_id,                                  \
2360 	};
2361 
2362 #define AMDGPU_PM_POLICY_ATTR_VAR(_name) pm_policy_attr_##_name.dev_attr.attr
2363 
2364 AMDGPU_PM_POLICY_ATTR(soc_pstate, SOC_PSTATE)
2365 AMDGPU_PM_POLICY_ATTR(xgmi_plpd, XGMI_PLPD)
2366 
2367 static struct attribute *pm_policy_attrs[] = {
2368 	&AMDGPU_PM_POLICY_ATTR_VAR(soc_pstate),
2369 	&AMDGPU_PM_POLICY_ATTR_VAR(xgmi_plpd),
2370 	NULL
2371 };
2372 
2373 static umode_t amdgpu_pm_policy_attr_visible(struct kobject *kobj,
2374 					     struct attribute *attr, int n)
2375 {
2376 	struct device *dev = kobj_to_dev(kobj);
2377 	struct drm_device *ddev = dev_get_drvdata(dev);
2378 	struct amdgpu_device *adev = drm_to_adev(ddev);
2379 	struct amdgpu_pm_policy_attr *policy_attr;
2380 
2381 	policy_attr =
2382 		container_of(attr, struct amdgpu_pm_policy_attr, dev_attr.attr);
2383 
2384 	if (amdgpu_dpm_get_pm_policy_info(adev, policy_attr->id, NULL) ==
2385 	    -ENOENT)
2386 		return 0;
2387 
2388 	return attr->mode;
2389 }
2390 
2391 const struct attribute_group amdgpu_pm_policy_attr_group = {
2392 	.name = "pm_policy",
2393 	.attrs = pm_policy_attrs,
2394 	.is_visible = amdgpu_pm_policy_attr_visible,
2395 };
2396 
2397 static struct amdgpu_device_attr amdgpu_device_attrs[] = {
2398 	AMDGPU_DEVICE_ATTR_RW(power_dpm_state,				ATTR_FLAG_BASIC|ATTR_FLAG_ONEVF),
2399 	AMDGPU_DEVICE_ATTR_RW(power_dpm_force_performance_level,	ATTR_FLAG_BASIC|ATTR_FLAG_ONEVF),
2400 	AMDGPU_DEVICE_ATTR_RO(pp_num_states,				ATTR_FLAG_BASIC|ATTR_FLAG_ONEVF),
2401 	AMDGPU_DEVICE_ATTR_RO(pp_cur_state,				ATTR_FLAG_BASIC|ATTR_FLAG_ONEVF),
2402 	AMDGPU_DEVICE_ATTR_RW(pp_force_state,				ATTR_FLAG_BASIC|ATTR_FLAG_ONEVF),
2403 	AMDGPU_DEVICE_ATTR_RW(pp_table,					ATTR_FLAG_BASIC|ATTR_FLAG_ONEVF),
2404 	AMDGPU_DEVICE_ATTR_RW(pp_dpm_sclk,				ATTR_FLAG_BASIC|ATTR_FLAG_ONEVF,
2405 			      .attr_update = pp_dpm_clk_default_attr_update),
2406 	AMDGPU_DEVICE_ATTR_RW(pp_dpm_mclk,				ATTR_FLAG_BASIC|ATTR_FLAG_ONEVF,
2407 			      .attr_update = pp_dpm_clk_default_attr_update),
2408 	AMDGPU_DEVICE_ATTR_RW(pp_dpm_socclk,				ATTR_FLAG_BASIC|ATTR_FLAG_ONEVF,
2409 			      .attr_update = pp_dpm_clk_default_attr_update),
2410 	AMDGPU_DEVICE_ATTR_RW(pp_dpm_fclk,				ATTR_FLAG_BASIC|ATTR_FLAG_ONEVF,
2411 			      .attr_update = pp_dpm_clk_default_attr_update),
2412 	AMDGPU_DEVICE_ATTR_RW(pp_dpm_vclk,				ATTR_FLAG_BASIC|ATTR_FLAG_ONEVF,
2413 			      .attr_update = pp_dpm_clk_default_attr_update),
2414 	AMDGPU_DEVICE_ATTR_RW(pp_dpm_vclk1,				ATTR_FLAG_BASIC|ATTR_FLAG_ONEVF,
2415 			      .attr_update = pp_dpm_clk_default_attr_update),
2416 	AMDGPU_DEVICE_ATTR_RW(pp_dpm_dclk,				ATTR_FLAG_BASIC|ATTR_FLAG_ONEVF,
2417 			      .attr_update = pp_dpm_clk_default_attr_update),
2418 	AMDGPU_DEVICE_ATTR_RW(pp_dpm_dclk1,				ATTR_FLAG_BASIC|ATTR_FLAG_ONEVF,
2419 			      .attr_update = pp_dpm_clk_default_attr_update),
2420 	AMDGPU_DEVICE_ATTR_RW(pp_dpm_dcefclk,				ATTR_FLAG_BASIC|ATTR_FLAG_ONEVF,
2421 			      .attr_update = pp_dpm_dcefclk_attr_update),
2422 	AMDGPU_DEVICE_ATTR_RW(pp_dpm_pcie,				ATTR_FLAG_BASIC|ATTR_FLAG_ONEVF,
2423 			      .attr_update = pp_dpm_clk_default_attr_update),
2424 	AMDGPU_DEVICE_ATTR_RW(pp_sclk_od,				ATTR_FLAG_BASIC),
2425 	AMDGPU_DEVICE_ATTR_RW(pp_mclk_od,				ATTR_FLAG_BASIC),
2426 	AMDGPU_DEVICE_ATTR_RW(pp_power_profile_mode,			ATTR_FLAG_BASIC|ATTR_FLAG_ONEVF),
2427 	AMDGPU_DEVICE_ATTR_RW(pp_od_clk_voltage,			ATTR_FLAG_BASIC,
2428 			      .attr_update = pp_od_clk_voltage_attr_update),
2429 	AMDGPU_DEVICE_ATTR_RO(gpu_busy_percent,				ATTR_FLAG_BASIC|ATTR_FLAG_ONEVF),
2430 	AMDGPU_DEVICE_ATTR_RO(mem_busy_percent,				ATTR_FLAG_BASIC|ATTR_FLAG_ONEVF),
2431 	AMDGPU_DEVICE_ATTR_RO(vcn_busy_percent,				ATTR_FLAG_BASIC|ATTR_FLAG_ONEVF),
2432 	AMDGPU_DEVICE_ATTR_RO(pcie_bw,					ATTR_FLAG_BASIC),
2433 	AMDGPU_DEVICE_ATTR_RW(pp_features,				ATTR_FLAG_BASIC|ATTR_FLAG_ONEVF),
2434 	AMDGPU_DEVICE_ATTR_RO(unique_id,				ATTR_FLAG_BASIC|ATTR_FLAG_ONEVF),
2435 	AMDGPU_DEVICE_ATTR_RW(thermal_throttling_logging,		ATTR_FLAG_BASIC|ATTR_FLAG_ONEVF),
2436 	AMDGPU_DEVICE_ATTR_RW(apu_thermal_cap,				ATTR_FLAG_BASIC|ATTR_FLAG_ONEVF),
2437 	AMDGPU_DEVICE_ATTR_RO(gpu_metrics,				ATTR_FLAG_BASIC|ATTR_FLAG_ONEVF),
2438 	AMDGPU_DEVICE_ATTR_RO(smartshift_apu_power,			ATTR_FLAG_BASIC,
2439 			      .attr_update = ss_power_attr_update),
2440 	AMDGPU_DEVICE_ATTR_RO(smartshift_dgpu_power,			ATTR_FLAG_BASIC,
2441 			      .attr_update = ss_power_attr_update),
2442 	AMDGPU_DEVICE_ATTR_RW(smartshift_bias,				ATTR_FLAG_BASIC,
2443 			      .attr_update = ss_bias_attr_update),
2444 	AMDGPU_DEVICE_ATTR_RO(pm_metrics,				ATTR_FLAG_BASIC,
2445 			      .attr_update = amdgpu_pm_metrics_attr_update),
2446 };
2447 
2448 static int default_attr_update(struct amdgpu_device *adev, struct amdgpu_device_attr *attr,
2449 			       uint32_t mask, enum amdgpu_device_attr_states *states)
2450 {
2451 	struct device_attribute *dev_attr = &attr->dev_attr;
2452 	enum amdgpu_device_attr_id attr_id = attr->attr_id;
2453 	uint32_t gc_ver = amdgpu_ip_version(adev, GC_HWIP, 0);
2454 
2455 	if (!(attr->flags & mask)) {
2456 		*states = ATTR_STATE_UNSUPPORTED;
2457 		return 0;
2458 	}
2459 
2460 	if (DEVICE_ATTR_IS(mem_busy_percent)) {
2461 		if ((adev->flags & AMD_IS_APU &&
2462 		     gc_ver != IP_VERSION(9, 4, 3)) ||
2463 		    gc_ver == IP_VERSION(9, 0, 1))
2464 			*states = ATTR_STATE_UNSUPPORTED;
2465 	} else if (DEVICE_ATTR_IS(vcn_busy_percent)) {
2466 		if (!(gc_ver == IP_VERSION(10, 3, 1) ||
2467 			  gc_ver == IP_VERSION(10, 3, 3) ||
2468 			  gc_ver == IP_VERSION(10, 3, 6) ||
2469 			  gc_ver == IP_VERSION(10, 3, 7) ||
2470 			  gc_ver == IP_VERSION(11, 0, 1) ||
2471 			  gc_ver == IP_VERSION(11, 0, 4) ||
2472 			  gc_ver == IP_VERSION(11, 5, 0)))
2473 			*states = ATTR_STATE_UNSUPPORTED;
2474 	} else if (DEVICE_ATTR_IS(pcie_bw)) {
2475 		/* PCIe Perf counters won't work on APU nodes */
2476 		if (adev->flags & AMD_IS_APU ||
2477 		    !adev->asic_funcs->get_pcie_usage)
2478 			*states = ATTR_STATE_UNSUPPORTED;
2479 	} else if (DEVICE_ATTR_IS(unique_id)) {
2480 		switch (gc_ver) {
2481 		case IP_VERSION(9, 0, 1):
2482 		case IP_VERSION(9, 4, 0):
2483 		case IP_VERSION(9, 4, 1):
2484 		case IP_VERSION(9, 4, 2):
2485 		case IP_VERSION(9, 4, 3):
2486 		case IP_VERSION(9, 4, 4):
2487 		case IP_VERSION(10, 3, 0):
2488 		case IP_VERSION(11, 0, 0):
2489 		case IP_VERSION(11, 0, 1):
2490 		case IP_VERSION(11, 0, 2):
2491 		case IP_VERSION(11, 0, 3):
2492 			*states = ATTR_STATE_SUPPORTED;
2493 			break;
2494 		default:
2495 			*states = ATTR_STATE_UNSUPPORTED;
2496 		}
2497 	} else if (DEVICE_ATTR_IS(pp_features)) {
2498 		if ((adev->flags & AMD_IS_APU &&
2499 		     gc_ver != IP_VERSION(9, 4, 3)) ||
2500 		    gc_ver < IP_VERSION(9, 0, 0))
2501 			*states = ATTR_STATE_UNSUPPORTED;
2502 	} else if (DEVICE_ATTR_IS(gpu_metrics)) {
2503 		if (gc_ver < IP_VERSION(9, 1, 0))
2504 			*states = ATTR_STATE_UNSUPPORTED;
2505 	} else if (DEVICE_ATTR_IS(pp_power_profile_mode)) {
2506 		if (amdgpu_dpm_get_power_profile_mode(adev, NULL) == -EOPNOTSUPP)
2507 			*states = ATTR_STATE_UNSUPPORTED;
2508 		else if ((gc_ver == IP_VERSION(10, 3, 0) ||
2509 			  gc_ver == IP_VERSION(11, 0, 3)) && amdgpu_sriov_vf(adev))
2510 			*states = ATTR_STATE_UNSUPPORTED;
2511 	} else if (DEVICE_ATTR_IS(pp_mclk_od)) {
2512 		if (amdgpu_dpm_get_mclk_od(adev) == -EOPNOTSUPP)
2513 			*states = ATTR_STATE_UNSUPPORTED;
2514 	} else if (DEVICE_ATTR_IS(pp_sclk_od)) {
2515 		if (amdgpu_dpm_get_sclk_od(adev) == -EOPNOTSUPP)
2516 			*states = ATTR_STATE_UNSUPPORTED;
2517 	} else if (DEVICE_ATTR_IS(apu_thermal_cap)) {
2518 		u32 limit;
2519 
2520 		if (amdgpu_dpm_get_apu_thermal_limit(adev, &limit) ==
2521 		    -EOPNOTSUPP)
2522 			*states = ATTR_STATE_UNSUPPORTED;
2523 	}
2524 
2525 	switch (gc_ver) {
2526 	case IP_VERSION(10, 3, 0):
2527 		if (DEVICE_ATTR_IS(power_dpm_force_performance_level) &&
2528 		    amdgpu_sriov_vf(adev)) {
2529 			dev_attr->attr.mode &= ~0222;
2530 			dev_attr->store = NULL;
2531 		}
2532 		break;
2533 	default:
2534 		break;
2535 	}
2536 
2537 	return 0;
2538 }
2539 
2540 
2541 static int amdgpu_device_attr_create(struct amdgpu_device *adev,
2542 				     struct amdgpu_device_attr *attr,
2543 				     uint32_t mask, struct list_head *attr_list)
2544 {
2545 	int ret = 0;
2546 	enum amdgpu_device_attr_states attr_states = ATTR_STATE_SUPPORTED;
2547 	struct amdgpu_device_attr_entry *attr_entry;
2548 	struct device_attribute *dev_attr;
2549 	const char *name;
2550 
2551 	int (*attr_update)(struct amdgpu_device *adev, struct amdgpu_device_attr *attr,
2552 			   uint32_t mask, enum amdgpu_device_attr_states *states) = default_attr_update;
2553 
2554 	if (!attr)
2555 		return -EINVAL;
2556 
2557 	dev_attr = &attr->dev_attr;
2558 	name = dev_attr->attr.name;
2559 
2560 	attr_update = attr->attr_update ? attr->attr_update : default_attr_update;
2561 
2562 	ret = attr_update(adev, attr, mask, &attr_states);
2563 	if (ret) {
2564 		dev_err(adev->dev, "failed to update device file %s, ret = %d\n",
2565 			name, ret);
2566 		return ret;
2567 	}
2568 
2569 	if (attr_states == ATTR_STATE_UNSUPPORTED)
2570 		return 0;
2571 
2572 	ret = device_create_file(adev->dev, dev_attr);
2573 	if (ret) {
2574 		dev_err(adev->dev, "failed to create device file %s, ret = %d\n",
2575 			name, ret);
2576 	}
2577 
2578 	attr_entry = kmalloc(sizeof(*attr_entry), GFP_KERNEL);
2579 	if (!attr_entry)
2580 		return -ENOMEM;
2581 
2582 	attr_entry->attr = attr;
2583 	INIT_LIST_HEAD(&attr_entry->entry);
2584 
2585 	list_add_tail(&attr_entry->entry, attr_list);
2586 
2587 	return ret;
2588 }
2589 
2590 static void amdgpu_device_attr_remove(struct amdgpu_device *adev, struct amdgpu_device_attr *attr)
2591 {
2592 	struct device_attribute *dev_attr = &attr->dev_attr;
2593 
2594 	device_remove_file(adev->dev, dev_attr);
2595 }
2596 
2597 static void amdgpu_device_attr_remove_groups(struct amdgpu_device *adev,
2598 					     struct list_head *attr_list);
2599 
2600 static int amdgpu_device_attr_create_groups(struct amdgpu_device *adev,
2601 					    struct amdgpu_device_attr *attrs,
2602 					    uint32_t counts,
2603 					    uint32_t mask,
2604 					    struct list_head *attr_list)
2605 {
2606 	int ret = 0;
2607 	uint32_t i = 0;
2608 
2609 	for (i = 0; i < counts; i++) {
2610 		ret = amdgpu_device_attr_create(adev, &attrs[i], mask, attr_list);
2611 		if (ret)
2612 			goto failed;
2613 	}
2614 
2615 	return 0;
2616 
2617 failed:
2618 	amdgpu_device_attr_remove_groups(adev, attr_list);
2619 
2620 	return ret;
2621 }
2622 
2623 static void amdgpu_device_attr_remove_groups(struct amdgpu_device *adev,
2624 					     struct list_head *attr_list)
2625 {
2626 	struct amdgpu_device_attr_entry *entry, *entry_tmp;
2627 
2628 	if (list_empty(attr_list))
2629 		return ;
2630 
2631 	list_for_each_entry_safe(entry, entry_tmp, attr_list, entry) {
2632 		amdgpu_device_attr_remove(adev, entry->attr);
2633 		list_del(&entry->entry);
2634 		kfree(entry);
2635 	}
2636 }
2637 
2638 static ssize_t amdgpu_hwmon_show_temp(struct device *dev,
2639 				      struct device_attribute *attr,
2640 				      char *buf)
2641 {
2642 	struct amdgpu_device *adev = dev_get_drvdata(dev);
2643 	int channel = to_sensor_dev_attr(attr)->index;
2644 	int r, temp = 0;
2645 
2646 	if (channel >= PP_TEMP_MAX)
2647 		return -EINVAL;
2648 
2649 	switch (channel) {
2650 	case PP_TEMP_JUNCTION:
2651 		/* get current junction temperature */
2652 		r = amdgpu_hwmon_get_sensor_generic(adev, AMDGPU_PP_SENSOR_HOTSPOT_TEMP,
2653 					   (void *)&temp);
2654 		break;
2655 	case PP_TEMP_EDGE:
2656 		/* get current edge temperature */
2657 		r = amdgpu_hwmon_get_sensor_generic(adev, AMDGPU_PP_SENSOR_EDGE_TEMP,
2658 					   (void *)&temp);
2659 		break;
2660 	case PP_TEMP_MEM:
2661 		/* get current memory temperature */
2662 		r = amdgpu_hwmon_get_sensor_generic(adev, AMDGPU_PP_SENSOR_MEM_TEMP,
2663 					   (void *)&temp);
2664 		break;
2665 	default:
2666 		r = -EINVAL;
2667 		break;
2668 	}
2669 
2670 	if (r)
2671 		return r;
2672 
2673 	return sysfs_emit(buf, "%d\n", temp);
2674 }
2675 
2676 static ssize_t amdgpu_hwmon_show_temp_thresh(struct device *dev,
2677 					     struct device_attribute *attr,
2678 					     char *buf)
2679 {
2680 	struct amdgpu_device *adev = dev_get_drvdata(dev);
2681 	int hyst = to_sensor_dev_attr(attr)->index;
2682 	int temp;
2683 
2684 	if (hyst)
2685 		temp = adev->pm.dpm.thermal.min_temp;
2686 	else
2687 		temp = adev->pm.dpm.thermal.max_temp;
2688 
2689 	return sysfs_emit(buf, "%d\n", temp);
2690 }
2691 
2692 static ssize_t amdgpu_hwmon_show_hotspot_temp_thresh(struct device *dev,
2693 					     struct device_attribute *attr,
2694 					     char *buf)
2695 {
2696 	struct amdgpu_device *adev = dev_get_drvdata(dev);
2697 	int hyst = to_sensor_dev_attr(attr)->index;
2698 	int temp;
2699 
2700 	if (hyst)
2701 		temp = adev->pm.dpm.thermal.min_hotspot_temp;
2702 	else
2703 		temp = adev->pm.dpm.thermal.max_hotspot_crit_temp;
2704 
2705 	return sysfs_emit(buf, "%d\n", temp);
2706 }
2707 
2708 static ssize_t amdgpu_hwmon_show_mem_temp_thresh(struct device *dev,
2709 					     struct device_attribute *attr,
2710 					     char *buf)
2711 {
2712 	struct amdgpu_device *adev = dev_get_drvdata(dev);
2713 	int hyst = to_sensor_dev_attr(attr)->index;
2714 	int temp;
2715 
2716 	if (hyst)
2717 		temp = adev->pm.dpm.thermal.min_mem_temp;
2718 	else
2719 		temp = adev->pm.dpm.thermal.max_mem_crit_temp;
2720 
2721 	return sysfs_emit(buf, "%d\n", temp);
2722 }
2723 
2724 static ssize_t amdgpu_hwmon_show_temp_label(struct device *dev,
2725 					     struct device_attribute *attr,
2726 					     char *buf)
2727 {
2728 	int channel = to_sensor_dev_attr(attr)->index;
2729 
2730 	if (channel >= PP_TEMP_MAX)
2731 		return -EINVAL;
2732 
2733 	return sysfs_emit(buf, "%s\n", temp_label[channel].label);
2734 }
2735 
2736 static ssize_t amdgpu_hwmon_show_temp_emergency(struct device *dev,
2737 					     struct device_attribute *attr,
2738 					     char *buf)
2739 {
2740 	struct amdgpu_device *adev = dev_get_drvdata(dev);
2741 	int channel = to_sensor_dev_attr(attr)->index;
2742 	int temp = 0;
2743 
2744 	if (channel >= PP_TEMP_MAX)
2745 		return -EINVAL;
2746 
2747 	switch (channel) {
2748 	case PP_TEMP_JUNCTION:
2749 		temp = adev->pm.dpm.thermal.max_hotspot_emergency_temp;
2750 		break;
2751 	case PP_TEMP_EDGE:
2752 		temp = adev->pm.dpm.thermal.max_edge_emergency_temp;
2753 		break;
2754 	case PP_TEMP_MEM:
2755 		temp = adev->pm.dpm.thermal.max_mem_emergency_temp;
2756 		break;
2757 	}
2758 
2759 	return sysfs_emit(buf, "%d\n", temp);
2760 }
2761 
2762 static ssize_t amdgpu_hwmon_get_pwm1_enable(struct device *dev,
2763 					    struct device_attribute *attr,
2764 					    char *buf)
2765 {
2766 	struct amdgpu_device *adev = dev_get_drvdata(dev);
2767 	u32 pwm_mode = 0;
2768 	int ret;
2769 
2770 	if (amdgpu_in_reset(adev))
2771 		return -EPERM;
2772 	if (adev->in_suspend && !adev->in_runpm)
2773 		return -EPERM;
2774 
2775 	ret = pm_runtime_get_sync(adev_to_drm(adev)->dev);
2776 	if (ret < 0) {
2777 		pm_runtime_put_autosuspend(adev_to_drm(adev)->dev);
2778 		return ret;
2779 	}
2780 
2781 	ret = amdgpu_dpm_get_fan_control_mode(adev, &pwm_mode);
2782 
2783 	pm_runtime_mark_last_busy(adev_to_drm(adev)->dev);
2784 	pm_runtime_put_autosuspend(adev_to_drm(adev)->dev);
2785 
2786 	if (ret)
2787 		return -EINVAL;
2788 
2789 	return sysfs_emit(buf, "%u\n", pwm_mode);
2790 }
2791 
2792 static ssize_t amdgpu_hwmon_set_pwm1_enable(struct device *dev,
2793 					    struct device_attribute *attr,
2794 					    const char *buf,
2795 					    size_t count)
2796 {
2797 	struct amdgpu_device *adev = dev_get_drvdata(dev);
2798 	int err, ret;
2799 	u32 pwm_mode;
2800 	int value;
2801 
2802 	if (amdgpu_in_reset(adev))
2803 		return -EPERM;
2804 	if (adev->in_suspend && !adev->in_runpm)
2805 		return -EPERM;
2806 
2807 	err = kstrtoint(buf, 10, &value);
2808 	if (err)
2809 		return err;
2810 
2811 	if (value == 0)
2812 		pwm_mode = AMD_FAN_CTRL_NONE;
2813 	else if (value == 1)
2814 		pwm_mode = AMD_FAN_CTRL_MANUAL;
2815 	else if (value == 2)
2816 		pwm_mode = AMD_FAN_CTRL_AUTO;
2817 	else
2818 		return -EINVAL;
2819 
2820 	ret = pm_runtime_get_sync(adev_to_drm(adev)->dev);
2821 	if (ret < 0) {
2822 		pm_runtime_put_autosuspend(adev_to_drm(adev)->dev);
2823 		return ret;
2824 	}
2825 
2826 	ret = amdgpu_dpm_set_fan_control_mode(adev, pwm_mode);
2827 
2828 	pm_runtime_mark_last_busy(adev_to_drm(adev)->dev);
2829 	pm_runtime_put_autosuspend(adev_to_drm(adev)->dev);
2830 
2831 	if (ret)
2832 		return -EINVAL;
2833 
2834 	return count;
2835 }
2836 
2837 static ssize_t amdgpu_hwmon_get_pwm1_min(struct device *dev,
2838 					 struct device_attribute *attr,
2839 					 char *buf)
2840 {
2841 	return sysfs_emit(buf, "%i\n", 0);
2842 }
2843 
2844 static ssize_t amdgpu_hwmon_get_pwm1_max(struct device *dev,
2845 					 struct device_attribute *attr,
2846 					 char *buf)
2847 {
2848 	return sysfs_emit(buf, "%i\n", 255);
2849 }
2850 
2851 static ssize_t amdgpu_hwmon_set_pwm1(struct device *dev,
2852 				     struct device_attribute *attr,
2853 				     const char *buf, size_t count)
2854 {
2855 	struct amdgpu_device *adev = dev_get_drvdata(dev);
2856 	int err;
2857 	u32 value;
2858 	u32 pwm_mode;
2859 
2860 	if (amdgpu_in_reset(adev))
2861 		return -EPERM;
2862 	if (adev->in_suspend && !adev->in_runpm)
2863 		return -EPERM;
2864 
2865 	err = kstrtou32(buf, 10, &value);
2866 	if (err)
2867 		return err;
2868 
2869 	err = pm_runtime_get_sync(adev_to_drm(adev)->dev);
2870 	if (err < 0) {
2871 		pm_runtime_put_autosuspend(adev_to_drm(adev)->dev);
2872 		return err;
2873 	}
2874 
2875 	err = amdgpu_dpm_get_fan_control_mode(adev, &pwm_mode);
2876 	if (err)
2877 		goto out;
2878 
2879 	if (pwm_mode != AMD_FAN_CTRL_MANUAL) {
2880 		pr_info("manual fan speed control should be enabled first\n");
2881 		err = -EINVAL;
2882 		goto out;
2883 	}
2884 
2885 	err = amdgpu_dpm_set_fan_speed_pwm(adev, value);
2886 
2887 out:
2888 	pm_runtime_mark_last_busy(adev_to_drm(adev)->dev);
2889 	pm_runtime_put_autosuspend(adev_to_drm(adev)->dev);
2890 
2891 	if (err)
2892 		return err;
2893 
2894 	return count;
2895 }
2896 
2897 static ssize_t amdgpu_hwmon_get_pwm1(struct device *dev,
2898 				     struct device_attribute *attr,
2899 				     char *buf)
2900 {
2901 	struct amdgpu_device *adev = dev_get_drvdata(dev);
2902 	int err;
2903 	u32 speed = 0;
2904 
2905 	if (amdgpu_in_reset(adev))
2906 		return -EPERM;
2907 	if (adev->in_suspend && !adev->in_runpm)
2908 		return -EPERM;
2909 
2910 	err = pm_runtime_get_sync(adev_to_drm(adev)->dev);
2911 	if (err < 0) {
2912 		pm_runtime_put_autosuspend(adev_to_drm(adev)->dev);
2913 		return err;
2914 	}
2915 
2916 	err = amdgpu_dpm_get_fan_speed_pwm(adev, &speed);
2917 
2918 	pm_runtime_mark_last_busy(adev_to_drm(adev)->dev);
2919 	pm_runtime_put_autosuspend(adev_to_drm(adev)->dev);
2920 
2921 	if (err)
2922 		return err;
2923 
2924 	return sysfs_emit(buf, "%i\n", speed);
2925 }
2926 
2927 static ssize_t amdgpu_hwmon_get_fan1_input(struct device *dev,
2928 					   struct device_attribute *attr,
2929 					   char *buf)
2930 {
2931 	struct amdgpu_device *adev = dev_get_drvdata(dev);
2932 	int err;
2933 	u32 speed = 0;
2934 
2935 	if (amdgpu_in_reset(adev))
2936 		return -EPERM;
2937 	if (adev->in_suspend && !adev->in_runpm)
2938 		return -EPERM;
2939 
2940 	err = pm_runtime_get_sync(adev_to_drm(adev)->dev);
2941 	if (err < 0) {
2942 		pm_runtime_put_autosuspend(adev_to_drm(adev)->dev);
2943 		return err;
2944 	}
2945 
2946 	err = amdgpu_dpm_get_fan_speed_rpm(adev, &speed);
2947 
2948 	pm_runtime_mark_last_busy(adev_to_drm(adev)->dev);
2949 	pm_runtime_put_autosuspend(adev_to_drm(adev)->dev);
2950 
2951 	if (err)
2952 		return err;
2953 
2954 	return sysfs_emit(buf, "%i\n", speed);
2955 }
2956 
2957 static ssize_t amdgpu_hwmon_get_fan1_min(struct device *dev,
2958 					 struct device_attribute *attr,
2959 					 char *buf)
2960 {
2961 	struct amdgpu_device *adev = dev_get_drvdata(dev);
2962 	u32 min_rpm = 0;
2963 	int r;
2964 
2965 	r = amdgpu_hwmon_get_sensor_generic(adev, AMDGPU_PP_SENSOR_MIN_FAN_RPM,
2966 				   (void *)&min_rpm);
2967 
2968 	if (r)
2969 		return r;
2970 
2971 	return sysfs_emit(buf, "%d\n", min_rpm);
2972 }
2973 
2974 static ssize_t amdgpu_hwmon_get_fan1_max(struct device *dev,
2975 					 struct device_attribute *attr,
2976 					 char *buf)
2977 {
2978 	struct amdgpu_device *adev = dev_get_drvdata(dev);
2979 	u32 max_rpm = 0;
2980 	int r;
2981 
2982 	r = amdgpu_hwmon_get_sensor_generic(adev, AMDGPU_PP_SENSOR_MAX_FAN_RPM,
2983 				   (void *)&max_rpm);
2984 
2985 	if (r)
2986 		return r;
2987 
2988 	return sysfs_emit(buf, "%d\n", max_rpm);
2989 }
2990 
2991 static ssize_t amdgpu_hwmon_get_fan1_target(struct device *dev,
2992 					   struct device_attribute *attr,
2993 					   char *buf)
2994 {
2995 	struct amdgpu_device *adev = dev_get_drvdata(dev);
2996 	int err;
2997 	u32 rpm = 0;
2998 
2999 	if (amdgpu_in_reset(adev))
3000 		return -EPERM;
3001 	if (adev->in_suspend && !adev->in_runpm)
3002 		return -EPERM;
3003 
3004 	err = pm_runtime_get_sync(adev_to_drm(adev)->dev);
3005 	if (err < 0) {
3006 		pm_runtime_put_autosuspend(adev_to_drm(adev)->dev);
3007 		return err;
3008 	}
3009 
3010 	err = amdgpu_dpm_get_fan_speed_rpm(adev, &rpm);
3011 
3012 	pm_runtime_mark_last_busy(adev_to_drm(adev)->dev);
3013 	pm_runtime_put_autosuspend(adev_to_drm(adev)->dev);
3014 
3015 	if (err)
3016 		return err;
3017 
3018 	return sysfs_emit(buf, "%i\n", rpm);
3019 }
3020 
3021 static ssize_t amdgpu_hwmon_set_fan1_target(struct device *dev,
3022 				     struct device_attribute *attr,
3023 				     const char *buf, size_t count)
3024 {
3025 	struct amdgpu_device *adev = dev_get_drvdata(dev);
3026 	int err;
3027 	u32 value;
3028 	u32 pwm_mode;
3029 
3030 	if (amdgpu_in_reset(adev))
3031 		return -EPERM;
3032 	if (adev->in_suspend && !adev->in_runpm)
3033 		return -EPERM;
3034 
3035 	err = kstrtou32(buf, 10, &value);
3036 	if (err)
3037 		return err;
3038 
3039 	err = pm_runtime_get_sync(adev_to_drm(adev)->dev);
3040 	if (err < 0) {
3041 		pm_runtime_put_autosuspend(adev_to_drm(adev)->dev);
3042 		return err;
3043 	}
3044 
3045 	err = amdgpu_dpm_get_fan_control_mode(adev, &pwm_mode);
3046 	if (err)
3047 		goto out;
3048 
3049 	if (pwm_mode != AMD_FAN_CTRL_MANUAL) {
3050 		err = -ENODATA;
3051 		goto out;
3052 	}
3053 
3054 	err = amdgpu_dpm_set_fan_speed_rpm(adev, value);
3055 
3056 out:
3057 	pm_runtime_mark_last_busy(adev_to_drm(adev)->dev);
3058 	pm_runtime_put_autosuspend(adev_to_drm(adev)->dev);
3059 
3060 	if (err)
3061 		return err;
3062 
3063 	return count;
3064 }
3065 
3066 static ssize_t amdgpu_hwmon_get_fan1_enable(struct device *dev,
3067 					    struct device_attribute *attr,
3068 					    char *buf)
3069 {
3070 	struct amdgpu_device *adev = dev_get_drvdata(dev);
3071 	u32 pwm_mode = 0;
3072 	int ret;
3073 
3074 	if (amdgpu_in_reset(adev))
3075 		return -EPERM;
3076 	if (adev->in_suspend && !adev->in_runpm)
3077 		return -EPERM;
3078 
3079 	ret = pm_runtime_get_sync(adev_to_drm(adev)->dev);
3080 	if (ret < 0) {
3081 		pm_runtime_put_autosuspend(adev_to_drm(adev)->dev);
3082 		return ret;
3083 	}
3084 
3085 	ret = amdgpu_dpm_get_fan_control_mode(adev, &pwm_mode);
3086 
3087 	pm_runtime_mark_last_busy(adev_to_drm(adev)->dev);
3088 	pm_runtime_put_autosuspend(adev_to_drm(adev)->dev);
3089 
3090 	if (ret)
3091 		return -EINVAL;
3092 
3093 	return sysfs_emit(buf, "%i\n", pwm_mode == AMD_FAN_CTRL_AUTO ? 0 : 1);
3094 }
3095 
3096 static ssize_t amdgpu_hwmon_set_fan1_enable(struct device *dev,
3097 					    struct device_attribute *attr,
3098 					    const char *buf,
3099 					    size_t count)
3100 {
3101 	struct amdgpu_device *adev = dev_get_drvdata(dev);
3102 	int err;
3103 	int value;
3104 	u32 pwm_mode;
3105 
3106 	if (amdgpu_in_reset(adev))
3107 		return -EPERM;
3108 	if (adev->in_suspend && !adev->in_runpm)
3109 		return -EPERM;
3110 
3111 	err = kstrtoint(buf, 10, &value);
3112 	if (err)
3113 		return err;
3114 
3115 	if (value == 0)
3116 		pwm_mode = AMD_FAN_CTRL_AUTO;
3117 	else if (value == 1)
3118 		pwm_mode = AMD_FAN_CTRL_MANUAL;
3119 	else
3120 		return -EINVAL;
3121 
3122 	err = pm_runtime_get_sync(adev_to_drm(adev)->dev);
3123 	if (err < 0) {
3124 		pm_runtime_put_autosuspend(adev_to_drm(adev)->dev);
3125 		return err;
3126 	}
3127 
3128 	err = amdgpu_dpm_set_fan_control_mode(adev, pwm_mode);
3129 
3130 	pm_runtime_mark_last_busy(adev_to_drm(adev)->dev);
3131 	pm_runtime_put_autosuspend(adev_to_drm(adev)->dev);
3132 
3133 	if (err)
3134 		return -EINVAL;
3135 
3136 	return count;
3137 }
3138 
3139 static ssize_t amdgpu_hwmon_show_vddgfx(struct device *dev,
3140 					struct device_attribute *attr,
3141 					char *buf)
3142 {
3143 	struct amdgpu_device *adev = dev_get_drvdata(dev);
3144 	u32 vddgfx;
3145 	int r;
3146 
3147 	/* get the voltage */
3148 	r = amdgpu_hwmon_get_sensor_generic(adev, AMDGPU_PP_SENSOR_VDDGFX,
3149 				   (void *)&vddgfx);
3150 	if (r)
3151 		return r;
3152 
3153 	return sysfs_emit(buf, "%d\n", vddgfx);
3154 }
3155 
3156 static ssize_t amdgpu_hwmon_show_vddgfx_label(struct device *dev,
3157 					      struct device_attribute *attr,
3158 					      char *buf)
3159 {
3160 	return sysfs_emit(buf, "vddgfx\n");
3161 }
3162 
3163 static ssize_t amdgpu_hwmon_show_vddnb(struct device *dev,
3164 				       struct device_attribute *attr,
3165 				       char *buf)
3166 {
3167 	struct amdgpu_device *adev = dev_get_drvdata(dev);
3168 	u32 vddnb;
3169 	int r;
3170 
3171 	/* only APUs have vddnb */
3172 	if  (!(adev->flags & AMD_IS_APU))
3173 		return -EINVAL;
3174 
3175 	/* get the voltage */
3176 	r = amdgpu_hwmon_get_sensor_generic(adev, AMDGPU_PP_SENSOR_VDDNB,
3177 				   (void *)&vddnb);
3178 	if (r)
3179 		return r;
3180 
3181 	return sysfs_emit(buf, "%d\n", vddnb);
3182 }
3183 
3184 static ssize_t amdgpu_hwmon_show_vddnb_label(struct device *dev,
3185 					      struct device_attribute *attr,
3186 					      char *buf)
3187 {
3188 	return sysfs_emit(buf, "vddnb\n");
3189 }
3190 
3191 static int amdgpu_hwmon_get_power(struct device *dev,
3192 				  enum amd_pp_sensors sensor)
3193 {
3194 	struct amdgpu_device *adev = dev_get_drvdata(dev);
3195 	unsigned int uw;
3196 	u32 query = 0;
3197 	int r;
3198 
3199 	r = amdgpu_hwmon_get_sensor_generic(adev, sensor, (void *)&query);
3200 	if (r)
3201 		return r;
3202 
3203 	/* convert to microwatts */
3204 	uw = (query >> 8) * 1000000 + (query & 0xff) * 1000;
3205 
3206 	return uw;
3207 }
3208 
3209 static ssize_t amdgpu_hwmon_show_power_avg(struct device *dev,
3210 					   struct device_attribute *attr,
3211 					   char *buf)
3212 {
3213 	ssize_t val;
3214 
3215 	val = amdgpu_hwmon_get_power(dev, AMDGPU_PP_SENSOR_GPU_AVG_POWER);
3216 	if (val < 0)
3217 		return val;
3218 
3219 	return sysfs_emit(buf, "%zd\n", val);
3220 }
3221 
3222 static ssize_t amdgpu_hwmon_show_power_input(struct device *dev,
3223 					     struct device_attribute *attr,
3224 					     char *buf)
3225 {
3226 	ssize_t val;
3227 
3228 	val = amdgpu_hwmon_get_power(dev, AMDGPU_PP_SENSOR_GPU_INPUT_POWER);
3229 	if (val < 0)
3230 		return val;
3231 
3232 	return sysfs_emit(buf, "%zd\n", val);
3233 }
3234 
3235 static ssize_t amdgpu_hwmon_show_power_cap_generic(struct device *dev,
3236 					struct device_attribute *attr,
3237 					char *buf,
3238 					enum pp_power_limit_level pp_limit_level)
3239 {
3240 	struct amdgpu_device *adev = dev_get_drvdata(dev);
3241 	enum pp_power_type power_type = to_sensor_dev_attr(attr)->index;
3242 	uint32_t limit;
3243 	ssize_t size;
3244 	int r;
3245 
3246 	if (amdgpu_in_reset(adev))
3247 		return -EPERM;
3248 	if (adev->in_suspend && !adev->in_runpm)
3249 		return -EPERM;
3250 
3251 	r = pm_runtime_get_sync(adev_to_drm(adev)->dev);
3252 	if (r < 0) {
3253 		pm_runtime_put_autosuspend(adev_to_drm(adev)->dev);
3254 		return r;
3255 	}
3256 
3257 	r = amdgpu_dpm_get_power_limit(adev, &limit,
3258 				      pp_limit_level, power_type);
3259 
3260 	if (!r)
3261 		size = sysfs_emit(buf, "%u\n", limit * 1000000);
3262 	else
3263 		size = sysfs_emit(buf, "\n");
3264 
3265 	pm_runtime_mark_last_busy(adev_to_drm(adev)->dev);
3266 	pm_runtime_put_autosuspend(adev_to_drm(adev)->dev);
3267 
3268 	return size;
3269 }
3270 
3271 static ssize_t amdgpu_hwmon_show_power_cap_min(struct device *dev,
3272 					 struct device_attribute *attr,
3273 					 char *buf)
3274 {
3275 	return amdgpu_hwmon_show_power_cap_generic(dev, attr, buf, PP_PWR_LIMIT_MIN);
3276 }
3277 
3278 static ssize_t amdgpu_hwmon_show_power_cap_max(struct device *dev,
3279 					 struct device_attribute *attr,
3280 					 char *buf)
3281 {
3282 	return amdgpu_hwmon_show_power_cap_generic(dev, attr, buf, PP_PWR_LIMIT_MAX);
3283 
3284 }
3285 
3286 static ssize_t amdgpu_hwmon_show_power_cap(struct device *dev,
3287 					 struct device_attribute *attr,
3288 					 char *buf)
3289 {
3290 	return amdgpu_hwmon_show_power_cap_generic(dev, attr, buf, PP_PWR_LIMIT_CURRENT);
3291 
3292 }
3293 
3294 static ssize_t amdgpu_hwmon_show_power_cap_default(struct device *dev,
3295 					 struct device_attribute *attr,
3296 					 char *buf)
3297 {
3298 	return amdgpu_hwmon_show_power_cap_generic(dev, attr, buf, PP_PWR_LIMIT_DEFAULT);
3299 
3300 }
3301 
3302 static ssize_t amdgpu_hwmon_show_power_label(struct device *dev,
3303 					 struct device_attribute *attr,
3304 					 char *buf)
3305 {
3306 	struct amdgpu_device *adev = dev_get_drvdata(dev);
3307 	uint32_t gc_ver = amdgpu_ip_version(adev, GC_HWIP, 0);
3308 
3309 	if (gc_ver == IP_VERSION(10, 3, 1))
3310 		return sysfs_emit(buf, "%s\n",
3311 				  to_sensor_dev_attr(attr)->index == PP_PWR_TYPE_FAST ?
3312 				  "fastPPT" : "slowPPT");
3313 	else
3314 		return sysfs_emit(buf, "PPT\n");
3315 }
3316 
3317 static ssize_t amdgpu_hwmon_set_power_cap(struct device *dev,
3318 		struct device_attribute *attr,
3319 		const char *buf,
3320 		size_t count)
3321 {
3322 	struct amdgpu_device *adev = dev_get_drvdata(dev);
3323 	int limit_type = to_sensor_dev_attr(attr)->index;
3324 	int err;
3325 	u32 value;
3326 
3327 	if (amdgpu_in_reset(adev))
3328 		return -EPERM;
3329 	if (adev->in_suspend && !adev->in_runpm)
3330 		return -EPERM;
3331 
3332 	if (amdgpu_sriov_vf(adev))
3333 		return -EINVAL;
3334 
3335 	err = kstrtou32(buf, 10, &value);
3336 	if (err)
3337 		return err;
3338 
3339 	value = value / 1000000; /* convert to Watt */
3340 	value |= limit_type << 24;
3341 
3342 	err = pm_runtime_get_sync(adev_to_drm(adev)->dev);
3343 	if (err < 0) {
3344 		pm_runtime_put_autosuspend(adev_to_drm(adev)->dev);
3345 		return err;
3346 	}
3347 
3348 	err = amdgpu_dpm_set_power_limit(adev, value);
3349 
3350 	pm_runtime_mark_last_busy(adev_to_drm(adev)->dev);
3351 	pm_runtime_put_autosuspend(adev_to_drm(adev)->dev);
3352 
3353 	if (err)
3354 		return err;
3355 
3356 	return count;
3357 }
3358 
3359 static ssize_t amdgpu_hwmon_show_sclk(struct device *dev,
3360 				      struct device_attribute *attr,
3361 				      char *buf)
3362 {
3363 	struct amdgpu_device *adev = dev_get_drvdata(dev);
3364 	uint32_t sclk;
3365 	int r;
3366 
3367 	/* get the sclk */
3368 	r = amdgpu_hwmon_get_sensor_generic(adev, AMDGPU_PP_SENSOR_GFX_SCLK,
3369 				   (void *)&sclk);
3370 	if (r)
3371 		return r;
3372 
3373 	return sysfs_emit(buf, "%u\n", sclk * 10 * 1000);
3374 }
3375 
3376 static ssize_t amdgpu_hwmon_show_sclk_label(struct device *dev,
3377 					    struct device_attribute *attr,
3378 					    char *buf)
3379 {
3380 	return sysfs_emit(buf, "sclk\n");
3381 }
3382 
3383 static ssize_t amdgpu_hwmon_show_mclk(struct device *dev,
3384 				      struct device_attribute *attr,
3385 				      char *buf)
3386 {
3387 	struct amdgpu_device *adev = dev_get_drvdata(dev);
3388 	uint32_t mclk;
3389 	int r;
3390 
3391 	/* get the sclk */
3392 	r = amdgpu_hwmon_get_sensor_generic(adev, AMDGPU_PP_SENSOR_GFX_MCLK,
3393 				   (void *)&mclk);
3394 	if (r)
3395 		return r;
3396 
3397 	return sysfs_emit(buf, "%u\n", mclk * 10 * 1000);
3398 }
3399 
3400 static ssize_t amdgpu_hwmon_show_mclk_label(struct device *dev,
3401 					    struct device_attribute *attr,
3402 					    char *buf)
3403 {
3404 	return sysfs_emit(buf, "mclk\n");
3405 }
3406 
3407 /**
3408  * DOC: hwmon
3409  *
3410  * The amdgpu driver exposes the following sensor interfaces:
3411  *
3412  * - GPU temperature (via the on-die sensor)
3413  *
3414  * - GPU voltage
3415  *
3416  * - Northbridge voltage (APUs only)
3417  *
3418  * - GPU power
3419  *
3420  * - GPU fan
3421  *
3422  * - GPU gfx/compute engine clock
3423  *
3424  * - GPU memory clock (dGPU only)
3425  *
3426  * hwmon interfaces for GPU temperature:
3427  *
3428  * - temp[1-3]_input: the on die GPU temperature in millidegrees Celsius
3429  *   - temp2_input and temp3_input are supported on SOC15 dGPUs only
3430  *
3431  * - temp[1-3]_label: temperature channel label
3432  *   - temp2_label and temp3_label are supported on SOC15 dGPUs only
3433  *
3434  * - temp[1-3]_crit: temperature critical max value in millidegrees Celsius
3435  *   - temp2_crit and temp3_crit are supported on SOC15 dGPUs only
3436  *
3437  * - temp[1-3]_crit_hyst: temperature hysteresis for critical limit in millidegrees Celsius
3438  *   - temp2_crit_hyst and temp3_crit_hyst are supported on SOC15 dGPUs only
3439  *
3440  * - temp[1-3]_emergency: temperature emergency max value(asic shutdown) in millidegrees Celsius
3441  *   - these are supported on SOC15 dGPUs only
3442  *
3443  * hwmon interfaces for GPU voltage:
3444  *
3445  * - in0_input: the voltage on the GPU in millivolts
3446  *
3447  * - in1_input: the voltage on the Northbridge in millivolts
3448  *
3449  * hwmon interfaces for GPU power:
3450  *
3451  * - power1_average: average power used by the SoC in microWatts.  On APUs this includes the CPU.
3452  *
3453  * - power1_input: instantaneous power used by the SoC in microWatts.  On APUs this includes the CPU.
3454  *
3455  * - power1_cap_min: minimum cap supported in microWatts
3456  *
3457  * - power1_cap_max: maximum cap supported in microWatts
3458  *
3459  * - power1_cap: selected power cap in microWatts
3460  *
3461  * hwmon interfaces for GPU fan:
3462  *
3463  * - pwm1: pulse width modulation fan level (0-255)
3464  *
3465  * - pwm1_enable: pulse width modulation fan control method (0: no fan speed control, 1: manual fan speed control using pwm interface, 2: automatic fan speed control)
3466  *
3467  * - pwm1_min: pulse width modulation fan control minimum level (0)
3468  *
3469  * - pwm1_max: pulse width modulation fan control maximum level (255)
3470  *
3471  * - fan1_min: a minimum value Unit: revolution/min (RPM)
3472  *
3473  * - fan1_max: a maximum value Unit: revolution/max (RPM)
3474  *
3475  * - fan1_input: fan speed in RPM
3476  *
3477  * - fan[1-\*]_target: Desired fan speed Unit: revolution/min (RPM)
3478  *
3479  * - fan[1-\*]_enable: Enable or disable the sensors.1: Enable 0: Disable
3480  *
3481  * NOTE: DO NOT set the fan speed via "pwm1" and "fan[1-\*]_target" interfaces at the same time.
3482  *       That will get the former one overridden.
3483  *
3484  * hwmon interfaces for GPU clocks:
3485  *
3486  * - freq1_input: the gfx/compute clock in hertz
3487  *
3488  * - freq2_input: the memory clock in hertz
3489  *
3490  * You can use hwmon tools like sensors to view this information on your system.
3491  *
3492  */
3493 
3494 static SENSOR_DEVICE_ATTR(temp1_input, S_IRUGO, amdgpu_hwmon_show_temp, NULL, PP_TEMP_EDGE);
3495 static SENSOR_DEVICE_ATTR(temp1_crit, S_IRUGO, amdgpu_hwmon_show_temp_thresh, NULL, 0);
3496 static SENSOR_DEVICE_ATTR(temp1_crit_hyst, S_IRUGO, amdgpu_hwmon_show_temp_thresh, NULL, 1);
3497 static SENSOR_DEVICE_ATTR(temp1_emergency, S_IRUGO, amdgpu_hwmon_show_temp_emergency, NULL, PP_TEMP_EDGE);
3498 static SENSOR_DEVICE_ATTR(temp2_input, S_IRUGO, amdgpu_hwmon_show_temp, NULL, PP_TEMP_JUNCTION);
3499 static SENSOR_DEVICE_ATTR(temp2_crit, S_IRUGO, amdgpu_hwmon_show_hotspot_temp_thresh, NULL, 0);
3500 static SENSOR_DEVICE_ATTR(temp2_crit_hyst, S_IRUGO, amdgpu_hwmon_show_hotspot_temp_thresh, NULL, 1);
3501 static SENSOR_DEVICE_ATTR(temp2_emergency, S_IRUGO, amdgpu_hwmon_show_temp_emergency, NULL, PP_TEMP_JUNCTION);
3502 static SENSOR_DEVICE_ATTR(temp3_input, S_IRUGO, amdgpu_hwmon_show_temp, NULL, PP_TEMP_MEM);
3503 static SENSOR_DEVICE_ATTR(temp3_crit, S_IRUGO, amdgpu_hwmon_show_mem_temp_thresh, NULL, 0);
3504 static SENSOR_DEVICE_ATTR(temp3_crit_hyst, S_IRUGO, amdgpu_hwmon_show_mem_temp_thresh, NULL, 1);
3505 static SENSOR_DEVICE_ATTR(temp3_emergency, S_IRUGO, amdgpu_hwmon_show_temp_emergency, NULL, PP_TEMP_MEM);
3506 static SENSOR_DEVICE_ATTR(temp1_label, S_IRUGO, amdgpu_hwmon_show_temp_label, NULL, PP_TEMP_EDGE);
3507 static SENSOR_DEVICE_ATTR(temp2_label, S_IRUGO, amdgpu_hwmon_show_temp_label, NULL, PP_TEMP_JUNCTION);
3508 static SENSOR_DEVICE_ATTR(temp3_label, S_IRUGO, amdgpu_hwmon_show_temp_label, NULL, PP_TEMP_MEM);
3509 static SENSOR_DEVICE_ATTR(pwm1, S_IRUGO | S_IWUSR, amdgpu_hwmon_get_pwm1, amdgpu_hwmon_set_pwm1, 0);
3510 static SENSOR_DEVICE_ATTR(pwm1_enable, S_IRUGO | S_IWUSR, amdgpu_hwmon_get_pwm1_enable, amdgpu_hwmon_set_pwm1_enable, 0);
3511 static SENSOR_DEVICE_ATTR(pwm1_min, S_IRUGO, amdgpu_hwmon_get_pwm1_min, NULL, 0);
3512 static SENSOR_DEVICE_ATTR(pwm1_max, S_IRUGO, amdgpu_hwmon_get_pwm1_max, NULL, 0);
3513 static SENSOR_DEVICE_ATTR(fan1_input, S_IRUGO, amdgpu_hwmon_get_fan1_input, NULL, 0);
3514 static SENSOR_DEVICE_ATTR(fan1_min, S_IRUGO, amdgpu_hwmon_get_fan1_min, NULL, 0);
3515 static SENSOR_DEVICE_ATTR(fan1_max, S_IRUGO, amdgpu_hwmon_get_fan1_max, NULL, 0);
3516 static SENSOR_DEVICE_ATTR(fan1_target, S_IRUGO | S_IWUSR, amdgpu_hwmon_get_fan1_target, amdgpu_hwmon_set_fan1_target, 0);
3517 static SENSOR_DEVICE_ATTR(fan1_enable, S_IRUGO | S_IWUSR, amdgpu_hwmon_get_fan1_enable, amdgpu_hwmon_set_fan1_enable, 0);
3518 static SENSOR_DEVICE_ATTR(in0_input, S_IRUGO, amdgpu_hwmon_show_vddgfx, NULL, 0);
3519 static SENSOR_DEVICE_ATTR(in0_label, S_IRUGO, amdgpu_hwmon_show_vddgfx_label, NULL, 0);
3520 static SENSOR_DEVICE_ATTR(in1_input, S_IRUGO, amdgpu_hwmon_show_vddnb, NULL, 0);
3521 static SENSOR_DEVICE_ATTR(in1_label, S_IRUGO, amdgpu_hwmon_show_vddnb_label, NULL, 0);
3522 static SENSOR_DEVICE_ATTR(power1_average, S_IRUGO, amdgpu_hwmon_show_power_avg, NULL, 0);
3523 static SENSOR_DEVICE_ATTR(power1_input, S_IRUGO, amdgpu_hwmon_show_power_input, NULL, 0);
3524 static SENSOR_DEVICE_ATTR(power1_cap_max, S_IRUGO, amdgpu_hwmon_show_power_cap_max, NULL, 0);
3525 static SENSOR_DEVICE_ATTR(power1_cap_min, S_IRUGO, amdgpu_hwmon_show_power_cap_min, NULL, 0);
3526 static SENSOR_DEVICE_ATTR(power1_cap, S_IRUGO | S_IWUSR, amdgpu_hwmon_show_power_cap, amdgpu_hwmon_set_power_cap, 0);
3527 static SENSOR_DEVICE_ATTR(power1_cap_default, S_IRUGO, amdgpu_hwmon_show_power_cap_default, NULL, 0);
3528 static SENSOR_DEVICE_ATTR(power1_label, S_IRUGO, amdgpu_hwmon_show_power_label, NULL, 0);
3529 static SENSOR_DEVICE_ATTR(power2_average, S_IRUGO, amdgpu_hwmon_show_power_avg, NULL, 1);
3530 static SENSOR_DEVICE_ATTR(power2_cap_max, S_IRUGO, amdgpu_hwmon_show_power_cap_max, NULL, 1);
3531 static SENSOR_DEVICE_ATTR(power2_cap_min, S_IRUGO, amdgpu_hwmon_show_power_cap_min, NULL, 1);
3532 static SENSOR_DEVICE_ATTR(power2_cap, S_IRUGO | S_IWUSR, amdgpu_hwmon_show_power_cap, amdgpu_hwmon_set_power_cap, 1);
3533 static SENSOR_DEVICE_ATTR(power2_cap_default, S_IRUGO, amdgpu_hwmon_show_power_cap_default, NULL, 1);
3534 static SENSOR_DEVICE_ATTR(power2_label, S_IRUGO, amdgpu_hwmon_show_power_label, NULL, 1);
3535 static SENSOR_DEVICE_ATTR(freq1_input, S_IRUGO, amdgpu_hwmon_show_sclk, NULL, 0);
3536 static SENSOR_DEVICE_ATTR(freq1_label, S_IRUGO, amdgpu_hwmon_show_sclk_label, NULL, 0);
3537 static SENSOR_DEVICE_ATTR(freq2_input, S_IRUGO, amdgpu_hwmon_show_mclk, NULL, 0);
3538 static SENSOR_DEVICE_ATTR(freq2_label, S_IRUGO, amdgpu_hwmon_show_mclk_label, NULL, 0);
3539 
3540 static struct attribute *hwmon_attributes[] = {
3541 	&sensor_dev_attr_temp1_input.dev_attr.attr,
3542 	&sensor_dev_attr_temp1_crit.dev_attr.attr,
3543 	&sensor_dev_attr_temp1_crit_hyst.dev_attr.attr,
3544 	&sensor_dev_attr_temp2_input.dev_attr.attr,
3545 	&sensor_dev_attr_temp2_crit.dev_attr.attr,
3546 	&sensor_dev_attr_temp2_crit_hyst.dev_attr.attr,
3547 	&sensor_dev_attr_temp3_input.dev_attr.attr,
3548 	&sensor_dev_attr_temp3_crit.dev_attr.attr,
3549 	&sensor_dev_attr_temp3_crit_hyst.dev_attr.attr,
3550 	&sensor_dev_attr_temp1_emergency.dev_attr.attr,
3551 	&sensor_dev_attr_temp2_emergency.dev_attr.attr,
3552 	&sensor_dev_attr_temp3_emergency.dev_attr.attr,
3553 	&sensor_dev_attr_temp1_label.dev_attr.attr,
3554 	&sensor_dev_attr_temp2_label.dev_attr.attr,
3555 	&sensor_dev_attr_temp3_label.dev_attr.attr,
3556 	&sensor_dev_attr_pwm1.dev_attr.attr,
3557 	&sensor_dev_attr_pwm1_enable.dev_attr.attr,
3558 	&sensor_dev_attr_pwm1_min.dev_attr.attr,
3559 	&sensor_dev_attr_pwm1_max.dev_attr.attr,
3560 	&sensor_dev_attr_fan1_input.dev_attr.attr,
3561 	&sensor_dev_attr_fan1_min.dev_attr.attr,
3562 	&sensor_dev_attr_fan1_max.dev_attr.attr,
3563 	&sensor_dev_attr_fan1_target.dev_attr.attr,
3564 	&sensor_dev_attr_fan1_enable.dev_attr.attr,
3565 	&sensor_dev_attr_in0_input.dev_attr.attr,
3566 	&sensor_dev_attr_in0_label.dev_attr.attr,
3567 	&sensor_dev_attr_in1_input.dev_attr.attr,
3568 	&sensor_dev_attr_in1_label.dev_attr.attr,
3569 	&sensor_dev_attr_power1_average.dev_attr.attr,
3570 	&sensor_dev_attr_power1_input.dev_attr.attr,
3571 	&sensor_dev_attr_power1_cap_max.dev_attr.attr,
3572 	&sensor_dev_attr_power1_cap_min.dev_attr.attr,
3573 	&sensor_dev_attr_power1_cap.dev_attr.attr,
3574 	&sensor_dev_attr_power1_cap_default.dev_attr.attr,
3575 	&sensor_dev_attr_power1_label.dev_attr.attr,
3576 	&sensor_dev_attr_power2_average.dev_attr.attr,
3577 	&sensor_dev_attr_power2_cap_max.dev_attr.attr,
3578 	&sensor_dev_attr_power2_cap_min.dev_attr.attr,
3579 	&sensor_dev_attr_power2_cap.dev_attr.attr,
3580 	&sensor_dev_attr_power2_cap_default.dev_attr.attr,
3581 	&sensor_dev_attr_power2_label.dev_attr.attr,
3582 	&sensor_dev_attr_freq1_input.dev_attr.attr,
3583 	&sensor_dev_attr_freq1_label.dev_attr.attr,
3584 	&sensor_dev_attr_freq2_input.dev_attr.attr,
3585 	&sensor_dev_attr_freq2_label.dev_attr.attr,
3586 	NULL
3587 };
3588 
3589 static umode_t hwmon_attributes_visible(struct kobject *kobj,
3590 					struct attribute *attr, int index)
3591 {
3592 	struct device *dev = kobj_to_dev(kobj);
3593 	struct amdgpu_device *adev = dev_get_drvdata(dev);
3594 	umode_t effective_mode = attr->mode;
3595 	uint32_t gc_ver = amdgpu_ip_version(adev, GC_HWIP, 0);
3596 	uint32_t tmp;
3597 
3598 	/* under pp one vf mode manage of hwmon attributes is not supported */
3599 	if (amdgpu_sriov_is_pp_one_vf(adev))
3600 		effective_mode &= ~S_IWUSR;
3601 
3602 	/* Skip fan attributes if fan is not present */
3603 	if (adev->pm.no_fan && (attr == &sensor_dev_attr_pwm1.dev_attr.attr ||
3604 	    attr == &sensor_dev_attr_pwm1_enable.dev_attr.attr ||
3605 	    attr == &sensor_dev_attr_pwm1_max.dev_attr.attr ||
3606 	    attr == &sensor_dev_attr_pwm1_min.dev_attr.attr ||
3607 	    attr == &sensor_dev_attr_fan1_input.dev_attr.attr ||
3608 	    attr == &sensor_dev_attr_fan1_min.dev_attr.attr ||
3609 	    attr == &sensor_dev_attr_fan1_max.dev_attr.attr ||
3610 	    attr == &sensor_dev_attr_fan1_target.dev_attr.attr ||
3611 	    attr == &sensor_dev_attr_fan1_enable.dev_attr.attr))
3612 		return 0;
3613 
3614 	/* Skip fan attributes on APU */
3615 	if ((adev->flags & AMD_IS_APU) &&
3616 	    (attr == &sensor_dev_attr_pwm1.dev_attr.attr ||
3617 	     attr == &sensor_dev_attr_pwm1_enable.dev_attr.attr ||
3618 	     attr == &sensor_dev_attr_pwm1_max.dev_attr.attr ||
3619 	     attr == &sensor_dev_attr_pwm1_min.dev_attr.attr ||
3620 	     attr == &sensor_dev_attr_fan1_input.dev_attr.attr ||
3621 	     attr == &sensor_dev_attr_fan1_min.dev_attr.attr ||
3622 	     attr == &sensor_dev_attr_fan1_max.dev_attr.attr ||
3623 	     attr == &sensor_dev_attr_fan1_target.dev_attr.attr ||
3624 	     attr == &sensor_dev_attr_fan1_enable.dev_attr.attr))
3625 		return 0;
3626 
3627 	/* Skip crit temp on APU */
3628 	if ((((adev->flags & AMD_IS_APU) && (adev->family >= AMDGPU_FAMILY_CZ)) ||
3629 	    (gc_ver == IP_VERSION(9, 4, 3) || gc_ver == IP_VERSION(9, 4, 4))) &&
3630 	    (attr == &sensor_dev_attr_temp1_crit.dev_attr.attr ||
3631 	     attr == &sensor_dev_attr_temp1_crit_hyst.dev_attr.attr))
3632 		return 0;
3633 
3634 	/* Skip limit attributes if DPM is not enabled */
3635 	if (!adev->pm.dpm_enabled &&
3636 	    (attr == &sensor_dev_attr_temp1_crit.dev_attr.attr ||
3637 	     attr == &sensor_dev_attr_temp1_crit_hyst.dev_attr.attr ||
3638 	     attr == &sensor_dev_attr_pwm1.dev_attr.attr ||
3639 	     attr == &sensor_dev_attr_pwm1_enable.dev_attr.attr ||
3640 	     attr == &sensor_dev_attr_pwm1_max.dev_attr.attr ||
3641 	     attr == &sensor_dev_attr_pwm1_min.dev_attr.attr ||
3642 	     attr == &sensor_dev_attr_fan1_input.dev_attr.attr ||
3643 	     attr == &sensor_dev_attr_fan1_min.dev_attr.attr ||
3644 	     attr == &sensor_dev_attr_fan1_max.dev_attr.attr ||
3645 	     attr == &sensor_dev_attr_fan1_target.dev_attr.attr ||
3646 	     attr == &sensor_dev_attr_fan1_enable.dev_attr.attr))
3647 		return 0;
3648 
3649 	/* mask fan attributes if we have no bindings for this asic to expose */
3650 	if (((amdgpu_dpm_get_fan_speed_pwm(adev, NULL) == -EOPNOTSUPP) &&
3651 	      attr == &sensor_dev_attr_pwm1.dev_attr.attr) || /* can't query fan */
3652 	    ((amdgpu_dpm_get_fan_control_mode(adev, NULL) == -EOPNOTSUPP) &&
3653 	     attr == &sensor_dev_attr_pwm1_enable.dev_attr.attr)) /* can't query state */
3654 		effective_mode &= ~S_IRUGO;
3655 
3656 	if (((amdgpu_dpm_set_fan_speed_pwm(adev, U32_MAX) == -EOPNOTSUPP) &&
3657 	      attr == &sensor_dev_attr_pwm1.dev_attr.attr) || /* can't manage fan */
3658 	      ((amdgpu_dpm_set_fan_control_mode(adev, U32_MAX) == -EOPNOTSUPP) &&
3659 	      attr == &sensor_dev_attr_pwm1_enable.dev_attr.attr)) /* can't manage state */
3660 		effective_mode &= ~S_IWUSR;
3661 
3662 	/* not implemented yet for APUs other than GC 10.3.1 (vangogh) and 9.4.3 */
3663 	if (((adev->family == AMDGPU_FAMILY_SI) ||
3664 	     ((adev->flags & AMD_IS_APU) && (gc_ver != IP_VERSION(10, 3, 1)) &&
3665 	      (gc_ver != IP_VERSION(9, 4, 3) && gc_ver != IP_VERSION(9, 4, 4)))) &&
3666 	    (attr == &sensor_dev_attr_power1_cap_max.dev_attr.attr ||
3667 	     attr == &sensor_dev_attr_power1_cap_min.dev_attr.attr ||
3668 	     attr == &sensor_dev_attr_power1_cap.dev_attr.attr ||
3669 	     attr == &sensor_dev_attr_power1_cap_default.dev_attr.attr))
3670 		return 0;
3671 
3672 	/* not implemented yet for APUs having < GC 9.3.0 (Renoir) */
3673 	if (((adev->family == AMDGPU_FAMILY_SI) ||
3674 	     ((adev->flags & AMD_IS_APU) && (gc_ver < IP_VERSION(9, 3, 0)))) &&
3675 	    (attr == &sensor_dev_attr_power1_average.dev_attr.attr))
3676 		return 0;
3677 
3678 	/* not all products support both average and instantaneous */
3679 	if (attr == &sensor_dev_attr_power1_average.dev_attr.attr &&
3680 	    amdgpu_hwmon_get_sensor_generic(adev, AMDGPU_PP_SENSOR_GPU_AVG_POWER, (void *)&tmp) == -EOPNOTSUPP)
3681 		return 0;
3682 	if (attr == &sensor_dev_attr_power1_input.dev_attr.attr &&
3683 	    amdgpu_hwmon_get_sensor_generic(adev, AMDGPU_PP_SENSOR_GPU_INPUT_POWER, (void *)&tmp) == -EOPNOTSUPP)
3684 		return 0;
3685 
3686 	/* hide max/min values if we can't both query and manage the fan */
3687 	if (((amdgpu_dpm_set_fan_speed_pwm(adev, U32_MAX) == -EOPNOTSUPP) &&
3688 	      (amdgpu_dpm_get_fan_speed_pwm(adev, NULL) == -EOPNOTSUPP) &&
3689 	      (amdgpu_dpm_set_fan_speed_rpm(adev, U32_MAX) == -EOPNOTSUPP) &&
3690 	      (amdgpu_dpm_get_fan_speed_rpm(adev, NULL) == -EOPNOTSUPP)) &&
3691 	    (attr == &sensor_dev_attr_pwm1_max.dev_attr.attr ||
3692 	     attr == &sensor_dev_attr_pwm1_min.dev_attr.attr))
3693 		return 0;
3694 
3695 	if ((amdgpu_dpm_set_fan_speed_rpm(adev, U32_MAX) == -EOPNOTSUPP) &&
3696 	     (amdgpu_dpm_get_fan_speed_rpm(adev, NULL) == -EOPNOTSUPP) &&
3697 	     (attr == &sensor_dev_attr_fan1_max.dev_attr.attr ||
3698 	     attr == &sensor_dev_attr_fan1_min.dev_attr.attr))
3699 		return 0;
3700 
3701 	if ((adev->family == AMDGPU_FAMILY_SI ||	/* not implemented yet */
3702 	     adev->family == AMDGPU_FAMILY_KV ||	/* not implemented yet */
3703 	     (gc_ver == IP_VERSION(9, 4, 3) ||
3704 	      gc_ver == IP_VERSION(9, 4, 4))) &&
3705 	    (attr == &sensor_dev_attr_in0_input.dev_attr.attr ||
3706 	     attr == &sensor_dev_attr_in0_label.dev_attr.attr))
3707 		return 0;
3708 
3709 	/* only APUs other than gc 9,4,3 have vddnb */
3710 	if ((!(adev->flags & AMD_IS_APU) ||
3711 	     (gc_ver == IP_VERSION(9, 4, 3) ||
3712 	      gc_ver == IP_VERSION(9, 4, 4))) &&
3713 	    (attr == &sensor_dev_attr_in1_input.dev_attr.attr ||
3714 	     attr == &sensor_dev_attr_in1_label.dev_attr.attr))
3715 		return 0;
3716 
3717 	/* no mclk on APUs other than gc 9,4,3*/
3718 	if (((adev->flags & AMD_IS_APU) && (gc_ver != IP_VERSION(9, 4, 3))) &&
3719 	    (attr == &sensor_dev_attr_freq2_input.dev_attr.attr ||
3720 	     attr == &sensor_dev_attr_freq2_label.dev_attr.attr))
3721 		return 0;
3722 
3723 	if (((adev->flags & AMD_IS_APU) || gc_ver < IP_VERSION(9, 0, 0)) &&
3724 	    (gc_ver != IP_VERSION(9, 4, 3) && gc_ver != IP_VERSION(9, 4, 4)) &&
3725 	    (attr == &sensor_dev_attr_temp2_input.dev_attr.attr ||
3726 	     attr == &sensor_dev_attr_temp2_label.dev_attr.attr ||
3727 	     attr == &sensor_dev_attr_temp2_crit.dev_attr.attr ||
3728 	     attr == &sensor_dev_attr_temp3_input.dev_attr.attr ||
3729 	     attr == &sensor_dev_attr_temp3_label.dev_attr.attr ||
3730 	     attr == &sensor_dev_attr_temp3_crit.dev_attr.attr))
3731 		return 0;
3732 
3733 	/* hotspot temperature for gc 9,4,3*/
3734 	if (gc_ver == IP_VERSION(9, 4, 3) ||
3735 	    gc_ver == IP_VERSION(9, 4, 4)) {
3736 		if (attr == &sensor_dev_attr_temp1_input.dev_attr.attr ||
3737 		    attr == &sensor_dev_attr_temp1_emergency.dev_attr.attr ||
3738 		    attr == &sensor_dev_attr_temp1_label.dev_attr.attr)
3739 			return 0;
3740 
3741 		if (attr == &sensor_dev_attr_temp2_emergency.dev_attr.attr ||
3742 		    attr == &sensor_dev_attr_temp3_emergency.dev_attr.attr)
3743 			return attr->mode;
3744 	}
3745 
3746 	/* only SOC15 dGPUs support hotspot and mem temperatures */
3747 	if (((adev->flags & AMD_IS_APU) || gc_ver < IP_VERSION(9, 0, 0)) &&
3748 	    (attr == &sensor_dev_attr_temp2_crit_hyst.dev_attr.attr ||
3749 	     attr == &sensor_dev_attr_temp3_crit_hyst.dev_attr.attr ||
3750 	     attr == &sensor_dev_attr_temp1_emergency.dev_attr.attr ||
3751 	     attr == &sensor_dev_attr_temp2_emergency.dev_attr.attr ||
3752 	     attr == &sensor_dev_attr_temp3_emergency.dev_attr.attr))
3753 		return 0;
3754 
3755 	/* only Vangogh has fast PPT limit and power labels */
3756 	if (!(gc_ver == IP_VERSION(10, 3, 1)) &&
3757 	    (attr == &sensor_dev_attr_power2_average.dev_attr.attr ||
3758 	     attr == &sensor_dev_attr_power2_cap_max.dev_attr.attr ||
3759 	     attr == &sensor_dev_attr_power2_cap_min.dev_attr.attr ||
3760 	     attr == &sensor_dev_attr_power2_cap.dev_attr.attr ||
3761 	     attr == &sensor_dev_attr_power2_cap_default.dev_attr.attr ||
3762 	     attr == &sensor_dev_attr_power2_label.dev_attr.attr))
3763 		return 0;
3764 
3765 	return effective_mode;
3766 }
3767 
3768 static const struct attribute_group hwmon_attrgroup = {
3769 	.attrs = hwmon_attributes,
3770 	.is_visible = hwmon_attributes_visible,
3771 };
3772 
3773 static const struct attribute_group *hwmon_groups[] = {
3774 	&hwmon_attrgroup,
3775 	NULL
3776 };
3777 
3778 static int amdgpu_retrieve_od_settings(struct amdgpu_device *adev,
3779 				       enum pp_clock_type od_type,
3780 				       char *buf)
3781 {
3782 	int size = 0;
3783 	int ret;
3784 
3785 	if (amdgpu_in_reset(adev))
3786 		return -EPERM;
3787 	if (adev->in_suspend && !adev->in_runpm)
3788 		return -EPERM;
3789 
3790 	ret = pm_runtime_get_sync(adev->dev);
3791 	if (ret < 0) {
3792 		pm_runtime_put_autosuspend(adev->dev);
3793 		return ret;
3794 	}
3795 
3796 	size = amdgpu_dpm_print_clock_levels(adev, od_type, buf);
3797 	if (size == 0)
3798 		size = sysfs_emit(buf, "\n");
3799 
3800 	pm_runtime_mark_last_busy(adev->dev);
3801 	pm_runtime_put_autosuspend(adev->dev);
3802 
3803 	return size;
3804 }
3805 
3806 static int parse_input_od_command_lines(const char *buf,
3807 					size_t count,
3808 					u32 *type,
3809 					long *params,
3810 					uint32_t *num_of_params)
3811 {
3812 	const char delimiter[3] = {' ', '\n', '\0'};
3813 	uint32_t parameter_size = 0;
3814 	char buf_cpy[128] = {0};
3815 	char *tmp_str, *sub_str;
3816 	int ret;
3817 
3818 	if (count > sizeof(buf_cpy) - 1)
3819 		return -EINVAL;
3820 
3821 	memcpy(buf_cpy, buf, count);
3822 	tmp_str = buf_cpy;
3823 
3824 	/* skip heading spaces */
3825 	while (isspace(*tmp_str))
3826 		tmp_str++;
3827 
3828 	switch (*tmp_str) {
3829 	case 'c':
3830 		*type = PP_OD_COMMIT_DPM_TABLE;
3831 		return 0;
3832 	case 'r':
3833 		params[parameter_size] = *type;
3834 		*num_of_params = 1;
3835 		*type = PP_OD_RESTORE_DEFAULT_TABLE;
3836 		return 0;
3837 	default:
3838 		break;
3839 	}
3840 
3841 	while ((sub_str = strsep(&tmp_str, delimiter)) != NULL) {
3842 		if (strlen(sub_str) == 0)
3843 			continue;
3844 
3845 		ret = kstrtol(sub_str, 0, &params[parameter_size]);
3846 		if (ret)
3847 			return -EINVAL;
3848 		parameter_size++;
3849 
3850 		while (isspace(*tmp_str))
3851 			tmp_str++;
3852 	}
3853 
3854 	*num_of_params = parameter_size;
3855 
3856 	return 0;
3857 }
3858 
3859 static int
3860 amdgpu_distribute_custom_od_settings(struct amdgpu_device *adev,
3861 				     enum PP_OD_DPM_TABLE_COMMAND cmd_type,
3862 				     const char *in_buf,
3863 				     size_t count)
3864 {
3865 	uint32_t parameter_size = 0;
3866 	long parameter[64];
3867 	int ret;
3868 
3869 	if (amdgpu_in_reset(adev))
3870 		return -EPERM;
3871 	if (adev->in_suspend && !adev->in_runpm)
3872 		return -EPERM;
3873 
3874 	ret = parse_input_od_command_lines(in_buf,
3875 					   count,
3876 					   &cmd_type,
3877 					   parameter,
3878 					   &parameter_size);
3879 	if (ret)
3880 		return ret;
3881 
3882 	ret = pm_runtime_get_sync(adev->dev);
3883 	if (ret < 0)
3884 		goto err_out0;
3885 
3886 	ret = amdgpu_dpm_odn_edit_dpm_table(adev,
3887 					    cmd_type,
3888 					    parameter,
3889 					    parameter_size);
3890 	if (ret)
3891 		goto err_out1;
3892 
3893 	if (cmd_type == PP_OD_COMMIT_DPM_TABLE) {
3894 		ret = amdgpu_dpm_dispatch_task(adev,
3895 					       AMD_PP_TASK_READJUST_POWER_STATE,
3896 					       NULL);
3897 		if (ret)
3898 			goto err_out1;
3899 	}
3900 
3901 	pm_runtime_mark_last_busy(adev->dev);
3902 	pm_runtime_put_autosuspend(adev->dev);
3903 
3904 	return count;
3905 
3906 err_out1:
3907 	pm_runtime_mark_last_busy(adev->dev);
3908 err_out0:
3909 	pm_runtime_put_autosuspend(adev->dev);
3910 
3911 	return ret;
3912 }
3913 
3914 /**
3915  * DOC: fan_curve
3916  *
3917  * The amdgpu driver provides a sysfs API for checking and adjusting the fan
3918  * control curve line.
3919  *
3920  * Reading back the file shows you the current settings(temperature in Celsius
3921  * degree and fan speed in pwm) applied to every anchor point of the curve line
3922  * and their permitted ranges if changable.
3923  *
3924  * Writing a desired string(with the format like "anchor_point_index temperature
3925  * fan_speed_in_pwm") to the file, change the settings for the specific anchor
3926  * point accordingly.
3927  *
3928  * When you have finished the editing, write "c" (commit) to the file to commit
3929  * your changes.
3930  *
3931  * If you want to reset to the default value, write "r" (reset) to the file to
3932  * reset them
3933  *
3934  * There are two fan control modes supported: auto and manual. With auto mode,
3935  * PMFW handles the fan speed control(how fan speed reacts to ASIC temperature).
3936  * While with manual mode, users can set their own fan curve line as what
3937  * described here. Normally the ASIC is booted up with auto mode. Any
3938  * settings via this interface will switch the fan control to manual mode
3939  * implicitly.
3940  */
3941 static ssize_t fan_curve_show(struct kobject *kobj,
3942 			      struct kobj_attribute *attr,
3943 			      char *buf)
3944 {
3945 	struct od_kobj *container = container_of(kobj, struct od_kobj, kobj);
3946 	struct amdgpu_device *adev = (struct amdgpu_device *)container->priv;
3947 
3948 	return (ssize_t)amdgpu_retrieve_od_settings(adev, OD_FAN_CURVE, buf);
3949 }
3950 
3951 static ssize_t fan_curve_store(struct kobject *kobj,
3952 			       struct kobj_attribute *attr,
3953 			       const char *buf,
3954 			       size_t count)
3955 {
3956 	struct od_kobj *container = container_of(kobj, struct od_kobj, kobj);
3957 	struct amdgpu_device *adev = (struct amdgpu_device *)container->priv;
3958 
3959 	return (ssize_t)amdgpu_distribute_custom_od_settings(adev,
3960 							     PP_OD_EDIT_FAN_CURVE,
3961 							     buf,
3962 							     count);
3963 }
3964 
3965 static umode_t fan_curve_visible(struct amdgpu_device *adev)
3966 {
3967 	umode_t umode = 0000;
3968 
3969 	if (adev->pm.od_feature_mask & OD_OPS_SUPPORT_FAN_CURVE_RETRIEVE)
3970 		umode |= S_IRUSR | S_IRGRP | S_IROTH;
3971 
3972 	if (adev->pm.od_feature_mask & OD_OPS_SUPPORT_FAN_CURVE_SET)
3973 		umode |= S_IWUSR;
3974 
3975 	return umode;
3976 }
3977 
3978 /**
3979  * DOC: acoustic_limit_rpm_threshold
3980  *
3981  * The amdgpu driver provides a sysfs API for checking and adjusting the
3982  * acoustic limit in RPM for fan control.
3983  *
3984  * Reading back the file shows you the current setting and the permitted
3985  * ranges if changable.
3986  *
3987  * Writing an integer to the file, change the setting accordingly.
3988  *
3989  * When you have finished the editing, write "c" (commit) to the file to commit
3990  * your changes.
3991  *
3992  * If you want to reset to the default value, write "r" (reset) to the file to
3993  * reset them
3994  *
3995  * This setting works under auto fan control mode only. It adjusts the PMFW's
3996  * behavior about the maximum speed in RPM the fan can spin. Setting via this
3997  * interface will switch the fan control to auto mode implicitly.
3998  */
3999 static ssize_t acoustic_limit_threshold_show(struct kobject *kobj,
4000 					     struct kobj_attribute *attr,
4001 					     char *buf)
4002 {
4003 	struct od_kobj *container = container_of(kobj, struct od_kobj, kobj);
4004 	struct amdgpu_device *adev = (struct amdgpu_device *)container->priv;
4005 
4006 	return (ssize_t)amdgpu_retrieve_od_settings(adev, OD_ACOUSTIC_LIMIT, buf);
4007 }
4008 
4009 static ssize_t acoustic_limit_threshold_store(struct kobject *kobj,
4010 					      struct kobj_attribute *attr,
4011 					      const char *buf,
4012 					      size_t count)
4013 {
4014 	struct od_kobj *container = container_of(kobj, struct od_kobj, kobj);
4015 	struct amdgpu_device *adev = (struct amdgpu_device *)container->priv;
4016 
4017 	return (ssize_t)amdgpu_distribute_custom_od_settings(adev,
4018 							     PP_OD_EDIT_ACOUSTIC_LIMIT,
4019 							     buf,
4020 							     count);
4021 }
4022 
4023 static umode_t acoustic_limit_threshold_visible(struct amdgpu_device *adev)
4024 {
4025 	umode_t umode = 0000;
4026 
4027 	if (adev->pm.od_feature_mask & OD_OPS_SUPPORT_ACOUSTIC_LIMIT_THRESHOLD_RETRIEVE)
4028 		umode |= S_IRUSR | S_IRGRP | S_IROTH;
4029 
4030 	if (adev->pm.od_feature_mask & OD_OPS_SUPPORT_ACOUSTIC_LIMIT_THRESHOLD_SET)
4031 		umode |= S_IWUSR;
4032 
4033 	return umode;
4034 }
4035 
4036 /**
4037  * DOC: acoustic_target_rpm_threshold
4038  *
4039  * The amdgpu driver provides a sysfs API for checking and adjusting the
4040  * acoustic target in RPM for fan control.
4041  *
4042  * Reading back the file shows you the current setting and the permitted
4043  * ranges if changable.
4044  *
4045  * Writing an integer to the file, change the setting accordingly.
4046  *
4047  * When you have finished the editing, write "c" (commit) to the file to commit
4048  * your changes.
4049  *
4050  * If you want to reset to the default value, write "r" (reset) to the file to
4051  * reset them
4052  *
4053  * This setting works under auto fan control mode only. It can co-exist with
4054  * other settings which can work also under auto mode. It adjusts the PMFW's
4055  * behavior about the maximum speed in RPM the fan can spin when ASIC
4056  * temperature is not greater than target temperature. Setting via this
4057  * interface will switch the fan control to auto mode implicitly.
4058  */
4059 static ssize_t acoustic_target_threshold_show(struct kobject *kobj,
4060 					      struct kobj_attribute *attr,
4061 					      char *buf)
4062 {
4063 	struct od_kobj *container = container_of(kobj, struct od_kobj, kobj);
4064 	struct amdgpu_device *adev = (struct amdgpu_device *)container->priv;
4065 
4066 	return (ssize_t)amdgpu_retrieve_od_settings(adev, OD_ACOUSTIC_TARGET, buf);
4067 }
4068 
4069 static ssize_t acoustic_target_threshold_store(struct kobject *kobj,
4070 					       struct kobj_attribute *attr,
4071 					       const char *buf,
4072 					       size_t count)
4073 {
4074 	struct od_kobj *container = container_of(kobj, struct od_kobj, kobj);
4075 	struct amdgpu_device *adev = (struct amdgpu_device *)container->priv;
4076 
4077 	return (ssize_t)amdgpu_distribute_custom_od_settings(adev,
4078 							     PP_OD_EDIT_ACOUSTIC_TARGET,
4079 							     buf,
4080 							     count);
4081 }
4082 
4083 static umode_t acoustic_target_threshold_visible(struct amdgpu_device *adev)
4084 {
4085 	umode_t umode = 0000;
4086 
4087 	if (adev->pm.od_feature_mask & OD_OPS_SUPPORT_ACOUSTIC_TARGET_THRESHOLD_RETRIEVE)
4088 		umode |= S_IRUSR | S_IRGRP | S_IROTH;
4089 
4090 	if (adev->pm.od_feature_mask & OD_OPS_SUPPORT_ACOUSTIC_TARGET_THRESHOLD_SET)
4091 		umode |= S_IWUSR;
4092 
4093 	return umode;
4094 }
4095 
4096 /**
4097  * DOC: fan_target_temperature
4098  *
4099  * The amdgpu driver provides a sysfs API for checking and adjusting the
4100  * target tempeature in Celsius degree for fan control.
4101  *
4102  * Reading back the file shows you the current setting and the permitted
4103  * ranges if changable.
4104  *
4105  * Writing an integer to the file, change the setting accordingly.
4106  *
4107  * When you have finished the editing, write "c" (commit) to the file to commit
4108  * your changes.
4109  *
4110  * If you want to reset to the default value, write "r" (reset) to the file to
4111  * reset them
4112  *
4113  * This setting works under auto fan control mode only. It can co-exist with
4114  * other settings which can work also under auto mode. Paring with the
4115  * acoustic_target_rpm_threshold setting, they define the maximum speed in
4116  * RPM the fan can spin when ASIC temperature is not greater than target
4117  * temperature. Setting via this interface will switch the fan control to
4118  * auto mode implicitly.
4119  */
4120 static ssize_t fan_target_temperature_show(struct kobject *kobj,
4121 					   struct kobj_attribute *attr,
4122 					   char *buf)
4123 {
4124 	struct od_kobj *container = container_of(kobj, struct od_kobj, kobj);
4125 	struct amdgpu_device *adev = (struct amdgpu_device *)container->priv;
4126 
4127 	return (ssize_t)amdgpu_retrieve_od_settings(adev, OD_FAN_TARGET_TEMPERATURE, buf);
4128 }
4129 
4130 static ssize_t fan_target_temperature_store(struct kobject *kobj,
4131 					    struct kobj_attribute *attr,
4132 					    const char *buf,
4133 					    size_t count)
4134 {
4135 	struct od_kobj *container = container_of(kobj, struct od_kobj, kobj);
4136 	struct amdgpu_device *adev = (struct amdgpu_device *)container->priv;
4137 
4138 	return (ssize_t)amdgpu_distribute_custom_od_settings(adev,
4139 							     PP_OD_EDIT_FAN_TARGET_TEMPERATURE,
4140 							     buf,
4141 							     count);
4142 }
4143 
4144 static umode_t fan_target_temperature_visible(struct amdgpu_device *adev)
4145 {
4146 	umode_t umode = 0000;
4147 
4148 	if (adev->pm.od_feature_mask & OD_OPS_SUPPORT_FAN_TARGET_TEMPERATURE_RETRIEVE)
4149 		umode |= S_IRUSR | S_IRGRP | S_IROTH;
4150 
4151 	if (adev->pm.od_feature_mask & OD_OPS_SUPPORT_FAN_TARGET_TEMPERATURE_SET)
4152 		umode |= S_IWUSR;
4153 
4154 	return umode;
4155 }
4156 
4157 /**
4158  * DOC: fan_minimum_pwm
4159  *
4160  * The amdgpu driver provides a sysfs API for checking and adjusting the
4161  * minimum fan speed in PWM.
4162  *
4163  * Reading back the file shows you the current setting and the permitted
4164  * ranges if changable.
4165  *
4166  * Writing an integer to the file, change the setting accordingly.
4167  *
4168  * When you have finished the editing, write "c" (commit) to the file to commit
4169  * your changes.
4170  *
4171  * If you want to reset to the default value, write "r" (reset) to the file to
4172  * reset them
4173  *
4174  * This setting works under auto fan control mode only. It can co-exist with
4175  * other settings which can work also under auto mode. It adjusts the PMFW's
4176  * behavior about the minimum fan speed in PWM the fan should spin. Setting
4177  * via this interface will switch the fan control to auto mode implicitly.
4178  */
4179 static ssize_t fan_minimum_pwm_show(struct kobject *kobj,
4180 				    struct kobj_attribute *attr,
4181 				    char *buf)
4182 {
4183 	struct od_kobj *container = container_of(kobj, struct od_kobj, kobj);
4184 	struct amdgpu_device *adev = (struct amdgpu_device *)container->priv;
4185 
4186 	return (ssize_t)amdgpu_retrieve_od_settings(adev, OD_FAN_MINIMUM_PWM, buf);
4187 }
4188 
4189 static ssize_t fan_minimum_pwm_store(struct kobject *kobj,
4190 				     struct kobj_attribute *attr,
4191 				     const char *buf,
4192 				     size_t count)
4193 {
4194 	struct od_kobj *container = container_of(kobj, struct od_kobj, kobj);
4195 	struct amdgpu_device *adev = (struct amdgpu_device *)container->priv;
4196 
4197 	return (ssize_t)amdgpu_distribute_custom_od_settings(adev,
4198 							     PP_OD_EDIT_FAN_MINIMUM_PWM,
4199 							     buf,
4200 							     count);
4201 }
4202 
4203 static umode_t fan_minimum_pwm_visible(struct amdgpu_device *adev)
4204 {
4205 	umode_t umode = 0000;
4206 
4207 	if (adev->pm.od_feature_mask & OD_OPS_SUPPORT_FAN_MINIMUM_PWM_RETRIEVE)
4208 		umode |= S_IRUSR | S_IRGRP | S_IROTH;
4209 
4210 	if (adev->pm.od_feature_mask & OD_OPS_SUPPORT_FAN_MINIMUM_PWM_SET)
4211 		umode |= S_IWUSR;
4212 
4213 	return umode;
4214 }
4215 
4216 static struct od_feature_set amdgpu_od_set = {
4217 	.containers = {
4218 		[0] = {
4219 			.name = "fan_ctrl",
4220 			.sub_feature = {
4221 				[0] = {
4222 					.name = "fan_curve",
4223 					.ops = {
4224 						.is_visible = fan_curve_visible,
4225 						.show = fan_curve_show,
4226 						.store = fan_curve_store,
4227 					},
4228 				},
4229 				[1] = {
4230 					.name = "acoustic_limit_rpm_threshold",
4231 					.ops = {
4232 						.is_visible = acoustic_limit_threshold_visible,
4233 						.show = acoustic_limit_threshold_show,
4234 						.store = acoustic_limit_threshold_store,
4235 					},
4236 				},
4237 				[2] = {
4238 					.name = "acoustic_target_rpm_threshold",
4239 					.ops = {
4240 						.is_visible = acoustic_target_threshold_visible,
4241 						.show = acoustic_target_threshold_show,
4242 						.store = acoustic_target_threshold_store,
4243 					},
4244 				},
4245 				[3] = {
4246 					.name = "fan_target_temperature",
4247 					.ops = {
4248 						.is_visible = fan_target_temperature_visible,
4249 						.show = fan_target_temperature_show,
4250 						.store = fan_target_temperature_store,
4251 					},
4252 				},
4253 				[4] = {
4254 					.name = "fan_minimum_pwm",
4255 					.ops = {
4256 						.is_visible = fan_minimum_pwm_visible,
4257 						.show = fan_minimum_pwm_show,
4258 						.store = fan_minimum_pwm_store,
4259 					},
4260 				},
4261 			},
4262 		},
4263 	},
4264 };
4265 
4266 static void od_kobj_release(struct kobject *kobj)
4267 {
4268 	struct od_kobj *od_kobj = container_of(kobj, struct od_kobj, kobj);
4269 
4270 	kfree(od_kobj);
4271 }
4272 
4273 static const struct kobj_type od_ktype = {
4274 	.release	= od_kobj_release,
4275 	.sysfs_ops	= &kobj_sysfs_ops,
4276 };
4277 
4278 static void amdgpu_od_set_fini(struct amdgpu_device *adev)
4279 {
4280 	struct od_kobj *container, *container_next;
4281 	struct od_attribute *attribute, *attribute_next;
4282 
4283 	if (list_empty(&adev->pm.od_kobj_list))
4284 		return;
4285 
4286 	list_for_each_entry_safe(container, container_next,
4287 				 &adev->pm.od_kobj_list, entry) {
4288 		list_del(&container->entry);
4289 
4290 		list_for_each_entry_safe(attribute, attribute_next,
4291 					 &container->attribute, entry) {
4292 			list_del(&attribute->entry);
4293 			sysfs_remove_file(&container->kobj,
4294 					  &attribute->attribute.attr);
4295 			kfree(attribute);
4296 		}
4297 
4298 		kobject_put(&container->kobj);
4299 	}
4300 }
4301 
4302 static bool amdgpu_is_od_feature_supported(struct amdgpu_device *adev,
4303 					   struct od_feature_ops *feature_ops)
4304 {
4305 	umode_t mode;
4306 
4307 	if (!feature_ops->is_visible)
4308 		return false;
4309 
4310 	/*
4311 	 * If the feature has no user read and write mode set,
4312 	 * we can assume the feature is actually not supported.(?)
4313 	 * And the revelant sysfs interface should not be exposed.
4314 	 */
4315 	mode = feature_ops->is_visible(adev);
4316 	if (mode & (S_IRUSR | S_IWUSR))
4317 		return true;
4318 
4319 	return false;
4320 }
4321 
4322 static bool amdgpu_od_is_self_contained(struct amdgpu_device *adev,
4323 					struct od_feature_container *container)
4324 {
4325 	int i;
4326 
4327 	/*
4328 	 * If there is no valid entry within the container, the container
4329 	 * is recognized as a self contained container. And the valid entry
4330 	 * here means it has a valid naming and it is visible/supported by
4331 	 * the ASIC.
4332 	 */
4333 	for (i = 0; i < ARRAY_SIZE(container->sub_feature); i++) {
4334 		if (container->sub_feature[i].name &&
4335 		    amdgpu_is_od_feature_supported(adev,
4336 			&container->sub_feature[i].ops))
4337 			return false;
4338 	}
4339 
4340 	return true;
4341 }
4342 
4343 static int amdgpu_od_set_init(struct amdgpu_device *adev)
4344 {
4345 	struct od_kobj *top_set, *sub_set;
4346 	struct od_attribute *attribute;
4347 	struct od_feature_container *container;
4348 	struct od_feature_item *feature;
4349 	int i, j;
4350 	int ret;
4351 
4352 	/* Setup the top `gpu_od` directory which holds all other OD interfaces */
4353 	top_set = kzalloc(sizeof(*top_set), GFP_KERNEL);
4354 	if (!top_set)
4355 		return -ENOMEM;
4356 	list_add(&top_set->entry, &adev->pm.od_kobj_list);
4357 
4358 	ret = kobject_init_and_add(&top_set->kobj,
4359 				   &od_ktype,
4360 				   &adev->dev->kobj,
4361 				   "%s",
4362 				   "gpu_od");
4363 	if (ret)
4364 		goto err_out;
4365 	INIT_LIST_HEAD(&top_set->attribute);
4366 	top_set->priv = adev;
4367 
4368 	for (i = 0; i < ARRAY_SIZE(amdgpu_od_set.containers); i++) {
4369 		container = &amdgpu_od_set.containers[i];
4370 
4371 		if (!container->name)
4372 			continue;
4373 
4374 		/*
4375 		 * If there is valid entries within the container, the container
4376 		 * will be presented as a sub directory and all its holding entries
4377 		 * will be presented as plain files under it.
4378 		 * While if there is no valid entry within the container, the container
4379 		 * itself will be presented as a plain file under top `gpu_od` directory.
4380 		 */
4381 		if (amdgpu_od_is_self_contained(adev, container)) {
4382 			if (!amdgpu_is_od_feature_supported(adev,
4383 			     &container->ops))
4384 				continue;
4385 
4386 			/*
4387 			 * The container is presented as a plain file under top `gpu_od`
4388 			 * directory.
4389 			 */
4390 			attribute = kzalloc(sizeof(*attribute), GFP_KERNEL);
4391 			if (!attribute) {
4392 				ret = -ENOMEM;
4393 				goto err_out;
4394 			}
4395 			list_add(&attribute->entry, &top_set->attribute);
4396 
4397 			attribute->attribute.attr.mode =
4398 					container->ops.is_visible(adev);
4399 			attribute->attribute.attr.name = container->name;
4400 			attribute->attribute.show =
4401 					container->ops.show;
4402 			attribute->attribute.store =
4403 					container->ops.store;
4404 			ret = sysfs_create_file(&top_set->kobj,
4405 						&attribute->attribute.attr);
4406 			if (ret)
4407 				goto err_out;
4408 		} else {
4409 			/* The container is presented as a sub directory. */
4410 			sub_set = kzalloc(sizeof(*sub_set), GFP_KERNEL);
4411 			if (!sub_set) {
4412 				ret = -ENOMEM;
4413 				goto err_out;
4414 			}
4415 			list_add(&sub_set->entry, &adev->pm.od_kobj_list);
4416 
4417 			ret = kobject_init_and_add(&sub_set->kobj,
4418 						   &od_ktype,
4419 						   &top_set->kobj,
4420 						   "%s",
4421 						   container->name);
4422 			if (ret)
4423 				goto err_out;
4424 			INIT_LIST_HEAD(&sub_set->attribute);
4425 			sub_set->priv = adev;
4426 
4427 			for (j = 0; j < ARRAY_SIZE(container->sub_feature); j++) {
4428 				feature = &container->sub_feature[j];
4429 				if (!feature->name)
4430 					continue;
4431 
4432 				if (!amdgpu_is_od_feature_supported(adev,
4433 				     &feature->ops))
4434 					continue;
4435 
4436 				/*
4437 				 * With the container presented as a sub directory, the entry within
4438 				 * it is presented as a plain file under the sub directory.
4439 				 */
4440 				attribute = kzalloc(sizeof(*attribute), GFP_KERNEL);
4441 				if (!attribute) {
4442 					ret = -ENOMEM;
4443 					goto err_out;
4444 				}
4445 				list_add(&attribute->entry, &sub_set->attribute);
4446 
4447 				attribute->attribute.attr.mode =
4448 						feature->ops.is_visible(adev);
4449 				attribute->attribute.attr.name = feature->name;
4450 				attribute->attribute.show =
4451 						feature->ops.show;
4452 				attribute->attribute.store =
4453 						feature->ops.store;
4454 				ret = sysfs_create_file(&sub_set->kobj,
4455 							&attribute->attribute.attr);
4456 				if (ret)
4457 					goto err_out;
4458 			}
4459 		}
4460 	}
4461 
4462 	/*
4463 	 * If gpu_od is the only member in the list, that means gpu_od is an
4464 	 * empty directory, so remove it.
4465 	 */
4466 	if (list_is_singular(&adev->pm.od_kobj_list))
4467 		goto err_out;
4468 
4469 	return 0;
4470 
4471 err_out:
4472 	amdgpu_od_set_fini(adev);
4473 
4474 	return ret;
4475 }
4476 
4477 int amdgpu_pm_sysfs_init(struct amdgpu_device *adev)
4478 {
4479 	enum amdgpu_sriov_vf_mode mode;
4480 	uint32_t mask = 0;
4481 	int ret;
4482 
4483 	if (adev->pm.sysfs_initialized)
4484 		return 0;
4485 
4486 	INIT_LIST_HEAD(&adev->pm.pm_attr_list);
4487 
4488 	if (adev->pm.dpm_enabled == 0)
4489 		return 0;
4490 
4491 	mode = amdgpu_virt_get_sriov_vf_mode(adev);
4492 
4493 	/* under multi-vf mode, the hwmon attributes are all not supported */
4494 	if (mode != SRIOV_VF_MODE_MULTI_VF) {
4495 		adev->pm.int_hwmon_dev = hwmon_device_register_with_groups(adev->dev,
4496 									DRIVER_NAME, adev,
4497 									hwmon_groups);
4498 		if (IS_ERR(adev->pm.int_hwmon_dev)) {
4499 			ret = PTR_ERR(adev->pm.int_hwmon_dev);
4500 			dev_err(adev->dev, "Unable to register hwmon device: %d\n", ret);
4501 			return ret;
4502 		}
4503 	}
4504 
4505 	switch (mode) {
4506 	case SRIOV_VF_MODE_ONE_VF:
4507 		mask = ATTR_FLAG_ONEVF;
4508 		break;
4509 	case SRIOV_VF_MODE_MULTI_VF:
4510 		mask = 0;
4511 		break;
4512 	case SRIOV_VF_MODE_BARE_METAL:
4513 	default:
4514 		mask = ATTR_FLAG_MASK_ALL;
4515 		break;
4516 	}
4517 
4518 	ret = amdgpu_device_attr_create_groups(adev,
4519 					       amdgpu_device_attrs,
4520 					       ARRAY_SIZE(amdgpu_device_attrs),
4521 					       mask,
4522 					       &adev->pm.pm_attr_list);
4523 	if (ret)
4524 		goto err_out0;
4525 
4526 	if (amdgpu_dpm_is_overdrive_supported(adev)) {
4527 		ret = amdgpu_od_set_init(adev);
4528 		if (ret)
4529 			goto err_out1;
4530 	} else if (adev->pm.pp_feature & PP_OVERDRIVE_MASK) {
4531 		dev_info(adev->dev, "overdrive feature is not supported\n");
4532 	}
4533 
4534 	if (amdgpu_dpm_get_pm_policy_info(adev, PP_PM_POLICY_NONE, NULL) !=
4535 	    -EOPNOTSUPP) {
4536 		ret = devm_device_add_group(adev->dev,
4537 					    &amdgpu_pm_policy_attr_group);
4538 		if (ret)
4539 			goto err_out0;
4540 	}
4541 
4542 	adev->pm.sysfs_initialized = true;
4543 
4544 	return 0;
4545 
4546 err_out1:
4547 	amdgpu_device_attr_remove_groups(adev, &adev->pm.pm_attr_list);
4548 err_out0:
4549 	if (adev->pm.int_hwmon_dev)
4550 		hwmon_device_unregister(adev->pm.int_hwmon_dev);
4551 
4552 	return ret;
4553 }
4554 
4555 void amdgpu_pm_sysfs_fini(struct amdgpu_device *adev)
4556 {
4557 	amdgpu_od_set_fini(adev);
4558 
4559 	if (adev->pm.int_hwmon_dev)
4560 		hwmon_device_unregister(adev->pm.int_hwmon_dev);
4561 
4562 	amdgpu_device_attr_remove_groups(adev, &adev->pm.pm_attr_list);
4563 }
4564 
4565 /*
4566  * Debugfs info
4567  */
4568 #if defined(CONFIG_DEBUG_FS)
4569 
4570 static void amdgpu_debugfs_prints_cpu_info(struct seq_file *m,
4571 					   struct amdgpu_device *adev)
4572 {
4573 	uint16_t *p_val;
4574 	uint32_t size;
4575 	int i;
4576 	uint32_t num_cpu_cores = amdgpu_dpm_get_num_cpu_cores(adev);
4577 
4578 	if (amdgpu_dpm_is_cclk_dpm_supported(adev)) {
4579 		p_val = kcalloc(num_cpu_cores, sizeof(uint16_t),
4580 				GFP_KERNEL);
4581 
4582 		if (!amdgpu_dpm_read_sensor(adev, AMDGPU_PP_SENSOR_CPU_CLK,
4583 					    (void *)p_val, &size)) {
4584 			for (i = 0; i < num_cpu_cores; i++)
4585 				seq_printf(m, "\t%u MHz (CPU%d)\n",
4586 					   *(p_val + i), i);
4587 		}
4588 
4589 		kfree(p_val);
4590 	}
4591 }
4592 
4593 static int amdgpu_debugfs_pm_info_pp(struct seq_file *m, struct amdgpu_device *adev)
4594 {
4595 	uint32_t mp1_ver = amdgpu_ip_version(adev, MP1_HWIP, 0);
4596 	uint32_t gc_ver = amdgpu_ip_version(adev, GC_HWIP, 0);
4597 	uint32_t value;
4598 	uint64_t value64 = 0;
4599 	uint32_t query = 0;
4600 	int size;
4601 
4602 	/* GPU Clocks */
4603 	size = sizeof(value);
4604 	seq_printf(m, "GFX Clocks and Power:\n");
4605 
4606 	amdgpu_debugfs_prints_cpu_info(m, adev);
4607 
4608 	if (!amdgpu_dpm_read_sensor(adev, AMDGPU_PP_SENSOR_GFX_MCLK, (void *)&value, &size))
4609 		seq_printf(m, "\t%u MHz (MCLK)\n", value/100);
4610 	if (!amdgpu_dpm_read_sensor(adev, AMDGPU_PP_SENSOR_GFX_SCLK, (void *)&value, &size))
4611 		seq_printf(m, "\t%u MHz (SCLK)\n", value/100);
4612 	if (!amdgpu_dpm_read_sensor(adev, AMDGPU_PP_SENSOR_STABLE_PSTATE_SCLK, (void *)&value, &size))
4613 		seq_printf(m, "\t%u MHz (PSTATE_SCLK)\n", value/100);
4614 	if (!amdgpu_dpm_read_sensor(adev, AMDGPU_PP_SENSOR_STABLE_PSTATE_MCLK, (void *)&value, &size))
4615 		seq_printf(m, "\t%u MHz (PSTATE_MCLK)\n", value/100);
4616 	if (!amdgpu_dpm_read_sensor(adev, AMDGPU_PP_SENSOR_VDDGFX, (void *)&value, &size))
4617 		seq_printf(m, "\t%u mV (VDDGFX)\n", value);
4618 	if (!amdgpu_dpm_read_sensor(adev, AMDGPU_PP_SENSOR_VDDNB, (void *)&value, &size))
4619 		seq_printf(m, "\t%u mV (VDDNB)\n", value);
4620 	size = sizeof(uint32_t);
4621 	if (!amdgpu_dpm_read_sensor(adev, AMDGPU_PP_SENSOR_GPU_AVG_POWER, (void *)&query, &size)) {
4622 		if (adev->flags & AMD_IS_APU)
4623 			seq_printf(m, "\t%u.%02u W (average SoC including CPU)\n", query >> 8, query & 0xff);
4624 		else
4625 			seq_printf(m, "\t%u.%02u W (average SoC)\n", query >> 8, query & 0xff);
4626 	}
4627 	size = sizeof(uint32_t);
4628 	if (!amdgpu_dpm_read_sensor(adev, AMDGPU_PP_SENSOR_GPU_INPUT_POWER, (void *)&query, &size)) {
4629 		if (adev->flags & AMD_IS_APU)
4630 			seq_printf(m, "\t%u.%02u W (current SoC including CPU)\n", query >> 8, query & 0xff);
4631 		else
4632 			seq_printf(m, "\t%u.%02u W (current SoC)\n", query >> 8, query & 0xff);
4633 	}
4634 	size = sizeof(value);
4635 	seq_printf(m, "\n");
4636 
4637 	/* GPU Temp */
4638 	if (!amdgpu_dpm_read_sensor(adev, AMDGPU_PP_SENSOR_GPU_TEMP, (void *)&value, &size))
4639 		seq_printf(m, "GPU Temperature: %u C\n", value/1000);
4640 
4641 	/* GPU Load */
4642 	if (!amdgpu_dpm_read_sensor(adev, AMDGPU_PP_SENSOR_GPU_LOAD, (void *)&value, &size))
4643 		seq_printf(m, "GPU Load: %u %%\n", value);
4644 	/* MEM Load */
4645 	if (!amdgpu_dpm_read_sensor(adev, AMDGPU_PP_SENSOR_MEM_LOAD, (void *)&value, &size))
4646 		seq_printf(m, "MEM Load: %u %%\n", value);
4647 	/* VCN Load */
4648 	if (!amdgpu_dpm_read_sensor(adev, AMDGPU_PP_SENSOR_VCN_LOAD, (void *)&value, &size))
4649 		seq_printf(m, "VCN Load: %u %%\n", value);
4650 
4651 	seq_printf(m, "\n");
4652 
4653 	/* SMC feature mask */
4654 	if (!amdgpu_dpm_read_sensor(adev, AMDGPU_PP_SENSOR_ENABLED_SMC_FEATURES_MASK, (void *)&value64, &size))
4655 		seq_printf(m, "SMC Feature Mask: 0x%016llx\n", value64);
4656 
4657 	/* ASICs greater than CHIP_VEGA20 supports these sensors */
4658 	if (gc_ver != IP_VERSION(9, 4, 0) && mp1_ver > IP_VERSION(9, 0, 0)) {
4659 		/* VCN clocks */
4660 		if (!amdgpu_dpm_read_sensor(adev, AMDGPU_PP_SENSOR_VCN_POWER_STATE, (void *)&value, &size)) {
4661 			if (!value) {
4662 				seq_printf(m, "VCN: Powered down\n");
4663 			} else {
4664 				seq_printf(m, "VCN: Powered up\n");
4665 				if (!amdgpu_dpm_read_sensor(adev, AMDGPU_PP_SENSOR_UVD_DCLK, (void *)&value, &size))
4666 					seq_printf(m, "\t%u MHz (DCLK)\n", value/100);
4667 				if (!amdgpu_dpm_read_sensor(adev, AMDGPU_PP_SENSOR_UVD_VCLK, (void *)&value, &size))
4668 					seq_printf(m, "\t%u MHz (VCLK)\n", value/100);
4669 			}
4670 		}
4671 		seq_printf(m, "\n");
4672 	} else {
4673 		/* UVD clocks */
4674 		if (!amdgpu_dpm_read_sensor(adev, AMDGPU_PP_SENSOR_UVD_POWER, (void *)&value, &size)) {
4675 			if (!value) {
4676 				seq_printf(m, "UVD: Powered down\n");
4677 			} else {
4678 				seq_printf(m, "UVD: Powered up\n");
4679 				if (!amdgpu_dpm_read_sensor(adev, AMDGPU_PP_SENSOR_UVD_DCLK, (void *)&value, &size))
4680 					seq_printf(m, "\t%u MHz (DCLK)\n", value/100);
4681 				if (!amdgpu_dpm_read_sensor(adev, AMDGPU_PP_SENSOR_UVD_VCLK, (void *)&value, &size))
4682 					seq_printf(m, "\t%u MHz (VCLK)\n", value/100);
4683 			}
4684 		}
4685 		seq_printf(m, "\n");
4686 
4687 		/* VCE clocks */
4688 		if (!amdgpu_dpm_read_sensor(adev, AMDGPU_PP_SENSOR_VCE_POWER, (void *)&value, &size)) {
4689 			if (!value) {
4690 				seq_printf(m, "VCE: Powered down\n");
4691 			} else {
4692 				seq_printf(m, "VCE: Powered up\n");
4693 				if (!amdgpu_dpm_read_sensor(adev, AMDGPU_PP_SENSOR_VCE_ECCLK, (void *)&value, &size))
4694 					seq_printf(m, "\t%u MHz (ECCLK)\n", value/100);
4695 			}
4696 		}
4697 	}
4698 
4699 	return 0;
4700 }
4701 
4702 static const struct cg_flag_name clocks[] = {
4703 	{AMD_CG_SUPPORT_GFX_FGCG, "Graphics Fine Grain Clock Gating"},
4704 	{AMD_CG_SUPPORT_GFX_MGCG, "Graphics Medium Grain Clock Gating"},
4705 	{AMD_CG_SUPPORT_GFX_MGLS, "Graphics Medium Grain memory Light Sleep"},
4706 	{AMD_CG_SUPPORT_GFX_CGCG, "Graphics Coarse Grain Clock Gating"},
4707 	{AMD_CG_SUPPORT_GFX_CGLS, "Graphics Coarse Grain memory Light Sleep"},
4708 	{AMD_CG_SUPPORT_GFX_CGTS, "Graphics Coarse Grain Tree Shader Clock Gating"},
4709 	{AMD_CG_SUPPORT_GFX_CGTS_LS, "Graphics Coarse Grain Tree Shader Light Sleep"},
4710 	{AMD_CG_SUPPORT_GFX_CP_LS, "Graphics Command Processor Light Sleep"},
4711 	{AMD_CG_SUPPORT_GFX_RLC_LS, "Graphics Run List Controller Light Sleep"},
4712 	{AMD_CG_SUPPORT_GFX_3D_CGCG, "Graphics 3D Coarse Grain Clock Gating"},
4713 	{AMD_CG_SUPPORT_GFX_3D_CGLS, "Graphics 3D Coarse Grain memory Light Sleep"},
4714 	{AMD_CG_SUPPORT_MC_LS, "Memory Controller Light Sleep"},
4715 	{AMD_CG_SUPPORT_MC_MGCG, "Memory Controller Medium Grain Clock Gating"},
4716 	{AMD_CG_SUPPORT_SDMA_LS, "System Direct Memory Access Light Sleep"},
4717 	{AMD_CG_SUPPORT_SDMA_MGCG, "System Direct Memory Access Medium Grain Clock Gating"},
4718 	{AMD_CG_SUPPORT_BIF_MGCG, "Bus Interface Medium Grain Clock Gating"},
4719 	{AMD_CG_SUPPORT_BIF_LS, "Bus Interface Light Sleep"},
4720 	{AMD_CG_SUPPORT_UVD_MGCG, "Unified Video Decoder Medium Grain Clock Gating"},
4721 	{AMD_CG_SUPPORT_VCE_MGCG, "Video Compression Engine Medium Grain Clock Gating"},
4722 	{AMD_CG_SUPPORT_HDP_LS, "Host Data Path Light Sleep"},
4723 	{AMD_CG_SUPPORT_HDP_MGCG, "Host Data Path Medium Grain Clock Gating"},
4724 	{AMD_CG_SUPPORT_DRM_MGCG, "Digital Right Management Medium Grain Clock Gating"},
4725 	{AMD_CG_SUPPORT_DRM_LS, "Digital Right Management Light Sleep"},
4726 	{AMD_CG_SUPPORT_ROM_MGCG, "Rom Medium Grain Clock Gating"},
4727 	{AMD_CG_SUPPORT_DF_MGCG, "Data Fabric Medium Grain Clock Gating"},
4728 	{AMD_CG_SUPPORT_VCN_MGCG, "VCN Medium Grain Clock Gating"},
4729 	{AMD_CG_SUPPORT_HDP_DS, "Host Data Path Deep Sleep"},
4730 	{AMD_CG_SUPPORT_HDP_SD, "Host Data Path Shutdown"},
4731 	{AMD_CG_SUPPORT_IH_CG, "Interrupt Handler Clock Gating"},
4732 	{AMD_CG_SUPPORT_JPEG_MGCG, "JPEG Medium Grain Clock Gating"},
4733 	{AMD_CG_SUPPORT_REPEATER_FGCG, "Repeater Fine Grain Clock Gating"},
4734 	{AMD_CG_SUPPORT_GFX_PERF_CLK, "Perfmon Clock Gating"},
4735 	{AMD_CG_SUPPORT_ATHUB_MGCG, "Address Translation Hub Medium Grain Clock Gating"},
4736 	{AMD_CG_SUPPORT_ATHUB_LS, "Address Translation Hub Light Sleep"},
4737 	{0, NULL},
4738 };
4739 
4740 static void amdgpu_parse_cg_state(struct seq_file *m, u64 flags)
4741 {
4742 	int i;
4743 
4744 	for (i = 0; clocks[i].flag; i++)
4745 		seq_printf(m, "\t%s: %s\n", clocks[i].name,
4746 			   (flags & clocks[i].flag) ? "On" : "Off");
4747 }
4748 
4749 static int amdgpu_debugfs_pm_info_show(struct seq_file *m, void *unused)
4750 {
4751 	struct amdgpu_device *adev = (struct amdgpu_device *)m->private;
4752 	struct drm_device *dev = adev_to_drm(adev);
4753 	u64 flags = 0;
4754 	int r;
4755 
4756 	if (amdgpu_in_reset(adev))
4757 		return -EPERM;
4758 	if (adev->in_suspend && !adev->in_runpm)
4759 		return -EPERM;
4760 
4761 	r = pm_runtime_get_sync(dev->dev);
4762 	if (r < 0) {
4763 		pm_runtime_put_autosuspend(dev->dev);
4764 		return r;
4765 	}
4766 
4767 	if (amdgpu_dpm_debugfs_print_current_performance_level(adev, m)) {
4768 		r = amdgpu_debugfs_pm_info_pp(m, adev);
4769 		if (r)
4770 			goto out;
4771 	}
4772 
4773 	amdgpu_device_ip_get_clockgating_state(adev, &flags);
4774 
4775 	seq_printf(m, "Clock Gating Flags Mask: 0x%llx\n", flags);
4776 	amdgpu_parse_cg_state(m, flags);
4777 	seq_printf(m, "\n");
4778 
4779 out:
4780 	pm_runtime_mark_last_busy(dev->dev);
4781 	pm_runtime_put_autosuspend(dev->dev);
4782 
4783 	return r;
4784 }
4785 
4786 DEFINE_SHOW_ATTRIBUTE(amdgpu_debugfs_pm_info);
4787 
4788 /*
4789  * amdgpu_pm_priv_buffer_read - Read memory region allocated to FW
4790  *
4791  * Reads debug memory region allocated to PMFW
4792  */
4793 static ssize_t amdgpu_pm_prv_buffer_read(struct file *f, char __user *buf,
4794 					 size_t size, loff_t *pos)
4795 {
4796 	struct amdgpu_device *adev = file_inode(f)->i_private;
4797 	size_t smu_prv_buf_size;
4798 	void *smu_prv_buf;
4799 	int ret = 0;
4800 
4801 	if (amdgpu_in_reset(adev))
4802 		return -EPERM;
4803 	if (adev->in_suspend && !adev->in_runpm)
4804 		return -EPERM;
4805 
4806 	ret = amdgpu_dpm_get_smu_prv_buf_details(adev, &smu_prv_buf, &smu_prv_buf_size);
4807 	if (ret)
4808 		return ret;
4809 
4810 	if (!smu_prv_buf || !smu_prv_buf_size)
4811 		return -EINVAL;
4812 
4813 	return simple_read_from_buffer(buf, size, pos, smu_prv_buf,
4814 				       smu_prv_buf_size);
4815 }
4816 
4817 static const struct file_operations amdgpu_debugfs_pm_prv_buffer_fops = {
4818 	.owner = THIS_MODULE,
4819 	.open = simple_open,
4820 	.read = amdgpu_pm_prv_buffer_read,
4821 	.llseek = default_llseek,
4822 };
4823 
4824 #endif
4825 
4826 void amdgpu_debugfs_pm_init(struct amdgpu_device *adev)
4827 {
4828 #if defined(CONFIG_DEBUG_FS)
4829 	struct drm_minor *minor = adev_to_drm(adev)->primary;
4830 	struct dentry *root = minor->debugfs_root;
4831 
4832 	if (!adev->pm.dpm_enabled)
4833 		return;
4834 
4835 	debugfs_create_file("amdgpu_pm_info", 0444, root, adev,
4836 			    &amdgpu_debugfs_pm_info_fops);
4837 
4838 	if (adev->pm.smu_prv_buffer_size > 0)
4839 		debugfs_create_file_size("amdgpu_pm_prv_buffer", 0444, root,
4840 					 adev,
4841 					 &amdgpu_debugfs_pm_prv_buffer_fops,
4842 					 adev->pm.smu_prv_buffer_size);
4843 
4844 	amdgpu_dpm_stb_debug_fs_init(adev);
4845 #endif
4846 }
4847