xref: /linux/drivers/gpu/drm/radeon/ni_dpm.c (revision b7e1e969c887c897947fdc3754fe9b0c24acb155)
1 /*
2  * Copyright 2012 Advanced Micro Devices, Inc.
3  *
4  * Permission is hereby granted, free of charge, to any person obtaining a
5  * copy of this software and associated documentation files (the "Software"),
6  * to deal in the Software without restriction, including without limitation
7  * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8  * and/or sell copies of the Software, and to permit persons to whom the
9  * Software is furnished to do so, subject to the following conditions:
10  *
11  * The above copyright notice and this permission notice shall be included in
12  * all copies or substantial portions of the Software.
13  *
14  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
15  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
16  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
17  * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
18  * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
19  * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
20  * OTHER DEALINGS IN THE SOFTWARE.
21  *
22  */
23 
24 #include <linux/math64.h>
25 #include <linux/pci.h>
26 #include <linux/seq_file.h>
27 
28 #include "atom.h"
29 #include "evergreen.h"
30 #include "ni_dpm.h"
31 #include "nid.h"
32 #include "r600_dpm.h"
33 #include "rv770.h"
34 #include "radeon.h"
35 #include "radeon_asic.h"
36 
/*
 * Four consecutive codes, 0x0a through 0x0d, named F0..F3.  Their users are
 * outside this part of the file; presumably they identify memory-controller
 * arbiter frequency sets -- TODO confirm against the callers.
 */
#define MC_CG_ARB_FREQ_F0           0x0a
#define MC_CG_ARB_FREQ_F1           0x0b
#define MC_CG_ARB_FREQ_F2           0x0c
#define MC_CG_ARB_FREQ_F3           0x0d
41 
/*
 * 0xC000.  Presumably the end offset of SMC RAM, used as an upper bound by
 * SMC accessors -- its users are not visible in this part of the file, confirm.
 */
#define SMC_RAM_END 0xC000
43 
/*
 * CAC weight table for the "cayman_xt" variant.
 *
 * This is a positional initializer: every value is bound to a member of
 * struct ni_cac_weights purely by its position, so the order here must match
 * the struct declaration (which is not part of this file).  Do not reorder,
 * insert or drop entries without checking that declaration.
 */
static const struct ni_cac_weights cac_weights_cayman_xt =
{
	0x15,
	0x2,
	0x19,
	0x2,
	0x8,
	0x14,
	0x2,
	0x16,
	0xE,
	0x17,
	0x13,
	0x2B,
	0x10,
	0x7,
	0x5,
	0x5,
	0x5,
	0x2,
	0x3,
	0x9,
	0x10,
	0x10,
	0x2B,
	0xA,
	0x9,
	0x4,
	0xD,
	0xD,
	0x3E,
	0x18,
	0x14,
	0,
	0x3,
	0x3,
	0x5,
	0,
	0x2,
	0,
	0,
	0,
	0,
	0,
	0,
	0,
	0,
	0,
	0x1CC,
	0,
	0x164,
	1,
	1,
	1,
	1,
	12,
	12,
	12,
	0x12,
	0x1F,
	132,
	5,
	7,
	0,
	{ 0, 0, 0, 0, 0, 0, 0, 0 },
	{ 0, 0, 0, 0 },
	true
};
112 
/*
 * CAC weight table for the "cayman_pro" variant.
 *
 * This is a positional initializer: every value is bound to a member of
 * struct ni_cac_weights purely by its position, so the order here must match
 * the struct declaration (which is not part of this file).  Do not reorder,
 * insert or drop entries without checking that declaration.
 */
static const struct ni_cac_weights cac_weights_cayman_pro =
{
	0x16,
	0x4,
	0x10,
	0x2,
	0xA,
	0x16,
	0x2,
	0x18,
	0x10,
	0x1A,
	0x16,
	0x2D,
	0x12,
	0xA,
	0x6,
	0x6,
	0x6,
	0x2,
	0x4,
	0xB,
	0x11,
	0x11,
	0x2D,
	0xC,
	0xC,
	0x7,
	0x10,
	0x10,
	0x3F,
	0x1A,
	0x16,
	0,
	0x7,
	0x4,
	0x6,
	1,
	0x2,
	0x1,
	0,
	0,
	0,
	0,
	0,
	0,
	0x30,
	0,
	0x1CF,
	0,
	0x166,
	1,
	1,
	1,
	1,
	12,
	12,
	12,
	0x15,
	0x1F,
	132,
	6,
	6,
	0,
	{ 0, 0, 0, 0, 0, 0, 0, 0 },
	{ 0, 0, 0, 0 },
	true
};
181 
/*
 * CAC weight table for the "cayman_le" variant.
 *
 * This is a positional initializer: every value is bound to a member of
 * struct ni_cac_weights purely by its position, so the order here must match
 * the struct declaration (which is not part of this file).  Do not reorder,
 * insert or drop entries without checking that declaration.
 */
static const struct ni_cac_weights cac_weights_cayman_le =
{
	0x7,
	0xE,
	0x1,
	0xA,
	0x1,
	0x3F,
	0x2,
	0x18,
	0x10,
	0x1A,
	0x1,
	0x3F,
	0x1,
	0xE,
	0x6,
	0x6,
	0x6,
	0x2,
	0x4,
	0x9,
	0x1A,
	0x1A,
	0x2C,
	0xA,
	0x11,
	0x8,
	0x19,
	0x19,
	0x1,
	0x1,
	0x1A,
	0,
	0x8,
	0x5,
	0x8,
	0x1,
	0x3,
	0x1,
	0,
	0,
	0,
	0,
	0,
	0,
	0x38,
	0x38,
	0x239,
	0x3,
	0x18A,
	1,
	1,
	1,
	1,
	12,
	12,
	12,
	0x15,
	0x22,
	132,
	6,
	6,
	0,
	{ 0, 0, 0, 0, 0, 0, 0, 0 },
	{ 0, 0, 0, 0 },
	true
};
250 
/* Value 300; not referenced in the visible part of this file -- purpose to be confirmed. */
#define NISLANDS_MGCG_SEQUENCE  300
252 
/*
 * Default CGCG/CGLS programming sequence, handed to
 * btc_program_mgcg_hw_sequence() by ni_cg_clockgating_default().
 *
 * The array is consumed three u32 words at a time (see
 * CAYMAN_CGCG_CGLS_DEFAULT_LENGTH).  Presumably each triplet is
 * { register, value, mask }, as labelled on the cayman_sysls_* tables.
 * Entries come in pairs: a write of a selector (0x10-0x1b, 0x20-0x2b) to
 * 0x8f8 followed by a write of 0 to 0x8fc.
 */
static const u32 cayman_cgcg_cgls_default[] =
{
	0x000008f8, 0x00000010, 0xffffffff,
	0x000008fc, 0x00000000, 0xffffffff,
	0x000008f8, 0x00000011, 0xffffffff,
	0x000008fc, 0x00000000, 0xffffffff,
	0x000008f8, 0x00000012, 0xffffffff,
	0x000008fc, 0x00000000, 0xffffffff,
	0x000008f8, 0x00000013, 0xffffffff,
	0x000008fc, 0x00000000, 0xffffffff,
	0x000008f8, 0x00000014, 0xffffffff,
	0x000008fc, 0x00000000, 0xffffffff,
	0x000008f8, 0x00000015, 0xffffffff,
	0x000008fc, 0x00000000, 0xffffffff,
	0x000008f8, 0x00000016, 0xffffffff,
	0x000008fc, 0x00000000, 0xffffffff,
	0x000008f8, 0x00000017, 0xffffffff,
	0x000008fc, 0x00000000, 0xffffffff,
	0x000008f8, 0x00000018, 0xffffffff,
	0x000008fc, 0x00000000, 0xffffffff,
	0x000008f8, 0x00000019, 0xffffffff,
	0x000008fc, 0x00000000, 0xffffffff,
	0x000008f8, 0x0000001a, 0xffffffff,
	0x000008fc, 0x00000000, 0xffffffff,
	0x000008f8, 0x0000001b, 0xffffffff,
	0x000008fc, 0x00000000, 0xffffffff,
	0x000008f8, 0x00000020, 0xffffffff,
	0x000008fc, 0x00000000, 0xffffffff,
	0x000008f8, 0x00000021, 0xffffffff,
	0x000008fc, 0x00000000, 0xffffffff,
	0x000008f8, 0x00000022, 0xffffffff,
	0x000008fc, 0x00000000, 0xffffffff,
	0x000008f8, 0x00000023, 0xffffffff,
	0x000008fc, 0x00000000, 0xffffffff,
	0x000008f8, 0x00000024, 0xffffffff,
	0x000008fc, 0x00000000, 0xffffffff,
	0x000008f8, 0x00000025, 0xffffffff,
	0x000008fc, 0x00000000, 0xffffffff,
	0x000008f8, 0x00000026, 0xffffffff,
	0x000008fc, 0x00000000, 0xffffffff,
	0x000008f8, 0x00000027, 0xffffffff,
	0x000008fc, 0x00000000, 0xffffffff,
	0x000008f8, 0x00000028, 0xffffffff,
	0x000008fc, 0x00000000, 0xffffffff,
	0x000008f8, 0x00000029, 0xffffffff,
	0x000008fc, 0x00000000, 0xffffffff,
	0x000008f8, 0x0000002a, 0xffffffff,
	0x000008fc, 0x00000000, 0xffffffff,
	0x000008f8, 0x0000002b, 0xffffffff,
	0x000008fc, 0x00000000, 0xffffffff
};
/*
 * Number of three-word entries in cayman_cgcg_cgls_default[].  The expansion
 * is fully parenthesized so it behaves as a single operand in any expression.
 */
#define CAYMAN_CGCG_CGLS_DEFAULT_LENGTH (sizeof(cayman_cgcg_cgls_default) / (3 * sizeof(u32)))
305 
/*
 * CGCG/CGLS "disable" programming sequence, handed to
 * btc_program_mgcg_hw_sequence() by ni_gfx_clockgating_enable(rdev, false).
 *
 * The array is consumed three u32 words at a time (see
 * CAYMAN_CGCG_CGLS_DISABLE_LENGTH).  Presumably each triplet is
 * { register, value, mask }, as labelled on the cayman_sysls_* tables.
 * Selectors 0x10-0x1b get 0xffffffff written through 0x8fc, selectors
 * 0x20-0x2b get 0, and the sequence ends with two masked writes to 0x644.
 */
static const u32 cayman_cgcg_cgls_disable[] =
{
	0x000008f8, 0x00000010, 0xffffffff,
	0x000008fc, 0xffffffff, 0xffffffff,
	0x000008f8, 0x00000011, 0xffffffff,
	0x000008fc, 0xffffffff, 0xffffffff,
	0x000008f8, 0x00000012, 0xffffffff,
	0x000008fc, 0xffffffff, 0xffffffff,
	0x000008f8, 0x00000013, 0xffffffff,
	0x000008fc, 0xffffffff, 0xffffffff,
	0x000008f8, 0x00000014, 0xffffffff,
	0x000008fc, 0xffffffff, 0xffffffff,
	0x000008f8, 0x00000015, 0xffffffff,
	0x000008fc, 0xffffffff, 0xffffffff,
	0x000008f8, 0x00000016, 0xffffffff,
	0x000008fc, 0xffffffff, 0xffffffff,
	0x000008f8, 0x00000017, 0xffffffff,
	0x000008fc, 0xffffffff, 0xffffffff,
	0x000008f8, 0x00000018, 0xffffffff,
	0x000008fc, 0xffffffff, 0xffffffff,
	0x000008f8, 0x00000019, 0xffffffff,
	0x000008fc, 0xffffffff, 0xffffffff,
	0x000008f8, 0x0000001a, 0xffffffff,
	0x000008fc, 0xffffffff, 0xffffffff,
	0x000008f8, 0x0000001b, 0xffffffff,
	0x000008fc, 0xffffffff, 0xffffffff,
	0x000008f8, 0x00000020, 0xffffffff,
	0x000008fc, 0x00000000, 0xffffffff,
	0x000008f8, 0x00000021, 0xffffffff,
	0x000008fc, 0x00000000, 0xffffffff,
	0x000008f8, 0x00000022, 0xffffffff,
	0x000008fc, 0x00000000, 0xffffffff,
	0x000008f8, 0x00000023, 0xffffffff,
	0x000008fc, 0x00000000, 0xffffffff,
	0x000008f8, 0x00000024, 0xffffffff,
	0x000008fc, 0x00000000, 0xffffffff,
	0x000008f8, 0x00000025, 0xffffffff,
	0x000008fc, 0x00000000, 0xffffffff,
	0x000008f8, 0x00000026, 0xffffffff,
	0x000008fc, 0x00000000, 0xffffffff,
	0x000008f8, 0x00000027, 0xffffffff,
	0x000008fc, 0x00000000, 0xffffffff,
	0x000008f8, 0x00000028, 0xffffffff,
	0x000008fc, 0x00000000, 0xffffffff,
	0x000008f8, 0x00000029, 0xffffffff,
	0x000008fc, 0x00000000, 0xffffffff,
	0x000008f8, 0x0000002a, 0xffffffff,
	0x000008fc, 0x00000000, 0xffffffff,
	0x000008f8, 0x0000002b, 0xffffffff,
	0x000008fc, 0x00000000, 0xffffffff,
	0x00000644, 0x000f7902, 0x001f4180,
	0x00000644, 0x000f3802, 0x001f4180
};
/*
 * Number of three-word entries in cayman_cgcg_cgls_disable[].  The expansion
 * is fully parenthesized so it behaves as a single operand in any expression.
 */
#define CAYMAN_CGCG_CGLS_DISABLE_LENGTH (sizeof(cayman_cgcg_cgls_disable) / (3 * sizeof(u32)))
360 
/*
 * CGCG/CGLS "enable" programming sequence, handed to
 * btc_program_mgcg_hw_sequence() by ni_gfx_clockgating_enable(rdev, true).
 *
 * The array is consumed three u32 words at a time (see
 * CAYMAN_CGCG_CGLS_ENABLE_LENGTH).  Presumably each triplet is
 * { register, value, mask }, as labelled on the cayman_sysls_* tables.
 * It starts with one masked write to 0x644; selectors 0x10-0x1b then get 0
 * written through 0x8fc and selectors 0x20-0x2b get 0xffffffff.
 */
static const u32 cayman_cgcg_cgls_enable[] =
{
	0x00000644, 0x000f7882, 0x001f4080,
	0x000008f8, 0x00000010, 0xffffffff,
	0x000008fc, 0x00000000, 0xffffffff,
	0x000008f8, 0x00000011, 0xffffffff,
	0x000008fc, 0x00000000, 0xffffffff,
	0x000008f8, 0x00000012, 0xffffffff,
	0x000008fc, 0x00000000, 0xffffffff,
	0x000008f8, 0x00000013, 0xffffffff,
	0x000008fc, 0x00000000, 0xffffffff,
	0x000008f8, 0x00000014, 0xffffffff,
	0x000008fc, 0x00000000, 0xffffffff,
	0x000008f8, 0x00000015, 0xffffffff,
	0x000008fc, 0x00000000, 0xffffffff,
	0x000008f8, 0x00000016, 0xffffffff,
	0x000008fc, 0x00000000, 0xffffffff,
	0x000008f8, 0x00000017, 0xffffffff,
	0x000008fc, 0x00000000, 0xffffffff,
	0x000008f8, 0x00000018, 0xffffffff,
	0x000008fc, 0x00000000, 0xffffffff,
	0x000008f8, 0x00000019, 0xffffffff,
	0x000008fc, 0x00000000, 0xffffffff,
	0x000008f8, 0x0000001a, 0xffffffff,
	0x000008fc, 0x00000000, 0xffffffff,
	0x000008f8, 0x0000001b, 0xffffffff,
	0x000008fc, 0x00000000, 0xffffffff,
	0x000008f8, 0x00000020, 0xffffffff,
	0x000008fc, 0xffffffff, 0xffffffff,
	0x000008f8, 0x00000021, 0xffffffff,
	0x000008fc, 0xffffffff, 0xffffffff,
	0x000008f8, 0x00000022, 0xffffffff,
	0x000008fc, 0xffffffff, 0xffffffff,
	0x000008f8, 0x00000023, 0xffffffff,
	0x000008fc, 0xffffffff, 0xffffffff,
	0x000008f8, 0x00000024, 0xffffffff,
	0x000008fc, 0xffffffff, 0xffffffff,
	0x000008f8, 0x00000025, 0xffffffff,
	0x000008fc, 0xffffffff, 0xffffffff,
	0x000008f8, 0x00000026, 0xffffffff,
	0x000008fc, 0xffffffff, 0xffffffff,
	0x000008f8, 0x00000027, 0xffffffff,
	0x000008fc, 0xffffffff, 0xffffffff,
	0x000008f8, 0x00000028, 0xffffffff,
	0x000008fc, 0xffffffff, 0xffffffff,
	0x000008f8, 0x00000029, 0xffffffff,
	0x000008fc, 0xffffffff, 0xffffffff,
	0x000008f8, 0x0000002a, 0xffffffff,
	0x000008fc, 0xffffffff, 0xffffffff,
	0x000008f8, 0x0000002b, 0xffffffff,
	0x000008fc, 0xffffffff, 0xffffffff
};
/*
 * Number of three-word entries in cayman_cgcg_cgls_enable[].  The expansion
 * is fully parenthesized so it behaves as a single operand in any expression.
 */
#define CAYMAN_CGCG_CGLS_ENABLE_LENGTH  (sizeof(cayman_cgcg_cgls_enable) / (3 * sizeof(u32)))
414 
/*
 * Default MGCG programming sequence, handed to
 * btc_program_mgcg_hw_sequence() by ni_mg_clockgating_default().
 *
 * The array is consumed three u32 words at a time (see
 * CAYMAN_MGCG_DEFAULT_LENGTH).  Presumably each triplet is
 * { register, value, mask }, as labelled on the cayman_sysls_* tables.
 *
 * The same run of writes to 0x915c-0x9294 appears twice, once after writing
 * 0x40000000 and once after writing 0x40010000 to 0x802c/0x3fc4; presumably
 * those two writes select which instance the following writes target --
 * TODO confirm.  The table ends by writing 0 through 0x8f8/0x8fc for
 * selectors 0x10-0x1b.
 */
static const u32 cayman_mgcg_default[] =
{
	0x0000802c, 0xc0000000, 0xffffffff,
	0x00003fc4, 0xc0000000, 0xffffffff,
	0x00005448, 0x00000100, 0xffffffff,
	0x000055e4, 0x00000100, 0xffffffff,
	0x0000160c, 0x00000100, 0xffffffff,
	0x00008984, 0x06000100, 0xffffffff,
	0x0000c164, 0x00000100, 0xffffffff,
	0x00008a18, 0x00000100, 0xffffffff,
	0x0000897c, 0x06000100, 0xffffffff,
	0x00008b28, 0x00000100, 0xffffffff,
	0x00009144, 0x00800200, 0xffffffff,
	0x00009a60, 0x00000100, 0xffffffff,
	0x00009868, 0x00000100, 0xffffffff,
	0x00008d58, 0x00000100, 0xffffffff,
	0x00009510, 0x00000100, 0xffffffff,
	0x0000949c, 0x00000100, 0xffffffff,
	0x00009654, 0x00000100, 0xffffffff,
	0x00009030, 0x00000100, 0xffffffff,
	0x00009034, 0x00000100, 0xffffffff,
	0x00009038, 0x00000100, 0xffffffff,
	0x0000903c, 0x00000100, 0xffffffff,
	0x00009040, 0x00000100, 0xffffffff,
	0x0000a200, 0x00000100, 0xffffffff,
	0x0000a204, 0x00000100, 0xffffffff,
	0x0000a208, 0x00000100, 0xffffffff,
	0x0000a20c, 0x00000100, 0xffffffff,
	0x00009744, 0x00000100, 0xffffffff,
	0x00003f80, 0x00000100, 0xffffffff,
	0x0000a210, 0x00000100, 0xffffffff,
	0x0000a214, 0x00000100, 0xffffffff,
	0x000004d8, 0x00000100, 0xffffffff,
	0x00009664, 0x00000100, 0xffffffff,
	0x00009698, 0x00000100, 0xffffffff,
	0x000004d4, 0x00000200, 0xffffffff,
	0x000004d0, 0x00000000, 0xffffffff,
	0x000030cc, 0x00000104, 0xffffffff,
	0x0000d0c0, 0x00000100, 0xffffffff,
	0x0000d8c0, 0x00000100, 0xffffffff,
	0x0000802c, 0x40000000, 0xffffffff,
	0x00003fc4, 0x40000000, 0xffffffff,
	0x0000915c, 0x00010000, 0xffffffff,
	0x00009160, 0x00030002, 0xffffffff,
	0x00009164, 0x00050004, 0xffffffff,
	0x00009168, 0x00070006, 0xffffffff,
	0x00009178, 0x00070000, 0xffffffff,
	0x0000917c, 0x00030002, 0xffffffff,
	0x00009180, 0x00050004, 0xffffffff,
	0x0000918c, 0x00010006, 0xffffffff,
	0x00009190, 0x00090008, 0xffffffff,
	0x00009194, 0x00070000, 0xffffffff,
	0x00009198, 0x00030002, 0xffffffff,
	0x0000919c, 0x00050004, 0xffffffff,
	0x000091a8, 0x00010006, 0xffffffff,
	0x000091ac, 0x00090008, 0xffffffff,
	0x000091b0, 0x00070000, 0xffffffff,
	0x000091b4, 0x00030002, 0xffffffff,
	0x000091b8, 0x00050004, 0xffffffff,
	0x000091c4, 0x00010006, 0xffffffff,
	0x000091c8, 0x00090008, 0xffffffff,
	0x000091cc, 0x00070000, 0xffffffff,
	0x000091d0, 0x00030002, 0xffffffff,
	0x000091d4, 0x00050004, 0xffffffff,
	0x000091e0, 0x00010006, 0xffffffff,
	0x000091e4, 0x00090008, 0xffffffff,
	0x000091e8, 0x00000000, 0xffffffff,
	0x000091ec, 0x00070000, 0xffffffff,
	0x000091f0, 0x00030002, 0xffffffff,
	0x000091f4, 0x00050004, 0xffffffff,
	0x00009200, 0x00010006, 0xffffffff,
	0x00009204, 0x00090008, 0xffffffff,
	0x00009208, 0x00070000, 0xffffffff,
	0x0000920c, 0x00030002, 0xffffffff,
	0x00009210, 0x00050004, 0xffffffff,
	0x0000921c, 0x00010006, 0xffffffff,
	0x00009220, 0x00090008, 0xffffffff,
	0x00009224, 0x00070000, 0xffffffff,
	0x00009228, 0x00030002, 0xffffffff,
	0x0000922c, 0x00050004, 0xffffffff,
	0x00009238, 0x00010006, 0xffffffff,
	0x0000923c, 0x00090008, 0xffffffff,
	0x00009240, 0x00070000, 0xffffffff,
	0x00009244, 0x00030002, 0xffffffff,
	0x00009248, 0x00050004, 0xffffffff,
	0x00009254, 0x00010006, 0xffffffff,
	0x00009258, 0x00090008, 0xffffffff,
	0x0000925c, 0x00070000, 0xffffffff,
	0x00009260, 0x00030002, 0xffffffff,
	0x00009264, 0x00050004, 0xffffffff,
	0x00009270, 0x00010006, 0xffffffff,
	0x00009274, 0x00090008, 0xffffffff,
	0x00009278, 0x00070000, 0xffffffff,
	0x0000927c, 0x00030002, 0xffffffff,
	0x00009280, 0x00050004, 0xffffffff,
	0x0000928c, 0x00010006, 0xffffffff,
	0x00009290, 0x00090008, 0xffffffff,
	0x000092a8, 0x00070000, 0xffffffff,
	0x000092ac, 0x00030002, 0xffffffff,
	0x000092b0, 0x00050004, 0xffffffff,
	0x000092bc, 0x00010006, 0xffffffff,
	0x000092c0, 0x00090008, 0xffffffff,
	0x000092c4, 0x00070000, 0xffffffff,
	0x000092c8, 0x00030002, 0xffffffff,
	0x000092cc, 0x00050004, 0xffffffff,
	0x000092d8, 0x00010006, 0xffffffff,
	0x000092dc, 0x00090008, 0xffffffff,
	0x00009294, 0x00000000, 0xffffffff,
	0x0000802c, 0x40010000, 0xffffffff,
	0x00003fc4, 0x40010000, 0xffffffff,
	0x0000915c, 0x00010000, 0xffffffff,
	0x00009160, 0x00030002, 0xffffffff,
	0x00009164, 0x00050004, 0xffffffff,
	0x00009168, 0x00070006, 0xffffffff,
	0x00009178, 0x00070000, 0xffffffff,
	0x0000917c, 0x00030002, 0xffffffff,
	0x00009180, 0x00050004, 0xffffffff,
	0x0000918c, 0x00010006, 0xffffffff,
	0x00009190, 0x00090008, 0xffffffff,
	0x00009194, 0x00070000, 0xffffffff,
	0x00009198, 0x00030002, 0xffffffff,
	0x0000919c, 0x00050004, 0xffffffff,
	0x000091a8, 0x00010006, 0xffffffff,
	0x000091ac, 0x00090008, 0xffffffff,
	0x000091b0, 0x00070000, 0xffffffff,
	0x000091b4, 0x00030002, 0xffffffff,
	0x000091b8, 0x00050004, 0xffffffff,
	0x000091c4, 0x00010006, 0xffffffff,
	0x000091c8, 0x00090008, 0xffffffff,
	0x000091cc, 0x00070000, 0xffffffff,
	0x000091d0, 0x00030002, 0xffffffff,
	0x000091d4, 0x00050004, 0xffffffff,
	0x000091e0, 0x00010006, 0xffffffff,
	0x000091e4, 0x00090008, 0xffffffff,
	0x000091e8, 0x00000000, 0xffffffff,
	0x000091ec, 0x00070000, 0xffffffff,
	0x000091f0, 0x00030002, 0xffffffff,
	0x000091f4, 0x00050004, 0xffffffff,
	0x00009200, 0x00010006, 0xffffffff,
	0x00009204, 0x00090008, 0xffffffff,
	0x00009208, 0x00070000, 0xffffffff,
	0x0000920c, 0x00030002, 0xffffffff,
	0x00009210, 0x00050004, 0xffffffff,
	0x0000921c, 0x00010006, 0xffffffff,
	0x00009220, 0x00090008, 0xffffffff,
	0x00009224, 0x00070000, 0xffffffff,
	0x00009228, 0x00030002, 0xffffffff,
	0x0000922c, 0x00050004, 0xffffffff,
	0x00009238, 0x00010006, 0xffffffff,
	0x0000923c, 0x00090008, 0xffffffff,
	0x00009240, 0x00070000, 0xffffffff,
	0x00009244, 0x00030002, 0xffffffff,
	0x00009248, 0x00050004, 0xffffffff,
	0x00009254, 0x00010006, 0xffffffff,
	0x00009258, 0x00090008, 0xffffffff,
	0x0000925c, 0x00070000, 0xffffffff,
	0x00009260, 0x00030002, 0xffffffff,
	0x00009264, 0x00050004, 0xffffffff,
	0x00009270, 0x00010006, 0xffffffff,
	0x00009274, 0x00090008, 0xffffffff,
	0x00009278, 0x00070000, 0xffffffff,
	0x0000927c, 0x00030002, 0xffffffff,
	0x00009280, 0x00050004, 0xffffffff,
	0x0000928c, 0x00010006, 0xffffffff,
	0x00009290, 0x00090008, 0xffffffff,
	0x000092a8, 0x00070000, 0xffffffff,
	0x000092ac, 0x00030002, 0xffffffff,
	0x000092b0, 0x00050004, 0xffffffff,
	0x000092bc, 0x00010006, 0xffffffff,
	0x000092c0, 0x00090008, 0xffffffff,
	0x000092c4, 0x00070000, 0xffffffff,
	0x000092c8, 0x00030002, 0xffffffff,
	0x000092cc, 0x00050004, 0xffffffff,
	0x000092d8, 0x00010006, 0xffffffff,
	0x000092dc, 0x00090008, 0xffffffff,
	0x00009294, 0x00000000, 0xffffffff,
	0x0000802c, 0xc0000000, 0xffffffff,
	0x00003fc4, 0xc0000000, 0xffffffff,
	0x000008f8, 0x00000010, 0xffffffff,
	0x000008fc, 0x00000000, 0xffffffff,
	0x000008f8, 0x00000011, 0xffffffff,
	0x000008fc, 0x00000000, 0xffffffff,
	0x000008f8, 0x00000012, 0xffffffff,
	0x000008fc, 0x00000000, 0xffffffff,
	0x000008f8, 0x00000013, 0xffffffff,
	0x000008fc, 0x00000000, 0xffffffff,
	0x000008f8, 0x00000014, 0xffffffff,
	0x000008fc, 0x00000000, 0xffffffff,
	0x000008f8, 0x00000015, 0xffffffff,
	0x000008fc, 0x00000000, 0xffffffff,
	0x000008f8, 0x00000016, 0xffffffff,
	0x000008fc, 0x00000000, 0xffffffff,
	0x000008f8, 0x00000017, 0xffffffff,
	0x000008fc, 0x00000000, 0xffffffff,
	0x000008f8, 0x00000018, 0xffffffff,
	0x000008fc, 0x00000000, 0xffffffff,
	0x000008f8, 0x00000019, 0xffffffff,
	0x000008fc, 0x00000000, 0xffffffff,
	0x000008f8, 0x0000001a, 0xffffffff,
	0x000008fc, 0x00000000, 0xffffffff,
	0x000008f8, 0x0000001b, 0xffffffff,
	0x000008fc, 0x00000000, 0xffffffff
};
/*
 * Number of three-word entries in cayman_mgcg_default[].  The expansion is
 * fully parenthesized so it behaves as a single operand in any expression.
 */
#define CAYMAN_MGCG_DEFAULT_LENGTH (sizeof(cayman_mgcg_default) / (3 * sizeof(u32)))
619 
/*
 * MGCG "disable" programming sequence, handed to
 * btc_program_mgcg_hw_sequence() by ni_mg_clockgating_enable(rdev, false).
 *
 * The array is consumed three u32 words at a time (see
 * CAYMAN_MGCG_DISABLE_LENGTH).  Presumably each triplet is
 * { register, value, mask }, as labelled on the cayman_sysls_* tables.
 * Selectors 0-3 get 0xffffffff written through 0x8f8/0x8fc, then 0x9150 is
 * set to 0x00600000.
 */
static const u32 cayman_mgcg_disable[] =
{
	0x0000802c, 0xc0000000, 0xffffffff,
	0x000008f8, 0x00000000, 0xffffffff,
	0x000008fc, 0xffffffff, 0xffffffff,
	0x000008f8, 0x00000001, 0xffffffff,
	0x000008fc, 0xffffffff, 0xffffffff,
	0x000008f8, 0x00000002, 0xffffffff,
	0x000008fc, 0xffffffff, 0xffffffff,
	0x000008f8, 0x00000003, 0xffffffff,
	0x000008fc, 0xffffffff, 0xffffffff,
	0x00009150, 0x00600000, 0xffffffff
};
/*
 * Number of three-word entries in cayman_mgcg_disable[].  The expansion is
 * fully parenthesized so it behaves as a single operand in any expression.
 */
#define CAYMAN_MGCG_DISABLE_LENGTH   (sizeof(cayman_mgcg_disable) / (3 * sizeof(u32)))
634 
/*
 * MGCG "enable" programming sequence, handed to
 * btc_program_mgcg_hw_sequence() by ni_mg_clockgating_enable(rdev, true).
 *
 * The array is consumed three u32 words at a time (see
 * CAYMAN_MGCG_ENABLE_LENGTH).  Presumably each triplet is
 * { register, value, mask }, as labelled on the cayman_sysls_* tables.
 * Selectors 0, 1 and 3 get 0 written through 0x8f8/0x8fc, selector 2 gets
 * 0x00600000, then 0x9150 is set to 0x96944200.
 */
static const u32 cayman_mgcg_enable[] =
{
	0x0000802c, 0xc0000000, 0xffffffff,
	0x000008f8, 0x00000000, 0xffffffff,
	0x000008fc, 0x00000000, 0xffffffff,
	0x000008f8, 0x00000001, 0xffffffff,
	0x000008fc, 0x00000000, 0xffffffff,
	0x000008f8, 0x00000002, 0xffffffff,
	0x000008fc, 0x00600000, 0xffffffff,
	0x000008f8, 0x00000003, 0xffffffff,
	0x000008fc, 0x00000000, 0xffffffff,
	0x00009150, 0x96944200, 0xffffffff
};
648 
/*
 * Number of three-word entries in cayman_mgcg_enable[].  The expansion is
 * fully parenthesized so it behaves as a single operand in any expression.
 */
#define CAYMAN_MGCG_ENABLE_LENGTH   (sizeof(cayman_mgcg_enable) / (3 * sizeof(u32)))
650 
/* Value 100; not referenced in the visible part of this file -- purpose to be confirmed. */
#define NISLANDS_SYSLS_SEQUENCE  100
652 
/*
 * Default SYSLS programming sequence, handed to
 * btc_program_mgcg_hw_sequence() by ni_ls_clockgating_default().
 * One { register, value, mask } triplet per row; the row count is
 * CAYMAN_SYSLS_DEFAULT_LENGTH.
 */
static const u32 cayman_sysls_default[] =
{
	/* Register,   Value,     Mask bits */
	0x000055e8, 0x00000000, 0xffffffff,
	0x0000d0bc, 0x00000000, 0xffffffff,
	0x0000d8bc, 0x00000000, 0xffffffff,
	0x000015c0, 0x000c1401, 0xffffffff,
	0x0000264c, 0x000c0400, 0xffffffff,
	0x00002648, 0x000c0400, 0xffffffff,
	0x00002650, 0x000c0400, 0xffffffff,
	0x000020b8, 0x000c0400, 0xffffffff,
	0x000020bc, 0x000c0400, 0xffffffff,
	0x000020c0, 0x000c0c80, 0xffffffff,
	0x0000f4a0, 0x000000c0, 0xffffffff,
	0x0000f4a4, 0x00680fff, 0xffffffff,
	0x00002f50, 0x00000404, 0xffffffff,
	0x000004c8, 0x00000001, 0xffffffff,
	0x000064ec, 0x00000000, 0xffffffff,
	0x00000c7c, 0x00000000, 0xffffffff,
	0x00008dfc, 0x00000000, 0xffffffff
};
/*
 * Number of { register, value, mask } triplets in cayman_sysls_default[].
 * The expansion is fully parenthesized so it behaves as a single operand in
 * any expression.
 */
#define CAYMAN_SYSLS_DEFAULT_LENGTH (sizeof(cayman_sysls_default) / (3 * sizeof(u32)))
675 
/*
 * SYSLS "disable" programming sequence, handed to
 * btc_program_mgcg_hw_sequence() by ni_ls_clockgating_enable(rdev, false).
 * One { register, value, mask } triplet per row; the row count is
 * CAYMAN_SYSLS_DISABLE_LENGTH.  Unlike the default/enable tables it also
 * writes 0xd0c0 and 0xd8c0 first.
 */
static const u32 cayman_sysls_disable[] =
{
	/* Register,   Value,     Mask bits */
	0x0000d0c0, 0x00000000, 0xffffffff,
	0x0000d8c0, 0x00000000, 0xffffffff,
	0x000055e8, 0x00000000, 0xffffffff,
	0x0000d0bc, 0x00000000, 0xffffffff,
	0x0000d8bc, 0x00000000, 0xffffffff,
	0x000015c0, 0x00041401, 0xffffffff,
	0x0000264c, 0x00040400, 0xffffffff,
	0x00002648, 0x00040400, 0xffffffff,
	0x00002650, 0x00040400, 0xffffffff,
	0x000020b8, 0x00040400, 0xffffffff,
	0x000020bc, 0x00040400, 0xffffffff,
	0x000020c0, 0x00040c80, 0xffffffff,
	0x0000f4a0, 0x000000c0, 0xffffffff,
	0x0000f4a4, 0x00680000, 0xffffffff,
	0x00002f50, 0x00000404, 0xffffffff,
	0x000004c8, 0x00000001, 0xffffffff,
	0x000064ec, 0x00007ffd, 0xffffffff,
	0x00000c7c, 0x0000ff00, 0xffffffff,
	0x00008dfc, 0x0000007f, 0xffffffff
};
/*
 * Number of { register, value, mask } triplets in cayman_sysls_disable[].
 * The expansion is fully parenthesized so it behaves as a single operand in
 * any expression.
 */
#define CAYMAN_SYSLS_DISABLE_LENGTH (sizeof(cayman_sysls_disable) / (3 * sizeof(u32)))
700 
/*
 * SYSLS "enable" programming sequence, handed to
 * btc_program_mgcg_hw_sequence() by ni_ls_clockgating_enable(rdev, true).
 * One { register, value, mask } triplet per row; the row count is
 * CAYMAN_SYSLS_ENABLE_LENGTH.
 */
static const u32 cayman_sysls_enable[] =
{
	/* Register,   Value,     Mask bits */
	0x000055e8, 0x00000001, 0xffffffff,
	0x0000d0bc, 0x00000100, 0xffffffff,
	0x0000d8bc, 0x00000100, 0xffffffff,
	0x000015c0, 0x000c1401, 0xffffffff,
	0x0000264c, 0x000c0400, 0xffffffff,
	0x00002648, 0x000c0400, 0xffffffff,
	0x00002650, 0x000c0400, 0xffffffff,
	0x000020b8, 0x000c0400, 0xffffffff,
	0x000020bc, 0x000c0400, 0xffffffff,
	0x000020c0, 0x000c0c80, 0xffffffff,
	0x0000f4a0, 0x000000c0, 0xffffffff,
	0x0000f4a4, 0x00680fff, 0xffffffff,
	0x00002f50, 0x00000903, 0xffffffff,
	0x000004c8, 0x00000000, 0xffffffff,
	0x000064ec, 0x00000000, 0xffffffff,
	0x00000c7c, 0x00000000, 0xffffffff,
	0x00008dfc, 0x00000000, 0xffffffff
};
/*
 * Number of { register, value, mask } triplets in cayman_sysls_enable[].
 * The expansion is fully parenthesized so it behaves as a single operand in
 * any expression.
 */
#define CAYMAN_SYSLS_ENABLE_LENGTH (sizeof(cayman_sysls_enable) / (3 * sizeof(u32)))
723 
/* Defined in another translation unit; not called in the visible part of this file. */
extern int ni_mc_load_microcode(struct radeon_device *rdev);
725 
ni_get_pi(struct radeon_device * rdev)726 struct ni_power_info *ni_get_pi(struct radeon_device *rdev)
727 {
728 	struct ni_power_info *pi = rdev->pm.dpm.priv;
729 
730 	return pi;
731 }
732 
ni_get_ps(struct radeon_ps * rps)733 struct ni_ps *ni_get_ps(struct radeon_ps *rps)
734 {
735 	struct ni_ps *ps = rps->ps_priv;
736 
737 	return ps;
738 }
739 
/**
 * ni_calculate_leakage_for_v_and_t_formula - evaluate the leakage formula
 * @coeff: coefficients at, bt, av and bv
 * @v: voltage input
 * @t: temperature input
 * @ileakage: leakage current input
 * @leakage: receives the result
 *
 * Every input and coefficient is converted to DRM fixed point and divided by
 * 1000.  The result is
 *
 *   ileakage * (at * exp(bt * t)) * (av * exp(bv * v)) * v
 *
 * multiplied by 1000 and converted back to an integer.
 */
static void ni_calculate_leakage_for_v_and_t_formula(const struct ni_leakage_coeffients *coeff,
						     u16 v, s32 t,
						     u32 ileakage,
						     u32 *leakage)
{
	const s64 i_leak = div64_s64(drm_int2fixp(ileakage), 1000);
	const s64 volts = div64_s64(drm_int2fixp(v), 1000);
	const s64 temp = div64_s64(drm_int2fixp(t), 1000);

	/* temperature factor: at * exp(bt * t) */
	const s64 at = div64_s64(drm_int2fixp(coeff->at), 1000);
	const s64 bt = div64_s64(drm_int2fixp(coeff->bt), 1000);
	const s64 k_temp = drm_fixp_mul(at, drm_fixp_exp(drm_fixp_mul(bt, temp)));

	/* voltage factor: av * exp(bv * v) */
	const s64 av = div64_s64(drm_int2fixp(coeff->av), 1000);
	const s64 bv = div64_s64(drm_int2fixp(coeff->bv), 1000);
	const s64 k_volt = drm_fixp_mul(av, drm_fixp_exp(drm_fixp_mul(bv, volts)));

	s64 watts = drm_fixp_mul(i_leak, k_temp);

	watts = drm_fixp_mul(watts, k_volt);
	watts = drm_fixp_mul(watts, volts);

	*leakage = drm_fixp2int(watts * 1000);
}
760 
/**
 * ni_calculate_leakage_for_v_and_t - compute leakage for a voltage/temperature
 * @rdev: radeon device (accepted but not used here)
 * @coeff: leakage coefficients
 * @v: voltage input
 * @t: temperature input
 * @i_leakage: leakage current input
 * @leakage: receives the result
 *
 * Forwards everything except @rdev to
 * ni_calculate_leakage_for_v_and_t_formula().
 */
static void ni_calculate_leakage_for_v_and_t(struct radeon_device *rdev,
					     const struct ni_leakage_coeffients *coeff,
					     u16 v, s32 t,
					     u32 i_leakage, u32 *leakage)
{
	ni_calculate_leakage_for_v_and_t_formula(coeff,
						 v, t,
						 i_leakage,
						 leakage);
}
770 
ni_dpm_vblank_too_short(struct radeon_device * rdev)771 bool ni_dpm_vblank_too_short(struct radeon_device *rdev)
772 {
773 	struct rv7xx_power_info *pi = rv770_get_pi(rdev);
774 	u32 vblank_time = r600_dpm_get_vblank_time(rdev);
775 	/* we never hit the non-gddr5 limit so disable it */
776 	u32 switch_limit = pi->mem_gddr5 ? 450 : 0;
777 
778 	if (vblank_time < switch_limit)
779 		return true;
780 	else
781 		return false;
782 
783 }
784 
ni_apply_state_adjust_rules(struct radeon_device * rdev,struct radeon_ps * rps)785 static void ni_apply_state_adjust_rules(struct radeon_device *rdev,
786 					struct radeon_ps *rps)
787 {
788 	struct ni_ps *ps = ni_get_ps(rps);
789 	struct radeon_clock_and_voltage_limits *max_limits;
790 	bool disable_mclk_switching;
791 	u32 mclk;
792 	u16 vddci;
793 	int i;
794 
795 	if ((rdev->pm.dpm.new_active_crtc_count > 1) ||
796 	    ni_dpm_vblank_too_short(rdev))
797 		disable_mclk_switching = true;
798 	else
799 		disable_mclk_switching = false;
800 
801 	if (rdev->pm.dpm.ac_power)
802 		max_limits = &rdev->pm.dpm.dyn_state.max_clock_voltage_on_ac;
803 	else
804 		max_limits = &rdev->pm.dpm.dyn_state.max_clock_voltage_on_dc;
805 
806 	if (rdev->pm.dpm.ac_power == false) {
807 		for (i = 0; i < ps->performance_level_count; i++) {
808 			if (ps->performance_levels[i].mclk > max_limits->mclk)
809 				ps->performance_levels[i].mclk = max_limits->mclk;
810 			if (ps->performance_levels[i].sclk > max_limits->sclk)
811 				ps->performance_levels[i].sclk = max_limits->sclk;
812 			if (ps->performance_levels[i].vddc > max_limits->vddc)
813 				ps->performance_levels[i].vddc = max_limits->vddc;
814 			if (ps->performance_levels[i].vddci > max_limits->vddci)
815 				ps->performance_levels[i].vddci = max_limits->vddci;
816 		}
817 	}
818 
819 	/* XXX validate the min clocks required for display */
820 
821 	/* adjust low state */
822 	if (disable_mclk_switching) {
823 		ps->performance_levels[0].mclk =
824 			ps->performance_levels[ps->performance_level_count - 1].mclk;
825 		ps->performance_levels[0].vddci =
826 			ps->performance_levels[ps->performance_level_count - 1].vddci;
827 	}
828 
829 	btc_skip_blacklist_clocks(rdev, max_limits->sclk, max_limits->mclk,
830 				  &ps->performance_levels[0].sclk,
831 				  &ps->performance_levels[0].mclk);
832 
833 	for (i = 1; i < ps->performance_level_count; i++) {
834 		if (ps->performance_levels[i].sclk < ps->performance_levels[i - 1].sclk)
835 			ps->performance_levels[i].sclk = ps->performance_levels[i - 1].sclk;
836 		if (ps->performance_levels[i].vddc < ps->performance_levels[i - 1].vddc)
837 			ps->performance_levels[i].vddc = ps->performance_levels[i - 1].vddc;
838 	}
839 
840 	/* adjust remaining states */
841 	if (disable_mclk_switching) {
842 		mclk = ps->performance_levels[0].mclk;
843 		vddci = ps->performance_levels[0].vddci;
844 		for (i = 1; i < ps->performance_level_count; i++) {
845 			if (mclk < ps->performance_levels[i].mclk)
846 				mclk = ps->performance_levels[i].mclk;
847 			if (vddci < ps->performance_levels[i].vddci)
848 				vddci = ps->performance_levels[i].vddci;
849 		}
850 		for (i = 0; i < ps->performance_level_count; i++) {
851 			ps->performance_levels[i].mclk = mclk;
852 			ps->performance_levels[i].vddci = vddci;
853 		}
854 	} else {
855 		for (i = 1; i < ps->performance_level_count; i++) {
856 			if (ps->performance_levels[i].mclk < ps->performance_levels[i - 1].mclk)
857 				ps->performance_levels[i].mclk = ps->performance_levels[i - 1].mclk;
858 			if (ps->performance_levels[i].vddci < ps->performance_levels[i - 1].vddci)
859 				ps->performance_levels[i].vddci = ps->performance_levels[i - 1].vddci;
860 		}
861 	}
862 
863 	for (i = 1; i < ps->performance_level_count; i++)
864 		btc_skip_blacklist_clocks(rdev, max_limits->sclk, max_limits->mclk,
865 					  &ps->performance_levels[i].sclk,
866 					  &ps->performance_levels[i].mclk);
867 
868 	for (i = 0; i < ps->performance_level_count; i++)
869 		btc_adjust_clock_combinations(rdev, max_limits,
870 					      &ps->performance_levels[i]);
871 
872 	for (i = 0; i < ps->performance_level_count; i++) {
873 		btc_apply_voltage_dependency_rules(&rdev->pm.dpm.dyn_state.vddc_dependency_on_sclk,
874 						   ps->performance_levels[i].sclk,
875 						   max_limits->vddc,  &ps->performance_levels[i].vddc);
876 		btc_apply_voltage_dependency_rules(&rdev->pm.dpm.dyn_state.vddci_dependency_on_mclk,
877 						   ps->performance_levels[i].mclk,
878 						   max_limits->vddci, &ps->performance_levels[i].vddci);
879 		btc_apply_voltage_dependency_rules(&rdev->pm.dpm.dyn_state.vddc_dependency_on_mclk,
880 						   ps->performance_levels[i].mclk,
881 						   max_limits->vddc,  &ps->performance_levels[i].vddc);
882 		btc_apply_voltage_dependency_rules(&rdev->pm.dpm.dyn_state.vddc_dependency_on_dispclk,
883 						   rdev->clock.current_dispclk,
884 						   max_limits->vddc,  &ps->performance_levels[i].vddc);
885 	}
886 
887 	for (i = 0; i < ps->performance_level_count; i++) {
888 		btc_apply_voltage_delta_rules(rdev,
889 					      max_limits->vddc, max_limits->vddci,
890 					      &ps->performance_levels[i].vddc,
891 					      &ps->performance_levels[i].vddci);
892 	}
893 
894 	ps->dc_compatible = true;
895 	for (i = 0; i < ps->performance_level_count; i++) {
896 		if (ps->performance_levels[i].vddc > rdev->pm.dpm.dyn_state.max_clock_voltage_on_dc.vddc)
897 			ps->dc_compatible = false;
898 
899 		if (ps->performance_levels[i].vddc < rdev->pm.dpm.dyn_state.min_vddc_for_pcie_gen2)
900 			ps->performance_levels[i].flags &= ~ATOM_PPLIB_R600_FLAGS_PCIEGEN2;
901 	}
902 }
903 
ni_cg_clockgating_default(struct radeon_device * rdev)904 static void ni_cg_clockgating_default(struct radeon_device *rdev)
905 {
906 	u32 count;
907 	const u32 *ps = NULL;
908 
909 	ps = (const u32 *)&cayman_cgcg_cgls_default;
910 	count = CAYMAN_CGCG_CGLS_DEFAULT_LENGTH;
911 
912 	btc_program_mgcg_hw_sequence(rdev, ps, count);
913 }
914 
/**
 * ni_gfx_clockgating_enable - program the CGCG/CGLS enable or disable sequence
 * @rdev: radeon device
 * @enable: true selects cayman_cgcg_cgls_enable[], false selects
 *          cayman_cgcg_cgls_disable[]
 *
 * The selected table and its entry count are passed to
 * btc_program_mgcg_hw_sequence().
 */
static void ni_gfx_clockgating_enable(struct radeon_device *rdev,
				      bool enable)
{
	const u32 *seq;
	u32 nentries;

	if (!enable) {
		seq = (const u32 *)&cayman_cgcg_cgls_disable;
		nentries = (CAYMAN_CGCG_CGLS_DISABLE_LENGTH);
	} else {
		seq = (const u32 *)&cayman_cgcg_cgls_enable;
		nentries = (CAYMAN_CGCG_CGLS_ENABLE_LENGTH);
	}

	btc_program_mgcg_hw_sequence(rdev, seq, nentries);
}
931 
ni_mg_clockgating_default(struct radeon_device * rdev)932 static void ni_mg_clockgating_default(struct radeon_device *rdev)
933 {
934 	u32 count;
935 	const u32 *ps = NULL;
936 
937 	ps = (const u32 *)&cayman_mgcg_default;
938 	count = CAYMAN_MGCG_DEFAULT_LENGTH;
939 
940 	btc_program_mgcg_hw_sequence(rdev, ps, count);
941 }
942 
/**
 * ni_mg_clockgating_enable - program the MGCG enable or disable sequence
 * @rdev: radeon device
 * @enable: true selects cayman_mgcg_enable[], false selects
 *          cayman_mgcg_disable[]
 *
 * The selected table and its entry count are passed to
 * btc_program_mgcg_hw_sequence().
 */
static void ni_mg_clockgating_enable(struct radeon_device *rdev,
				     bool enable)
{
	const u32 *seq;
	u32 nentries;

	if (!enable) {
		seq = (const u32 *)&cayman_mgcg_disable;
		nentries = (CAYMAN_MGCG_DISABLE_LENGTH);
	} else {
		seq = (const u32 *)&cayman_mgcg_enable;
		nentries = (CAYMAN_MGCG_ENABLE_LENGTH);
	}

	btc_program_mgcg_hw_sequence(rdev, seq, nentries);
}
959 
ni_ls_clockgating_default(struct radeon_device * rdev)960 static void ni_ls_clockgating_default(struct radeon_device *rdev)
961 {
962 	u32 count;
963 	const u32 *ps = NULL;
964 
965 	ps = (const u32 *)&cayman_sysls_default;
966 	count = CAYMAN_SYSLS_DEFAULT_LENGTH;
967 
968 	btc_program_mgcg_hw_sequence(rdev, ps, count);
969 }
970 
/*
 * Program the SYSLS "enable" sequence when @enable is true, otherwise the
 * SYSLS "disable" sequence.
 */
static void ni_ls_clockgating_enable(struct radeon_device *rdev,
				     bool enable)
{
	const u32 *seq = (const u32 *)&cayman_sysls_disable;
	u32 len = CAYMAN_SYSLS_DISABLE_LENGTH;

	if (enable) {
		seq = (const u32 *)&cayman_sysls_enable;
		len = CAYMAN_SYSLS_ENABLE_LENGTH;
	}

	btc_program_mgcg_hw_sequence(rdev, seq, len);
}
988 
ni_patch_single_dependency_table_based_on_leakage(struct radeon_device * rdev,struct radeon_clock_voltage_dependency_table * table)989 static int ni_patch_single_dependency_table_based_on_leakage(struct radeon_device *rdev,
990 							     struct radeon_clock_voltage_dependency_table *table)
991 {
992 	struct rv7xx_power_info *pi = rv770_get_pi(rdev);
993 	u32 i;
994 
995 	if (table) {
996 		for (i = 0; i < table->count; i++) {
997 			if (0xff01 == table->entries[i].v) {
998 				if (pi->max_vddc == 0)
999 					return -EINVAL;
1000 				table->entries[i].v = pi->max_vddc;
1001 			}
1002 		}
1003 	}
1004 	return 0;
1005 }
1006 
ni_patch_dependency_tables_based_on_leakage(struct radeon_device * rdev)1007 static int ni_patch_dependency_tables_based_on_leakage(struct radeon_device *rdev)
1008 {
1009 	int ret = 0;
1010 
1011 	ret = ni_patch_single_dependency_table_based_on_leakage(rdev,
1012 								&rdev->pm.dpm.dyn_state.vddc_dependency_on_sclk);
1013 
1014 	ret = ni_patch_single_dependency_table_based_on_leakage(rdev,
1015 								&rdev->pm.dpm.dyn_state.vddc_dependency_on_mclk);
1016 	return ret;
1017 }
1018 
ni_stop_dpm(struct radeon_device * rdev)1019 static void ni_stop_dpm(struct radeon_device *rdev)
1020 {
1021 	WREG32_P(GENERAL_PWRMGT, 0, ~GLOBAL_PWRMGT_EN);
1022 }
1023 
#if 0
/*
 * Currently compiled out.
 *
 * When @ac_power is true, send PPSMC_MSG_RunningOnAC to the SMC and return
 * -EINVAL if the SMC does not answer PPSMC_Result_OK.  Nothing is sent
 * when @ac_power is false.
 */
static int ni_notify_hw_of_power_source(struct radeon_device *rdev,
					bool ac_power)
{
	if (!ac_power)
		return 0;

	if (rv770_send_msg_to_smc(rdev, PPSMC_MSG_RunningOnAC) != PPSMC_Result_OK)
		return -EINVAL;

	return 0;
}
#endif
1035 
ni_send_msg_to_smc_with_parameter(struct radeon_device * rdev,PPSMC_Msg msg,u32 parameter)1036 static PPSMC_Result ni_send_msg_to_smc_with_parameter(struct radeon_device *rdev,
1037 						      PPSMC_Msg msg, u32 parameter)
1038 {
1039 	WREG32(SMC_SCRATCH0, parameter);
1040 	return rv770_send_msg_to_smc(rdev, msg);
1041 }
1042 
ni_restrict_performance_levels_before_switch(struct radeon_device * rdev)1043 static int ni_restrict_performance_levels_before_switch(struct radeon_device *rdev)
1044 {
1045 	if (rv770_send_msg_to_smc(rdev, PPSMC_MSG_NoForcedLevel) != PPSMC_Result_OK)
1046 		return -EINVAL;
1047 
1048 	return (ni_send_msg_to_smc_with_parameter(rdev, PPSMC_MSG_SetEnabledLevels, 1) == PPSMC_Result_OK) ?
1049 		0 : -EINVAL;
1050 }
1051 
ni_dpm_force_performance_level(struct radeon_device * rdev,enum radeon_dpm_forced_level level)1052 int ni_dpm_force_performance_level(struct radeon_device *rdev,
1053 				   enum radeon_dpm_forced_level level)
1054 {
1055 	if (level == RADEON_DPM_FORCED_LEVEL_HIGH) {
1056 		if (ni_send_msg_to_smc_with_parameter(rdev, PPSMC_MSG_SetEnabledLevels, 0) != PPSMC_Result_OK)
1057 			return -EINVAL;
1058 
1059 		if (ni_send_msg_to_smc_with_parameter(rdev, PPSMC_MSG_SetForcedLevels, 1) != PPSMC_Result_OK)
1060 			return -EINVAL;
1061 	} else if (level == RADEON_DPM_FORCED_LEVEL_LOW) {
1062 		if (ni_send_msg_to_smc_with_parameter(rdev, PPSMC_MSG_SetForcedLevels, 0) != PPSMC_Result_OK)
1063 			return -EINVAL;
1064 
1065 		if (ni_send_msg_to_smc_with_parameter(rdev, PPSMC_MSG_SetEnabledLevels, 1) != PPSMC_Result_OK)
1066 			return -EINVAL;
1067 	} else if (level == RADEON_DPM_FORCED_LEVEL_AUTO) {
1068 		if (ni_send_msg_to_smc_with_parameter(rdev, PPSMC_MSG_SetForcedLevels, 0) != PPSMC_Result_OK)
1069 			return -EINVAL;
1070 
1071 		if (ni_send_msg_to_smc_with_parameter(rdev, PPSMC_MSG_SetEnabledLevels, 0) != PPSMC_Result_OK)
1072 			return -EINVAL;
1073 	}
1074 
1075 	rdev->pm.dpm.forced_level = level;
1076 
1077 	return 0;
1078 }
1079 
ni_stop_smc(struct radeon_device * rdev)1080 static void ni_stop_smc(struct radeon_device *rdev)
1081 {
1082 	u32 tmp;
1083 	int i;
1084 
1085 	for (i = 0; i < rdev->usec_timeout; i++) {
1086 		tmp = RREG32(LB_SYNC_RESET_SEL) & LB_SYNC_RESET_SEL_MASK;
1087 		if (tmp != 1)
1088 			break;
1089 		udelay(1);
1090 	}
1091 
1092 	udelay(100);
1093 
1094 	r7xx_stop_smc(rdev);
1095 }
1096 
ni_process_firmware_header(struct radeon_device * rdev)1097 static int ni_process_firmware_header(struct radeon_device *rdev)
1098 {
1099 	struct rv7xx_power_info *pi = rv770_get_pi(rdev);
1100 	struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
1101 	struct ni_power_info *ni_pi = ni_get_pi(rdev);
1102 	u32 tmp;
1103 	int ret;
1104 
1105 	ret = rv770_read_smc_sram_dword(rdev,
1106 					NISLANDS_SMC_FIRMWARE_HEADER_LOCATION +
1107 					NISLANDS_SMC_FIRMWARE_HEADER_stateTable,
1108 					&tmp, pi->sram_end);
1109 
1110 	if (ret)
1111 		return ret;
1112 
1113 	pi->state_table_start = (u16)tmp;
1114 
1115 	ret = rv770_read_smc_sram_dword(rdev,
1116 					NISLANDS_SMC_FIRMWARE_HEADER_LOCATION +
1117 					NISLANDS_SMC_FIRMWARE_HEADER_softRegisters,
1118 					&tmp, pi->sram_end);
1119 
1120 	if (ret)
1121 		return ret;
1122 
1123 	pi->soft_regs_start = (u16)tmp;
1124 
1125 	ret = rv770_read_smc_sram_dword(rdev,
1126 					NISLANDS_SMC_FIRMWARE_HEADER_LOCATION +
1127 					NISLANDS_SMC_FIRMWARE_HEADER_mcRegisterTable,
1128 					&tmp, pi->sram_end);
1129 
1130 	if (ret)
1131 		return ret;
1132 
1133 	eg_pi->mc_reg_table_start = (u16)tmp;
1134 
1135 	ret = rv770_read_smc_sram_dword(rdev,
1136 					NISLANDS_SMC_FIRMWARE_HEADER_LOCATION +
1137 					NISLANDS_SMC_FIRMWARE_HEADER_fanTable,
1138 					&tmp, pi->sram_end);
1139 
1140 	if (ret)
1141 		return ret;
1142 
1143 	ni_pi->fan_table_start = (u16)tmp;
1144 
1145 	ret = rv770_read_smc_sram_dword(rdev,
1146 					NISLANDS_SMC_FIRMWARE_HEADER_LOCATION +
1147 					NISLANDS_SMC_FIRMWARE_HEADER_mcArbDramAutoRefreshTable,
1148 					&tmp, pi->sram_end);
1149 
1150 	if (ret)
1151 		return ret;
1152 
1153 	ni_pi->arb_table_start = (u16)tmp;
1154 
1155 	ret = rv770_read_smc_sram_dword(rdev,
1156 					NISLANDS_SMC_FIRMWARE_HEADER_LOCATION +
1157 					NISLANDS_SMC_FIRMWARE_HEADER_cacTable,
1158 					&tmp, pi->sram_end);
1159 
1160 	if (ret)
1161 		return ret;
1162 
1163 	ni_pi->cac_table_start = (u16)tmp;
1164 
1165 	ret = rv770_read_smc_sram_dword(rdev,
1166 					NISLANDS_SMC_FIRMWARE_HEADER_LOCATION +
1167 					NISLANDS_SMC_FIRMWARE_HEADER_spllTable,
1168 					&tmp, pi->sram_end);
1169 
1170 	if (ret)
1171 		return ret;
1172 
1173 	ni_pi->spll_table_start = (u16)tmp;
1174 
1175 
1176 	return ret;
1177 }
1178 
ni_read_clock_registers(struct radeon_device * rdev)1179 static void ni_read_clock_registers(struct radeon_device *rdev)
1180 {
1181 	struct ni_power_info *ni_pi = ni_get_pi(rdev);
1182 
1183 	ni_pi->clock_registers.cg_spll_func_cntl = RREG32(CG_SPLL_FUNC_CNTL);
1184 	ni_pi->clock_registers.cg_spll_func_cntl_2 = RREG32(CG_SPLL_FUNC_CNTL_2);
1185 	ni_pi->clock_registers.cg_spll_func_cntl_3 = RREG32(CG_SPLL_FUNC_CNTL_3);
1186 	ni_pi->clock_registers.cg_spll_func_cntl_4 = RREG32(CG_SPLL_FUNC_CNTL_4);
1187 	ni_pi->clock_registers.cg_spll_spread_spectrum = RREG32(CG_SPLL_SPREAD_SPECTRUM);
1188 	ni_pi->clock_registers.cg_spll_spread_spectrum_2 = RREG32(CG_SPLL_SPREAD_SPECTRUM_2);
1189 	ni_pi->clock_registers.mpll_ad_func_cntl = RREG32(MPLL_AD_FUNC_CNTL);
1190 	ni_pi->clock_registers.mpll_ad_func_cntl_2 = RREG32(MPLL_AD_FUNC_CNTL_2);
1191 	ni_pi->clock_registers.mpll_dq_func_cntl = RREG32(MPLL_DQ_FUNC_CNTL);
1192 	ni_pi->clock_registers.mpll_dq_func_cntl_2 = RREG32(MPLL_DQ_FUNC_CNTL_2);
1193 	ni_pi->clock_registers.mclk_pwrmgt_cntl = RREG32(MCLK_PWRMGT_CNTL);
1194 	ni_pi->clock_registers.dll_cntl = RREG32(DLL_CNTL);
1195 	ni_pi->clock_registers.mpll_ss1 = RREG32(MPLL_SS1);
1196 	ni_pi->clock_registers.mpll_ss2 = RREG32(MPLL_SS2);
1197 }
1198 
#if 0
/*
 * Currently compiled out.
 *
 * If gfx clock gating is in use, first clears DYN_GFX_CLK_OFF_EN, pulses
 * GFX_CLK_FORCE_ON (set, then clear) in SCLK_PWRMGT_CNTL and reads
 * GB_ADDR_CONFIG.  Then posts PPSMC_MSG_SwitchToMinimumPower in SMC_MSG and
 * waits 25000us.  Always returns 0.
 */
static int ni_enter_ulp_state(struct radeon_device *rdev)
{
	struct rv7xx_power_info *pi = rv770_get_pi(rdev);

	if (pi->gfx_clock_gating) {
		WREG32_P(SCLK_PWRMGT_CNTL, 0, ~DYN_GFX_CLK_OFF_EN);
		/* Pulse the force-on bit: set it, then clear it again. */
		WREG32_P(SCLK_PWRMGT_CNTL, GFX_CLK_FORCE_ON, ~GFX_CLK_FORCE_ON);
		WREG32_P(SCLK_PWRMGT_CNTL, 0, ~GFX_CLK_FORCE_ON);
		/* Read-back whose value is discarded. */
		RREG32(GB_ADDR_CONFIG);
	}

	WREG32_P(SMC_MSG, HOST_SMC_MSG(PPSMC_MSG_SwitchToMinimumPower),
		 ~HOST_SMC_MSG_MASK);

	udelay(25000);

	return 0;
}
#endif
1219 
ni_program_response_times(struct radeon_device * rdev)1220 static void ni_program_response_times(struct radeon_device *rdev)
1221 {
1222 	u32 voltage_response_time, backbias_response_time, acpi_delay_time, vbi_time_out;
1223 	u32 vddc_dly, bb_dly, acpi_dly, vbi_dly, mclk_switch_limit;
1224 	u32 reference_clock;
1225 
1226 	rv770_write_smc_soft_register(rdev, NI_SMC_SOFT_REGISTER_mvdd_chg_time, 1);
1227 
1228 	voltage_response_time = (u32)rdev->pm.dpm.voltage_response_time;
1229 	backbias_response_time = (u32)rdev->pm.dpm.backbias_response_time;
1230 
1231 	if (voltage_response_time == 0)
1232 		voltage_response_time = 1000;
1233 
1234 	if (backbias_response_time == 0)
1235 		backbias_response_time = 1000;
1236 
1237 	acpi_delay_time = 15000;
1238 	vbi_time_out = 100000;
1239 
1240 	reference_clock = radeon_get_xclk(rdev);
1241 
1242 	vddc_dly = (voltage_response_time  * reference_clock) / 1600;
1243 	bb_dly   = (backbias_response_time * reference_clock) / 1600;
1244 	acpi_dly = (acpi_delay_time * reference_clock) / 1600;
1245 	vbi_dly  = (vbi_time_out * reference_clock) / 1600;
1246 
1247 	mclk_switch_limit = (460 * reference_clock) / 100;
1248 
1249 	rv770_write_smc_soft_register(rdev, NI_SMC_SOFT_REGISTER_delay_vreg,  vddc_dly);
1250 	rv770_write_smc_soft_register(rdev, NI_SMC_SOFT_REGISTER_delay_bbias, bb_dly);
1251 	rv770_write_smc_soft_register(rdev, NI_SMC_SOFT_REGISTER_delay_acpi,  acpi_dly);
1252 	rv770_write_smc_soft_register(rdev, NI_SMC_SOFT_REGISTER_mclk_chg_timeout, vbi_dly);
1253 	rv770_write_smc_soft_register(rdev, NI_SMC_SOFT_REGISTER_mc_block_delay, 0xAA);
1254 	rv770_write_smc_soft_register(rdev, NI_SMC_SOFT_REGISTER_mclk_switch_lim, mclk_switch_limit);
1255 }
1256 
/*
 * Merge the SMIO patterns of @voltage_table into the SMC state table.
 *
 * For each entry, the big-endian smio_low value is OR-ed into
 * table->lowSMIO[] (existing bits are kept) and table->highSMIO[] is
 * cleared.
 */
static void ni_populate_smc_voltage_table(struct radeon_device *rdev,
					  struct atom_voltage_table *voltage_table,
					  NISLANDS_SMC_STATETABLE *table)
{
	unsigned int n;

	for (n = 0; n < voltage_table->count; n++) {
		table->lowSMIO[n] |= cpu_to_be32(voltage_table->entries[n].smio_low);
		table->highSMIO[n] = 0;
	}
}
1268 
/*
 * Fill the SMIO and voltage-mask parts of the SMC state table from the
 * VDDC and VDDCI voltage tables (each only when it has entries).
 *
 * For VDDC, additionally record in table->maxVDDCIndexInPPTable the index
 * of the first entry whose value is at least pi->max_vddc_in_table; the
 * field is left untouched when no entry qualifies.
 */
static void ni_populate_smc_voltage_tables(struct radeon_device *rdev,
					   NISLANDS_SMC_STATETABLE *table)
{
	struct rv7xx_power_info *pi = rv770_get_pi(rdev);
	struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
	unsigned char idx;

	if (eg_pi->vddc_voltage_table.count) {
		ni_populate_smc_voltage_table(rdev, &eg_pi->vddc_voltage_table, table);

		table->voltageMaskTable.lowMask[NISLANDS_SMC_VOLTAGEMASK_VDDC] =
			cpu_to_be32(eg_pi->vddc_voltage_table.mask_low);
		table->voltageMaskTable.highMask[NISLANDS_SMC_VOLTAGEMASK_VDDC] = 0;

		idx = 0;
		while (idx < eg_pi->vddc_voltage_table.count) {
			if (eg_pi->vddc_voltage_table.entries[idx].value >= pi->max_vddc_in_table) {
				table->maxVDDCIndexInPPTable = idx;
				break;
			}
			idx++;
		}
	}

	if (eg_pi->vddci_voltage_table.count) {
		ni_populate_smc_voltage_table(rdev, &eg_pi->vddci_voltage_table, table);

		table->voltageMaskTable.lowMask[NISLANDS_SMC_VOLTAGEMASK_VDDCI] =
			cpu_to_be32(eg_pi->vddci_voltage_table.mask_low);
		table->voltageMaskTable.highMask[NISLANDS_SMC_VOLTAGEMASK_VDDCI] = 0;
	}
}
1298 
/*
 * Look up @value in @table and fill @voltage with the first entry whose
 * value is greater than or equal to it.
 *
 * On a match, voltage->index receives the entry index (as u8) and
 * voltage->value the entry's value in big-endian form, and 0 is returned.
 * If no entry qualifies, @voltage is left untouched and -EINVAL is
 * returned.
 */
static int ni_populate_voltage_value(struct radeon_device *rdev,
				     struct atom_voltage_table *table,
				     u16 value,
				     NISLANDS_SMC_VOLTAGE_VALUE *voltage)
{
	unsigned int idx;

	for (idx = 0; idx < table->count; idx++) {
		if (table->entries[idx].value < value)
			continue;

		voltage->index = (u8)idx;
		voltage->value = cpu_to_be16(table->entries[idx].value);
		return 0;
	}

	return -EINVAL;
}
1319 
/*
 * Select the MVDD setting for memory clock @mclk.
 *
 * The low setting (eg_pi->mvdd_low_index / MVDD_LOW_VALUE) is used only
 * when MVDD control is enabled and @mclk does not exceed
 * pi->mvdd_split_frequency; in every other case the high setting
 * (eg_pi->mvdd_high_index / MVDD_HIGH_VALUE) is used.
 */
static void ni_populate_mvdd_value(struct radeon_device *rdev,
				   u32 mclk,
				   NISLANDS_SMC_VOLTAGE_VALUE *voltage)
{
	struct rv7xx_power_info *pi = rv770_get_pi(rdev);
	struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);

	if (pi->mvdd_control && mclk <= pi->mvdd_split_frequency) {
		voltage->index = eg_pi->mvdd_low_index;
		voltage->value = cpu_to_be16(MVDD_LOW_VALUE);
	} else {
		voltage->index = eg_pi->mvdd_high_index;
		voltage->value = cpu_to_be16(MVDD_HIGH_VALUE);
	}
}
1341 
/*
 * Determine the "standard" voltage for an SMC voltage value.
 *
 * When a CAC leakage table exists and voltage->index is within it, the
 * table's vddc entry at that index is used; otherwise the CPU-endian form
 * of voltage->value is used.  Always returns 0.
 */
static int ni_get_std_voltage_value(struct radeon_device *rdev,
				    NISLANDS_SMC_VOLTAGE_VALUE *voltage,
				    u16 *std_voltage)
{
	if (!rdev->pm.dpm.dyn_state.cac_leakage_table.entries ||
	    ((u32)voltage->index >= rdev->pm.dpm.dyn_state.cac_leakage_table.count))
		*std_voltage = be16_to_cpu(voltage->value);
	else
		*std_voltage = rdev->pm.dpm.dyn_state.cac_leakage_table.entries[voltage->index].vddc;

	return 0;
}
1354 
/*
 * Store @index and the big-endian form of @value into @voltage.
 */
static void ni_populate_std_voltage_value(struct radeon_device *rdev,
					  u16 value, u8 index,
					  NISLANDS_SMC_VOLTAGE_VALUE *voltage)
{
	voltage->value = cpu_to_be16(value);
	voltage->index = index;
}
1362 
ni_get_smc_power_scaling_factor(struct radeon_device * rdev)1363 static u32 ni_get_smc_power_scaling_factor(struct radeon_device *rdev)
1364 {
1365 	u32 xclk_period;
1366 	u32 xclk = radeon_get_xclk(rdev);
1367 	u32 tmp = RREG32(CG_CAC_CTRL) & TID_CNT_MASK;
1368 
1369 	xclk_period = (1000000000UL / xclk);
1370 	xclk_period /= 10000UL;
1371 
1372 	return tmp * xclk_period;
1373 }
1374 
/*
 * Scale a power value for the SMC: multiply by @scaling_factor, then shift
 * left by two bits.  Computed in 32-bit unsigned arithmetic.
 */
static u32 ni_scale_power_for_smc(u32 power_in_watts, u32 scaling_factor)
{
	u32 scaled = power_in_watts * scaling_factor;

	return scaled << 2;
}
1379 
/*
 * Compute the power boost limit for @radeon_state.
 *
 * The limit is
 *
 *     near_tdp_limit * std_vddc_med^2 * 90 / (std_vddc_high^2 * 100)
 *
 * where std_vddc_med and std_vddc_high are the standardized VDDC values of
 * the second-highest and highest performance levels.
 *
 * Returns 0 (no boost limit) when power containment or the boost limit is
 * disabled, when the state has fewer than three performance levels, when a
 * voltage lookup fails, when the highest level's standardized VDDC is 0
 * (which would otherwise be a division by zero), or when the result does
 * not fit in 32 bits.
 */
static u32 ni_calculate_power_boost_limit(struct radeon_device *rdev,
					  struct radeon_ps *radeon_state,
					  u32 near_tdp_limit)
{
	struct ni_ps *state = ni_get_ps(radeon_state);
	struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
	struct ni_power_info *ni_pi = ni_get_pi(rdev);
	NISLANDS_SMC_VOLTAGE_VALUE vddc;
	u16 std_vddc_med;
	u16 std_vddc_high;
	u64 tmp, n, d;
	int ret;

	if (!ni_pi->enable_power_containment ||
	    !ni_pi->use_power_boost_limit)
		return 0;

	if (state->performance_level_count < 3)
		return 0;

	/* Standardized VDDC of the second-highest level. */
	ret = ni_populate_voltage_value(rdev, &eg_pi->vddc_voltage_table,
					state->performance_levels[state->performance_level_count - 2].vddc,
					&vddc);
	if (ret)
		return 0;

	ret = ni_get_std_voltage_value(rdev, &vddc, &std_vddc_med);
	if (ret)
		return 0;

	/* Standardized VDDC of the highest level. */
	ret = ni_populate_voltage_value(rdev, &eg_pi->vddc_voltage_table,
					state->performance_levels[state->performance_level_count - 1].vddc,
					&vddc);
	if (ret)
		return 0;

	ret = ni_get_std_voltage_value(rdev, &vddc, &std_vddc_high);
	if (ret)
		return 0;

	n = ((u64)near_tdp_limit * ((u64)std_vddc_med * (u64)std_vddc_med) * 90);
	d = ((u64)std_vddc_high * (u64)std_vddc_high * 100);

	/* A zero high-level voltage would make div64_u64() divide by zero. */
	if (d == 0)
		return 0;

	tmp = div64_u64(n, d);

	/* Reject results that do not fit in the 32-bit return value. */
	if (tmp >> 32)
		return 0;

	return (u32)tmp;
}
1431 
/*
 * Apply a percentage adjustment to the TDP limits.
 *
 * @adjust_polarity: true raises the limit by @tdp_adjustment percent,
 *                   false lowers it by that percentage.
 * @tdp_limit:       receives the adjusted TDP limit.
 * @near_tdp_limit:  receives rdev->pm.dpm.near_tdp_limit shifted by the
 *                   same absolute amount as the TDP limit.
 *
 * Returns -EINVAL (outputs untouched) if @tdp_adjustment exceeds
 * rdev->pm.dpm.tdp_od_limit, 0 otherwise.
 */
static int ni_calculate_adjusted_tdp_limits(struct radeon_device *rdev,
					    bool adjust_polarity,
					    u32 tdp_adjustment,
					    u32 *tdp_limit,
					    u32 *near_tdp_limit)
{
	u32 percent;

	if (tdp_adjustment > (u32)rdev->pm.dpm.tdp_od_limit)
		return -EINVAL;

	percent = adjust_polarity ? (100 + tdp_adjustment) : (100 - tdp_adjustment);

	*tdp_limit = (percent * rdev->pm.dpm.tdp_limit) / 100;

	if (adjust_polarity)
		*near_tdp_limit = rdev->pm.dpm.near_tdp_limit + (*tdp_limit - rdev->pm.dpm.tdp_limit);
	else
		*near_tdp_limit = rdev->pm.dpm.near_tdp_limit - (rdev->pm.dpm.tdp_limit - *tdp_limit);

	return 0;
}
1451 
ni_populate_smc_tdp_limits(struct radeon_device * rdev,struct radeon_ps * radeon_state)1452 static int ni_populate_smc_tdp_limits(struct radeon_device *rdev,
1453 				      struct radeon_ps *radeon_state)
1454 {
1455 	struct rv7xx_power_info *pi = rv770_get_pi(rdev);
1456 	struct ni_power_info *ni_pi = ni_get_pi(rdev);
1457 
1458 	if (ni_pi->enable_power_containment) {
1459 		NISLANDS_SMC_STATETABLE *smc_table = &ni_pi->smc_statetable;
1460 		u32 scaling_factor = ni_get_smc_power_scaling_factor(rdev);
1461 		u32 tdp_limit;
1462 		u32 near_tdp_limit;
1463 		u32 power_boost_limit;
1464 		int ret;
1465 
1466 		if (scaling_factor == 0)
1467 			return -EINVAL;
1468 
1469 		memset(smc_table, 0, sizeof(NISLANDS_SMC_STATETABLE));
1470 
1471 		ret = ni_calculate_adjusted_tdp_limits(rdev,
1472 						       false, /* ??? */
1473 						       rdev->pm.dpm.tdp_adjustment,
1474 						       &tdp_limit,
1475 						       &near_tdp_limit);
1476 		if (ret)
1477 			return ret;
1478 
1479 		power_boost_limit = ni_calculate_power_boost_limit(rdev, radeon_state,
1480 								   near_tdp_limit);
1481 
1482 		smc_table->dpm2Params.TDPLimit =
1483 			cpu_to_be32(ni_scale_power_for_smc(tdp_limit, scaling_factor));
1484 		smc_table->dpm2Params.NearTDPLimit =
1485 			cpu_to_be32(ni_scale_power_for_smc(near_tdp_limit, scaling_factor));
1486 		smc_table->dpm2Params.SafePowerLimit =
1487 			cpu_to_be32(ni_scale_power_for_smc((near_tdp_limit * NISLANDS_DPM2_TDP_SAFE_LIMIT_PERCENT) / 100,
1488 							   scaling_factor));
1489 		smc_table->dpm2Params.PowerBoostLimit =
1490 			cpu_to_be32(ni_scale_power_for_smc(power_boost_limit, scaling_factor));
1491 
1492 		ret = rv770_copy_bytes_to_smc(rdev,
1493 					      (u16)(pi->state_table_start + offsetof(NISLANDS_SMC_STATETABLE, dpm2Params) +
1494 						    offsetof(PP_NIslands_DPM2Parameters, TDPLimit)),
1495 					      (u8 *)(&smc_table->dpm2Params.TDPLimit),
1496 					      sizeof(u32) * 4, pi->sram_end);
1497 		if (ret)
1498 			return ret;
1499 	}
1500 
1501 	return 0;
1502 }
1503 
/*
 * Copy one MC arbiter register set to another and request a switch to the
 * destination set.
 *
 * The DRAM timing registers and the burst-time field of set @arb_freq_src
 * are read and written to the corresponding registers/field of set
 * @arb_freq_dest.  Then the low four bits of MC_CG_CONFIG are set and
 * @arb_freq_dest is written to the CG_ARB_REQ field of MC_ARB_CG.
 *
 * Both arguments must be one of MC_CG_ARB_FREQ_F0..F3; otherwise -EINVAL is
 * returned.  An invalid destination is detected only after the source set
 * has been read, but before anything is written.
 */
int ni_copy_and_switch_arb_sets(struct radeon_device *rdev,
				u32 arb_freq_src, u32 arb_freq_dest)
{
	u32 timing;
	u32 timing2;
	u32 burst;
	u32 cg_config;

	/* Fetch the source set. */
	switch (arb_freq_src) {
	case MC_CG_ARB_FREQ_F0:
		timing  = RREG32(MC_ARB_DRAM_TIMING);
		timing2 = RREG32(MC_ARB_DRAM_TIMING2);
		burst = (RREG32(MC_ARB_BURST_TIME) & STATE0_MASK) >> STATE0_SHIFT;
		break;
	case MC_CG_ARB_FREQ_F1:
		timing  = RREG32(MC_ARB_DRAM_TIMING_1);
		timing2 = RREG32(MC_ARB_DRAM_TIMING2_1);
		burst = (RREG32(MC_ARB_BURST_TIME) & STATE1_MASK) >> STATE1_SHIFT;
		break;
	case MC_CG_ARB_FREQ_F2:
		timing  = RREG32(MC_ARB_DRAM_TIMING_2);
		timing2 = RREG32(MC_ARB_DRAM_TIMING2_2);
		burst = (RREG32(MC_ARB_BURST_TIME) & STATE2_MASK) >> STATE2_SHIFT;
		break;
	case MC_CG_ARB_FREQ_F3:
		timing  = RREG32(MC_ARB_DRAM_TIMING_3);
		timing2 = RREG32(MC_ARB_DRAM_TIMING2_3);
		burst = (RREG32(MC_ARB_BURST_TIME) & STATE3_MASK) >> STATE3_SHIFT;
		break;
	default:
		return -EINVAL;
	}

	/* Store into the destination set. */
	switch (arb_freq_dest) {
	case MC_CG_ARB_FREQ_F0:
		WREG32(MC_ARB_DRAM_TIMING, timing);
		WREG32(MC_ARB_DRAM_TIMING2, timing2);
		WREG32_P(MC_ARB_BURST_TIME, STATE0(burst), ~STATE0_MASK);
		break;
	case MC_CG_ARB_FREQ_F1:
		WREG32(MC_ARB_DRAM_TIMING_1, timing);
		WREG32(MC_ARB_DRAM_TIMING2_1, timing2);
		WREG32_P(MC_ARB_BURST_TIME, STATE1(burst), ~STATE1_MASK);
		break;
	case MC_CG_ARB_FREQ_F2:
		WREG32(MC_ARB_DRAM_TIMING_2, timing);
		WREG32(MC_ARB_DRAM_TIMING2_2, timing2);
		WREG32_P(MC_ARB_BURST_TIME, STATE2(burst), ~STATE2_MASK);
		break;
	case MC_CG_ARB_FREQ_F3:
		WREG32(MC_ARB_DRAM_TIMING_3, timing);
		WREG32(MC_ARB_DRAM_TIMING2_3, timing2);
		WREG32_P(MC_ARB_BURST_TIME, STATE3(burst), ~STATE3_MASK);
		break;
	default:
		return -EINVAL;
	}

	/* Set the low nibble of MC_CG_CONFIG, then request the new set. */
	cg_config = RREG32(MC_CG_CONFIG) | 0x0000000F;
	WREG32(MC_CG_CONFIG, cg_config);
	WREG32_P(MC_ARB_CG, CG_ARB_REQ(arb_freq_dest), ~CG_ARB_REQ_MASK);

	return 0;
}
1568 
ni_init_arb_table_index(struct radeon_device * rdev)1569 static int ni_init_arb_table_index(struct radeon_device *rdev)
1570 {
1571 	struct rv7xx_power_info *pi = rv770_get_pi(rdev);
1572 	struct ni_power_info *ni_pi = ni_get_pi(rdev);
1573 	u32 tmp;
1574 	int ret;
1575 
1576 	ret = rv770_read_smc_sram_dword(rdev, ni_pi->arb_table_start,
1577 					&tmp, pi->sram_end);
1578 	if (ret)
1579 		return ret;
1580 
1581 	tmp &= 0x00FFFFFF;
1582 	tmp |= ((u32)MC_CG_ARB_FREQ_F1) << 24;
1583 
1584 	return rv770_write_smc_sram_dword(rdev, ni_pi->arb_table_start,
1585 					  tmp, pi->sram_end);
1586 }
1587 
ni_initial_switch_from_arb_f0_to_f1(struct radeon_device * rdev)1588 static int ni_initial_switch_from_arb_f0_to_f1(struct radeon_device *rdev)
1589 {
1590 	return ni_copy_and_switch_arb_sets(rdev, MC_CG_ARB_FREQ_F0, MC_CG_ARB_FREQ_F1);
1591 }
1592 
ni_force_switch_to_arb_f0(struct radeon_device * rdev)1593 static int ni_force_switch_to_arb_f0(struct radeon_device *rdev)
1594 {
1595 	struct rv7xx_power_info *pi = rv770_get_pi(rdev);
1596 	struct ni_power_info *ni_pi = ni_get_pi(rdev);
1597 	u32 tmp;
1598 	int ret;
1599 
1600 	ret = rv770_read_smc_sram_dword(rdev, ni_pi->arb_table_start,
1601 					&tmp, pi->sram_end);
1602 	if (ret)
1603 		return ret;
1604 
1605 	tmp = (tmp >> 24) & 0xff;
1606 
1607 	if (tmp == MC_CG_ARB_FREQ_F0)
1608 		return 0;
1609 
1610 	return ni_copy_and_switch_arb_sets(rdev, tmp, MC_CG_ARB_FREQ_F0);
1611 }
1612 
/*
 * Fill @arb_regs for performance level @pl.
 *
 * The refresh rate comes from rv770_calculate_memory_refresh_rate() for
 * pl->sclk.  radeon_atom_set_engine_dram_timings() is then called for the
 * level's sclk/mclk, after which MC_ARB_DRAM_TIMING and
 * MC_ARB_DRAM_TIMING2 are read back and stored big-endian.
 *
 * Always returns 0.
 */
static int ni_populate_memory_timing_parameters(struct radeon_device *rdev,
						struct rv7xx_pl *pl,
						SMC_NIslands_MCArbDramTimingRegisterSet *arb_regs)
{
	u32 timing;
	u32 timing2;

	arb_regs->mc_arb_rfsh_rate =
		(u8)rv770_calculate_memory_refresh_rate(rdev, pl->sclk);

	/* Must run before the register read-back below. */
	radeon_atom_set_engine_dram_timings(rdev, pl->sclk, pl->mclk);

	timing = RREG32(MC_ARB_DRAM_TIMING);
	timing2 = RREG32(MC_ARB_DRAM_TIMING2);

	arb_regs->mc_arb_dram_timing2 = cpu_to_be32(timing2);
	arb_regs->mc_arb_dram_timing  = cpu_to_be32(timing);

	return 0;
}
1634 
ni_do_program_memory_timing_parameters(struct radeon_device * rdev,struct radeon_ps * radeon_state,unsigned int first_arb_set)1635 static int ni_do_program_memory_timing_parameters(struct radeon_device *rdev,
1636 						  struct radeon_ps *radeon_state,
1637 						  unsigned int first_arb_set)
1638 {
1639 	struct rv7xx_power_info *pi = rv770_get_pi(rdev);
1640 	struct ni_power_info *ni_pi = ni_get_pi(rdev);
1641 	struct ni_ps *state = ni_get_ps(radeon_state);
1642 	SMC_NIslands_MCArbDramTimingRegisterSet arb_regs = { 0 };
1643 	int i, ret = 0;
1644 
1645 	for (i = 0; i < state->performance_level_count; i++) {
1646 		ret = ni_populate_memory_timing_parameters(rdev, &state->performance_levels[i], &arb_regs);
1647 		if (ret)
1648 			break;
1649 
1650 		ret = rv770_copy_bytes_to_smc(rdev,
1651 					      (u16)(ni_pi->arb_table_start +
1652 						    offsetof(SMC_NIslands_MCArbDramTimingRegisters, data) +
1653 						    sizeof(SMC_NIslands_MCArbDramTimingRegisterSet) * (first_arb_set + i)),
1654 					      (u8 *)&arb_regs,
1655 					      (u16)sizeof(SMC_NIslands_MCArbDramTimingRegisterSet),
1656 					      pi->sram_end);
1657 		if (ret)
1658 			break;
1659 	}
1660 	return ret;
1661 }
1662 
ni_program_memory_timing_parameters(struct radeon_device * rdev,struct radeon_ps * radeon_new_state)1663 static int ni_program_memory_timing_parameters(struct radeon_device *rdev,
1664 					       struct radeon_ps *radeon_new_state)
1665 {
1666 	return ni_do_program_memory_timing_parameters(rdev, radeon_new_state,
1667 						      NISLANDS_DRIVER_STATE_ARB_INDEX);
1668 }
1669 
ni_populate_initial_mvdd_value(struct radeon_device * rdev,struct NISLANDS_SMC_VOLTAGE_VALUE * voltage)1670 static void ni_populate_initial_mvdd_value(struct radeon_device *rdev,
1671 					   struct NISLANDS_SMC_VOLTAGE_VALUE *voltage)
1672 {
1673 	struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
1674 
1675 	voltage->index = eg_pi->mvdd_high_index;
1676 	voltage->value = cpu_to_be16(MVDD_HIGH_VALUE);
1677 }
1678 
/*
 * Build table->initialState from the first performance level of
 * @radeon_initial_state and the clock register values cached in
 * ni_pi->clock_registers.
 *
 * The state gets a single level and has PPSMC_SWSTATE_FLAG_DC OR-ed into
 * its flags.  Voltage lookup failures are tolerated: the affected voltage
 * fields are simply left as they were.  Always returns 0.
 */
static int ni_populate_smc_initial_state(struct radeon_device *rdev,
					 struct radeon_ps *radeon_initial_state,
					 NISLANDS_SMC_STATETABLE *table)
{
	struct ni_ps *initial_state = ni_get_ps(radeon_initial_state);
	struct rv7xx_power_info *pi = rv770_get_pi(rdev);
	struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
	struct ni_power_info *ni_pi = ni_get_pi(rdev);

	/* Engine clock (SPLL) registers and value. */
	table->initialState.level.sclk.vCG_SPLL_FUNC_CNTL =
		cpu_to_be32(ni_pi->clock_registers.cg_spll_func_cntl);
	table->initialState.level.sclk.vCG_SPLL_FUNC_CNTL_2 =
		cpu_to_be32(ni_pi->clock_registers.cg_spll_func_cntl_2);
	table->initialState.level.sclk.vCG_SPLL_FUNC_CNTL_3 =
		cpu_to_be32(ni_pi->clock_registers.cg_spll_func_cntl_3);
	table->initialState.level.sclk.vCG_SPLL_FUNC_CNTL_4 =
		cpu_to_be32(ni_pi->clock_registers.cg_spll_func_cntl_4);
	table->initialState.level.sclk.vCG_SPLL_SPREAD_SPECTRUM =
		cpu_to_be32(ni_pi->clock_registers.cg_spll_spread_spectrum);
	table->initialState.level.sclk.vCG_SPLL_SPREAD_SPECTRUM_2 =
		cpu_to_be32(ni_pi->clock_registers.cg_spll_spread_spectrum_2);
	table->initialState.level.sclk.sclk_value =
		cpu_to_be32(initial_state->performance_levels[0].sclk);

	/* Memory clock (MPLL) registers and value. */
	table->initialState.level.mclk.vMPLL_AD_FUNC_CNTL =
		cpu_to_be32(ni_pi->clock_registers.mpll_ad_func_cntl);
	table->initialState.level.mclk.vMPLL_AD_FUNC_CNTL_2 =
		cpu_to_be32(ni_pi->clock_registers.mpll_ad_func_cntl_2);
	table->initialState.level.mclk.vMPLL_DQ_FUNC_CNTL =
		cpu_to_be32(ni_pi->clock_registers.mpll_dq_func_cntl);
	table->initialState.level.mclk.vMPLL_DQ_FUNC_CNTL_2 =
		cpu_to_be32(ni_pi->clock_registers.mpll_dq_func_cntl_2);
	table->initialState.level.mclk.vMCLK_PWRMGT_CNTL =
		cpu_to_be32(ni_pi->clock_registers.mclk_pwrmgt_cntl);
	table->initialState.level.mclk.vDLL_CNTL =
		cpu_to_be32(ni_pi->clock_registers.dll_cntl);
	table->initialState.level.mclk.vMPLL_SS =
		cpu_to_be32(ni_pi->clock_registers.mpll_ss1);
	table->initialState.level.mclk.vMPLL_SS2 =
		cpu_to_be32(ni_pi->clock_registers.mpll_ss2);
	table->initialState.level.mclk.mclk_value =
		cpu_to_be32(initial_state->performance_levels[0].mclk);

	table->initialState.level.arbRefreshState =
		NISLANDS_INITIAL_STATE_ARB_INDEX;
	table->initialState.level.ACIndex = 0;

	/* VDDC and its standardized counterpart; skipped on lookup failure. */
	if (ni_populate_voltage_value(rdev, &eg_pi->vddc_voltage_table,
				      initial_state->performance_levels[0].vddc,
				      &table->initialState.level.vddc) == 0) {
		u16 std_vddc;

		if (ni_get_std_voltage_value(rdev,
					     &table->initialState.level.vddc,
					     &std_vddc) == 0)
			ni_populate_std_voltage_value(rdev, std_vddc,
						      table->initialState.level.vddc.index,
						      &table->initialState.level.std_vddc);
	}

	/* VDDCI only when it is under driver control; result is ignored. */
	if (eg_pi->vddci_control)
		ni_populate_voltage_value(rdev,
					  &eg_pi->vddci_voltage_table,
					  initial_state->performance_levels[0].vddci,
					  &table->initialState.level.vddci);

	ni_populate_initial_mvdd_value(rdev, &table->initialState.level.mvdd);

	table->initialState.level.aT = cpu_to_be32(CG_R(0xffff) | CG_L(0));
	table->initialState.level.bSP = cpu_to_be32(pi->dsp);

	table->initialState.level.gen2PCIE = pi->boot_in_gen2 ? 1 : 0;

	/* Strobe mode and EDC flags are only set up for GDDR5 memory. */
	if (pi->mem_gddr5) {
		table->initialState.level.strobeMode =
			cypress_get_strobe_mode_settings(rdev,
							 initial_state->performance_levels[0].mclk);

		table->initialState.level.mcFlags =
			(initial_state->performance_levels[0].mclk > pi->mclk_edc_enable_threshold) ?
			(NISLANDS_SMC_MC_EDC_RD_FLAG | NISLANDS_SMC_MC_EDC_WR_FLAG) : 0;
	}

	table->initialState.levelCount = 1;
	table->initialState.flags |= PPSMC_SWSTATE_FLAG_DC;

	/* DPM2 parameters are all zero for the initial state. */
	table->initialState.level.dpm2.MaxPS = 0;
	table->initialState.level.dpm2.NearTDPDec = 0;
	table->initialState.level.dpm2.AboveSafeInc = 0;
	table->initialState.level.dpm2.BelowSafeInc = 0;

	/* SQ power throttle fields are written with all mask bits set. */
	table->initialState.level.SQPowerThrottle =
		cpu_to_be32(MIN_POWER_MASK | MAX_POWER_MASK);
	table->initialState.level.SQPowerThrottle_2 =
		cpu_to_be32(MAX_POWER_DELTA_MASK | STI_SIZE_MASK | LTI_RATIO_MASK);

	return 0;
}
1789 
/*
 * ni_populate_smc_acpi_state - fill in the ACPI entry of the SMC state table
 * @rdev: radeon device
 * @table: SMC state table; table->initialState must already be populated
 *
 * The ACPI state starts as a copy of table->initialState with the DC flag
 * cleared.  Voltages, the PCIe gen2 setting, the memory/engine PLL register
 * images and the DPM2/SQ throttle fields are then overridden.
 *
 * Failures of the voltage lookups are not propagated; the function always
 * returns 0.
 */
static int ni_populate_smc_acpi_state(struct radeon_device *rdev,
				      NISLANDS_SMC_STATETABLE *table)
{
	struct rv7xx_power_info *pi = rv770_get_pi(rdev);
	struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
	struct ni_power_info *ni_pi = ni_get_pi(rdev);
	const u32 mrdck_reset_bits = MRDCKA0_RESET | MRDCKA1_RESET |
				     MRDCKB0_RESET | MRDCKB1_RESET |
				     MRDCKC0_RESET | MRDCKC1_RESET |
				     MRDCKD0_RESET | MRDCKD1_RESET;
	const u32 mrdck_pdnb_bits = MRDCKA0_PDNB | MRDCKA1_PDNB |
				    MRDCKB0_PDNB | MRDCKB1_PDNB |
				    MRDCKC0_PDNB | MRDCKC1_PDNB |
				    MRDCKD0_PDNB | MRDCKD1_PDNB;
	const u32 mrdck_bypass_bits = MRDCKA0_BYPASS | MRDCKA1_BYPASS |
				      MRDCKB0_BYPASS | MRDCKB1_BYPASS |
				      MRDCKC0_BYPASS | MRDCKC1_BYPASS |
				      MRDCKD0_BYPASS | MRDCKD1_BYPASS;
	u32 ad_cntl = ni_pi->clock_registers.mpll_ad_func_cntl;
	u32 ad_cntl_2 = ni_pi->clock_registers.mpll_ad_func_cntl_2;
	u32 dq_cntl = ni_pi->clock_registers.mpll_dq_func_cntl;
	u32 dq_cntl_2 = ni_pi->clock_registers.mpll_dq_func_cntl_2;
	u32 spll_cntl_2 = ni_pi->clock_registers.cg_spll_func_cntl_2;
	u32 pwrmgt = ni_pi->clock_registers.mclk_pwrmgt_cntl;
	u32 dll = ni_pi->clock_registers.dll_cntl;
	u16 std_vddc;

	table->ACPIState = table->initialState;
	table->ACPIState.flags &= ~PPSMC_SWSTATE_FLAG_DC;

	/*
	 * Use the dedicated ACPI VDDC when one is set, otherwise the minimum
	 * VDDC of the table.  The standardized voltage is only filled in when
	 * both lookups succeed.
	 */
	if (!ni_populate_voltage_value(rdev, &eg_pi->vddc_voltage_table,
				       pi->acpi_vddc ? pi->acpi_vddc :
						       pi->min_vddc_in_table,
				       &table->ACPIState.level.vddc) &&
	    !ni_get_std_voltage_value(rdev, &table->ACPIState.level.vddc,
				      &std_vddc))
		ni_populate_std_voltage_value(rdev, std_vddc,
					      table->ACPIState.level.vddc.index,
					      &table->ACPIState.level.std_vddc);

	/* gen2 only with an ACPI VDDC and both gen2 flags set. */
	table->ACPIState.level.gen2PCIE =
		(pi->acpi_vddc && pi->pcie_gen2 && pi->acpi_pcie_gen2) ? 1 : 0;

	if (eg_pi->acpi_vddci && eg_pi->vddci_control)
		ni_populate_voltage_value(rdev,
					  &eg_pi->vddci_voltage_table,
					  eg_pi->acpi_vddci,
					  &table->ACPIState.level.vddci);

	/* Memory PLL register images. */
	ad_cntl &= ~PDNB;
	ad_cntl_2 |= BIAS_GEN_PDNB | RESET_EN;
	if (pi->mem_gddr5)
		dq_cntl &= ~PDNB;
	dq_cntl_2 |= BIAS_GEN_PDNB | RESET_EN | BYPASS;

	/* Set every MRDCK reset bit, clear every PDNB bit, set every bypass bit. */
	pwrmgt = (pwrmgt | mrdck_reset_bits) & ~mrdck_pdnb_bits;
	dll |= mrdck_bypass_bits;

	table->ACPIState.level.mclk.vMPLL_AD_FUNC_CNTL = cpu_to_be32(ad_cntl);
	table->ACPIState.level.mclk.vMPLL_AD_FUNC_CNTL_2 = cpu_to_be32(ad_cntl_2);
	table->ACPIState.level.mclk.vMPLL_DQ_FUNC_CNTL = cpu_to_be32(dq_cntl);
	table->ACPIState.level.mclk.vMPLL_DQ_FUNC_CNTL_2 = cpu_to_be32(dq_cntl_2);
	table->ACPIState.level.mclk.vMCLK_PWRMGT_CNTL = cpu_to_be32(pwrmgt);
	table->ACPIState.level.mclk.vDLL_CNTL = cpu_to_be32(dll);
	table->ACPIState.level.mclk.mclk_value = 0;

	/* Engine PLL: only the SCLK mux selection (set to 4) is changed. */
	spll_cntl_2 = (spll_cntl_2 & ~SCLK_MUX_SEL_MASK) | SCLK_MUX_SEL(4);

	table->ACPIState.level.sclk.vCG_SPLL_FUNC_CNTL =
		cpu_to_be32(ni_pi->clock_registers.cg_spll_func_cntl);
	table->ACPIState.level.sclk.vCG_SPLL_FUNC_CNTL_2 = cpu_to_be32(spll_cntl_2);
	table->ACPIState.level.sclk.vCG_SPLL_FUNC_CNTL_3 =
		cpu_to_be32(ni_pi->clock_registers.cg_spll_func_cntl_3);
	table->ACPIState.level.sclk.vCG_SPLL_FUNC_CNTL_4 =
		cpu_to_be32(ni_pi->clock_registers.cg_spll_func_cntl_4);
	table->ACPIState.level.sclk.sclk_value = 0;

	ni_populate_mvdd_value(rdev, 0, &table->ACPIState.level.mvdd);

	if (eg_pi->dynamic_ac_timing)
		table->ACPIState.level.ACIndex = 1;

	table->ACPIState.level.dpm2.MaxPS = 0;
	table->ACPIState.level.dpm2.NearTDPDec = 0;
	table->ACPIState.level.dpm2.AboveSafeInc = 0;
	table->ACPIState.level.dpm2.BelowSafeInc = 0;

	/* All SQ power throttle fields are set to their full masks. */
	table->ACPIState.level.SQPowerThrottle =
		cpu_to_be32(MIN_POWER_MASK | MAX_POWER_MASK);
	table->ACPIState.level.SQPowerThrottle_2 =
		cpu_to_be32(MAX_POWER_DELTA_MASK | STI_SIZE_MASK | LTI_RATIO_MASK);

	return 0;
}
1937 
ni_init_smc_table(struct radeon_device * rdev)1938 static int ni_init_smc_table(struct radeon_device *rdev)
1939 {
1940 	struct rv7xx_power_info *pi = rv770_get_pi(rdev);
1941 	struct ni_power_info *ni_pi = ni_get_pi(rdev);
1942 	int ret;
1943 	struct radeon_ps *radeon_boot_state = rdev->pm.dpm.boot_ps;
1944 	NISLANDS_SMC_STATETABLE *table = &ni_pi->smc_statetable;
1945 
1946 	memset(table, 0, sizeof(NISLANDS_SMC_STATETABLE));
1947 
1948 	ni_populate_smc_voltage_tables(rdev, table);
1949 
1950 	switch (rdev->pm.int_thermal_type) {
1951 	case THERMAL_TYPE_NI:
1952 	case THERMAL_TYPE_EMC2103_WITH_INTERNAL:
1953 		table->thermalProtectType = PPSMC_THERMAL_PROTECT_TYPE_INTERNAL;
1954 		break;
1955 	case THERMAL_TYPE_NONE:
1956 		table->thermalProtectType = PPSMC_THERMAL_PROTECT_TYPE_NONE;
1957 		break;
1958 	default:
1959 		table->thermalProtectType = PPSMC_THERMAL_PROTECT_TYPE_EXTERNAL;
1960 		break;
1961 	}
1962 
1963 	if (rdev->pm.dpm.platform_caps & ATOM_PP_PLATFORM_CAP_HARDWAREDC)
1964 		table->systemFlags |= PPSMC_SYSTEMFLAG_GPIO_DC;
1965 
1966 	if (rdev->pm.dpm.platform_caps & ATOM_PP_PLATFORM_CAP_REGULATOR_HOT)
1967 		table->systemFlags |= PPSMC_SYSTEMFLAG_REGULATOR_HOT;
1968 
1969 	if (rdev->pm.dpm.platform_caps & ATOM_PP_PLATFORM_CAP_STEPVDDC)
1970 		table->systemFlags |= PPSMC_SYSTEMFLAG_STEPVDDC;
1971 
1972 	if (pi->mem_gddr5)
1973 		table->systemFlags |= PPSMC_SYSTEMFLAG_GDDR5;
1974 
1975 	ret = ni_populate_smc_initial_state(rdev, radeon_boot_state, table);
1976 	if (ret)
1977 		return ret;
1978 
1979 	ret = ni_populate_smc_acpi_state(rdev, table);
1980 	if (ret)
1981 		return ret;
1982 
1983 	table->driverState.flags = table->initialState.flags;
1984 	table->driverState.levelCount = table->initialState.levelCount;
1985 	table->driverState.levels[0] = table->initialState.level;
1986 
1987 	table->ULVState = table->initialState;
1988 
1989 	ret = ni_do_program_memory_timing_parameters(rdev, radeon_boot_state,
1990 						     NISLANDS_INITIAL_STATE_ARB_INDEX);
1991 	if (ret)
1992 		return ret;
1993 
1994 	return rv770_copy_bytes_to_smc(rdev, pi->state_table_start, (u8 *)table,
1995 				       sizeof(NISLANDS_SMC_STATETABLE), pi->sram_end);
1996 }
1997 
/*
 * ni_calculate_sclk_params - compute engine PLL register images for a clock
 * @rdev: radeon device
 * @engine_clock: requested engine clock
 * @sclk: output; receives the clock and the SPLL register images in CPU
 *        byte order
 *
 * The dividers come from radeon_atom_get_clock_dividers(); the register
 * images are derived from the values cached in ni_pi->clock_registers.
 * Spread spectrum fields are only touched when pi->sclk_ss is set and
 * spread spectrum info is found for the resulting VCO frequency.
 *
 * Returns 0 on success or the error from the divider lookup, in which case
 * @sclk is left untouched.
 */
static int ni_calculate_sclk_params(struct radeon_device *rdev,
				    u32 engine_clock,
				    NISLANDS_SMC_SCLK_VALUE *sclk)
{
	struct rv7xx_power_info *pi = rv770_get_pi(rdev);
	struct ni_power_info *ni_pi = ni_get_pi(rdev);
	struct atom_clock_dividers dividers;
	u32 func_cntl = ni_pi->clock_registers.cg_spll_func_cntl;
	u32 func_cntl_2 = ni_pi->clock_registers.cg_spll_func_cntl_2;
	u32 func_cntl_3 = ni_pi->clock_registers.cg_spll_func_cntl_3;
	u32 ss_cntl = ni_pi->clock_registers.cg_spll_spread_spectrum;
	u32 ss_cntl_2 = ni_pi->clock_registers.cg_spll_spread_spectrum_2;
	u32 ref_clk = rdev->clock.spll.reference_freq;
	u32 ref_div;
	u32 fb_div;
	u64 scaled;
	int err;

	err = radeon_atom_get_clock_dividers(rdev, COMPUTE_ENGINE_PLL_PARAM,
					     engine_clock, false, &dividers);
	if (err)
		return err;

	ref_div = 1 + dividers.ref_div;

	/*
	 * NOTE(review): 16834 looks like a transposition of 16384 (2^14);
	 * left unchanged here because it alters the programmed feedback
	 * divider - confirm against the hardware documentation.
	 */
	scaled = (u64) engine_clock * ref_div * dividers.post_div * 16834;
	do_div(scaled, ref_clk);
	fb_div = (u32) scaled;

	func_cntl &= ~(SPLL_PDIV_A_MASK | SPLL_REF_DIV_MASK);
	func_cntl |= SPLL_REF_DIV(dividers.ref_div) |
		     SPLL_PDIV_A(dividers.post_div);

	func_cntl_2 = (func_cntl_2 & ~SCLK_MUX_SEL_MASK) | SCLK_MUX_SEL(2);

	func_cntl_3 &= ~SPLL_FB_DIV_MASK;
	func_cntl_3 |= SPLL_FB_DIV(fb_div) | SPLL_DITHEN;

	if (pi->sclk_ss) {
		struct radeon_atom_ss ss;
		u32 vco_freq = engine_clock * dividers.post_div;

		if (radeon_atombios_get_asic_ss_info(rdev, &ss,
						     ASIC_INTERNAL_ENGINE_SS,
						     vco_freq)) {
			u32 clk_s = ref_clk * 5 / (ref_div * ss.rate);
			u32 clk_v = 4 * ss.percentage * fb_div / (clk_s * 10000);

			ss_cntl &= ~CLK_S_MASK;
			ss_cntl |= CLK_S(clk_s) | SSEN;

			ss_cntl_2 &= ~CLK_V_MASK;
			ss_cntl_2 |= CLK_V(clk_v);
		}
	}

	sclk->sclk_value = engine_clock;
	sclk->vCG_SPLL_FUNC_CNTL = func_cntl;
	sclk->vCG_SPLL_FUNC_CNTL_2 = func_cntl_2;
	sclk->vCG_SPLL_FUNC_CNTL_3 = func_cntl_3;
	/* FUNC_CNTL_4 is passed through unmodified. */
	sclk->vCG_SPLL_FUNC_CNTL_4 = ni_pi->clock_registers.cg_spll_func_cntl_4;
	sclk->vCG_SPLL_SPREAD_SPECTRUM = ss_cntl;
	sclk->vCG_SPLL_SPREAD_SPECTRUM_2 = ss_cntl_2;

	return 0;
}
2068 
/*
 * ni_populate_sclk_value - compute SCLK parameters in big-endian form
 * @rdev: radeon device
 * @engine_clock: requested engine clock
 * @sclk: output; every field is written through cpu_to_be32()
 *
 * Wraps ni_calculate_sclk_params() and byte-swaps each field of its result.
 * On failure @sclk is left untouched and the error is returned.
 */
static int ni_populate_sclk_value(struct radeon_device *rdev,
				  u32 engine_clock,
				  NISLANDS_SMC_SCLK_VALUE *sclk)
{
	NISLANDS_SMC_SCLK_VALUE cpu_val;
	int err = ni_calculate_sclk_params(rdev, engine_clock, &cpu_val);

	if (err)
		return err;

	sclk->sclk_value = cpu_to_be32(cpu_val.sclk_value);
	sclk->vCG_SPLL_FUNC_CNTL = cpu_to_be32(cpu_val.vCG_SPLL_FUNC_CNTL);
	sclk->vCG_SPLL_FUNC_CNTL_2 = cpu_to_be32(cpu_val.vCG_SPLL_FUNC_CNTL_2);
	sclk->vCG_SPLL_FUNC_CNTL_3 = cpu_to_be32(cpu_val.vCG_SPLL_FUNC_CNTL_3);
	sclk->vCG_SPLL_FUNC_CNTL_4 = cpu_to_be32(cpu_val.vCG_SPLL_FUNC_CNTL_4);
	sclk->vCG_SPLL_SPREAD_SPECTRUM = cpu_to_be32(cpu_val.vCG_SPLL_SPREAD_SPECTRUM);
	sclk->vCG_SPLL_SPREAD_SPECTRUM_2 = cpu_to_be32(cpu_val.vCG_SPLL_SPREAD_SPECTRUM_2);

	return 0;
}
2089 
ni_init_smc_spll_table(struct radeon_device * rdev)2090 static int ni_init_smc_spll_table(struct radeon_device *rdev)
2091 {
2092 	struct rv7xx_power_info *pi = rv770_get_pi(rdev);
2093 	struct ni_power_info *ni_pi = ni_get_pi(rdev);
2094 	SMC_NISLANDS_SPLL_DIV_TABLE *spll_table;
2095 	NISLANDS_SMC_SCLK_VALUE sclk_params;
2096 	u32 fb_div;
2097 	u32 p_div;
2098 	u32 clk_s;
2099 	u32 clk_v;
2100 	u32 sclk = 0;
2101 	int i, ret;
2102 	u32 tmp;
2103 
2104 	if (ni_pi->spll_table_start == 0)
2105 		return -EINVAL;
2106 
2107 	spll_table = kzalloc(sizeof(SMC_NISLANDS_SPLL_DIV_TABLE), GFP_KERNEL);
2108 	if (spll_table == NULL)
2109 		return -ENOMEM;
2110 
2111 	for (i = 0; i < 256; i++) {
2112 		ret = ni_calculate_sclk_params(rdev, sclk, &sclk_params);
2113 		if (ret)
2114 			break;
2115 
2116 		p_div = (sclk_params.vCG_SPLL_FUNC_CNTL & SPLL_PDIV_A_MASK) >> SPLL_PDIV_A_SHIFT;
2117 		fb_div = (sclk_params.vCG_SPLL_FUNC_CNTL_3 & SPLL_FB_DIV_MASK) >> SPLL_FB_DIV_SHIFT;
2118 		clk_s = (sclk_params.vCG_SPLL_SPREAD_SPECTRUM & CLK_S_MASK) >> CLK_S_SHIFT;
2119 		clk_v = (sclk_params.vCG_SPLL_SPREAD_SPECTRUM_2 & CLK_V_MASK) >> CLK_V_SHIFT;
2120 
2121 		fb_div &= ~0x00001FFF;
2122 		fb_div >>= 1;
2123 		clk_v >>= 6;
2124 
2125 		if (p_div & ~(SMC_NISLANDS_SPLL_DIV_TABLE_PDIV_MASK >> SMC_NISLANDS_SPLL_DIV_TABLE_PDIV_SHIFT))
2126 			ret = -EINVAL;
2127 
2128 		if (clk_s & ~(SMC_NISLANDS_SPLL_DIV_TABLE_CLKS_MASK >> SMC_NISLANDS_SPLL_DIV_TABLE_CLKS_SHIFT))
2129 			ret = -EINVAL;
2130 
2131 		if (fb_div & ~(SMC_NISLANDS_SPLL_DIV_TABLE_FBDIV_MASK >> SMC_NISLANDS_SPLL_DIV_TABLE_FBDIV_SHIFT))
2132 			ret = -EINVAL;
2133 
2134 		if (clk_v & ~(SMC_NISLANDS_SPLL_DIV_TABLE_CLKV_MASK >> SMC_NISLANDS_SPLL_DIV_TABLE_CLKV_SHIFT))
2135 			ret = -EINVAL;
2136 
2137 		if (ret)
2138 			break;
2139 
2140 		tmp = ((fb_div << SMC_NISLANDS_SPLL_DIV_TABLE_FBDIV_SHIFT) & SMC_NISLANDS_SPLL_DIV_TABLE_FBDIV_MASK) |
2141 			((p_div << SMC_NISLANDS_SPLL_DIV_TABLE_PDIV_SHIFT) & SMC_NISLANDS_SPLL_DIV_TABLE_PDIV_MASK);
2142 		spll_table->freq[i] = cpu_to_be32(tmp);
2143 
2144 		tmp = ((clk_v << SMC_NISLANDS_SPLL_DIV_TABLE_CLKV_SHIFT) & SMC_NISLANDS_SPLL_DIV_TABLE_CLKV_MASK) |
2145 			((clk_s << SMC_NISLANDS_SPLL_DIV_TABLE_CLKS_SHIFT) & SMC_NISLANDS_SPLL_DIV_TABLE_CLKS_MASK);
2146 		spll_table->ss[i] = cpu_to_be32(tmp);
2147 
2148 		sclk += 512;
2149 	}
2150 
2151 	if (!ret)
2152 		ret = rv770_copy_bytes_to_smc(rdev, ni_pi->spll_table_start, (u8 *)spll_table,
2153 					      sizeof(SMC_NISLANDS_SPLL_DIV_TABLE), pi->sram_end);
2154 
2155 	kfree(spll_table);
2156 
2157 	return ret;
2158 }
2159 
/*
 * ni_populate_mclk_value - compute memory PLL register images for a clock
 * @rdev: radeon device
 * @engine_clock: not referenced by this function
 * @memory_clock: requested memory clock
 * @mclk: output; every field is written through cpu_to_be32()
 * @strobe_mode: passed to the divider lookup; also selects the DQ PLL PDNB
 *               state on GDDR5
 * @dll_state_on: when true the MRDCK PDNB bits are set, otherwise cleared
 *
 * Register images start from the values cached in ni_pi->clock_registers.
 *
 * Returns 0 on success, the error of the divider lookup, or -EINVAL when the
 * decoded reference divider for spread spectrum is 0.  @mclk is only written
 * on success.
 */
static int ni_populate_mclk_value(struct radeon_device *rdev,
				  u32 engine_clock,
				  u32 memory_clock,
				  NISLANDS_SMC_MCLK_VALUE *mclk,
				  bool strobe_mode,
				  bool dll_state_on)
{
	struct rv7xx_power_info *pi = rv770_get_pi(rdev);
	struct ni_power_info *ni_pi = ni_get_pi(rdev);
	const u32 pll_div_mask = CLKR_MASK | YCLK_POST_DIV_MASK | CLKF_MASK |
				 CLKFRAC_MASK | IBIAS_MASK;
	const u32 mrdck_pdnb_bits = MRDCKA0_PDNB | MRDCKA1_PDNB |
				    MRDCKB0_PDNB | MRDCKB1_PDNB |
				    MRDCKC0_PDNB | MRDCKC1_PDNB |
				    MRDCKD0_PDNB | MRDCKD1_PDNB;
	u32 ad_cntl = ni_pi->clock_registers.mpll_ad_func_cntl;
	u32 ad_cntl_2 = ni_pi->clock_registers.mpll_ad_func_cntl_2;
	u32 dq_cntl = ni_pi->clock_registers.mpll_dq_func_cntl;
	u32 dq_cntl_2 = ni_pi->clock_registers.mpll_dq_func_cntl_2;
	u32 pwrmgt = ni_pi->clock_registers.mclk_pwrmgt_cntl;
	u32 ss1 = ni_pi->clock_registers.mpll_ss1;
	u32 ss2 = ni_pi->clock_registers.mpll_ss2;
	struct atom_clock_dividers dividers;
	u32 ibias;
	u32 pll_div_bits;
	int err;

	err = radeon_atom_get_clock_dividers(rdev, COMPUTE_MEMORY_PLL_PARAM,
					     memory_clock, strobe_mode, &dividers);
	if (err)
		return err;

	/* Outside strobe mode, bit 27 of MC_SEQ_MISC7 forces a post divider of 1. */
	if (!strobe_mode && (RREG32(MC_SEQ_MISC7) & 0x8000000))
		dividers.post_div = 1;

	ibias = cypress_map_clkf_to_ibias(rdev, dividers.whole_fb_div);

	/* The same divider fields go into both the AD and the DQ PLL. */
	pll_div_bits = CLKR(dividers.ref_div) |
		       YCLK_POST_DIV(dividers.post_div) |
		       CLKF(dividers.whole_fb_div) |
		       CLKFRAC(dividers.frac_fb_div) |
		       IBIAS(ibias);

	ad_cntl = (ad_cntl & ~pll_div_mask) | pll_div_bits;
	if (dividers.vco_mode)
		ad_cntl_2 |= VCO_MODE;
	else
		ad_cntl_2 &= ~VCO_MODE;

	if (pi->mem_gddr5) {
		dq_cntl = (dq_cntl & ~pll_div_mask) | pll_div_bits;

		if (strobe_mode)
			dq_cntl &= ~PDNB;
		else
			dq_cntl |= PDNB;

		if (dividers.vco_mode)
			dq_cntl_2 |= VCO_MODE;
		else
			dq_cntl_2 &= ~VCO_MODE;
	}

	if (pi->mclk_ss) {
		struct radeon_atom_ss ss;
		u32 vco_freq = memory_clock * dividers.post_div;

		if (radeon_atombios_get_asic_ss_info(rdev, &ss,
						     ASIC_INTERNAL_MEMORY_SS,
						     vco_freq)) {
			u32 ref_clk = rdev->clock.mpll.reference_freq;
			u32 decoded_ref = rv740_get_decoded_reference_divider(dividers.ref_div);
			u32 clk_s, clk_v;

			/* decoded_ref is a divisor below. */
			if (!decoded_ref)
				return -EINVAL;

			clk_s = ref_clk * 5 / (decoded_ref * ss.rate);
			clk_v = ss.percentage *
				(0x4000 * dividers.whole_fb_div + 0x800 * dividers.frac_fb_div) / (clk_s * 625);

			ss1 = (ss1 & ~CLKV_MASK) | CLKV(clk_v);
			ss2 = (ss2 & ~CLKS_MASK) | CLKS(clk_s);
		}
	}

	pwrmgt &= ~DLL_SPEED_MASK;
	pwrmgt |= DLL_SPEED(rv740_get_dll_speed(pi->mem_gddr5, memory_clock));
	if (dll_state_on)
		pwrmgt |= mrdck_pdnb_bits;
	else
		pwrmgt &= ~mrdck_pdnb_bits;

	mclk->mclk_value = cpu_to_be32(memory_clock);
	mclk->vMPLL_AD_FUNC_CNTL = cpu_to_be32(ad_cntl);
	mclk->vMPLL_AD_FUNC_CNTL_2 = cpu_to_be32(ad_cntl_2);
	mclk->vMPLL_DQ_FUNC_CNTL = cpu_to_be32(dq_cntl);
	mclk->vMPLL_DQ_FUNC_CNTL_2 = cpu_to_be32(dq_cntl_2);
	mclk->vMCLK_PWRMGT_CNTL = cpu_to_be32(pwrmgt);
	/* DLL_CNTL is passed through unmodified. */
	mclk->vDLL_CNTL = cpu_to_be32(ni_pi->clock_registers.dll_cntl);
	mclk->vMPLL_SS = cpu_to_be32(ss1);
	mclk->vMPLL_SS2 = cpu_to_be32(ss2);

	return 0;
}
2297 
/*
 * ni_populate_smc_sp - set the bSP field of every level of an SMC state
 * @rdev: radeon device
 * @radeon_state: power state supplying the number of performance levels
 * @smc_state: SMC software state to update
 *
 * All levels but the last receive pi->dsp; the last level receives pi->psp.
 */
static void ni_populate_smc_sp(struct radeon_device *rdev,
			       struct radeon_ps *radeon_state,
			       NISLANDS_SMC_SWSTATE *smc_state)
{
	struct ni_ps *ps = ni_get_ps(radeon_state);
	struct rv7xx_power_info *pi = rv770_get_pi(rdev);
	int lvl = 0;

	while (lvl < ps->performance_level_count - 1) {
		smc_state->levels[lvl].bSP = cpu_to_be32(pi->dsp);
		lvl++;
	}

	smc_state->levels[ps->performance_level_count - 1].bSP =
		cpu_to_be32(pi->psp);
}
2312 
/*
 * ni_convert_power_level_to_smc - translate one performance level for the SMC
 * @rdev: radeon device
 * @pl: driver-side performance level (clocks, voltages, flags)
 * @level: SMC hardware performance level to fill in
 *
 * Populates the PCIe gen2 setting, engine clock, memory controller flags,
 * strobe mode (GDDR5 only), memory clock and the VDDC/VDDCI/MVDD voltages.
 *
 * Returns 0 on success or the first error reported by a helper.
 */
static int ni_convert_power_level_to_smc(struct radeon_device *rdev,
					 struct rv7xx_pl *pl,
					 NISLANDS_SMC_HW_PERFORMANCE_LEVEL *level)
{
	struct rv7xx_power_info *pi = rv770_get_pi(rdev);
	struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
	struct ni_power_info *ni_pi = ni_get_pi(rdev);
	u32 stutter_cntl = RREG32(DC_STUTTER_CNTL);
	bool dll_state_on = false;
	u16 std_vddc;
	int err;

	if (pi->pcie_gen2 && (pl->flags & ATOM_PPLIB_R600_FLAGS_PCIEGEN2))
		level->gen2PCIE = 1;
	else
		level->gen2PCIE = 0;

	err = ni_populate_sclk_value(rdev, pl->sclk, &level->sclk);
	if (err)
		return err;

	level->mcFlags = 0;

	/*
	 * Stutter mode needs a non-zero threshold that the memory clock does
	 * not exceed, UVD disabled and both stutter enable bits set.
	 */
	if (pi->mclk_stutter_mode_threshold &&
	    pl->mclk <= pi->mclk_stutter_mode_threshold &&
	    !eg_pi->uvd_enabled &&
	    (stutter_cntl & DC_STUTTER_ENABLE_A) &&
	    (stutter_cntl & DC_STUTTER_ENABLE_B))
		level->mcFlags |= NISLANDS_SMC_MC_STUTTER_EN;

	if (!pi->mem_gddr5) {
		err = ni_populate_mclk_value(rdev, pl->sclk, pl->mclk,
					     &level->mclk, true, true);
	} else {
		if (pl->mclk > pi->mclk_edc_enable_threshold)
			level->mcFlags |= NISLANDS_SMC_MC_EDC_RD_FLAG;
		if (pl->mclk > eg_pi->mclk_edc_wr_enable_threshold)
			level->mcFlags |= NISLANDS_SMC_MC_EDC_WR_FLAG;

		level->strobeMode = cypress_get_strobe_mode_settings(rdev, pl->mclk);

		if (level->strobeMode & NISLANDS_SMC_STROBE_ENABLE) {
			/*
			 * In strobe mode the DLL state is bit 1 of
			 * MC_SEQ_MISC5 or MC_SEQ_MISC6, selected by comparing
			 * the frequency ratio with bits 19:16 of MC_SEQ_MISC7.
			 */
			if (cypress_get_mclk_frequency_ratio(rdev, pl->mclk, true) >=
			    ((RREG32(MC_SEQ_MISC7) >> 16) & 0xf))
				dll_state_on = (RREG32(MC_SEQ_MISC5) >> 1) & 0x1;
			else
				dll_state_on = (RREG32(MC_SEQ_MISC6) >> 1) & 0x1;
		} else if (pl->mclk > ni_pi->mclk_rtt_mode_threshold) {
			level->mcFlags |= NISLANDS_SMC_MC_RTT_ENABLE;
		}

		err = ni_populate_mclk_value(rdev, pl->sclk, pl->mclk,
					     &level->mclk,
					     (level->strobeMode & NISLANDS_SMC_STROBE_ENABLE) != 0,
					     dll_state_on);
	}
	if (err)
		return err;

	err = ni_populate_voltage_value(rdev, &eg_pi->vddc_voltage_table,
					pl->vddc, &level->vddc);
	if (err)
		return err;

	err = ni_get_std_voltage_value(rdev, &level->vddc, &std_vddc);
	if (err)
		return err;

	ni_populate_std_voltage_value(rdev, std_vddc,
				      level->vddc.index, &level->std_vddc);

	if (eg_pi->vddci_control) {
		err = ni_populate_voltage_value(rdev, &eg_pi->vddci_voltage_table,
						pl->vddci, &level->vddci);
		if (err)
			return err;
	}

	ni_populate_mvdd_value(rdev, pl->mclk, &level->mvdd);

	return 0;
}
2393 
/*
 * ni_populate_smc_t - fill in the aT field of every level of an SMC state
 * @rdev: radeon device
 * @radeon_state: power state supplying the performance levels
 * @smc_state: SMC software state to update
 *
 * With fewer than two levels, level 0 gets CG_R(0xffff) | CG_L(0).
 * Otherwise, for each pair of adjacent levels, r600_calculate_at() supplies
 * the t_l/t_h values (with a fixed fallback if it fails); the lower level's
 * CG_R field and the upper level's CG_L field are derived from them.
 *
 * Returns 0 on success or -EINVAL when the state has 9 or more levels.
 */
static int ni_populate_smc_t(struct radeon_device *rdev,
			     struct radeon_ps *radeon_state,
			     NISLANDS_SMC_SWSTATE *smc_state)
{
	struct rv7xx_power_info *pi = rv770_get_pi(rdev);
	struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
	struct ni_ps *state = ni_get_ps(radeon_state);
	u32 t_l, t_h;
	u32 a_t;
	u32 upper_bsp;
	u32 t;
	int lo;

	if (state->performance_level_count >= 9)
		return -EINVAL;

	if (state->performance_level_count < 2) {
		smc_state->levels[0].aT = cpu_to_be32(CG_R(0xffff) | CG_L(0));
		return 0;
	}

	smc_state->levels[0].aT = cpu_to_be32(0);

	/* 'lo' indexes the lower level of each adjacent pair (lo, lo + 1). */
	for (lo = 0; lo + 1 < state->performance_level_count; lo++) {
		if (eg_pi->uvd_enabled)
			t = 1000 * (lo * (eg_pi->smu_uvd_hs ? 2 : 8) + 2);
		else
			t = 1000 * (lo + 1);

		if (r600_calculate_at(t,
				      100 * R600_AH_DFLT,
				      state->performance_levels[lo + 1].sclk,
				      state->performance_levels[lo].sclk,
				      &t_l,
				      &t_h)) {
			/* Fallback when the calculation fails. */
			t_h = (lo + 1) * 1000 - 50 * R600_AH_DFLT;
			t_l = (lo + 1) * 1000 + 50 * R600_AH_DFLT;
		}

		/* Replace the CG_R field of the lower level, keeping the rest. */
		a_t = be32_to_cpu(smc_state->levels[lo].aT) & ~CG_R_MASK;
		a_t |= CG_R(t_l * pi->bsp / 20000);
		smc_state->levels[lo].aT = cpu_to_be32(a_t);

		/* The topmost level uses pbsp instead of bsp. */
		if (lo + 2 == state->performance_level_count)
			upper_bsp = pi->pbsp;
		else
			upper_bsp = pi->bsp;

		a_t = CG_R(0xffff) | CG_L(t_h * upper_bsp / 20000);
		smc_state->levels[lo + 1].aT = cpu_to_be32(a_t);
	}

	return 0;
}
2453 
/*
 * ni_populate_power_containment_values - fill in DPM2 fields of an SMC state
 * @rdev: radeon device
 * @radeon_state: power state supplying the performance levels
 * @smc_state: SMC software state to update; levelCount must match
 *
 * Does nothing (returns 0) when power containment is disabled.  Otherwise the
 * power boost limit is written to the SMC and the dpm2 parameters and the
 * power boost state flag are set for each level.
 *
 * Returns 0 on success, -EINVAL on an empty/mismatched state, on levels with
 * decreasing engine clocks or on a zero minimum clock, or the error from
 * ni_calculate_adjusted_tdp_limits().
 */
static int ni_populate_power_containment_values(struct radeon_device *rdev,
						struct radeon_ps *radeon_state,
						NISLANDS_SMC_SWSTATE *smc_state)
{
	struct rv7xx_power_info *pi = rv770_get_pi(rdev);
	struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
	struct ni_power_info *ni_pi = ni_get_pi(rdev);
	struct ni_ps *state = ni_get_ps(radeon_state);
	u32 tdp_limit;
	u32 near_tdp_limit;
	u32 power_boost_limit;
	u32 prev_sclk, max_sclk, min_sclk;
	u8 max_ps_percent;
	bool is_top;
	int lvl, err;

	if (!ni_pi->enable_power_containment)
		return 0;

	if (state->performance_level_count == 0 ||
	    smc_state->levelCount != state->performance_level_count)
		return -EINVAL;

	err = ni_calculate_adjusted_tdp_limits(rdev,
					       false, /* ??? */
					       rdev->pm.dpm.tdp_adjustment,
					       &tdp_limit,
					       &near_tdp_limit);
	if (err)
		return err;

	power_boost_limit = ni_calculate_power_boost_limit(rdev, radeon_state, near_tdp_limit);

	/* If the SMC write fails, power boost is treated as unavailable. */
	if (rv770_write_smc_sram_dword(rdev,
				       pi->state_table_start +
				       offsetof(NISLANDS_SMC_STATETABLE, dpm2Params) +
				       offsetof(PP_NIslands_DPM2Parameters, PowerBoostLimit),
				       ni_scale_power_for_smc(power_boost_limit, ni_get_smc_power_scaling_factor(rdev)),
				       pi->sram_end))
		power_boost_limit = 0;

	smc_state->levels[0].dpm2.MaxPS = 0;
	smc_state->levels[0].dpm2.NearTDPDec = 0;
	smc_state->levels[0].dpm2.AboveSafeInc = 0;
	smc_state->levels[0].dpm2.BelowSafeInc = 0;
	if (power_boost_limit)
		smc_state->levels[0].stateFlags |= PPSMC_STATEFLAG_POWERBOOST;

	for (lvl = 1; lvl < state->performance_level_count; lvl++) {
		is_top = (lvl == (state->performance_level_count - 1));
		prev_sclk = state->performance_levels[lvl - 1].sclk;
		max_sclk = state->performance_levels[lvl].sclk;
		max_ps_percent = is_top ? NISLANDS_DPM2_MAXPS_PERCENT_H :
					  NISLANDS_DPM2_MAXPS_PERCENT_M;

		if (max_sclk < prev_sclk)
			return -EINVAL;

		if (max_ps_percent == 0 || prev_sclk == max_sclk || eg_pi->uvd_enabled)
			min_sclk = max_sclk;
		else if (lvl == 1)
			min_sclk = prev_sclk;
		else
			min_sclk = (prev_sclk * (u32)max_ps_percent) / 100;

		/* Never go below the engine clock of the lowest level. */
		if (min_sclk < state->performance_levels[0].sclk)
			min_sclk = state->performance_levels[0].sclk;

		if (min_sclk == 0)
			return -EINVAL;

		smc_state->levels[lvl].dpm2.MaxPS =
			(u8)((NISLANDS_DPM2_MAX_PULSE_SKIP * (max_sclk - min_sclk)) / max_sclk);
		smc_state->levels[lvl].dpm2.NearTDPDec = NISLANDS_DPM2_NEAR_TDP_DEC;
		smc_state->levels[lvl].dpm2.AboveSafeInc = NISLANDS_DPM2_ABOVE_SAFE_INC;
		smc_state->levels[lvl].dpm2.BelowSafeInc = NISLANDS_DPM2_BELOW_SAFE_INC;

		/* The topmost level never gets the power boost flag. */
		if (!is_top && power_boost_limit)
			smc_state->levels[lvl].stateFlags |= PPSMC_STATEFLAG_POWERBOOST;
	}

	return 0;
}
2539 
/*
 * ni_populate_sq_ramping_values - fill in the SQ power throttle fields
 * @rdev: radeon device
 * @radeon_state: power state supplying the performance levels
 * @smc_state: SMC software state to update; levelCount must match
 *
 * Levels whose engine clock reaches rdev->pm.dpm.sq_ramping_threshold get the
 * NISLANDS_DPM2_SQ_RAMP_* values, provided SQ ramping is enabled and every
 * ramp constant fits its register field.  All other levels get the full
 * field masks.
 *
 * Returns 0 on success or -EINVAL on an empty/mismatched state or a zero
 * ramping threshold.
 */
static int ni_populate_sq_ramping_values(struct radeon_device *rdev,
					 struct radeon_ps *radeon_state,
					 NISLANDS_SMC_SWSTATE *smc_state)
{
	struct ni_power_info *ni_pi = ni_get_pi(rdev);
	struct ni_ps *state = ni_get_ps(radeon_state);
	bool ramping = ni_pi->enable_sq_ramping;
	u32 throttle;
	u32 throttle2;
	int lvl;

	if (state->performance_level_count == 0 ||
	    smc_state->levelCount != state->performance_level_count ||
	    rdev->pm.dpm.sq_ramping_threshold == 0)
		return -EINVAL;

	/* Ramping is only usable when each constant fits its field. */
	if (NISLANDS_DPM2_SQ_RAMP_MAX_POWER > (MAX_POWER_MASK >> MAX_POWER_SHIFT) ||
	    NISLANDS_DPM2_SQ_RAMP_MIN_POWER > (MIN_POWER_MASK >> MIN_POWER_SHIFT) ||
	    NISLANDS_DPM2_SQ_RAMP_MAX_POWER_DELTA > (MAX_POWER_DELTA_MASK >> MAX_POWER_DELTA_SHIFT) ||
	    NISLANDS_DPM2_SQ_RAMP_STI_SIZE > (STI_SIZE_MASK >> STI_SIZE_SHIFT) ||
	    NISLANDS_DPM2_SQ_RAMP_LTI_RATIO > (LTI_RATIO_MASK >> LTI_RATIO_SHIFT))
		ramping = false;

	for (lvl = 0; lvl < state->performance_level_count; lvl++) {
		if (ramping &&
		    state->performance_levels[lvl].sclk >= rdev->pm.dpm.sq_ramping_threshold) {
			throttle = MAX_POWER(NISLANDS_DPM2_SQ_RAMP_MAX_POWER) |
				   MIN_POWER(NISLANDS_DPM2_SQ_RAMP_MIN_POWER);
			throttle2 = MAX_POWER_DELTA(NISLANDS_DPM2_SQ_RAMP_MAX_POWER_DELTA) |
				    STI_SIZE(NISLANDS_DPM2_SQ_RAMP_STI_SIZE) |
				    LTI_RATIO(NISLANDS_DPM2_SQ_RAMP_LTI_RATIO);
		} else {
			throttle = MAX_POWER_MASK | MIN_POWER_MASK;
			throttle2 = MAX_POWER_DELTA_MASK | STI_SIZE_MASK | LTI_RATIO_MASK;
		}

		smc_state->levels[lvl].SQPowerThrottle = cpu_to_be32(throttle);
		smc_state->levels[lvl].SQPowerThrottle_2 = cpu_to_be32(throttle2);
	}

	return 0;
}
2597 
/*
 * ni_enable_power_containment - switch TDP clamping in the SMC on or off
 * @rdev: radeon device
 * @radeon_new_state: state about to be set; clamping is not activated for
 *                    UVD states
 * @enable: true to activate clamping, false to deactivate it
 *
 * Does nothing when power containment is disabled in ni_pi.  ni_pi->pc_enabled
 * tracks whether clamping was successfully activated.
 *
 * Returns 0 on success or -EINVAL when the SMC rejects the message.
 */
static int ni_enable_power_containment(struct radeon_device *rdev,
				       struct radeon_ps *radeon_new_state,
				       bool enable)
{
	struct ni_power_info *ni_pi = ni_get_pi(rdev);
	PPSMC_Result res;

	if (!ni_pi->enable_power_containment)
		return 0;

	if (!enable) {
		res = rv770_send_msg_to_smc(rdev, PPSMC_TDPClampingInactive);
		ni_pi->pc_enabled = false;
		return (res != PPSMC_Result_OK) ? -EINVAL : 0;
	}

	/* UVD states leave the clamping state untouched. */
	if (r600_is_uvd_state(radeon_new_state->class, radeon_new_state->class2))
		return 0;

	res = rv770_send_msg_to_smc(rdev, PPSMC_TDPClampingActive);
	if (res != PPSMC_Result_OK) {
		ni_pi->pc_enabled = false;
		return -EINVAL;
	}

	ni_pi->pc_enabled = true;
	return 0;
}
2627 
/*
 * ni_convert_power_state_to_smc - translate a power state for the SMC
 * @rdev: radeon device
 * @radeon_state: driver-side power state
 * @smc_state: SMC software state to fill in
 *
 * Converts every performance level, assigns arbiter/AC indices and display
 * watermarks, writes the watermark threshold soft register and then fills in
 * the bSP, power containment, SQ ramping and aT fields.  A failure of the
 * power containment or SQ ramping helpers only disables the respective
 * feature in ni_pi; it is not returned to the caller.
 *
 * Returns 0 on success, -EINVAL when the state has no levels or more than
 * NISLANDS_MAX_SMC_PERFORMANCE_LEVELS_PER_SWSTATE, or the error of a level
 * conversion or of ni_populate_smc_t().
 */
static int ni_convert_power_state_to_smc(struct radeon_device *rdev,
					 struct radeon_ps *radeon_state,
					 NISLANDS_SMC_SWSTATE *smc_state)
{
	struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
	struct ni_power_info *ni_pi = ni_get_pi(rdev);
	struct ni_ps *state = ni_get_ps(radeon_state);
	int i, ret;
	u32 threshold;

	if (!(radeon_state->caps & ATOM_PPLIB_DISALLOW_ON_DC))
		smc_state->flags |= PPSMC_SWSTATE_FLAG_DC;

	smc_state->levelCount = 0;

	/*
	 * Validate the level count before it is used as an array index: the
	 * threshold below reads performance_levels[count - 1], and
	 * ni_populate_smc_sp() writes levels[count - 1].
	 */
	if (state->performance_level_count == 0 ||
	    state->performance_level_count > NISLANDS_MAX_SMC_PERFORMANCE_LEVELS_PER_SWSTATE)
		return -EINVAL;

	/* Watermark threshold: engine clock of the highest level. */
	threshold = state->performance_levels[state->performance_level_count - 1].sclk * 100 / 100;

	for (i = 0; i < state->performance_level_count; i++) {
		ret = ni_convert_power_level_to_smc(rdev, &state->performance_levels[i],
						    &smc_state->levels[i]);
		smc_state->levels[i].arbRefreshState =
			(u8)(NISLANDS_DRIVER_STATE_ARB_INDEX + i);

		if (ret)
			return ret;

		if (ni_pi->enable_power_containment)
			smc_state->levels[i].displayWatermark =
				(state->performance_levels[i].sclk < threshold) ?
				PPSMC_DISPLAY_WATERMARK_LOW : PPSMC_DISPLAY_WATERMARK_HIGH;
		else
			smc_state->levels[i].displayWatermark = (i < 2) ?
				PPSMC_DISPLAY_WATERMARK_LOW : PPSMC_DISPLAY_WATERMARK_HIGH;

		if (eg_pi->dynamic_ac_timing)
			smc_state->levels[i].ACIndex = NISLANDS_MCREGISTERTABLE_FIRST_DRIVERSTATE_SLOT + i;
		else
			smc_state->levels[i].ACIndex = 0;

		smc_state->levelCount++;
	}

	rv770_write_smc_soft_register(rdev, NI_SMC_SOFT_REGISTER_watermark_threshold,
				      cpu_to_be32(threshold / 512));

	ni_populate_smc_sp(rdev, radeon_state, smc_state);

	/* These two are best-effort: on failure the feature is turned off. */
	ret = ni_populate_power_containment_values(rdev, radeon_state, smc_state);
	if (ret)
		ni_pi->enable_power_containment = false;

	ret = ni_populate_sq_ramping_values(rdev, radeon_state, smc_state);
	if (ret)
		ni_pi->enable_sq_ramping = false;

	return ni_populate_smc_t(rdev, radeon_state, smc_state);
}
2686 
ni_upload_sw_state(struct radeon_device * rdev,struct radeon_ps * radeon_new_state)2687 static int ni_upload_sw_state(struct radeon_device *rdev,
2688 			      struct radeon_ps *radeon_new_state)
2689 {
2690 	struct rv7xx_power_info *pi = rv770_get_pi(rdev);
2691 	u16 address = pi->state_table_start +
2692 		offsetof(NISLANDS_SMC_STATETABLE, driverState);
2693 	NISLANDS_SMC_SWSTATE *smc_state;
2694 	size_t state_size = struct_size(smc_state, levels,
2695 			NISLANDS_MAX_SMC_PERFORMANCE_LEVELS_PER_SWSTATE);
2696 	int ret;
2697 
2698 	smc_state = kzalloc(state_size, GFP_KERNEL);
2699 	if (smc_state == NULL)
2700 		return -ENOMEM;
2701 
2702 	ret = ni_convert_power_state_to_smc(rdev, radeon_new_state, smc_state);
2703 	if (ret)
2704 		goto done;
2705 
2706 	ret = rv770_copy_bytes_to_smc(rdev, address, (u8 *)smc_state, state_size, pi->sram_end);
2707 
2708 done:
2709 	kfree(smc_state);
2710 
2711 	return ret;
2712 }
2713 
ni_set_mc_special_registers(struct radeon_device * rdev,struct ni_mc_reg_table * table)2714 static int ni_set_mc_special_registers(struct radeon_device *rdev,
2715 				       struct ni_mc_reg_table *table)
2716 {
2717 	struct rv7xx_power_info *pi = rv770_get_pi(rdev);
2718 	u8 i, j, k;
2719 	u32 temp_reg;
2720 
2721 	for (i = 0, j = table->last; i < table->last; i++) {
2722 		switch (table->mc_reg_address[i].s1) {
2723 		case MC_SEQ_MISC1 >> 2:
2724 			if (j >= SMC_NISLANDS_MC_REGISTER_ARRAY_SIZE)
2725 				return -EINVAL;
2726 			temp_reg = RREG32(MC_PMG_CMD_EMRS);
2727 			table->mc_reg_address[j].s1 = MC_PMG_CMD_EMRS >> 2;
2728 			table->mc_reg_address[j].s0 = MC_SEQ_PMG_CMD_EMRS_LP >> 2;
2729 			for (k = 0; k < table->num_entries; k++)
2730 				table->mc_reg_table_entry[k].mc_data[j] =
2731 					((temp_reg & 0xffff0000)) |
2732 					((table->mc_reg_table_entry[k].mc_data[i] & 0xffff0000) >> 16);
2733 			j++;
2734 			if (j >= SMC_NISLANDS_MC_REGISTER_ARRAY_SIZE)
2735 				return -EINVAL;
2736 
2737 			temp_reg = RREG32(MC_PMG_CMD_MRS);
2738 			table->mc_reg_address[j].s1 = MC_PMG_CMD_MRS >> 2;
2739 			table->mc_reg_address[j].s0 = MC_SEQ_PMG_CMD_MRS_LP >> 2;
2740 			for(k = 0; k < table->num_entries; k++) {
2741 				table->mc_reg_table_entry[k].mc_data[j] =
2742 					(temp_reg & 0xffff0000) |
2743 					(table->mc_reg_table_entry[k].mc_data[i] & 0x0000ffff);
2744 				if (!pi->mem_gddr5)
2745 					table->mc_reg_table_entry[k].mc_data[j] |= 0x100;
2746 			}
2747 			j++;
2748 			break;
2749 		case MC_SEQ_RESERVE_M >> 2:
2750 			if (j >= SMC_NISLANDS_MC_REGISTER_ARRAY_SIZE)
2751 				return -EINVAL;
2752 			temp_reg = RREG32(MC_PMG_CMD_MRS1);
2753 			table->mc_reg_address[j].s1 = MC_PMG_CMD_MRS1 >> 2;
2754 			table->mc_reg_address[j].s0 = MC_SEQ_PMG_CMD_MRS1_LP >> 2;
2755 			for (k = 0; k < table->num_entries; k++)
2756 				table->mc_reg_table_entry[k].mc_data[j] =
2757 					(temp_reg & 0xffff0000) |
2758 					(table->mc_reg_table_entry[k].mc_data[i] & 0x0000ffff);
2759 			j++;
2760 			break;
2761 		default:
2762 			break;
2763 		}
2764 	}
2765 
2766 	table->last = j;
2767 
2768 	return 0;
2769 }
2770 
ni_check_s0_mc_reg_index(u16 in_reg,u16 * out_reg)2771 static bool ni_check_s0_mc_reg_index(u16 in_reg, u16 *out_reg)
2772 {
2773 	bool result = true;
2774 
2775 	switch (in_reg) {
2776 	case  MC_SEQ_RAS_TIMING >> 2:
2777 		*out_reg = MC_SEQ_RAS_TIMING_LP >> 2;
2778 		break;
2779 	case MC_SEQ_CAS_TIMING >> 2:
2780 		*out_reg = MC_SEQ_CAS_TIMING_LP >> 2;
2781 		break;
2782 	case MC_SEQ_MISC_TIMING >> 2:
2783 		*out_reg = MC_SEQ_MISC_TIMING_LP >> 2;
2784 		break;
2785 	case MC_SEQ_MISC_TIMING2 >> 2:
2786 		*out_reg = MC_SEQ_MISC_TIMING2_LP >> 2;
2787 		break;
2788 	case MC_SEQ_RD_CTL_D0 >> 2:
2789 		*out_reg = MC_SEQ_RD_CTL_D0_LP >> 2;
2790 		break;
2791 	case MC_SEQ_RD_CTL_D1 >> 2:
2792 		*out_reg = MC_SEQ_RD_CTL_D1_LP >> 2;
2793 		break;
2794 	case MC_SEQ_WR_CTL_D0 >> 2:
2795 		*out_reg = MC_SEQ_WR_CTL_D0_LP >> 2;
2796 		break;
2797 	case MC_SEQ_WR_CTL_D1 >> 2:
2798 		*out_reg = MC_SEQ_WR_CTL_D1_LP >> 2;
2799 		break;
2800 	case MC_PMG_CMD_EMRS >> 2:
2801 		*out_reg = MC_SEQ_PMG_CMD_EMRS_LP >> 2;
2802 		break;
2803 	case MC_PMG_CMD_MRS >> 2:
2804 		*out_reg = MC_SEQ_PMG_CMD_MRS_LP >> 2;
2805 		break;
2806 	case MC_PMG_CMD_MRS1 >> 2:
2807 		*out_reg = MC_SEQ_PMG_CMD_MRS1_LP >> 2;
2808 		break;
2809 	case MC_SEQ_PMG_TIMING >> 2:
2810 		*out_reg = MC_SEQ_PMG_TIMING_LP >> 2;
2811 		break;
2812 	case MC_PMG_CMD_MRS2 >> 2:
2813 		*out_reg = MC_SEQ_PMG_CMD_MRS2_LP >> 2;
2814 		break;
2815 	default:
2816 		result = false;
2817 		break;
2818 	}
2819 
2820 	return result;
2821 }
2822 
ni_set_valid_flag(struct ni_mc_reg_table * table)2823 static void ni_set_valid_flag(struct ni_mc_reg_table *table)
2824 {
2825 	u8 i, j;
2826 
2827 	for (i = 0; i < table->last; i++) {
2828 		for (j = 1; j < table->num_entries; j++) {
2829 			if (table->mc_reg_table_entry[j-1].mc_data[i] != table->mc_reg_table_entry[j].mc_data[i]) {
2830 				table->valid_flag |= 1 << i;
2831 				break;
2832 			}
2833 		}
2834 	}
2835 }
2836 
ni_set_s0_mc_reg_index(struct ni_mc_reg_table * table)2837 static void ni_set_s0_mc_reg_index(struct ni_mc_reg_table *table)
2838 {
2839 	u32 i;
2840 	u16 address;
2841 
2842 	for (i = 0; i < table->last; i++)
2843 		table->mc_reg_address[i].s0 =
2844 			ni_check_s0_mc_reg_index(table->mc_reg_address[i].s1, &address) ?
2845 			address : table->mc_reg_address[i].s1;
2846 }
2847 
ni_copy_vbios_mc_reg_table(struct atom_mc_reg_table * table,struct ni_mc_reg_table * ni_table)2848 static int ni_copy_vbios_mc_reg_table(struct atom_mc_reg_table *table,
2849 				      struct ni_mc_reg_table *ni_table)
2850 {
2851 	u8 i, j;
2852 
2853 	if (table->last > SMC_NISLANDS_MC_REGISTER_ARRAY_SIZE)
2854 		return -EINVAL;
2855 	if (table->num_entries > MAX_AC_TIMING_ENTRIES)
2856 		return -EINVAL;
2857 
2858 	for (i = 0; i < table->last; i++)
2859 		ni_table->mc_reg_address[i].s1 = table->mc_reg_address[i].s1;
2860 	ni_table->last = table->last;
2861 
2862 	for (i = 0; i < table->num_entries; i++) {
2863 		ni_table->mc_reg_table_entry[i].mclk_max =
2864 			table->mc_reg_table_entry[i].mclk_max;
2865 		for (j = 0; j < table->last; j++)
2866 			ni_table->mc_reg_table_entry[i].mc_data[j] =
2867 				table->mc_reg_table_entry[i].mc_data[j];
2868 	}
2869 	ni_table->num_entries = table->num_entries;
2870 
2871 	return 0;
2872 }
2873 
ni_initialize_mc_reg_table(struct radeon_device * rdev)2874 static int ni_initialize_mc_reg_table(struct radeon_device *rdev)
2875 {
2876 	struct ni_power_info *ni_pi = ni_get_pi(rdev);
2877 	int ret;
2878 	struct atom_mc_reg_table *table;
2879 	struct ni_mc_reg_table *ni_table = &ni_pi->mc_reg_table;
2880 	u8 module_index = rv770_get_memory_module_index(rdev);
2881 
2882 	table = kzalloc(sizeof(struct atom_mc_reg_table), GFP_KERNEL);
2883 	if (!table)
2884 		return -ENOMEM;
2885 
2886 	WREG32(MC_SEQ_RAS_TIMING_LP, RREG32(MC_SEQ_RAS_TIMING));
2887 	WREG32(MC_SEQ_CAS_TIMING_LP, RREG32(MC_SEQ_CAS_TIMING));
2888 	WREG32(MC_SEQ_MISC_TIMING_LP, RREG32(MC_SEQ_MISC_TIMING));
2889 	WREG32(MC_SEQ_MISC_TIMING2_LP, RREG32(MC_SEQ_MISC_TIMING2));
2890 	WREG32(MC_SEQ_PMG_CMD_EMRS_LP, RREG32(MC_PMG_CMD_EMRS));
2891 	WREG32(MC_SEQ_PMG_CMD_MRS_LP, RREG32(MC_PMG_CMD_MRS));
2892 	WREG32(MC_SEQ_PMG_CMD_MRS1_LP, RREG32(MC_PMG_CMD_MRS1));
2893 	WREG32(MC_SEQ_WR_CTL_D0_LP, RREG32(MC_SEQ_WR_CTL_D0));
2894 	WREG32(MC_SEQ_WR_CTL_D1_LP, RREG32(MC_SEQ_WR_CTL_D1));
2895 	WREG32(MC_SEQ_RD_CTL_D0_LP, RREG32(MC_SEQ_RD_CTL_D0));
2896 	WREG32(MC_SEQ_RD_CTL_D1_LP, RREG32(MC_SEQ_RD_CTL_D1));
2897 	WREG32(MC_SEQ_PMG_TIMING_LP, RREG32(MC_SEQ_PMG_TIMING));
2898 	WREG32(MC_SEQ_PMG_CMD_MRS2_LP, RREG32(MC_PMG_CMD_MRS2));
2899 
2900 	ret = radeon_atom_init_mc_reg_table(rdev, module_index, table);
2901 
2902 	if (ret)
2903 		goto init_mc_done;
2904 
2905 	ret = ni_copy_vbios_mc_reg_table(table, ni_table);
2906 
2907 	if (ret)
2908 		goto init_mc_done;
2909 
2910 	ni_set_s0_mc_reg_index(ni_table);
2911 
2912 	ret = ni_set_mc_special_registers(rdev, ni_table);
2913 
2914 	if (ret)
2915 		goto init_mc_done;
2916 
2917 	ni_set_valid_flag(ni_table);
2918 
2919 init_mc_done:
2920 	kfree(table);
2921 
2922 	return ret;
2923 }
2924 
/*
 * Write the addresses of all valid MC registers into the SMC table.
 *
 * Only registers whose bit is set in valid_flag are emitted, packed
 * contiguously and converted to big endian.  Output stops once
 * SMC_NISLANDS_MC_REGISTER_ARRAY_SIZE addresses were written.  The number of
 * emitted addresses is stored in mc_reg_table->last.
 */
static void ni_populate_mc_reg_addresses(struct radeon_device *rdev,
					 SMC_NIslands_MCRegisters *mc_reg_table)
{
	struct ni_power_info *ni_pi = ni_get_pi(rdev);
	struct ni_mc_reg_table *src = &ni_pi->mc_reg_table;
	u32 out = 0;
	u32 reg;

	for (reg = 0; reg < src->last; reg++) {
		if (!(src->valid_flag & (1 << reg)))
			continue;

		if (out >= SMC_NISLANDS_MC_REGISTER_ARRAY_SIZE)
			break;

		mc_reg_table->address[out].s0 =
			cpu_to_be16(src->mc_reg_address[reg].s0);
		mc_reg_table->address[out].s1 =
			cpu_to_be16(src->mc_reg_address[reg].s1);
		out++;
	}

	mc_reg_table->last = (u8)out;
}
2944 
2945 
/*
 * Pack the valid register values of one table entry for the SMC.
 *
 * Scans the first @num_entries values of @entry; those whose bit is set in
 * @valid_flag are stored back to back in @data as big-endian words.
 */
static void ni_convert_mc_registers(struct ni_mc_reg_entry *entry,
				    SMC_NIslands_MCRegisterSet *data,
				    u32 num_entries, u32 valid_flag)
{
	u32 out = 0;
	u32 reg;

	for (reg = 0; reg < num_entries; reg++) {
		if (!(valid_flag & (1 << reg)))
			continue;

		data->value[out] = cpu_to_be32(entry->mc_data[reg]);
		out++;
	}
}
2959 
/*
 * Emit the MC register set that matches the memory clock of @pl.
 *
 * Picks the first table entry whose mclk_max is not below pl->mclk; if none
 * qualifies, the last entry is used.  The selected entry is packed into
 * @mc_reg_table_data via ni_convert_mc_registers().
 */
static void ni_convert_mc_reg_table_entry_to_smc(struct radeon_device *rdev,
						 struct rv7xx_pl *pl,
						 SMC_NIslands_MCRegisterSet *mc_reg_table_data)
{
	struct ni_power_info *ni_pi = ni_get_pi(rdev);
	struct ni_mc_reg_table *tbl = &ni_pi->mc_reg_table;
	u32 idx = 0;

	while (idx < tbl->num_entries &&
	       pl->mclk > tbl->mc_reg_table_entry[idx].mclk_max)
		idx++;

	/* Ran off the end: fall back to the last entry, if there is one. */
	if (idx == tbl->num_entries && idx > 0)
		idx--;

	ni_convert_mc_registers(&tbl->mc_reg_table_entry[idx],
				mc_reg_table_data,
				tbl->last,
				tbl->valid_flag);
}
2980 
/*
 * Fill the driver-state slots of the SMC MC register table.
 *
 * Performance level N of @radeon_state is written to slot
 * NISLANDS_MCREGISTERTABLE_FIRST_DRIVERSTATE_SLOT + N.
 */
static void ni_convert_mc_reg_table_to_smc(struct radeon_device *rdev,
					   struct radeon_ps *radeon_state,
					   SMC_NIslands_MCRegisters *mc_reg_table)
{
	struct ni_ps *ps = ni_get_ps(radeon_state);
	SMC_NIslands_MCRegisterSet *slot =
		&mc_reg_table->data[NISLANDS_MCREGISTERTABLE_FIRST_DRIVERSTATE_SLOT];
	int lvl;

	for (lvl = 0; lvl < ps->performance_level_count; lvl++)
		ni_convert_mc_reg_table_entry_to_smc(rdev,
						     &ps->performance_levels[lvl],
						     &slot[lvl]);
}
2994 
ni_populate_mc_reg_table(struct radeon_device * rdev,struct radeon_ps * radeon_boot_state)2995 static int ni_populate_mc_reg_table(struct radeon_device *rdev,
2996 				    struct radeon_ps *radeon_boot_state)
2997 {
2998 	struct rv7xx_power_info *pi = rv770_get_pi(rdev);
2999 	struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
3000 	struct ni_power_info *ni_pi = ni_get_pi(rdev);
3001 	struct ni_ps *boot_state = ni_get_ps(radeon_boot_state);
3002 	SMC_NIslands_MCRegisters *mc_reg_table = &ni_pi->smc_mc_reg_table;
3003 
3004 	memset(mc_reg_table, 0, sizeof(SMC_NIslands_MCRegisters));
3005 
3006 	rv770_write_smc_soft_register(rdev, NI_SMC_SOFT_REGISTER_seq_index, 1);
3007 
3008 	ni_populate_mc_reg_addresses(rdev, mc_reg_table);
3009 
3010 	ni_convert_mc_reg_table_entry_to_smc(rdev, &boot_state->performance_levels[0],
3011 					     &mc_reg_table->data[0]);
3012 
3013 	ni_convert_mc_registers(&ni_pi->mc_reg_table.mc_reg_table_entry[0],
3014 				&mc_reg_table->data[1],
3015 				ni_pi->mc_reg_table.last,
3016 				ni_pi->mc_reg_table.valid_flag);
3017 
3018 	ni_convert_mc_reg_table_to_smc(rdev, radeon_boot_state, mc_reg_table);
3019 
3020 	return rv770_copy_bytes_to_smc(rdev, eg_pi->mc_reg_table_start,
3021 				       (u8 *)mc_reg_table,
3022 				       sizeof(SMC_NIslands_MCRegisters),
3023 				       pi->sram_end);
3024 }
3025 
ni_upload_mc_reg_table(struct radeon_device * rdev,struct radeon_ps * radeon_new_state)3026 static int ni_upload_mc_reg_table(struct radeon_device *rdev,
3027 				  struct radeon_ps *radeon_new_state)
3028 {
3029 	struct rv7xx_power_info *pi = rv770_get_pi(rdev);
3030 	struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
3031 	struct ni_power_info *ni_pi = ni_get_pi(rdev);
3032 	struct ni_ps *ni_new_state = ni_get_ps(radeon_new_state);
3033 	SMC_NIslands_MCRegisters *mc_reg_table = &ni_pi->smc_mc_reg_table;
3034 	u16 address;
3035 
3036 	memset(mc_reg_table, 0, sizeof(SMC_NIslands_MCRegisters));
3037 
3038 	ni_convert_mc_reg_table_to_smc(rdev, radeon_new_state, mc_reg_table);
3039 
3040 	address = eg_pi->mc_reg_table_start +
3041 		(u16)offsetof(SMC_NIslands_MCRegisters, data[NISLANDS_MCREGISTERTABLE_FIRST_DRIVERSTATE_SLOT]);
3042 
3043 	return rv770_copy_bytes_to_smc(rdev, address,
3044 				       (u8 *)&mc_reg_table->data[NISLANDS_MCREGISTERTABLE_FIRST_DRIVERSTATE_SLOT],
3045 				       sizeof(SMC_NIslands_MCRegisterSet) * ni_new_state->performance_level_count,
3046 				       pi->sram_end);
3047 }
3048 
/*
 * Fill the CAC leakage lookup table from the driver's leakage model.
 *
 * For every temperature row and every VDDC voltage table entry (at most
 * SMC_NISLANDS_LKGE_LUT_NUM_OF_VOLT_ENTRIES columns) the leakage is computed
 * with ni_calculate_leakage_for_v_and_t(), scaled for the SMC and stored big
 * endian.  Columns without a voltage entry are filled with the largest value
 * that was computed.
 *
 * Always returns 0.
 */
static int ni_init_driver_calculated_leakage_table(struct radeon_device *rdev,
						   PP_NIslands_CACTABLES *cac_tables)
{
	struct ni_power_info *ni_pi = ni_get_pi(rdev);
	struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
	unsigned int temp_idx, volt_idx, volt_count;
	u32 scaling_factor, smc_leakage;
	u32 max_leakage = 0;
	u32 leakage = 0;
	s32 t;

	volt_count = eg_pi->vddc_voltage_table.count;
	if (volt_count > SMC_NISLANDS_LKGE_LUT_NUM_OF_VOLT_ENTRIES)
		volt_count = SMC_NISLANDS_LKGE_LUT_NUM_OF_VOLT_ENTRIES;

	scaling_factor = ni_get_smc_power_scaling_factor(rdev);

	for (temp_idx = 0; temp_idx < SMC_NISLANDS_LKGE_LUT_NUM_OF_TEMP_ENTRIES; temp_idx++) {
		for (volt_idx = 0; volt_idx < volt_count; volt_idx++) {
			/* Row temperature, clamped to the configured minimum. */
			t = (1000 * ((temp_idx + 1) * 8));
			if (t < ni_pi->cac_data.leakage_minimum_temperature)
				t = ni_pi->cac_data.leakage_minimum_temperature;

			ni_calculate_leakage_for_v_and_t(rdev,
							 &ni_pi->cac_data.leakage_coefficients,
							 eg_pi->vddc_voltage_table.entries[volt_idx].value,
							 t,
							 ni_pi->cac_data.i_leakage,
							 &leakage);

			smc_leakage = ni_scale_power_for_smc(leakage, scaling_factor) / 1000;
			cac_tables->cac_lkge_lut[temp_idx][volt_idx] = cpu_to_be32(smc_leakage);

			if (max_leakage < smc_leakage)
				max_leakage = smc_leakage;
		}
	}

	/* Pad the unused voltage columns with the maximum leakage. */
	for (temp_idx = 0; temp_idx < SMC_NISLANDS_LKGE_LUT_NUM_OF_TEMP_ENTRIES; temp_idx++) {
		for (volt_idx = volt_count; volt_idx < SMC_NISLANDS_LKGE_LUT_NUM_OF_VOLT_ENTRIES; volt_idx++)
			cac_tables->cac_lkge_lut[temp_idx][volt_idx] = cpu_to_be32(max_leakage);
	}

	return 0;
}
3095 
/*
 * Fill the CAC leakage lookup table from the platform's CAC leakage table.
 *
 * The number of columns used is the smaller of the leakage table size and
 * the VDDC voltage table size, capped at
 * SMC_NISLANDS_LKGE_LUT_NUM_OF_VOLT_ENTRIES.  Each column holds the same
 * scaled leakage value for every temperature row; remaining columns get the
 * scaled maximum leakage.
 *
 * Returns 0 on success, -EINVAL if no column is available.
 */
static int ni_init_simplified_leakage_table(struct radeon_device *rdev,
					    PP_NIslands_CACTABLES *cac_tables)
{
	struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
	struct radeon_cac_leakage_table *leakage_table =
		&rdev->pm.dpm.dyn_state.cac_leakage_table;
	u32 temp_idx, volt_idx, volt_count;
	u32 scaling_factor, smc_leakage;
	u32 max_leakage = 0;

	volt_count = leakage_table->count;
	if (eg_pi->vddc_voltage_table.count < volt_count)
		volt_count = eg_pi->vddc_voltage_table.count;
	if (volt_count > SMC_NISLANDS_LKGE_LUT_NUM_OF_VOLT_ENTRIES)
		volt_count = SMC_NISLANDS_LKGE_LUT_NUM_OF_VOLT_ENTRIES;

	if (!volt_count)
		return -EINVAL;

	scaling_factor = ni_get_smc_power_scaling_factor(rdev);

	for (volt_idx = 0; volt_idx < volt_count; volt_idx++) {
		smc_leakage = leakage_table->entries[volt_idx].leakage;
		if (max_leakage < smc_leakage)
			max_leakage = smc_leakage;

		/* The value does not depend on temperature in this mode. */
		for (temp_idx = 0; temp_idx < SMC_NISLANDS_LKGE_LUT_NUM_OF_TEMP_ENTRIES; temp_idx++)
			cac_tables->cac_lkge_lut[temp_idx][volt_idx] =
				cpu_to_be32(ni_scale_power_for_smc(smc_leakage, scaling_factor));
	}

	/* Pad the unused voltage columns with the maximum leakage. */
	for (volt_idx = volt_count; volt_idx < SMC_NISLANDS_LKGE_LUT_NUM_OF_VOLT_ENTRIES; volt_idx++) {
		for (temp_idx = 0; temp_idx < SMC_NISLANDS_LKGE_LUT_NUM_OF_TEMP_ENTRIES; temp_idx++)
			cac_tables->cac_lkge_lut[temp_idx][volt_idx] =
				cpu_to_be32(ni_scale_power_for_smc(max_leakage, scaling_factor));
	}

	return 0;
}
3138 
ni_initialize_smc_cac_tables(struct radeon_device * rdev)3139 static int ni_initialize_smc_cac_tables(struct radeon_device *rdev)
3140 {
3141 	struct rv7xx_power_info *pi = rv770_get_pi(rdev);
3142 	struct ni_power_info *ni_pi = ni_get_pi(rdev);
3143 	PP_NIslands_CACTABLES *cac_tables = NULL;
3144 	int i, ret;
3145 	u32 reg;
3146 
3147 	if (ni_pi->enable_cac == false)
3148 		return 0;
3149 
3150 	cac_tables = kzalloc(sizeof(PP_NIslands_CACTABLES), GFP_KERNEL);
3151 	if (!cac_tables)
3152 		return -ENOMEM;
3153 
3154 	reg = RREG32(CG_CAC_CTRL) & ~(TID_CNT_MASK | TID_UNIT_MASK);
3155 	reg |= (TID_CNT(ni_pi->cac_weights->tid_cnt) |
3156 		TID_UNIT(ni_pi->cac_weights->tid_unit));
3157 	WREG32(CG_CAC_CTRL, reg);
3158 
3159 	for (i = 0; i < NISLANDS_DCCAC_MAX_LEVELS; i++)
3160 		ni_pi->dc_cac_table[i] = ni_pi->cac_weights->dc_cac[i];
3161 
3162 	for (i = 0; i < SMC_NISLANDS_BIF_LUT_NUM_OF_ENTRIES; i++)
3163 		cac_tables->cac_bif_lut[i] = ni_pi->cac_weights->pcie_cac[i];
3164 
3165 	ni_pi->cac_data.i_leakage = rdev->pm.dpm.cac_leakage;
3166 	ni_pi->cac_data.pwr_const = 0;
3167 	ni_pi->cac_data.dc_cac_value = ni_pi->dc_cac_table[NISLANDS_DCCAC_LEVEL_0];
3168 	ni_pi->cac_data.bif_cac_value = 0;
3169 	ni_pi->cac_data.mc_wr_weight = ni_pi->cac_weights->mc_write_weight;
3170 	ni_pi->cac_data.mc_rd_weight = ni_pi->cac_weights->mc_read_weight;
3171 	ni_pi->cac_data.allow_ovrflw = 0;
3172 	ni_pi->cac_data.l2num_win_tdp = ni_pi->lta_window_size;
3173 	ni_pi->cac_data.num_win_tdp = 0;
3174 	ni_pi->cac_data.lts_truncate_n = ni_pi->lts_truncate;
3175 
3176 	if (ni_pi->driver_calculate_cac_leakage)
3177 		ret = ni_init_driver_calculated_leakage_table(rdev, cac_tables);
3178 	else
3179 		ret = ni_init_simplified_leakage_table(rdev, cac_tables);
3180 
3181 	if (ret)
3182 		goto done_free;
3183 
3184 	cac_tables->pwr_const      = cpu_to_be32(ni_pi->cac_data.pwr_const);
3185 	cac_tables->dc_cacValue    = cpu_to_be32(ni_pi->cac_data.dc_cac_value);
3186 	cac_tables->bif_cacValue   = cpu_to_be32(ni_pi->cac_data.bif_cac_value);
3187 	cac_tables->AllowOvrflw    = ni_pi->cac_data.allow_ovrflw;
3188 	cac_tables->MCWrWeight     = ni_pi->cac_data.mc_wr_weight;
3189 	cac_tables->MCRdWeight     = ni_pi->cac_data.mc_rd_weight;
3190 	cac_tables->numWin_TDP     = ni_pi->cac_data.num_win_tdp;
3191 	cac_tables->l2numWin_TDP   = ni_pi->cac_data.l2num_win_tdp;
3192 	cac_tables->lts_truncate_n = ni_pi->cac_data.lts_truncate_n;
3193 
3194 	ret = rv770_copy_bytes_to_smc(rdev, ni_pi->cac_table_start, (u8 *)cac_tables,
3195 				      sizeof(PP_NIslands_CACTABLES), pi->sram_end);
3196 
3197 done_free:
3198 	if (ret) {
3199 		ni_pi->enable_cac = false;
3200 		ni_pi->enable_power_containment = false;
3201 	}
3202 
3203 	kfree(cac_tables);
3204 
3205 	return 0;
3206 }
3207 
ni_initialize_hardware_cac_manager(struct radeon_device * rdev)3208 static int ni_initialize_hardware_cac_manager(struct radeon_device *rdev)
3209 {
3210 	struct ni_power_info *ni_pi = ni_get_pi(rdev);
3211 	u32 reg;
3212 
3213 	if (!ni_pi->enable_cac ||
3214 	    !ni_pi->cac_configuration_required)
3215 		return 0;
3216 
3217 	if (ni_pi->cac_weights == NULL)
3218 		return -EINVAL;
3219 
3220 	reg = RREG32_CG(CG_CAC_REGION_1_WEIGHT_0) & ~(WEIGHT_TCP_SIG0_MASK |
3221 						      WEIGHT_TCP_SIG1_MASK |
3222 						      WEIGHT_TA_SIG_MASK);
3223 	reg |= (WEIGHT_TCP_SIG0(ni_pi->cac_weights->weight_tcp_sig0) |
3224 		WEIGHT_TCP_SIG1(ni_pi->cac_weights->weight_tcp_sig1) |
3225 		WEIGHT_TA_SIG(ni_pi->cac_weights->weight_ta_sig));
3226 	WREG32_CG(CG_CAC_REGION_1_WEIGHT_0, reg);
3227 
3228 	reg = RREG32_CG(CG_CAC_REGION_1_WEIGHT_1) & ~(WEIGHT_TCC_EN0_MASK |
3229 						      WEIGHT_TCC_EN1_MASK |
3230 						      WEIGHT_TCC_EN2_MASK);
3231 	reg |= (WEIGHT_TCC_EN0(ni_pi->cac_weights->weight_tcc_en0) |
3232 		WEIGHT_TCC_EN1(ni_pi->cac_weights->weight_tcc_en1) |
3233 		WEIGHT_TCC_EN2(ni_pi->cac_weights->weight_tcc_en2));
3234 	WREG32_CG(CG_CAC_REGION_1_WEIGHT_1, reg);
3235 
3236 	reg = RREG32_CG(CG_CAC_REGION_2_WEIGHT_0) & ~(WEIGHT_CB_EN0_MASK |
3237 						      WEIGHT_CB_EN1_MASK |
3238 						      WEIGHT_CB_EN2_MASK |
3239 						      WEIGHT_CB_EN3_MASK);
3240 	reg |= (WEIGHT_CB_EN0(ni_pi->cac_weights->weight_cb_en0) |
3241 		WEIGHT_CB_EN1(ni_pi->cac_weights->weight_cb_en1) |
3242 		WEIGHT_CB_EN2(ni_pi->cac_weights->weight_cb_en2) |
3243 		WEIGHT_CB_EN3(ni_pi->cac_weights->weight_cb_en3));
3244 	WREG32_CG(CG_CAC_REGION_2_WEIGHT_0, reg);
3245 
3246 	reg = RREG32_CG(CG_CAC_REGION_2_WEIGHT_1) & ~(WEIGHT_DB_SIG0_MASK |
3247 						      WEIGHT_DB_SIG1_MASK |
3248 						      WEIGHT_DB_SIG2_MASK |
3249 						      WEIGHT_DB_SIG3_MASK);
3250 	reg |= (WEIGHT_DB_SIG0(ni_pi->cac_weights->weight_db_sig0) |
3251 		WEIGHT_DB_SIG1(ni_pi->cac_weights->weight_db_sig1) |
3252 		WEIGHT_DB_SIG2(ni_pi->cac_weights->weight_db_sig2) |
3253 		WEIGHT_DB_SIG3(ni_pi->cac_weights->weight_db_sig3));
3254 	WREG32_CG(CG_CAC_REGION_2_WEIGHT_1, reg);
3255 
3256 	reg = RREG32_CG(CG_CAC_REGION_2_WEIGHT_2) & ~(WEIGHT_SXM_SIG0_MASK |
3257 						      WEIGHT_SXM_SIG1_MASK |
3258 						      WEIGHT_SXM_SIG2_MASK |
3259 						      WEIGHT_SXS_SIG0_MASK |
3260 						      WEIGHT_SXS_SIG1_MASK);
3261 	reg |= (WEIGHT_SXM_SIG0(ni_pi->cac_weights->weight_sxm_sig0) |
3262 		WEIGHT_SXM_SIG1(ni_pi->cac_weights->weight_sxm_sig1) |
3263 		WEIGHT_SXM_SIG2(ni_pi->cac_weights->weight_sxm_sig2) |
3264 		WEIGHT_SXS_SIG0(ni_pi->cac_weights->weight_sxs_sig0) |
3265 		WEIGHT_SXS_SIG1(ni_pi->cac_weights->weight_sxs_sig1));
3266 	WREG32_CG(CG_CAC_REGION_2_WEIGHT_2, reg);
3267 
3268 	reg = RREG32_CG(CG_CAC_REGION_3_WEIGHT_0) & ~(WEIGHT_XBR_0_MASK |
3269 						      WEIGHT_XBR_1_MASK |
3270 						      WEIGHT_XBR_2_MASK |
3271 						      WEIGHT_SPI_SIG0_MASK);
3272 	reg |= (WEIGHT_XBR_0(ni_pi->cac_weights->weight_xbr_0) |
3273 		WEIGHT_XBR_1(ni_pi->cac_weights->weight_xbr_1) |
3274 		WEIGHT_XBR_2(ni_pi->cac_weights->weight_xbr_2) |
3275 		WEIGHT_SPI_SIG0(ni_pi->cac_weights->weight_spi_sig0));
3276 	WREG32_CG(CG_CAC_REGION_3_WEIGHT_0, reg);
3277 
3278 	reg = RREG32_CG(CG_CAC_REGION_3_WEIGHT_1) & ~(WEIGHT_SPI_SIG1_MASK |
3279 						      WEIGHT_SPI_SIG2_MASK |
3280 						      WEIGHT_SPI_SIG3_MASK |
3281 						      WEIGHT_SPI_SIG4_MASK |
3282 						      WEIGHT_SPI_SIG5_MASK);
3283 	reg |= (WEIGHT_SPI_SIG1(ni_pi->cac_weights->weight_spi_sig1) |
3284 		WEIGHT_SPI_SIG2(ni_pi->cac_weights->weight_spi_sig2) |
3285 		WEIGHT_SPI_SIG3(ni_pi->cac_weights->weight_spi_sig3) |
3286 		WEIGHT_SPI_SIG4(ni_pi->cac_weights->weight_spi_sig4) |
3287 		WEIGHT_SPI_SIG5(ni_pi->cac_weights->weight_spi_sig5));
3288 	WREG32_CG(CG_CAC_REGION_3_WEIGHT_1, reg);
3289 
3290 	reg = RREG32_CG(CG_CAC_REGION_4_WEIGHT_0) & ~(WEIGHT_LDS_SIG0_MASK |
3291 						      WEIGHT_LDS_SIG1_MASK |
3292 						      WEIGHT_SC_MASK);
3293 	reg |= (WEIGHT_LDS_SIG0(ni_pi->cac_weights->weight_lds_sig0) |
3294 		WEIGHT_LDS_SIG1(ni_pi->cac_weights->weight_lds_sig1) |
3295 		WEIGHT_SC(ni_pi->cac_weights->weight_sc));
3296 	WREG32_CG(CG_CAC_REGION_4_WEIGHT_0, reg);
3297 
3298 	reg = RREG32_CG(CG_CAC_REGION_4_WEIGHT_1) & ~(WEIGHT_BIF_MASK |
3299 						      WEIGHT_CP_MASK |
3300 						      WEIGHT_PA_SIG0_MASK |
3301 						      WEIGHT_PA_SIG1_MASK |
3302 						      WEIGHT_VGT_SIG0_MASK);
3303 	reg |= (WEIGHT_BIF(ni_pi->cac_weights->weight_bif) |
3304 		WEIGHT_CP(ni_pi->cac_weights->weight_cp) |
3305 		WEIGHT_PA_SIG0(ni_pi->cac_weights->weight_pa_sig0) |
3306 		WEIGHT_PA_SIG1(ni_pi->cac_weights->weight_pa_sig1) |
3307 		WEIGHT_VGT_SIG0(ni_pi->cac_weights->weight_vgt_sig0));
3308 	WREG32_CG(CG_CAC_REGION_4_WEIGHT_1, reg);
3309 
3310 	reg = RREG32_CG(CG_CAC_REGION_4_WEIGHT_2) & ~(WEIGHT_VGT_SIG1_MASK |
3311 						      WEIGHT_VGT_SIG2_MASK |
3312 						      WEIGHT_DC_SIG0_MASK |
3313 						      WEIGHT_DC_SIG1_MASK |
3314 						      WEIGHT_DC_SIG2_MASK);
3315 	reg |= (WEIGHT_VGT_SIG1(ni_pi->cac_weights->weight_vgt_sig1) |
3316 		WEIGHT_VGT_SIG2(ni_pi->cac_weights->weight_vgt_sig2) |
3317 		WEIGHT_DC_SIG0(ni_pi->cac_weights->weight_dc_sig0) |
3318 		WEIGHT_DC_SIG1(ni_pi->cac_weights->weight_dc_sig1) |
3319 		WEIGHT_DC_SIG2(ni_pi->cac_weights->weight_dc_sig2));
3320 	WREG32_CG(CG_CAC_REGION_4_WEIGHT_2, reg);
3321 
3322 	reg = RREG32_CG(CG_CAC_REGION_4_WEIGHT_3) & ~(WEIGHT_DC_SIG3_MASK |
3323 						      WEIGHT_UVD_SIG0_MASK |
3324 						      WEIGHT_UVD_SIG1_MASK |
3325 						      WEIGHT_SPARE0_MASK |
3326 						      WEIGHT_SPARE1_MASK);
3327 	reg |= (WEIGHT_DC_SIG3(ni_pi->cac_weights->weight_dc_sig3) |
3328 		WEIGHT_UVD_SIG0(ni_pi->cac_weights->weight_uvd_sig0) |
3329 		WEIGHT_UVD_SIG1(ni_pi->cac_weights->weight_uvd_sig1) |
3330 		WEIGHT_SPARE0(ni_pi->cac_weights->weight_spare0) |
3331 		WEIGHT_SPARE1(ni_pi->cac_weights->weight_spare1));
3332 	WREG32_CG(CG_CAC_REGION_4_WEIGHT_3, reg);
3333 
3334 	reg = RREG32_CG(CG_CAC_REGION_5_WEIGHT_0) & ~(WEIGHT_SQ_VSP_MASK |
3335 						      WEIGHT_SQ_VSP0_MASK);
3336 	reg |= (WEIGHT_SQ_VSP(ni_pi->cac_weights->weight_sq_vsp) |
3337 		WEIGHT_SQ_VSP0(ni_pi->cac_weights->weight_sq_vsp0));
3338 	WREG32_CG(CG_CAC_REGION_5_WEIGHT_0, reg);
3339 
3340 	reg = RREG32_CG(CG_CAC_REGION_5_WEIGHT_1) & ~(WEIGHT_SQ_GPR_MASK);
3341 	reg |= WEIGHT_SQ_GPR(ni_pi->cac_weights->weight_sq_gpr);
3342 	WREG32_CG(CG_CAC_REGION_5_WEIGHT_1, reg);
3343 
3344 	reg = RREG32_CG(CG_CAC_REGION_4_OVERRIDE_4) & ~(OVR_MODE_SPARE_0_MASK |
3345 							OVR_VAL_SPARE_0_MASK |
3346 							OVR_MODE_SPARE_1_MASK |
3347 							OVR_VAL_SPARE_1_MASK);
3348 	reg |= (OVR_MODE_SPARE_0(ni_pi->cac_weights->ovr_mode_spare_0) |
3349 		OVR_VAL_SPARE_0(ni_pi->cac_weights->ovr_val_spare_0) |
3350 		OVR_MODE_SPARE_1(ni_pi->cac_weights->ovr_mode_spare_1) |
3351 		OVR_VAL_SPARE_1(ni_pi->cac_weights->ovr_val_spare_1));
3352 	WREG32_CG(CG_CAC_REGION_4_OVERRIDE_4, reg);
3353 
3354 	reg = RREG32(SQ_CAC_THRESHOLD) & ~(VSP_MASK |
3355 					   VSP0_MASK |
3356 					   GPR_MASK);
3357 	reg |= (VSP(ni_pi->cac_weights->vsp) |
3358 		VSP0(ni_pi->cac_weights->vsp0) |
3359 		GPR(ni_pi->cac_weights->gpr));
3360 	WREG32(SQ_CAC_THRESHOLD, reg);
3361 
3362 	reg = (MCDW_WR_ENABLE |
3363 	       MCDX_WR_ENABLE |
3364 	       MCDY_WR_ENABLE |
3365 	       MCDZ_WR_ENABLE |
3366 	       INDEX(0x09D4));
3367 	WREG32(MC_CG_CONFIG, reg);
3368 
3369 	reg = (READ_WEIGHT(ni_pi->cac_weights->mc_read_weight) |
3370 	       WRITE_WEIGHT(ni_pi->cac_weights->mc_write_weight) |
3371 	       ALLOW_OVERFLOW);
3372 	WREG32(MC_CG_DATAPORT, reg);
3373 
3374 	return 0;
3375 }
3376 
/*
 * Enable or disable CAC in the SMC.
 *
 * Nothing is done when CAC is disabled in the NI power info.  An enable
 * request is skipped for UVD states.  A disable request is only sent while
 * ni_pi->cac_enabled is set.  If the SMC rejects a long-term-average
 * message, long-term-average support is dropped for later calls.
 *
 * Returns 0, or -EINVAL if PPSMC_MSG_EnableCac was not acknowledged with
 * PPSMC_Result_OK.  Failures of the other messages are not reported.
 */
static int ni_enable_smc_cac(struct radeon_device *rdev,
			     struct radeon_ps *radeon_new_state,
			     bool enable)
{
	struct ni_power_info *ni_pi = ni_get_pi(rdev);
	PPSMC_Result smc_result;

	if (!ni_pi->enable_cac)
		return 0;

	if (!enable) {
		if (!ni_pi->cac_enabled)
			return 0;

		/* The reply to the disable message is not checked. */
		rv770_send_msg_to_smc(rdev, PPSMC_MSG_DisableCac);
		ni_pi->cac_enabled = false;

		if (ni_pi->support_cac_long_term_average) {
			smc_result = rv770_send_msg_to_smc(rdev, PPSMC_CACLongTermAvgDisable);
			if (smc_result != PPSMC_Result_OK)
				ni_pi->support_cac_long_term_average = false;
		}

		return 0;
	}

	if (r600_is_uvd_state(radeon_new_state->class, radeon_new_state->class2))
		return 0;

	/* The reply to this message is not checked. */
	rv770_send_msg_to_smc(rdev, PPSMC_MSG_CollectCAC_PowerCorreln);

	if (ni_pi->support_cac_long_term_average) {
		smc_result = rv770_send_msg_to_smc(rdev, PPSMC_CACLongTermAvgEnable);
		if (smc_result != PPSMC_Result_OK)
			ni_pi->support_cac_long_term_average = false;
	}

	smc_result = rv770_send_msg_to_smc(rdev, PPSMC_MSG_EnableCac);
	ni_pi->cac_enabled = (smc_result == PPSMC_Result_OK);

	return ni_pi->cac_enabled ? 0 : -EINVAL;
}
3417 
/*
 * Forward a PCIe performance request to the platform via ACPI.
 *
 * PECI GEN1/GEN2 requests are forwarded; on the first such request the
 * device-ready notification is sent beforehand and the registration is
 * remembered.  PCIE_PERF_REQ_REMOVE_REGISTRY is forwarded only while
 * registered and clears the registration.  Everything else, and every
 * request when CONFIG_ACPI is not set, returns 0 without doing anything.
 */
static int ni_pcie_performance_request(struct radeon_device *rdev,
				       u8 perf_req, bool advertise)
{
#if defined(CONFIG_ACPI)
	struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);

	if (perf_req == PCIE_PERF_REQ_PECI_GEN1 ||
	    perf_req == PCIE_PERF_REQ_PECI_GEN2) {
		if (!eg_pi->pcie_performance_request_registered)
			radeon_acpi_pcie_notify_device_ready(rdev);
		eg_pi->pcie_performance_request_registered = true;

		return radeon_acpi_pcie_performance_request(rdev, perf_req, advertise);
	}

	if (perf_req == PCIE_PERF_REQ_REMOVE_REGISTRY &&
	    eg_pi->pcie_performance_request_registered) {
		eg_pi->pcie_performance_request_registered = false;

		return radeon_acpi_pcie_performance_request(rdev, perf_req, advertise);
	}
#endif
	return 0;
}
3438 
ni_advertise_gen2_capability(struct radeon_device * rdev)3439 static int ni_advertise_gen2_capability(struct radeon_device *rdev)
3440 {
3441 	struct rv7xx_power_info *pi = rv770_get_pi(rdev);
3442 	u32 tmp;
3443 
3444 	tmp = RREG32_PCIE_PORT(PCIE_LC_SPEED_CNTL);
3445 
3446 	if ((tmp & LC_OTHER_SIDE_EVER_SENT_GEN2) &&
3447 	    (tmp & LC_OTHER_SIDE_SUPPORTS_GEN2))
3448 		pi->pcie_gen2 = true;
3449 	else
3450 		pi->pcie_gen2 = false;
3451 
3452 	if (!pi->pcie_gen2)
3453 		ni_pcie_performance_request(rdev, PCIE_PERF_REQ_PECI_GEN2, true);
3454 
3455 	return 0;
3456 }
3457 
/*
 * Configure the BIF / PCIe link controller for dynamic gen2 switching.
 *
 * Nothing is touched unless PCIE_LC_SPEED_CNTL reports that the link partner
 * supports gen2 and has ever sent gen2.  If the board did not boot in gen2,
 * a client request of 0xd is first written to CG_BIF_REQ_AND_RSP.
 *
 * Enabling sets the hardware voltage interface control field to 1 and the
 * gen2 strap, and pulses LC_CLR_FAILED_SPD_CHANGE_CNT for 10us.  Disabling
 * clears the voltage interface control field and the gen2 strap, but only
 * if the board did not boot in gen2; the register is written back either
 * way.
 */
static void ni_enable_bif_dynamic_pcie_gen2(struct radeon_device *rdev,
					    bool enable)
{
	struct rv7xx_power_info *pi = rv770_get_pi(rdev);
	u32 speed_cntl, bif;

	speed_cntl = RREG32_PCIE_PORT(PCIE_LC_SPEED_CNTL);

	if (!(speed_cntl & LC_OTHER_SIDE_EVER_SENT_GEN2) ||
	    !(speed_cntl & LC_OTHER_SIDE_SUPPORTS_GEN2))
		return;

	/* Common to both directions when the board did not boot in gen2. */
	if (!pi->boot_in_gen2) {
		bif = RREG32(CG_BIF_REQ_AND_RSP) & ~CG_CLIENT_REQ_MASK;
		bif |= CG_CLIENT_REQ(0xd);
		WREG32(CG_BIF_REQ_AND_RSP, bif);
	}

	if (!enable) {
		if (!pi->boot_in_gen2) {
			speed_cntl &= ~LC_HW_VOLTAGE_IF_CONTROL_MASK;
			speed_cntl &= ~LC_GEN2_EN_STRAP;
		}
		WREG32_PCIE_PORT(PCIE_LC_SPEED_CNTL, speed_cntl);
		return;
	}

	speed_cntl &= ~LC_HW_VOLTAGE_IF_CONTROL_MASK;
	speed_cntl |= LC_HW_VOLTAGE_IF_CONTROL(1);
	speed_cntl |= LC_GEN2_EN_STRAP;

	/* Pulse the clear bit for the failed-speed-change counter. */
	speed_cntl |= LC_CLR_FAILED_SPD_CHANGE_CNT;
	WREG32_PCIE_PORT(PCIE_LC_SPEED_CNTL, speed_cntl);
	udelay(10);
	speed_cntl &= ~LC_CLR_FAILED_SPD_CHANGE_CNT;
	WREG32_PCIE_PORT(PCIE_LC_SPEED_CNTL, speed_cntl);
}
3496 
/*
 * Enable or disable dynamic PCIE gen2 switching: program the BIF/link
 * controller first, then set or clear ENABLE_GEN2PCIE in GENERAL_PWRMGT.
 */
static void ni_enable_dynamic_pcie_gen2(struct radeon_device *rdev,
					bool enable)
{
	ni_enable_bif_dynamic_pcie_gen2(rdev, enable);

	WREG32_P(GENERAL_PWRMGT, enable ? ENABLE_GEN2PCIE : 0, ~ENABLE_GEN2PCIE);
}
3507 
ni_set_uvd_clock_before_set_eng_clock(struct radeon_device * rdev,struct radeon_ps * new_ps,struct radeon_ps * old_ps)3508 void ni_set_uvd_clock_before_set_eng_clock(struct radeon_device *rdev,
3509 					   struct radeon_ps *new_ps,
3510 					   struct radeon_ps *old_ps)
3511 {
3512 	struct ni_ps *new_state = ni_get_ps(new_ps);
3513 	struct ni_ps *current_state = ni_get_ps(old_ps);
3514 
3515 	if ((new_ps->vclk == old_ps->vclk) &&
3516 	    (new_ps->dclk == old_ps->dclk))
3517 		return;
3518 
3519 	if (new_state->performance_levels[new_state->performance_level_count - 1].sclk >=
3520 	    current_state->performance_levels[current_state->performance_level_count - 1].sclk)
3521 		return;
3522 
3523 	radeon_set_uvd_clocks(rdev, new_ps->vclk, new_ps->dclk);
3524 }
3525 
ni_set_uvd_clock_after_set_eng_clock(struct radeon_device * rdev,struct radeon_ps * new_ps,struct radeon_ps * old_ps)3526 void ni_set_uvd_clock_after_set_eng_clock(struct radeon_device *rdev,
3527 					  struct radeon_ps *new_ps,
3528 					  struct radeon_ps *old_ps)
3529 {
3530 	struct ni_ps *new_state = ni_get_ps(new_ps);
3531 	struct ni_ps *current_state = ni_get_ps(old_ps);
3532 
3533 	if ((new_ps->vclk == old_ps->vclk) &&
3534 	    (new_ps->dclk == old_ps->dclk))
3535 		return;
3536 
3537 	if (new_state->performance_levels[new_state->performance_level_count - 1].sclk <
3538 	    current_state->performance_levels[current_state->performance_level_count - 1].sclk)
3539 		return;
3540 
3541 	radeon_set_uvd_clocks(rdev, new_ps->vclk, new_ps->dclk);
3542 }
3543 
ni_dpm_setup_asic(struct radeon_device * rdev)3544 void ni_dpm_setup_asic(struct radeon_device *rdev)
3545 {
3546 	struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
3547 	int r;
3548 
3549 	r = ni_mc_load_microcode(rdev);
3550 	if (r)
3551 		DRM_ERROR("Failed to load MC firmware!\n");
3552 	ni_read_clock_registers(rdev);
3553 	btc_read_arb_registers(rdev);
3554 	rv770_get_memory_type(rdev);
3555 	if (eg_pi->pcie_performance_request)
3556 		ni_advertise_gen2_capability(rdev);
3557 	rv770_get_pcie_gen2_status(rdev);
3558 	rv770_enable_acpi_pm(rdev);
3559 }
3560 
ni_update_current_ps(struct radeon_device * rdev,struct radeon_ps * rps)3561 void ni_update_current_ps(struct radeon_device *rdev,
3562 			  struct radeon_ps *rps)
3563 {
3564 	struct ni_ps *new_ps = ni_get_ps(rps);
3565 	struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
3566 	struct ni_power_info *ni_pi = ni_get_pi(rdev);
3567 
3568 	eg_pi->current_rps = *rps;
3569 	ni_pi->current_ps = *new_ps;
3570 	eg_pi->current_rps.ps_priv = &ni_pi->current_ps;
3571 }
3572 
ni_update_requested_ps(struct radeon_device * rdev,struct radeon_ps * rps)3573 void ni_update_requested_ps(struct radeon_device *rdev,
3574 			    struct radeon_ps *rps)
3575 {
3576 	struct ni_ps *new_ps = ni_get_ps(rps);
3577 	struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
3578 	struct ni_power_info *ni_pi = ni_get_pi(rdev);
3579 
3580 	eg_pi->requested_rps = *rps;
3581 	ni_pi->requested_ps = *new_ps;
3582 	eg_pi->requested_rps.ps_priv = &ni_pi->requested_ps;
3583 }
3584 
/*
 * Bring up dynamic power management.
 *
 * Programs the clock-gating defaults, voltage tables, MC register table and
 * the various rv770/cypress timing parameters, uploads the SMC firmware and
 * its tables, starts the SMC and DPM, enables the configured clock gating
 * and the thermal auto-throttle source, and finally records the boot state
 * as the current power state.
 *
 * Returns 0 on success, -EINVAL if btc_dpm_enabled() reports that DPM is
 * already running, or the error code of the first setup step that failed
 * (each such failure is logged with DRM_ERROR).  No rollback of the steps
 * already performed is attempted on failure.
 */
int ni_dpm_enable(struct radeon_device *rdev)
{
	struct rv7xx_power_info *pi = rv770_get_pi(rdev);
	struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
	struct radeon_ps *boot_ps = rdev->pm.dpm.boot_ps;
	int ret;

	/* note: the gfx clock-gating defaults are applied before the
	 * "already enabled" check below
	 */
	if (pi->gfx_clock_gating)
		ni_cg_clockgating_default(rdev);
	if (btc_dpm_enabled(rdev))
		return -EINVAL;
	if (pi->mg_clock_gating)
		ni_mg_clockgating_default(rdev);
	if (eg_pi->ls_clock_gating)
		ni_ls_clockgating_default(rdev);
	if (pi->voltage_control) {
		rv770_enable_voltage_control(rdev, true);
		ret = cypress_construct_voltage_tables(rdev);
		if (ret) {
			DRM_ERROR("cypress_construct_voltage_tables failed\n");
			return ret;
		}
	}
	if (eg_pi->dynamic_ac_timing) {
		/* not fatal: fall back to running without dynamic AC timing */
		ret = ni_initialize_mc_reg_table(rdev);
		if (ret)
			eg_pi->dynamic_ac_timing = false;
	}
	if (pi->dynamic_ss)
		cypress_enable_spread_spectrum(rdev, true);
	if (pi->thermal_protection)
		rv770_enable_thermal_protection(rdev, true);
	rv770_setup_bsp(rdev);
	rv770_program_git(rdev);
	rv770_program_tp(rdev);
	rv770_program_tpp(rdev);
	rv770_program_sstp(rdev);
	cypress_enable_display_gap(rdev);
	rv770_program_vc(rdev);
	if (pi->dynamic_pcie_gen2)
		ni_enable_dynamic_pcie_gen2(rdev, true);
	/* SMC firmware and tables; every failure from here on is fatal */
	ret = rv770_upload_firmware(rdev);
	if (ret) {
		DRM_ERROR("rv770_upload_firmware failed\n");
		return ret;
	}
	ret = ni_process_firmware_header(rdev);
	if (ret) {
		DRM_ERROR("ni_process_firmware_header failed\n");
		return ret;
	}
	ret = ni_initial_switch_from_arb_f0_to_f1(rdev);
	if (ret) {
		DRM_ERROR("ni_initial_switch_from_arb_f0_to_f1 failed\n");
		return ret;
	}
	ret = ni_init_smc_table(rdev);
	if (ret) {
		DRM_ERROR("ni_init_smc_table failed\n");
		return ret;
	}
	ret = ni_init_smc_spll_table(rdev);
	if (ret) {
		DRM_ERROR("ni_init_smc_spll_table failed\n");
		return ret;
	}
	ret = ni_init_arb_table_index(rdev);
	if (ret) {
		DRM_ERROR("ni_init_arb_table_index failed\n");
		return ret;
	}
	if (eg_pi->dynamic_ac_timing) {
		ret = ni_populate_mc_reg_table(rdev, boot_ps);
		if (ret) {
			DRM_ERROR("ni_populate_mc_reg_table failed\n");
			return ret;
		}
	}
	ret = ni_initialize_smc_cac_tables(rdev);
	if (ret) {
		DRM_ERROR("ni_initialize_smc_cac_tables failed\n");
		return ret;
	}
	ret = ni_initialize_hardware_cac_manager(rdev);
	if (ret) {
		DRM_ERROR("ni_initialize_hardware_cac_manager failed\n");
		return ret;
	}
	ret = ni_populate_smc_tdp_limits(rdev, boot_ps);
	if (ret) {
		DRM_ERROR("ni_populate_smc_tdp_limits failed\n");
		return ret;
	}
	ni_program_response_times(rdev);
	/* tables are in place: start the SMC, then DPM itself */
	r7xx_start_smc(rdev);
	ret = cypress_notify_smc_display_change(rdev, false);
	if (ret) {
		DRM_ERROR("cypress_notify_smc_display_change failed\n");
		return ret;
	}
	cypress_enable_sclk_control(rdev, true);
	if (eg_pi->memory_transition)
		cypress_enable_mclk_control(rdev, true);
	cypress_start_dpm(rdev);
	if (pi->gfx_clock_gating)
		ni_gfx_clockgating_enable(rdev, true);
	if (pi->mg_clock_gating)
		ni_mg_clockgating_enable(rdev, true);
	if (eg_pi->ls_clock_gating)
		ni_ls_clockgating_enable(rdev, true);

	rv770_enable_auto_throttle_source(rdev, RADEON_DPM_AUTO_THROTTLE_SRC_THERMAL, true);

	/* DPM starts out in the boot state */
	ni_update_current_ps(rdev, boot_ps);

	return 0;
}
3702 
/*
 * Tear down dynamic power management.
 *
 * Does nothing when btc_dpm_enabled() reports that DPM is not running.
 * Otherwise disables thermal protection, power containment, SMC CAC, spread
 * spectrum, the thermal auto-throttle source, dynamic PCIE gen2 and the
 * configured clock gating, masks the DPM thermal interrupt, stops DPM and
 * the SMC, and records the boot state as the current power state.
 *
 * The return values of ni_enable_power_containment() and
 * ni_enable_smc_cac() are ignored here.
 */
void ni_dpm_disable(struct radeon_device *rdev)
{
	struct rv7xx_power_info *pi = rv770_get_pi(rdev);
	struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
	struct radeon_ps *boot_ps = rdev->pm.dpm.boot_ps;

	if (!btc_dpm_enabled(rdev))
		return;
	rv770_clear_vc(rdev);
	if (pi->thermal_protection)
		rv770_enable_thermal_protection(rdev, false);
	ni_enable_power_containment(rdev, boot_ps, false);
	ni_enable_smc_cac(rdev, boot_ps, false);
	cypress_enable_spread_spectrum(rdev, false);
	rv770_enable_auto_throttle_source(rdev, RADEON_DPM_AUTO_THROTTLE_SRC_THERMAL, false);
	if (pi->dynamic_pcie_gen2)
		ni_enable_dynamic_pcie_gen2(rdev, false);

	/* stop requesting the DPM thermal interrupt */
	if (rdev->irq.installed &&
	    r600_is_internal_thermal_sensor(rdev->pm.int_thermal_type)) {
		rdev->irq.dpm_thermal = false;
		radeon_irq_set(rdev);
	}

	if (pi->gfx_clock_gating)
		ni_gfx_clockgating_enable(rdev, false);
	if (pi->mg_clock_gating)
		ni_mg_clockgating_enable(rdev, false);
	if (eg_pi->ls_clock_gating)
		ni_ls_clockgating_enable(rdev, false);
	ni_stop_dpm(rdev);
	btc_reset_to_default(rdev);
	ni_stop_smc(rdev);
	ni_force_switch_to_arb_f0(rdev);

	/* with DPM off, the boot state is the current state again */
	ni_update_current_ps(rdev, boot_ps);
}
3740 
ni_power_control_set_level(struct radeon_device * rdev)3741 static int ni_power_control_set_level(struct radeon_device *rdev)
3742 {
3743 	struct radeon_ps *new_ps = rdev->pm.dpm.requested_ps;
3744 	int ret;
3745 
3746 	ret = ni_restrict_performance_levels_before_switch(rdev);
3747 	if (ret)
3748 		return ret;
3749 	ret = rv770_halt_smc(rdev);
3750 	if (ret)
3751 		return ret;
3752 	ret = ni_populate_smc_tdp_limits(rdev, new_ps);
3753 	if (ret)
3754 		return ret;
3755 	ret = rv770_resume_smc(rdev);
3756 	if (ret)
3757 		return ret;
3758 	ret = rv770_set_sw_state(rdev);
3759 	if (ret)
3760 		return ret;
3761 
3762 	return 0;
3763 }
3764 
ni_dpm_pre_set_power_state(struct radeon_device * rdev)3765 int ni_dpm_pre_set_power_state(struct radeon_device *rdev)
3766 {
3767 	struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
3768 	struct radeon_ps requested_ps = *rdev->pm.dpm.requested_ps;
3769 	struct radeon_ps *new_ps = &requested_ps;
3770 
3771 	ni_update_requested_ps(rdev, new_ps);
3772 
3773 	ni_apply_state_adjust_rules(rdev, &eg_pi->requested_rps);
3774 
3775 	return 0;
3776 }
3777 
/*
 * Switch the hardware from the current power state to the requested one.
 *
 * Both states are taken from the driver-owned copies in evergreen_power_info
 * (requested_rps / current_rps).  Power containment and SMC CAC are turned
 * off for the duration of the switch, the SMC is halted while the new
 * software state, MC register table and memory timings are uploaded, and it
 * is then resumed and told to switch.  UVD clocks are reprogrammed either
 * before or after the switch by the two ni_set_uvd_clock_* helpers.
 *
 * Returns 0 on success or the error code of the first failing step, which
 * is also logged with DRM_ERROR.  On failure the function returns
 * immediately; steps already performed (including an SMC halt) are not
 * undone here.
 */
int ni_dpm_set_power_state(struct radeon_device *rdev)
{
	struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
	struct radeon_ps *new_ps = &eg_pi->requested_rps;
	struct radeon_ps *old_ps = &eg_pi->current_rps;
	int ret;

	ret = ni_restrict_performance_levels_before_switch(rdev);
	if (ret) {
		DRM_ERROR("ni_restrict_performance_levels_before_switch failed\n");
		return ret;
	}
	ni_set_uvd_clock_before_set_eng_clock(rdev, new_ps, old_ps);
	/* power containment and CAC are off while the state is switched */
	ret = ni_enable_power_containment(rdev, new_ps, false);
	if (ret) {
		DRM_ERROR("ni_enable_power_containment failed\n");
		return ret;
	}
	ret = ni_enable_smc_cac(rdev, new_ps, false);
	if (ret) {
		DRM_ERROR("ni_enable_smc_cac failed\n");
		return ret;
	}
	/* SMC is halted for the uploads below and resumed afterwards */
	ret = rv770_halt_smc(rdev);
	if (ret) {
		DRM_ERROR("rv770_halt_smc failed\n");
		return ret;
	}
	if (eg_pi->smu_uvd_hs)
		btc_notify_uvd_to_smc(rdev, new_ps);
	ret = ni_upload_sw_state(rdev, new_ps);
	if (ret) {
		DRM_ERROR("ni_upload_sw_state failed\n");
		return ret;
	}
	if (eg_pi->dynamic_ac_timing) {
		ret = ni_upload_mc_reg_table(rdev, new_ps);
		if (ret) {
			DRM_ERROR("ni_upload_mc_reg_table failed\n");
			return ret;
		}
	}
	ret = ni_program_memory_timing_parameters(rdev, new_ps);
	if (ret) {
		DRM_ERROR("ni_program_memory_timing_parameters failed\n");
		return ret;
	}
	ret = rv770_resume_smc(rdev);
	if (ret) {
		DRM_ERROR("rv770_resume_smc failed\n");
		return ret;
	}
	ret = rv770_set_sw_state(rdev);
	if (ret) {
		DRM_ERROR("rv770_set_sw_state failed\n");
		return ret;
	}
	ni_set_uvd_clock_after_set_eng_clock(rdev, new_ps, old_ps);
	/* re-enable CAC and power containment, in the reverse order */
	ret = ni_enable_smc_cac(rdev, new_ps, true);
	if (ret) {
		DRM_ERROR("ni_enable_smc_cac failed\n");
		return ret;
	}
	ret = ni_enable_power_containment(rdev, new_ps, true);
	if (ret) {
		DRM_ERROR("ni_enable_power_containment failed\n");
		return ret;
	}

	/* update tdp */
	ret = ni_power_control_set_level(rdev);
	if (ret) {
		DRM_ERROR("ni_power_control_set_level failed\n");
		return ret;
	}

	return 0;
}
3856 
ni_dpm_post_set_power_state(struct radeon_device * rdev)3857 void ni_dpm_post_set_power_state(struct radeon_device *rdev)
3858 {
3859 	struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
3860 	struct radeon_ps *new_ps = &eg_pi->requested_rps;
3861 
3862 	ni_update_current_ps(rdev, new_ps);
3863 }
3864 
/*
 * Compiled out (#if 0): would restrict the performance levels and then ask
 * for the boot state.  Kept for reference only; nothing in this part of the
 * file calls it.
 */
#if 0
void ni_dpm_reset_asic(struct radeon_device *rdev)
{
	ni_restrict_performance_levels_before_switch(rdev);
	rv770_set_boot_state(rdev);
}
#endif
3872 
/*
 * Overlay for the PowerPlayInfo data table in the video BIOS.
 * ni_parse_power_table() casts the table at its BIOS data offset to this
 * union and reads it through the pplib member only.
 */
union power_info {
	struct _ATOM_POWERPLAY_INFO info;
	struct _ATOM_POWERPLAY_INFO_V2 info_2;
	struct _ATOM_POWERPLAY_INFO_V3 info_3;
	struct _ATOM_PPLIB_POWERPLAYTABLE pplib;
	struct _ATOM_PPLIB_POWERPLAYTABLE2 pplib2;
	struct _ATOM_PPLIB_POWERPLAYTABLE3 pplib3;
};
3881 
/*
 * Overlay for one entry of the PPLib clock info array.
 * ni_parse_pplib_clock_info() reads entries through the evergreen member.
 */
union pplib_clock_info {
	struct _ATOM_PPLIB_R600_CLOCK_INFO r600;
	struct _ATOM_PPLIB_RS780_CLOCK_INFO rs780;
	struct _ATOM_PPLIB_EVERGREEN_CLOCK_INFO evergreen;
	struct _ATOM_PPLIB_SUMO_CLOCK_INFO sumo;
};
3888 
/*
 * Overlay for one entry of the PPLib state array.
 * ni_parse_power_table() reads entries through the v1 member.
 */
union pplib_power_state {
	struct _ATOM_PPLIB_STATE v1;
	struct _ATOM_PPLIB_STATE_V2 v2;
};
3893 
/*
 * Fill the generic (non-clock) part of @rps from a PPLib non-clock info
 * entry: caps, classification words and the UVD clocks.
 *
 * UVD clocks come from the table when @table_rev is greater than
 * ATOM_PPLIB_NONCLOCKINFO_VER1; otherwise UVD states get the RV770 default
 * frequencies and all other states get 0.  States classified as BOOT or
 * UVDSTATE are also recorded as rdev->pm.dpm.boot_ps / uvd_ps.
 *
 * Note: the caller in this file passes pplib.ucNonClockSize as @table_rev.
 */
static void ni_parse_pplib_non_clock_info(struct radeon_device *rdev,
					  struct radeon_ps *rps,
					  struct _ATOM_PPLIB_NONCLOCK_INFO *non_clock_info,
					  u8 table_rev)
{
	u32 vclk = 0;
	u32 dclk = 0;

	rps->caps = le32_to_cpu(non_clock_info->ulCapsAndSettings);
	rps->class = le16_to_cpu(non_clock_info->usClassification);
	rps->class2 = le16_to_cpu(non_clock_info->usClassification2);

	if (table_rev > ATOM_PPLIB_NONCLOCKINFO_VER1) {
		vclk = le32_to_cpu(non_clock_info->ulVCLK);
		dclk = le32_to_cpu(non_clock_info->ulDCLK);
	} else if (r600_is_uvd_state(rps->class, rps->class2)) {
		vclk = RV770_DEFAULT_VCLK_FREQ;
		dclk = RV770_DEFAULT_DCLK_FREQ;
	}
	rps->vclk = vclk;
	rps->dclk = dclk;

	if (rps->class & ATOM_PPLIB_CLASSIFICATION_BOOT)
		rdev->pm.dpm.boot_ps = rps;
	if (rps->class & ATOM_PPLIB_CLASSIFICATION_UVDSTATE)
		rdev->pm.dpm.uvd_ps = rps;
}
3919 
ni_parse_pplib_clock_info(struct radeon_device * rdev,struct radeon_ps * rps,int index,union pplib_clock_info * clock_info)3920 static void ni_parse_pplib_clock_info(struct radeon_device *rdev,
3921 				      struct radeon_ps *rps, int index,
3922 				      union pplib_clock_info *clock_info)
3923 {
3924 	struct rv7xx_power_info *pi = rv770_get_pi(rdev);
3925 	struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
3926 	struct ni_ps *ps = ni_get_ps(rps);
3927 	struct rv7xx_pl *pl = &ps->performance_levels[index];
3928 
3929 	ps->performance_level_count = index + 1;
3930 
3931 	pl->sclk = le16_to_cpu(clock_info->evergreen.usEngineClockLow);
3932 	pl->sclk |= clock_info->evergreen.ucEngineClockHigh << 16;
3933 	pl->mclk = le16_to_cpu(clock_info->evergreen.usMemoryClockLow);
3934 	pl->mclk |= clock_info->evergreen.ucMemoryClockHigh << 16;
3935 
3936 	pl->vddc = le16_to_cpu(clock_info->evergreen.usVDDC);
3937 	pl->vddci = le16_to_cpu(clock_info->evergreen.usVDDCI);
3938 	pl->flags = le32_to_cpu(clock_info->evergreen.ulFlags);
3939 
3940 	/* patch up vddc if necessary */
3941 	if (pl->vddc == 0xff01) {
3942 		if (pi->max_vddc)
3943 			pl->vddc = pi->max_vddc;
3944 	}
3945 
3946 	if (rps->class & ATOM_PPLIB_CLASSIFICATION_ACPI) {
3947 		pi->acpi_vddc = pl->vddc;
3948 		eg_pi->acpi_vddci = pl->vddci;
3949 		if (ps->performance_levels[0].flags & ATOM_PPLIB_R600_FLAGS_PCIEGEN2)
3950 			pi->acpi_pcie_gen2 = true;
3951 		else
3952 			pi->acpi_pcie_gen2 = false;
3953 	}
3954 
3955 	if (rps->class2 & ATOM_PPLIB_CLASSIFICATION2_ULV) {
3956 		eg_pi->ulv.supported = true;
3957 		eg_pi->ulv.pl = pl;
3958 	}
3959 
3960 	if (pi->min_vddc_in_table > pl->vddc)
3961 		pi->min_vddc_in_table = pl->vddc;
3962 
3963 	if (pi->max_vddc_in_table < pl->vddc)
3964 		pi->max_vddc_in_table = pl->vddc;
3965 
3966 	/* patch up boot state */
3967 	if (rps->class & ATOM_PPLIB_CLASSIFICATION_BOOT) {
3968 		u16 vddc, vddci, mvdd;
3969 		radeon_atombios_get_default_voltages(rdev, &vddc, &vddci, &mvdd);
3970 		pl->mclk = rdev->clock.default_mclk;
3971 		pl->sclk = rdev->clock.default_sclk;
3972 		pl->vddc = vddc;
3973 		pl->vddci = vddci;
3974 	}
3975 
3976 	if ((rps->class & ATOM_PPLIB_CLASSIFICATION_UI_MASK) ==
3977 	    ATOM_PPLIB_CLASSIFICATION_UI_PERFORMANCE) {
3978 		rdev->pm.dpm.dyn_state.max_clock_voltage_on_ac.sclk = pl->sclk;
3979 		rdev->pm.dpm.dyn_state.max_clock_voltage_on_ac.mclk = pl->mclk;
3980 		rdev->pm.dpm.dyn_state.max_clock_voltage_on_ac.vddc = pl->vddc;
3981 		rdev->pm.dpm.dyn_state.max_clock_voltage_on_ac.vddci = pl->vddci;
3982 	}
3983 }
3984 
ni_parse_power_table(struct radeon_device * rdev)3985 static int ni_parse_power_table(struct radeon_device *rdev)
3986 {
3987 	struct radeon_mode_info *mode_info = &rdev->mode_info;
3988 	struct _ATOM_PPLIB_NONCLOCK_INFO *non_clock_info;
3989 	union pplib_power_state *power_state;
3990 	int i, j;
3991 	union pplib_clock_info *clock_info;
3992 	union power_info *power_info;
3993 	int index = GetIndexIntoMasterTable(DATA, PowerPlayInfo);
3994 	u16 data_offset;
3995 	u8 frev, crev;
3996 	struct ni_ps *ps;
3997 
3998 	if (!atom_parse_data_header(mode_info->atom_context, index, NULL,
3999 				   &frev, &crev, &data_offset))
4000 		return -EINVAL;
4001 	power_info = (union power_info *)(mode_info->atom_context->bios + data_offset);
4002 
4003 	rdev->pm.dpm.ps = kcalloc(power_info->pplib.ucNumStates,
4004 				  sizeof(struct radeon_ps),
4005 				  GFP_KERNEL);
4006 	if (!rdev->pm.dpm.ps)
4007 		return -ENOMEM;
4008 
4009 	for (i = 0; i < power_info->pplib.ucNumStates; i++) {
4010 		power_state = (union pplib_power_state *)
4011 			(mode_info->atom_context->bios + data_offset +
4012 			 le16_to_cpu(power_info->pplib.usStateArrayOffset) +
4013 			 i * power_info->pplib.ucStateEntrySize);
4014 		non_clock_info = (struct _ATOM_PPLIB_NONCLOCK_INFO *)
4015 			(mode_info->atom_context->bios + data_offset +
4016 			 le16_to_cpu(power_info->pplib.usNonClockInfoArrayOffset) +
4017 			 (power_state->v1.ucNonClockStateIndex *
4018 			  power_info->pplib.ucNonClockSize));
4019 		if (power_info->pplib.ucStateEntrySize - 1) {
4020 			u8 *idx;
4021 			ps = kzalloc(sizeof(struct ni_ps), GFP_KERNEL);
4022 			if (ps == NULL) {
4023 				kfree(rdev->pm.dpm.ps);
4024 				return -ENOMEM;
4025 			}
4026 			rdev->pm.dpm.ps[i].ps_priv = ps;
4027 			ni_parse_pplib_non_clock_info(rdev, &rdev->pm.dpm.ps[i],
4028 							 non_clock_info,
4029 							 power_info->pplib.ucNonClockSize);
4030 			idx = (u8 *)&power_state->v1.ucClockStateIndices[0];
4031 			for (j = 0; j < (power_info->pplib.ucStateEntrySize - 1); j++) {
4032 				clock_info = (union pplib_clock_info *)
4033 					(mode_info->atom_context->bios + data_offset +
4034 					 le16_to_cpu(power_info->pplib.usClockInfoArrayOffset) +
4035 					 (idx[j] * power_info->pplib.ucClockInfoSize));
4036 				ni_parse_pplib_clock_info(rdev,
4037 							  &rdev->pm.dpm.ps[i], j,
4038 							  clock_info);
4039 			}
4040 		}
4041 	}
4042 	rdev->pm.dpm.num_ps = power_info->pplib.ucNumStates;
4043 	return 0;
4044 }
4045 
ni_dpm_init(struct radeon_device * rdev)4046 int ni_dpm_init(struct radeon_device *rdev)
4047 {
4048 	struct rv7xx_power_info *pi;
4049 	struct evergreen_power_info *eg_pi;
4050 	struct ni_power_info *ni_pi;
4051 	struct atom_clock_dividers dividers;
4052 	int ret;
4053 
4054 	ni_pi = kzalloc(sizeof(struct ni_power_info), GFP_KERNEL);
4055 	if (ni_pi == NULL)
4056 		return -ENOMEM;
4057 	rdev->pm.dpm.priv = ni_pi;
4058 	eg_pi = &ni_pi->eg;
4059 	pi = &eg_pi->rv7xx;
4060 
4061 	rv770_get_max_vddc(rdev);
4062 
4063 	eg_pi->ulv.supported = false;
4064 	pi->acpi_vddc = 0;
4065 	eg_pi->acpi_vddci = 0;
4066 	pi->min_vddc_in_table = 0;
4067 	pi->max_vddc_in_table = 0;
4068 
4069 	ret = r600_get_platform_caps(rdev);
4070 	if (ret)
4071 		return ret;
4072 
4073 	ret = ni_parse_power_table(rdev);
4074 	if (ret)
4075 		return ret;
4076 	ret = r600_parse_extended_power_table(rdev);
4077 	if (ret)
4078 		return ret;
4079 
4080 	rdev->pm.dpm.dyn_state.vddc_dependency_on_dispclk.entries =
4081 		kcalloc(4,
4082 			sizeof(struct radeon_clock_voltage_dependency_entry),
4083 			GFP_KERNEL);
4084 	if (!rdev->pm.dpm.dyn_state.vddc_dependency_on_dispclk.entries) {
4085 		r600_free_extended_power_table(rdev);
4086 		return -ENOMEM;
4087 	}
4088 	rdev->pm.dpm.dyn_state.vddc_dependency_on_dispclk.count = 4;
4089 	rdev->pm.dpm.dyn_state.vddc_dependency_on_dispclk.entries[0].clk = 0;
4090 	rdev->pm.dpm.dyn_state.vddc_dependency_on_dispclk.entries[0].v = 0;
4091 	rdev->pm.dpm.dyn_state.vddc_dependency_on_dispclk.entries[1].clk = 36000;
4092 	rdev->pm.dpm.dyn_state.vddc_dependency_on_dispclk.entries[1].v = 720;
4093 	rdev->pm.dpm.dyn_state.vddc_dependency_on_dispclk.entries[2].clk = 54000;
4094 	rdev->pm.dpm.dyn_state.vddc_dependency_on_dispclk.entries[2].v = 810;
4095 	rdev->pm.dpm.dyn_state.vddc_dependency_on_dispclk.entries[3].clk = 72000;
4096 	rdev->pm.dpm.dyn_state.vddc_dependency_on_dispclk.entries[3].v = 900;
4097 
4098 	ni_patch_dependency_tables_based_on_leakage(rdev);
4099 
4100 	if (rdev->pm.dpm.voltage_response_time == 0)
4101 		rdev->pm.dpm.voltage_response_time = R600_VOLTAGERESPONSETIME_DFLT;
4102 	if (rdev->pm.dpm.backbias_response_time == 0)
4103 		rdev->pm.dpm.backbias_response_time = R600_BACKBIASRESPONSETIME_DFLT;
4104 
4105 	ret = radeon_atom_get_clock_dividers(rdev, COMPUTE_ENGINE_PLL_PARAM,
4106 					     0, false, &dividers);
4107 	if (ret)
4108 		pi->ref_div = dividers.ref_div + 1;
4109 	else
4110 		pi->ref_div = R600_REFERENCEDIVIDER_DFLT;
4111 
4112 	pi->rlp = RV770_RLP_DFLT;
4113 	pi->rmp = RV770_RMP_DFLT;
4114 	pi->lhp = RV770_LHP_DFLT;
4115 	pi->lmp = RV770_LMP_DFLT;
4116 
4117 	eg_pi->ats[0].rlp = RV770_RLP_DFLT;
4118 	eg_pi->ats[0].rmp = RV770_RMP_DFLT;
4119 	eg_pi->ats[0].lhp = RV770_LHP_DFLT;
4120 	eg_pi->ats[0].lmp = RV770_LMP_DFLT;
4121 
4122 	eg_pi->ats[1].rlp = BTC_RLP_UVD_DFLT;
4123 	eg_pi->ats[1].rmp = BTC_RMP_UVD_DFLT;
4124 	eg_pi->ats[1].lhp = BTC_LHP_UVD_DFLT;
4125 	eg_pi->ats[1].lmp = BTC_LMP_UVD_DFLT;
4126 
4127 	eg_pi->smu_uvd_hs = true;
4128 
4129 	if (rdev->pdev->device == 0x6707) {
4130 		pi->mclk_strobe_mode_threshold = 55000;
4131 		pi->mclk_edc_enable_threshold = 55000;
4132 		eg_pi->mclk_edc_wr_enable_threshold = 55000;
4133 	} else {
4134 		pi->mclk_strobe_mode_threshold = 40000;
4135 		pi->mclk_edc_enable_threshold = 40000;
4136 		eg_pi->mclk_edc_wr_enable_threshold = 40000;
4137 	}
4138 	ni_pi->mclk_rtt_mode_threshold = eg_pi->mclk_edc_wr_enable_threshold;
4139 
4140 	pi->voltage_control =
4141 		radeon_atom_is_voltage_gpio(rdev, SET_VOLTAGE_TYPE_ASIC_VDDC, 0);
4142 
4143 	pi->mvdd_control =
4144 		radeon_atom_is_voltage_gpio(rdev, SET_VOLTAGE_TYPE_ASIC_MVDDC, 0);
4145 
4146 	eg_pi->vddci_control =
4147 		radeon_atom_is_voltage_gpio(rdev, SET_VOLTAGE_TYPE_ASIC_VDDCI, 0);
4148 
4149 	rv770_get_engine_memory_ss(rdev);
4150 
4151 	pi->asi = RV770_ASI_DFLT;
4152 	pi->pasi = CYPRESS_HASI_DFLT;
4153 	pi->vrc = CYPRESS_VRC_DFLT;
4154 
4155 	pi->power_gating = false;
4156 
4157 	pi->gfx_clock_gating = true;
4158 
4159 	pi->mg_clock_gating = true;
4160 	pi->mgcgtssm = true;
4161 	eg_pi->ls_clock_gating = false;
4162 	eg_pi->sclk_deep_sleep = false;
4163 
4164 	pi->dynamic_pcie_gen2 = true;
4165 
4166 	if (rdev->pm.int_thermal_type != THERMAL_TYPE_NONE)
4167 		pi->thermal_protection = true;
4168 	else
4169 		pi->thermal_protection = false;
4170 
4171 	pi->display_gap = true;
4172 
4173 	pi->dcodt = true;
4174 
4175 	pi->ulps = true;
4176 
4177 	eg_pi->dynamic_ac_timing = true;
4178 	eg_pi->abm = true;
4179 	eg_pi->mcls = true;
4180 	eg_pi->light_sleep = true;
4181 	eg_pi->memory_transition = true;
4182 #if defined(CONFIG_ACPI)
4183 	eg_pi->pcie_performance_request =
4184 		radeon_acpi_is_pcie_performance_request_supported(rdev);
4185 #else
4186 	eg_pi->pcie_performance_request = false;
4187 #endif
4188 
4189 	eg_pi->dll_default_on = false;
4190 
4191 	eg_pi->sclk_deep_sleep = false;
4192 
4193 	pi->mclk_stutter_mode_threshold = 0;
4194 
4195 	pi->sram_end = SMC_RAM_END;
4196 
4197 	rdev->pm.dpm.dyn_state.mclk_sclk_ratio = 3;
4198 	rdev->pm.dpm.dyn_state.vddc_vddci_delta = 200;
4199 	rdev->pm.dpm.dyn_state.min_vddc_for_pcie_gen2 = 900;
4200 	rdev->pm.dpm.dyn_state.valid_sclk_values.count = ARRAY_SIZE(btc_valid_sclk);
4201 	rdev->pm.dpm.dyn_state.valid_sclk_values.values = btc_valid_sclk;
4202 	rdev->pm.dpm.dyn_state.valid_mclk_values.count = 0;
4203 	rdev->pm.dpm.dyn_state.valid_mclk_values.values = NULL;
4204 	rdev->pm.dpm.dyn_state.sclk_mclk_delta = 12500;
4205 
4206 	ni_pi->cac_data.leakage_coefficients.at = 516;
4207 	ni_pi->cac_data.leakage_coefficients.bt = 18;
4208 	ni_pi->cac_data.leakage_coefficients.av = 51;
4209 	ni_pi->cac_data.leakage_coefficients.bv = 2957;
4210 
4211 	switch (rdev->pdev->device) {
4212 	case 0x6700:
4213 	case 0x6701:
4214 	case 0x6702:
4215 	case 0x6703:
4216 	case 0x6718:
4217 		ni_pi->cac_weights = &cac_weights_cayman_xt;
4218 		break;
4219 	case 0x6705:
4220 	case 0x6719:
4221 	case 0x671D:
4222 	case 0x671C:
4223 	default:
4224 		ni_pi->cac_weights = &cac_weights_cayman_pro;
4225 		break;
4226 	case 0x6704:
4227 	case 0x6706:
4228 	case 0x6707:
4229 	case 0x6708:
4230 	case 0x6709:
4231 		ni_pi->cac_weights = &cac_weights_cayman_le;
4232 		break;
4233 	}
4234 
4235 	if (ni_pi->cac_weights->enable_power_containment_by_default) {
4236 		ni_pi->enable_power_containment = true;
4237 		ni_pi->enable_cac = true;
4238 		ni_pi->enable_sq_ramping = true;
4239 	} else {
4240 		ni_pi->enable_power_containment = false;
4241 		ni_pi->enable_cac = false;
4242 		ni_pi->enable_sq_ramping = false;
4243 	}
4244 
4245 	ni_pi->driver_calculate_cac_leakage = false;
4246 	ni_pi->cac_configuration_required = true;
4247 
4248 	if (ni_pi->cac_configuration_required) {
4249 		ni_pi->support_cac_long_term_average = true;
4250 		ni_pi->lta_window_size = ni_pi->cac_weights->l2_lta_window_size;
4251 		ni_pi->lts_truncate = ni_pi->cac_weights->lts_truncate;
4252 	} else {
4253 		ni_pi->support_cac_long_term_average = false;
4254 		ni_pi->lta_window_size = 0;
4255 		ni_pi->lts_truncate = 0;
4256 	}
4257 
4258 	ni_pi->use_power_boost_limit = true;
4259 
4260 	/* make sure dc limits are valid */
4261 	if ((rdev->pm.dpm.dyn_state.max_clock_voltage_on_dc.sclk == 0) ||
4262 	    (rdev->pm.dpm.dyn_state.max_clock_voltage_on_dc.mclk == 0))
4263 		rdev->pm.dpm.dyn_state.max_clock_voltage_on_dc =
4264 			rdev->pm.dpm.dyn_state.max_clock_voltage_on_ac;
4265 
4266 	return 0;
4267 }
4268 
ni_dpm_fini(struct radeon_device * rdev)4269 void ni_dpm_fini(struct radeon_device *rdev)
4270 {
4271 	int i;
4272 
4273 	for (i = 0; i < rdev->pm.dpm.num_ps; i++) {
4274 		kfree(rdev->pm.dpm.ps[i].ps_priv);
4275 	}
4276 	kfree(rdev->pm.dpm.ps);
4277 	kfree(rdev->pm.dpm.priv);
4278 	kfree(rdev->pm.dpm.dyn_state.vddc_dependency_on_dispclk.entries);
4279 	r600_free_extended_power_table(rdev);
4280 }
4281 
ni_dpm_print_power_state(struct radeon_device * rdev,struct radeon_ps * rps)4282 void ni_dpm_print_power_state(struct radeon_device *rdev,
4283 			      struct radeon_ps *rps)
4284 {
4285 	struct ni_ps *ps = ni_get_ps(rps);
4286 	struct rv7xx_pl *pl;
4287 	int i;
4288 
4289 	r600_dpm_print_class_info(rps->class, rps->class2);
4290 	r600_dpm_print_cap_info(rps->caps);
4291 	printk("\tuvd    vclk: %d dclk: %d\n", rps->vclk, rps->dclk);
4292 	for (i = 0; i < ps->performance_level_count; i++) {
4293 		pl = &ps->performance_levels[i];
4294 		if (rdev->family >= CHIP_TAHITI)
4295 			printk("\t\tpower level %d    sclk: %u mclk: %u vddc: %u vddci: %u pcie gen: %u\n",
4296 			       i, pl->sclk, pl->mclk, pl->vddc, pl->vddci, pl->pcie_gen + 1);
4297 		else
4298 			printk("\t\tpower level %d    sclk: %u mclk: %u vddc: %u vddci: %u\n",
4299 			       i, pl->sclk, pl->mclk, pl->vddc, pl->vddci);
4300 	}
4301 	r600_dpm_print_ps_status(rdev, rps);
4302 }
4303 
ni_dpm_debugfs_print_current_performance_level(struct radeon_device * rdev,struct seq_file * m)4304 void ni_dpm_debugfs_print_current_performance_level(struct radeon_device *rdev,
4305 						    struct seq_file *m)
4306 {
4307 	struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
4308 	struct radeon_ps *rps = &eg_pi->current_rps;
4309 	struct ni_ps *ps = ni_get_ps(rps);
4310 	struct rv7xx_pl *pl;
4311 	u32 current_index =
4312 		(RREG32(TARGET_AND_CURRENT_PROFILE_INDEX) & CURRENT_STATE_INDEX_MASK) >>
4313 		CURRENT_STATE_INDEX_SHIFT;
4314 
4315 	if (current_index >= ps->performance_level_count) {
4316 		seq_printf(m, "invalid dpm profile %d\n", current_index);
4317 	} else {
4318 		pl = &ps->performance_levels[current_index];
4319 		seq_printf(m, "uvd    vclk: %d dclk: %d\n", rps->vclk, rps->dclk);
4320 		seq_printf(m, "power level %d    sclk: %u mclk: %u vddc: %u vddci: %u\n",
4321 			   current_index, pl->sclk, pl->mclk, pl->vddc, pl->vddci);
4322 	}
4323 }
4324 
ni_dpm_get_current_sclk(struct radeon_device * rdev)4325 u32 ni_dpm_get_current_sclk(struct radeon_device *rdev)
4326 {
4327 	struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
4328 	struct radeon_ps *rps = &eg_pi->current_rps;
4329 	struct ni_ps *ps = ni_get_ps(rps);
4330 	struct rv7xx_pl *pl;
4331 	u32 current_index =
4332 		(RREG32(TARGET_AND_CURRENT_PROFILE_INDEX) & CURRENT_STATE_INDEX_MASK) >>
4333 		CURRENT_STATE_INDEX_SHIFT;
4334 
4335 	if (current_index >= ps->performance_level_count) {
4336 		return 0;
4337 	} else {
4338 		pl = &ps->performance_levels[current_index];
4339 		return pl->sclk;
4340 	}
4341 }
4342 
ni_dpm_get_current_mclk(struct radeon_device * rdev)4343 u32 ni_dpm_get_current_mclk(struct radeon_device *rdev)
4344 {
4345 	struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
4346 	struct radeon_ps *rps = &eg_pi->current_rps;
4347 	struct ni_ps *ps = ni_get_ps(rps);
4348 	struct rv7xx_pl *pl;
4349 	u32 current_index =
4350 		(RREG32(TARGET_AND_CURRENT_PROFILE_INDEX) & CURRENT_STATE_INDEX_MASK) >>
4351 		CURRENT_STATE_INDEX_SHIFT;
4352 
4353 	if (current_index >= ps->performance_level_count) {
4354 		return 0;
4355 	} else {
4356 		pl = &ps->performance_levels[current_index];
4357 		return pl->mclk;
4358 	}
4359 }
4360 
ni_dpm_get_sclk(struct radeon_device * rdev,bool low)4361 u32 ni_dpm_get_sclk(struct radeon_device *rdev, bool low)
4362 {
4363 	struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
4364 	struct ni_ps *requested_state = ni_get_ps(&eg_pi->requested_rps);
4365 
4366 	if (low)
4367 		return requested_state->performance_levels[0].sclk;
4368 	else
4369 		return requested_state->performance_levels[requested_state->performance_level_count - 1].sclk;
4370 }
4371 
ni_dpm_get_mclk(struct radeon_device * rdev,bool low)4372 u32 ni_dpm_get_mclk(struct radeon_device *rdev, bool low)
4373 {
4374 	struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
4375 	struct ni_ps *requested_state = ni_get_ps(&eg_pi->requested_rps);
4376 
4377 	if (low)
4378 		return requested_state->performance_levels[0].mclk;
4379 	else
4380 		return requested_state->performance_levels[requested_state->performance_level_count - 1].mclk;
4381 }
4382 
4383