GNU Linux-libre 5.19-rc6-gnu
[releases.git] / drivers / gpu / drm / radeon / ni_dpm.c
1 /*
2  * Copyright 2012 Advanced Micro Devices, Inc.
3  *
4  * Permission is hereby granted, free of charge, to any person obtaining a
5  * copy of this software and associated documentation files (the "Software"),
6  * to deal in the Software without restriction, including without limitation
7  * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8  * and/or sell copies of the Software, and to permit persons to whom the
9  * Software is furnished to do so, subject to the following conditions:
10  *
11  * The above copyright notice and this permission notice shall be included in
12  * all copies or substantial portions of the Software.
13  *
14  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
15  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
16  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
17  * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
18  * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
19  * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
20  * OTHER DEALINGS IN THE SOFTWARE.
21  *
22  */
23
24 #include <linux/math64.h>
25 #include <linux/pci.h>
26 #include <linux/seq_file.h>
27
28 #include "atom.h"
29 #include "evergreen.h"
30 #include "ni_dpm.h"
31 #include "nid.h"
32 #include "r600_dpm.h"
33 #include "rv770.h"
34 #include "radeon.h"
35 #include "radeon_asic.h"
36
37 #define MC_CG_ARB_FREQ_F0           0x0a
38 #define MC_CG_ARB_FREQ_F1           0x0b
39 #define MC_CG_ARB_FREQ_F2           0x0c
40 #define MC_CG_ARB_FREQ_F3           0x0d
41
42 #define SMC_RAM_END 0xC000
43
44 static const struct ni_cac_weights cac_weights_cayman_xt =
45 {
46         0x15,
47         0x2,
48         0x19,
49         0x2,
50         0x8,
51         0x14,
52         0x2,
53         0x16,
54         0xE,
55         0x17,
56         0x13,
57         0x2B,
58         0x10,
59         0x7,
60         0x5,
61         0x5,
62         0x5,
63         0x2,
64         0x3,
65         0x9,
66         0x10,
67         0x10,
68         0x2B,
69         0xA,
70         0x9,
71         0x4,
72         0xD,
73         0xD,
74         0x3E,
75         0x18,
76         0x14,
77         0,
78         0x3,
79         0x3,
80         0x5,
81         0,
82         0x2,
83         0,
84         0,
85         0,
86         0,
87         0,
88         0,
89         0,
90         0,
91         0,
92         0x1CC,
93         0,
94         0x164,
95         1,
96         1,
97         1,
98         1,
99         12,
100         12,
101         12,
102         0x12,
103         0x1F,
104         132,
105         5,
106         7,
107         0,
108         { 0, 0, 0, 0, 0, 0, 0, 0 },
109         { 0, 0, 0, 0 },
110         true
111 };
112
113 static const struct ni_cac_weights cac_weights_cayman_pro =
114 {
115         0x16,
116         0x4,
117         0x10,
118         0x2,
119         0xA,
120         0x16,
121         0x2,
122         0x18,
123         0x10,
124         0x1A,
125         0x16,
126         0x2D,
127         0x12,
128         0xA,
129         0x6,
130         0x6,
131         0x6,
132         0x2,
133         0x4,
134         0xB,
135         0x11,
136         0x11,
137         0x2D,
138         0xC,
139         0xC,
140         0x7,
141         0x10,
142         0x10,
143         0x3F,
144         0x1A,
145         0x16,
146         0,
147         0x7,
148         0x4,
149         0x6,
150         1,
151         0x2,
152         0x1,
153         0,
154         0,
155         0,
156         0,
157         0,
158         0,
159         0x30,
160         0,
161         0x1CF,
162         0,
163         0x166,
164         1,
165         1,
166         1,
167         1,
168         12,
169         12,
170         12,
171         0x15,
172         0x1F,
173         132,
174         6,
175         6,
176         0,
177         { 0, 0, 0, 0, 0, 0, 0, 0 },
178         { 0, 0, 0, 0 },
179         true
180 };
181
182 static const struct ni_cac_weights cac_weights_cayman_le =
183 {
184         0x7,
185         0xE,
186         0x1,
187         0xA,
188         0x1,
189         0x3F,
190         0x2,
191         0x18,
192         0x10,
193         0x1A,
194         0x1,
195         0x3F,
196         0x1,
197         0xE,
198         0x6,
199         0x6,
200         0x6,
201         0x2,
202         0x4,
203         0x9,
204         0x1A,
205         0x1A,
206         0x2C,
207         0xA,
208         0x11,
209         0x8,
210         0x19,
211         0x19,
212         0x1,
213         0x1,
214         0x1A,
215         0,
216         0x8,
217         0x5,
218         0x8,
219         0x1,
220         0x3,
221         0x1,
222         0,
223         0,
224         0,
225         0,
226         0,
227         0,
228         0x38,
229         0x38,
230         0x239,
231         0x3,
232         0x18A,
233         1,
234         1,
235         1,
236         1,
237         12,
238         12,
239         12,
240         0x15,
241         0x22,
242         132,
243         6,
244         6,
245         0,
246         { 0, 0, 0, 0, 0, 0, 0, 0 },
247         { 0, 0, 0, 0 },
248         true
249 };
250
251 #define NISLANDS_MGCG_SEQUENCE  300
252
253 static const u32 cayman_cgcg_cgls_default[] =
254 {
255         0x000008f8, 0x00000010, 0xffffffff,
256         0x000008fc, 0x00000000, 0xffffffff,
257         0x000008f8, 0x00000011, 0xffffffff,
258         0x000008fc, 0x00000000, 0xffffffff,
259         0x000008f8, 0x00000012, 0xffffffff,
260         0x000008fc, 0x00000000, 0xffffffff,
261         0x000008f8, 0x00000013, 0xffffffff,
262         0x000008fc, 0x00000000, 0xffffffff,
263         0x000008f8, 0x00000014, 0xffffffff,
264         0x000008fc, 0x00000000, 0xffffffff,
265         0x000008f8, 0x00000015, 0xffffffff,
266         0x000008fc, 0x00000000, 0xffffffff,
267         0x000008f8, 0x00000016, 0xffffffff,
268         0x000008fc, 0x00000000, 0xffffffff,
269         0x000008f8, 0x00000017, 0xffffffff,
270         0x000008fc, 0x00000000, 0xffffffff,
271         0x000008f8, 0x00000018, 0xffffffff,
272         0x000008fc, 0x00000000, 0xffffffff,
273         0x000008f8, 0x00000019, 0xffffffff,
274         0x000008fc, 0x00000000, 0xffffffff,
275         0x000008f8, 0x0000001a, 0xffffffff,
276         0x000008fc, 0x00000000, 0xffffffff,
277         0x000008f8, 0x0000001b, 0xffffffff,
278         0x000008fc, 0x00000000, 0xffffffff,
279         0x000008f8, 0x00000020, 0xffffffff,
280         0x000008fc, 0x00000000, 0xffffffff,
281         0x000008f8, 0x00000021, 0xffffffff,
282         0x000008fc, 0x00000000, 0xffffffff,
283         0x000008f8, 0x00000022, 0xffffffff,
284         0x000008fc, 0x00000000, 0xffffffff,
285         0x000008f8, 0x00000023, 0xffffffff,
286         0x000008fc, 0x00000000, 0xffffffff,
287         0x000008f8, 0x00000024, 0xffffffff,
288         0x000008fc, 0x00000000, 0xffffffff,
289         0x000008f8, 0x00000025, 0xffffffff,
290         0x000008fc, 0x00000000, 0xffffffff,
291         0x000008f8, 0x00000026, 0xffffffff,
292         0x000008fc, 0x00000000, 0xffffffff,
293         0x000008f8, 0x00000027, 0xffffffff,
294         0x000008fc, 0x00000000, 0xffffffff,
295         0x000008f8, 0x00000028, 0xffffffff,
296         0x000008fc, 0x00000000, 0xffffffff,
297         0x000008f8, 0x00000029, 0xffffffff,
298         0x000008fc, 0x00000000, 0xffffffff,
299         0x000008f8, 0x0000002a, 0xffffffff,
300         0x000008fc, 0x00000000, 0xffffffff,
301         0x000008f8, 0x0000002b, 0xffffffff,
302         0x000008fc, 0x00000000, 0xffffffff
303 };
304 #define CAYMAN_CGCG_CGLS_DEFAULT_LENGTH sizeof(cayman_cgcg_cgls_default) / (3 * sizeof(u32))
305
306 static const u32 cayman_cgcg_cgls_disable[] =
307 {
308         0x000008f8, 0x00000010, 0xffffffff,
309         0x000008fc, 0xffffffff, 0xffffffff,
310         0x000008f8, 0x00000011, 0xffffffff,
311         0x000008fc, 0xffffffff, 0xffffffff,
312         0x000008f8, 0x00000012, 0xffffffff,
313         0x000008fc, 0xffffffff, 0xffffffff,
314         0x000008f8, 0x00000013, 0xffffffff,
315         0x000008fc, 0xffffffff, 0xffffffff,
316         0x000008f8, 0x00000014, 0xffffffff,
317         0x000008fc, 0xffffffff, 0xffffffff,
318         0x000008f8, 0x00000015, 0xffffffff,
319         0x000008fc, 0xffffffff, 0xffffffff,
320         0x000008f8, 0x00000016, 0xffffffff,
321         0x000008fc, 0xffffffff, 0xffffffff,
322         0x000008f8, 0x00000017, 0xffffffff,
323         0x000008fc, 0xffffffff, 0xffffffff,
324         0x000008f8, 0x00000018, 0xffffffff,
325         0x000008fc, 0xffffffff, 0xffffffff,
326         0x000008f8, 0x00000019, 0xffffffff,
327         0x000008fc, 0xffffffff, 0xffffffff,
328         0x000008f8, 0x0000001a, 0xffffffff,
329         0x000008fc, 0xffffffff, 0xffffffff,
330         0x000008f8, 0x0000001b, 0xffffffff,
331         0x000008fc, 0xffffffff, 0xffffffff,
332         0x000008f8, 0x00000020, 0xffffffff,
333         0x000008fc, 0x00000000, 0xffffffff,
334         0x000008f8, 0x00000021, 0xffffffff,
335         0x000008fc, 0x00000000, 0xffffffff,
336         0x000008f8, 0x00000022, 0xffffffff,
337         0x000008fc, 0x00000000, 0xffffffff,
338         0x000008f8, 0x00000023, 0xffffffff,
339         0x000008fc, 0x00000000, 0xffffffff,
340         0x000008f8, 0x00000024, 0xffffffff,
341         0x000008fc, 0x00000000, 0xffffffff,
342         0x000008f8, 0x00000025, 0xffffffff,
343         0x000008fc, 0x00000000, 0xffffffff,
344         0x000008f8, 0x00000026, 0xffffffff,
345         0x000008fc, 0x00000000, 0xffffffff,
346         0x000008f8, 0x00000027, 0xffffffff,
347         0x000008fc, 0x00000000, 0xffffffff,
348         0x000008f8, 0x00000028, 0xffffffff,
349         0x000008fc, 0x00000000, 0xffffffff,
350         0x000008f8, 0x00000029, 0xffffffff,
351         0x000008fc, 0x00000000, 0xffffffff,
352         0x000008f8, 0x0000002a, 0xffffffff,
353         0x000008fc, 0x00000000, 0xffffffff,
354         0x000008f8, 0x0000002b, 0xffffffff,
355         0x000008fc, 0x00000000, 0xffffffff,
356         0x00000644, 0x000f7902, 0x001f4180,
357         0x00000644, 0x000f3802, 0x001f4180
358 };
359 #define CAYMAN_CGCG_CGLS_DISABLE_LENGTH sizeof(cayman_cgcg_cgls_disable) / (3 * sizeof(u32))
360
361 static const u32 cayman_cgcg_cgls_enable[] =
362 {
363         0x00000644, 0x000f7882, 0x001f4080,
364         0x000008f8, 0x00000010, 0xffffffff,
365         0x000008fc, 0x00000000, 0xffffffff,
366         0x000008f8, 0x00000011, 0xffffffff,
367         0x000008fc, 0x00000000, 0xffffffff,
368         0x000008f8, 0x00000012, 0xffffffff,
369         0x000008fc, 0x00000000, 0xffffffff,
370         0x000008f8, 0x00000013, 0xffffffff,
371         0x000008fc, 0x00000000, 0xffffffff,
372         0x000008f8, 0x00000014, 0xffffffff,
373         0x000008fc, 0x00000000, 0xffffffff,
374         0x000008f8, 0x00000015, 0xffffffff,
375         0x000008fc, 0x00000000, 0xffffffff,
376         0x000008f8, 0x00000016, 0xffffffff,
377         0x000008fc, 0x00000000, 0xffffffff,
378         0x000008f8, 0x00000017, 0xffffffff,
379         0x000008fc, 0x00000000, 0xffffffff,
380         0x000008f8, 0x00000018, 0xffffffff,
381         0x000008fc, 0x00000000, 0xffffffff,
382         0x000008f8, 0x00000019, 0xffffffff,
383         0x000008fc, 0x00000000, 0xffffffff,
384         0x000008f8, 0x0000001a, 0xffffffff,
385         0x000008fc, 0x00000000, 0xffffffff,
386         0x000008f8, 0x0000001b, 0xffffffff,
387         0x000008fc, 0x00000000, 0xffffffff,
388         0x000008f8, 0x00000020, 0xffffffff,
389         0x000008fc, 0xffffffff, 0xffffffff,
390         0x000008f8, 0x00000021, 0xffffffff,
391         0x000008fc, 0xffffffff, 0xffffffff,
392         0x000008f8, 0x00000022, 0xffffffff,
393         0x000008fc, 0xffffffff, 0xffffffff,
394         0x000008f8, 0x00000023, 0xffffffff,
395         0x000008fc, 0xffffffff, 0xffffffff,
396         0x000008f8, 0x00000024, 0xffffffff,
397         0x000008fc, 0xffffffff, 0xffffffff,
398         0x000008f8, 0x00000025, 0xffffffff,
399         0x000008fc, 0xffffffff, 0xffffffff,
400         0x000008f8, 0x00000026, 0xffffffff,
401         0x000008fc, 0xffffffff, 0xffffffff,
402         0x000008f8, 0x00000027, 0xffffffff,
403         0x000008fc, 0xffffffff, 0xffffffff,
404         0x000008f8, 0x00000028, 0xffffffff,
405         0x000008fc, 0xffffffff, 0xffffffff,
406         0x000008f8, 0x00000029, 0xffffffff,
407         0x000008fc, 0xffffffff, 0xffffffff,
408         0x000008f8, 0x0000002a, 0xffffffff,
409         0x000008fc, 0xffffffff, 0xffffffff,
410         0x000008f8, 0x0000002b, 0xffffffff,
411         0x000008fc, 0xffffffff, 0xffffffff
412 };
413 #define CAYMAN_CGCG_CGLS_ENABLE_LENGTH  sizeof(cayman_cgcg_cgls_enable) / (3 * sizeof(u32))
414
415 static const u32 cayman_mgcg_default[] =
416 {
417         0x0000802c, 0xc0000000, 0xffffffff,
418         0x00003fc4, 0xc0000000, 0xffffffff,
419         0x00005448, 0x00000100, 0xffffffff,
420         0x000055e4, 0x00000100, 0xffffffff,
421         0x0000160c, 0x00000100, 0xffffffff,
422         0x00008984, 0x06000100, 0xffffffff,
423         0x0000c164, 0x00000100, 0xffffffff,
424         0x00008a18, 0x00000100, 0xffffffff,
425         0x0000897c, 0x06000100, 0xffffffff,
426         0x00008b28, 0x00000100, 0xffffffff,
427         0x00009144, 0x00800200, 0xffffffff,
428         0x00009a60, 0x00000100, 0xffffffff,
429         0x00009868, 0x00000100, 0xffffffff,
430         0x00008d58, 0x00000100, 0xffffffff,
431         0x00009510, 0x00000100, 0xffffffff,
432         0x0000949c, 0x00000100, 0xffffffff,
433         0x00009654, 0x00000100, 0xffffffff,
434         0x00009030, 0x00000100, 0xffffffff,
435         0x00009034, 0x00000100, 0xffffffff,
436         0x00009038, 0x00000100, 0xffffffff,
437         0x0000903c, 0x00000100, 0xffffffff,
438         0x00009040, 0x00000100, 0xffffffff,
439         0x0000a200, 0x00000100, 0xffffffff,
440         0x0000a204, 0x00000100, 0xffffffff,
441         0x0000a208, 0x00000100, 0xffffffff,
442         0x0000a20c, 0x00000100, 0xffffffff,
443         0x00009744, 0x00000100, 0xffffffff,
444         0x00003f80, 0x00000100, 0xffffffff,
445         0x0000a210, 0x00000100, 0xffffffff,
446         0x0000a214, 0x00000100, 0xffffffff,
447         0x000004d8, 0x00000100, 0xffffffff,
448         0x00009664, 0x00000100, 0xffffffff,
449         0x00009698, 0x00000100, 0xffffffff,
450         0x000004d4, 0x00000200, 0xffffffff,
451         0x000004d0, 0x00000000, 0xffffffff,
452         0x000030cc, 0x00000104, 0xffffffff,
453         0x0000d0c0, 0x00000100, 0xffffffff,
454         0x0000d8c0, 0x00000100, 0xffffffff,
455         0x0000802c, 0x40000000, 0xffffffff,
456         0x00003fc4, 0x40000000, 0xffffffff,
457         0x0000915c, 0x00010000, 0xffffffff,
458         0x00009160, 0x00030002, 0xffffffff,
459         0x00009164, 0x00050004, 0xffffffff,
460         0x00009168, 0x00070006, 0xffffffff,
461         0x00009178, 0x00070000, 0xffffffff,
462         0x0000917c, 0x00030002, 0xffffffff,
463         0x00009180, 0x00050004, 0xffffffff,
464         0x0000918c, 0x00010006, 0xffffffff,
465         0x00009190, 0x00090008, 0xffffffff,
466         0x00009194, 0x00070000, 0xffffffff,
467         0x00009198, 0x00030002, 0xffffffff,
468         0x0000919c, 0x00050004, 0xffffffff,
469         0x000091a8, 0x00010006, 0xffffffff,
470         0x000091ac, 0x00090008, 0xffffffff,
471         0x000091b0, 0x00070000, 0xffffffff,
472         0x000091b4, 0x00030002, 0xffffffff,
473         0x000091b8, 0x00050004, 0xffffffff,
474         0x000091c4, 0x00010006, 0xffffffff,
475         0x000091c8, 0x00090008, 0xffffffff,
476         0x000091cc, 0x00070000, 0xffffffff,
477         0x000091d0, 0x00030002, 0xffffffff,
478         0x000091d4, 0x00050004, 0xffffffff,
479         0x000091e0, 0x00010006, 0xffffffff,
480         0x000091e4, 0x00090008, 0xffffffff,
481         0x000091e8, 0x00000000, 0xffffffff,
482         0x000091ec, 0x00070000, 0xffffffff,
483         0x000091f0, 0x00030002, 0xffffffff,
484         0x000091f4, 0x00050004, 0xffffffff,
485         0x00009200, 0x00010006, 0xffffffff,
486         0x00009204, 0x00090008, 0xffffffff,
487         0x00009208, 0x00070000, 0xffffffff,
488         0x0000920c, 0x00030002, 0xffffffff,
489         0x00009210, 0x00050004, 0xffffffff,
490         0x0000921c, 0x00010006, 0xffffffff,
491         0x00009220, 0x00090008, 0xffffffff,
492         0x00009224, 0x00070000, 0xffffffff,
493         0x00009228, 0x00030002, 0xffffffff,
494         0x0000922c, 0x00050004, 0xffffffff,
495         0x00009238, 0x00010006, 0xffffffff,
496         0x0000923c, 0x00090008, 0xffffffff,
497         0x00009240, 0x00070000, 0xffffffff,
498         0x00009244, 0x00030002, 0xffffffff,
499         0x00009248, 0x00050004, 0xffffffff,
500         0x00009254, 0x00010006, 0xffffffff,
501         0x00009258, 0x00090008, 0xffffffff,
502         0x0000925c, 0x00070000, 0xffffffff,
503         0x00009260, 0x00030002, 0xffffffff,
504         0x00009264, 0x00050004, 0xffffffff,
505         0x00009270, 0x00010006, 0xffffffff,
506         0x00009274, 0x00090008, 0xffffffff,
507         0x00009278, 0x00070000, 0xffffffff,
508         0x0000927c, 0x00030002, 0xffffffff,
509         0x00009280, 0x00050004, 0xffffffff,
510         0x0000928c, 0x00010006, 0xffffffff,
511         0x00009290, 0x00090008, 0xffffffff,
512         0x000092a8, 0x00070000, 0xffffffff,
513         0x000092ac, 0x00030002, 0xffffffff,
514         0x000092b0, 0x00050004, 0xffffffff,
515         0x000092bc, 0x00010006, 0xffffffff,
516         0x000092c0, 0x00090008, 0xffffffff,
517         0x000092c4, 0x00070000, 0xffffffff,
518         0x000092c8, 0x00030002, 0xffffffff,
519         0x000092cc, 0x00050004, 0xffffffff,
520         0x000092d8, 0x00010006, 0xffffffff,
521         0x000092dc, 0x00090008, 0xffffffff,
522         0x00009294, 0x00000000, 0xffffffff,
523         0x0000802c, 0x40010000, 0xffffffff,
524         0x00003fc4, 0x40010000, 0xffffffff,
525         0x0000915c, 0x00010000, 0xffffffff,
526         0x00009160, 0x00030002, 0xffffffff,
527         0x00009164, 0x00050004, 0xffffffff,
528         0x00009168, 0x00070006, 0xffffffff,
529         0x00009178, 0x00070000, 0xffffffff,
530         0x0000917c, 0x00030002, 0xffffffff,
531         0x00009180, 0x00050004, 0xffffffff,
532         0x0000918c, 0x00010006, 0xffffffff,
533         0x00009190, 0x00090008, 0xffffffff,
534         0x00009194, 0x00070000, 0xffffffff,
535         0x00009198, 0x00030002, 0xffffffff,
536         0x0000919c, 0x00050004, 0xffffffff,
537         0x000091a8, 0x00010006, 0xffffffff,
538         0x000091ac, 0x00090008, 0xffffffff,
539         0x000091b0, 0x00070000, 0xffffffff,
540         0x000091b4, 0x00030002, 0xffffffff,
541         0x000091b8, 0x00050004, 0xffffffff,
542         0x000091c4, 0x00010006, 0xffffffff,
543         0x000091c8, 0x00090008, 0xffffffff,
544         0x000091cc, 0x00070000, 0xffffffff,
545         0x000091d0, 0x00030002, 0xffffffff,
546         0x000091d4, 0x00050004, 0xffffffff,
547         0x000091e0, 0x00010006, 0xffffffff,
548         0x000091e4, 0x00090008, 0xffffffff,
549         0x000091e8, 0x00000000, 0xffffffff,
550         0x000091ec, 0x00070000, 0xffffffff,
551         0x000091f0, 0x00030002, 0xffffffff,
552         0x000091f4, 0x00050004, 0xffffffff,
553         0x00009200, 0x00010006, 0xffffffff,
554         0x00009204, 0x00090008, 0xffffffff,
555         0x00009208, 0x00070000, 0xffffffff,
556         0x0000920c, 0x00030002, 0xffffffff,
557         0x00009210, 0x00050004, 0xffffffff,
558         0x0000921c, 0x00010006, 0xffffffff,
559         0x00009220, 0x00090008, 0xffffffff,
560         0x00009224, 0x00070000, 0xffffffff,
561         0x00009228, 0x00030002, 0xffffffff,
562         0x0000922c, 0x00050004, 0xffffffff,
563         0x00009238, 0x00010006, 0xffffffff,
564         0x0000923c, 0x00090008, 0xffffffff,
565         0x00009240, 0x00070000, 0xffffffff,
566         0x00009244, 0x00030002, 0xffffffff,
567         0x00009248, 0x00050004, 0xffffffff,
568         0x00009254, 0x00010006, 0xffffffff,
569         0x00009258, 0x00090008, 0xffffffff,
570         0x0000925c, 0x00070000, 0xffffffff,
571         0x00009260, 0x00030002, 0xffffffff,
572         0x00009264, 0x00050004, 0xffffffff,
573         0x00009270, 0x00010006, 0xffffffff,
574         0x00009274, 0x00090008, 0xffffffff,
575         0x00009278, 0x00070000, 0xffffffff,
576         0x0000927c, 0x00030002, 0xffffffff,
577         0x00009280, 0x00050004, 0xffffffff,
578         0x0000928c, 0x00010006, 0xffffffff,
579         0x00009290, 0x00090008, 0xffffffff,
580         0x000092a8, 0x00070000, 0xffffffff,
581         0x000092ac, 0x00030002, 0xffffffff,
582         0x000092b0, 0x00050004, 0xffffffff,
583         0x000092bc, 0x00010006, 0xffffffff,
584         0x000092c0, 0x00090008, 0xffffffff,
585         0x000092c4, 0x00070000, 0xffffffff,
586         0x000092c8, 0x00030002, 0xffffffff,
587         0x000092cc, 0x00050004, 0xffffffff,
588         0x000092d8, 0x00010006, 0xffffffff,
589         0x000092dc, 0x00090008, 0xffffffff,
590         0x00009294, 0x00000000, 0xffffffff,
591         0x0000802c, 0xc0000000, 0xffffffff,
592         0x00003fc4, 0xc0000000, 0xffffffff,
593         0x000008f8, 0x00000010, 0xffffffff,
594         0x000008fc, 0x00000000, 0xffffffff,
595         0x000008f8, 0x00000011, 0xffffffff,
596         0x000008fc, 0x00000000, 0xffffffff,
597         0x000008f8, 0x00000012, 0xffffffff,
598         0x000008fc, 0x00000000, 0xffffffff,
599         0x000008f8, 0x00000013, 0xffffffff,
600         0x000008fc, 0x00000000, 0xffffffff,
601         0x000008f8, 0x00000014, 0xffffffff,
602         0x000008fc, 0x00000000, 0xffffffff,
603         0x000008f8, 0x00000015, 0xffffffff,
604         0x000008fc, 0x00000000, 0xffffffff,
605         0x000008f8, 0x00000016, 0xffffffff,
606         0x000008fc, 0x00000000, 0xffffffff,
607         0x000008f8, 0x00000017, 0xffffffff,
608         0x000008fc, 0x00000000, 0xffffffff,
609         0x000008f8, 0x00000018, 0xffffffff,
610         0x000008fc, 0x00000000, 0xffffffff,
611         0x000008f8, 0x00000019, 0xffffffff,
612         0x000008fc, 0x00000000, 0xffffffff,
613         0x000008f8, 0x0000001a, 0xffffffff,
614         0x000008fc, 0x00000000, 0xffffffff,
615         0x000008f8, 0x0000001b, 0xffffffff,
616         0x000008fc, 0x00000000, 0xffffffff
617 };
618 #define CAYMAN_MGCG_DEFAULT_LENGTH sizeof(cayman_mgcg_default) / (3 * sizeof(u32))
619
620 static const u32 cayman_mgcg_disable[] =
621 {
622         0x0000802c, 0xc0000000, 0xffffffff,
623         0x000008f8, 0x00000000, 0xffffffff,
624         0x000008fc, 0xffffffff, 0xffffffff,
625         0x000008f8, 0x00000001, 0xffffffff,
626         0x000008fc, 0xffffffff, 0xffffffff,
627         0x000008f8, 0x00000002, 0xffffffff,
628         0x000008fc, 0xffffffff, 0xffffffff,
629         0x000008f8, 0x00000003, 0xffffffff,
630         0x000008fc, 0xffffffff, 0xffffffff,
631         0x00009150, 0x00600000, 0xffffffff
632 };
633 #define CAYMAN_MGCG_DISABLE_LENGTH   sizeof(cayman_mgcg_disable) / (3 * sizeof(u32))
634
635 static const u32 cayman_mgcg_enable[] =
636 {
637         0x0000802c, 0xc0000000, 0xffffffff,
638         0x000008f8, 0x00000000, 0xffffffff,
639         0x000008fc, 0x00000000, 0xffffffff,
640         0x000008f8, 0x00000001, 0xffffffff,
641         0x000008fc, 0x00000000, 0xffffffff,
642         0x000008f8, 0x00000002, 0xffffffff,
643         0x000008fc, 0x00600000, 0xffffffff,
644         0x000008f8, 0x00000003, 0xffffffff,
645         0x000008fc, 0x00000000, 0xffffffff,
646         0x00009150, 0x96944200, 0xffffffff
647 };
648
649 #define CAYMAN_MGCG_ENABLE_LENGTH   sizeof(cayman_mgcg_enable) / (3 * sizeof(u32))
650
651 #define NISLANDS_SYSLS_SEQUENCE  100
652
653 static const u32 cayman_sysls_default[] =
654 {
655         /* Register,   Value,     Mask bits */
656         0x000055e8, 0x00000000, 0xffffffff,
657         0x0000d0bc, 0x00000000, 0xffffffff,
658         0x0000d8bc, 0x00000000, 0xffffffff,
659         0x000015c0, 0x000c1401, 0xffffffff,
660         0x0000264c, 0x000c0400, 0xffffffff,
661         0x00002648, 0x000c0400, 0xffffffff,
662         0x00002650, 0x000c0400, 0xffffffff,
663         0x000020b8, 0x000c0400, 0xffffffff,
664         0x000020bc, 0x000c0400, 0xffffffff,
665         0x000020c0, 0x000c0c80, 0xffffffff,
666         0x0000f4a0, 0x000000c0, 0xffffffff,
667         0x0000f4a4, 0x00680fff, 0xffffffff,
668         0x00002f50, 0x00000404, 0xffffffff,
669         0x000004c8, 0x00000001, 0xffffffff,
670         0x000064ec, 0x00000000, 0xffffffff,
671         0x00000c7c, 0x00000000, 0xffffffff,
672         0x00008dfc, 0x00000000, 0xffffffff
673 };
674 #define CAYMAN_SYSLS_DEFAULT_LENGTH sizeof(cayman_sysls_default) / (3 * sizeof(u32))
675
676 static const u32 cayman_sysls_disable[] =
677 {
678         /* Register,   Value,     Mask bits */
679         0x0000d0c0, 0x00000000, 0xffffffff,
680         0x0000d8c0, 0x00000000, 0xffffffff,
681         0x000055e8, 0x00000000, 0xffffffff,
682         0x0000d0bc, 0x00000000, 0xffffffff,
683         0x0000d8bc, 0x00000000, 0xffffffff,
684         0x000015c0, 0x00041401, 0xffffffff,
685         0x0000264c, 0x00040400, 0xffffffff,
686         0x00002648, 0x00040400, 0xffffffff,
687         0x00002650, 0x00040400, 0xffffffff,
688         0x000020b8, 0x00040400, 0xffffffff,
689         0x000020bc, 0x00040400, 0xffffffff,
690         0x000020c0, 0x00040c80, 0xffffffff,
691         0x0000f4a0, 0x000000c0, 0xffffffff,
692         0x0000f4a4, 0x00680000, 0xffffffff,
693         0x00002f50, 0x00000404, 0xffffffff,
694         0x000004c8, 0x00000001, 0xffffffff,
695         0x000064ec, 0x00007ffd, 0xffffffff,
696         0x00000c7c, 0x0000ff00, 0xffffffff,
697         0x00008dfc, 0x0000007f, 0xffffffff
698 };
699 #define CAYMAN_SYSLS_DISABLE_LENGTH sizeof(cayman_sysls_disable) / (3 * sizeof(u32))
700
701 static const u32 cayman_sysls_enable[] =
702 {
703         /* Register,   Value,     Mask bits */
704         0x000055e8, 0x00000001, 0xffffffff,
705         0x0000d0bc, 0x00000100, 0xffffffff,
706         0x0000d8bc, 0x00000100, 0xffffffff,
707         0x000015c0, 0x000c1401, 0xffffffff,
708         0x0000264c, 0x000c0400, 0xffffffff,
709         0x00002648, 0x000c0400, 0xffffffff,
710         0x00002650, 0x000c0400, 0xffffffff,
711         0x000020b8, 0x000c0400, 0xffffffff,
712         0x000020bc, 0x000c0400, 0xffffffff,
713         0x000020c0, 0x000c0c80, 0xffffffff,
714         0x0000f4a0, 0x000000c0, 0xffffffff,
715         0x0000f4a4, 0x00680fff, 0xffffffff,
716         0x00002f50, 0x00000903, 0xffffffff,
717         0x000004c8, 0x00000000, 0xffffffff,
718         0x000064ec, 0x00000000, 0xffffffff,
719         0x00000c7c, 0x00000000, 0xffffffff,
720         0x00008dfc, 0x00000000, 0xffffffff
721 };
722 #define CAYMAN_SYSLS_ENABLE_LENGTH sizeof(cayman_sysls_enable) / (3 * sizeof(u32))
723
724 extern int ni_mc_load_microcode(struct radeon_device *rdev);
725
726 struct ni_power_info *ni_get_pi(struct radeon_device *rdev)
727 {
728         struct ni_power_info *pi = rdev->pm.dpm.priv;
729
730         return pi;
731 }
732
733 struct ni_ps *ni_get_ps(struct radeon_ps *rps)
734 {
735         struct ni_ps *ps = rps->ps_priv;
736
737         return ps;
738 }
739
740 static void ni_calculate_leakage_for_v_and_t_formula(const struct ni_leakage_coeffients *coeff,
741                                                      u16 v, s32 t,
742                                                      u32 ileakage,
743                                                      u32 *leakage)
744 {
745         s64 kt, kv, leakage_w, i_leakage, vddc, temperature;
746
747         i_leakage = div64_s64(drm_int2fixp(ileakage), 1000);
748         vddc = div64_s64(drm_int2fixp(v), 1000);
749         temperature = div64_s64(drm_int2fixp(t), 1000);
750
751         kt = drm_fixp_mul(div64_s64(drm_int2fixp(coeff->at), 1000),
752                           drm_fixp_exp(drm_fixp_mul(div64_s64(drm_int2fixp(coeff->bt), 1000), temperature)));
753         kv = drm_fixp_mul(div64_s64(drm_int2fixp(coeff->av), 1000),
754                           drm_fixp_exp(drm_fixp_mul(div64_s64(drm_int2fixp(coeff->bv), 1000), vddc)));
755
756         leakage_w = drm_fixp_mul(drm_fixp_mul(drm_fixp_mul(i_leakage, kt), kv), vddc);
757
758         *leakage = drm_fixp2int(leakage_w * 1000);
759 }
760
761 static void ni_calculate_leakage_for_v_and_t(struct radeon_device *rdev,
762                                              const struct ni_leakage_coeffients *coeff,
763                                              u16 v,
764                                              s32 t,
765                                              u32 i_leakage,
766                                              u32 *leakage)
767 {
768         ni_calculate_leakage_for_v_and_t_formula(coeff, v, t, i_leakage, leakage);
769 }
770
771 bool ni_dpm_vblank_too_short(struct radeon_device *rdev)
772 {
773         struct rv7xx_power_info *pi = rv770_get_pi(rdev);
774         u32 vblank_time = r600_dpm_get_vblank_time(rdev);
775         /* we never hit the non-gddr5 limit so disable it */
776         u32 switch_limit = pi->mem_gddr5 ? 450 : 0;
777
778         if (vblank_time < switch_limit)
779                 return true;
780         else
781                 return false;
782
783 }
784
785 static void ni_apply_state_adjust_rules(struct radeon_device *rdev,
786                                         struct radeon_ps *rps)
787 {
788         struct ni_ps *ps = ni_get_ps(rps);
789         struct radeon_clock_and_voltage_limits *max_limits;
790         bool disable_mclk_switching;
791         u32 mclk;
792         u16 vddci;
793         int i;
794
795         if ((rdev->pm.dpm.new_active_crtc_count > 1) ||
796             ni_dpm_vblank_too_short(rdev))
797                 disable_mclk_switching = true;
798         else
799                 disable_mclk_switching = false;
800
801         if (rdev->pm.dpm.ac_power)
802                 max_limits = &rdev->pm.dpm.dyn_state.max_clock_voltage_on_ac;
803         else
804                 max_limits = &rdev->pm.dpm.dyn_state.max_clock_voltage_on_dc;
805
806         if (rdev->pm.dpm.ac_power == false) {
807                 for (i = 0; i < ps->performance_level_count; i++) {
808                         if (ps->performance_levels[i].mclk > max_limits->mclk)
809                                 ps->performance_levels[i].mclk = max_limits->mclk;
810                         if (ps->performance_levels[i].sclk > max_limits->sclk)
811                                 ps->performance_levels[i].sclk = max_limits->sclk;
812                         if (ps->performance_levels[i].vddc > max_limits->vddc)
813                                 ps->performance_levels[i].vddc = max_limits->vddc;
814                         if (ps->performance_levels[i].vddci > max_limits->vddci)
815                                 ps->performance_levels[i].vddci = max_limits->vddci;
816                 }
817         }
818
819         /* XXX validate the min clocks required for display */
820
821         /* adjust low state */
822         if (disable_mclk_switching) {
823                 ps->performance_levels[0].mclk =
824                         ps->performance_levels[ps->performance_level_count - 1].mclk;
825                 ps->performance_levels[0].vddci =
826                         ps->performance_levels[ps->performance_level_count - 1].vddci;
827         }
828
829         btc_skip_blacklist_clocks(rdev, max_limits->sclk, max_limits->mclk,
830                                   &ps->performance_levels[0].sclk,
831                                   &ps->performance_levels[0].mclk);
832
833         for (i = 1; i < ps->performance_level_count; i++) {
834                 if (ps->performance_levels[i].sclk < ps->performance_levels[i - 1].sclk)
835                         ps->performance_levels[i].sclk = ps->performance_levels[i - 1].sclk;
836                 if (ps->performance_levels[i].vddc < ps->performance_levels[i - 1].vddc)
837                         ps->performance_levels[i].vddc = ps->performance_levels[i - 1].vddc;
838         }
839
840         /* adjust remaining states */
841         if (disable_mclk_switching) {
842                 mclk = ps->performance_levels[0].mclk;
843                 vddci = ps->performance_levels[0].vddci;
844                 for (i = 1; i < ps->performance_level_count; i++) {
845                         if (mclk < ps->performance_levels[i].mclk)
846                                 mclk = ps->performance_levels[i].mclk;
847                         if (vddci < ps->performance_levels[i].vddci)
848                                 vddci = ps->performance_levels[i].vddci;
849                 }
850                 for (i = 0; i < ps->performance_level_count; i++) {
851                         ps->performance_levels[i].mclk = mclk;
852                         ps->performance_levels[i].vddci = vddci;
853                 }
854         } else {
855                 for (i = 1; i < ps->performance_level_count; i++) {
856                         if (ps->performance_levels[i].mclk < ps->performance_levels[i - 1].mclk)
857                                 ps->performance_levels[i].mclk = ps->performance_levels[i - 1].mclk;
858                         if (ps->performance_levels[i].vddci < ps->performance_levels[i - 1].vddci)
859                                 ps->performance_levels[i].vddci = ps->performance_levels[i - 1].vddci;
860                 }
861         }
862
863         for (i = 1; i < ps->performance_level_count; i++)
864                 btc_skip_blacklist_clocks(rdev, max_limits->sclk, max_limits->mclk,
865                                           &ps->performance_levels[i].sclk,
866                                           &ps->performance_levels[i].mclk);
867
868         for (i = 0; i < ps->performance_level_count; i++)
869                 btc_adjust_clock_combinations(rdev, max_limits,
870                                               &ps->performance_levels[i]);
871
872         for (i = 0; i < ps->performance_level_count; i++) {
873                 btc_apply_voltage_dependency_rules(&rdev->pm.dpm.dyn_state.vddc_dependency_on_sclk,
874                                                    ps->performance_levels[i].sclk,
875                                                    max_limits->vddc,  &ps->performance_levels[i].vddc);
876                 btc_apply_voltage_dependency_rules(&rdev->pm.dpm.dyn_state.vddci_dependency_on_mclk,
877                                                    ps->performance_levels[i].mclk,
878                                                    max_limits->vddci, &ps->performance_levels[i].vddci);
879                 btc_apply_voltage_dependency_rules(&rdev->pm.dpm.dyn_state.vddc_dependency_on_mclk,
880                                                    ps->performance_levels[i].mclk,
881                                                    max_limits->vddc,  &ps->performance_levels[i].vddc);
882                 btc_apply_voltage_dependency_rules(&rdev->pm.dpm.dyn_state.vddc_dependency_on_dispclk,
883                                                    rdev->clock.current_dispclk,
884                                                    max_limits->vddc,  &ps->performance_levels[i].vddc);
885         }
886
887         for (i = 0; i < ps->performance_level_count; i++) {
888                 btc_apply_voltage_delta_rules(rdev,
889                                               max_limits->vddc, max_limits->vddci,
890                                               &ps->performance_levels[i].vddc,
891                                               &ps->performance_levels[i].vddci);
892         }
893
894         ps->dc_compatible = true;
895         for (i = 0; i < ps->performance_level_count; i++) {
896                 if (ps->performance_levels[i].vddc > rdev->pm.dpm.dyn_state.max_clock_voltage_on_dc.vddc)
897                         ps->dc_compatible = false;
898
899                 if (ps->performance_levels[i].vddc < rdev->pm.dpm.dyn_state.min_vddc_for_pcie_gen2)
900                         ps->performance_levels[i].flags &= ~ATOM_PPLIB_R600_FLAGS_PCIEGEN2;
901         }
902 }
903
904 static void ni_cg_clockgating_default(struct radeon_device *rdev)
905 {
906         u32 count;
907         const u32 *ps = NULL;
908
909         ps = (const u32 *)&cayman_cgcg_cgls_default;
910         count = CAYMAN_CGCG_CGLS_DEFAULT_LENGTH;
911
912         btc_program_mgcg_hw_sequence(rdev, ps, count);
913 }
914
915 static void ni_gfx_clockgating_enable(struct radeon_device *rdev,
916                                       bool enable)
917 {
918         u32 count;
919         const u32 *ps = NULL;
920
921         if (enable) {
922                 ps = (const u32 *)&cayman_cgcg_cgls_enable;
923                 count = CAYMAN_CGCG_CGLS_ENABLE_LENGTH;
924         } else {
925                 ps = (const u32 *)&cayman_cgcg_cgls_disable;
926                 count = CAYMAN_CGCG_CGLS_DISABLE_LENGTH;
927         }
928
929         btc_program_mgcg_hw_sequence(rdev, ps, count);
930 }
931
932 static void ni_mg_clockgating_default(struct radeon_device *rdev)
933 {
934         u32 count;
935         const u32 *ps = NULL;
936
937         ps = (const u32 *)&cayman_mgcg_default;
938         count = CAYMAN_MGCG_DEFAULT_LENGTH;
939
940         btc_program_mgcg_hw_sequence(rdev, ps, count);
941 }
942
943 static void ni_mg_clockgating_enable(struct radeon_device *rdev,
944                                      bool enable)
945 {
946         u32 count;
947         const u32 *ps = NULL;
948
949         if (enable) {
950                 ps = (const u32 *)&cayman_mgcg_enable;
951                 count = CAYMAN_MGCG_ENABLE_LENGTH;
952         } else {
953                 ps = (const u32 *)&cayman_mgcg_disable;
954                 count = CAYMAN_MGCG_DISABLE_LENGTH;
955         }
956
957         btc_program_mgcg_hw_sequence(rdev, ps, count);
958 }
959
960 static void ni_ls_clockgating_default(struct radeon_device *rdev)
961 {
962         u32 count;
963         const u32 *ps = NULL;
964
965         ps = (const u32 *)&cayman_sysls_default;
966         count = CAYMAN_SYSLS_DEFAULT_LENGTH;
967
968         btc_program_mgcg_hw_sequence(rdev, ps, count);
969 }
970
971 static void ni_ls_clockgating_enable(struct radeon_device *rdev,
972                                      bool enable)
973 {
974         u32 count;
975         const u32 *ps = NULL;
976
977         if (enable) {
978                 ps = (const u32 *)&cayman_sysls_enable;
979                 count = CAYMAN_SYSLS_ENABLE_LENGTH;
980         } else {
981                 ps = (const u32 *)&cayman_sysls_disable;
982                 count = CAYMAN_SYSLS_DISABLE_LENGTH;
983         }
984
985         btc_program_mgcg_hw_sequence(rdev, ps, count);
986
987 }
988
989 static int ni_patch_single_dependency_table_based_on_leakage(struct radeon_device *rdev,
990                                                              struct radeon_clock_voltage_dependency_table *table)
991 {
992         struct rv7xx_power_info *pi = rv770_get_pi(rdev);
993         u32 i;
994
995         if (table) {
996                 for (i = 0; i < table->count; i++) {
997                         if (0xff01 == table->entries[i].v) {
998                                 if (pi->max_vddc == 0)
999                                         return -EINVAL;
1000                                 table->entries[i].v = pi->max_vddc;
1001                         }
1002                 }
1003         }
1004         return 0;
1005 }
1006
1007 static int ni_patch_dependency_tables_based_on_leakage(struct radeon_device *rdev)
1008 {
1009         int ret = 0;
1010
1011         ret = ni_patch_single_dependency_table_based_on_leakage(rdev,
1012                                                                 &rdev->pm.dpm.dyn_state.vddc_dependency_on_sclk);
1013
1014         ret = ni_patch_single_dependency_table_based_on_leakage(rdev,
1015                                                                 &rdev->pm.dpm.dyn_state.vddc_dependency_on_mclk);
1016         return ret;
1017 }
1018
1019 static void ni_stop_dpm(struct radeon_device *rdev)
1020 {
1021         WREG32_P(GENERAL_PWRMGT, 0, ~GLOBAL_PWRMGT_EN);
1022 }
1023
1024 #if 0
1025 static int ni_notify_hw_of_power_source(struct radeon_device *rdev,
1026                                         bool ac_power)
1027 {
1028         if (ac_power)
1029                 return (rv770_send_msg_to_smc(rdev, PPSMC_MSG_RunningOnAC) == PPSMC_Result_OK) ?
1030                         0 : -EINVAL;
1031
1032         return 0;
1033 }
1034 #endif
1035
1036 static PPSMC_Result ni_send_msg_to_smc_with_parameter(struct radeon_device *rdev,
1037                                                       PPSMC_Msg msg, u32 parameter)
1038 {
1039         WREG32(SMC_SCRATCH0, parameter);
1040         return rv770_send_msg_to_smc(rdev, msg);
1041 }
1042
1043 static int ni_restrict_performance_levels_before_switch(struct radeon_device *rdev)
1044 {
1045         if (rv770_send_msg_to_smc(rdev, PPSMC_MSG_NoForcedLevel) != PPSMC_Result_OK)
1046                 return -EINVAL;
1047
1048         return (ni_send_msg_to_smc_with_parameter(rdev, PPSMC_MSG_SetEnabledLevels, 1) == PPSMC_Result_OK) ?
1049                 0 : -EINVAL;
1050 }
1051
1052 int ni_dpm_force_performance_level(struct radeon_device *rdev,
1053                                    enum radeon_dpm_forced_level level)
1054 {
1055         if (level == RADEON_DPM_FORCED_LEVEL_HIGH) {
1056                 if (ni_send_msg_to_smc_with_parameter(rdev, PPSMC_MSG_SetEnabledLevels, 0) != PPSMC_Result_OK)
1057                         return -EINVAL;
1058
1059                 if (ni_send_msg_to_smc_with_parameter(rdev, PPSMC_MSG_SetForcedLevels, 1) != PPSMC_Result_OK)
1060                         return -EINVAL;
1061         } else if (level == RADEON_DPM_FORCED_LEVEL_LOW) {
1062                 if (ni_send_msg_to_smc_with_parameter(rdev, PPSMC_MSG_SetForcedLevels, 0) != PPSMC_Result_OK)
1063                         return -EINVAL;
1064
1065                 if (ni_send_msg_to_smc_with_parameter(rdev, PPSMC_MSG_SetEnabledLevels, 1) != PPSMC_Result_OK)
1066                         return -EINVAL;
1067         } else if (level == RADEON_DPM_FORCED_LEVEL_AUTO) {
1068                 if (ni_send_msg_to_smc_with_parameter(rdev, PPSMC_MSG_SetForcedLevels, 0) != PPSMC_Result_OK)
1069                         return -EINVAL;
1070
1071                 if (ni_send_msg_to_smc_with_parameter(rdev, PPSMC_MSG_SetEnabledLevels, 0) != PPSMC_Result_OK)
1072                         return -EINVAL;
1073         }
1074
1075         rdev->pm.dpm.forced_level = level;
1076
1077         return 0;
1078 }
1079
1080 static void ni_stop_smc(struct radeon_device *rdev)
1081 {
1082         u32 tmp;
1083         int i;
1084
1085         for (i = 0; i < rdev->usec_timeout; i++) {
1086                 tmp = RREG32(LB_SYNC_RESET_SEL) & LB_SYNC_RESET_SEL_MASK;
1087                 if (tmp != 1)
1088                         break;
1089                 udelay(1);
1090         }
1091
1092         udelay(100);
1093
1094         r7xx_stop_smc(rdev);
1095 }
1096
1097 static int ni_process_firmware_header(struct radeon_device *rdev)
1098 {
1099         struct rv7xx_power_info *pi = rv770_get_pi(rdev);
1100         struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
1101         struct ni_power_info *ni_pi = ni_get_pi(rdev);
1102         u32 tmp;
1103         int ret;
1104
1105         ret = rv770_read_smc_sram_dword(rdev,
1106                                         NISLANDS_SMC_FIRMWARE_HEADER_LOCATION +
1107                                         NISLANDS_SMC_FIRMWARE_HEADER_stateTable,
1108                                         &tmp, pi->sram_end);
1109
1110         if (ret)
1111                 return ret;
1112
1113         pi->state_table_start = (u16)tmp;
1114
1115         ret = rv770_read_smc_sram_dword(rdev,
1116                                         NISLANDS_SMC_FIRMWARE_HEADER_LOCATION +
1117                                         NISLANDS_SMC_FIRMWARE_HEADER_softRegisters,
1118                                         &tmp, pi->sram_end);
1119
1120         if (ret)
1121                 return ret;
1122
1123         pi->soft_regs_start = (u16)tmp;
1124
1125         ret = rv770_read_smc_sram_dword(rdev,
1126                                         NISLANDS_SMC_FIRMWARE_HEADER_LOCATION +
1127                                         NISLANDS_SMC_FIRMWARE_HEADER_mcRegisterTable,
1128                                         &tmp, pi->sram_end);
1129
1130         if (ret)
1131                 return ret;
1132
1133         eg_pi->mc_reg_table_start = (u16)tmp;
1134
1135         ret = rv770_read_smc_sram_dword(rdev,
1136                                         NISLANDS_SMC_FIRMWARE_HEADER_LOCATION +
1137                                         NISLANDS_SMC_FIRMWARE_HEADER_fanTable,
1138                                         &tmp, pi->sram_end);
1139
1140         if (ret)
1141                 return ret;
1142
1143         ni_pi->fan_table_start = (u16)tmp;
1144
1145         ret = rv770_read_smc_sram_dword(rdev,
1146                                         NISLANDS_SMC_FIRMWARE_HEADER_LOCATION +
1147                                         NISLANDS_SMC_FIRMWARE_HEADER_mcArbDramAutoRefreshTable,
1148                                         &tmp, pi->sram_end);
1149
1150         if (ret)
1151                 return ret;
1152
1153         ni_pi->arb_table_start = (u16)tmp;
1154
1155         ret = rv770_read_smc_sram_dword(rdev,
1156                                         NISLANDS_SMC_FIRMWARE_HEADER_LOCATION +
1157                                         NISLANDS_SMC_FIRMWARE_HEADER_cacTable,
1158                                         &tmp, pi->sram_end);
1159
1160         if (ret)
1161                 return ret;
1162
1163         ni_pi->cac_table_start = (u16)tmp;
1164
1165         ret = rv770_read_smc_sram_dword(rdev,
1166                                         NISLANDS_SMC_FIRMWARE_HEADER_LOCATION +
1167                                         NISLANDS_SMC_FIRMWARE_HEADER_spllTable,
1168                                         &tmp, pi->sram_end);
1169
1170         if (ret)
1171                 return ret;
1172
1173         ni_pi->spll_table_start = (u16)tmp;
1174
1175
1176         return ret;
1177 }
1178
1179 static void ni_read_clock_registers(struct radeon_device *rdev)
1180 {
1181         struct ni_power_info *ni_pi = ni_get_pi(rdev);
1182
1183         ni_pi->clock_registers.cg_spll_func_cntl = RREG32(CG_SPLL_FUNC_CNTL);
1184         ni_pi->clock_registers.cg_spll_func_cntl_2 = RREG32(CG_SPLL_FUNC_CNTL_2);
1185         ni_pi->clock_registers.cg_spll_func_cntl_3 = RREG32(CG_SPLL_FUNC_CNTL_3);
1186         ni_pi->clock_registers.cg_spll_func_cntl_4 = RREG32(CG_SPLL_FUNC_CNTL_4);
1187         ni_pi->clock_registers.cg_spll_spread_spectrum = RREG32(CG_SPLL_SPREAD_SPECTRUM);
1188         ni_pi->clock_registers.cg_spll_spread_spectrum_2 = RREG32(CG_SPLL_SPREAD_SPECTRUM_2);
1189         ni_pi->clock_registers.mpll_ad_func_cntl = RREG32(MPLL_AD_FUNC_CNTL);
1190         ni_pi->clock_registers.mpll_ad_func_cntl_2 = RREG32(MPLL_AD_FUNC_CNTL_2);
1191         ni_pi->clock_registers.mpll_dq_func_cntl = RREG32(MPLL_DQ_FUNC_CNTL);
1192         ni_pi->clock_registers.mpll_dq_func_cntl_2 = RREG32(MPLL_DQ_FUNC_CNTL_2);
1193         ni_pi->clock_registers.mclk_pwrmgt_cntl = RREG32(MCLK_PWRMGT_CNTL);
1194         ni_pi->clock_registers.dll_cntl = RREG32(DLL_CNTL);
1195         ni_pi->clock_registers.mpll_ss1 = RREG32(MPLL_SS1);
1196         ni_pi->clock_registers.mpll_ss2 = RREG32(MPLL_SS2);
1197 }
1198
1199 #if 0
1200 static int ni_enter_ulp_state(struct radeon_device *rdev)
1201 {
1202         struct rv7xx_power_info *pi = rv770_get_pi(rdev);
1203
1204         if (pi->gfx_clock_gating) {
1205                 WREG32_P(SCLK_PWRMGT_CNTL, 0, ~DYN_GFX_CLK_OFF_EN);
1206                 WREG32_P(SCLK_PWRMGT_CNTL, GFX_CLK_FORCE_ON, ~GFX_CLK_FORCE_ON);
1207                 WREG32_P(SCLK_PWRMGT_CNTL, 0, ~GFX_CLK_FORCE_ON);
1208                 RREG32(GB_ADDR_CONFIG);
1209         }
1210
1211         WREG32_P(SMC_MSG, HOST_SMC_MSG(PPSMC_MSG_SwitchToMinimumPower),
1212                  ~HOST_SMC_MSG_MASK);
1213
1214         udelay(25000);
1215
1216         return 0;
1217 }
1218 #endif
1219
1220 static void ni_program_response_times(struct radeon_device *rdev)
1221 {
1222         u32 voltage_response_time, backbias_response_time, acpi_delay_time, vbi_time_out;
1223         u32 vddc_dly, bb_dly, acpi_dly, vbi_dly, mclk_switch_limit;
1224         u32 reference_clock;
1225
1226         rv770_write_smc_soft_register(rdev, NI_SMC_SOFT_REGISTER_mvdd_chg_time, 1);
1227
1228         voltage_response_time = (u32)rdev->pm.dpm.voltage_response_time;
1229         backbias_response_time = (u32)rdev->pm.dpm.backbias_response_time;
1230
1231         if (voltage_response_time == 0)
1232                 voltage_response_time = 1000;
1233
1234         if (backbias_response_time == 0)
1235                 backbias_response_time = 1000;
1236
1237         acpi_delay_time = 15000;
1238         vbi_time_out = 100000;
1239
1240         reference_clock = radeon_get_xclk(rdev);
1241
1242         vddc_dly = (voltage_response_time  * reference_clock) / 1600;
1243         bb_dly   = (backbias_response_time * reference_clock) / 1600;
1244         acpi_dly = (acpi_delay_time * reference_clock) / 1600;
1245         vbi_dly  = (vbi_time_out * reference_clock) / 1600;
1246
1247         mclk_switch_limit = (460 * reference_clock) / 100;
1248
1249         rv770_write_smc_soft_register(rdev, NI_SMC_SOFT_REGISTER_delay_vreg,  vddc_dly);
1250         rv770_write_smc_soft_register(rdev, NI_SMC_SOFT_REGISTER_delay_bbias, bb_dly);
1251         rv770_write_smc_soft_register(rdev, NI_SMC_SOFT_REGISTER_delay_acpi,  acpi_dly);
1252         rv770_write_smc_soft_register(rdev, NI_SMC_SOFT_REGISTER_mclk_chg_timeout, vbi_dly);
1253         rv770_write_smc_soft_register(rdev, NI_SMC_SOFT_REGISTER_mc_block_delay, 0xAA);
1254         rv770_write_smc_soft_register(rdev, NI_SMC_SOFT_REGISTER_mclk_switch_lim, mclk_switch_limit);
1255 }
1256
1257 static void ni_populate_smc_voltage_table(struct radeon_device *rdev,
1258                                           struct atom_voltage_table *voltage_table,
1259                                           NISLANDS_SMC_STATETABLE *table)
1260 {
1261         unsigned int i;
1262
1263         for (i = 0; i < voltage_table->count; i++) {
1264                 table->highSMIO[i] = 0;
1265                 table->lowSMIO[i] |= cpu_to_be32(voltage_table->entries[i].smio_low);
1266         }
1267 }
1268
1269 static void ni_populate_smc_voltage_tables(struct radeon_device *rdev,
1270                                            NISLANDS_SMC_STATETABLE *table)
1271 {
1272         struct rv7xx_power_info *pi = rv770_get_pi(rdev);
1273         struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
1274         unsigned char i;
1275
1276         if (eg_pi->vddc_voltage_table.count) {
1277                 ni_populate_smc_voltage_table(rdev, &eg_pi->vddc_voltage_table, table);
1278                 table->voltageMaskTable.highMask[NISLANDS_SMC_VOLTAGEMASK_VDDC] = 0;
1279                 table->voltageMaskTable.lowMask[NISLANDS_SMC_VOLTAGEMASK_VDDC] =
1280                         cpu_to_be32(eg_pi->vddc_voltage_table.mask_low);
1281
1282                 for (i = 0; i < eg_pi->vddc_voltage_table.count; i++) {
1283                         if (pi->max_vddc_in_table <= eg_pi->vddc_voltage_table.entries[i].value) {
1284                                 table->maxVDDCIndexInPPTable = i;
1285                                 break;
1286                         }
1287                 }
1288         }
1289
1290         if (eg_pi->vddci_voltage_table.count) {
1291                 ni_populate_smc_voltage_table(rdev, &eg_pi->vddci_voltage_table, table);
1292
1293                 table->voltageMaskTable.highMask[NISLANDS_SMC_VOLTAGEMASK_VDDCI] = 0;
1294                 table->voltageMaskTable.lowMask[NISLANDS_SMC_VOLTAGEMASK_VDDCI] =
1295                         cpu_to_be32(eg_pi->vddci_voltage_table.mask_low);
1296         }
1297 }
1298
1299 static int ni_populate_voltage_value(struct radeon_device *rdev,
1300                                      struct atom_voltage_table *table,
1301                                      u16 value,
1302                                      NISLANDS_SMC_VOLTAGE_VALUE *voltage)
1303 {
1304         unsigned int i;
1305
1306         for (i = 0; i < table->count; i++) {
1307                 if (value <= table->entries[i].value) {
1308                         voltage->index = (u8)i;
1309                         voltage->value = cpu_to_be16(table->entries[i].value);
1310                         break;
1311                 }
1312         }
1313
1314         if (i >= table->count)
1315                 return -EINVAL;
1316
1317         return 0;
1318 }
1319
1320 static void ni_populate_mvdd_value(struct radeon_device *rdev,
1321                                    u32 mclk,
1322                                    NISLANDS_SMC_VOLTAGE_VALUE *voltage)
1323 {
1324         struct rv7xx_power_info *pi = rv770_get_pi(rdev);
1325         struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
1326
1327         if (!pi->mvdd_control) {
1328                 voltage->index = eg_pi->mvdd_high_index;
1329                 voltage->value = cpu_to_be16(MVDD_HIGH_VALUE);
1330                 return;
1331         }
1332
1333         if (mclk <= pi->mvdd_split_frequency) {
1334                 voltage->index = eg_pi->mvdd_low_index;
1335                 voltage->value = cpu_to_be16(MVDD_LOW_VALUE);
1336         } else {
1337                 voltage->index = eg_pi->mvdd_high_index;
1338                 voltage->value = cpu_to_be16(MVDD_HIGH_VALUE);
1339         }
1340 }
1341
1342 static int ni_get_std_voltage_value(struct radeon_device *rdev,
1343                                     NISLANDS_SMC_VOLTAGE_VALUE *voltage,
1344                                     u16 *std_voltage)
1345 {
1346         if (rdev->pm.dpm.dyn_state.cac_leakage_table.entries &&
1347             ((u32)voltage->index < rdev->pm.dpm.dyn_state.cac_leakage_table.count))
1348                 *std_voltage = rdev->pm.dpm.dyn_state.cac_leakage_table.entries[voltage->index].vddc;
1349         else
1350                 *std_voltage = be16_to_cpu(voltage->value);
1351
1352         return 0;
1353 }
1354
1355 static void ni_populate_std_voltage_value(struct radeon_device *rdev,
1356                                           u16 value, u8 index,
1357                                           NISLANDS_SMC_VOLTAGE_VALUE *voltage)
1358 {
1359         voltage->index = index;
1360         voltage->value = cpu_to_be16(value);
1361 }
1362
1363 static u32 ni_get_smc_power_scaling_factor(struct radeon_device *rdev)
1364 {
1365         u32 xclk_period;
1366         u32 xclk = radeon_get_xclk(rdev);
1367         u32 tmp = RREG32(CG_CAC_CTRL) & TID_CNT_MASK;
1368
1369         xclk_period = (1000000000UL / xclk);
1370         xclk_period /= 10000UL;
1371
1372         return tmp * xclk_period;
1373 }
1374
1375 static u32 ni_scale_power_for_smc(u32 power_in_watts, u32 scaling_factor)
1376 {
1377         return (power_in_watts * scaling_factor) << 2;
1378 }
1379
1380 static u32 ni_calculate_power_boost_limit(struct radeon_device *rdev,
1381                                           struct radeon_ps *radeon_state,
1382                                           u32 near_tdp_limit)
1383 {
1384         struct ni_ps *state = ni_get_ps(radeon_state);
1385         struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
1386         struct ni_power_info *ni_pi = ni_get_pi(rdev);
1387         u32 power_boost_limit = 0;
1388         int ret;
1389
1390         if (ni_pi->enable_power_containment &&
1391             ni_pi->use_power_boost_limit) {
1392                 NISLANDS_SMC_VOLTAGE_VALUE vddc;
1393                 u16 std_vddc_med;
1394                 u16 std_vddc_high;
1395                 u64 tmp, n, d;
1396
1397                 if (state->performance_level_count < 3)
1398                         return 0;
1399
1400                 ret = ni_populate_voltage_value(rdev, &eg_pi->vddc_voltage_table,
1401                                                 state->performance_levels[state->performance_level_count - 2].vddc,
1402                                                 &vddc);
1403                 if (ret)
1404                         return 0;
1405
1406                 ret = ni_get_std_voltage_value(rdev, &vddc, &std_vddc_med);
1407                 if (ret)
1408                         return 0;
1409
1410                 ret = ni_populate_voltage_value(rdev, &eg_pi->vddc_voltage_table,
1411                                                 state->performance_levels[state->performance_level_count - 1].vddc,
1412                                                 &vddc);
1413                 if (ret)
1414                         return 0;
1415
1416                 ret = ni_get_std_voltage_value(rdev, &vddc, &std_vddc_high);
1417                 if (ret)
1418                         return 0;
1419
1420                 n = ((u64)near_tdp_limit * ((u64)std_vddc_med * (u64)std_vddc_med) * 90);
1421                 d = ((u64)std_vddc_high * (u64)std_vddc_high * 100);
1422                 tmp = div64_u64(n, d);
1423
1424                 if (tmp >> 32)
1425                         return 0;
1426                 power_boost_limit = (u32)tmp;
1427         }
1428
1429         return power_boost_limit;
1430 }
1431
1432 static int ni_calculate_adjusted_tdp_limits(struct radeon_device *rdev,
1433                                             bool adjust_polarity,
1434                                             u32 tdp_adjustment,
1435                                             u32 *tdp_limit,
1436                                             u32 *near_tdp_limit)
1437 {
1438         if (tdp_adjustment > (u32)rdev->pm.dpm.tdp_od_limit)
1439                 return -EINVAL;
1440
1441         if (adjust_polarity) {
1442                 *tdp_limit = ((100 + tdp_adjustment) * rdev->pm.dpm.tdp_limit) / 100;
1443                 *near_tdp_limit = rdev->pm.dpm.near_tdp_limit + (*tdp_limit - rdev->pm.dpm.tdp_limit);
1444         } else {
1445                 *tdp_limit = ((100 - tdp_adjustment) * rdev->pm.dpm.tdp_limit) / 100;
1446                 *near_tdp_limit = rdev->pm.dpm.near_tdp_limit - (rdev->pm.dpm.tdp_limit - *tdp_limit);
1447         }
1448
1449         return 0;
1450 }
1451
1452 static int ni_populate_smc_tdp_limits(struct radeon_device *rdev,
1453                                       struct radeon_ps *radeon_state)
1454 {
1455         struct rv7xx_power_info *pi = rv770_get_pi(rdev);
1456         struct ni_power_info *ni_pi = ni_get_pi(rdev);
1457
1458         if (ni_pi->enable_power_containment) {
1459                 NISLANDS_SMC_STATETABLE *smc_table = &ni_pi->smc_statetable;
1460                 u32 scaling_factor = ni_get_smc_power_scaling_factor(rdev);
1461                 u32 tdp_limit;
1462                 u32 near_tdp_limit;
1463                 u32 power_boost_limit;
1464                 int ret;
1465
1466                 if (scaling_factor == 0)
1467                         return -EINVAL;
1468
1469                 memset(smc_table, 0, sizeof(NISLANDS_SMC_STATETABLE));
1470
1471                 ret = ni_calculate_adjusted_tdp_limits(rdev,
1472                                                        false, /* ??? */
1473                                                        rdev->pm.dpm.tdp_adjustment,
1474                                                        &tdp_limit,
1475                                                        &near_tdp_limit);
1476                 if (ret)
1477                         return ret;
1478
1479                 power_boost_limit = ni_calculate_power_boost_limit(rdev, radeon_state,
1480                                                                    near_tdp_limit);
1481
1482                 smc_table->dpm2Params.TDPLimit =
1483                         cpu_to_be32(ni_scale_power_for_smc(tdp_limit, scaling_factor));
1484                 smc_table->dpm2Params.NearTDPLimit =
1485                         cpu_to_be32(ni_scale_power_for_smc(near_tdp_limit, scaling_factor));
1486                 smc_table->dpm2Params.SafePowerLimit =
1487                         cpu_to_be32(ni_scale_power_for_smc((near_tdp_limit * NISLANDS_DPM2_TDP_SAFE_LIMIT_PERCENT) / 100,
1488                                                            scaling_factor));
1489                 smc_table->dpm2Params.PowerBoostLimit =
1490                         cpu_to_be32(ni_scale_power_for_smc(power_boost_limit, scaling_factor));
1491
1492                 ret = rv770_copy_bytes_to_smc(rdev,
1493                                               (u16)(pi->state_table_start + offsetof(NISLANDS_SMC_STATETABLE, dpm2Params) +
1494                                                     offsetof(PP_NIslands_DPM2Parameters, TDPLimit)),
1495                                               (u8 *)(&smc_table->dpm2Params.TDPLimit),
1496                                               sizeof(u32) * 4, pi->sram_end);
1497                 if (ret)
1498                         return ret;
1499         }
1500
1501         return 0;
1502 }
1503
1504 int ni_copy_and_switch_arb_sets(struct radeon_device *rdev,
1505                                 u32 arb_freq_src, u32 arb_freq_dest)
1506 {
1507         u32 mc_arb_dram_timing;
1508         u32 mc_arb_dram_timing2;
1509         u32 burst_time;
1510         u32 mc_cg_config;
1511
1512         switch (arb_freq_src) {
1513         case MC_CG_ARB_FREQ_F0:
1514                 mc_arb_dram_timing  = RREG32(MC_ARB_DRAM_TIMING);
1515                 mc_arb_dram_timing2 = RREG32(MC_ARB_DRAM_TIMING2);
1516                 burst_time = (RREG32(MC_ARB_BURST_TIME) & STATE0_MASK) >> STATE0_SHIFT;
1517                 break;
1518         case MC_CG_ARB_FREQ_F1:
1519                 mc_arb_dram_timing  = RREG32(MC_ARB_DRAM_TIMING_1);
1520                 mc_arb_dram_timing2 = RREG32(MC_ARB_DRAM_TIMING2_1);
1521                 burst_time = (RREG32(MC_ARB_BURST_TIME) & STATE1_MASK) >> STATE1_SHIFT;
1522                 break;
1523         case MC_CG_ARB_FREQ_F2:
1524                 mc_arb_dram_timing  = RREG32(MC_ARB_DRAM_TIMING_2);
1525                 mc_arb_dram_timing2 = RREG32(MC_ARB_DRAM_TIMING2_2);
1526                 burst_time = (RREG32(MC_ARB_BURST_TIME) & STATE2_MASK) >> STATE2_SHIFT;
1527                 break;
1528         case MC_CG_ARB_FREQ_F3:
1529                 mc_arb_dram_timing  = RREG32(MC_ARB_DRAM_TIMING_3);
1530                 mc_arb_dram_timing2 = RREG32(MC_ARB_DRAM_TIMING2_3);
1531                 burst_time = (RREG32(MC_ARB_BURST_TIME) & STATE3_MASK) >> STATE3_SHIFT;
1532                 break;
1533         default:
1534                 return -EINVAL;
1535         }
1536
1537         switch (arb_freq_dest) {
1538         case MC_CG_ARB_FREQ_F0:
1539                 WREG32(MC_ARB_DRAM_TIMING, mc_arb_dram_timing);
1540                 WREG32(MC_ARB_DRAM_TIMING2, mc_arb_dram_timing2);
1541                 WREG32_P(MC_ARB_BURST_TIME, STATE0(burst_time), ~STATE0_MASK);
1542                 break;
1543         case MC_CG_ARB_FREQ_F1:
1544                 WREG32(MC_ARB_DRAM_TIMING_1, mc_arb_dram_timing);
1545                 WREG32(MC_ARB_DRAM_TIMING2_1, mc_arb_dram_timing2);
1546                 WREG32_P(MC_ARB_BURST_TIME, STATE1(burst_time), ~STATE1_MASK);
1547                 break;
1548         case MC_CG_ARB_FREQ_F2:
1549                 WREG32(MC_ARB_DRAM_TIMING_2, mc_arb_dram_timing);
1550                 WREG32(MC_ARB_DRAM_TIMING2_2, mc_arb_dram_timing2);
1551                 WREG32_P(MC_ARB_BURST_TIME, STATE2(burst_time), ~STATE2_MASK);
1552                 break;
1553         case MC_CG_ARB_FREQ_F3:
1554                 WREG32(MC_ARB_DRAM_TIMING_3, mc_arb_dram_timing);
1555                 WREG32(MC_ARB_DRAM_TIMING2_3, mc_arb_dram_timing2);
1556                 WREG32_P(MC_ARB_BURST_TIME, STATE3(burst_time), ~STATE3_MASK);
1557                 break;
1558         default:
1559                 return -EINVAL;
1560         }
1561
1562         mc_cg_config = RREG32(MC_CG_CONFIG) | 0x0000000F;
1563         WREG32(MC_CG_CONFIG, mc_cg_config);
1564         WREG32_P(MC_ARB_CG, CG_ARB_REQ(arb_freq_dest), ~CG_ARB_REQ_MASK);
1565
1566         return 0;
1567 }
1568
1569 static int ni_init_arb_table_index(struct radeon_device *rdev)
1570 {
1571         struct rv7xx_power_info *pi = rv770_get_pi(rdev);
1572         struct ni_power_info *ni_pi = ni_get_pi(rdev);
1573         u32 tmp;
1574         int ret;
1575
1576         ret = rv770_read_smc_sram_dword(rdev, ni_pi->arb_table_start,
1577                                         &tmp, pi->sram_end);
1578         if (ret)
1579                 return ret;
1580
1581         tmp &= 0x00FFFFFF;
1582         tmp |= ((u32)MC_CG_ARB_FREQ_F1) << 24;
1583
1584         return rv770_write_smc_sram_dword(rdev, ni_pi->arb_table_start,
1585                                           tmp, pi->sram_end);
1586 }
1587
1588 static int ni_initial_switch_from_arb_f0_to_f1(struct radeon_device *rdev)
1589 {
1590         return ni_copy_and_switch_arb_sets(rdev, MC_CG_ARB_FREQ_F0, MC_CG_ARB_FREQ_F1);
1591 }
1592
1593 static int ni_force_switch_to_arb_f0(struct radeon_device *rdev)
1594 {
1595         struct rv7xx_power_info *pi = rv770_get_pi(rdev);
1596         struct ni_power_info *ni_pi = ni_get_pi(rdev);
1597         u32 tmp;
1598         int ret;
1599
1600         ret = rv770_read_smc_sram_dword(rdev, ni_pi->arb_table_start,
1601                                         &tmp, pi->sram_end);
1602         if (ret)
1603                 return ret;
1604
1605         tmp = (tmp >> 24) & 0xff;
1606
1607         if (tmp == MC_CG_ARB_FREQ_F0)
1608                 return 0;
1609
1610         return ni_copy_and_switch_arb_sets(rdev, tmp, MC_CG_ARB_FREQ_F0);
1611 }
1612
1613 static int ni_populate_memory_timing_parameters(struct radeon_device *rdev,
1614                                                 struct rv7xx_pl *pl,
1615                                                 SMC_NIslands_MCArbDramTimingRegisterSet *arb_regs)
1616 {
1617         u32 dram_timing;
1618         u32 dram_timing2;
1619
1620         arb_regs->mc_arb_rfsh_rate =
1621                 (u8)rv770_calculate_memory_refresh_rate(rdev, pl->sclk);
1622
1623
1624         radeon_atom_set_engine_dram_timings(rdev, pl->sclk, pl->mclk);
1625
1626         dram_timing = RREG32(MC_ARB_DRAM_TIMING);
1627         dram_timing2 = RREG32(MC_ARB_DRAM_TIMING2);
1628
1629         arb_regs->mc_arb_dram_timing  = cpu_to_be32(dram_timing);
1630         arb_regs->mc_arb_dram_timing2 = cpu_to_be32(dram_timing2);
1631
1632         return 0;
1633 }
1634
1635 static int ni_do_program_memory_timing_parameters(struct radeon_device *rdev,
1636                                                   struct radeon_ps *radeon_state,
1637                                                   unsigned int first_arb_set)
1638 {
1639         struct rv7xx_power_info *pi = rv770_get_pi(rdev);
1640         struct ni_power_info *ni_pi = ni_get_pi(rdev);
1641         struct ni_ps *state = ni_get_ps(radeon_state);
1642         SMC_NIslands_MCArbDramTimingRegisterSet arb_regs = { 0 };
1643         int i, ret = 0;
1644
1645         for (i = 0; i < state->performance_level_count; i++) {
1646                 ret = ni_populate_memory_timing_parameters(rdev, &state->performance_levels[i], &arb_regs);
1647                 if (ret)
1648                         break;
1649
1650                 ret = rv770_copy_bytes_to_smc(rdev,
1651                                               (u16)(ni_pi->arb_table_start +
1652                                                     offsetof(SMC_NIslands_MCArbDramTimingRegisters, data) +
1653                                                     sizeof(SMC_NIslands_MCArbDramTimingRegisterSet) * (first_arb_set + i)),
1654                                               (u8 *)&arb_regs,
1655                                               (u16)sizeof(SMC_NIslands_MCArbDramTimingRegisterSet),
1656                                               pi->sram_end);
1657                 if (ret)
1658                         break;
1659         }
1660         return ret;
1661 }
1662
1663 static int ni_program_memory_timing_parameters(struct radeon_device *rdev,
1664                                                struct radeon_ps *radeon_new_state)
1665 {
1666         return ni_do_program_memory_timing_parameters(rdev, radeon_new_state,
1667                                                       NISLANDS_DRIVER_STATE_ARB_INDEX);
1668 }
1669
1670 static void ni_populate_initial_mvdd_value(struct radeon_device *rdev,
1671                                            struct NISLANDS_SMC_VOLTAGE_VALUE *voltage)
1672 {
1673         struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
1674
1675         voltage->index = eg_pi->mvdd_high_index;
1676         voltage->value = cpu_to_be16(MVDD_HIGH_VALUE);
1677 }
1678
1679 static int ni_populate_smc_initial_state(struct radeon_device *rdev,
1680                                          struct radeon_ps *radeon_initial_state,
1681                                          NISLANDS_SMC_STATETABLE *table)
1682 {
1683         struct ni_ps *initial_state = ni_get_ps(radeon_initial_state);
1684         struct rv7xx_power_info *pi = rv770_get_pi(rdev);
1685         struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
1686         struct ni_power_info *ni_pi = ni_get_pi(rdev);
1687         u32 reg;
1688         int ret;
1689
1690         table->initialState.level.mclk.vMPLL_AD_FUNC_CNTL =
1691                 cpu_to_be32(ni_pi->clock_registers.mpll_ad_func_cntl);
1692         table->initialState.level.mclk.vMPLL_AD_FUNC_CNTL_2 =
1693                 cpu_to_be32(ni_pi->clock_registers.mpll_ad_func_cntl_2);
1694         table->initialState.level.mclk.vMPLL_DQ_FUNC_CNTL =
1695                 cpu_to_be32(ni_pi->clock_registers.mpll_dq_func_cntl);
1696         table->initialState.level.mclk.vMPLL_DQ_FUNC_CNTL_2 =
1697                 cpu_to_be32(ni_pi->clock_registers.mpll_dq_func_cntl_2);
1698         table->initialState.level.mclk.vMCLK_PWRMGT_CNTL =
1699                 cpu_to_be32(ni_pi->clock_registers.mclk_pwrmgt_cntl);
1700         table->initialState.level.mclk.vDLL_CNTL =
1701                 cpu_to_be32(ni_pi->clock_registers.dll_cntl);
1702         table->initialState.level.mclk.vMPLL_SS =
1703                 cpu_to_be32(ni_pi->clock_registers.mpll_ss1);
1704         table->initialState.level.mclk.vMPLL_SS2 =
1705                 cpu_to_be32(ni_pi->clock_registers.mpll_ss2);
1706         table->initialState.level.mclk.mclk_value =
1707                 cpu_to_be32(initial_state->performance_levels[0].mclk);
1708
1709         table->initialState.level.sclk.vCG_SPLL_FUNC_CNTL =
1710                 cpu_to_be32(ni_pi->clock_registers.cg_spll_func_cntl);
1711         table->initialState.level.sclk.vCG_SPLL_FUNC_CNTL_2 =
1712                 cpu_to_be32(ni_pi->clock_registers.cg_spll_func_cntl_2);
1713         table->initialState.level.sclk.vCG_SPLL_FUNC_CNTL_3 =
1714                 cpu_to_be32(ni_pi->clock_registers.cg_spll_func_cntl_3);
1715         table->initialState.level.sclk.vCG_SPLL_FUNC_CNTL_4 =
1716                 cpu_to_be32(ni_pi->clock_registers.cg_spll_func_cntl_4);
1717         table->initialState.level.sclk.vCG_SPLL_SPREAD_SPECTRUM =
1718                 cpu_to_be32(ni_pi->clock_registers.cg_spll_spread_spectrum);
1719         table->initialState.level.sclk.vCG_SPLL_SPREAD_SPECTRUM_2 =
1720                 cpu_to_be32(ni_pi->clock_registers.cg_spll_spread_spectrum_2);
1721         table->initialState.level.sclk.sclk_value =
1722                 cpu_to_be32(initial_state->performance_levels[0].sclk);
1723         table->initialState.level.arbRefreshState =
1724                 NISLANDS_INITIAL_STATE_ARB_INDEX;
1725
1726         table->initialState.level.ACIndex = 0;
1727
1728         ret = ni_populate_voltage_value(rdev, &eg_pi->vddc_voltage_table,
1729                                         initial_state->performance_levels[0].vddc,
1730                                         &table->initialState.level.vddc);
1731         if (!ret) {
1732                 u16 std_vddc;
1733
1734                 ret = ni_get_std_voltage_value(rdev,
1735                                                &table->initialState.level.vddc,
1736                                                &std_vddc);
1737                 if (!ret)
1738                         ni_populate_std_voltage_value(rdev, std_vddc,
1739                                                       table->initialState.level.vddc.index,
1740                                                       &table->initialState.level.std_vddc);
1741         }
1742
1743         if (eg_pi->vddci_control)
1744                 ni_populate_voltage_value(rdev,
1745                                           &eg_pi->vddci_voltage_table,
1746                                           initial_state->performance_levels[0].vddci,
1747                                           &table->initialState.level.vddci);
1748
1749         ni_populate_initial_mvdd_value(rdev, &table->initialState.level.mvdd);
1750
1751         reg = CG_R(0xffff) | CG_L(0);
1752         table->initialState.level.aT = cpu_to_be32(reg);
1753
1754         table->initialState.level.bSP = cpu_to_be32(pi->dsp);
1755
1756         if (pi->boot_in_gen2)
1757                 table->initialState.level.gen2PCIE = 1;
1758         else
1759                 table->initialState.level.gen2PCIE = 0;
1760
1761         if (pi->mem_gddr5) {
1762                 table->initialState.level.strobeMode =
1763                         cypress_get_strobe_mode_settings(rdev,
1764                                                          initial_state->performance_levels[0].mclk);
1765
1766                 if (initial_state->performance_levels[0].mclk > pi->mclk_edc_enable_threshold)
1767                         table->initialState.level.mcFlags = NISLANDS_SMC_MC_EDC_RD_FLAG | NISLANDS_SMC_MC_EDC_WR_FLAG;
1768                 else
1769                         table->initialState.level.mcFlags =  0;
1770         }
1771
1772         table->initialState.levelCount = 1;
1773
1774         table->initialState.flags |= PPSMC_SWSTATE_FLAG_DC;
1775
1776         table->initialState.level.dpm2.MaxPS = 0;
1777         table->initialState.level.dpm2.NearTDPDec = 0;
1778         table->initialState.level.dpm2.AboveSafeInc = 0;
1779         table->initialState.level.dpm2.BelowSafeInc = 0;
1780
1781         reg = MIN_POWER_MASK | MAX_POWER_MASK;
1782         table->initialState.level.SQPowerThrottle = cpu_to_be32(reg);
1783
1784         reg = MAX_POWER_DELTA_MASK | STI_SIZE_MASK | LTI_RATIO_MASK;
1785         table->initialState.level.SQPowerThrottle_2 = cpu_to_be32(reg);
1786
1787         return 0;
1788 }
1789
1790 static int ni_populate_smc_acpi_state(struct radeon_device *rdev,
1791                                       NISLANDS_SMC_STATETABLE *table)
1792 {
1793         struct rv7xx_power_info *pi = rv770_get_pi(rdev);
1794         struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
1795         struct ni_power_info *ni_pi = ni_get_pi(rdev);
1796         u32 mpll_ad_func_cntl   = ni_pi->clock_registers.mpll_ad_func_cntl;
1797         u32 mpll_ad_func_cntl_2 = ni_pi->clock_registers.mpll_ad_func_cntl_2;
1798         u32 mpll_dq_func_cntl   = ni_pi->clock_registers.mpll_dq_func_cntl;
1799         u32 mpll_dq_func_cntl_2 = ni_pi->clock_registers.mpll_dq_func_cntl_2;
1800         u32 spll_func_cntl      = ni_pi->clock_registers.cg_spll_func_cntl;
1801         u32 spll_func_cntl_2    = ni_pi->clock_registers.cg_spll_func_cntl_2;
1802         u32 spll_func_cntl_3    = ni_pi->clock_registers.cg_spll_func_cntl_3;
1803         u32 spll_func_cntl_4    = ni_pi->clock_registers.cg_spll_func_cntl_4;
1804         u32 mclk_pwrmgt_cntl    = ni_pi->clock_registers.mclk_pwrmgt_cntl;
1805         u32 dll_cntl            = ni_pi->clock_registers.dll_cntl;
1806         u32 reg;
1807         int ret;
1808
1809         table->ACPIState = table->initialState;
1810
1811         table->ACPIState.flags &= ~PPSMC_SWSTATE_FLAG_DC;
1812
1813         if (pi->acpi_vddc) {
1814                 ret = ni_populate_voltage_value(rdev,
1815                                                 &eg_pi->vddc_voltage_table,
1816                                                 pi->acpi_vddc, &table->ACPIState.level.vddc);
1817                 if (!ret) {
1818                         u16 std_vddc;
1819
1820                         ret = ni_get_std_voltage_value(rdev,
1821                                                        &table->ACPIState.level.vddc, &std_vddc);
1822                         if (!ret)
1823                                 ni_populate_std_voltage_value(rdev, std_vddc,
1824                                                               table->ACPIState.level.vddc.index,
1825                                                               &table->ACPIState.level.std_vddc);
1826                 }
1827
1828                 if (pi->pcie_gen2) {
1829                         if (pi->acpi_pcie_gen2)
1830                                 table->ACPIState.level.gen2PCIE = 1;
1831                         else
1832                                 table->ACPIState.level.gen2PCIE = 0;
1833                 } else {
1834                         table->ACPIState.level.gen2PCIE = 0;
1835                 }
1836         } else {
1837                 ret = ni_populate_voltage_value(rdev,
1838                                                 &eg_pi->vddc_voltage_table,
1839                                                 pi->min_vddc_in_table,
1840                                                 &table->ACPIState.level.vddc);
1841                 if (!ret) {
1842                         u16 std_vddc;
1843
1844                         ret = ni_get_std_voltage_value(rdev,
1845                                                        &table->ACPIState.level.vddc,
1846                                                        &std_vddc);
1847                         if (!ret)
1848                                 ni_populate_std_voltage_value(rdev, std_vddc,
1849                                                               table->ACPIState.level.vddc.index,
1850                                                               &table->ACPIState.level.std_vddc);
1851                 }
1852                 table->ACPIState.level.gen2PCIE = 0;
1853         }
1854
1855         if (eg_pi->acpi_vddci) {
1856                 if (eg_pi->vddci_control)
1857                         ni_populate_voltage_value(rdev,
1858                                                   &eg_pi->vddci_voltage_table,
1859                                                   eg_pi->acpi_vddci,
1860                                                   &table->ACPIState.level.vddci);
1861         }
1862
1863
1864         mpll_ad_func_cntl &= ~PDNB;
1865
1866         mpll_ad_func_cntl_2 |= BIAS_GEN_PDNB | RESET_EN;
1867
1868         if (pi->mem_gddr5)
1869                 mpll_dq_func_cntl &= ~PDNB;
1870         mpll_dq_func_cntl_2 |= BIAS_GEN_PDNB | RESET_EN | BYPASS;
1871
1872
1873         mclk_pwrmgt_cntl |= (MRDCKA0_RESET |
1874                              MRDCKA1_RESET |
1875                              MRDCKB0_RESET |
1876                              MRDCKB1_RESET |
1877                              MRDCKC0_RESET |
1878                              MRDCKC1_RESET |
1879                              MRDCKD0_RESET |
1880                              MRDCKD1_RESET);
1881
1882         mclk_pwrmgt_cntl &= ~(MRDCKA0_PDNB |
1883                               MRDCKA1_PDNB |
1884                               MRDCKB0_PDNB |
1885                               MRDCKB1_PDNB |
1886                               MRDCKC0_PDNB |
1887                               MRDCKC1_PDNB |
1888                               MRDCKD0_PDNB |
1889                               MRDCKD1_PDNB);
1890
1891         dll_cntl |= (MRDCKA0_BYPASS |
1892                      MRDCKA1_BYPASS |
1893                      MRDCKB0_BYPASS |
1894                      MRDCKB1_BYPASS |
1895                      MRDCKC0_BYPASS |
1896                      MRDCKC1_BYPASS |
1897                      MRDCKD0_BYPASS |
1898                      MRDCKD1_BYPASS);
1899
1900         spll_func_cntl_2 &= ~SCLK_MUX_SEL_MASK;
1901         spll_func_cntl_2 |= SCLK_MUX_SEL(4);
1902
1903         table->ACPIState.level.mclk.vMPLL_AD_FUNC_CNTL = cpu_to_be32(mpll_ad_func_cntl);
1904         table->ACPIState.level.mclk.vMPLL_AD_FUNC_CNTL_2 = cpu_to_be32(mpll_ad_func_cntl_2);
1905         table->ACPIState.level.mclk.vMPLL_DQ_FUNC_CNTL = cpu_to_be32(mpll_dq_func_cntl);
1906         table->ACPIState.level.mclk.vMPLL_DQ_FUNC_CNTL_2 = cpu_to_be32(mpll_dq_func_cntl_2);
1907         table->ACPIState.level.mclk.vMCLK_PWRMGT_CNTL = cpu_to_be32(mclk_pwrmgt_cntl);
1908         table->ACPIState.level.mclk.vDLL_CNTL = cpu_to_be32(dll_cntl);
1909
1910         table->ACPIState.level.mclk.mclk_value = 0;
1911
1912         table->ACPIState.level.sclk.vCG_SPLL_FUNC_CNTL = cpu_to_be32(spll_func_cntl);
1913         table->ACPIState.level.sclk.vCG_SPLL_FUNC_CNTL_2 = cpu_to_be32(spll_func_cntl_2);
1914         table->ACPIState.level.sclk.vCG_SPLL_FUNC_CNTL_3 = cpu_to_be32(spll_func_cntl_3);
1915         table->ACPIState.level.sclk.vCG_SPLL_FUNC_CNTL_4 = cpu_to_be32(spll_func_cntl_4);
1916
1917         table->ACPIState.level.sclk.sclk_value = 0;
1918
1919         ni_populate_mvdd_value(rdev, 0, &table->ACPIState.level.mvdd);
1920
1921         if (eg_pi->dynamic_ac_timing)
1922                 table->ACPIState.level.ACIndex = 1;
1923
1924         table->ACPIState.level.dpm2.MaxPS = 0;
1925         table->ACPIState.level.dpm2.NearTDPDec = 0;
1926         table->ACPIState.level.dpm2.AboveSafeInc = 0;
1927         table->ACPIState.level.dpm2.BelowSafeInc = 0;
1928
1929         reg = MIN_POWER_MASK | MAX_POWER_MASK;
1930         table->ACPIState.level.SQPowerThrottle = cpu_to_be32(reg);
1931
1932         reg = MAX_POWER_DELTA_MASK | STI_SIZE_MASK | LTI_RATIO_MASK;
1933         table->ACPIState.level.SQPowerThrottle_2 = cpu_to_be32(reg);
1934
1935         return 0;
1936 }
1937
1938 static int ni_init_smc_table(struct radeon_device *rdev)
1939 {
1940         struct rv7xx_power_info *pi = rv770_get_pi(rdev);
1941         struct ni_power_info *ni_pi = ni_get_pi(rdev);
1942         int ret;
1943         struct radeon_ps *radeon_boot_state = rdev->pm.dpm.boot_ps;
1944         NISLANDS_SMC_STATETABLE *table = &ni_pi->smc_statetable;
1945
1946         memset(table, 0, sizeof(NISLANDS_SMC_STATETABLE));
1947
1948         ni_populate_smc_voltage_tables(rdev, table);
1949
1950         switch (rdev->pm.int_thermal_type) {
1951         case THERMAL_TYPE_NI:
1952         case THERMAL_TYPE_EMC2103_WITH_INTERNAL:
1953                 table->thermalProtectType = PPSMC_THERMAL_PROTECT_TYPE_INTERNAL;
1954                 break;
1955         case THERMAL_TYPE_NONE:
1956                 table->thermalProtectType = PPSMC_THERMAL_PROTECT_TYPE_NONE;
1957                 break;
1958         default:
1959                 table->thermalProtectType = PPSMC_THERMAL_PROTECT_TYPE_EXTERNAL;
1960                 break;
1961         }
1962
1963         if (rdev->pm.dpm.platform_caps & ATOM_PP_PLATFORM_CAP_HARDWAREDC)
1964                 table->systemFlags |= PPSMC_SYSTEMFLAG_GPIO_DC;
1965
1966         if (rdev->pm.dpm.platform_caps & ATOM_PP_PLATFORM_CAP_REGULATOR_HOT)
1967                 table->systemFlags |= PPSMC_SYSTEMFLAG_REGULATOR_HOT;
1968
1969         if (rdev->pm.dpm.platform_caps & ATOM_PP_PLATFORM_CAP_STEPVDDC)
1970                 table->systemFlags |= PPSMC_SYSTEMFLAG_STEPVDDC;
1971
1972         if (pi->mem_gddr5)
1973                 table->systemFlags |= PPSMC_SYSTEMFLAG_GDDR5;
1974
1975         ret = ni_populate_smc_initial_state(rdev, radeon_boot_state, table);
1976         if (ret)
1977                 return ret;
1978
1979         ret = ni_populate_smc_acpi_state(rdev, table);
1980         if (ret)
1981                 return ret;
1982
1983         table->driverState.flags = table->initialState.flags;
1984         table->driverState.levelCount = table->initialState.levelCount;
1985         table->driverState.levels[0] = table->initialState.level;
1986
1987         table->ULVState = table->initialState;
1988
1989         ret = ni_do_program_memory_timing_parameters(rdev, radeon_boot_state,
1990                                                      NISLANDS_INITIAL_STATE_ARB_INDEX);
1991         if (ret)
1992                 return ret;
1993
1994         return rv770_copy_bytes_to_smc(rdev, pi->state_table_start, (u8 *)table,
1995                                        sizeof(NISLANDS_SMC_STATETABLE), pi->sram_end);
1996 }
1997
1998 static int ni_calculate_sclk_params(struct radeon_device *rdev,
1999                                     u32 engine_clock,
2000                                     NISLANDS_SMC_SCLK_VALUE *sclk)
2001 {
2002         struct rv7xx_power_info *pi = rv770_get_pi(rdev);
2003         struct ni_power_info *ni_pi = ni_get_pi(rdev);
2004         struct atom_clock_dividers dividers;
2005         u32 spll_func_cntl = ni_pi->clock_registers.cg_spll_func_cntl;
2006         u32 spll_func_cntl_2 = ni_pi->clock_registers.cg_spll_func_cntl_2;
2007         u32 spll_func_cntl_3 = ni_pi->clock_registers.cg_spll_func_cntl_3;
2008         u32 spll_func_cntl_4 = ni_pi->clock_registers.cg_spll_func_cntl_4;
2009         u32 cg_spll_spread_spectrum = ni_pi->clock_registers.cg_spll_spread_spectrum;
2010         u32 cg_spll_spread_spectrum_2 = ni_pi->clock_registers.cg_spll_spread_spectrum_2;
2011         u64 tmp;
2012         u32 reference_clock = rdev->clock.spll.reference_freq;
2013         u32 reference_divider;
2014         u32 fbdiv;
2015         int ret;
2016
2017         ret = radeon_atom_get_clock_dividers(rdev, COMPUTE_ENGINE_PLL_PARAM,
2018                                              engine_clock, false, &dividers);
2019         if (ret)
2020                 return ret;
2021
2022         reference_divider = 1 + dividers.ref_div;
2023
2024
2025         tmp = (u64) engine_clock * reference_divider * dividers.post_div * 16834;
2026         do_div(tmp, reference_clock);
2027         fbdiv = (u32) tmp;
2028
2029         spll_func_cntl &= ~(SPLL_PDIV_A_MASK | SPLL_REF_DIV_MASK);
2030         spll_func_cntl |= SPLL_REF_DIV(dividers.ref_div);
2031         spll_func_cntl |= SPLL_PDIV_A(dividers.post_div);
2032
2033         spll_func_cntl_2 &= ~SCLK_MUX_SEL_MASK;
2034         spll_func_cntl_2 |= SCLK_MUX_SEL(2);
2035
2036         spll_func_cntl_3 &= ~SPLL_FB_DIV_MASK;
2037         spll_func_cntl_3 |= SPLL_FB_DIV(fbdiv);
2038         spll_func_cntl_3 |= SPLL_DITHEN;
2039
2040         if (pi->sclk_ss) {
2041                 struct radeon_atom_ss ss;
2042                 u32 vco_freq = engine_clock * dividers.post_div;
2043
2044                 if (radeon_atombios_get_asic_ss_info(rdev, &ss,
2045                                                      ASIC_INTERNAL_ENGINE_SS, vco_freq)) {
2046                         u32 clk_s = reference_clock * 5 / (reference_divider * ss.rate);
2047                         u32 clk_v = 4 * ss.percentage * fbdiv / (clk_s * 10000);
2048
2049                         cg_spll_spread_spectrum &= ~CLK_S_MASK;
2050                         cg_spll_spread_spectrum |= CLK_S(clk_s);
2051                         cg_spll_spread_spectrum |= SSEN;
2052
2053                         cg_spll_spread_spectrum_2 &= ~CLK_V_MASK;
2054                         cg_spll_spread_spectrum_2 |= CLK_V(clk_v);
2055                 }
2056         }
2057
2058         sclk->sclk_value = engine_clock;
2059         sclk->vCG_SPLL_FUNC_CNTL = spll_func_cntl;
2060         sclk->vCG_SPLL_FUNC_CNTL_2 = spll_func_cntl_2;
2061         sclk->vCG_SPLL_FUNC_CNTL_3 = spll_func_cntl_3;
2062         sclk->vCG_SPLL_FUNC_CNTL_4 = spll_func_cntl_4;
2063         sclk->vCG_SPLL_SPREAD_SPECTRUM = cg_spll_spread_spectrum;
2064         sclk->vCG_SPLL_SPREAD_SPECTRUM_2 = cg_spll_spread_spectrum_2;
2065
2066         return 0;
2067 }
2068
2069 static int ni_populate_sclk_value(struct radeon_device *rdev,
2070                                   u32 engine_clock,
2071                                   NISLANDS_SMC_SCLK_VALUE *sclk)
2072 {
2073         NISLANDS_SMC_SCLK_VALUE sclk_tmp;
2074         int ret;
2075
2076         ret = ni_calculate_sclk_params(rdev, engine_clock, &sclk_tmp);
2077         if (!ret) {
2078                 sclk->sclk_value = cpu_to_be32(sclk_tmp.sclk_value);
2079                 sclk->vCG_SPLL_FUNC_CNTL = cpu_to_be32(sclk_tmp.vCG_SPLL_FUNC_CNTL);
2080                 sclk->vCG_SPLL_FUNC_CNTL_2 = cpu_to_be32(sclk_tmp.vCG_SPLL_FUNC_CNTL_2);
2081                 sclk->vCG_SPLL_FUNC_CNTL_3 = cpu_to_be32(sclk_tmp.vCG_SPLL_FUNC_CNTL_3);
2082                 sclk->vCG_SPLL_FUNC_CNTL_4 = cpu_to_be32(sclk_tmp.vCG_SPLL_FUNC_CNTL_4);
2083                 sclk->vCG_SPLL_SPREAD_SPECTRUM = cpu_to_be32(sclk_tmp.vCG_SPLL_SPREAD_SPECTRUM);
2084                 sclk->vCG_SPLL_SPREAD_SPECTRUM_2 = cpu_to_be32(sclk_tmp.vCG_SPLL_SPREAD_SPECTRUM_2);
2085         }
2086
2087         return ret;
2088 }
2089
2090 static int ni_init_smc_spll_table(struct radeon_device *rdev)
2091 {
2092         struct rv7xx_power_info *pi = rv770_get_pi(rdev);
2093         struct ni_power_info *ni_pi = ni_get_pi(rdev);
2094         SMC_NISLANDS_SPLL_DIV_TABLE *spll_table;
2095         NISLANDS_SMC_SCLK_VALUE sclk_params;
2096         u32 fb_div;
2097         u32 p_div;
2098         u32 clk_s;
2099         u32 clk_v;
2100         u32 sclk = 0;
2101         int i, ret;
2102         u32 tmp;
2103
2104         if (ni_pi->spll_table_start == 0)
2105                 return -EINVAL;
2106
2107         spll_table = kzalloc(sizeof(SMC_NISLANDS_SPLL_DIV_TABLE), GFP_KERNEL);
2108         if (spll_table == NULL)
2109                 return -ENOMEM;
2110
2111         for (i = 0; i < 256; i++) {
2112                 ret = ni_calculate_sclk_params(rdev, sclk, &sclk_params);
2113                 if (ret)
2114                         break;
2115
2116                 p_div = (sclk_params.vCG_SPLL_FUNC_CNTL & SPLL_PDIV_A_MASK) >> SPLL_PDIV_A_SHIFT;
2117                 fb_div = (sclk_params.vCG_SPLL_FUNC_CNTL_3 & SPLL_FB_DIV_MASK) >> SPLL_FB_DIV_SHIFT;
2118                 clk_s = (sclk_params.vCG_SPLL_SPREAD_SPECTRUM & CLK_S_MASK) >> CLK_S_SHIFT;
2119                 clk_v = (sclk_params.vCG_SPLL_SPREAD_SPECTRUM_2 & CLK_V_MASK) >> CLK_V_SHIFT;
2120
2121                 fb_div &= ~0x00001FFF;
2122                 fb_div >>= 1;
2123                 clk_v >>= 6;
2124
2125                 if (p_div & ~(SMC_NISLANDS_SPLL_DIV_TABLE_PDIV_MASK >> SMC_NISLANDS_SPLL_DIV_TABLE_PDIV_SHIFT))
2126                         ret = -EINVAL;
2127
2128                 if (clk_s & ~(SMC_NISLANDS_SPLL_DIV_TABLE_CLKS_MASK >> SMC_NISLANDS_SPLL_DIV_TABLE_CLKS_SHIFT))
2129                         ret = -EINVAL;
2130
2131                 if (fb_div & ~(SMC_NISLANDS_SPLL_DIV_TABLE_FBDIV_MASK >> SMC_NISLANDS_SPLL_DIV_TABLE_FBDIV_SHIFT))
2132                         ret = -EINVAL;
2133
2134                 if (clk_v & ~(SMC_NISLANDS_SPLL_DIV_TABLE_CLKV_MASK >> SMC_NISLANDS_SPLL_DIV_TABLE_CLKV_SHIFT))
2135                         ret = -EINVAL;
2136
2137                 if (ret)
2138                         break;
2139
2140                 tmp = ((fb_div << SMC_NISLANDS_SPLL_DIV_TABLE_FBDIV_SHIFT) & SMC_NISLANDS_SPLL_DIV_TABLE_FBDIV_MASK) |
2141                         ((p_div << SMC_NISLANDS_SPLL_DIV_TABLE_PDIV_SHIFT) & SMC_NISLANDS_SPLL_DIV_TABLE_PDIV_MASK);
2142                 spll_table->freq[i] = cpu_to_be32(tmp);
2143
2144                 tmp = ((clk_v << SMC_NISLANDS_SPLL_DIV_TABLE_CLKV_SHIFT) & SMC_NISLANDS_SPLL_DIV_TABLE_CLKV_MASK) |
2145                         ((clk_s << SMC_NISLANDS_SPLL_DIV_TABLE_CLKS_SHIFT) & SMC_NISLANDS_SPLL_DIV_TABLE_CLKS_MASK);
2146                 spll_table->ss[i] = cpu_to_be32(tmp);
2147
2148                 sclk += 512;
2149         }
2150
2151         if (!ret)
2152                 ret = rv770_copy_bytes_to_smc(rdev, ni_pi->spll_table_start, (u8 *)spll_table,
2153                                               sizeof(SMC_NISLANDS_SPLL_DIV_TABLE), pi->sram_end);
2154
2155         kfree(spll_table);
2156
2157         return ret;
2158 }
2159
2160 static int ni_populate_mclk_value(struct radeon_device *rdev,
2161                                   u32 engine_clock,
2162                                   u32 memory_clock,
2163                                   NISLANDS_SMC_MCLK_VALUE *mclk,
2164                                   bool strobe_mode,
2165                                   bool dll_state_on)
2166 {
2167         struct rv7xx_power_info *pi = rv770_get_pi(rdev);
2168         struct ni_power_info *ni_pi = ni_get_pi(rdev);
2169         u32 mpll_ad_func_cntl = ni_pi->clock_registers.mpll_ad_func_cntl;
2170         u32 mpll_ad_func_cntl_2 = ni_pi->clock_registers.mpll_ad_func_cntl_2;
2171         u32 mpll_dq_func_cntl = ni_pi->clock_registers.mpll_dq_func_cntl;
2172         u32 mpll_dq_func_cntl_2 = ni_pi->clock_registers.mpll_dq_func_cntl_2;
2173         u32 mclk_pwrmgt_cntl = ni_pi->clock_registers.mclk_pwrmgt_cntl;
2174         u32 dll_cntl = ni_pi->clock_registers.dll_cntl;
2175         u32 mpll_ss1 = ni_pi->clock_registers.mpll_ss1;
2176         u32 mpll_ss2 = ni_pi->clock_registers.mpll_ss2;
2177         struct atom_clock_dividers dividers;
2178         u32 ibias;
2179         u32 dll_speed;
2180         int ret;
2181         u32 mc_seq_misc7;
2182
2183         ret = radeon_atom_get_clock_dividers(rdev, COMPUTE_MEMORY_PLL_PARAM,
2184                                              memory_clock, strobe_mode, &dividers);
2185         if (ret)
2186                 return ret;
2187
2188         if (!strobe_mode) {
2189                 mc_seq_misc7 = RREG32(MC_SEQ_MISC7);
2190
2191                 if (mc_seq_misc7 & 0x8000000)
2192                         dividers.post_div = 1;
2193         }
2194
2195         ibias = cypress_map_clkf_to_ibias(rdev, dividers.whole_fb_div);
2196
2197         mpll_ad_func_cntl &= ~(CLKR_MASK |
2198                                YCLK_POST_DIV_MASK |
2199                                CLKF_MASK |
2200                                CLKFRAC_MASK |
2201                                IBIAS_MASK);
2202         mpll_ad_func_cntl |= CLKR(dividers.ref_div);
2203         mpll_ad_func_cntl |= YCLK_POST_DIV(dividers.post_div);
2204         mpll_ad_func_cntl |= CLKF(dividers.whole_fb_div);
2205         mpll_ad_func_cntl |= CLKFRAC(dividers.frac_fb_div);
2206         mpll_ad_func_cntl |= IBIAS(ibias);
2207
2208         if (dividers.vco_mode)
2209                 mpll_ad_func_cntl_2 |= VCO_MODE;
2210         else
2211                 mpll_ad_func_cntl_2 &= ~VCO_MODE;
2212
2213         if (pi->mem_gddr5) {
2214                 mpll_dq_func_cntl &= ~(CLKR_MASK |
2215                                        YCLK_POST_DIV_MASK |
2216                                        CLKF_MASK |
2217                                        CLKFRAC_MASK |
2218                                        IBIAS_MASK);
2219                 mpll_dq_func_cntl |= CLKR(dividers.ref_div);
2220                 mpll_dq_func_cntl |= YCLK_POST_DIV(dividers.post_div);
2221                 mpll_dq_func_cntl |= CLKF(dividers.whole_fb_div);
2222                 mpll_dq_func_cntl |= CLKFRAC(dividers.frac_fb_div);
2223                 mpll_dq_func_cntl |= IBIAS(ibias);
2224
2225                 if (strobe_mode)
2226                         mpll_dq_func_cntl &= ~PDNB;
2227                 else
2228                         mpll_dq_func_cntl |= PDNB;
2229
2230                 if (dividers.vco_mode)
2231                         mpll_dq_func_cntl_2 |= VCO_MODE;
2232                 else
2233                         mpll_dq_func_cntl_2 &= ~VCO_MODE;
2234         }
2235
2236         if (pi->mclk_ss) {
2237                 struct radeon_atom_ss ss;
2238                 u32 vco_freq = memory_clock * dividers.post_div;
2239
2240                 if (radeon_atombios_get_asic_ss_info(rdev, &ss,
2241                                                      ASIC_INTERNAL_MEMORY_SS, vco_freq)) {
2242                         u32 reference_clock = rdev->clock.mpll.reference_freq;
2243                         u32 decoded_ref = rv740_get_decoded_reference_divider(dividers.ref_div);
2244                         u32 clk_s = reference_clock * 5 / (decoded_ref * ss.rate);
2245                         u32 clk_v = ss.percentage *
2246                                 (0x4000 * dividers.whole_fb_div + 0x800 * dividers.frac_fb_div) / (clk_s * 625);
2247
2248                         mpll_ss1 &= ~CLKV_MASK;
2249                         mpll_ss1 |= CLKV(clk_v);
2250
2251                         mpll_ss2 &= ~CLKS_MASK;
2252                         mpll_ss2 |= CLKS(clk_s);
2253                 }
2254         }
2255
2256         dll_speed = rv740_get_dll_speed(pi->mem_gddr5,
2257                                         memory_clock);
2258
2259         mclk_pwrmgt_cntl &= ~DLL_SPEED_MASK;
2260         mclk_pwrmgt_cntl |= DLL_SPEED(dll_speed);
2261         if (dll_state_on)
2262                 mclk_pwrmgt_cntl |= (MRDCKA0_PDNB |
2263                                      MRDCKA1_PDNB |
2264                                      MRDCKB0_PDNB |
2265                                      MRDCKB1_PDNB |
2266                                      MRDCKC0_PDNB |
2267                                      MRDCKC1_PDNB |
2268                                      MRDCKD0_PDNB |
2269                                      MRDCKD1_PDNB);
2270         else
2271                 mclk_pwrmgt_cntl &= ~(MRDCKA0_PDNB |
2272                                       MRDCKA1_PDNB |
2273                                       MRDCKB0_PDNB |
2274                                       MRDCKB1_PDNB |
2275                                       MRDCKC0_PDNB |
2276                                       MRDCKC1_PDNB |
2277                                       MRDCKD0_PDNB |
2278                                       MRDCKD1_PDNB);
2279
2280
2281         mclk->mclk_value = cpu_to_be32(memory_clock);
2282         mclk->vMPLL_AD_FUNC_CNTL = cpu_to_be32(mpll_ad_func_cntl);
2283         mclk->vMPLL_AD_FUNC_CNTL_2 = cpu_to_be32(mpll_ad_func_cntl_2);
2284         mclk->vMPLL_DQ_FUNC_CNTL = cpu_to_be32(mpll_dq_func_cntl);
2285         mclk->vMPLL_DQ_FUNC_CNTL_2 = cpu_to_be32(mpll_dq_func_cntl_2);
2286         mclk->vMCLK_PWRMGT_CNTL = cpu_to_be32(mclk_pwrmgt_cntl);
2287         mclk->vDLL_CNTL = cpu_to_be32(dll_cntl);
2288         mclk->vMPLL_SS = cpu_to_be32(mpll_ss1);
2289         mclk->vMPLL_SS2 = cpu_to_be32(mpll_ss2);
2290
2291         return 0;
2292 }
2293
2294 static void ni_populate_smc_sp(struct radeon_device *rdev,
2295                                struct radeon_ps *radeon_state,
2296                                NISLANDS_SMC_SWSTATE *smc_state)
2297 {
2298         struct ni_ps *ps = ni_get_ps(radeon_state);
2299         struct rv7xx_power_info *pi = rv770_get_pi(rdev);
2300         int i;
2301
2302         for (i = 0; i < ps->performance_level_count - 1; i++)
2303                 smc_state->levels[i].bSP = cpu_to_be32(pi->dsp);
2304
2305         smc_state->levels[ps->performance_level_count - 1].bSP =
2306                 cpu_to_be32(pi->psp);
2307 }
2308
2309 static int ni_convert_power_level_to_smc(struct radeon_device *rdev,
2310                                          struct rv7xx_pl *pl,
2311                                          NISLANDS_SMC_HW_PERFORMANCE_LEVEL *level)
2312 {
2313         struct rv7xx_power_info *pi = rv770_get_pi(rdev);
2314         struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
2315         struct ni_power_info *ni_pi = ni_get_pi(rdev);
2316         int ret;
2317         bool dll_state_on;
2318         u16 std_vddc;
2319         u32 tmp = RREG32(DC_STUTTER_CNTL);
2320
2321         level->gen2PCIE = pi->pcie_gen2 ?
2322                 ((pl->flags & ATOM_PPLIB_R600_FLAGS_PCIEGEN2) ? 1 : 0) : 0;
2323
2324         ret = ni_populate_sclk_value(rdev, pl->sclk, &level->sclk);
2325         if (ret)
2326                 return ret;
2327
2328         level->mcFlags =  0;
2329         if (pi->mclk_stutter_mode_threshold &&
2330             (pl->mclk <= pi->mclk_stutter_mode_threshold) &&
2331             !eg_pi->uvd_enabled &&
2332             (tmp & DC_STUTTER_ENABLE_A) &&
2333             (tmp & DC_STUTTER_ENABLE_B))
2334                 level->mcFlags |= NISLANDS_SMC_MC_STUTTER_EN;
2335
2336         if (pi->mem_gddr5) {
2337                 if (pl->mclk > pi->mclk_edc_enable_threshold)
2338                         level->mcFlags |= NISLANDS_SMC_MC_EDC_RD_FLAG;
2339                 if (pl->mclk > eg_pi->mclk_edc_wr_enable_threshold)
2340                         level->mcFlags |= NISLANDS_SMC_MC_EDC_WR_FLAG;
2341
2342                 level->strobeMode = cypress_get_strobe_mode_settings(rdev, pl->mclk);
2343
2344                 if (level->strobeMode & NISLANDS_SMC_STROBE_ENABLE) {
2345                         if (cypress_get_mclk_frequency_ratio(rdev, pl->mclk, true) >=
2346                             ((RREG32(MC_SEQ_MISC7) >> 16) & 0xf))
2347                                 dll_state_on = ((RREG32(MC_SEQ_MISC5) >> 1) & 0x1) ? true : false;
2348                         else
2349                                 dll_state_on = ((RREG32(MC_SEQ_MISC6) >> 1) & 0x1) ? true : false;
2350                 } else {
2351                         dll_state_on = false;
2352                         if (pl->mclk > ni_pi->mclk_rtt_mode_threshold)
2353                                 level->mcFlags |= NISLANDS_SMC_MC_RTT_ENABLE;
2354                 }
2355
2356                 ret = ni_populate_mclk_value(rdev, pl->sclk, pl->mclk,
2357                                              &level->mclk,
2358                                              (level->strobeMode & NISLANDS_SMC_STROBE_ENABLE) != 0,
2359                                              dll_state_on);
2360         } else
2361                 ret = ni_populate_mclk_value(rdev, pl->sclk, pl->mclk, &level->mclk, 1, 1);
2362
2363         if (ret)
2364                 return ret;
2365
2366         ret = ni_populate_voltage_value(rdev, &eg_pi->vddc_voltage_table,
2367                                         pl->vddc, &level->vddc);
2368         if (ret)
2369                 return ret;
2370
2371         ret = ni_get_std_voltage_value(rdev, &level->vddc, &std_vddc);
2372         if (ret)
2373                 return ret;
2374
2375         ni_populate_std_voltage_value(rdev, std_vddc,
2376                                       level->vddc.index, &level->std_vddc);
2377
2378         if (eg_pi->vddci_control) {
2379                 ret = ni_populate_voltage_value(rdev, &eg_pi->vddci_voltage_table,
2380                                                 pl->vddci, &level->vddci);
2381                 if (ret)
2382                         return ret;
2383         }
2384
2385         ni_populate_mvdd_value(rdev, pl->mclk, &level->mvdd);
2386
2387         return ret;
2388 }
2389
2390 static int ni_populate_smc_t(struct radeon_device *rdev,
2391                              struct radeon_ps *radeon_state,
2392                              NISLANDS_SMC_SWSTATE *smc_state)
2393 {
2394         struct rv7xx_power_info *pi = rv770_get_pi(rdev);
2395         struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
2396         struct ni_ps *state = ni_get_ps(radeon_state);
2397         u32 a_t;
2398         u32 t_l, t_h;
2399         u32 high_bsp;
2400         int i, ret;
2401
2402         if (state->performance_level_count >= 9)
2403                 return -EINVAL;
2404
2405         if (state->performance_level_count < 2) {
2406                 a_t = CG_R(0xffff) | CG_L(0);
2407                 smc_state->levels[0].aT = cpu_to_be32(a_t);
2408                 return 0;
2409         }
2410
2411         smc_state->levels[0].aT = cpu_to_be32(0);
2412
2413         for (i = 0; i <= state->performance_level_count - 2; i++) {
2414                 if (eg_pi->uvd_enabled)
2415                         ret = r600_calculate_at(
2416                                 1000 * (i * (eg_pi->smu_uvd_hs ? 2 : 8) + 2),
2417                                 100 * R600_AH_DFLT,
2418                                 state->performance_levels[i + 1].sclk,
2419                                 state->performance_levels[i].sclk,
2420                                 &t_l,
2421                                 &t_h);
2422                 else
2423                         ret = r600_calculate_at(
2424                                 1000 * (i + 1),
2425                                 100 * R600_AH_DFLT,
2426                                 state->performance_levels[i + 1].sclk,
2427                                 state->performance_levels[i].sclk,
2428                                 &t_l,
2429                                 &t_h);
2430
2431                 if (ret) {
2432                         t_h = (i + 1) * 1000 - 50 * R600_AH_DFLT;
2433                         t_l = (i + 1) * 1000 + 50 * R600_AH_DFLT;
2434                 }
2435
2436                 a_t = be32_to_cpu(smc_state->levels[i].aT) & ~CG_R_MASK;
2437                 a_t |= CG_R(t_l * pi->bsp / 20000);
2438                 smc_state->levels[i].aT = cpu_to_be32(a_t);
2439
2440                 high_bsp = (i == state->performance_level_count - 2) ?
2441                         pi->pbsp : pi->bsp;
2442
2443                 a_t = CG_R(0xffff) | CG_L(t_h * high_bsp / 20000);
2444                 smc_state->levels[i + 1].aT = cpu_to_be32(a_t);
2445         }
2446
2447         return 0;
2448 }
2449
2450 static int ni_populate_power_containment_values(struct radeon_device *rdev,
2451                                                 struct radeon_ps *radeon_state,
2452                                                 NISLANDS_SMC_SWSTATE *smc_state)
2453 {
2454         struct rv7xx_power_info *pi = rv770_get_pi(rdev);
2455         struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
2456         struct ni_power_info *ni_pi = ni_get_pi(rdev);
2457         struct ni_ps *state = ni_get_ps(radeon_state);
2458         u32 prev_sclk;
2459         u32 max_sclk;
2460         u32 min_sclk;
2461         int i, ret;
2462         u32 tdp_limit;
2463         u32 near_tdp_limit;
2464         u32 power_boost_limit;
2465         u8 max_ps_percent;
2466
2467         if (ni_pi->enable_power_containment == false)
2468                 return 0;
2469
2470         if (state->performance_level_count == 0)
2471                 return -EINVAL;
2472
2473         if (smc_state->levelCount != state->performance_level_count)
2474                 return -EINVAL;
2475
2476         ret = ni_calculate_adjusted_tdp_limits(rdev,
2477                                                false, /* ??? */
2478                                                rdev->pm.dpm.tdp_adjustment,
2479                                                &tdp_limit,
2480                                                &near_tdp_limit);
2481         if (ret)
2482                 return ret;
2483
2484         power_boost_limit = ni_calculate_power_boost_limit(rdev, radeon_state, near_tdp_limit);
2485
2486         ret = rv770_write_smc_sram_dword(rdev,
2487                                          pi->state_table_start +
2488                                          offsetof(NISLANDS_SMC_STATETABLE, dpm2Params) +
2489                                          offsetof(PP_NIslands_DPM2Parameters, PowerBoostLimit),
2490                                          ni_scale_power_for_smc(power_boost_limit, ni_get_smc_power_scaling_factor(rdev)),
2491                                          pi->sram_end);
2492         if (ret)
2493                 power_boost_limit = 0;
2494
2495         smc_state->levels[0].dpm2.MaxPS = 0;
2496         smc_state->levels[0].dpm2.NearTDPDec = 0;
2497         smc_state->levels[0].dpm2.AboveSafeInc = 0;
2498         smc_state->levels[0].dpm2.BelowSafeInc = 0;
2499         smc_state->levels[0].stateFlags |= power_boost_limit ? PPSMC_STATEFLAG_POWERBOOST : 0;
2500
2501         for (i = 1; i < state->performance_level_count; i++) {
2502                 prev_sclk = state->performance_levels[i-1].sclk;
2503                 max_sclk  = state->performance_levels[i].sclk;
2504                 max_ps_percent = (i != (state->performance_level_count - 1)) ?
2505                         NISLANDS_DPM2_MAXPS_PERCENT_M : NISLANDS_DPM2_MAXPS_PERCENT_H;
2506
2507                 if (max_sclk < prev_sclk)
2508                         return -EINVAL;
2509
2510                 if ((max_ps_percent == 0) || (prev_sclk == max_sclk) || eg_pi->uvd_enabled)
2511                         min_sclk = max_sclk;
2512                 else if (1 == i)
2513                         min_sclk = prev_sclk;
2514                 else
2515                         min_sclk = (prev_sclk * (u32)max_ps_percent) / 100;
2516
2517                 if (min_sclk < state->performance_levels[0].sclk)
2518                         min_sclk = state->performance_levels[0].sclk;
2519
2520                 if (min_sclk == 0)
2521                         return -EINVAL;
2522
2523                 smc_state->levels[i].dpm2.MaxPS =
2524                         (u8)((NISLANDS_DPM2_MAX_PULSE_SKIP * (max_sclk - min_sclk)) / max_sclk);
2525                 smc_state->levels[i].dpm2.NearTDPDec = NISLANDS_DPM2_NEAR_TDP_DEC;
2526                 smc_state->levels[i].dpm2.AboveSafeInc = NISLANDS_DPM2_ABOVE_SAFE_INC;
2527                 smc_state->levels[i].dpm2.BelowSafeInc = NISLANDS_DPM2_BELOW_SAFE_INC;
2528                 smc_state->levels[i].stateFlags |=
2529                         ((i != (state->performance_level_count - 1)) && power_boost_limit) ?
2530                         PPSMC_STATEFLAG_POWERBOOST : 0;
2531         }
2532
2533         return 0;
2534 }
2535
2536 static int ni_populate_sq_ramping_values(struct radeon_device *rdev,
2537                                          struct radeon_ps *radeon_state,
2538                                          NISLANDS_SMC_SWSTATE *smc_state)
2539 {
2540         struct ni_power_info *ni_pi = ni_get_pi(rdev);
2541         struct ni_ps *state = ni_get_ps(radeon_state);
2542         u32 sq_power_throttle;
2543         u32 sq_power_throttle2;
2544         bool enable_sq_ramping = ni_pi->enable_sq_ramping;
2545         int i;
2546
2547         if (state->performance_level_count == 0)
2548                 return -EINVAL;
2549
2550         if (smc_state->levelCount != state->performance_level_count)
2551                 return -EINVAL;
2552
2553         if (rdev->pm.dpm.sq_ramping_threshold == 0)
2554                 return -EINVAL;
2555
2556         if (NISLANDS_DPM2_SQ_RAMP_MAX_POWER > (MAX_POWER_MASK >> MAX_POWER_SHIFT))
2557                 enable_sq_ramping = false;
2558
2559         if (NISLANDS_DPM2_SQ_RAMP_MIN_POWER > (MIN_POWER_MASK >> MIN_POWER_SHIFT))
2560                 enable_sq_ramping = false;
2561
2562         if (NISLANDS_DPM2_SQ_RAMP_MAX_POWER_DELTA > (MAX_POWER_DELTA_MASK >> MAX_POWER_DELTA_SHIFT))
2563                 enable_sq_ramping = false;
2564
2565         if (NISLANDS_DPM2_SQ_RAMP_STI_SIZE > (STI_SIZE_MASK >> STI_SIZE_SHIFT))
2566                 enable_sq_ramping = false;
2567
2568         if (NISLANDS_DPM2_SQ_RAMP_LTI_RATIO > (LTI_RATIO_MASK >> LTI_RATIO_SHIFT))
2569                 enable_sq_ramping = false;
2570
2571         for (i = 0; i < state->performance_level_count; i++) {
2572                 sq_power_throttle  = 0;
2573                 sq_power_throttle2 = 0;
2574
2575                 if ((state->performance_levels[i].sclk >= rdev->pm.dpm.sq_ramping_threshold) &&
2576                     enable_sq_ramping) {
2577                         sq_power_throttle |= MAX_POWER(NISLANDS_DPM2_SQ_RAMP_MAX_POWER);
2578                         sq_power_throttle |= MIN_POWER(NISLANDS_DPM2_SQ_RAMP_MIN_POWER);
2579                         sq_power_throttle2 |= MAX_POWER_DELTA(NISLANDS_DPM2_SQ_RAMP_MAX_POWER_DELTA);
2580                         sq_power_throttle2 |= STI_SIZE(NISLANDS_DPM2_SQ_RAMP_STI_SIZE);
2581                         sq_power_throttle2 |= LTI_RATIO(NISLANDS_DPM2_SQ_RAMP_LTI_RATIO);
2582                 } else {
2583                         sq_power_throttle |= MAX_POWER_MASK | MIN_POWER_MASK;
2584                         sq_power_throttle2 |= MAX_POWER_DELTA_MASK | STI_SIZE_MASK | LTI_RATIO_MASK;
2585                 }
2586
2587                 smc_state->levels[i].SQPowerThrottle   = cpu_to_be32(sq_power_throttle);
2588                 smc_state->levels[i].SQPowerThrottle_2 = cpu_to_be32(sq_power_throttle2);
2589         }
2590
2591         return 0;
2592 }
2593
2594 static int ni_enable_power_containment(struct radeon_device *rdev,
2595                                        struct radeon_ps *radeon_new_state,
2596                                        bool enable)
2597 {
2598         struct ni_power_info *ni_pi = ni_get_pi(rdev);
2599         PPSMC_Result smc_result;
2600         int ret = 0;
2601
2602         if (ni_pi->enable_power_containment) {
2603                 if (enable) {
2604                         if (!r600_is_uvd_state(radeon_new_state->class, radeon_new_state->class2)) {
2605                                 smc_result = rv770_send_msg_to_smc(rdev, PPSMC_TDPClampingActive);
2606                                 if (smc_result != PPSMC_Result_OK) {
2607                                         ret = -EINVAL;
2608                                         ni_pi->pc_enabled = false;
2609                                 } else {
2610                                         ni_pi->pc_enabled = true;
2611                                 }
2612                         }
2613                 } else {
2614                         smc_result = rv770_send_msg_to_smc(rdev, PPSMC_TDPClampingInactive);
2615                         if (smc_result != PPSMC_Result_OK)
2616                                 ret = -EINVAL;
2617                         ni_pi->pc_enabled = false;
2618                 }
2619         }
2620
2621         return ret;
2622 }
2623
2624 static int ni_convert_power_state_to_smc(struct radeon_device *rdev,
2625                                          struct radeon_ps *radeon_state,
2626                                          NISLANDS_SMC_SWSTATE *smc_state)
2627 {
2628         struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
2629         struct ni_power_info *ni_pi = ni_get_pi(rdev);
2630         struct ni_ps *state = ni_get_ps(radeon_state);
2631         int i, ret;
2632         u32 threshold = state->performance_levels[state->performance_level_count - 1].sclk * 100 / 100;
2633
2634         if (!(radeon_state->caps & ATOM_PPLIB_DISALLOW_ON_DC))
2635                 smc_state->flags |= PPSMC_SWSTATE_FLAG_DC;
2636
2637         smc_state->levelCount = 0;
2638
2639         if (state->performance_level_count > NISLANDS_MAX_SMC_PERFORMANCE_LEVELS_PER_SWSTATE)
2640                 return -EINVAL;
2641
2642         for (i = 0; i < state->performance_level_count; i++) {
2643                 ret = ni_convert_power_level_to_smc(rdev, &state->performance_levels[i],
2644                                                     &smc_state->levels[i]);
2645                 smc_state->levels[i].arbRefreshState =
2646                         (u8)(NISLANDS_DRIVER_STATE_ARB_INDEX + i);
2647
2648                 if (ret)
2649                         return ret;
2650
2651                 if (ni_pi->enable_power_containment)
2652                         smc_state->levels[i].displayWatermark =
2653                                 (state->performance_levels[i].sclk < threshold) ?
2654                                 PPSMC_DISPLAY_WATERMARK_LOW : PPSMC_DISPLAY_WATERMARK_HIGH;
2655                 else
2656                         smc_state->levels[i].displayWatermark = (i < 2) ?
2657                                 PPSMC_DISPLAY_WATERMARK_LOW : PPSMC_DISPLAY_WATERMARK_HIGH;
2658
2659                 if (eg_pi->dynamic_ac_timing)
2660                         smc_state->levels[i].ACIndex = NISLANDS_MCREGISTERTABLE_FIRST_DRIVERSTATE_SLOT + i;
2661                 else
2662                         smc_state->levels[i].ACIndex = 0;
2663
2664                 smc_state->levelCount++;
2665         }
2666
2667         rv770_write_smc_soft_register(rdev, NI_SMC_SOFT_REGISTER_watermark_threshold,
2668                                       cpu_to_be32(threshold / 512));
2669
2670         ni_populate_smc_sp(rdev, radeon_state, smc_state);
2671
2672         ret = ni_populate_power_containment_values(rdev, radeon_state, smc_state);
2673         if (ret)
2674                 ni_pi->enable_power_containment = false;
2675
2676         ret = ni_populate_sq_ramping_values(rdev, radeon_state, smc_state);
2677         if (ret)
2678                 ni_pi->enable_sq_ramping = false;
2679
2680         return ni_populate_smc_t(rdev, radeon_state, smc_state);
2681 }
2682
2683 static int ni_upload_sw_state(struct radeon_device *rdev,
2684                               struct radeon_ps *radeon_new_state)
2685 {
2686         struct rv7xx_power_info *pi = rv770_get_pi(rdev);
2687         u16 address = pi->state_table_start +
2688                 offsetof(NISLANDS_SMC_STATETABLE, driverState);
2689         NISLANDS_SMC_SWSTATE *smc_state;
2690         size_t state_size = struct_size(smc_state, levels,
2691                         NISLANDS_MAX_SMC_PERFORMANCE_LEVELS_PER_SWSTATE);
2692         int ret;
2693
2694         smc_state = kzalloc(state_size, GFP_KERNEL);
2695         if (smc_state == NULL)
2696                 return -ENOMEM;
2697
2698         ret = ni_convert_power_state_to_smc(rdev, radeon_new_state, smc_state);
2699         if (ret)
2700                 goto done;
2701
2702         ret = rv770_copy_bytes_to_smc(rdev, address, (u8 *)smc_state, state_size, pi->sram_end);
2703
2704 done:
2705         kfree(smc_state);
2706
2707         return ret;
2708 }
2709
2710 static int ni_set_mc_special_registers(struct radeon_device *rdev,
2711                                        struct ni_mc_reg_table *table)
2712 {
2713         struct rv7xx_power_info *pi = rv770_get_pi(rdev);
2714         u8 i, j, k;
2715         u32 temp_reg;
2716
2717         for (i = 0, j = table->last; i < table->last; i++) {
2718                 switch (table->mc_reg_address[i].s1) {
2719                 case MC_SEQ_MISC1 >> 2:
2720                         if (j >= SMC_NISLANDS_MC_REGISTER_ARRAY_SIZE)
2721                                 return -EINVAL;
2722                         temp_reg = RREG32(MC_PMG_CMD_EMRS);
2723                         table->mc_reg_address[j].s1 = MC_PMG_CMD_EMRS >> 2;
2724                         table->mc_reg_address[j].s0 = MC_SEQ_PMG_CMD_EMRS_LP >> 2;
2725                         for (k = 0; k < table->num_entries; k++)
2726                                 table->mc_reg_table_entry[k].mc_data[j] =
2727                                         ((temp_reg & 0xffff0000)) |
2728                                         ((table->mc_reg_table_entry[k].mc_data[i] & 0xffff0000) >> 16);
2729                         j++;
2730                         if (j >= SMC_NISLANDS_MC_REGISTER_ARRAY_SIZE)
2731                                 return -EINVAL;
2732
2733                         temp_reg = RREG32(MC_PMG_CMD_MRS);
2734                         table->mc_reg_address[j].s1 = MC_PMG_CMD_MRS >> 2;
2735                         table->mc_reg_address[j].s0 = MC_SEQ_PMG_CMD_MRS_LP >> 2;
2736                         for(k = 0; k < table->num_entries; k++) {
2737                                 table->mc_reg_table_entry[k].mc_data[j] =
2738                                         (temp_reg & 0xffff0000) |
2739                                         (table->mc_reg_table_entry[k].mc_data[i] & 0x0000ffff);
2740                                 if (!pi->mem_gddr5)
2741                                         table->mc_reg_table_entry[k].mc_data[j] |= 0x100;
2742                         }
2743                         j++;
2744                         if (j > SMC_NISLANDS_MC_REGISTER_ARRAY_SIZE)
2745                                 return -EINVAL;
2746                         break;
2747                 case MC_SEQ_RESERVE_M >> 2:
2748                         temp_reg = RREG32(MC_PMG_CMD_MRS1);
2749                         table->mc_reg_address[j].s1 = MC_PMG_CMD_MRS1 >> 2;
2750                         table->mc_reg_address[j].s0 = MC_SEQ_PMG_CMD_MRS1_LP >> 2;
2751                         for (k = 0; k < table->num_entries; k++)
2752                                 table->mc_reg_table_entry[k].mc_data[j] =
2753                                         (temp_reg & 0xffff0000) |
2754                                         (table->mc_reg_table_entry[k].mc_data[i] & 0x0000ffff);
2755                         j++;
2756                         if (j > SMC_NISLANDS_MC_REGISTER_ARRAY_SIZE)
2757                                 return -EINVAL;
2758                         break;
2759                 default:
2760                         break;
2761                 }
2762         }
2763
2764         table->last = j;
2765
2766         return 0;
2767 }
2768
2769 static bool ni_check_s0_mc_reg_index(u16 in_reg, u16 *out_reg)
2770 {
2771         bool result = true;
2772
2773         switch (in_reg) {
2774         case  MC_SEQ_RAS_TIMING >> 2:
2775                 *out_reg = MC_SEQ_RAS_TIMING_LP >> 2;
2776                 break;
2777         case MC_SEQ_CAS_TIMING >> 2:
2778                 *out_reg = MC_SEQ_CAS_TIMING_LP >> 2;
2779                 break;
2780         case MC_SEQ_MISC_TIMING >> 2:
2781                 *out_reg = MC_SEQ_MISC_TIMING_LP >> 2;
2782                 break;
2783         case MC_SEQ_MISC_TIMING2 >> 2:
2784                 *out_reg = MC_SEQ_MISC_TIMING2_LP >> 2;
2785                 break;
2786         case MC_SEQ_RD_CTL_D0 >> 2:
2787                 *out_reg = MC_SEQ_RD_CTL_D0_LP >> 2;
2788                 break;
2789         case MC_SEQ_RD_CTL_D1 >> 2:
2790                 *out_reg = MC_SEQ_RD_CTL_D1_LP >> 2;
2791                 break;
2792         case MC_SEQ_WR_CTL_D0 >> 2:
2793                 *out_reg = MC_SEQ_WR_CTL_D0_LP >> 2;
2794                 break;
2795         case MC_SEQ_WR_CTL_D1 >> 2:
2796                 *out_reg = MC_SEQ_WR_CTL_D1_LP >> 2;
2797                 break;
2798         case MC_PMG_CMD_EMRS >> 2:
2799                 *out_reg = MC_SEQ_PMG_CMD_EMRS_LP >> 2;
2800                 break;
2801         case MC_PMG_CMD_MRS >> 2:
2802                 *out_reg = MC_SEQ_PMG_CMD_MRS_LP >> 2;
2803                 break;
2804         case MC_PMG_CMD_MRS1 >> 2:
2805                 *out_reg = MC_SEQ_PMG_CMD_MRS1_LP >> 2;
2806                 break;
2807         case MC_SEQ_PMG_TIMING >> 2:
2808                 *out_reg = MC_SEQ_PMG_TIMING_LP >> 2;
2809                 break;
2810         case MC_PMG_CMD_MRS2 >> 2:
2811                 *out_reg = MC_SEQ_PMG_CMD_MRS2_LP >> 2;
2812                 break;
2813         default:
2814                 result = false;
2815                 break;
2816         }
2817
2818         return result;
2819 }
2820
2821 static void ni_set_valid_flag(struct ni_mc_reg_table *table)
2822 {
2823         u8 i, j;
2824
2825         for (i = 0; i < table->last; i++) {
2826                 for (j = 1; j < table->num_entries; j++) {
2827                         if (table->mc_reg_table_entry[j-1].mc_data[i] != table->mc_reg_table_entry[j].mc_data[i]) {
2828                                 table->valid_flag |= 1 << i;
2829                                 break;
2830                         }
2831                 }
2832         }
2833 }
2834
2835 static void ni_set_s0_mc_reg_index(struct ni_mc_reg_table *table)
2836 {
2837         u32 i;
2838         u16 address;
2839
2840         for (i = 0; i < table->last; i++)
2841                 table->mc_reg_address[i].s0 =
2842                         ni_check_s0_mc_reg_index(table->mc_reg_address[i].s1, &address) ?
2843                         address : table->mc_reg_address[i].s1;
2844 }
2845
2846 static int ni_copy_vbios_mc_reg_table(struct atom_mc_reg_table *table,
2847                                       struct ni_mc_reg_table *ni_table)
2848 {
2849         u8 i, j;
2850
2851         if (table->last > SMC_NISLANDS_MC_REGISTER_ARRAY_SIZE)
2852                 return -EINVAL;
2853         if (table->num_entries > MAX_AC_TIMING_ENTRIES)
2854                 return -EINVAL;
2855
2856         for (i = 0; i < table->last; i++)
2857                 ni_table->mc_reg_address[i].s1 = table->mc_reg_address[i].s1;
2858         ni_table->last = table->last;
2859
2860         for (i = 0; i < table->num_entries; i++) {
2861                 ni_table->mc_reg_table_entry[i].mclk_max =
2862                         table->mc_reg_table_entry[i].mclk_max;
2863                 for (j = 0; j < table->last; j++)
2864                         ni_table->mc_reg_table_entry[i].mc_data[j] =
2865                                 table->mc_reg_table_entry[i].mc_data[j];
2866         }
2867         ni_table->num_entries = table->num_entries;
2868
2869         return 0;
2870 }
2871
2872 static int ni_initialize_mc_reg_table(struct radeon_device *rdev)
2873 {
2874         struct ni_power_info *ni_pi = ni_get_pi(rdev);
2875         int ret;
2876         struct atom_mc_reg_table *table;
2877         struct ni_mc_reg_table *ni_table = &ni_pi->mc_reg_table;
2878         u8 module_index = rv770_get_memory_module_index(rdev);
2879
2880         table = kzalloc(sizeof(struct atom_mc_reg_table), GFP_KERNEL);
2881         if (!table)
2882                 return -ENOMEM;
2883
2884         WREG32(MC_SEQ_RAS_TIMING_LP, RREG32(MC_SEQ_RAS_TIMING));
2885         WREG32(MC_SEQ_CAS_TIMING_LP, RREG32(MC_SEQ_CAS_TIMING));
2886         WREG32(MC_SEQ_MISC_TIMING_LP, RREG32(MC_SEQ_MISC_TIMING));
2887         WREG32(MC_SEQ_MISC_TIMING2_LP, RREG32(MC_SEQ_MISC_TIMING2));
2888         WREG32(MC_SEQ_PMG_CMD_EMRS_LP, RREG32(MC_PMG_CMD_EMRS));
2889         WREG32(MC_SEQ_PMG_CMD_MRS_LP, RREG32(MC_PMG_CMD_MRS));
2890         WREG32(MC_SEQ_PMG_CMD_MRS1_LP, RREG32(MC_PMG_CMD_MRS1));
2891         WREG32(MC_SEQ_WR_CTL_D0_LP, RREG32(MC_SEQ_WR_CTL_D0));
2892         WREG32(MC_SEQ_WR_CTL_D1_LP, RREG32(MC_SEQ_WR_CTL_D1));
2893         WREG32(MC_SEQ_RD_CTL_D0_LP, RREG32(MC_SEQ_RD_CTL_D0));
2894         WREG32(MC_SEQ_RD_CTL_D1_LP, RREG32(MC_SEQ_RD_CTL_D1));
2895         WREG32(MC_SEQ_PMG_TIMING_LP, RREG32(MC_SEQ_PMG_TIMING));
2896         WREG32(MC_SEQ_PMG_CMD_MRS2_LP, RREG32(MC_PMG_CMD_MRS2));
2897
2898         ret = radeon_atom_init_mc_reg_table(rdev, module_index, table);
2899
2900         if (ret)
2901                 goto init_mc_done;
2902
2903         ret = ni_copy_vbios_mc_reg_table(table, ni_table);
2904
2905         if (ret)
2906                 goto init_mc_done;
2907
2908         ni_set_s0_mc_reg_index(ni_table);
2909
2910         ret = ni_set_mc_special_registers(rdev, ni_table);
2911
2912         if (ret)
2913                 goto init_mc_done;
2914
2915         ni_set_valid_flag(ni_table);
2916
2917 init_mc_done:
2918         kfree(table);
2919
2920         return ret;
2921 }
2922
2923 static void ni_populate_mc_reg_addresses(struct radeon_device *rdev,
2924                                          SMC_NIslands_MCRegisters *mc_reg_table)
2925 {
2926         struct ni_power_info *ni_pi = ni_get_pi(rdev);
2927         u32 i, j;
2928
2929         for (i = 0, j = 0; j < ni_pi->mc_reg_table.last; j++) {
2930                 if (ni_pi->mc_reg_table.valid_flag & (1 << j)) {
2931                         if (i >= SMC_NISLANDS_MC_REGISTER_ARRAY_SIZE)
2932                                 break;
2933                         mc_reg_table->address[i].s0 =
2934                                 cpu_to_be16(ni_pi->mc_reg_table.mc_reg_address[j].s0);
2935                         mc_reg_table->address[i].s1 =
2936                                 cpu_to_be16(ni_pi->mc_reg_table.mc_reg_address[j].s1);
2937                         i++;
2938                 }
2939         }
2940         mc_reg_table->last = (u8)i;
2941 }
2942
2943
2944 static void ni_convert_mc_registers(struct ni_mc_reg_entry *entry,
2945                                     SMC_NIslands_MCRegisterSet *data,
2946                                     u32 num_entries, u32 valid_flag)
2947 {
2948         u32 i, j;
2949
2950         for (i = 0, j = 0; j < num_entries; j++) {
2951                 if (valid_flag & (1 << j)) {
2952                         data->value[i] = cpu_to_be32(entry->mc_data[j]);
2953                         i++;
2954                 }
2955         }
2956 }
2957
2958 static void ni_convert_mc_reg_table_entry_to_smc(struct radeon_device *rdev,
2959                                                  struct rv7xx_pl *pl,
2960                                                  SMC_NIslands_MCRegisterSet *mc_reg_table_data)
2961 {
2962         struct ni_power_info *ni_pi = ni_get_pi(rdev);
2963         u32 i = 0;
2964
2965         for (i = 0; i < ni_pi->mc_reg_table.num_entries; i++) {
2966                 if (pl->mclk <= ni_pi->mc_reg_table.mc_reg_table_entry[i].mclk_max)
2967                         break;
2968         }
2969
2970         if ((i == ni_pi->mc_reg_table.num_entries) && (i > 0))
2971                 --i;
2972
2973         ni_convert_mc_registers(&ni_pi->mc_reg_table.mc_reg_table_entry[i],
2974                                 mc_reg_table_data,
2975                                 ni_pi->mc_reg_table.last,
2976                                 ni_pi->mc_reg_table.valid_flag);
2977 }
2978
2979 static void ni_convert_mc_reg_table_to_smc(struct radeon_device *rdev,
2980                                            struct radeon_ps *radeon_state,
2981                                            SMC_NIslands_MCRegisters *mc_reg_table)
2982 {
2983         struct ni_ps *state = ni_get_ps(radeon_state);
2984         int i;
2985
2986         for (i = 0; i < state->performance_level_count; i++) {
2987                 ni_convert_mc_reg_table_entry_to_smc(rdev,
2988                                                      &state->performance_levels[i],
2989                                                      &mc_reg_table->data[NISLANDS_MCREGISTERTABLE_FIRST_DRIVERSTATE_SLOT + i]);
2990         }
2991 }
2992
2993 static int ni_populate_mc_reg_table(struct radeon_device *rdev,
2994                                     struct radeon_ps *radeon_boot_state)
2995 {
2996         struct rv7xx_power_info *pi = rv770_get_pi(rdev);
2997         struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
2998         struct ni_power_info *ni_pi = ni_get_pi(rdev);
2999         struct ni_ps *boot_state = ni_get_ps(radeon_boot_state);
3000         SMC_NIslands_MCRegisters *mc_reg_table = &ni_pi->smc_mc_reg_table;
3001
3002         memset(mc_reg_table, 0, sizeof(SMC_NIslands_MCRegisters));
3003
3004         rv770_write_smc_soft_register(rdev, NI_SMC_SOFT_REGISTER_seq_index, 1);
3005
3006         ni_populate_mc_reg_addresses(rdev, mc_reg_table);
3007
3008         ni_convert_mc_reg_table_entry_to_smc(rdev, &boot_state->performance_levels[0],
3009                                              &mc_reg_table->data[0]);
3010
3011         ni_convert_mc_registers(&ni_pi->mc_reg_table.mc_reg_table_entry[0],
3012                                 &mc_reg_table->data[1],
3013                                 ni_pi->mc_reg_table.last,
3014                                 ni_pi->mc_reg_table.valid_flag);
3015
3016         ni_convert_mc_reg_table_to_smc(rdev, radeon_boot_state, mc_reg_table);
3017
3018         return rv770_copy_bytes_to_smc(rdev, eg_pi->mc_reg_table_start,
3019                                        (u8 *)mc_reg_table,
3020                                        sizeof(SMC_NIslands_MCRegisters),
3021                                        pi->sram_end);
3022 }
3023
3024 static int ni_upload_mc_reg_table(struct radeon_device *rdev,
3025                                   struct radeon_ps *radeon_new_state)
3026 {
3027         struct rv7xx_power_info *pi = rv770_get_pi(rdev);
3028         struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
3029         struct ni_power_info *ni_pi = ni_get_pi(rdev);
3030         struct ni_ps *ni_new_state = ni_get_ps(radeon_new_state);
3031         SMC_NIslands_MCRegisters *mc_reg_table = &ni_pi->smc_mc_reg_table;
3032         u16 address;
3033
3034         memset(mc_reg_table, 0, sizeof(SMC_NIslands_MCRegisters));
3035
3036         ni_convert_mc_reg_table_to_smc(rdev, radeon_new_state, mc_reg_table);
3037
3038         address = eg_pi->mc_reg_table_start +
3039                 (u16)offsetof(SMC_NIslands_MCRegisters, data[NISLANDS_MCREGISTERTABLE_FIRST_DRIVERSTATE_SLOT]);
3040
3041         return rv770_copy_bytes_to_smc(rdev, address,
3042                                        (u8 *)&mc_reg_table->data[NISLANDS_MCREGISTERTABLE_FIRST_DRIVERSTATE_SLOT],
3043                                        sizeof(SMC_NIslands_MCRegisterSet) * ni_new_state->performance_level_count,
3044                                        pi->sram_end);
3045 }
3046
3047 static int ni_init_driver_calculated_leakage_table(struct radeon_device *rdev,
3048                                                    PP_NIslands_CACTABLES *cac_tables)
3049 {
3050         struct ni_power_info *ni_pi = ni_get_pi(rdev);
3051         struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
3052         u32 leakage = 0;
3053         unsigned int i, j, table_size;
3054         s32 t;
3055         u32 smc_leakage, max_leakage = 0;
3056         u32 scaling_factor;
3057
3058         table_size = eg_pi->vddc_voltage_table.count;
3059
3060         if (SMC_NISLANDS_LKGE_LUT_NUM_OF_VOLT_ENTRIES < table_size)
3061                 table_size = SMC_NISLANDS_LKGE_LUT_NUM_OF_VOLT_ENTRIES;
3062
3063         scaling_factor = ni_get_smc_power_scaling_factor(rdev);
3064
3065         for (i = 0; i < SMC_NISLANDS_LKGE_LUT_NUM_OF_TEMP_ENTRIES; i++) {
3066                 for (j = 0; j < table_size; j++) {
3067                         t = (1000 * ((i + 1) * 8));
3068
3069                         if (t < ni_pi->cac_data.leakage_minimum_temperature)
3070                                 t = ni_pi->cac_data.leakage_minimum_temperature;
3071
3072                         ni_calculate_leakage_for_v_and_t(rdev,
3073                                                          &ni_pi->cac_data.leakage_coefficients,
3074                                                          eg_pi->vddc_voltage_table.entries[j].value,
3075                                                          t,
3076                                                          ni_pi->cac_data.i_leakage,
3077                                                          &leakage);
3078
3079                         smc_leakage = ni_scale_power_for_smc(leakage, scaling_factor) / 1000;
3080                         if (smc_leakage > max_leakage)
3081                                 max_leakage = smc_leakage;
3082
3083                         cac_tables->cac_lkge_lut[i][j] = cpu_to_be32(smc_leakage);
3084                 }
3085         }
3086
3087         for (j = table_size; j < SMC_NISLANDS_LKGE_LUT_NUM_OF_VOLT_ENTRIES; j++) {
3088                 for (i = 0; i < SMC_NISLANDS_LKGE_LUT_NUM_OF_TEMP_ENTRIES; i++)
3089                         cac_tables->cac_lkge_lut[i][j] = cpu_to_be32(max_leakage);
3090         }
3091         return 0;
3092 }
3093
3094 static int ni_init_simplified_leakage_table(struct radeon_device *rdev,
3095                                             PP_NIslands_CACTABLES *cac_tables)
3096 {
3097         struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
3098         struct radeon_cac_leakage_table *leakage_table =
3099                 &rdev->pm.dpm.dyn_state.cac_leakage_table;
3100         u32 i, j, table_size;
3101         u32 smc_leakage, max_leakage = 0;
3102         u32 scaling_factor;
3103
3104         if (!leakage_table)
3105                 return -EINVAL;
3106
3107         table_size = leakage_table->count;
3108
3109         if (eg_pi->vddc_voltage_table.count != table_size)
3110                 table_size = (eg_pi->vddc_voltage_table.count < leakage_table->count) ?
3111                         eg_pi->vddc_voltage_table.count : leakage_table->count;
3112
3113         if (SMC_NISLANDS_LKGE_LUT_NUM_OF_VOLT_ENTRIES < table_size)
3114                 table_size = SMC_NISLANDS_LKGE_LUT_NUM_OF_VOLT_ENTRIES;
3115
3116         if (table_size == 0)
3117                 return -EINVAL;
3118
3119         scaling_factor = ni_get_smc_power_scaling_factor(rdev);
3120
3121         for (j = 0; j < table_size; j++) {
3122                 smc_leakage = leakage_table->entries[j].leakage;
3123
3124                 if (smc_leakage > max_leakage)
3125                         max_leakage = smc_leakage;
3126
3127                 for (i = 0; i < SMC_NISLANDS_LKGE_LUT_NUM_OF_TEMP_ENTRIES; i++)
3128                         cac_tables->cac_lkge_lut[i][j] =
3129                                 cpu_to_be32(ni_scale_power_for_smc(smc_leakage, scaling_factor));
3130         }
3131
3132         for (j = table_size; j < SMC_NISLANDS_LKGE_LUT_NUM_OF_VOLT_ENTRIES; j++) {
3133                 for (i = 0; i < SMC_NISLANDS_LKGE_LUT_NUM_OF_TEMP_ENTRIES; i++)
3134                         cac_tables->cac_lkge_lut[i][j] =
3135                                 cpu_to_be32(ni_scale_power_for_smc(max_leakage, scaling_factor));
3136         }
3137         return 0;
3138 }
3139
3140 static int ni_initialize_smc_cac_tables(struct radeon_device *rdev)
3141 {
3142         struct rv7xx_power_info *pi = rv770_get_pi(rdev);
3143         struct ni_power_info *ni_pi = ni_get_pi(rdev);
3144         PP_NIslands_CACTABLES *cac_tables = NULL;
3145         int i, ret;
3146         u32 reg;
3147
3148         if (ni_pi->enable_cac == false)
3149                 return 0;
3150
3151         cac_tables = kzalloc(sizeof(PP_NIslands_CACTABLES), GFP_KERNEL);
3152         if (!cac_tables)
3153                 return -ENOMEM;
3154
3155         reg = RREG32(CG_CAC_CTRL) & ~(TID_CNT_MASK | TID_UNIT_MASK);
3156         reg |= (TID_CNT(ni_pi->cac_weights->tid_cnt) |
3157                 TID_UNIT(ni_pi->cac_weights->tid_unit));
3158         WREG32(CG_CAC_CTRL, reg);
3159
3160         for (i = 0; i < NISLANDS_DCCAC_MAX_LEVELS; i++)
3161                 ni_pi->dc_cac_table[i] = ni_pi->cac_weights->dc_cac[i];
3162
3163         for (i = 0; i < SMC_NISLANDS_BIF_LUT_NUM_OF_ENTRIES; i++)
3164                 cac_tables->cac_bif_lut[i] = ni_pi->cac_weights->pcie_cac[i];
3165
3166         ni_pi->cac_data.i_leakage = rdev->pm.dpm.cac_leakage;
3167         ni_pi->cac_data.pwr_const = 0;
3168         ni_pi->cac_data.dc_cac_value = ni_pi->dc_cac_table[NISLANDS_DCCAC_LEVEL_0];
3169         ni_pi->cac_data.bif_cac_value = 0;
3170         ni_pi->cac_data.mc_wr_weight = ni_pi->cac_weights->mc_write_weight;
3171         ni_pi->cac_data.mc_rd_weight = ni_pi->cac_weights->mc_read_weight;
3172         ni_pi->cac_data.allow_ovrflw = 0;
3173         ni_pi->cac_data.l2num_win_tdp = ni_pi->lta_window_size;
3174         ni_pi->cac_data.num_win_tdp = 0;
3175         ni_pi->cac_data.lts_truncate_n = ni_pi->lts_truncate;
3176
3177         if (ni_pi->driver_calculate_cac_leakage)
3178                 ret = ni_init_driver_calculated_leakage_table(rdev, cac_tables);
3179         else
3180                 ret = ni_init_simplified_leakage_table(rdev, cac_tables);
3181
3182         if (ret)
3183                 goto done_free;
3184
3185         cac_tables->pwr_const      = cpu_to_be32(ni_pi->cac_data.pwr_const);
3186         cac_tables->dc_cacValue    = cpu_to_be32(ni_pi->cac_data.dc_cac_value);
3187         cac_tables->bif_cacValue   = cpu_to_be32(ni_pi->cac_data.bif_cac_value);
3188         cac_tables->AllowOvrflw    = ni_pi->cac_data.allow_ovrflw;
3189         cac_tables->MCWrWeight     = ni_pi->cac_data.mc_wr_weight;
3190         cac_tables->MCRdWeight     = ni_pi->cac_data.mc_rd_weight;
3191         cac_tables->numWin_TDP     = ni_pi->cac_data.num_win_tdp;
3192         cac_tables->l2numWin_TDP   = ni_pi->cac_data.l2num_win_tdp;
3193         cac_tables->lts_truncate_n = ni_pi->cac_data.lts_truncate_n;
3194
3195         ret = rv770_copy_bytes_to_smc(rdev, ni_pi->cac_table_start, (u8 *)cac_tables,
3196                                       sizeof(PP_NIslands_CACTABLES), pi->sram_end);
3197
3198 done_free:
3199         if (ret) {
3200                 ni_pi->enable_cac = false;
3201                 ni_pi->enable_power_containment = false;
3202         }
3203
3204         kfree(cac_tables);
3205
3206         return 0;
3207 }
3208
3209 static int ni_initialize_hardware_cac_manager(struct radeon_device *rdev)
3210 {
3211         struct ni_power_info *ni_pi = ni_get_pi(rdev);
3212         u32 reg;
3213
3214         if (!ni_pi->enable_cac ||
3215             !ni_pi->cac_configuration_required)
3216                 return 0;
3217
3218         if (ni_pi->cac_weights == NULL)
3219                 return -EINVAL;
3220
3221         reg = RREG32_CG(CG_CAC_REGION_1_WEIGHT_0) & ~(WEIGHT_TCP_SIG0_MASK |
3222                                                       WEIGHT_TCP_SIG1_MASK |
3223                                                       WEIGHT_TA_SIG_MASK);
3224         reg |= (WEIGHT_TCP_SIG0(ni_pi->cac_weights->weight_tcp_sig0) |
3225                 WEIGHT_TCP_SIG1(ni_pi->cac_weights->weight_tcp_sig1) |
3226                 WEIGHT_TA_SIG(ni_pi->cac_weights->weight_ta_sig));
3227         WREG32_CG(CG_CAC_REGION_1_WEIGHT_0, reg);
3228
3229         reg = RREG32_CG(CG_CAC_REGION_1_WEIGHT_1) & ~(WEIGHT_TCC_EN0_MASK |
3230                                                       WEIGHT_TCC_EN1_MASK |
3231                                                       WEIGHT_TCC_EN2_MASK);
3232         reg |= (WEIGHT_TCC_EN0(ni_pi->cac_weights->weight_tcc_en0) |
3233                 WEIGHT_TCC_EN1(ni_pi->cac_weights->weight_tcc_en1) |
3234                 WEIGHT_TCC_EN2(ni_pi->cac_weights->weight_tcc_en2));
3235         WREG32_CG(CG_CAC_REGION_1_WEIGHT_1, reg);
3236
3237         reg = RREG32_CG(CG_CAC_REGION_2_WEIGHT_0) & ~(WEIGHT_CB_EN0_MASK |
3238                                                       WEIGHT_CB_EN1_MASK |
3239                                                       WEIGHT_CB_EN2_MASK |
3240                                                       WEIGHT_CB_EN3_MASK);
3241         reg |= (WEIGHT_CB_EN0(ni_pi->cac_weights->weight_cb_en0) |
3242                 WEIGHT_CB_EN1(ni_pi->cac_weights->weight_cb_en1) |
3243                 WEIGHT_CB_EN2(ni_pi->cac_weights->weight_cb_en2) |
3244                 WEIGHT_CB_EN3(ni_pi->cac_weights->weight_cb_en3));
3245         WREG32_CG(CG_CAC_REGION_2_WEIGHT_0, reg);
3246
3247         reg = RREG32_CG(CG_CAC_REGION_2_WEIGHT_1) & ~(WEIGHT_DB_SIG0_MASK |
3248                                                       WEIGHT_DB_SIG1_MASK |
3249                                                       WEIGHT_DB_SIG2_MASK |
3250                                                       WEIGHT_DB_SIG3_MASK);
3251         reg |= (WEIGHT_DB_SIG0(ni_pi->cac_weights->weight_db_sig0) |
3252                 WEIGHT_DB_SIG1(ni_pi->cac_weights->weight_db_sig1) |
3253                 WEIGHT_DB_SIG2(ni_pi->cac_weights->weight_db_sig2) |
3254                 WEIGHT_DB_SIG3(ni_pi->cac_weights->weight_db_sig3));
3255         WREG32_CG(CG_CAC_REGION_2_WEIGHT_1, reg);
3256
3257         reg = RREG32_CG(CG_CAC_REGION_2_WEIGHT_2) & ~(WEIGHT_SXM_SIG0_MASK |
3258                                                       WEIGHT_SXM_SIG1_MASK |
3259                                                       WEIGHT_SXM_SIG2_MASK |
3260                                                       WEIGHT_SXS_SIG0_MASK |
3261                                                       WEIGHT_SXS_SIG1_MASK);
3262         reg |= (WEIGHT_SXM_SIG0(ni_pi->cac_weights->weight_sxm_sig0) |
3263                 WEIGHT_SXM_SIG1(ni_pi->cac_weights->weight_sxm_sig1) |
3264                 WEIGHT_SXM_SIG2(ni_pi->cac_weights->weight_sxm_sig2) |
3265                 WEIGHT_SXS_SIG0(ni_pi->cac_weights->weight_sxs_sig0) |
3266                 WEIGHT_SXS_SIG1(ni_pi->cac_weights->weight_sxs_sig1));
3267         WREG32_CG(CG_CAC_REGION_2_WEIGHT_2, reg);
3268
3269         reg = RREG32_CG(CG_CAC_REGION_3_WEIGHT_0) & ~(WEIGHT_XBR_0_MASK |
3270                                                       WEIGHT_XBR_1_MASK |
3271                                                       WEIGHT_XBR_2_MASK |
3272                                                       WEIGHT_SPI_SIG0_MASK);
3273         reg |= (WEIGHT_XBR_0(ni_pi->cac_weights->weight_xbr_0) |
3274                 WEIGHT_XBR_1(ni_pi->cac_weights->weight_xbr_1) |
3275                 WEIGHT_XBR_2(ni_pi->cac_weights->weight_xbr_2) |
3276                 WEIGHT_SPI_SIG0(ni_pi->cac_weights->weight_spi_sig0));
3277         WREG32_CG(CG_CAC_REGION_3_WEIGHT_0, reg);
3278
3279         reg = RREG32_CG(CG_CAC_REGION_3_WEIGHT_1) & ~(WEIGHT_SPI_SIG1_MASK |
3280                                                       WEIGHT_SPI_SIG2_MASK |
3281                                                       WEIGHT_SPI_SIG3_MASK |
3282                                                       WEIGHT_SPI_SIG4_MASK |
3283                                                       WEIGHT_SPI_SIG5_MASK);
3284         reg |= (WEIGHT_SPI_SIG1(ni_pi->cac_weights->weight_spi_sig1) |
3285                 WEIGHT_SPI_SIG2(ni_pi->cac_weights->weight_spi_sig2) |
3286                 WEIGHT_SPI_SIG3(ni_pi->cac_weights->weight_spi_sig3) |
3287                 WEIGHT_SPI_SIG4(ni_pi->cac_weights->weight_spi_sig4) |
3288                 WEIGHT_SPI_SIG5(ni_pi->cac_weights->weight_spi_sig5));
3289         WREG32_CG(CG_CAC_REGION_3_WEIGHT_1, reg);
3290
3291         reg = RREG32_CG(CG_CAC_REGION_4_WEIGHT_0) & ~(WEIGHT_LDS_SIG0_MASK |
3292                                                       WEIGHT_LDS_SIG1_MASK |
3293                                                       WEIGHT_SC_MASK);
3294         reg |= (WEIGHT_LDS_SIG0(ni_pi->cac_weights->weight_lds_sig0) |
3295                 WEIGHT_LDS_SIG1(ni_pi->cac_weights->weight_lds_sig1) |
3296                 WEIGHT_SC(ni_pi->cac_weights->weight_sc));
3297         WREG32_CG(CG_CAC_REGION_4_WEIGHT_0, reg);
3298
3299         reg = RREG32_CG(CG_CAC_REGION_4_WEIGHT_1) & ~(WEIGHT_BIF_MASK |
3300                                                       WEIGHT_CP_MASK |
3301                                                       WEIGHT_PA_SIG0_MASK |
3302                                                       WEIGHT_PA_SIG1_MASK |
3303                                                       WEIGHT_VGT_SIG0_MASK);
3304         reg |= (WEIGHT_BIF(ni_pi->cac_weights->weight_bif) |
3305                 WEIGHT_CP(ni_pi->cac_weights->weight_cp) |
3306                 WEIGHT_PA_SIG0(ni_pi->cac_weights->weight_pa_sig0) |
3307                 WEIGHT_PA_SIG1(ni_pi->cac_weights->weight_pa_sig1) |
3308                 WEIGHT_VGT_SIG0(ni_pi->cac_weights->weight_vgt_sig0));
3309         WREG32_CG(CG_CAC_REGION_4_WEIGHT_1, reg);
3310
3311         reg = RREG32_CG(CG_CAC_REGION_4_WEIGHT_2) & ~(WEIGHT_VGT_SIG1_MASK |
3312                                                       WEIGHT_VGT_SIG2_MASK |
3313                                                       WEIGHT_DC_SIG0_MASK |
3314                                                       WEIGHT_DC_SIG1_MASK |
3315                                                       WEIGHT_DC_SIG2_MASK);
3316         reg |= (WEIGHT_VGT_SIG1(ni_pi->cac_weights->weight_vgt_sig1) |
3317                 WEIGHT_VGT_SIG2(ni_pi->cac_weights->weight_vgt_sig2) |
3318                 WEIGHT_DC_SIG0(ni_pi->cac_weights->weight_dc_sig0) |
3319                 WEIGHT_DC_SIG1(ni_pi->cac_weights->weight_dc_sig1) |
3320                 WEIGHT_DC_SIG2(ni_pi->cac_weights->weight_dc_sig2));
3321         WREG32_CG(CG_CAC_REGION_4_WEIGHT_2, reg);
3322
3323         reg = RREG32_CG(CG_CAC_REGION_4_WEIGHT_3) & ~(WEIGHT_DC_SIG3_MASK |
3324                                                       WEIGHT_UVD_SIG0_MASK |
3325                                                       WEIGHT_UVD_SIG1_MASK |
3326                                                       WEIGHT_SPARE0_MASK |
3327                                                       WEIGHT_SPARE1_MASK);
3328         reg |= (WEIGHT_DC_SIG3(ni_pi->cac_weights->weight_dc_sig3) |
3329                 WEIGHT_UVD_SIG0(ni_pi->cac_weights->weight_uvd_sig0) |
3330                 WEIGHT_UVD_SIG1(ni_pi->cac_weights->weight_uvd_sig1) |
3331                 WEIGHT_SPARE0(ni_pi->cac_weights->weight_spare0) |
3332                 WEIGHT_SPARE1(ni_pi->cac_weights->weight_spare1));
3333         WREG32_CG(CG_CAC_REGION_4_WEIGHT_3, reg);
3334
3335         reg = RREG32_CG(CG_CAC_REGION_5_WEIGHT_0) & ~(WEIGHT_SQ_VSP_MASK |
3336                                                       WEIGHT_SQ_VSP0_MASK);
3337         reg |= (WEIGHT_SQ_VSP(ni_pi->cac_weights->weight_sq_vsp) |
3338                 WEIGHT_SQ_VSP0(ni_pi->cac_weights->weight_sq_vsp0));
3339         WREG32_CG(CG_CAC_REGION_5_WEIGHT_0, reg);
3340
3341         reg = RREG32_CG(CG_CAC_REGION_5_WEIGHT_1) & ~(WEIGHT_SQ_GPR_MASK);
3342         reg |= WEIGHT_SQ_GPR(ni_pi->cac_weights->weight_sq_gpr);
3343         WREG32_CG(CG_CAC_REGION_5_WEIGHT_1, reg);
3344
3345         reg = RREG32_CG(CG_CAC_REGION_4_OVERRIDE_4) & ~(OVR_MODE_SPARE_0_MASK |
3346                                                         OVR_VAL_SPARE_0_MASK |
3347                                                         OVR_MODE_SPARE_1_MASK |
3348                                                         OVR_VAL_SPARE_1_MASK);
3349         reg |= (OVR_MODE_SPARE_0(ni_pi->cac_weights->ovr_mode_spare_0) |
3350                 OVR_VAL_SPARE_0(ni_pi->cac_weights->ovr_val_spare_0) |
3351                 OVR_MODE_SPARE_1(ni_pi->cac_weights->ovr_mode_spare_1) |
3352                 OVR_VAL_SPARE_1(ni_pi->cac_weights->ovr_val_spare_1));
3353         WREG32_CG(CG_CAC_REGION_4_OVERRIDE_4, reg);
3354
3355         reg = RREG32(SQ_CAC_THRESHOLD) & ~(VSP_MASK |
3356                                            VSP0_MASK |
3357                                            GPR_MASK);
3358         reg |= (VSP(ni_pi->cac_weights->vsp) |
3359                 VSP0(ni_pi->cac_weights->vsp0) |
3360                 GPR(ni_pi->cac_weights->gpr));
3361         WREG32(SQ_CAC_THRESHOLD, reg);
3362
3363         reg = (MCDW_WR_ENABLE |
3364                MCDX_WR_ENABLE |
3365                MCDY_WR_ENABLE |
3366                MCDZ_WR_ENABLE |
3367                INDEX(0x09D4));
3368         WREG32(MC_CG_CONFIG, reg);
3369
3370         reg = (READ_WEIGHT(ni_pi->cac_weights->mc_read_weight) |
3371                WRITE_WEIGHT(ni_pi->cac_weights->mc_write_weight) |
3372                ALLOW_OVERFLOW);
3373         WREG32(MC_CG_DATAPORT, reg);
3374
3375         return 0;
3376 }
3377
3378 static int ni_enable_smc_cac(struct radeon_device *rdev,
3379                              struct radeon_ps *radeon_new_state,
3380                              bool enable)
3381 {
3382         struct ni_power_info *ni_pi = ni_get_pi(rdev);
3383         int ret = 0;
3384         PPSMC_Result smc_result;
3385
3386         if (ni_pi->enable_cac) {
3387                 if (enable) {
3388                         if (!r600_is_uvd_state(radeon_new_state->class, radeon_new_state->class2)) {
3389                                 smc_result = rv770_send_msg_to_smc(rdev, PPSMC_MSG_CollectCAC_PowerCorreln);
3390
3391                                 if (ni_pi->support_cac_long_term_average) {
3392                                         smc_result = rv770_send_msg_to_smc(rdev, PPSMC_CACLongTermAvgEnable);
3393                                         if (PPSMC_Result_OK != smc_result)
3394                                                 ni_pi->support_cac_long_term_average = false;
3395                                 }
3396
3397                                 smc_result = rv770_send_msg_to_smc(rdev, PPSMC_MSG_EnableCac);
3398                                 if (PPSMC_Result_OK != smc_result)
3399                                         ret = -EINVAL;
3400
3401                                 ni_pi->cac_enabled = (PPSMC_Result_OK == smc_result) ? true : false;
3402                         }
3403                 } else if (ni_pi->cac_enabled) {
3404                         smc_result = rv770_send_msg_to_smc(rdev, PPSMC_MSG_DisableCac);
3405
3406                         ni_pi->cac_enabled = false;
3407
3408                         if (ni_pi->support_cac_long_term_average) {
3409                                 smc_result = rv770_send_msg_to_smc(rdev, PPSMC_CACLongTermAvgDisable);
3410                                 if (PPSMC_Result_OK != smc_result)
3411                                         ni_pi->support_cac_long_term_average = false;
3412                         }
3413                 }
3414         }
3415
3416         return ret;
3417 }
3418
3419 static int ni_pcie_performance_request(struct radeon_device *rdev,
3420                                        u8 perf_req, bool advertise)
3421 {
3422 #if defined(CONFIG_ACPI)
3423         struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
3424
3425         if ((perf_req == PCIE_PERF_REQ_PECI_GEN1) ||
3426             (perf_req == PCIE_PERF_REQ_PECI_GEN2)) {
3427                 if (eg_pi->pcie_performance_request_registered == false)
3428                         radeon_acpi_pcie_notify_device_ready(rdev);
3429                 eg_pi->pcie_performance_request_registered = true;
3430                 return radeon_acpi_pcie_performance_request(rdev, perf_req, advertise);
3431         } else if ((perf_req == PCIE_PERF_REQ_REMOVE_REGISTRY) &&
3432                     eg_pi->pcie_performance_request_registered) {
3433                 eg_pi->pcie_performance_request_registered = false;
3434                 return radeon_acpi_pcie_performance_request(rdev, perf_req, advertise);
3435         }
3436 #endif
3437         return 0;
3438 }
3439
3440 static int ni_advertise_gen2_capability(struct radeon_device *rdev)
3441 {
3442         struct rv7xx_power_info *pi = rv770_get_pi(rdev);
3443         u32 tmp;
3444
3445         tmp = RREG32_PCIE_PORT(PCIE_LC_SPEED_CNTL);
3446
3447         if ((tmp & LC_OTHER_SIDE_EVER_SENT_GEN2) &&
3448             (tmp & LC_OTHER_SIDE_SUPPORTS_GEN2))
3449                 pi->pcie_gen2 = true;
3450         else
3451                 pi->pcie_gen2 = false;
3452
3453         if (!pi->pcie_gen2)
3454                 ni_pcie_performance_request(rdev, PCIE_PERF_REQ_PECI_GEN2, true);
3455
3456         return 0;
3457 }
3458
3459 static void ni_enable_bif_dynamic_pcie_gen2(struct radeon_device *rdev,
3460                                             bool enable)
3461 {
3462         struct rv7xx_power_info *pi = rv770_get_pi(rdev);
3463         u32 tmp, bif;
3464
3465         tmp = RREG32_PCIE_PORT(PCIE_LC_SPEED_CNTL);
3466
3467         if ((tmp & LC_OTHER_SIDE_EVER_SENT_GEN2) &&
3468             (tmp & LC_OTHER_SIDE_SUPPORTS_GEN2)) {
3469                 if (enable) {
3470                         if (!pi->boot_in_gen2) {
3471                                 bif = RREG32(CG_BIF_REQ_AND_RSP) & ~CG_CLIENT_REQ_MASK;
3472                                 bif |= CG_CLIENT_REQ(0xd);
3473                                 WREG32(CG_BIF_REQ_AND_RSP, bif);
3474                         }
3475                         tmp &= ~LC_HW_VOLTAGE_IF_CONTROL_MASK;
3476                         tmp |= LC_HW_VOLTAGE_IF_CONTROL(1);
3477                         tmp |= LC_GEN2_EN_STRAP;
3478
3479                         tmp |= LC_CLR_FAILED_SPD_CHANGE_CNT;
3480                         WREG32_PCIE_PORT(PCIE_LC_SPEED_CNTL, tmp);
3481                         udelay(10);
3482                         tmp &= ~LC_CLR_FAILED_SPD_CHANGE_CNT;
3483                         WREG32_PCIE_PORT(PCIE_LC_SPEED_CNTL, tmp);
3484                 } else {
3485                         if (!pi->boot_in_gen2) {
3486                                 bif = RREG32(CG_BIF_REQ_AND_RSP) & ~CG_CLIENT_REQ_MASK;
3487                                 bif |= CG_CLIENT_REQ(0xd);
3488                                 WREG32(CG_BIF_REQ_AND_RSP, bif);
3489
3490                                 tmp &= ~LC_HW_VOLTAGE_IF_CONTROL_MASK;
3491                                 tmp &= ~LC_GEN2_EN_STRAP;
3492                         }
3493                         WREG32_PCIE_PORT(PCIE_LC_SPEED_CNTL, tmp);
3494                 }
3495         }
3496 }
3497
3498 static void ni_enable_dynamic_pcie_gen2(struct radeon_device *rdev,
3499                                         bool enable)
3500 {
3501         ni_enable_bif_dynamic_pcie_gen2(rdev, enable);
3502
3503         if (enable)
3504                 WREG32_P(GENERAL_PWRMGT, ENABLE_GEN2PCIE, ~ENABLE_GEN2PCIE);
3505         else
3506                 WREG32_P(GENERAL_PWRMGT, 0, ~ENABLE_GEN2PCIE);
3507 }
3508
3509 void ni_set_uvd_clock_before_set_eng_clock(struct radeon_device *rdev,
3510                                            struct radeon_ps *new_ps,
3511                                            struct radeon_ps *old_ps)
3512 {
3513         struct ni_ps *new_state = ni_get_ps(new_ps);
3514         struct ni_ps *current_state = ni_get_ps(old_ps);
3515
3516         if ((new_ps->vclk == old_ps->vclk) &&
3517             (new_ps->dclk == old_ps->dclk))
3518                 return;
3519
3520         if (new_state->performance_levels[new_state->performance_level_count - 1].sclk >=
3521             current_state->performance_levels[current_state->performance_level_count - 1].sclk)
3522                 return;
3523
3524         radeon_set_uvd_clocks(rdev, new_ps->vclk, new_ps->dclk);
3525 }
3526
3527 void ni_set_uvd_clock_after_set_eng_clock(struct radeon_device *rdev,
3528                                           struct radeon_ps *new_ps,
3529                                           struct radeon_ps *old_ps)
3530 {
3531         struct ni_ps *new_state = ni_get_ps(new_ps);
3532         struct ni_ps *current_state = ni_get_ps(old_ps);
3533
3534         if ((new_ps->vclk == old_ps->vclk) &&
3535             (new_ps->dclk == old_ps->dclk))
3536                 return;
3537
3538         if (new_state->performance_levels[new_state->performance_level_count - 1].sclk <
3539             current_state->performance_levels[current_state->performance_level_count - 1].sclk)
3540                 return;
3541
3542         radeon_set_uvd_clocks(rdev, new_ps->vclk, new_ps->dclk);
3543 }
3544
3545 void ni_dpm_setup_asic(struct radeon_device *rdev)
3546 {
3547         struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
3548         int r;
3549
3550         r = ni_mc_load_microcode(rdev);
3551         if (r)
3552                 DRM_ERROR("Failed to load MC firmware!\n");
3553         ni_read_clock_registers(rdev);
3554         btc_read_arb_registers(rdev);
3555         rv770_get_memory_type(rdev);
3556         if (eg_pi->pcie_performance_request)
3557                 ni_advertise_gen2_capability(rdev);
3558         rv770_get_pcie_gen2_status(rdev);
3559         rv770_enable_acpi_pm(rdev);
3560 }
3561
3562 void ni_update_current_ps(struct radeon_device *rdev,
3563                           struct radeon_ps *rps)
3564 {
3565         struct ni_ps *new_ps = ni_get_ps(rps);
3566         struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
3567         struct ni_power_info *ni_pi = ni_get_pi(rdev);
3568
3569         eg_pi->current_rps = *rps;
3570         ni_pi->current_ps = *new_ps;
3571         eg_pi->current_rps.ps_priv = &ni_pi->current_ps;
3572 }
3573
3574 void ni_update_requested_ps(struct radeon_device *rdev,
3575                             struct radeon_ps *rps)
3576 {
3577         struct ni_ps *new_ps = ni_get_ps(rps);
3578         struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
3579         struct ni_power_info *ni_pi = ni_get_pi(rdev);
3580
3581         eg_pi->requested_rps = *rps;
3582         ni_pi->requested_ps = *new_ps;
3583         eg_pi->requested_rps.ps_priv = &ni_pi->requested_ps;
3584 }
3585
3586 int ni_dpm_enable(struct radeon_device *rdev)
3587 {
3588         struct rv7xx_power_info *pi = rv770_get_pi(rdev);
3589         struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
3590         struct radeon_ps *boot_ps = rdev->pm.dpm.boot_ps;
3591         int ret;
3592
3593         if (pi->gfx_clock_gating)
3594                 ni_cg_clockgating_default(rdev);
3595         if (btc_dpm_enabled(rdev))
3596                 return -EINVAL;
3597         if (pi->mg_clock_gating)
3598                 ni_mg_clockgating_default(rdev);
3599         if (eg_pi->ls_clock_gating)
3600                 ni_ls_clockgating_default(rdev);
3601         if (pi->voltage_control) {
3602                 rv770_enable_voltage_control(rdev, true);
3603                 ret = cypress_construct_voltage_tables(rdev);
3604                 if (ret) {
3605                         DRM_ERROR("cypress_construct_voltage_tables failed\n");
3606                         return ret;
3607                 }
3608         }
3609         if (eg_pi->dynamic_ac_timing) {
3610                 ret = ni_initialize_mc_reg_table(rdev);
3611                 if (ret)
3612                         eg_pi->dynamic_ac_timing = false;
3613         }
3614         if (pi->dynamic_ss)
3615                 cypress_enable_spread_spectrum(rdev, true);
3616         if (pi->thermal_protection)
3617                 rv770_enable_thermal_protection(rdev, true);
3618         rv770_setup_bsp(rdev);
3619         rv770_program_git(rdev);
3620         rv770_program_tp(rdev);
3621         rv770_program_tpp(rdev);
3622         rv770_program_sstp(rdev);
3623         cypress_enable_display_gap(rdev);
3624         rv770_program_vc(rdev);
3625         if (pi->dynamic_pcie_gen2)
3626                 ni_enable_dynamic_pcie_gen2(rdev, true);
3627         ret = rv770_upload_firmware(rdev);
3628         if (ret) {
3629                 DRM_ERROR("rv770_upload_firmware failed\n");
3630                 return ret;
3631         }
3632         ret = ni_process_firmware_header(rdev);
3633         if (ret) {
3634                 DRM_ERROR("ni_process_firmware_header failed\n");
3635                 return ret;
3636         }
3637         ret = ni_initial_switch_from_arb_f0_to_f1(rdev);
3638         if (ret) {
3639                 DRM_ERROR("ni_initial_switch_from_arb_f0_to_f1 failed\n");
3640                 return ret;
3641         }
3642         ret = ni_init_smc_table(rdev);
3643         if (ret) {
3644                 DRM_ERROR("ni_init_smc_table failed\n");
3645                 return ret;
3646         }
3647         ret = ni_init_smc_spll_table(rdev);
3648         if (ret) {
3649                 DRM_ERROR("ni_init_smc_spll_table failed\n");
3650                 return ret;
3651         }
3652         ret = ni_init_arb_table_index(rdev);
3653         if (ret) {
3654                 DRM_ERROR("ni_init_arb_table_index failed\n");
3655                 return ret;
3656         }
3657         if (eg_pi->dynamic_ac_timing) {
3658                 ret = ni_populate_mc_reg_table(rdev, boot_ps);
3659                 if (ret) {
3660                         DRM_ERROR("ni_populate_mc_reg_table failed\n");
3661                         return ret;
3662                 }
3663         }
3664         ret = ni_initialize_smc_cac_tables(rdev);
3665         if (ret) {
3666                 DRM_ERROR("ni_initialize_smc_cac_tables failed\n");
3667                 return ret;
3668         }
3669         ret = ni_initialize_hardware_cac_manager(rdev);
3670         if (ret) {
3671                 DRM_ERROR("ni_initialize_hardware_cac_manager failed\n");
3672                 return ret;
3673         }
3674         ret = ni_populate_smc_tdp_limits(rdev, boot_ps);
3675         if (ret) {
3676                 DRM_ERROR("ni_populate_smc_tdp_limits failed\n");
3677                 return ret;
3678         }
3679         ni_program_response_times(rdev);
3680         r7xx_start_smc(rdev);
3681         ret = cypress_notify_smc_display_change(rdev, false);
3682         if (ret) {
3683                 DRM_ERROR("cypress_notify_smc_display_change failed\n");
3684                 return ret;
3685         }
3686         cypress_enable_sclk_control(rdev, true);
3687         if (eg_pi->memory_transition)
3688                 cypress_enable_mclk_control(rdev, true);
3689         cypress_start_dpm(rdev);
3690         if (pi->gfx_clock_gating)
3691                 ni_gfx_clockgating_enable(rdev, true);
3692         if (pi->mg_clock_gating)
3693                 ni_mg_clockgating_enable(rdev, true);
3694         if (eg_pi->ls_clock_gating)
3695                 ni_ls_clockgating_enable(rdev, true);
3696
3697         rv770_enable_auto_throttle_source(rdev, RADEON_DPM_AUTO_THROTTLE_SRC_THERMAL, true);
3698
3699         ni_update_current_ps(rdev, boot_ps);
3700
3701         return 0;
3702 }
3703
3704 void ni_dpm_disable(struct radeon_device *rdev)
3705 {
3706         struct rv7xx_power_info *pi = rv770_get_pi(rdev);
3707         struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
3708         struct radeon_ps *boot_ps = rdev->pm.dpm.boot_ps;
3709
3710         if (!btc_dpm_enabled(rdev))
3711                 return;
3712         rv770_clear_vc(rdev);
3713         if (pi->thermal_protection)
3714                 rv770_enable_thermal_protection(rdev, false);
3715         ni_enable_power_containment(rdev, boot_ps, false);
3716         ni_enable_smc_cac(rdev, boot_ps, false);
3717         cypress_enable_spread_spectrum(rdev, false);
3718         rv770_enable_auto_throttle_source(rdev, RADEON_DPM_AUTO_THROTTLE_SRC_THERMAL, false);
3719         if (pi->dynamic_pcie_gen2)
3720                 ni_enable_dynamic_pcie_gen2(rdev, false);
3721
3722         if (rdev->irq.installed &&
3723             r600_is_internal_thermal_sensor(rdev->pm.int_thermal_type)) {
3724                 rdev->irq.dpm_thermal = false;
3725                 radeon_irq_set(rdev);
3726         }
3727
3728         if (pi->gfx_clock_gating)
3729                 ni_gfx_clockgating_enable(rdev, false);
3730         if (pi->mg_clock_gating)
3731                 ni_mg_clockgating_enable(rdev, false);
3732         if (eg_pi->ls_clock_gating)
3733                 ni_ls_clockgating_enable(rdev, false);
3734         ni_stop_dpm(rdev);
3735         btc_reset_to_default(rdev);
3736         ni_stop_smc(rdev);
3737         ni_force_switch_to_arb_f0(rdev);
3738
3739         ni_update_current_ps(rdev, boot_ps);
3740 }
3741
3742 static int ni_power_control_set_level(struct radeon_device *rdev)
3743 {
3744         struct radeon_ps *new_ps = rdev->pm.dpm.requested_ps;
3745         int ret;
3746
3747         ret = ni_restrict_performance_levels_before_switch(rdev);
3748         if (ret)
3749                 return ret;
3750         ret = rv770_halt_smc(rdev);
3751         if (ret)
3752                 return ret;
3753         ret = ni_populate_smc_tdp_limits(rdev, new_ps);
3754         if (ret)
3755                 return ret;
3756         ret = rv770_resume_smc(rdev);
3757         if (ret)
3758                 return ret;
3759         ret = rv770_set_sw_state(rdev);
3760         if (ret)
3761                 return ret;
3762
3763         return 0;
3764 }
3765
3766 int ni_dpm_pre_set_power_state(struct radeon_device *rdev)
3767 {
3768         struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
3769         struct radeon_ps requested_ps = *rdev->pm.dpm.requested_ps;
3770         struct radeon_ps *new_ps = &requested_ps;
3771
3772         ni_update_requested_ps(rdev, new_ps);
3773
3774         ni_apply_state_adjust_rules(rdev, &eg_pi->requested_rps);
3775
3776         return 0;
3777 }
3778
3779 int ni_dpm_set_power_state(struct radeon_device *rdev)
3780 {
3781         struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
3782         struct radeon_ps *new_ps = &eg_pi->requested_rps;
3783         struct radeon_ps *old_ps = &eg_pi->current_rps;
3784         int ret;
3785
3786         ret = ni_restrict_performance_levels_before_switch(rdev);
3787         if (ret) {
3788                 DRM_ERROR("ni_restrict_performance_levels_before_switch failed\n");
3789                 return ret;
3790         }
3791         ni_set_uvd_clock_before_set_eng_clock(rdev, new_ps, old_ps);
3792         ret = ni_enable_power_containment(rdev, new_ps, false);
3793         if (ret) {
3794                 DRM_ERROR("ni_enable_power_containment failed\n");
3795                 return ret;
3796         }
3797         ret = ni_enable_smc_cac(rdev, new_ps, false);
3798         if (ret) {
3799                 DRM_ERROR("ni_enable_smc_cac failed\n");
3800                 return ret;
3801         }
3802         ret = rv770_halt_smc(rdev);
3803         if (ret) {
3804                 DRM_ERROR("rv770_halt_smc failed\n");
3805                 return ret;
3806         }
3807         if (eg_pi->smu_uvd_hs)
3808                 btc_notify_uvd_to_smc(rdev, new_ps);
3809         ret = ni_upload_sw_state(rdev, new_ps);
3810         if (ret) {
3811                 DRM_ERROR("ni_upload_sw_state failed\n");
3812                 return ret;
3813         }
3814         if (eg_pi->dynamic_ac_timing) {
3815                 ret = ni_upload_mc_reg_table(rdev, new_ps);
3816                 if (ret) {
3817                         DRM_ERROR("ni_upload_mc_reg_table failed\n");
3818                         return ret;
3819                 }
3820         }
3821         ret = ni_program_memory_timing_parameters(rdev, new_ps);
3822         if (ret) {
3823                 DRM_ERROR("ni_program_memory_timing_parameters failed\n");
3824                 return ret;
3825         }
3826         ret = rv770_resume_smc(rdev);
3827         if (ret) {
3828                 DRM_ERROR("rv770_resume_smc failed\n");
3829                 return ret;
3830         }
3831         ret = rv770_set_sw_state(rdev);
3832         if (ret) {
3833                 DRM_ERROR("rv770_set_sw_state failed\n");
3834                 return ret;
3835         }
3836         ni_set_uvd_clock_after_set_eng_clock(rdev, new_ps, old_ps);
3837         ret = ni_enable_smc_cac(rdev, new_ps, true);
3838         if (ret) {
3839                 DRM_ERROR("ni_enable_smc_cac failed\n");
3840                 return ret;
3841         }
3842         ret = ni_enable_power_containment(rdev, new_ps, true);
3843         if (ret) {
3844                 DRM_ERROR("ni_enable_power_containment failed\n");
3845                 return ret;
3846         }
3847
3848         /* update tdp */
3849         ret = ni_power_control_set_level(rdev);
3850         if (ret) {
3851                 DRM_ERROR("ni_power_control_set_level failed\n");
3852                 return ret;
3853         }
3854
3855         return 0;
3856 }
3857
3858 void ni_dpm_post_set_power_state(struct radeon_device *rdev)
3859 {
3860         struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
3861         struct radeon_ps *new_ps = &eg_pi->requested_rps;
3862
3863         ni_update_current_ps(rdev, new_ps);
3864 }
3865
3866 #if 0
3867 void ni_dpm_reset_asic(struct radeon_device *rdev)
3868 {
3869         ni_restrict_performance_levels_before_switch(rdev);
3870         rv770_set_boot_state(rdev);
3871 }
3872 #endif
3873
3874 union power_info {
3875         struct _ATOM_POWERPLAY_INFO info;
3876         struct _ATOM_POWERPLAY_INFO_V2 info_2;
3877         struct _ATOM_POWERPLAY_INFO_V3 info_3;
3878         struct _ATOM_PPLIB_POWERPLAYTABLE pplib;
3879         struct _ATOM_PPLIB_POWERPLAYTABLE2 pplib2;
3880         struct _ATOM_PPLIB_POWERPLAYTABLE3 pplib3;
3881 };
3882
3883 union pplib_clock_info {
3884         struct _ATOM_PPLIB_R600_CLOCK_INFO r600;
3885         struct _ATOM_PPLIB_RS780_CLOCK_INFO rs780;
3886         struct _ATOM_PPLIB_EVERGREEN_CLOCK_INFO evergreen;
3887         struct _ATOM_PPLIB_SUMO_CLOCK_INFO sumo;
3888 };
3889
3890 union pplib_power_state {
3891         struct _ATOM_PPLIB_STATE v1;
3892         struct _ATOM_PPLIB_STATE_V2 v2;
3893 };
3894
3895 static void ni_parse_pplib_non_clock_info(struct radeon_device *rdev,
3896                                           struct radeon_ps *rps,
3897                                           struct _ATOM_PPLIB_NONCLOCK_INFO *non_clock_info,
3898                                           u8 table_rev)
3899 {
3900         rps->caps = le32_to_cpu(non_clock_info->ulCapsAndSettings);
3901         rps->class = le16_to_cpu(non_clock_info->usClassification);
3902         rps->class2 = le16_to_cpu(non_clock_info->usClassification2);
3903
3904         if (ATOM_PPLIB_NONCLOCKINFO_VER1 < table_rev) {
3905                 rps->vclk = le32_to_cpu(non_clock_info->ulVCLK);
3906                 rps->dclk = le32_to_cpu(non_clock_info->ulDCLK);
3907         } else if (r600_is_uvd_state(rps->class, rps->class2)) {
3908                 rps->vclk = RV770_DEFAULT_VCLK_FREQ;
3909                 rps->dclk = RV770_DEFAULT_DCLK_FREQ;
3910         } else {
3911                 rps->vclk = 0;
3912                 rps->dclk = 0;
3913         }
3914
3915         if (rps->class & ATOM_PPLIB_CLASSIFICATION_BOOT)
3916                 rdev->pm.dpm.boot_ps = rps;
3917         if (rps->class & ATOM_PPLIB_CLASSIFICATION_UVDSTATE)
3918                 rdev->pm.dpm.uvd_ps = rps;
3919 }
3920
3921 static void ni_parse_pplib_clock_info(struct radeon_device *rdev,
3922                                       struct radeon_ps *rps, int index,
3923                                       union pplib_clock_info *clock_info)
3924 {
3925         struct rv7xx_power_info *pi = rv770_get_pi(rdev);
3926         struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
3927         struct ni_ps *ps = ni_get_ps(rps);
3928         struct rv7xx_pl *pl = &ps->performance_levels[index];
3929
3930         ps->performance_level_count = index + 1;
3931
3932         pl->sclk = le16_to_cpu(clock_info->evergreen.usEngineClockLow);
3933         pl->sclk |= clock_info->evergreen.ucEngineClockHigh << 16;
3934         pl->mclk = le16_to_cpu(clock_info->evergreen.usMemoryClockLow);
3935         pl->mclk |= clock_info->evergreen.ucMemoryClockHigh << 16;
3936
3937         pl->vddc = le16_to_cpu(clock_info->evergreen.usVDDC);
3938         pl->vddci = le16_to_cpu(clock_info->evergreen.usVDDCI);
3939         pl->flags = le32_to_cpu(clock_info->evergreen.ulFlags);
3940
3941         /* patch up vddc if necessary */
3942         if (pl->vddc == 0xff01) {
3943                 if (pi->max_vddc)
3944                         pl->vddc = pi->max_vddc;
3945         }
3946
3947         if (rps->class & ATOM_PPLIB_CLASSIFICATION_ACPI) {
3948                 pi->acpi_vddc = pl->vddc;
3949                 eg_pi->acpi_vddci = pl->vddci;
3950                 if (ps->performance_levels[0].flags & ATOM_PPLIB_R600_FLAGS_PCIEGEN2)
3951                         pi->acpi_pcie_gen2 = true;
3952                 else
3953                         pi->acpi_pcie_gen2 = false;
3954         }
3955
3956         if (rps->class2 & ATOM_PPLIB_CLASSIFICATION2_ULV) {
3957                 eg_pi->ulv.supported = true;
3958                 eg_pi->ulv.pl = pl;
3959         }
3960
3961         if (pi->min_vddc_in_table > pl->vddc)
3962                 pi->min_vddc_in_table = pl->vddc;
3963
3964         if (pi->max_vddc_in_table < pl->vddc)
3965                 pi->max_vddc_in_table = pl->vddc;
3966
3967         /* patch up boot state */
3968         if (rps->class & ATOM_PPLIB_CLASSIFICATION_BOOT) {
3969                 u16 vddc, vddci, mvdd;
3970                 radeon_atombios_get_default_voltages(rdev, &vddc, &vddci, &mvdd);
3971                 pl->mclk = rdev->clock.default_mclk;
3972                 pl->sclk = rdev->clock.default_sclk;
3973                 pl->vddc = vddc;
3974                 pl->vddci = vddci;
3975         }
3976
3977         if ((rps->class & ATOM_PPLIB_CLASSIFICATION_UI_MASK) ==
3978             ATOM_PPLIB_CLASSIFICATION_UI_PERFORMANCE) {
3979                 rdev->pm.dpm.dyn_state.max_clock_voltage_on_ac.sclk = pl->sclk;
3980                 rdev->pm.dpm.dyn_state.max_clock_voltage_on_ac.mclk = pl->mclk;
3981                 rdev->pm.dpm.dyn_state.max_clock_voltage_on_ac.vddc = pl->vddc;
3982                 rdev->pm.dpm.dyn_state.max_clock_voltage_on_ac.vddci = pl->vddci;
3983         }
3984 }
3985
3986 static int ni_parse_power_table(struct radeon_device *rdev)
3987 {
3988         struct radeon_mode_info *mode_info = &rdev->mode_info;
3989         struct _ATOM_PPLIB_NONCLOCK_INFO *non_clock_info;
3990         union pplib_power_state *power_state;
3991         int i, j;
3992         union pplib_clock_info *clock_info;
3993         union power_info *power_info;
3994         int index = GetIndexIntoMasterTable(DATA, PowerPlayInfo);
3995         u16 data_offset;
3996         u8 frev, crev;
3997         struct ni_ps *ps;
3998
3999         if (!atom_parse_data_header(mode_info->atom_context, index, NULL,
4000                                    &frev, &crev, &data_offset))
4001                 return -EINVAL;
4002         power_info = (union power_info *)(mode_info->atom_context->bios + data_offset);
4003
4004         rdev->pm.dpm.ps = kcalloc(power_info->pplib.ucNumStates,
4005                                   sizeof(struct radeon_ps),
4006                                   GFP_KERNEL);
4007         if (!rdev->pm.dpm.ps)
4008                 return -ENOMEM;
4009
4010         for (i = 0; i < power_info->pplib.ucNumStates; i++) {
4011                 power_state = (union pplib_power_state *)
4012                         (mode_info->atom_context->bios + data_offset +
4013                          le16_to_cpu(power_info->pplib.usStateArrayOffset) +
4014                          i * power_info->pplib.ucStateEntrySize);
4015                 non_clock_info = (struct _ATOM_PPLIB_NONCLOCK_INFO *)
4016                         (mode_info->atom_context->bios + data_offset +
4017                          le16_to_cpu(power_info->pplib.usNonClockInfoArrayOffset) +
4018                          (power_state->v1.ucNonClockStateIndex *
4019                           power_info->pplib.ucNonClockSize));
4020                 if (power_info->pplib.ucStateEntrySize - 1) {
4021                         u8 *idx;
4022                         ps = kzalloc(sizeof(struct ni_ps), GFP_KERNEL);
4023                         if (ps == NULL) {
4024                                 kfree(rdev->pm.dpm.ps);
4025                                 return -ENOMEM;
4026                         }
4027                         rdev->pm.dpm.ps[i].ps_priv = ps;
4028                         ni_parse_pplib_non_clock_info(rdev, &rdev->pm.dpm.ps[i],
4029                                                          non_clock_info,
4030                                                          power_info->pplib.ucNonClockSize);
4031                         idx = (u8 *)&power_state->v1.ucClockStateIndices[0];
4032                         for (j = 0; j < (power_info->pplib.ucStateEntrySize - 1); j++) {
4033                                 clock_info = (union pplib_clock_info *)
4034                                         (mode_info->atom_context->bios + data_offset +
4035                                          le16_to_cpu(power_info->pplib.usClockInfoArrayOffset) +
4036                                          (idx[j] * power_info->pplib.ucClockInfoSize));
4037                                 ni_parse_pplib_clock_info(rdev,
4038                                                           &rdev->pm.dpm.ps[i], j,
4039                                                           clock_info);
4040                         }
4041                 }
4042         }
4043         rdev->pm.dpm.num_ps = power_info->pplib.ucNumStates;
4044         return 0;
4045 }
4046
4047 int ni_dpm_init(struct radeon_device *rdev)
4048 {
4049         struct rv7xx_power_info *pi;
4050         struct evergreen_power_info *eg_pi;
4051         struct ni_power_info *ni_pi;
4052         struct atom_clock_dividers dividers;
4053         int ret;
4054
4055         ni_pi = kzalloc(sizeof(struct ni_power_info), GFP_KERNEL);
4056         if (ni_pi == NULL)
4057                 return -ENOMEM;
4058         rdev->pm.dpm.priv = ni_pi;
4059         eg_pi = &ni_pi->eg;
4060         pi = &eg_pi->rv7xx;
4061
4062         rv770_get_max_vddc(rdev);
4063
4064         eg_pi->ulv.supported = false;
4065         pi->acpi_vddc = 0;
4066         eg_pi->acpi_vddci = 0;
4067         pi->min_vddc_in_table = 0;
4068         pi->max_vddc_in_table = 0;
4069
4070         ret = r600_get_platform_caps(rdev);
4071         if (ret)
4072                 return ret;
4073
4074         ret = ni_parse_power_table(rdev);
4075         if (ret)
4076                 return ret;
4077         ret = r600_parse_extended_power_table(rdev);
4078         if (ret)
4079                 return ret;
4080
4081         rdev->pm.dpm.dyn_state.vddc_dependency_on_dispclk.entries =
4082                 kcalloc(4,
4083                         sizeof(struct radeon_clock_voltage_dependency_entry),
4084                         GFP_KERNEL);
4085         if (!rdev->pm.dpm.dyn_state.vddc_dependency_on_dispclk.entries) {
4086                 r600_free_extended_power_table(rdev);
4087                 return -ENOMEM;
4088         }
4089         rdev->pm.dpm.dyn_state.vddc_dependency_on_dispclk.count = 4;
4090         rdev->pm.dpm.dyn_state.vddc_dependency_on_dispclk.entries[0].clk = 0;
4091         rdev->pm.dpm.dyn_state.vddc_dependency_on_dispclk.entries[0].v = 0;
4092         rdev->pm.dpm.dyn_state.vddc_dependency_on_dispclk.entries[1].clk = 36000;
4093         rdev->pm.dpm.dyn_state.vddc_dependency_on_dispclk.entries[1].v = 720;
4094         rdev->pm.dpm.dyn_state.vddc_dependency_on_dispclk.entries[2].clk = 54000;
4095         rdev->pm.dpm.dyn_state.vddc_dependency_on_dispclk.entries[2].v = 810;
4096         rdev->pm.dpm.dyn_state.vddc_dependency_on_dispclk.entries[3].clk = 72000;
4097         rdev->pm.dpm.dyn_state.vddc_dependency_on_dispclk.entries[3].v = 900;
4098
4099         ni_patch_dependency_tables_based_on_leakage(rdev);
4100
4101         if (rdev->pm.dpm.voltage_response_time == 0)
4102                 rdev->pm.dpm.voltage_response_time = R600_VOLTAGERESPONSETIME_DFLT;
4103         if (rdev->pm.dpm.backbias_response_time == 0)
4104                 rdev->pm.dpm.backbias_response_time = R600_BACKBIASRESPONSETIME_DFLT;
4105
4106         ret = radeon_atom_get_clock_dividers(rdev, COMPUTE_ENGINE_PLL_PARAM,
4107                                              0, false, &dividers);
4108         if (ret)
4109                 pi->ref_div = dividers.ref_div + 1;
4110         else
4111                 pi->ref_div = R600_REFERENCEDIVIDER_DFLT;
4112
4113         pi->rlp = RV770_RLP_DFLT;
4114         pi->rmp = RV770_RMP_DFLT;
4115         pi->lhp = RV770_LHP_DFLT;
4116         pi->lmp = RV770_LMP_DFLT;
4117
4118         eg_pi->ats[0].rlp = RV770_RLP_DFLT;
4119         eg_pi->ats[0].rmp = RV770_RMP_DFLT;
4120         eg_pi->ats[0].lhp = RV770_LHP_DFLT;
4121         eg_pi->ats[0].lmp = RV770_LMP_DFLT;
4122
4123         eg_pi->ats[1].rlp = BTC_RLP_UVD_DFLT;
4124         eg_pi->ats[1].rmp = BTC_RMP_UVD_DFLT;
4125         eg_pi->ats[1].lhp = BTC_LHP_UVD_DFLT;
4126         eg_pi->ats[1].lmp = BTC_LMP_UVD_DFLT;
4127
4128         eg_pi->smu_uvd_hs = true;
4129
4130         if (rdev->pdev->device == 0x6707) {
4131                 pi->mclk_strobe_mode_threshold = 55000;
4132                 pi->mclk_edc_enable_threshold = 55000;
4133                 eg_pi->mclk_edc_wr_enable_threshold = 55000;
4134         } else {
4135                 pi->mclk_strobe_mode_threshold = 40000;
4136                 pi->mclk_edc_enable_threshold = 40000;
4137                 eg_pi->mclk_edc_wr_enable_threshold = 40000;
4138         }
4139         ni_pi->mclk_rtt_mode_threshold = eg_pi->mclk_edc_wr_enable_threshold;
4140
4141         pi->voltage_control =
4142                 radeon_atom_is_voltage_gpio(rdev, SET_VOLTAGE_TYPE_ASIC_VDDC, 0);
4143
4144         pi->mvdd_control =
4145                 radeon_atom_is_voltage_gpio(rdev, SET_VOLTAGE_TYPE_ASIC_MVDDC, 0);
4146
4147         eg_pi->vddci_control =
4148                 radeon_atom_is_voltage_gpio(rdev, SET_VOLTAGE_TYPE_ASIC_VDDCI, 0);
4149
4150         rv770_get_engine_memory_ss(rdev);
4151
4152         pi->asi = RV770_ASI_DFLT;
4153         pi->pasi = CYPRESS_HASI_DFLT;
4154         pi->vrc = CYPRESS_VRC_DFLT;
4155
4156         pi->power_gating = false;
4157
4158         pi->gfx_clock_gating = true;
4159
4160         pi->mg_clock_gating = true;
4161         pi->mgcgtssm = true;
4162         eg_pi->ls_clock_gating = false;
4163         eg_pi->sclk_deep_sleep = false;
4164
4165         pi->dynamic_pcie_gen2 = true;
4166
4167         if (rdev->pm.int_thermal_type != THERMAL_TYPE_NONE)
4168                 pi->thermal_protection = true;
4169         else
4170                 pi->thermal_protection = false;
4171
4172         pi->display_gap = true;
4173
4174         pi->dcodt = true;
4175
4176         pi->ulps = true;
4177
4178         eg_pi->dynamic_ac_timing = true;
4179         eg_pi->abm = true;
4180         eg_pi->mcls = true;
4181         eg_pi->light_sleep = true;
4182         eg_pi->memory_transition = true;
4183 #if defined(CONFIG_ACPI)
4184         eg_pi->pcie_performance_request =
4185                 radeon_acpi_is_pcie_performance_request_supported(rdev);
4186 #else
4187         eg_pi->pcie_performance_request = false;
4188 #endif
4189
4190         eg_pi->dll_default_on = false;
4191
4192         eg_pi->sclk_deep_sleep = false;
4193
4194         pi->mclk_stutter_mode_threshold = 0;
4195
4196         pi->sram_end = SMC_RAM_END;
4197
4198         rdev->pm.dpm.dyn_state.mclk_sclk_ratio = 3;
4199         rdev->pm.dpm.dyn_state.vddc_vddci_delta = 200;
4200         rdev->pm.dpm.dyn_state.min_vddc_for_pcie_gen2 = 900;
4201         rdev->pm.dpm.dyn_state.valid_sclk_values.count = ARRAY_SIZE(btc_valid_sclk);
4202         rdev->pm.dpm.dyn_state.valid_sclk_values.values = btc_valid_sclk;
4203         rdev->pm.dpm.dyn_state.valid_mclk_values.count = 0;
4204         rdev->pm.dpm.dyn_state.valid_mclk_values.values = NULL;
4205         rdev->pm.dpm.dyn_state.sclk_mclk_delta = 12500;
4206
4207         ni_pi->cac_data.leakage_coefficients.at = 516;
4208         ni_pi->cac_data.leakage_coefficients.bt = 18;
4209         ni_pi->cac_data.leakage_coefficients.av = 51;
4210         ni_pi->cac_data.leakage_coefficients.bv = 2957;
4211
4212         switch (rdev->pdev->device) {
4213         case 0x6700:
4214         case 0x6701:
4215         case 0x6702:
4216         case 0x6703:
4217         case 0x6718:
4218                 ni_pi->cac_weights = &cac_weights_cayman_xt;
4219                 break;
4220         case 0x6705:
4221         case 0x6719:
4222         case 0x671D:
4223         case 0x671C:
4224         default:
4225                 ni_pi->cac_weights = &cac_weights_cayman_pro;
4226                 break;
4227         case 0x6704:
4228         case 0x6706:
4229         case 0x6707:
4230         case 0x6708:
4231         case 0x6709:
4232                 ni_pi->cac_weights = &cac_weights_cayman_le;
4233                 break;
4234         }
4235
4236         if (ni_pi->cac_weights->enable_power_containment_by_default) {
4237                 ni_pi->enable_power_containment = true;
4238                 ni_pi->enable_cac = true;
4239                 ni_pi->enable_sq_ramping = true;
4240         } else {
4241                 ni_pi->enable_power_containment = false;
4242                 ni_pi->enable_cac = false;
4243                 ni_pi->enable_sq_ramping = false;
4244         }
4245
4246         ni_pi->driver_calculate_cac_leakage = false;
4247         ni_pi->cac_configuration_required = true;
4248
4249         if (ni_pi->cac_configuration_required) {
4250                 ni_pi->support_cac_long_term_average = true;
4251                 ni_pi->lta_window_size = ni_pi->cac_weights->l2_lta_window_size;
4252                 ni_pi->lts_truncate = ni_pi->cac_weights->lts_truncate;
4253         } else {
4254                 ni_pi->support_cac_long_term_average = false;
4255                 ni_pi->lta_window_size = 0;
4256                 ni_pi->lts_truncate = 0;
4257         }
4258
4259         ni_pi->use_power_boost_limit = true;
4260
4261         /* make sure dc limits are valid */
4262         if ((rdev->pm.dpm.dyn_state.max_clock_voltage_on_dc.sclk == 0) ||
4263             (rdev->pm.dpm.dyn_state.max_clock_voltage_on_dc.mclk == 0))
4264                 rdev->pm.dpm.dyn_state.max_clock_voltage_on_dc =
4265                         rdev->pm.dpm.dyn_state.max_clock_voltage_on_ac;
4266
4267         return 0;
4268 }
4269
4270 void ni_dpm_fini(struct radeon_device *rdev)
4271 {
4272         int i;
4273
4274         for (i = 0; i < rdev->pm.dpm.num_ps; i++) {
4275                 kfree(rdev->pm.dpm.ps[i].ps_priv);
4276         }
4277         kfree(rdev->pm.dpm.ps);
4278         kfree(rdev->pm.dpm.priv);
4279         kfree(rdev->pm.dpm.dyn_state.vddc_dependency_on_dispclk.entries);
4280         r600_free_extended_power_table(rdev);
4281 }
4282
4283 void ni_dpm_print_power_state(struct radeon_device *rdev,
4284                               struct radeon_ps *rps)
4285 {
4286         struct ni_ps *ps = ni_get_ps(rps);
4287         struct rv7xx_pl *pl;
4288         int i;
4289
4290         r600_dpm_print_class_info(rps->class, rps->class2);
4291         r600_dpm_print_cap_info(rps->caps);
4292         printk("\tuvd    vclk: %d dclk: %d\n", rps->vclk, rps->dclk);
4293         for (i = 0; i < ps->performance_level_count; i++) {
4294                 pl = &ps->performance_levels[i];
4295                 if (rdev->family >= CHIP_TAHITI)
4296                         printk("\t\tpower level %d    sclk: %u mclk: %u vddc: %u vddci: %u pcie gen: %u\n",
4297                                i, pl->sclk, pl->mclk, pl->vddc, pl->vddci, pl->pcie_gen + 1);
4298                 else
4299                         printk("\t\tpower level %d    sclk: %u mclk: %u vddc: %u vddci: %u\n",
4300                                i, pl->sclk, pl->mclk, pl->vddc, pl->vddci);
4301         }
4302         r600_dpm_print_ps_status(rdev, rps);
4303 }
4304
4305 void ni_dpm_debugfs_print_current_performance_level(struct radeon_device *rdev,
4306                                                     struct seq_file *m)
4307 {
4308         struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
4309         struct radeon_ps *rps = &eg_pi->current_rps;
4310         struct ni_ps *ps = ni_get_ps(rps);
4311         struct rv7xx_pl *pl;
4312         u32 current_index =
4313                 (RREG32(TARGET_AND_CURRENT_PROFILE_INDEX) & CURRENT_STATE_INDEX_MASK) >>
4314                 CURRENT_STATE_INDEX_SHIFT;
4315
4316         if (current_index >= ps->performance_level_count) {
4317                 seq_printf(m, "invalid dpm profile %d\n", current_index);
4318         } else {
4319                 pl = &ps->performance_levels[current_index];
4320                 seq_printf(m, "uvd    vclk: %d dclk: %d\n", rps->vclk, rps->dclk);
4321                 seq_printf(m, "power level %d    sclk: %u mclk: %u vddc: %u vddci: %u\n",
4322                            current_index, pl->sclk, pl->mclk, pl->vddc, pl->vddci);
4323         }
4324 }
4325
4326 u32 ni_dpm_get_current_sclk(struct radeon_device *rdev)
4327 {
4328         struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
4329         struct radeon_ps *rps = &eg_pi->current_rps;
4330         struct ni_ps *ps = ni_get_ps(rps);
4331         struct rv7xx_pl *pl;
4332         u32 current_index =
4333                 (RREG32(TARGET_AND_CURRENT_PROFILE_INDEX) & CURRENT_STATE_INDEX_MASK) >>
4334                 CURRENT_STATE_INDEX_SHIFT;
4335
4336         if (current_index >= ps->performance_level_count) {
4337                 return 0;
4338         } else {
4339                 pl = &ps->performance_levels[current_index];
4340                 return pl->sclk;
4341         }
4342 }
4343
4344 u32 ni_dpm_get_current_mclk(struct radeon_device *rdev)
4345 {
4346         struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
4347         struct radeon_ps *rps = &eg_pi->current_rps;
4348         struct ni_ps *ps = ni_get_ps(rps);
4349         struct rv7xx_pl *pl;
4350         u32 current_index =
4351                 (RREG32(TARGET_AND_CURRENT_PROFILE_INDEX) & CURRENT_STATE_INDEX_MASK) >>
4352                 CURRENT_STATE_INDEX_SHIFT;
4353
4354         if (current_index >= ps->performance_level_count) {
4355                 return 0;
4356         } else {
4357                 pl = &ps->performance_levels[current_index];
4358                 return pl->mclk;
4359         }
4360 }
4361
4362 u32 ni_dpm_get_sclk(struct radeon_device *rdev, bool low)
4363 {
4364         struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
4365         struct ni_ps *requested_state = ni_get_ps(&eg_pi->requested_rps);
4366
4367         if (low)
4368                 return requested_state->performance_levels[0].sclk;
4369         else
4370                 return requested_state->performance_levels[requested_state->performance_level_count - 1].sclk;
4371 }
4372
4373 u32 ni_dpm_get_mclk(struct radeon_device *rdev, bool low)
4374 {
4375         struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
4376         struct ni_ps *requested_state = ni_get_ps(&eg_pi->requested_rps);
4377
4378         if (low)
4379                 return requested_state->performance_levels[0].mclk;
4380         else
4381                 return requested_state->performance_levels[requested_state->performance_level_count - 1].mclk;
4382 }
4383