GNU Linux-libre 4.19.304-gnu1
[releases.git] / drivers / gpu / drm / radeon / rv740_dpm.c
1 /*
2  * Copyright 2011 Advanced Micro Devices, Inc.
3  *
4  * Permission is hereby granted, free of charge, to any person obtaining a
5  * copy of this software and associated documentation files (the "Software"),
6  * to deal in the Software without restriction, including without limitation
7  * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8  * and/or sell copies of the Software, and to permit persons to whom the
9  * Software is furnished to do so, subject to the following conditions:
10  *
11  * The above copyright notice and this permission notice shall be included in
12  * all copies or substantial portions of the Software.
13  *
14  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
15  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
16  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
17  * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
18  * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
19  * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
20  * OTHER DEALINGS IN THE SOFTWARE.
21  *
22  * Authors: Alex Deucher
23  */
24
25 #include <drm/drmP.h>
26 #include "radeon.h"
27 #include "rv740d.h"
28 #include "r600_dpm.h"
29 #include "rv770_dpm.h"
30 #include "atom.h"
31
32 struct rv7xx_power_info *rv770_get_pi(struct radeon_device *rdev);
33
34 u32 rv740_get_decoded_reference_divider(u32 encoded_ref)
35 {
36         u32 ref = 0;
37
38         switch (encoded_ref) {
39         case 0:
40                 ref = 1;
41                 break;
42         case 16:
43                 ref = 2;
44                 break;
45         case 17:
46                 ref = 3;
47                 break;
48         case 18:
49                 ref = 2;
50                 break;
51         case 19:
52                 ref = 3;
53                 break;
54         case 20:
55                 ref = 4;
56                 break;
57         case 21:
58                 ref = 5;
59                 break;
60         default:
61                 DRM_ERROR("Invalid encoded Reference Divider\n");
62                 ref = 0;
63                 break;
64         }
65
66         return ref;
67 }
68
69 struct dll_speed_setting {
70         u16 min;
71         u16 max;
72         u32 dll_speed;
73 };
74
75 static struct dll_speed_setting dll_speed_table[16] =
76 {
77         { 270, 320, 0x0f },
78         { 240, 270, 0x0e },
79         { 200, 240, 0x0d },
80         { 180, 200, 0x0c },
81         { 160, 180, 0x0b },
82         { 140, 160, 0x0a },
83         { 120, 140, 0x09 },
84         { 110, 120, 0x08 },
85         {  95, 110, 0x07 },
86         {  85,  95, 0x06 },
87         {  78,  85, 0x05 },
88         {  70,  78, 0x04 },
89         {  65,  70, 0x03 },
90         {  60,  65, 0x02 },
91         {  42,  60, 0x01 },
92         {  00,  42, 0x00 }
93 };
94
95 u32 rv740_get_dll_speed(bool is_gddr5, u32 memory_clock)
96 {
97         int i;
98         u32 factor;
99         u16 data_rate;
100
101         if (is_gddr5)
102                 factor = 4;
103         else
104                 factor = 2;
105
106         data_rate = (u16)(memory_clock * factor / 1000);
107
108         if (data_rate < dll_speed_table[0].max) {
109                 for (i = 0; i < 16; i++) {
110                         if (data_rate > dll_speed_table[i].min &&
111                             data_rate <= dll_speed_table[i].max)
112                                 return dll_speed_table[i].dll_speed;
113                 }
114         }
115
116         DRM_DEBUG_KMS("Target MCLK greater than largest MCLK in DLL speed table\n");
117
118         return 0x0f;
119 }
120
121 int rv740_populate_sclk_value(struct radeon_device *rdev, u32 engine_clock,
122                               RV770_SMC_SCLK_VALUE *sclk)
123 {
124         struct rv7xx_power_info *pi = rv770_get_pi(rdev);
125         struct atom_clock_dividers dividers;
126         u32 spll_func_cntl = pi->clk_regs.rv770.cg_spll_func_cntl;
127         u32 spll_func_cntl_2 = pi->clk_regs.rv770.cg_spll_func_cntl_2;
128         u32 spll_func_cntl_3 = pi->clk_regs.rv770.cg_spll_func_cntl_3;
129         u32 cg_spll_spread_spectrum = pi->clk_regs.rv770.cg_spll_spread_spectrum;
130         u32 cg_spll_spread_spectrum_2 = pi->clk_regs.rv770.cg_spll_spread_spectrum_2;
131         u64 tmp;
132         u32 reference_clock = rdev->clock.spll.reference_freq;
133         u32 reference_divider;
134         u32 fbdiv;
135         int ret;
136
137         ret = radeon_atom_get_clock_dividers(rdev, COMPUTE_ENGINE_PLL_PARAM,
138                                              engine_clock, false, &dividers);
139         if (ret)
140                 return ret;
141
142         reference_divider = 1 + dividers.ref_div;
143
144         tmp = (u64) engine_clock * reference_divider * dividers.post_div * 16384;
145         do_div(tmp, reference_clock);
146         fbdiv = (u32) tmp;
147
148         spll_func_cntl &= ~(SPLL_PDIV_A_MASK | SPLL_REF_DIV_MASK);
149         spll_func_cntl |= SPLL_REF_DIV(dividers.ref_div);
150         spll_func_cntl |= SPLL_PDIV_A(dividers.post_div);
151
152         spll_func_cntl_2 &= ~SCLK_MUX_SEL_MASK;
153         spll_func_cntl_2 |= SCLK_MUX_SEL(2);
154
155         spll_func_cntl_3 &= ~SPLL_FB_DIV_MASK;
156         spll_func_cntl_3 |= SPLL_FB_DIV(fbdiv);
157         spll_func_cntl_3 |= SPLL_DITHEN;
158
159         if (pi->sclk_ss) {
160                 struct radeon_atom_ss ss;
161                 u32 vco_freq = engine_clock * dividers.post_div;
162
163                 if (radeon_atombios_get_asic_ss_info(rdev, &ss,
164                                                      ASIC_INTERNAL_ENGINE_SS, vco_freq)) {
165                         u32 clk_s = reference_clock * 5 / (reference_divider * ss.rate);
166                         u32 clk_v = 4 * ss.percentage * fbdiv / (clk_s * 10000);
167
168                         cg_spll_spread_spectrum &= ~CLK_S_MASK;
169                         cg_spll_spread_spectrum |= CLK_S(clk_s);
170                         cg_spll_spread_spectrum |= SSEN;
171
172                         cg_spll_spread_spectrum_2 &= ~CLK_V_MASK;
173                         cg_spll_spread_spectrum_2 |= CLK_V(clk_v);
174                 }
175         }
176
177         sclk->sclk_value = cpu_to_be32(engine_clock);
178         sclk->vCG_SPLL_FUNC_CNTL = cpu_to_be32(spll_func_cntl);
179         sclk->vCG_SPLL_FUNC_CNTL_2 = cpu_to_be32(spll_func_cntl_2);
180         sclk->vCG_SPLL_FUNC_CNTL_3 = cpu_to_be32(spll_func_cntl_3);
181         sclk->vCG_SPLL_SPREAD_SPECTRUM = cpu_to_be32(cg_spll_spread_spectrum);
182         sclk->vCG_SPLL_SPREAD_SPECTRUM_2 = cpu_to_be32(cg_spll_spread_spectrum_2);
183
184         return 0;
185 }
186
187 int rv740_populate_mclk_value(struct radeon_device *rdev,
188                               u32 engine_clock, u32 memory_clock,
189                               RV7XX_SMC_MCLK_VALUE *mclk)
190 {
191         struct rv7xx_power_info *pi = rv770_get_pi(rdev);
192         u32 mpll_ad_func_cntl = pi->clk_regs.rv770.mpll_ad_func_cntl;
193         u32 mpll_ad_func_cntl_2 = pi->clk_regs.rv770.mpll_ad_func_cntl_2;
194         u32 mpll_dq_func_cntl = pi->clk_regs.rv770.mpll_dq_func_cntl;
195         u32 mpll_dq_func_cntl_2 = pi->clk_regs.rv770.mpll_dq_func_cntl_2;
196         u32 mclk_pwrmgt_cntl = pi->clk_regs.rv770.mclk_pwrmgt_cntl;
197         u32 dll_cntl = pi->clk_regs.rv770.dll_cntl;
198         u32 mpll_ss1 = pi->clk_regs.rv770.mpll_ss1;
199         u32 mpll_ss2 = pi->clk_regs.rv770.mpll_ss2;
200         struct atom_clock_dividers dividers;
201         u32 ibias;
202         u32 dll_speed;
203         int ret;
204
205         ret = radeon_atom_get_clock_dividers(rdev, COMPUTE_MEMORY_PLL_PARAM,
206                                              memory_clock, false, &dividers);
207         if (ret)
208                 return ret;
209
210         ibias = rv770_map_clkf_to_ibias(rdev, dividers.whole_fb_div);
211
212         mpll_ad_func_cntl &= ~(CLKR_MASK |
213                                YCLK_POST_DIV_MASK |
214                                CLKF_MASK |
215                                CLKFRAC_MASK |
216                                IBIAS_MASK);
217         mpll_ad_func_cntl |= CLKR(dividers.ref_div);
218         mpll_ad_func_cntl |= YCLK_POST_DIV(dividers.post_div);
219         mpll_ad_func_cntl |= CLKF(dividers.whole_fb_div);
220         mpll_ad_func_cntl |= CLKFRAC(dividers.frac_fb_div);
221         mpll_ad_func_cntl |= IBIAS(ibias);
222
223         if (dividers.vco_mode)
224                 mpll_ad_func_cntl_2 |= VCO_MODE;
225         else
226                 mpll_ad_func_cntl_2 &= ~VCO_MODE;
227
228         if (pi->mem_gddr5) {
229                 mpll_dq_func_cntl &= ~(CLKR_MASK |
230                                        YCLK_POST_DIV_MASK |
231                                        CLKF_MASK |
232                                        CLKFRAC_MASK |
233                                        IBIAS_MASK);
234                 mpll_dq_func_cntl |= CLKR(dividers.ref_div);
235                 mpll_dq_func_cntl |= YCLK_POST_DIV(dividers.post_div);
236                 mpll_dq_func_cntl |= CLKF(dividers.whole_fb_div);
237                 mpll_dq_func_cntl |= CLKFRAC(dividers.frac_fb_div);
238                 mpll_dq_func_cntl |= IBIAS(ibias);
239
240                 if (dividers.vco_mode)
241                         mpll_dq_func_cntl_2 |= VCO_MODE;
242                 else
243                         mpll_dq_func_cntl_2 &= ~VCO_MODE;
244         }
245
246         if (pi->mclk_ss) {
247                 struct radeon_atom_ss ss;
248                 u32 vco_freq = memory_clock * dividers.post_div;
249
250                 if (radeon_atombios_get_asic_ss_info(rdev, &ss,
251                                                      ASIC_INTERNAL_MEMORY_SS, vco_freq)) {
252                         u32 reference_clock = rdev->clock.mpll.reference_freq;
253                         u32 decoded_ref = rv740_get_decoded_reference_divider(dividers.ref_div);
254                         u32 clk_s, clk_v;
255
256                         if (!decoded_ref)
257                                 return -EINVAL;
258                         clk_s = reference_clock * 5 / (decoded_ref * ss.rate);
259                         clk_v = 0x40000 * ss.percentage *
260                                 (dividers.whole_fb_div + (dividers.frac_fb_div / 8)) / (clk_s * 10000);
261
262                         mpll_ss1 &= ~CLKV_MASK;
263                         mpll_ss1 |= CLKV(clk_v);
264
265                         mpll_ss2 &= ~CLKS_MASK;
266                         mpll_ss2 |= CLKS(clk_s);
267                 }
268         }
269
270         dll_speed = rv740_get_dll_speed(pi->mem_gddr5,
271                                         memory_clock);
272
273         mclk_pwrmgt_cntl &= ~DLL_SPEED_MASK;
274         mclk_pwrmgt_cntl |= DLL_SPEED(dll_speed);
275
276         mclk->mclk770.mclk_value = cpu_to_be32(memory_clock);
277         mclk->mclk770.vMPLL_AD_FUNC_CNTL = cpu_to_be32(mpll_ad_func_cntl);
278         mclk->mclk770.vMPLL_AD_FUNC_CNTL_2 = cpu_to_be32(mpll_ad_func_cntl_2);
279         mclk->mclk770.vMPLL_DQ_FUNC_CNTL = cpu_to_be32(mpll_dq_func_cntl);
280         mclk->mclk770.vMPLL_DQ_FUNC_CNTL_2 = cpu_to_be32(mpll_dq_func_cntl_2);
281         mclk->mclk770.vMCLK_PWRMGT_CNTL = cpu_to_be32(mclk_pwrmgt_cntl);
282         mclk->mclk770.vDLL_CNTL = cpu_to_be32(dll_cntl);
283         mclk->mclk770.vMPLL_SS = cpu_to_be32(mpll_ss1);
284         mclk->mclk770.vMPLL_SS2 = cpu_to_be32(mpll_ss2);
285
286         return 0;
287 }
288
289 void rv740_read_clock_registers(struct radeon_device *rdev)
290 {
291         struct rv7xx_power_info *pi = rv770_get_pi(rdev);
292
293         pi->clk_regs.rv770.cg_spll_func_cntl =
294                 RREG32(CG_SPLL_FUNC_CNTL);
295         pi->clk_regs.rv770.cg_spll_func_cntl_2 =
296                 RREG32(CG_SPLL_FUNC_CNTL_2);
297         pi->clk_regs.rv770.cg_spll_func_cntl_3 =
298                 RREG32(CG_SPLL_FUNC_CNTL_3);
299         pi->clk_regs.rv770.cg_spll_spread_spectrum =
300                 RREG32(CG_SPLL_SPREAD_SPECTRUM);
301         pi->clk_regs.rv770.cg_spll_spread_spectrum_2 =
302                 RREG32(CG_SPLL_SPREAD_SPECTRUM_2);
303
304         pi->clk_regs.rv770.mpll_ad_func_cntl =
305                 RREG32(MPLL_AD_FUNC_CNTL);
306         pi->clk_regs.rv770.mpll_ad_func_cntl_2 =
307                 RREG32(MPLL_AD_FUNC_CNTL_2);
308         pi->clk_regs.rv770.mpll_dq_func_cntl =
309                 RREG32(MPLL_DQ_FUNC_CNTL);
310         pi->clk_regs.rv770.mpll_dq_func_cntl_2 =
311                 RREG32(MPLL_DQ_FUNC_CNTL_2);
312         pi->clk_regs.rv770.mclk_pwrmgt_cntl =
313                 RREG32(MCLK_PWRMGT_CNTL);
314         pi->clk_regs.rv770.dll_cntl = RREG32(DLL_CNTL);
315         pi->clk_regs.rv770.mpll_ss1 = RREG32(MPLL_SS1);
316         pi->clk_regs.rv770.mpll_ss2 = RREG32(MPLL_SS2);
317 }
318
319 int rv740_populate_smc_acpi_state(struct radeon_device *rdev,
320                                   RV770_SMC_STATETABLE *table)
321 {
322         struct rv7xx_power_info *pi = rv770_get_pi(rdev);
323         u32 mpll_ad_func_cntl = pi->clk_regs.rv770.mpll_ad_func_cntl;
324         u32 mpll_ad_func_cntl_2 = pi->clk_regs.rv770.mpll_ad_func_cntl_2;
325         u32 mpll_dq_func_cntl = pi->clk_regs.rv770.mpll_dq_func_cntl;
326         u32 mpll_dq_func_cntl_2 = pi->clk_regs.rv770.mpll_dq_func_cntl_2;
327         u32 spll_func_cntl = pi->clk_regs.rv770.cg_spll_func_cntl;
328         u32 spll_func_cntl_2 = pi->clk_regs.rv770.cg_spll_func_cntl_2;
329         u32 spll_func_cntl_3 = pi->clk_regs.rv770.cg_spll_func_cntl_3;
330         u32 mclk_pwrmgt_cntl = pi->clk_regs.rv770.mclk_pwrmgt_cntl;
331         u32 dll_cntl = pi->clk_regs.rv770.dll_cntl;
332
333         table->ACPIState = table->initialState;
334
335         table->ACPIState.flags &= ~PPSMC_SWSTATE_FLAG_DC;
336
337         if (pi->acpi_vddc) {
338                 rv770_populate_vddc_value(rdev, pi->acpi_vddc,
339                                           &table->ACPIState.levels[0].vddc);
340                 table->ACPIState.levels[0].gen2PCIE =
341                         pi->pcie_gen2 ?
342                         pi->acpi_pcie_gen2 : 0;
343                 table->ACPIState.levels[0].gen2XSP =
344                         pi->acpi_pcie_gen2;
345         } else {
346                 rv770_populate_vddc_value(rdev, pi->min_vddc_in_table,
347                                           &table->ACPIState.levels[0].vddc);
348                 table->ACPIState.levels[0].gen2PCIE = 0;
349         }
350
351         mpll_ad_func_cntl_2 |= BIAS_GEN_PDNB | RESET_EN;
352
353         mpll_dq_func_cntl_2 |= BYPASS | BIAS_GEN_PDNB | RESET_EN;
354
355         mclk_pwrmgt_cntl |= (MRDCKA0_RESET |
356                              MRDCKA1_RESET |
357                              MRDCKB0_RESET |
358                              MRDCKB1_RESET |
359                              MRDCKC0_RESET |
360                              MRDCKC1_RESET |
361                              MRDCKD0_RESET |
362                              MRDCKD1_RESET);
363
364         dll_cntl |= (MRDCKA0_BYPASS |
365                      MRDCKA1_BYPASS |
366                      MRDCKB0_BYPASS |
367                      MRDCKB1_BYPASS |
368                      MRDCKC0_BYPASS |
369                      MRDCKC1_BYPASS |
370                      MRDCKD0_BYPASS |
371                      MRDCKD1_BYPASS);
372
373         spll_func_cntl |= SPLL_RESET | SPLL_SLEEP | SPLL_BYPASS_EN;
374
375         spll_func_cntl_2 &= ~SCLK_MUX_SEL_MASK;
376         spll_func_cntl_2 |= SCLK_MUX_SEL(4);
377
378         table->ACPIState.levels[0].mclk.mclk770.vMPLL_AD_FUNC_CNTL = cpu_to_be32(mpll_ad_func_cntl);
379         table->ACPIState.levels[0].mclk.mclk770.vMPLL_AD_FUNC_CNTL_2 = cpu_to_be32(mpll_ad_func_cntl_2);
380         table->ACPIState.levels[0].mclk.mclk770.vMPLL_DQ_FUNC_CNTL = cpu_to_be32(mpll_dq_func_cntl);
381         table->ACPIState.levels[0].mclk.mclk770.vMPLL_DQ_FUNC_CNTL_2 = cpu_to_be32(mpll_dq_func_cntl_2);
382         table->ACPIState.levels[0].mclk.mclk770.vMCLK_PWRMGT_CNTL = cpu_to_be32(mclk_pwrmgt_cntl);
383         table->ACPIState.levels[0].mclk.mclk770.vDLL_CNTL = cpu_to_be32(dll_cntl);
384
385         table->ACPIState.levels[0].mclk.mclk770.mclk_value = 0;
386
387         table->ACPIState.levels[0].sclk.vCG_SPLL_FUNC_CNTL = cpu_to_be32(spll_func_cntl);
388         table->ACPIState.levels[0].sclk.vCG_SPLL_FUNC_CNTL_2 = cpu_to_be32(spll_func_cntl_2);
389         table->ACPIState.levels[0].sclk.vCG_SPLL_FUNC_CNTL_3 = cpu_to_be32(spll_func_cntl_3);
390
391         table->ACPIState.levels[0].sclk.sclk_value = 0;
392
393         table->ACPIState.levels[1] = table->ACPIState.levels[0];
394         table->ACPIState.levels[2] = table->ACPIState.levels[0];
395
396         rv770_populate_mvdd_value(rdev, 0, &table->ACPIState.levels[0].mvdd);
397
398         return 0;
399 }
400
401 void rv740_enable_mclk_spread_spectrum(struct radeon_device *rdev,
402                                        bool enable)
403 {
404         if (enable)
405                 WREG32_P(MPLL_CNTL_MODE, SS_SSEN, ~SS_SSEN);
406         else
407                 WREG32_P(MPLL_CNTL_MODE, 0, ~SS_SSEN);
408 }
409
410 u8 rv740_get_mclk_frequency_ratio(u32 memory_clock)
411 {
412         u8 mc_para_index;
413
414         if ((memory_clock < 10000) || (memory_clock > 47500))
415                 mc_para_index = 0x00;
416         else
417                 mc_para_index = (u8)((memory_clock - 10000) / 2500);
418
419         return mc_para_index;
420 }