cachepc-linux

Fork of AMDESE/linux with modifications for CachePC side-channel attack
git clone https://git.sinitax.com/sinitax/cachepc-linux
Log | Files | Refs | README | LICENSE | sfeed.txt

rv740_dpm.c (12645B)


      1/*
      2 * Copyright 2011 Advanced Micro Devices, Inc.
      3 *
      4 * Permission is hereby granted, free of charge, to any person obtaining a
      5 * copy of this software and associated documentation files (the "Software"),
      6 * to deal in the Software without restriction, including without limitation
      7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
      8 * and/or sell copies of the Software, and to permit persons to whom the
      9 * Software is furnished to do so, subject to the following conditions:
     10 *
     11 * The above copyright notice and this permission notice shall be included in
     12 * all copies or substantial portions of the Software.
     13 *
     14 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
     15 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
     16 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
     17 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
     18 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
     19 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
     20 * OTHER DEALINGS IN THE SOFTWARE.
     21 *
     22 * Authors: Alex Deucher
     23 */
     24
     25#include "radeon.h"
     26#include "rv740d.h"
     27#include "r600_dpm.h"
     28#include "rv770.h"
     29#include "rv770_dpm.h"
     30#include "atom.h"
     31
     32u32 rv740_get_decoded_reference_divider(u32 encoded_ref)
     33{
     34	u32 ref = 0;
     35
     36	switch (encoded_ref) {
     37	case 0:
     38		ref = 1;
     39		break;
     40	case 16:
     41		ref = 2;
     42		break;
     43	case 17:
     44		ref = 3;
     45		break;
     46	case 18:
     47		ref = 2;
     48		break;
     49	case 19:
     50		ref = 3;
     51		break;
     52	case 20:
     53		ref = 4;
     54		break;
     55	case 21:
     56		ref = 5;
     57		break;
     58	default:
     59		DRM_ERROR("Invalid encoded Reference Divider\n");
     60		ref = 0;
     61		break;
     62	}
     63
     64	return ref;
     65}
     66
     67struct dll_speed_setting {
     68	u16 min;
     69	u16 max;
     70	u32 dll_speed;
     71};
     72
     73static struct dll_speed_setting dll_speed_table[16] =
     74{
     75	{ 270, 320, 0x0f },
     76	{ 240, 270, 0x0e },
     77	{ 200, 240, 0x0d },
     78	{ 180, 200, 0x0c },
     79	{ 160, 180, 0x0b },
     80	{ 140, 160, 0x0a },
     81	{ 120, 140, 0x09 },
     82	{ 110, 120, 0x08 },
     83	{  95, 110, 0x07 },
     84	{  85,  95, 0x06 },
     85	{  78,  85, 0x05 },
     86	{  70,  78, 0x04 },
     87	{  65,  70, 0x03 },
     88	{  60,  65, 0x02 },
     89	{  42,  60, 0x01 },
     90	{  00,  42, 0x00 }
     91};
     92
     93u32 rv740_get_dll_speed(bool is_gddr5, u32 memory_clock)
     94{
     95	int i;
     96	u32 factor;
     97	u16 data_rate;
     98
     99	if (is_gddr5)
    100		factor = 4;
    101	else
    102		factor = 2;
    103
    104	data_rate = (u16)(memory_clock * factor / 1000);
    105
    106	if (data_rate < dll_speed_table[0].max) {
    107		for (i = 0; i < 16; i++) {
    108			if (data_rate > dll_speed_table[i].min &&
    109			    data_rate <= dll_speed_table[i].max)
    110				return dll_speed_table[i].dll_speed;
    111		}
    112	}
    113
    114	DRM_DEBUG_KMS("Target MCLK greater than largest MCLK in DLL speed table\n");
    115
    116	return 0x0f;
    117}
    118
    119int rv740_populate_sclk_value(struct radeon_device *rdev, u32 engine_clock,
    120			      RV770_SMC_SCLK_VALUE *sclk)
    121{
    122	struct rv7xx_power_info *pi = rv770_get_pi(rdev);
    123	struct atom_clock_dividers dividers;
    124	u32 spll_func_cntl = pi->clk_regs.rv770.cg_spll_func_cntl;
    125	u32 spll_func_cntl_2 = pi->clk_regs.rv770.cg_spll_func_cntl_2;
    126	u32 spll_func_cntl_3 = pi->clk_regs.rv770.cg_spll_func_cntl_3;
    127	u32 cg_spll_spread_spectrum = pi->clk_regs.rv770.cg_spll_spread_spectrum;
    128	u32 cg_spll_spread_spectrum_2 = pi->clk_regs.rv770.cg_spll_spread_spectrum_2;
    129	u64 tmp;
    130	u32 reference_clock = rdev->clock.spll.reference_freq;
    131	u32 reference_divider;
    132	u32 fbdiv;
    133	int ret;
    134
    135	ret = radeon_atom_get_clock_dividers(rdev, COMPUTE_ENGINE_PLL_PARAM,
    136					     engine_clock, false, &dividers);
    137	if (ret)
    138		return ret;
    139
    140	reference_divider = 1 + dividers.ref_div;
    141
    142	tmp = (u64) engine_clock * reference_divider * dividers.post_div * 16384;
    143	do_div(tmp, reference_clock);
    144	fbdiv = (u32) tmp;
    145
    146	spll_func_cntl &= ~(SPLL_PDIV_A_MASK | SPLL_REF_DIV_MASK);
    147	spll_func_cntl |= SPLL_REF_DIV(dividers.ref_div);
    148	spll_func_cntl |= SPLL_PDIV_A(dividers.post_div);
    149
    150	spll_func_cntl_2 &= ~SCLK_MUX_SEL_MASK;
    151	spll_func_cntl_2 |= SCLK_MUX_SEL(2);
    152
    153	spll_func_cntl_3 &= ~SPLL_FB_DIV_MASK;
    154	spll_func_cntl_3 |= SPLL_FB_DIV(fbdiv);
    155	spll_func_cntl_3 |= SPLL_DITHEN;
    156
    157	if (pi->sclk_ss) {
    158		struct radeon_atom_ss ss;
    159		u32 vco_freq = engine_clock * dividers.post_div;
    160
    161		if (radeon_atombios_get_asic_ss_info(rdev, &ss,
    162						     ASIC_INTERNAL_ENGINE_SS, vco_freq)) {
    163			u32 clk_s = reference_clock * 5 / (reference_divider * ss.rate);
    164			u32 clk_v = 4 * ss.percentage * fbdiv / (clk_s * 10000);
    165
    166			cg_spll_spread_spectrum &= ~CLK_S_MASK;
    167			cg_spll_spread_spectrum |= CLK_S(clk_s);
    168			cg_spll_spread_spectrum |= SSEN;
    169
    170			cg_spll_spread_spectrum_2 &= ~CLK_V_MASK;
    171			cg_spll_spread_spectrum_2 |= CLK_V(clk_v);
    172		}
    173	}
    174
    175	sclk->sclk_value = cpu_to_be32(engine_clock);
    176	sclk->vCG_SPLL_FUNC_CNTL = cpu_to_be32(spll_func_cntl);
    177	sclk->vCG_SPLL_FUNC_CNTL_2 = cpu_to_be32(spll_func_cntl_2);
    178	sclk->vCG_SPLL_FUNC_CNTL_3 = cpu_to_be32(spll_func_cntl_3);
    179	sclk->vCG_SPLL_SPREAD_SPECTRUM = cpu_to_be32(cg_spll_spread_spectrum);
    180	sclk->vCG_SPLL_SPREAD_SPECTRUM_2 = cpu_to_be32(cg_spll_spread_spectrum_2);
    181
    182	return 0;
    183}
    184
    185int rv740_populate_mclk_value(struct radeon_device *rdev,
    186			      u32 engine_clock, u32 memory_clock,
    187			      RV7XX_SMC_MCLK_VALUE *mclk)
    188{
    189	struct rv7xx_power_info *pi = rv770_get_pi(rdev);
    190	u32 mpll_ad_func_cntl = pi->clk_regs.rv770.mpll_ad_func_cntl;
    191	u32 mpll_ad_func_cntl_2 = pi->clk_regs.rv770.mpll_ad_func_cntl_2;
    192	u32 mpll_dq_func_cntl = pi->clk_regs.rv770.mpll_dq_func_cntl;
    193	u32 mpll_dq_func_cntl_2 = pi->clk_regs.rv770.mpll_dq_func_cntl_2;
    194	u32 mclk_pwrmgt_cntl = pi->clk_regs.rv770.mclk_pwrmgt_cntl;
    195	u32 dll_cntl = pi->clk_regs.rv770.dll_cntl;
    196	u32 mpll_ss1 = pi->clk_regs.rv770.mpll_ss1;
    197	u32 mpll_ss2 = pi->clk_regs.rv770.mpll_ss2;
    198	struct atom_clock_dividers dividers;
    199	u32 ibias;
    200	u32 dll_speed;
    201	int ret;
    202
    203	ret = radeon_atom_get_clock_dividers(rdev, COMPUTE_MEMORY_PLL_PARAM,
    204					     memory_clock, false, &dividers);
    205	if (ret)
    206		return ret;
    207
    208	ibias = rv770_map_clkf_to_ibias(rdev, dividers.whole_fb_div);
    209
    210	mpll_ad_func_cntl &= ~(CLKR_MASK |
    211			       YCLK_POST_DIV_MASK |
    212			       CLKF_MASK |
    213			       CLKFRAC_MASK |
    214			       IBIAS_MASK);
    215	mpll_ad_func_cntl |= CLKR(dividers.ref_div);
    216	mpll_ad_func_cntl |= YCLK_POST_DIV(dividers.post_div);
    217	mpll_ad_func_cntl |= CLKF(dividers.whole_fb_div);
    218	mpll_ad_func_cntl |= CLKFRAC(dividers.frac_fb_div);
    219	mpll_ad_func_cntl |= IBIAS(ibias);
    220
    221	if (dividers.vco_mode)
    222		mpll_ad_func_cntl_2 |= VCO_MODE;
    223	else
    224		mpll_ad_func_cntl_2 &= ~VCO_MODE;
    225
    226	if (pi->mem_gddr5) {
    227		mpll_dq_func_cntl &= ~(CLKR_MASK |
    228				       YCLK_POST_DIV_MASK |
    229				       CLKF_MASK |
    230				       CLKFRAC_MASK |
    231				       IBIAS_MASK);
    232		mpll_dq_func_cntl |= CLKR(dividers.ref_div);
    233		mpll_dq_func_cntl |= YCLK_POST_DIV(dividers.post_div);
    234		mpll_dq_func_cntl |= CLKF(dividers.whole_fb_div);
    235		mpll_dq_func_cntl |= CLKFRAC(dividers.frac_fb_div);
    236		mpll_dq_func_cntl |= IBIAS(ibias);
    237
    238		if (dividers.vco_mode)
    239			mpll_dq_func_cntl_2 |= VCO_MODE;
    240		else
    241			mpll_dq_func_cntl_2 &= ~VCO_MODE;
    242	}
    243
    244	if (pi->mclk_ss) {
    245		struct radeon_atom_ss ss;
    246		u32 vco_freq = memory_clock * dividers.post_div;
    247
    248		if (radeon_atombios_get_asic_ss_info(rdev, &ss,
    249						     ASIC_INTERNAL_MEMORY_SS, vco_freq)) {
    250			u32 reference_clock = rdev->clock.mpll.reference_freq;
    251			u32 decoded_ref = rv740_get_decoded_reference_divider(dividers.ref_div);
    252			u32 clk_s = reference_clock * 5 / (decoded_ref * ss.rate);
    253			u32 clk_v = 0x40000 * ss.percentage *
    254				(dividers.whole_fb_div + (dividers.frac_fb_div / 8)) / (clk_s * 10000);
    255
    256			mpll_ss1 &= ~CLKV_MASK;
    257			mpll_ss1 |= CLKV(clk_v);
    258
    259			mpll_ss2 &= ~CLKS_MASK;
    260			mpll_ss2 |= CLKS(clk_s);
    261		}
    262	}
    263
    264	dll_speed = rv740_get_dll_speed(pi->mem_gddr5,
    265					memory_clock);
    266
    267	mclk_pwrmgt_cntl &= ~DLL_SPEED_MASK;
    268	mclk_pwrmgt_cntl |= DLL_SPEED(dll_speed);
    269
    270	mclk->mclk770.mclk_value = cpu_to_be32(memory_clock);
    271	mclk->mclk770.vMPLL_AD_FUNC_CNTL = cpu_to_be32(mpll_ad_func_cntl);
    272	mclk->mclk770.vMPLL_AD_FUNC_CNTL_2 = cpu_to_be32(mpll_ad_func_cntl_2);
    273	mclk->mclk770.vMPLL_DQ_FUNC_CNTL = cpu_to_be32(mpll_dq_func_cntl);
    274	mclk->mclk770.vMPLL_DQ_FUNC_CNTL_2 = cpu_to_be32(mpll_dq_func_cntl_2);
    275	mclk->mclk770.vMCLK_PWRMGT_CNTL = cpu_to_be32(mclk_pwrmgt_cntl);
    276	mclk->mclk770.vDLL_CNTL = cpu_to_be32(dll_cntl);
    277	mclk->mclk770.vMPLL_SS = cpu_to_be32(mpll_ss1);
    278	mclk->mclk770.vMPLL_SS2 = cpu_to_be32(mpll_ss2);
    279
    280	return 0;
    281}
    282
    283void rv740_read_clock_registers(struct radeon_device *rdev)
    284{
    285	struct rv7xx_power_info *pi = rv770_get_pi(rdev);
    286
    287	pi->clk_regs.rv770.cg_spll_func_cntl =
    288		RREG32(CG_SPLL_FUNC_CNTL);
    289	pi->clk_regs.rv770.cg_spll_func_cntl_2 =
    290		RREG32(CG_SPLL_FUNC_CNTL_2);
    291	pi->clk_regs.rv770.cg_spll_func_cntl_3 =
    292		RREG32(CG_SPLL_FUNC_CNTL_3);
    293	pi->clk_regs.rv770.cg_spll_spread_spectrum =
    294		RREG32(CG_SPLL_SPREAD_SPECTRUM);
    295	pi->clk_regs.rv770.cg_spll_spread_spectrum_2 =
    296		RREG32(CG_SPLL_SPREAD_SPECTRUM_2);
    297
    298	pi->clk_regs.rv770.mpll_ad_func_cntl =
    299		RREG32(MPLL_AD_FUNC_CNTL);
    300	pi->clk_regs.rv770.mpll_ad_func_cntl_2 =
    301		RREG32(MPLL_AD_FUNC_CNTL_2);
    302	pi->clk_regs.rv770.mpll_dq_func_cntl =
    303		RREG32(MPLL_DQ_FUNC_CNTL);
    304	pi->clk_regs.rv770.mpll_dq_func_cntl_2 =
    305		RREG32(MPLL_DQ_FUNC_CNTL_2);
    306	pi->clk_regs.rv770.mclk_pwrmgt_cntl =
    307		RREG32(MCLK_PWRMGT_CNTL);
    308	pi->clk_regs.rv770.dll_cntl = RREG32(DLL_CNTL);
    309	pi->clk_regs.rv770.mpll_ss1 = RREG32(MPLL_SS1);
    310	pi->clk_regs.rv770.mpll_ss2 = RREG32(MPLL_SS2);
    311}
    312
    313int rv740_populate_smc_acpi_state(struct radeon_device *rdev,
    314				  RV770_SMC_STATETABLE *table)
    315{
    316	struct rv7xx_power_info *pi = rv770_get_pi(rdev);
    317	u32 mpll_ad_func_cntl = pi->clk_regs.rv770.mpll_ad_func_cntl;
    318	u32 mpll_ad_func_cntl_2 = pi->clk_regs.rv770.mpll_ad_func_cntl_2;
    319	u32 mpll_dq_func_cntl = pi->clk_regs.rv770.mpll_dq_func_cntl;
    320	u32 mpll_dq_func_cntl_2 = pi->clk_regs.rv770.mpll_dq_func_cntl_2;
    321	u32 spll_func_cntl = pi->clk_regs.rv770.cg_spll_func_cntl;
    322	u32 spll_func_cntl_2 = pi->clk_regs.rv770.cg_spll_func_cntl_2;
    323	u32 spll_func_cntl_3 = pi->clk_regs.rv770.cg_spll_func_cntl_3;
    324	u32 mclk_pwrmgt_cntl = pi->clk_regs.rv770.mclk_pwrmgt_cntl;
    325	u32 dll_cntl = pi->clk_regs.rv770.dll_cntl;
    326
    327	table->ACPIState = table->initialState;
    328
    329	table->ACPIState.flags &= ~PPSMC_SWSTATE_FLAG_DC;
    330
    331	if (pi->acpi_vddc) {
    332		rv770_populate_vddc_value(rdev, pi->acpi_vddc,
    333					  &table->ACPIState.levels[0].vddc);
    334		table->ACPIState.levels[0].gen2PCIE =
    335			pi->pcie_gen2 ?
    336			pi->acpi_pcie_gen2 : 0;
    337		table->ACPIState.levels[0].gen2XSP =
    338			pi->acpi_pcie_gen2;
    339	} else {
    340		rv770_populate_vddc_value(rdev, pi->min_vddc_in_table,
    341					  &table->ACPIState.levels[0].vddc);
    342		table->ACPIState.levels[0].gen2PCIE = 0;
    343	}
    344
    345	mpll_ad_func_cntl_2 |= BIAS_GEN_PDNB | RESET_EN;
    346
    347	mpll_dq_func_cntl_2 |= BYPASS | BIAS_GEN_PDNB | RESET_EN;
    348
    349	mclk_pwrmgt_cntl |= (MRDCKA0_RESET |
    350			     MRDCKA1_RESET |
    351			     MRDCKB0_RESET |
    352			     MRDCKB1_RESET |
    353			     MRDCKC0_RESET |
    354			     MRDCKC1_RESET |
    355			     MRDCKD0_RESET |
    356			     MRDCKD1_RESET);
    357
    358	dll_cntl |= (MRDCKA0_BYPASS |
    359		     MRDCKA1_BYPASS |
    360		     MRDCKB0_BYPASS |
    361		     MRDCKB1_BYPASS |
    362		     MRDCKC0_BYPASS |
    363		     MRDCKC1_BYPASS |
    364		     MRDCKD0_BYPASS |
    365		     MRDCKD1_BYPASS);
    366
    367	spll_func_cntl |= SPLL_RESET | SPLL_SLEEP | SPLL_BYPASS_EN;
    368
    369	spll_func_cntl_2 &= ~SCLK_MUX_SEL_MASK;
    370	spll_func_cntl_2 |= SCLK_MUX_SEL(4);
    371
    372	table->ACPIState.levels[0].mclk.mclk770.vMPLL_AD_FUNC_CNTL = cpu_to_be32(mpll_ad_func_cntl);
    373	table->ACPIState.levels[0].mclk.mclk770.vMPLL_AD_FUNC_CNTL_2 = cpu_to_be32(mpll_ad_func_cntl_2);
    374	table->ACPIState.levels[0].mclk.mclk770.vMPLL_DQ_FUNC_CNTL = cpu_to_be32(mpll_dq_func_cntl);
    375	table->ACPIState.levels[0].mclk.mclk770.vMPLL_DQ_FUNC_CNTL_2 = cpu_to_be32(mpll_dq_func_cntl_2);
    376	table->ACPIState.levels[0].mclk.mclk770.vMCLK_PWRMGT_CNTL = cpu_to_be32(mclk_pwrmgt_cntl);
    377	table->ACPIState.levels[0].mclk.mclk770.vDLL_CNTL = cpu_to_be32(dll_cntl);
    378
    379	table->ACPIState.levels[0].mclk.mclk770.mclk_value = 0;
    380
    381	table->ACPIState.levels[0].sclk.vCG_SPLL_FUNC_CNTL = cpu_to_be32(spll_func_cntl);
    382	table->ACPIState.levels[0].sclk.vCG_SPLL_FUNC_CNTL_2 = cpu_to_be32(spll_func_cntl_2);
    383	table->ACPIState.levels[0].sclk.vCG_SPLL_FUNC_CNTL_3 = cpu_to_be32(spll_func_cntl_3);
    384
    385	table->ACPIState.levels[0].sclk.sclk_value = 0;
    386
    387	table->ACPIState.levels[1] = table->ACPIState.levels[0];
    388	table->ACPIState.levels[2] = table->ACPIState.levels[0];
    389
    390	rv770_populate_mvdd_value(rdev, 0, &table->ACPIState.levels[0].mvdd);
    391
    392	return 0;
    393}
    394
    395void rv740_enable_mclk_spread_spectrum(struct radeon_device *rdev,
    396				       bool enable)
    397{
    398	if (enable)
    399		WREG32_P(MPLL_CNTL_MODE, SS_SSEN, ~SS_SSEN);
    400	else
    401		WREG32_P(MPLL_CNTL_MODE, 0, ~SS_SSEN);
    402}
    403
    404u8 rv740_get_mclk_frequency_ratio(u32 memory_clock)
    405{
    406	u8 mc_para_index;
    407
    408	if ((memory_clock < 10000) || (memory_clock > 47500))
    409		mc_para_index = 0x00;
    410	else
    411		mc_para_index = (u8)((memory_clock - 10000) / 2500);
    412
    413	return mc_para_index;
    414}