diff options
Diffstat (limited to 'drivers/gpu/drm/amd/amdgpu/si.c')
| -rw-r--r-- | drivers/gpu/drm/amd/amdgpu/si.c | 398 | 
1 files changed, 386 insertions, 12 deletions
| diff --git a/drivers/gpu/drm/amd/amdgpu/si.c b/drivers/gpu/drm/amd/amdgpu/si.c index 153db3f763bc..1b449291f068 100644 --- a/drivers/gpu/drm/amd/amdgpu/si.c +++ b/drivers/gpu/drm/amd/amdgpu/si.c @@ -41,9 +41,11 @@  #include "si_dma.h"  #include "dce_v6_0.h"  #include "si.h" +#include "uvd_v3_1.h"  #include "dce_virtual.h"  #include "gca/gfx_6_0_d.h"  #include "oss/oss_1_0_d.h" +#include "oss/oss_1_0_sh_mask.h"  #include "gmc/gmc_6_0_d.h"  #include "dce/dce_6_0_d.h"  #include "uvd/uvd_4_0_d.h" @@ -973,6 +975,28 @@ static void si_smc_wreg(struct amdgpu_device *adev, u32 reg, u32 v)  	spin_unlock_irqrestore(&adev->smc_idx_lock, flags);  } +static u32 si_uvd_ctx_rreg(struct amdgpu_device *adev, u32 reg) +{ +	unsigned long flags; +	u32 r; + +	spin_lock_irqsave(&adev->uvd_ctx_idx_lock, flags); +	WREG32(mmUVD_CTX_INDEX, ((reg) & 0x1ff)); +	r = RREG32(mmUVD_CTX_DATA); +	spin_unlock_irqrestore(&adev->uvd_ctx_idx_lock, flags); +	return r; +} + +static void si_uvd_ctx_wreg(struct amdgpu_device *adev, u32 reg, u32 v) +{ +	unsigned long flags; + +	spin_lock_irqsave(&adev->uvd_ctx_idx_lock, flags); +	WREG32(mmUVD_CTX_INDEX, ((reg) & 0x1ff)); +	WREG32(mmUVD_CTX_DATA, (v)); +	spin_unlock_irqrestore(&adev->uvd_ctx_idx_lock, flags); +} +  static struct amdgpu_allowed_register_entry si_allowed_read_registers[] = {  	{GRBM_STATUS},  	{mmGRBM_STATUS2}, @@ -1205,6 +1229,11 @@ static bool si_asic_supports_baco(struct amdgpu_device *adev)  static enum amd_reset_method  si_asic_reset_method(struct amdgpu_device *adev)  { +	if (amdgpu_reset_method != AMD_RESET_METHOD_LEGACY && +	    amdgpu_reset_method != -1) +		dev_warn(adev->dev, "Specified reset method:%d isn't supported, using AUTO instead.\n", +				  amdgpu_reset_method); +  	return AMD_RESET_METHOD_LEGACY;  } @@ -1243,12 +1272,6 @@ static u32 si_get_xclk(struct amdgpu_device *adev)  	return reference_clock;  } -//xxx:not implemented -static int si_set_uvd_clocks(struct amdgpu_device *adev, u32 vclk, u32 dclk) -{ -	return 0; -} -  static void si_flush_hdp(struct amdgpu_device *adev, struct amdgpu_ring *ring)  {  	if (!ring || !ring->funcs->emit_wreg) { @@ -1404,6 +1427,358 @@ static uint64_t si_get_pcie_replay_count(struct amdgpu_device *adev)  	return (nak_r + nak_g);  } +static int si_uvd_send_upll_ctlreq(struct amdgpu_device *adev, +				   unsigned cg_upll_func_cntl) +{ +	unsigned i; + +	/* Make sure UPLL_CTLREQ is deasserted */ +	WREG32_P(cg_upll_func_cntl, 0, ~UPLL_CTLREQ_MASK); + +	mdelay(10); + +	/* Assert UPLL_CTLREQ */ +	WREG32_P(cg_upll_func_cntl, UPLL_CTLREQ_MASK, ~UPLL_CTLREQ_MASK); + +	/* Wait for CTLACK and CTLACK2 to get asserted */ +	for (i = 0; i < SI_MAX_CTLACKS_ASSERTION_WAIT; ++i) { +		uint32_t mask = UPLL_CTLACK_MASK | UPLL_CTLACK2_MASK; + +		if ((RREG32(cg_upll_func_cntl) & mask) == mask) +			break; +		mdelay(10); +	} + +	/* Deassert UPLL_CTLREQ */ +	WREG32_P(cg_upll_func_cntl, 0, ~UPLL_CTLREQ_MASK); + +	if (i == SI_MAX_CTLACKS_ASSERTION_WAIT) { +		DRM_ERROR("Timeout setting UVD clocks!\n"); +		return -ETIMEDOUT; +	} + +	return 0; +} + +static unsigned si_uvd_calc_upll_post_div(unsigned vco_freq, +					  unsigned target_freq, +					  unsigned pd_min, +					  unsigned pd_even) +{ +	unsigned post_div = vco_freq / target_freq; + +	/* Adjust to post divider minimum value */ +	if (post_div < pd_min) +		post_div = pd_min; + +	/* We alway need a frequency less than or equal the target */ +	if ((vco_freq / post_div) > target_freq) +		post_div += 1; + +	/* Post dividers above a certain value must be even */ +	if (post_div > pd_even && post_div % 2) +		post_div += 1; + +	return post_div; +} + +/** + * si_calc_upll_dividers - calc UPLL clock dividers + * + * @adev: amdgpu_device pointer + * @vclk: wanted VCLK + * @dclk: wanted DCLK + * @vco_min: minimum VCO frequency + * @vco_max: maximum VCO frequency + * @fb_factor: factor to multiply vco freq with + * @fb_mask: limit and bitmask for feedback divider + * @pd_min: post divider minimum + * @pd_max: post divider maximum + * @pd_even: post divider must be even above this value + * @optimal_fb_div: resulting feedback divider + * @optimal_vclk_div: resulting vclk post divider + * @optimal_dclk_div: resulting dclk post divider + * + * Calculate dividers for UVDs UPLL (except APUs). + * Returns zero on success; -EINVAL on error. + */ +static int si_calc_upll_dividers(struct amdgpu_device *adev, +				 unsigned vclk, unsigned dclk, +				 unsigned vco_min, unsigned vco_max, +				 unsigned fb_factor, unsigned fb_mask, +				 unsigned pd_min, unsigned pd_max, +				 unsigned pd_even, +				 unsigned *optimal_fb_div, +				 unsigned *optimal_vclk_div, +				 unsigned *optimal_dclk_div) +{ +	unsigned vco_freq, ref_freq = adev->clock.spll.reference_freq; + +	/* Start off with something large */ +	unsigned optimal_score = ~0; + +	/* Loop through vco from low to high */ +	vco_min = max(max(vco_min, vclk), dclk); +	for (vco_freq = vco_min; vco_freq <= vco_max; vco_freq += 100) { +		uint64_t fb_div = (uint64_t)vco_freq * fb_factor; +		unsigned vclk_div, dclk_div, score; + +		do_div(fb_div, ref_freq); + +		/* fb div out of range ? */ +		if (fb_div > fb_mask) +			break; /* It can oly get worse */ + +		fb_div &= fb_mask; + +		/* Calc vclk divider with current vco freq */ +		vclk_div = si_uvd_calc_upll_post_div(vco_freq, vclk, +						     pd_min, pd_even); +		if (vclk_div > pd_max) +			break; /* vco is too big, it has to stop */ + +		/* Calc dclk divider with current vco freq */ +		dclk_div = si_uvd_calc_upll_post_div(vco_freq, dclk, +						     pd_min, pd_even); +		if (dclk_div > pd_max) +			break; /* vco is too big, it has to stop */ + +		/* Calc score with current vco freq */ +		score = vclk - (vco_freq / vclk_div) + dclk - (vco_freq / dclk_div); + +		/* Determine if this vco setting is better than current optimal settings */ +		if (score < optimal_score) { +			*optimal_fb_div = fb_div; +			*optimal_vclk_div = vclk_div; +			*optimal_dclk_div = dclk_div; +			optimal_score = score; +			if (optimal_score == 0) +				break; /* It can't get better than this */ +		} +	} + +	/* Did we found a valid setup ? */ +	if (optimal_score == ~0) +		return -EINVAL; + +	return 0; +} + +static int si_set_uvd_clocks(struct amdgpu_device *adev, u32 vclk, u32 dclk) +{ +	unsigned fb_div = 0, vclk_div = 0, dclk_div = 0; +	int r; + +	/* Bypass vclk and dclk with bclk */ +	WREG32_P(CG_UPLL_FUNC_CNTL_2, +		 VCLK_SRC_SEL(1) | DCLK_SRC_SEL(1), +		 ~(VCLK_SRC_SEL_MASK | DCLK_SRC_SEL_MASK)); + +	/* Put PLL in bypass mode */ +	WREG32_P(CG_UPLL_FUNC_CNTL, UPLL_BYPASS_EN_MASK, ~UPLL_BYPASS_EN_MASK); + +	if (!vclk || !dclk) { +		/* Keep the Bypass mode */ +		return 0; +	} + +	r = si_calc_upll_dividers(adev, vclk, dclk, 125000, 250000, +				  16384, 0x03FFFFFF, 0, 128, 5, +				  &fb_div, &vclk_div, &dclk_div); +	if (r) +		return r; + +	/* Set RESET_ANTI_MUX to 0 */ +	WREG32_P(CG_UPLL_FUNC_CNTL_5, 0, ~RESET_ANTI_MUX_MASK); + +	/* Set VCO_MODE to 1 */ +	WREG32_P(CG_UPLL_FUNC_CNTL, UPLL_VCO_MODE_MASK, ~UPLL_VCO_MODE_MASK); + +	/* Disable sleep mode */ +	WREG32_P(CG_UPLL_FUNC_CNTL, 0, ~UPLL_SLEEP_MASK); + +	/* Deassert UPLL_RESET */ +	WREG32_P(CG_UPLL_FUNC_CNTL, 0, ~UPLL_RESET_MASK); + +	mdelay(1); + +	r = si_uvd_send_upll_ctlreq(adev, CG_UPLL_FUNC_CNTL); +	if (r) +		return r; + +	/* Assert UPLL_RESET again */ +	WREG32_P(CG_UPLL_FUNC_CNTL, UPLL_RESET_MASK, ~UPLL_RESET_MASK); + +	/* Disable spread spectrum. */ +	WREG32_P(CG_UPLL_SPREAD_SPECTRUM, 0, ~SSEN_MASK); + +	/* Set feedback divider */ +	WREG32_P(CG_UPLL_FUNC_CNTL_3, UPLL_FB_DIV(fb_div), ~UPLL_FB_DIV_MASK); + +	/* Set ref divider to 0 */ +	WREG32_P(CG_UPLL_FUNC_CNTL, 0, ~UPLL_REF_DIV_MASK); + +	if (fb_div < 307200) +		WREG32_P(CG_UPLL_FUNC_CNTL_4, 0, ~UPLL_SPARE_ISPARE9); +	else +		WREG32_P(CG_UPLL_FUNC_CNTL_4, +			 UPLL_SPARE_ISPARE9, +			 ~UPLL_SPARE_ISPARE9); + +	/* Set PDIV_A and PDIV_B */ +	WREG32_P(CG_UPLL_FUNC_CNTL_2, +		 UPLL_PDIV_A(vclk_div) | UPLL_PDIV_B(dclk_div), +		 ~(UPLL_PDIV_A_MASK | UPLL_PDIV_B_MASK)); + +	/* Give the PLL some time to settle */ +	mdelay(15); + +	/* Deassert PLL_RESET */ +	WREG32_P(CG_UPLL_FUNC_CNTL, 0, ~UPLL_RESET_MASK); + +	mdelay(15); + +	/* Switch from bypass mode to normal mode */ +	WREG32_P(CG_UPLL_FUNC_CNTL, 0, ~UPLL_BYPASS_EN_MASK); + +	r = si_uvd_send_upll_ctlreq(adev, CG_UPLL_FUNC_CNTL); +	if (r) +		return r; + +	/* Switch VCLK and DCLK selection */ +	WREG32_P(CG_UPLL_FUNC_CNTL_2, +		 VCLK_SRC_SEL(2) | DCLK_SRC_SEL(2), +		 ~(VCLK_SRC_SEL_MASK | DCLK_SRC_SEL_MASK)); + +	mdelay(100); + +	return 0; +} + +static int si_vce_send_vcepll_ctlreq(struct amdgpu_device *adev) +{ +	unsigned i; + +	/* Make sure VCEPLL_CTLREQ is deasserted */ +	WREG32_SMC_P(CG_VCEPLL_FUNC_CNTL, 0, ~UPLL_CTLREQ_MASK); + +	mdelay(10); + +	/* Assert UPLL_CTLREQ */ +	WREG32_SMC_P(CG_VCEPLL_FUNC_CNTL, UPLL_CTLREQ_MASK, ~UPLL_CTLREQ_MASK); + +	/* Wait for CTLACK and CTLACK2 to get asserted */ +	for (i = 0; i < SI_MAX_CTLACKS_ASSERTION_WAIT; ++i) { +		uint32_t mask = UPLL_CTLACK_MASK | UPLL_CTLACK2_MASK; + +		if ((RREG32_SMC(CG_VCEPLL_FUNC_CNTL) & mask) == mask) +			break; +		mdelay(10); +	} + +	/* Deassert UPLL_CTLREQ */ +	WREG32_SMC_P(CG_VCEPLL_FUNC_CNTL, 0, ~UPLL_CTLREQ_MASK); + +	if (i == SI_MAX_CTLACKS_ASSERTION_WAIT) { +		DRM_ERROR("Timeout setting UVD clocks!\n"); +		return -ETIMEDOUT; +	} + +	return 0; +} + +static int si_set_vce_clocks(struct amdgpu_device *adev, u32 evclk, u32 ecclk) +{ +	unsigned fb_div = 0, evclk_div = 0, ecclk_div = 0; +	int r; + +	/* Bypass evclk and ecclk with bclk */ +	WREG32_SMC_P(CG_VCEPLL_FUNC_CNTL_2, +		     EVCLK_SRC_SEL(1) | ECCLK_SRC_SEL(1), +		     ~(EVCLK_SRC_SEL_MASK | ECCLK_SRC_SEL_MASK)); + +	/* Put PLL in bypass mode */ +	WREG32_SMC_P(CG_VCEPLL_FUNC_CNTL, VCEPLL_BYPASS_EN_MASK, +		     ~VCEPLL_BYPASS_EN_MASK); + +	if (!evclk || !ecclk) { +		/* Keep the Bypass mode, put PLL to sleep */ +		WREG32_SMC_P(CG_VCEPLL_FUNC_CNTL, VCEPLL_SLEEP_MASK, +			     ~VCEPLL_SLEEP_MASK); +		return 0; +	} + +	r = si_calc_upll_dividers(adev, evclk, ecclk, 125000, 250000, +				  16384, 0x03FFFFFF, 0, 128, 5, +				  &fb_div, &evclk_div, &ecclk_div); +	if (r) +		return r; + +	/* Set RESET_ANTI_MUX to 0 */ +	WREG32_SMC_P(CG_VCEPLL_FUNC_CNTL_5, 0, ~RESET_ANTI_MUX_MASK); + +	/* Set VCO_MODE to 1 */ +	WREG32_SMC_P(CG_VCEPLL_FUNC_CNTL, VCEPLL_VCO_MODE_MASK, +		     ~VCEPLL_VCO_MODE_MASK); + +	/* Toggle VCEPLL_SLEEP to 1 then back to 0 */ +	WREG32_SMC_P(CG_VCEPLL_FUNC_CNTL, VCEPLL_SLEEP_MASK, +		     ~VCEPLL_SLEEP_MASK); +	WREG32_SMC_P(CG_VCEPLL_FUNC_CNTL, 0, ~VCEPLL_SLEEP_MASK); + +	/* Deassert VCEPLL_RESET */ +	WREG32_SMC_P(CG_VCEPLL_FUNC_CNTL, 0, ~VCEPLL_RESET_MASK); + +	mdelay(1); + +	r = si_vce_send_vcepll_ctlreq(adev); +	if (r) +		return r; + +	/* Assert VCEPLL_RESET again */ +	WREG32_SMC_P(CG_VCEPLL_FUNC_CNTL, VCEPLL_RESET_MASK, ~VCEPLL_RESET_MASK); + +	/* Disable spread spectrum. */ +	WREG32_SMC_P(CG_VCEPLL_SPREAD_SPECTRUM, 0, ~SSEN_MASK); + +	/* Set feedback divider */ +	WREG32_SMC_P(CG_VCEPLL_FUNC_CNTL_3, +		     VCEPLL_FB_DIV(fb_div), +		     ~VCEPLL_FB_DIV_MASK); + +	/* Set ref divider to 0 */ +	WREG32_SMC_P(CG_VCEPLL_FUNC_CNTL, 0, ~VCEPLL_REF_DIV_MASK); + +	/* Set PDIV_A and PDIV_B */ +	WREG32_SMC_P(CG_VCEPLL_FUNC_CNTL_2, +		     VCEPLL_PDIV_A(evclk_div) | VCEPLL_PDIV_B(ecclk_div), +		     ~(VCEPLL_PDIV_A_MASK | VCEPLL_PDIV_B_MASK)); + +	/* Give the PLL some time to settle */ +	mdelay(15); + +	/* Deassert PLL_RESET */ +	WREG32_SMC_P(CG_VCEPLL_FUNC_CNTL, 0, ~VCEPLL_RESET_MASK); + +	mdelay(15); + +	/* Switch from bypass mode to normal mode */ +	WREG32_SMC_P(CG_VCEPLL_FUNC_CNTL, 0, ~VCEPLL_BYPASS_EN_MASK); + +	r = si_vce_send_vcepll_ctlreq(adev); +	if (r) +		return r; + +	/* Switch VCLK and DCLK selection */ +	WREG32_SMC_P(CG_VCEPLL_FUNC_CNTL_2, +		     EVCLK_SRC_SEL(16) | ECCLK_SRC_SEL(16), +		     ~(EVCLK_SRC_SEL_MASK | ECCLK_SRC_SEL_MASK)); + +	mdelay(100); + +	return 0; +} +  static const struct amdgpu_asic_funcs si_asic_funcs =  {  	.read_disabled_bios = &si_read_disabled_bios, @@ -1414,7 +1789,7 @@ static const struct amdgpu_asic_funcs si_asic_funcs =  	.set_vga_state = &si_vga_set_state,  	.get_xclk = &si_get_xclk,  	.set_uvd_clocks = &si_set_uvd_clocks, -	.set_vce_clocks = NULL, +	.set_vce_clocks = &si_set_vce_clocks,  	.get_pcie_lanes = &si_get_pcie_lanes,  	.set_pcie_lanes = &si_set_pcie_lanes,  	.get_config_memsize = &si_get_config_memsize, @@ -1443,8 +1818,8 @@ static int si_common_early_init(void *handle)  	adev->pcie_wreg = &si_pcie_wreg;  	adev->pciep_rreg = &si_pciep_rreg;  	adev->pciep_wreg = &si_pciep_wreg; -	adev->uvd_ctx_rreg = NULL; -	adev->uvd_ctx_wreg = NULL; +	adev->uvd_ctx_rreg = si_uvd_ctx_rreg; +	adev->uvd_ctx_wreg = si_uvd_ctx_wreg;  	adev->didt_rreg = NULL;  	adev->didt_wreg = NULL; @@ -2173,7 +2548,7 @@ int si_set_ip_blocks(struct amdgpu_device *adev)  			amdgpu_device_ip_block_add(adev, &dce_virtual_ip_block);  		else  			amdgpu_device_ip_block_add(adev, &dce_v6_0_ip_block); -		/* amdgpu_device_ip_block_add(adev, &uvd_v3_1_ip_block); */ +		amdgpu_device_ip_block_add(adev, &uvd_v3_1_ip_block);  		/* amdgpu_device_ip_block_add(adev, &vce_v1_0_ip_block); */  		break;  	case CHIP_OLAND: @@ -2187,8 +2562,7 @@ int si_set_ip_blocks(struct amdgpu_device *adev)  			amdgpu_device_ip_block_add(adev, &dce_virtual_ip_block);  		else  			amdgpu_device_ip_block_add(adev, &dce_v6_4_ip_block); - -		/* amdgpu_device_ip_block_add(adev, &uvd_v3_1_ip_block); */ +		amdgpu_device_ip_block_add(adev, &uvd_v3_1_ip_block);  		/* amdgpu_device_ip_block_add(adev, &vce_v1_0_ip_block); */  		break;  	case CHIP_HAINAN: | 
