drm/amd/amdgpu: add vce3.0 clock gating support. (v2)
authorEric Huang <JinHuiEric.Huang@amd.com>
Mon, 23 Nov 2015 21:57:53 +0000 (16:57 -0500)
committerAlex Deucher <alexander.deucher@amd.com>
Mon, 21 Dec 2015 21:42:45 +0000 (16:42 -0500)
v2: fix grbm locking

Reviewed-by: Alex Deucher <alexander.deucher@amd.com>
Reviewed-by: Christian König <christian.koenig@amd.com>
Acked-by: Jammy Zhou <Jammy.Zhou@amd.com>
Signed-off-by: Eric Huang <JinHuiEric.Huang@amd.com>
drivers/gpu/drm/amd/amdgpu/vce_v3_0.c

index 370c6c9d81c26550302b974a4b794ed464090b65..35f48ad7644dc66d15730afc2929fa022c85ee0a 100644 (file)
@@ -103,6 +103,108 @@ static void vce_v3_0_ring_set_wptr(struct amdgpu_ring *ring)
                WREG32(mmVCE_RB_WPTR2, ring->wptr);
 }
 
+static void vce_v3_0_override_vce_clock_gating(struct amdgpu_device *adev, bool override)
+{
+       u32 tmp, data;
+
+       tmp = data = RREG32(mmVCE_RB_ARB_CTRL);
+       if (override)
+               data |= VCE_RB_ARB_CTRL__VCE_CGTT_OVERRIDE_MASK;
+       else
+               data &= ~VCE_RB_ARB_CTRL__VCE_CGTT_OVERRIDE_MASK;
+
+       if (tmp != data)
+               WREG32(mmVCE_RB_ARB_CTRL, data);
+}
+
+static void vce_v3_0_set_vce_sw_clock_gating(struct amdgpu_device *adev,
+                                            bool gated)
+{
+       u32 tmp, data;
+       /* Set Override to disable Clock Gating */
+       vce_v3_0_override_vce_clock_gating(adev, true);
+
+       if (!gated) {
+               /* Force CLOCK ON for VCE_CLOCK_GATING_B,
+                * {*_FORCE_ON, *_FORCE_OFF} = {1, 0}
+                * VREG can be FORCE ON or set to Dynamic, but can't be OFF
+                */
+               tmp = data = RREG32(mmVCE_CLOCK_GATING_B);
+               data |= 0x1ff;
+               data &= ~0xef0000;
+               if (tmp != data)
+                       WREG32(mmVCE_CLOCK_GATING_B, data);
+
+               /* Force CLOCK ON for VCE_UENC_CLOCK_GATING,
+                * {*_FORCE_ON, *_FORCE_OFF} = {1, 0}
+                */
+               tmp = data = RREG32(mmVCE_UENC_CLOCK_GATING);
+               data |= 0x3ff000;
+               data &= ~0xffc00000;
+               if (tmp != data)
+                       WREG32(mmVCE_UENC_CLOCK_GATING, data);
+
+               /* set VCE_UENC_CLOCK_GATING_2 */
+               tmp = data = RREG32(mmVCE_UENC_CLOCK_GATING_2);
+               data |= 0x2;
+               data &= ~0x2;
+               if (tmp != data)
+                       WREG32(mmVCE_UENC_CLOCK_GATING_2, data);
+
+               /* Force CLOCK ON for VCE_UENC_REG_CLOCK_GATING */
+               tmp = data = RREG32(mmVCE_UENC_REG_CLOCK_GATING);
+               data |= 0x37f;
+               if (tmp != data)
+                       WREG32(mmVCE_UENC_REG_CLOCK_GATING, data);
+
+               /* Force VCE_UENC_DMA_DCLK_CTRL Clock ON */
+               tmp = data = RREG32(mmVCE_UENC_DMA_DCLK_CTRL);
+               data |= VCE_UENC_DMA_DCLK_CTRL__WRDMCLK_FORCEON_MASK |
+                               VCE_UENC_DMA_DCLK_CTRL__RDDMCLK_FORCEON_MASK |
+                               VCE_UENC_DMA_DCLK_CTRL__REGCLK_FORCEON_MASK  |
+                               0x8;
+               if (tmp != data)
+                       WREG32(mmVCE_UENC_DMA_DCLK_CTRL, data);
+       } else {
+               /* Force CLOCK OFF for VCE_CLOCK_GATING_B,
+                * {*, *_FORCE_OFF} = {*, 1}
+                * set VREG to Dynamic, as it can't be OFF
+                */
+               tmp = data = RREG32(mmVCE_CLOCK_GATING_B);
+               data &= ~0x80010;
+               data |= 0xe70008;
+               if (tmp != data)
+                       WREG32(mmVCE_CLOCK_GATING_B, data);
+               /* Force CLOCK OFF for VCE_UENC_CLOCK_GATING,
+                * Force ClOCK OFF takes precedent over Force CLOCK ON setting.
+                * {*_FORCE_ON, *_FORCE_OFF} = {*, 1}
+                */
+               tmp = data = RREG32(mmVCE_UENC_CLOCK_GATING);
+               data |= 0xffc00000;
+               if (tmp != data)
+                       WREG32(mmVCE_UENC_CLOCK_GATING, data);
+               /* Set VCE_UENC_CLOCK_GATING_2 */
+               tmp = data = RREG32(mmVCE_UENC_CLOCK_GATING_2);
+               data |= 0x10000;
+               if (tmp != data)
+                       WREG32(mmVCE_UENC_CLOCK_GATING_2, data);
+               /* Set VCE_UENC_REG_CLOCK_GATING to dynamic */
+               tmp = data = RREG32(mmVCE_UENC_REG_CLOCK_GATING);
+               data &= ~0xffc00000;
+               if (tmp != data)
+                       WREG32(mmVCE_UENC_REG_CLOCK_GATING, data);
+               /* Set VCE_UENC_DMA_DCLK_CTRL CG always in dynamic mode */
+               tmp = data = RREG32(mmVCE_UENC_DMA_DCLK_CTRL);
+               data &= ~(VCE_UENC_DMA_DCLK_CTRL__WRDMCLK_FORCEON_MASK |
+                               VCE_UENC_DMA_DCLK_CTRL__RDDMCLK_FORCEON_MASK |
+                               VCE_UENC_DMA_DCLK_CTRL__REGCLK_FORCEON_MASK  |
+                               0x8);
+               if (tmp != data)
+                       WREG32(mmVCE_UENC_DMA_DCLK_CTRL, data);
+       }
+       vce_v3_0_override_vce_clock_gating(adev, false);
+}
+
 /**
  * vce_v3_0_start - start VCE block
  *
@@ -121,7 +223,7 @@ static int vce_v3_0_start(struct amdgpu_device *adev)
                if (adev->vce.harvest_config & (1 << idx))
                        continue;
 
-               if(idx == 0)
+               if (idx == 0)
                        WREG32_P(mmGRBM_GFX_INDEX, 0,
                                ~GRBM_GFX_INDEX__VCE_INSTANCE_MASK);
                else
@@ -174,6 +276,10 @@ static int vce_v3_0_start(struct amdgpu_device *adev)
                /* clear BUSY flag */
                WREG32_P(mmVCE_STATUS, 0, ~1);
 
+               /* Set Clock-Gating off */
+               if (adev->cg_flags & AMDGPU_CG_SUPPORT_VCE_MGCG)
+                       vce_v3_0_set_vce_sw_clock_gating(adev, false);
+
                if (r) {
                        DRM_ERROR("VCE not responding, giving up!!!\n");
                        mutex_unlock(&adev->grbm_idx_mutex);
@@ -609,6 +715,47 @@ static int vce_v3_0_process_interrupt(struct amdgpu_device *adev,
 static int vce_v3_0_set_clockgating_state(void *handle,
                                          enum amd_clockgating_state state)
 {
+       struct amdgpu_device *adev = (struct amdgpu_device *)handle;
+       bool enable = (state == AMD_CG_STATE_GATE) ? true : false;
+       int i;
+
+       if (!(adev->cg_flags & AMDGPU_CG_SUPPORT_VCE_MGCG))
+               return 0;
+
+       mutex_lock(&adev->grbm_idx_mutex);
+       for (i = 0; i < 2; i++) {
+               /* Program VCE Instance 0 or 1 if not harvested */
+               if (adev->vce.harvest_config & (1 << i))
+                       continue;
+
+               if (i == 0)
+                       WREG32_P(mmGRBM_GFX_INDEX, 0,
+                                       ~GRBM_GFX_INDEX__VCE_INSTANCE_MASK);
+               else
+                       WREG32_P(mmGRBM_GFX_INDEX,
+                                       GRBM_GFX_INDEX__VCE_INSTANCE_MASK,
+                                       ~GRBM_GFX_INDEX__VCE_INSTANCE_MASK);
+
+               if (enable) {
+                       /* initialize VCE_CLOCK_GATING_A: Clock ON/OFF delay */
+                       uint32_t data = RREG32(mmVCE_CLOCK_GATING_A);
+                       data &= ~(0xf | 0xff0);
+                       data |= ((0x0 << 0) | (0x04 << 4));
+                       WREG32(mmVCE_CLOCK_GATING_A, data);
+
+                       /* initialize VCE_UENC_CLOCK_GATING: Clock ON/OFF delay */
+                       data = RREG32(mmVCE_UENC_CLOCK_GATING);
+                       data &= ~(0xf | 0xff0);
+                       data |= ((0x0 << 0) | (0x04 << 4));
+                       WREG32(mmVCE_UENC_CLOCK_GATING, data);
+               }
+
+               vce_v3_0_set_vce_sw_clock_gating(adev, enable);
+       }
+
+       WREG32_P(mmGRBM_GFX_INDEX, 0, ~GRBM_GFX_INDEX__VCE_INSTANCE_MASK);
+       mutex_unlock(&adev->grbm_idx_mutex);
+
        return 0;
 }