Hi,

On Tue, Nov 26, 2019 at 10:04:35AM +0000, Chris Wilson wrote:
> Now that we rapidly park the GT when the GPU idles, we often find
> ourselves idling faster than the RC6 promotion timer. Thus if we tell
> the GPU to enter RC6 manually as we park, we can do so quicker (by
> around 50ms, half an EI on average) and marginally increase our
> powersaving across all execlists platforms.
> 
> Signed-off-by: Chris Wilson <[email protected]>
> Cc: Andi Shyti <[email protected]>
> Cc: Mika Kuoppala <[email protected]>
> Cc: Imre Deak <[email protected]>

Looks ok:
Acked-by: Imre Deak <[email protected]>

Does intel_rc6_park() work on VLV/CHV too? I can't see at least that
we'd enable RC6 on those with GEN6_RC_CTL_RC6_ENABLE.

Also what is the value written to GEN6_RC_STATE? Is it ok to use the
same value after unpark()?

> ---
>  drivers/gpu/drm/i915/gt/intel_gt_pm.c     |  2 +
>  drivers/gpu/drm/i915/gt/intel_rc6.c       | 53 ++++++++++++++++-------
>  drivers/gpu/drm/i915/gt/intel_rc6.h       |  3 ++
>  drivers/gpu/drm/i915/gt/intel_rc6_types.h |  2 +
>  4 files changed, 45 insertions(+), 15 deletions(-)
> 
> diff --git a/drivers/gpu/drm/i915/gt/intel_gt_pm.c 
> b/drivers/gpu/drm/i915/gt/intel_gt_pm.c
> index 9d3045096e37..2000018b6464 100644
> --- a/drivers/gpu/drm/i915/gt/intel_gt_pm.c
> +++ b/drivers/gpu/drm/i915/gt/intel_gt_pm.c
> @@ -64,6 +64,7 @@ static int __gt_unpark(struct intel_wakeref *wf)
>       if (NEEDS_RC6_CTX_CORRUPTION_WA(i915))
>               intel_uncore_forcewake_get(gt->uncore, FORCEWAKE_ALL);
>  
> +     intel_rc6_unpark(&gt->rc6);
>       intel_rps_unpark(&gt->rps);
>       i915_pmu_gt_unparked(i915);
>  
> @@ -85,6 +86,7 @@ static int __gt_park(struct intel_wakeref *wf)
>       i915_vma_parked(gt);
>       i915_pmu_gt_parked(i915);
>       intel_rps_park(&gt->rps);
> +     intel_rc6_park(&gt->rc6);
>  
>       /* Everything switched off, flush any residual interrupt just in case */
>       intel_synchronize_irq(i915);
> diff --git a/drivers/gpu/drm/i915/gt/intel_rc6.c 
> b/drivers/gpu/drm/i915/gt/intel_rc6.c
> index 7a0bc6dde009..c4379c49c20d 100644
> --- a/drivers/gpu/drm/i915/gt/intel_rc6.c
> +++ b/drivers/gpu/drm/i915/gt/intel_rc6.c
> @@ -96,10 +96,10 @@ static void gen11_rc6_enable(struct intel_rc6 *rc6)
>       set(uncore, GEN9_RENDER_PG_IDLE_HYSTERESIS, 60);
>  
>       /* 3a: Enable RC6 */
> -     set(uncore, GEN6_RC_CONTROL,
> -         GEN6_RC_CTL_HW_ENABLE |
> -         GEN6_RC_CTL_RC6_ENABLE |
> -         GEN6_RC_CTL_EI_MODE(1));
> +     rc6->ctl_enable =
> +             GEN6_RC_CTL_HW_ENABLE |
> +             GEN6_RC_CTL_RC6_ENABLE |
> +             GEN6_RC_CTL_EI_MODE(1);
>  
>       set(uncore, GEN9_PG_ENABLE,
>           GEN9_RENDER_PG_ENABLE |
> @@ -170,10 +170,10 @@ static void gen9_rc6_enable(struct intel_rc6 *rc6)
>       else
>               rc6_mode = GEN6_RC_CTL_EI_MODE(1);
>  
> -     set(uncore, GEN6_RC_CONTROL,
> -         GEN6_RC_CTL_HW_ENABLE |
> -         GEN6_RC_CTL_RC6_ENABLE |
> -         rc6_mode);
> +     rc6->ctl_enable =
> +             GEN6_RC_CTL_HW_ENABLE |
> +             GEN6_RC_CTL_RC6_ENABLE |
> +             rc6_mode;
>  
>       /*
>        * WaRsDisableCoarsePowerGating:skl,cnl
> @@ -200,10 +200,10 @@ static void gen8_rc6_enable(struct intel_rc6 *rc6)
>       set(uncore, GEN6_RC6_THRESHOLD, 625); /* 800us/1.28 for TO */
>  
>       /* 3: Enable RC6 */
> -     set(uncore, GEN6_RC_CONTROL,
> +     rc6->ctl_enable =
>           GEN6_RC_CTL_HW_ENABLE |
>           GEN7_RC_CTL_TO_MODE |
> -         GEN6_RC_CTL_RC6_ENABLE);
> +         GEN6_RC_CTL_RC6_ENABLE;
>  }
>  
>  static void gen6_rc6_enable(struct intel_rc6 *rc6)
> @@ -239,10 +239,10 @@ static void gen6_rc6_enable(struct intel_rc6 *rc6)
>               rc6_mask |= GEN6_RC_CTL_RC6p_ENABLE;
>       if (HAS_RC6pp(i915))
>               rc6_mask |= GEN6_RC_CTL_RC6pp_ENABLE;
> -     set(uncore, GEN6_RC_CONTROL,
> +     rc6->ctl_enable =
>           rc6_mask |
>           GEN6_RC_CTL_EI_MODE(1) |
> -         GEN6_RC_CTL_HW_ENABLE);
> +         GEN6_RC_CTL_HW_ENABLE;
>  
>       rc6vids = 0;
>       ret = sandybridge_pcode_read(i915, GEN6_PCODE_READ_RC6VIDS,
> @@ -360,7 +360,7 @@ static void chv_rc6_enable(struct intel_rc6 *rc6)
>                              VLV_RENDER_RC6_COUNT_EN));
>  
>       /* 3: Enable RC6 */
> -     set(uncore, GEN6_RC_CONTROL, GEN7_RC_CTL_TO_MODE);
> +     rc6->ctl_enable = GEN7_RC_CTL_TO_MODE;
>  }
>  
>  static void vlv_rc6_enable(struct intel_rc6 *rc6)
> @@ -386,8 +386,8 @@ static void vlv_rc6_enable(struct intel_rc6 *rc6)
>                              VLV_MEDIA_RC6_COUNT_EN |
>                              VLV_RENDER_RC6_COUNT_EN));
>  
> -     set(uncore, GEN6_RC_CONTROL,
> -         GEN7_RC_CTL_TO_MODE | VLV_RC_CTL_CTX_RST_PARALLEL);
> +     rc6->ctl_enable =
> +         GEN7_RC_CTL_TO_MODE | VLV_RC_CTL_CTX_RST_PARALLEL;
>  }
>  
>  static bool bxt_check_bios_rc6_setup(struct intel_rc6 *rc6)
> @@ -634,6 +634,29 @@ void intel_rc6_enable(struct intel_rc6 *rc6)
>       rc6->enabled = true;
>  }
>  
> +void intel_rc6_unpark(struct intel_rc6 *rc6)
> +{
> +     struct intel_uncore *uncore = rc6_to_uncore(rc6);
> +
> +     if (!rc6->enabled)
> +             return;
> +
> +     /* Restore HW timers for automatic RC6 entry while busy */
> +     set(uncore, GEN6_RC_CONTROL, rc6->ctl_enable);
> +}
> +
> +void intel_rc6_park(struct intel_rc6 *rc6)
> +{
> +     struct intel_uncore *uncore = rc6_to_uncore(rc6);
> +
> +     if (!rc6->enabled)
> +             return;
> +
> +     /* Turn off the HW timers and go directly to rc6 */
> +     set(uncore, GEN6_RC_CONTROL, GEN6_RC_CTL_RC6_ENABLE);
> +     set(uncore, GEN6_RC_STATE, 0x4 << RC_SW_TARGET_STATE_SHIFT);
> +}
> +
>  void intel_rc6_disable(struct intel_rc6 *rc6)
>  {
>       if (!rc6->enabled)
> diff --git a/drivers/gpu/drm/i915/gt/intel_rc6.h 
> b/drivers/gpu/drm/i915/gt/intel_rc6.h
> index 1370f6834a4c..20d740ff7e55 100644
> --- a/drivers/gpu/drm/i915/gt/intel_rc6.h
> +++ b/drivers/gpu/drm/i915/gt/intel_rc6.h
> @@ -15,6 +15,9 @@ struct intel_rc6;
>  void intel_rc6_init(struct intel_rc6 *rc6);
>  void intel_rc6_fini(struct intel_rc6 *rc6);
>  
> +void intel_rc6_unpark(struct intel_rc6 *rc6);
> +void intel_rc6_park(struct intel_rc6 *rc6);
> +
>  void intel_rc6_sanitize(struct intel_rc6 *rc6);
>  void intel_rc6_enable(struct intel_rc6 *rc6);
>  void intel_rc6_disable(struct intel_rc6 *rc6);
> diff --git a/drivers/gpu/drm/i915/gt/intel_rc6_types.h 
> b/drivers/gpu/drm/i915/gt/intel_rc6_types.h
> index 89ad5697a8d4..9f3d56817c97 100644
> --- a/drivers/gpu/drm/i915/gt/intel_rc6_types.h
> +++ b/drivers/gpu/drm/i915/gt/intel_rc6_types.h
> @@ -18,6 +18,8 @@ struct intel_rc6 {
>       u64 prev_hw_residency[4];
>       u64 cur_residency[4];
>  
> +     u32 ctl_enable;
> +
>       struct drm_i915_gem_object *pctx;
>  
>       bool supported : 1;
> -- 
> 2.24.0
> 
_______________________________________________
Intel-gfx mailing list
[email protected]
https://lists.freedesktop.org/mailman/listinfo/intel-gfx

Reply via email to