On Mon, Oct 18, 2021 at 02:50:28PM +0300, Ville Syrjala wrote:
> From: Ville Syrjälä <[email protected]>
> 
> Chop g4x_sprite_update() into two halves. Fist half becomes
> the _noarm() variant, second part the _arm() variant.
> 
> Fortunately I have already previously grouped the register
> writes into roughtly the correct order, so the split looks
> surprisingly clean.
> 
> Not much of a change in i915_update_info on these older
> platforms that don't have so many planes or registers to
> begin with. Here are the numbers from snb (totally unpatched
> vs. both primary plane and sprite patched applied) running
> kms_atomic_transition --r plane-all-transition --extended:
> w/o patch                           w/ patch
> Updates: 5404                     Updates: 5405
>        |                                 |
>    1us |******                               1us |******
>        |*********                        |*********
>    4us |***********                  4us |***********
>        |**********                       |**********
>   16us |**                          16us |**
>        |                                 |
>   66us |                            66us |
>        |                                 |
>  262us |                           262us |
>        |                                 |
>    1ms |                             1ms |
>        |                                 |
>    4ms |                             4ms |
>        |                                 |
>   17ms |                            17ms |
>        |                                 |
> Min update: 1400ns                Min update: 1307ns
> Max update: 19809ns               Max update: 20194ns
> Average update: 6957ns                    Average update: 6432ns
> Overruns > 100us: 0               Overruns > 100us: 0
> 
> But there seems to be a slight improvement with
> lockdep enabled:
> w/o patch                           w/ patch
> Updates: 17612                            Updates: 16364
>        |                                 |
>    1us |                             1us |
>        |******                                   |******
>    4us |**********                   4us |**********
>        |************                     |*************
>   16us |*************               16us |************
>        |***                              |*
>   66us |                            66us |
>        |                                 |
>  262us |                           262us |
>        |                                 |
>    1ms |                             1ms |
>        |                                 |
>    4ms |                             4ms |
>        |                                 |
>   17ms |                            17ms |
>        |                                 |
> Min update: 3141ns                Min update: 3562ns
> Max update: 126450ns              Max update: 73354ns
> Average update: 16373ns                   Average update: 15153ns
> Overruns > 250us: 0               Overruns > 250us: 0

Reviewed-by: Stanislav Lisovskiy <[email protected]>

> 
> Cc: Stanislav Lisovskiy <[email protected]>
> Signed-off-by: Ville Syrjälä <[email protected]>
> ---
>  drivers/gpu/drm/i915/display/intel_sprite.c | 41 ++++++++++++++-------
>  1 file changed, 28 insertions(+), 13 deletions(-)
> 
> diff --git a/drivers/gpu/drm/i915/display/intel_sprite.c 
> b/drivers/gpu/drm/i915/display/intel_sprite.c
> index 9c36c1492b33..03e3bf890ce9 100644
> --- a/drivers/gpu/drm/i915/display/intel_sprite.c
> +++ b/drivers/gpu/drm/i915/display/intel_sprite.c
> @@ -1165,28 +1165,21 @@ static void ilk_sprite_update_gamma(const struct 
> intel_plane_state *plane_state)
>  }
>  
>  static void
> -g4x_sprite_update_arm(struct intel_plane *plane,
> -                   const struct intel_crtc_state *crtc_state,
> -                   const struct intel_plane_state *plane_state)
> +g4x_sprite_update_noarm(struct intel_plane *plane,
> +                     const struct intel_crtc_state *crtc_state,
> +                     const struct intel_plane_state *plane_state)
>  {
>       struct drm_i915_private *dev_priv = to_i915(plane->base.dev);
>       enum pipe pipe = plane->pipe;
> -     u32 dvssurf_offset = plane_state->view.color_plane[0].offset;
> -     u32 linear_offset;
> -     const struct drm_intel_sprite_colorkey *key = &plane_state->ckey;
>       int crtc_x = plane_state->uapi.dst.x1;
>       int crtc_y = plane_state->uapi.dst.y1;
>       u32 crtc_w = drm_rect_width(&plane_state->uapi.dst);
>       u32 crtc_h = drm_rect_height(&plane_state->uapi.dst);
> -     u32 x = plane_state->view.color_plane[0].x;
> -     u32 y = plane_state->view.color_plane[0].y;
>       u32 src_w = drm_rect_width(&plane_state->uapi.src) >> 16;
>       u32 src_h = drm_rect_height(&plane_state->uapi.src) >> 16;
> -     u32 dvscntr, dvsscale = 0;
> +     u32 dvsscale = 0;
>       unsigned long irqflags;
>  
> -     dvscntr = plane_state->ctl | g4x_sprite_ctl_crtc(crtc_state);
> -
>       /* Sizes are 0 based */
>       src_w--;
>       src_h--;
> @@ -1196,8 +1189,6 @@ g4x_sprite_update_arm(struct intel_plane *plane,
>       if (crtc_w != src_w || crtc_h != src_h)
>               dvsscale = DVS_SCALE_ENABLE | (src_w << 16) | src_h;
>  
> -     linear_offset = intel_fb_xy_to_linear(x, y, plane_state, 0);
> -
>       spin_lock_irqsave(&dev_priv->uncore.lock, irqflags);
>  
>       intel_de_write_fw(dev_priv, DVSSTRIDE(pipe),
> @@ -1206,6 +1197,29 @@ g4x_sprite_update_arm(struct intel_plane *plane,
>       intel_de_write_fw(dev_priv, DVSSIZE(pipe), (crtc_h << 16) | crtc_w);
>       intel_de_write_fw(dev_priv, DVSSCALE(pipe), dvsscale);
>  
> +     spin_unlock_irqrestore(&dev_priv->uncore.lock, irqflags);
> +}
> +
> +static void
> +g4x_sprite_update_arm(struct intel_plane *plane,
> +                   const struct intel_crtc_state *crtc_state,
> +                   const struct intel_plane_state *plane_state)
> +{
> +     struct drm_i915_private *dev_priv = to_i915(plane->base.dev);
> +     enum pipe pipe = plane->pipe;
> +     const struct drm_intel_sprite_colorkey *key = &plane_state->ckey;
> +     u32 dvssurf_offset = plane_state->view.color_plane[0].offset;
> +     u32 x = plane_state->view.color_plane[0].x;
> +     u32 y = plane_state->view.color_plane[0].y;
> +     u32 dvscntr, linear_offset;
> +     unsigned long irqflags;
> +
> +     dvscntr = plane_state->ctl | g4x_sprite_ctl_crtc(crtc_state);
> +
> +     linear_offset = intel_fb_xy_to_linear(x, y, plane_state, 0);
> +
> +     spin_lock_irqsave(&dev_priv->uncore.lock, irqflags);
> +
>       if (key->flags) {
>               intel_de_write_fw(dev_priv, DVSKEYVAL(pipe), key->min_value);
>               intel_de_write_fw(dev_priv, DVSKEYMSK(pipe),
> @@ -1801,6 +1815,7 @@ intel_sprite_plane_create(struct drm_i915_private 
> *dev_priv,
>  
>               plane_funcs = &snb_sprite_funcs;
>       } else {
> +             plane->update_noarm = g4x_sprite_update_noarm;
>               plane->update_arm = g4x_sprite_update_arm;
>               plane->disable_arm = g4x_sprite_disable_arm;
>               plane->get_hw_state = g4x_sprite_get_hw_state;
> -- 
> 2.32.0
> 

Reply via email to