diff mbox series

[v1,1/2] drm/i915/xe2lpd: check selective fetch is optimal in some cases

Message ID 20231102215519.135847-2-vinod.govindapillai@intel.com (mailing list archive)
State New, archived
Headers show
Series drm/i915/xe2lpd: choose between PSR2 and FBC | expand

Commit Message

Vinod Govindapillai Nov. 2, 2023, 9:55 p.m. UTC
If both PSR2 + FBC is supported, in cases where the selective
fetch area is greater than 25% of the screen area, FBC might
be more efficient. So have a possibility to check this and add
provision to enable FBC in such cases.

Bspec: 68881
Signed-off-by: Vinod Govindapillai <vinod.govindapillai@intel.com>
---
 .../drm/i915/display/intel_display_types.h    |  1 +
 drivers/gpu/drm/i915/display/intel_psr.c      | 42 ++++++++++++++++---
 2 files changed, 38 insertions(+), 5 deletions(-)

Comments

Jouni Högander Nov. 6, 2023, 10:31 a.m. UTC | #1
On Thu, 2023-11-02 at 23:55 +0200, Vinod Govindapillai wrote:
> If both PSR2 + FBC is supported, in cases where the selective
> fetch area is greater than 25% of the screen area, FBC might
> be more efficient. So have a possibility to check this and add
> provision to enable FBC in such cases.
> 
> Bspec: 68881
> Signed-off-by: Vinod Govindapillai <vinod.govindapillai@intel.com>
> ---
>  .../drm/i915/display/intel_display_types.h    |  1 +
>  drivers/gpu/drm/i915/display/intel_psr.c      | 42 ++++++++++++++++-
> --
>  2 files changed, 38 insertions(+), 5 deletions(-)
> 
> diff --git a/drivers/gpu/drm/i915/display/intel_display_types.h
> b/drivers/gpu/drm/i915/display/intel_display_types.h
> index 047fe3f8905a..bcc5fd8d8a00 100644
> --- a/drivers/gpu/drm/i915/display/intel_display_types.h
> +++ b/drivers/gpu/drm/i915/display/intel_display_types.h
> @@ -1207,6 +1207,7 @@ struct intel_crtc_state {
>         bool has_psr;
>         bool has_psr2;
>         bool enable_psr2_sel_fetch;
> +       bool full_frame_fetch;

I have a patch somewhere where I'm carrying su area in
intel_crtc_state. Maybe that could be utilized here?

>         bool req_psr2_sdp_prior_scanline;
>         bool wm_level_disabled;
>         u32 dc3co_exitline;
> diff --git a/drivers/gpu/drm/i915/display/intel_psr.c
> b/drivers/gpu/drm/i915/display/intel_psr.c
> index ecd24a0b86cb..6cb32fd29d10 100644
> --- a/drivers/gpu/drm/i915/display/intel_psr.c
> +++ b/drivers/gpu/drm/i915/display/intel_psr.c
> @@ -1987,10 +1987,35 @@ static bool
> psr2_sel_fetch_pipe_state_supported(const struct intel_crtc_state *c
>         return true;
>  }
>  
> +/*
> + * Check selective fetch is optimum
> + *
> + * Compare selective fetch area w.r.t screen size in case both FBC
> and PSR2
> + * is supported. If the selective fetch area is more than 25% of
> screen
> + * size, FBC is might be more efficient than PSR2. So force full
> frame
> + * update.
> + */
> +static bool psr2_sel_fetch_not_optimal(struct drm_i915_private
> *i915,
> +                                      struct drm_rect *sel_fetch,
> +                                      struct drm_rect *src)
> +{
> +       int screen_area, selfetch_area;
> +
> +       /* This is needed where FBC + PSR can be supported */
> +       if (DISPLAY_VER(i915) < 20 || !i915-
> >display.params.enable_fbc ||
> +           !HAS_FBC(i915))
> +               return false;

The problem with this is that you don't know if FBC is really enabled
after intel_fbc_atomic_check. Maybe this (policy) decision should be
done there where intel_fbc_atomic_check and intel_psr_compute_config
are called? that logic would set intel_crtc_state->full_frame_fetch
which would be taken into account in
intel_psr2_program_trans_man_trk_ctl. Also I think it would be good to
have some kind of knob to enable/disable this optimization.

> +
> +       selfetch_area = drm_rect_height(sel_fetch) *
> drm_rect_width(sel_fetch);
> +       screen_area = drm_rect_height(src) * drm_rect_width(src);
> +
> +       return DIV_ROUND_CLOSEST(screen_area, selfetch_area) <= 4;
> +}
> +
>  int intel_psr2_sel_fetch_update(struct intel_atomic_state *state,
>                                 struct intel_crtc *crtc)
>  {
> -       struct drm_i915_private *dev_priv = to_i915(state->base.dev);
> +       struct drm_i915_private *i915 = to_i915(state->base.dev);

This change is not related to this patch.

BR,

Jouni Högander

>         struct intel_crtc_state *crtc_state =
> intel_atomic_get_new_crtc_state(state, crtc);
>         struct drm_rect pipe_clip = { .x1 = 0, .y1 = -1, .x2 =
> INT_MAX, .y2 = -1 };
>         struct intel_plane_state *new_plane_state, *old_plane_state;
> @@ -2082,7 +2107,7 @@ int intel_psr2_sel_fetch_update(struct
> intel_atomic_state *state,
>          * calculation for those.
>          */
>         if (pipe_clip.y1 == -1) {
> -               drm_info_once(&dev_priv->drm,
> +               drm_info_once(&i915->drm,
>                               "Selective fetch area calculation
> failed in pipe %c\n",
>                               pipe_name(crtc->pipe));
>                 full_update = true;
> @@ -2092,9 +2117,9 @@ int intel_psr2_sel_fetch_update(struct
> intel_atomic_state *state,
>                 goto skip_sel_fetch_set_loop;
>  
>         /* Wa_14014971492 */
> -       if ((IS_DISPLAY_IP_STEP(dev_priv, IP_VER(14, 0), STEP_A0,
> STEP_B0) ||
> -            IS_ALDERLAKE_P(dev_priv) || IS_TIGERLAKE(dev_priv)) &&
> -           crtc_state->splitter.enable)
> +       if ((IS_DISPLAY_IP_STEP(i915, IP_VER(14, 0), STEP_A0,
> STEP_B0) ||
> +            IS_ALDERLAKE_P(i915) || IS_TIGERLAKE(i915)) &&
> +            crtc_state->splitter.enable)
>                 pipe_clip.y1 = 0;
>  
>         ret = drm_atomic_add_affected_planes(&state->base, &crtc-
> >base);
> @@ -2149,7 +2174,14 @@ int intel_psr2_sel_fetch_update(struct
> intel_atomic_state *state,
>                 }
>         }
>  
> +       if (full_update)
> +               goto skip_sel_fetch_set_loop;
> +
> +       full_update = psr2_sel_fetch_not_optimal(i915, &pipe_clip,
> +                                                &crtc_state-
> >pipe_src);
> +
>  skip_sel_fetch_set_loop:
> +       crtc_state->full_frame_fetch = full_update;
>         psr2_man_trk_ctl_calc(crtc_state, &pipe_clip, full_update);
>         return 0;
>  }
Ville Syrjala Nov. 6, 2023, 8:12 p.m. UTC | #2
On Thu, Nov 02, 2023 at 11:55:18PM +0200, Vinod Govindapillai wrote:
> If both PSR2 + FBC is supported, in cases where the selective
> fetch area is greater than 25% of the screen area, FBC might
> be more efficient.

"might be more efficient" is a very weak justification.

This sort of stuff would really need to be accompanied by 
some actual power numbers (for some actually reasonable
workloads) to justify the extra complication.

> So have a possibility to check this and add
> provision to enable FBC in such cases.
> 
> Bspec: 68881
> Signed-off-by: Vinod Govindapillai <vinod.govindapillai@intel.com>
> ---
>  .../drm/i915/display/intel_display_types.h    |  1 +
>  drivers/gpu/drm/i915/display/intel_psr.c      | 42 ++++++++++++++++---
>  2 files changed, 38 insertions(+), 5 deletions(-)
> 
> diff --git a/drivers/gpu/drm/i915/display/intel_display_types.h b/drivers/gpu/drm/i915/display/intel_display_types.h
> index 047fe3f8905a..bcc5fd8d8a00 100644
> --- a/drivers/gpu/drm/i915/display/intel_display_types.h
> +++ b/drivers/gpu/drm/i915/display/intel_display_types.h
> @@ -1207,6 +1207,7 @@ struct intel_crtc_state {
>  	bool has_psr;
>  	bool has_psr2;
>  	bool enable_psr2_sel_fetch;
> +	bool full_frame_fetch;
>  	bool req_psr2_sdp_prior_scanline;
>  	bool wm_level_disabled;
>  	u32 dc3co_exitline;
> diff --git a/drivers/gpu/drm/i915/display/intel_psr.c b/drivers/gpu/drm/i915/display/intel_psr.c
> index ecd24a0b86cb..6cb32fd29d10 100644
> --- a/drivers/gpu/drm/i915/display/intel_psr.c
> +++ b/drivers/gpu/drm/i915/display/intel_psr.c
> @@ -1987,10 +1987,35 @@ static bool psr2_sel_fetch_pipe_state_supported(const struct intel_crtc_state *c
>  	return true;
>  }
>  
> +/*
> + * Check selective fetch is optimum
> + *
> + * Compare selective fetch area w.r.t screen size in case both FBC and PSR2
> + * is supported. If the selective fetch area is more than 25% of screen
> + * size, FBC is might be more efficient than PSR2. So force full frame
> + * update.
> + */
> +static bool psr2_sel_fetch_not_optimal(struct drm_i915_private *i915,
> +				       struct drm_rect *sel_fetch,
> +				       struct drm_rect *src)
> +{
> +	int screen_area, selfetch_area;
> +
> +	/* This is needed where FBC + PSR can be supported */
> +	if (DISPLAY_VER(i915) < 20 || !i915->display.params.enable_fbc ||
> +	    !HAS_FBC(i915))
> +		return false;
> +
> +	selfetch_area = drm_rect_height(sel_fetch) * drm_rect_width(sel_fetch);
> +	screen_area = drm_rect_height(src) * drm_rect_width(src);
> +
> +	return DIV_ROUND_CLOSEST(screen_area, selfetch_area) <= 4;
> +}
> +
>  int intel_psr2_sel_fetch_update(struct intel_atomic_state *state,
>  				struct intel_crtc *crtc)
>  {
> -	struct drm_i915_private *dev_priv = to_i915(state->base.dev);
> +	struct drm_i915_private *i915 = to_i915(state->base.dev);
>  	struct intel_crtc_state *crtc_state = intel_atomic_get_new_crtc_state(state, crtc);
>  	struct drm_rect pipe_clip = { .x1 = 0, .y1 = -1, .x2 = INT_MAX, .y2 = -1 };
>  	struct intel_plane_state *new_plane_state, *old_plane_state;
> @@ -2082,7 +2107,7 @@ int intel_psr2_sel_fetch_update(struct intel_atomic_state *state,
>  	 * calculation for those.
>  	 */
>  	if (pipe_clip.y1 == -1) {
> -		drm_info_once(&dev_priv->drm,
> +		drm_info_once(&i915->drm,
>  			      "Selective fetch area calculation failed in pipe %c\n",
>  			      pipe_name(crtc->pipe));
>  		full_update = true;
> @@ -2092,9 +2117,9 @@ int intel_psr2_sel_fetch_update(struct intel_atomic_state *state,
>  		goto skip_sel_fetch_set_loop;
>  
>  	/* Wa_14014971492 */
> -	if ((IS_DISPLAY_IP_STEP(dev_priv, IP_VER(14, 0), STEP_A0, STEP_B0) ||
> -	     IS_ALDERLAKE_P(dev_priv) || IS_TIGERLAKE(dev_priv)) &&
> -	    crtc_state->splitter.enable)
> +	if ((IS_DISPLAY_IP_STEP(i915, IP_VER(14, 0), STEP_A0, STEP_B0) ||
> +	     IS_ALDERLAKE_P(i915) || IS_TIGERLAKE(i915)) &&
> +	     crtc_state->splitter.enable)
>  		pipe_clip.y1 = 0;
>  
>  	ret = drm_atomic_add_affected_planes(&state->base, &crtc->base);
> @@ -2149,7 +2174,14 @@ int intel_psr2_sel_fetch_update(struct intel_atomic_state *state,
>  		}
>  	}
>  
> +	if (full_update)
> +		goto skip_sel_fetch_set_loop;
> +
> +	full_update = psr2_sel_fetch_not_optimal(i915, &pipe_clip,
> +						 &crtc_state->pipe_src);
> +
>  skip_sel_fetch_set_loop:
> +	crtc_state->full_frame_fetch = full_update;
>  	psr2_man_trk_ctl_calc(crtc_state, &pipe_clip, full_update);
>  	return 0;
>  }
> -- 
> 2.34.1
Vinod Govindapillai Nov. 7, 2023, 9:32 a.m. UTC | #3
Hi Ville,

On Mon, 2023-11-06 at 22:12 +0200, Ville Syrjälä wrote:
> On Thu, Nov 02, 2023 at 11:55:18PM +0200, Vinod Govindapillai wrote:
> > If both PSR2 + FBC is supported, in cases where the selective
> > fetch area is greater than 25% of the screen area, FBC might
> > be more efficient.
> 
> "might be more efficient" is a very weak justification.

That is a poor choice of wording from me! I will update!

The feature HAS has documented power assessment information

BR
Vinod
> 
> This sort of stuff would really need to be accompanied by 
> some actual power numbers (for some actually reasonable
> workloads) to justify the extra complication.
> 
> > So have a possibility to check this and add
> > provision to enable FBC in such cases.
> > 
> > Bspec: 68881
> > Signed-off-by: Vinod Govindapillai <vinod.govindapillai@intel.com>
> > ---
> >  .../drm/i915/display/intel_display_types.h    |  1 +
> >  drivers/gpu/drm/i915/display/intel_psr.c      | 42 ++++++++++++++++---
> >  2 files changed, 38 insertions(+), 5 deletions(-)
> > 
> > diff --git a/drivers/gpu/drm/i915/display/intel_display_types.h
> > b/drivers/gpu/drm/i915/display/intel_display_types.h
> > index 047fe3f8905a..bcc5fd8d8a00 100644
> > --- a/drivers/gpu/drm/i915/display/intel_display_types.h
> > +++ b/drivers/gpu/drm/i915/display/intel_display_types.h
> > @@ -1207,6 +1207,7 @@ struct intel_crtc_state {
> >         bool has_psr;
> >         bool has_psr2;
> >         bool enable_psr2_sel_fetch;
> > +       bool full_frame_fetch;
> >         bool req_psr2_sdp_prior_scanline;
> >         bool wm_level_disabled;
> >         u32 dc3co_exitline;
> > diff --git a/drivers/gpu/drm/i915/display/intel_psr.c b/drivers/gpu/drm/i915/display/intel_psr.c
> > index ecd24a0b86cb..6cb32fd29d10 100644
> > --- a/drivers/gpu/drm/i915/display/intel_psr.c
> > +++ b/drivers/gpu/drm/i915/display/intel_psr.c
> > @@ -1987,10 +1987,35 @@ static bool psr2_sel_fetch_pipe_state_supported(const struct
> > intel_crtc_state *c
> >         return true;
> >  }
> >  
> > +/*
> > + * Check selective fetch is optimum
> > + *
> > + * Compare selective fetch area w.r.t screen size in case both FBC and PSR2
> > + * is supported. If the selective fetch area is more than 25% of screen
> > + * size, FBC is might be more efficient than PSR2. So force full frame
> > + * update.
> > + */
> > +static bool psr2_sel_fetch_not_optimal(struct drm_i915_private *i915,
> > +                                      struct drm_rect *sel_fetch,
> > +                                      struct drm_rect *src)
> > +{
> > +       int screen_area, selfetch_area;
> > +
> > +       /* This is needed where FBC + PSR can be supported */
> > +       if (DISPLAY_VER(i915) < 20 || !i915->display.params.enable_fbc ||
> > +           !HAS_FBC(i915))
> > +               return false;
> > +
> > +       selfetch_area = drm_rect_height(sel_fetch) * drm_rect_width(sel_fetch);
> > +       screen_area = drm_rect_height(src) * drm_rect_width(src);
> > +
> > +       return DIV_ROUND_CLOSEST(screen_area, selfetch_area) <= 4;
> > +}
> > +
> >  int intel_psr2_sel_fetch_update(struct intel_atomic_state *state,
> >                                 struct intel_crtc *crtc)
> >  {
> > -       struct drm_i915_private *dev_priv = to_i915(state->base.dev);
> > +       struct drm_i915_private *i915 = to_i915(state->base.dev);
> >         struct intel_crtc_state *crtc_state = intel_atomic_get_new_crtc_state(state, crtc);
> >         struct drm_rect pipe_clip = { .x1 = 0, .y1 = -1, .x2 = INT_MAX, .y2 = -1 };
> >         struct intel_plane_state *new_plane_state, *old_plane_state;
> > @@ -2082,7 +2107,7 @@ int intel_psr2_sel_fetch_update(struct intel_atomic_state *state,
> >          * calculation for those.
> >          */
> >         if (pipe_clip.y1 == -1) {
> > -               drm_info_once(&dev_priv->drm,
> > +               drm_info_once(&i915->drm,
> >                               "Selective fetch area calculation failed in pipe %c\n",
> >                               pipe_name(crtc->pipe));
> >                 full_update = true;
> > @@ -2092,9 +2117,9 @@ int intel_psr2_sel_fetch_update(struct intel_atomic_state *state,
> >                 goto skip_sel_fetch_set_loop;
> >  
> >         /* Wa_14014971492 */
> > -       if ((IS_DISPLAY_IP_STEP(dev_priv, IP_VER(14, 0), STEP_A0, STEP_B0) ||
> > -            IS_ALDERLAKE_P(dev_priv) || IS_TIGERLAKE(dev_priv)) &&
> > -           crtc_state->splitter.enable)
> > +       if ((IS_DISPLAY_IP_STEP(i915, IP_VER(14, 0), STEP_A0, STEP_B0) ||
> > +            IS_ALDERLAKE_P(i915) || IS_TIGERLAKE(i915)) &&
> > +            crtc_state->splitter.enable)
> >                 pipe_clip.y1 = 0;
> >  
> >         ret = drm_atomic_add_affected_planes(&state->base, &crtc->base);
> > @@ -2149,7 +2174,14 @@ int intel_psr2_sel_fetch_update(struct intel_atomic_state *state,
> >                 }
> >         }
> >  
> > +       if (full_update)
> > +               goto skip_sel_fetch_set_loop;
> > +
> > +       full_update = psr2_sel_fetch_not_optimal(i915, &pipe_clip,
> > +                                                &crtc_state->pipe_src);
> > +
> >  skip_sel_fetch_set_loop:
> > +       crtc_state->full_frame_fetch = full_update;
> >         psr2_man_trk_ctl_calc(crtc_state, &pipe_clip, full_update);
> >         return 0;
> >  }
> > -- 
> > 2.34.1
>
Ville Syrjala Nov. 7, 2023, 3:48 p.m. UTC | #4
On Tue, Nov 07, 2023 at 09:32:47AM +0000, Govindapillai, Vinod wrote:
> Hi Ville,
> 
> On Mon, 2023-11-06 at 22:12 +0200, Ville Syrjälä wrote:
> > On Thu, Nov 02, 2023 at 11:55:18PM +0200, Vinod Govindapillai wrote:
> > > If both PSR2 + FBC is supported, in cases where the selective
> > > fetch area is greater than 25% of the screen area, FBC might
> > > be more efficient.
> > 
> > "might be more efficient" is a very weak justification.
> 
> That is a poor choice of wording from me! I will update!
> 
> The feature HAS has documented power assessment information

I see nothing there that actually justifies this 25%
threshold.

> 
> BR
> Vinod
> > 
> > This sort of stuff would really need to be accompanied by 
> > some actual power numbers (for some actually reasonable
> > workloads) to justify the extra complication.
> > 
> > > So have a possibility to check this and add
> > > provision to enable FBC in such cases.
> > > 
> > > Bspec: 68881
> > > Signed-off-by: Vinod Govindapillai <vinod.govindapillai@intel.com>
> > > ---
> > >  .../drm/i915/display/intel_display_types.h    |  1 +
> > >  drivers/gpu/drm/i915/display/intel_psr.c      | 42 ++++++++++++++++---
> > >  2 files changed, 38 insertions(+), 5 deletions(-)
> > > 
> > > diff --git a/drivers/gpu/drm/i915/display/intel_display_types.h
> > > b/drivers/gpu/drm/i915/display/intel_display_types.h
> > > index 047fe3f8905a..bcc5fd8d8a00 100644
> > > --- a/drivers/gpu/drm/i915/display/intel_display_types.h
> > > +++ b/drivers/gpu/drm/i915/display/intel_display_types.h
> > > @@ -1207,6 +1207,7 @@ struct intel_crtc_state {
> > >         bool has_psr;
> > >         bool has_psr2;
> > >         bool enable_psr2_sel_fetch;
> > > +       bool full_frame_fetch;
> > >         bool req_psr2_sdp_prior_scanline;
> > >         bool wm_level_disabled;
> > >         u32 dc3co_exitline;
> > > diff --git a/drivers/gpu/drm/i915/display/intel_psr.c b/drivers/gpu/drm/i915/display/intel_psr.c
> > > index ecd24a0b86cb..6cb32fd29d10 100644
> > > --- a/drivers/gpu/drm/i915/display/intel_psr.c
> > > +++ b/drivers/gpu/drm/i915/display/intel_psr.c
> > > @@ -1987,10 +1987,35 @@ static bool psr2_sel_fetch_pipe_state_supported(const struct
> > > intel_crtc_state *c
> > >         return true;
> > >  }
> > >  
> > > +/*
> > > + * Check selective fetch is optimum
> > > + *
> > > + * Compare selective fetch area w.r.t screen size in case both FBC and PSR2
> > > + * is supported. If the selective fetch area is more than 25% of screen
> > > + * size, FBC is might be more efficient than PSR2. So force full frame
> > > + * update.
> > > + */
> > > +static bool psr2_sel_fetch_not_optimal(struct drm_i915_private *i915,
> > > +                                      struct drm_rect *sel_fetch,
> > > +                                      struct drm_rect *src)
> > > +{
> > > +       int screen_area, selfetch_area;
> > > +
> > > +       /* This is needed where FBC + PSR can be supported */
> > > +       if (DISPLAY_VER(i915) < 20 || !i915->display.params.enable_fbc ||
> > > +           !HAS_FBC(i915))
> > > +               return false;
> > > +
> > > +       selfetch_area = drm_rect_height(sel_fetch) * drm_rect_width(sel_fetch);
> > > +       screen_area = drm_rect_height(src) * drm_rect_width(src);
> > > +
> > > +       return DIV_ROUND_CLOSEST(screen_area, selfetch_area) <= 4;
> > > +}
> > > +
> > >  int intel_psr2_sel_fetch_update(struct intel_atomic_state *state,
> > >                                 struct intel_crtc *crtc)
> > >  {
> > > -       struct drm_i915_private *dev_priv = to_i915(state->base.dev);
> > > +       struct drm_i915_private *i915 = to_i915(state->base.dev);
> > >         struct intel_crtc_state *crtc_state = intel_atomic_get_new_crtc_state(state, crtc);
> > >         struct drm_rect pipe_clip = { .x1 = 0, .y1 = -1, .x2 = INT_MAX, .y2 = -1 };
> > >         struct intel_plane_state *new_plane_state, *old_plane_state;
> > > @@ -2082,7 +2107,7 @@ int intel_psr2_sel_fetch_update(struct intel_atomic_state *state,
> > >          * calculation for those.
> > >          */
> > >         if (pipe_clip.y1 == -1) {
> > > -               drm_info_once(&dev_priv->drm,
> > > +               drm_info_once(&i915->drm,
> > >                               "Selective fetch area calculation failed in pipe %c\n",
> > >                               pipe_name(crtc->pipe));
> > >                 full_update = true;
> > > @@ -2092,9 +2117,9 @@ int intel_psr2_sel_fetch_update(struct intel_atomic_state *state,
> > >                 goto skip_sel_fetch_set_loop;
> > >  
> > >         /* Wa_14014971492 */
> > > -       if ((IS_DISPLAY_IP_STEP(dev_priv, IP_VER(14, 0), STEP_A0, STEP_B0) ||
> > > -            IS_ALDERLAKE_P(dev_priv) || IS_TIGERLAKE(dev_priv)) &&
> > > -           crtc_state->splitter.enable)
> > > +       if ((IS_DISPLAY_IP_STEP(i915, IP_VER(14, 0), STEP_A0, STEP_B0) ||
> > > +            IS_ALDERLAKE_P(i915) || IS_TIGERLAKE(i915)) &&
> > > +            crtc_state->splitter.enable)
> > >                 pipe_clip.y1 = 0;
> > >  
> > >         ret = drm_atomic_add_affected_planes(&state->base, &crtc->base);
> > > @@ -2149,7 +2174,14 @@ int intel_psr2_sel_fetch_update(struct intel_atomic_state *state,
> > >                 }
> > >         }
> > >  
> > > +       if (full_update)
> > > +               goto skip_sel_fetch_set_loop;
> > > +
> > > +       full_update = psr2_sel_fetch_not_optimal(i915, &pipe_clip,
> > > +                                                &crtc_state->pipe_src);
> > > +
> > >  skip_sel_fetch_set_loop:
> > > +       crtc_state->full_frame_fetch = full_update;
> > >         psr2_man_trk_ctl_calc(crtc_state, &pipe_clip, full_update);
> > >         return 0;
> > >  }
> > > -- 
> > > 2.34.1
> > 
>
diff mbox series

Patch

diff --git a/drivers/gpu/drm/i915/display/intel_display_types.h b/drivers/gpu/drm/i915/display/intel_display_types.h
index 047fe3f8905a..bcc5fd8d8a00 100644
--- a/drivers/gpu/drm/i915/display/intel_display_types.h
+++ b/drivers/gpu/drm/i915/display/intel_display_types.h
@@ -1207,6 +1207,7 @@  struct intel_crtc_state {
 	bool has_psr;
 	bool has_psr2;
 	bool enable_psr2_sel_fetch;
+	bool full_frame_fetch;
 	bool req_psr2_sdp_prior_scanline;
 	bool wm_level_disabled;
 	u32 dc3co_exitline;
diff --git a/drivers/gpu/drm/i915/display/intel_psr.c b/drivers/gpu/drm/i915/display/intel_psr.c
index ecd24a0b86cb..6cb32fd29d10 100644
--- a/drivers/gpu/drm/i915/display/intel_psr.c
+++ b/drivers/gpu/drm/i915/display/intel_psr.c
@@ -1987,10 +1987,35 @@  static bool psr2_sel_fetch_pipe_state_supported(const struct intel_crtc_state *c
 	return true;
 }
 
+/*
+ * Check selective fetch is optimum
+ *
+ * Compare selective fetch area w.r.t screen size in case both FBC and PSR2
+ * is supported. If the selective fetch area is more than 25% of screen
+ * size, FBC is might be more efficient than PSR2. So force full frame
+ * update.
+ */
+static bool psr2_sel_fetch_not_optimal(struct drm_i915_private *i915,
+				       struct drm_rect *sel_fetch,
+				       struct drm_rect *src)
+{
+	int screen_area, selfetch_area;
+
+	/* This is needed where FBC + PSR can be supported */
+	if (DISPLAY_VER(i915) < 20 || !i915->display.params.enable_fbc ||
+	    !HAS_FBC(i915))
+		return false;
+
+	selfetch_area = drm_rect_height(sel_fetch) * drm_rect_width(sel_fetch);
+	screen_area = drm_rect_height(src) * drm_rect_width(src);
+
+	return DIV_ROUND_CLOSEST(screen_area, selfetch_area) <= 4;
+}
+
 int intel_psr2_sel_fetch_update(struct intel_atomic_state *state,
 				struct intel_crtc *crtc)
 {
-	struct drm_i915_private *dev_priv = to_i915(state->base.dev);
+	struct drm_i915_private *i915 = to_i915(state->base.dev);
 	struct intel_crtc_state *crtc_state = intel_atomic_get_new_crtc_state(state, crtc);
 	struct drm_rect pipe_clip = { .x1 = 0, .y1 = -1, .x2 = INT_MAX, .y2 = -1 };
 	struct intel_plane_state *new_plane_state, *old_plane_state;
@@ -2082,7 +2107,7 @@  int intel_psr2_sel_fetch_update(struct intel_atomic_state *state,
 	 * calculation for those.
 	 */
 	if (pipe_clip.y1 == -1) {
-		drm_info_once(&dev_priv->drm,
+		drm_info_once(&i915->drm,
 			      "Selective fetch area calculation failed in pipe %c\n",
 			      pipe_name(crtc->pipe));
 		full_update = true;
@@ -2092,9 +2117,9 @@  int intel_psr2_sel_fetch_update(struct intel_atomic_state *state,
 		goto skip_sel_fetch_set_loop;
 
 	/* Wa_14014971492 */
-	if ((IS_DISPLAY_IP_STEP(dev_priv, IP_VER(14, 0), STEP_A0, STEP_B0) ||
-	     IS_ALDERLAKE_P(dev_priv) || IS_TIGERLAKE(dev_priv)) &&
-	    crtc_state->splitter.enable)
+	if ((IS_DISPLAY_IP_STEP(i915, IP_VER(14, 0), STEP_A0, STEP_B0) ||
+	     IS_ALDERLAKE_P(i915) || IS_TIGERLAKE(i915)) &&
+	     crtc_state->splitter.enable)
 		pipe_clip.y1 = 0;
 
 	ret = drm_atomic_add_affected_planes(&state->base, &crtc->base);
@@ -2149,7 +2174,14 @@  int intel_psr2_sel_fetch_update(struct intel_atomic_state *state,
 		}
 	}
 
+	if (full_update)
+		goto skip_sel_fetch_set_loop;
+
+	full_update = psr2_sel_fetch_not_optimal(i915, &pipe_clip,
+						 &crtc_state->pipe_src);
+
 skip_sel_fetch_set_loop:
+	crtc_state->full_frame_fetch = full_update;
 	psr2_man_trk_ctl_calc(crtc_state, &pipe_clip, full_update);
 	return 0;
 }