Re: [PATCH 05/20] drm/i915/fbc: Nuke more FBC state

[Date Prev][Date Next][Thread Prev][Thread Next][Date Index][Thread Index]

 



> -----Original Message-----
> From: Intel-gfx <intel-gfx-bounces@xxxxxxxxxxxxxxxxxxxxx> On Behalf Of Ville
> Syrjala
> Sent: Wednesday, November 24, 2021 1:37 PM
> To: intel-gfx@xxxxxxxxxxxxxxxxxxxxx
> Subject:  [PATCH 05/20] drm/i915/fbc: Nuke more FBC state
> 
> From: Ville Syrjälä <ville.syrjala@xxxxxxxxxxxxxxx>
> 
> There isn't a good reason why we'd have to cache all this plane state stuff in the
> FBC state. Instead we can just pre-calculate what FBC will really need.
> 
> Signed-off-by: Ville Syrjälä <ville.syrjala@xxxxxxxxxxxxxxx>

Reviewed-by: Mika Kahola <mika.kahola@xxxxxxxxx>

> ---
>  drivers/gpu/drm/i915/display/intel_fbc.c | 132 +++++++++++------------
>  drivers/gpu/drm/i915/i915_drv.h          |  20 +---
>  2 files changed, 67 insertions(+), 85 deletions(-)
> 
> diff --git a/drivers/gpu/drm/i915/display/intel_fbc.c
> b/drivers/gpu/drm/i915/display/intel_fbc.c
> index 6368dddf977c..1e8b75cdfad8 100644
> --- a/drivers/gpu/drm/i915/display/intel_fbc.c
> +++ b/drivers/gpu/drm/i915/display/intel_fbc.c
> @@ -73,25 +73,25 @@ static unsigned int intel_fbc_plane_stride(const struct
> intel_plane_state *plane  }
> 
>  /* plane stride based cfb stride in bytes, assuming 1:1 compression limit */ -
> static unsigned int _intel_fbc_cfb_stride(const struct intel_fbc_state_cache
> *cache)
> +static unsigned int _intel_fbc_cfb_stride(const struct
> +intel_plane_state *plane_state)
>  {
>  	unsigned int cpp = 4; /* FBC always 4 bytes per pixel */
> 
> -	return cache->fb.stride * cpp;
> +	return intel_fbc_plane_stride(plane_state) * cpp;
>  }
> 
>  /* minimum acceptable cfb stride in bytes, assuming 1:1 compression limit */ -
> static unsigned int skl_fbc_min_cfb_stride(struct intel_fbc *fbc,
> -					   const struct intel_fbc_state_cache
> *cache)
> +static unsigned int skl_fbc_min_cfb_stride(const struct
> +intel_plane_state *plane_state)
>  {
> -	struct drm_i915_private *i915 = fbc->i915;
> +	struct drm_i915_private *i915 = to_i915(plane_state->uapi.plane->dev);
>  	unsigned int limit = 4; /* 1:4 compression limit is the worst case */
>  	unsigned int cpp = 4; /* FBC always 4 bytes per pixel */
> +	unsigned int width = drm_rect_width(&plane_state->uapi.src) >> 16;
>  	unsigned int height = 4; /* FBC segment is 4 lines */
>  	unsigned int stride;
> 
>  	/* minimum segment stride we can use */
> -	stride = cache->plane.src_w * cpp * height / limit;
> +	stride = width * cpp * height / limit;
> 
>  	/*
>  	 * Wa_16011863758: icl+
> @@ -111,11 +111,10 @@ static unsigned int skl_fbc_min_cfb_stride(struct
> intel_fbc *fbc,  }
> 
>  /* properly aligned cfb stride in bytes, assuming 1:1 compression limit */ -static
> unsigned int intel_fbc_cfb_stride(struct intel_fbc *fbc,
> -					 const struct intel_fbc_state_cache
> *cache)
> +static unsigned int intel_fbc_cfb_stride(const struct intel_plane_state
> +*plane_state)
>  {
> -	struct drm_i915_private *i915 = fbc->i915;
> -	unsigned int stride = _intel_fbc_cfb_stride(cache);
> +	struct drm_i915_private *i915 = to_i915(plane_state->uapi.plane->dev);
> +	unsigned int stride = _intel_fbc_cfb_stride(plane_state);
> 
>  	/*
>  	 * At least some of the platforms require each 4 line segment to @@ -
> 123,30 +122,30 @@ static unsigned int intel_fbc_cfb_stride(struct intel_fbc
> *fbc,
>  	 * that regardless of the compression limit we choose later.
>  	 */
>  	if (DISPLAY_VER(i915) >= 9)
> -		return max(ALIGN(stride, 512), skl_fbc_min_cfb_stride(fbc,
> cache));
> +		return max(ALIGN(stride, 512),
> skl_fbc_min_cfb_stride(plane_state));
>  	else
>  		return stride;
>  }
> 
> -static unsigned int intel_fbc_cfb_size(struct intel_fbc *fbc,
> -				       const struct intel_fbc_state_cache *cache)
> +static unsigned int intel_fbc_cfb_size(const struct intel_plane_state
> +*plane_state)
>  {
> -	struct drm_i915_private *i915 = fbc->i915;
> -	int lines = cache->plane.src_h;
> +	struct drm_i915_private *i915 = to_i915(plane_state->uapi.plane->dev);
> +	int lines = drm_rect_height(&plane_state->uapi.src) >> 16;
> 
>  	if (DISPLAY_VER(i915) == 7)
>  		lines = min(lines, 2048);
>  	else if (DISPLAY_VER(i915) >= 8)
>  		lines = min(lines, 2560);
> 
> -	return lines * intel_fbc_cfb_stride(fbc, cache);
> +	return lines * intel_fbc_cfb_stride(plane_state);
>  }
> 
> -static u16 intel_fbc_override_cfb_stride(struct intel_fbc *fbc,
> -					 const struct intel_fbc_state_cache
> *cache)
> +static u16 intel_fbc_override_cfb_stride(const struct intel_plane_state
> +*plane_state)
>  {
> -	unsigned int stride = _intel_fbc_cfb_stride(cache);
> -	unsigned int stride_aligned = intel_fbc_cfb_stride(fbc, cache);
> +	struct drm_i915_private *i915 = to_i915(plane_state->uapi.plane->dev);
> +	unsigned int stride_aligned = intel_fbc_cfb_stride(plane_state);
> +	unsigned int stride = _intel_fbc_cfb_stride(plane_state);
> +	const struct drm_framebuffer *fb = plane_state->hw.fb;
> 
>  	/*
>  	 * Override stride in 64 byte units per 4 line segment.
> @@ -156,8 +155,7 @@ static u16 intel_fbc_override_cfb_stride(struct intel_fbc
> *fbc,
>  	 * we always need to use the override there.
>  	 */
>  	if (stride != stride_aligned ||
> -	    (DISPLAY_VER(fbc->i915) == 9 &&
> -	     cache->fb.modifier == DRM_FORMAT_MOD_LINEAR))
> +	    (DISPLAY_VER(i915) == 9 && fb->modifier ==
> DRM_FORMAT_MOD_LINEAR))
>  		return stride_aligned * 4 / 64;
> 
>  	return 0;
> @@ -925,31 +923,22 @@ static bool tiling_is_valid(const struct
> intel_plane_state *plane_state)
>  	}
>  }
> 
> -static void intel_fbc_update_state_cache(struct intel_crtc *crtc,
> -					 const struct intel_crtc_state
> *crtc_state,
> -					 const struct intel_plane_state
> *plane_state)
> +static void intel_fbc_update_state_cache(struct intel_atomic_state *state,
> +					 struct intel_crtc *crtc,
> +					 struct intel_plane *plane)
>  {
> -	struct drm_i915_private *i915 = to_i915(crtc->base.dev);
> -	struct intel_fbc *fbc = &i915->fbc;
> +	struct drm_i915_private *i915 = to_i915(state->base.dev);
> +	const struct intel_crtc_state *crtc_state =
> +		intel_atomic_get_new_crtc_state(state, crtc);
> +	const struct intel_plane_state *plane_state =
> +		intel_atomic_get_new_plane_state(state, plane);
> +	struct intel_fbc *fbc = plane->fbc;
>  	struct intel_fbc_state_cache *cache = &fbc->state_cache;
> -	struct drm_framebuffer *fb = plane_state->hw.fb;
> 
>  	cache->no_fbc_reason = plane_state->no_fbc_reason;
>  	if (cache->no_fbc_reason)
>  		return;
> 
> -	/*
> -	 * Src coordinates are already rotated by 270 degrees for
> -	 * the 90/270 degree plane rotation cases (to match the
> -	 * GTT mapping), hence no need to account for rotation here.
> -	 */
> -	cache->plane.src_w = drm_rect_width(&plane_state->uapi.src) >> 16;
> -	cache->plane.src_h = drm_rect_height(&plane_state->uapi.src) >> 16;
> -
> -	cache->fb.format = fb->format;
> -	cache->fb.modifier = fb->modifier;
> -	cache->fb.stride = intel_fbc_plane_stride(plane_state);
> -
>  	/* FBC1 compression interval: arbitrary choice of 1 second */
>  	cache->interval = drm_mode_vrefresh(&crtc_state-
> >hw.adjusted_mode);
> 
> @@ -963,12 +952,15 @@ static void intel_fbc_update_state_cache(struct
> intel_crtc *crtc,
>  		cache->fence_id = plane_state->ggtt_vma->fence->id;
>  	else
>  		cache->fence_id = -1;
> +
> +	cache->cfb_stride = intel_fbc_cfb_stride(plane_state);
> +	cache->cfb_size = intel_fbc_cfb_size(plane_state);
> +	cache->override_cfb_stride =
> +intel_fbc_override_cfb_stride(plane_state);
>  }
> 
>  static bool intel_fbc_cfb_size_changed(struct intel_fbc *fbc)  {
> -	return intel_fbc_cfb_size(fbc, &fbc->state_cache) >
> -		fbc->compressed_fb.size * fbc->limit;
> +	return fbc->state_cache.cfb_size > fbc->compressed_fb.size *
> +fbc->limit;
>  }
> 
>  static bool intel_fbc_can_enable(struct intel_fbc *fbc) @@ -1178,45 +1170,53
> @@ static void intel_fbc_get_reg_params(struct intel_fbc *fbc,
>  	params->interval = cache->interval;
>  	params->crtc.i9xx_plane = to_intel_plane(crtc->base.primary)-
> >i9xx_plane;
> 
> -	params->fb.format = cache->fb.format;
> -	params->fb.modifier = cache->fb.modifier;
> -	params->fb.stride = cache->fb.stride;
> -
> -	params->cfb_stride = intel_fbc_cfb_stride(fbc, cache);
> -	params->cfb_size = intel_fbc_cfb_size(fbc, cache);
> -	params->override_cfb_stride = intel_fbc_override_cfb_stride(fbc,
> cache);
> +	params->cfb_stride = cache->cfb_stride;
> +	params->cfb_size = cache->cfb_size;
> +	params->override_cfb_stride = cache->override_cfb_stride;
>  }
> 
> -static bool intel_fbc_can_flip_nuke(const struct intel_crtc_state *crtc_state)
> +static bool intel_fbc_can_flip_nuke(struct intel_atomic_state *state,
> +				    struct intel_crtc *crtc,
> +				    struct intel_plane *plane)
>  {
> -	struct intel_crtc *crtc = to_intel_crtc(crtc_state->uapi.crtc);
> -	struct drm_i915_private *i915 = to_i915(crtc->base.dev);
> -	struct intel_fbc *fbc = &i915->fbc;
> +	struct intel_fbc *fbc = plane->fbc;
> +	const struct intel_crtc_state *new_crtc_state =
> +		intel_atomic_get_new_crtc_state(state, crtc);
> +	const struct intel_plane_state *old_plane_state =
> +		intel_atomic_get_old_plane_state(state, plane);
> +	const struct intel_plane_state *new_plane_state =
> +		intel_atomic_get_new_plane_state(state, plane);
> +	const struct drm_framebuffer *old_fb = old_plane_state->hw.fb;
> +	const struct drm_framebuffer *new_fb = new_plane_state->hw.fb;
>  	const struct intel_fbc_state_cache *cache = &fbc->state_cache;
>  	const struct intel_fbc_reg_params *params = &fbc->params;
> 
> -	if (drm_atomic_crtc_needs_modeset(&crtc_state->uapi))
> +	if (drm_atomic_crtc_needs_modeset(&new_crtc_state->uapi))
>  		return false;
> 
>  	if (!intel_fbc_can_activate(crtc))
>  		return false;
> 
> -	if (params->fb.format != cache->fb.format)
> +	if (!old_fb || !new_fb)
>  		return false;
> 
> -	if (params->fb.modifier != cache->fb.modifier)
> +	if (old_fb->format->format != new_fb->format->format)
>  		return false;
> 
> -	if (params->fb.stride != cache->fb.stride)
> +	if (old_fb->modifier != new_fb->modifier)
>  		return false;
> 
> -	if (params->cfb_stride != intel_fbc_cfb_stride(fbc, cache))
> +	if (intel_fbc_plane_stride(old_plane_state) !=
> +	    intel_fbc_plane_stride(new_plane_state))
>  		return false;
> 
> -	if (params->cfb_size != intel_fbc_cfb_size(fbc, cache))
> +	if (params->cfb_stride != cache->cfb_stride)
>  		return false;
> 
> -	if (params->override_cfb_stride != intel_fbc_override_cfb_stride(fbc,
> cache))
> +	if (params->cfb_size != cache->cfb_size)
> +		return false;
> +
> +	if (params->override_cfb_stride != cache->override_cfb_stride)
>  		return false;
> 
>  	return true;
> @@ -1226,8 +1226,6 @@ bool intel_fbc_pre_update(struct intel_atomic_state
> *state,
>  			  struct intel_crtc *crtc)
>  {
>  	struct intel_plane *plane = to_intel_plane(crtc->base.primary);
> -	const struct intel_crtc_state *crtc_state =
> -		intel_atomic_get_new_crtc_state(state, crtc);
>  	const struct intel_plane_state *plane_state =
>  		intel_atomic_get_new_plane_state(state, plane);
>  	struct drm_i915_private *i915 = to_i915(crtc->base.dev); @@ -1243,10
> +1241,10 @@ bool intel_fbc_pre_update(struct intel_atomic_state *state,
>  	if (fbc->crtc != crtc)
>  		goto unlock;
> 
> -	intel_fbc_update_state_cache(crtc, crtc_state, plane_state);
> +	intel_fbc_update_state_cache(state, crtc, plane);
>  	fbc->flip_pending = true;
> 
> -	if (!intel_fbc_can_flip_nuke(crtc_state)) {
> +	if (!intel_fbc_can_flip_nuke(state, crtc, plane)) {
>  		intel_fbc_deactivate(fbc, reason);
> 
>  		/*
> @@ -1425,8 +1423,6 @@ static void intel_fbc_enable(struct intel_atomic_state
> *state,  {
>  	struct drm_i915_private *i915 = to_i915(crtc->base.dev);
>  	struct intel_plane *plane = to_intel_plane(crtc->base.primary);
> -	const struct intel_crtc_state *crtc_state =
> -		intel_atomic_get_new_crtc_state(state, crtc);
>  	const struct intel_plane_state *plane_state =
>  		intel_atomic_get_new_plane_state(state, plane);
>  	struct intel_fbc *fbc = plane->fbc;
> @@ -1455,12 +1451,12 @@ static void intel_fbc_enable(struct
> intel_atomic_state *state,
> 
>  	drm_WARN_ON(&i915->drm, fbc->active);
> 
> -	intel_fbc_update_state_cache(crtc, crtc_state, plane_state);
> +	intel_fbc_update_state_cache(state, crtc, plane);
> 
>  	if (cache->no_fbc_reason)
>  		goto out;
> 
> -	if (intel_fbc_alloc_cfb(fbc, intel_fbc_cfb_size(fbc, cache), min_limit)) {
> +	if (intel_fbc_alloc_cfb(fbc, intel_fbc_cfb_size(plane_state),
> +min_limit)) {
>  		fbc->no_fbc_reason = "not enough stolen memory";
>  		goto out;
>  	}
> diff --git a/drivers/gpu/drm/i915/i915_drv.h b/drivers/gpu/drm/i915/i915_drv.h
> index d79aa827d937..66fa46d41fa5 100644
> --- a/drivers/gpu/drm/i915/i915_drv.h
> +++ b/drivers/gpu/drm/i915/i915_drv.h
> @@ -436,18 +436,10 @@ struct intel_fbc {
>  	struct intel_fbc_state_cache {
>  		const char *no_fbc_reason;
> 
> -		struct {
> -			int src_w;
> -			int src_h;
> -		} plane;
> -
> -		struct {
> -			const struct drm_format_info *format;
> -			unsigned int stride;
> -			u64 modifier;
> -		} fb;
> -
> +		unsigned int cfb_stride;
> +		unsigned int cfb_size;
>  		unsigned int fence_y_offset;
> +		u16 override_cfb_stride;
>  		u16 interval;
>  		s8 fence_id;
>  	} state_cache;
> @@ -464,12 +456,6 @@ struct intel_fbc {
>  			enum i9xx_plane_id i9xx_plane;
>  		} crtc;
> 
> -		struct {
> -			const struct drm_format_info *format;
> -			unsigned int stride;
> -			u64 modifier;
> -		} fb;
> -
>  		unsigned int cfb_stride;
>  		unsigned int cfb_size;
>  		unsigned int fence_y_offset;
> --
> 2.32.0





[Index of Archives]     [AMD Graphics]     [Linux USB Devel]     [Linux Audio Users]     [Yosemite News]     [Linux Kernel]     [Linux SCSI]

  Powered by Linux