Commit 873c995a authored by Ville Syrjälä's avatar Ville Syrjälä
Browse files

drm/i915/fbc: Nuke more FBC state



There isn't a good reason why we'd have to cache all this
plane state stuff in the FBC state. Instead we can just
pre-calculate what FBC will really need.

Signed-off-by: default avatarVille Syrjälä <ville.syrjala@linux.intel.com>
Link: https://patchwork.freedesktop.org/patch/msgid/20211124113652.22090-6-ville.syrjala@linux.intel.com


Reviewed-by: default avatarMika Kahola <mika.kahola@intel.com>
parent 26679087
Loading
Loading
Loading
Loading
+64 −68
Original line number Diff line number Diff line
@@ -73,25 +73,25 @@ static unsigned int intel_fbc_plane_stride(const struct intel_plane_state *plane
}

/* plane stride based cfb stride in bytes, assuming 1:1 compression limit */
static unsigned int _intel_fbc_cfb_stride(const struct intel_fbc_state_cache *cache)
static unsigned int _intel_fbc_cfb_stride(const struct intel_plane_state *plane_state)
{
	unsigned int cpp = 4; /* FBC always 4 bytes per pixel */

	return cache->fb.stride * cpp;
	return intel_fbc_plane_stride(plane_state) * cpp;
}

/* minimum acceptable cfb stride in bytes, assuming 1:1 compression limit */
static unsigned int skl_fbc_min_cfb_stride(struct intel_fbc *fbc,
					   const struct intel_fbc_state_cache *cache)
static unsigned int skl_fbc_min_cfb_stride(const struct intel_plane_state *plane_state)
{
	struct drm_i915_private *i915 = fbc->i915;
	struct drm_i915_private *i915 = to_i915(plane_state->uapi.plane->dev);
	unsigned int limit = 4; /* 1:4 compression limit is the worst case */
	unsigned int cpp = 4; /* FBC always 4 bytes per pixel */
	unsigned int width = drm_rect_width(&plane_state->uapi.src) >> 16;
	unsigned int height = 4; /* FBC segment is 4 lines */
	unsigned int stride;

	/* minimum segment stride we can use */
	stride = cache->plane.src_w * cpp * height / limit;
	stride = width * cpp * height / limit;

	/*
	 * Wa_16011863758: icl+
@@ -111,11 +111,10 @@ static unsigned int skl_fbc_min_cfb_stride(struct intel_fbc *fbc,
}

/* properly aligned cfb stride in bytes, assuming 1:1 compression limit */
static unsigned int intel_fbc_cfb_stride(struct intel_fbc *fbc,
					 const struct intel_fbc_state_cache *cache)
static unsigned int intel_fbc_cfb_stride(const struct intel_plane_state *plane_state)
{
	struct drm_i915_private *i915 = fbc->i915;
	unsigned int stride = _intel_fbc_cfb_stride(cache);
	struct drm_i915_private *i915 = to_i915(plane_state->uapi.plane->dev);
	unsigned int stride = _intel_fbc_cfb_stride(plane_state);

	/*
	 * At least some of the platforms require each 4 line segment to
@@ -123,30 +122,30 @@ static unsigned int intel_fbc_cfb_stride(struct intel_fbc *fbc,
	 * that regardless of the compression limit we choose later.
	 */
	if (DISPLAY_VER(i915) >= 9)
		return max(ALIGN(stride, 512), skl_fbc_min_cfb_stride(fbc, cache));
		return max(ALIGN(stride, 512), skl_fbc_min_cfb_stride(plane_state));
	else
		return stride;
}

static unsigned int intel_fbc_cfb_size(struct intel_fbc *fbc,
				       const struct intel_fbc_state_cache *cache)
static unsigned int intel_fbc_cfb_size(const struct intel_plane_state *plane_state)
{
	struct drm_i915_private *i915 = fbc->i915;
	int lines = cache->plane.src_h;
	struct drm_i915_private *i915 = to_i915(plane_state->uapi.plane->dev);
	int lines = drm_rect_height(&plane_state->uapi.src) >> 16;

	if (DISPLAY_VER(i915) == 7)
		lines = min(lines, 2048);
	else if (DISPLAY_VER(i915) >= 8)
		lines = min(lines, 2560);

	return lines * intel_fbc_cfb_stride(fbc, cache);
	return lines * intel_fbc_cfb_stride(plane_state);
}

static u16 intel_fbc_override_cfb_stride(struct intel_fbc *fbc,
					 const struct intel_fbc_state_cache *cache)
static u16 intel_fbc_override_cfb_stride(const struct intel_plane_state *plane_state)
{
	unsigned int stride = _intel_fbc_cfb_stride(cache);
	unsigned int stride_aligned = intel_fbc_cfb_stride(fbc, cache);
	struct drm_i915_private *i915 = to_i915(plane_state->uapi.plane->dev);
	unsigned int stride_aligned = intel_fbc_cfb_stride(plane_state);
	unsigned int stride = _intel_fbc_cfb_stride(plane_state);
	const struct drm_framebuffer *fb = plane_state->hw.fb;

	/*
	 * Override stride in 64 byte units per 4 line segment.
@@ -156,8 +155,7 @@ static u16 intel_fbc_override_cfb_stride(struct intel_fbc *fbc,
	 * we always need to use the override there.
	 */
	if (stride != stride_aligned ||
	    (DISPLAY_VER(fbc->i915) == 9 &&
	     cache->fb.modifier == DRM_FORMAT_MOD_LINEAR))
	    (DISPLAY_VER(i915) == 9 && fb->modifier == DRM_FORMAT_MOD_LINEAR))
		return stride_aligned * 4 / 64;

	return 0;
@@ -925,31 +923,22 @@ static bool tiling_is_valid(const struct intel_plane_state *plane_state)
	}
}

static void intel_fbc_update_state_cache(struct intel_crtc *crtc,
					 const struct intel_crtc_state *crtc_state,
					 const struct intel_plane_state *plane_state)
static void intel_fbc_update_state_cache(struct intel_atomic_state *state,
					 struct intel_crtc *crtc,
					 struct intel_plane *plane)
{
	struct drm_i915_private *i915 = to_i915(crtc->base.dev);
	struct intel_fbc *fbc = &i915->fbc;
	struct drm_i915_private *i915 = to_i915(state->base.dev);
	const struct intel_crtc_state *crtc_state =
		intel_atomic_get_new_crtc_state(state, crtc);
	const struct intel_plane_state *plane_state =
		intel_atomic_get_new_plane_state(state, plane);
	struct intel_fbc *fbc = plane->fbc;
	struct intel_fbc_state_cache *cache = &fbc->state_cache;
	struct drm_framebuffer *fb = plane_state->hw.fb;

	cache->no_fbc_reason = plane_state->no_fbc_reason;
	if (cache->no_fbc_reason)
		return;

	/*
	 * Src coordinates are already rotated by 270 degrees for
	 * the 90/270 degree plane rotation cases (to match the
	 * GTT mapping), hence no need to account for rotation here.
	 */
	cache->plane.src_w = drm_rect_width(&plane_state->uapi.src) >> 16;
	cache->plane.src_h = drm_rect_height(&plane_state->uapi.src) >> 16;

	cache->fb.format = fb->format;
	cache->fb.modifier = fb->modifier;
	cache->fb.stride = intel_fbc_plane_stride(plane_state);

	/* FBC1 compression interval: arbitrary choice of 1 second */
	cache->interval = drm_mode_vrefresh(&crtc_state->hw.adjusted_mode);

@@ -963,12 +952,15 @@ static void intel_fbc_update_state_cache(struct intel_crtc *crtc,
		cache->fence_id = plane_state->ggtt_vma->fence->id;
	else
		cache->fence_id = -1;

	cache->cfb_stride = intel_fbc_cfb_stride(plane_state);
	cache->cfb_size = intel_fbc_cfb_size(plane_state);
	cache->override_cfb_stride = intel_fbc_override_cfb_stride(plane_state);
}

static bool intel_fbc_cfb_size_changed(struct intel_fbc *fbc)
{
	return intel_fbc_cfb_size(fbc, &fbc->state_cache) >
		fbc->compressed_fb.size * fbc->limit;
	return fbc->state_cache.cfb_size > fbc->compressed_fb.size * fbc->limit;
}

static bool intel_fbc_can_enable(struct intel_fbc *fbc)
@@ -1178,45 +1170,53 @@ static void intel_fbc_get_reg_params(struct intel_fbc *fbc,
	params->interval = cache->interval;
	params->crtc.i9xx_plane = to_intel_plane(crtc->base.primary)->i9xx_plane;

	params->fb.format = cache->fb.format;
	params->fb.modifier = cache->fb.modifier;
	params->fb.stride = cache->fb.stride;

	params->cfb_stride = intel_fbc_cfb_stride(fbc, cache);
	params->cfb_size = intel_fbc_cfb_size(fbc, cache);
	params->override_cfb_stride = intel_fbc_override_cfb_stride(fbc, cache);
	params->cfb_stride = cache->cfb_stride;
	params->cfb_size = cache->cfb_size;
	params->override_cfb_stride = cache->override_cfb_stride;
}

static bool intel_fbc_can_flip_nuke(const struct intel_crtc_state *crtc_state)
static bool intel_fbc_can_flip_nuke(struct intel_atomic_state *state,
				    struct intel_crtc *crtc,
				    struct intel_plane *plane)
{
	struct intel_crtc *crtc = to_intel_crtc(crtc_state->uapi.crtc);
	struct drm_i915_private *i915 = to_i915(crtc->base.dev);
	struct intel_fbc *fbc = &i915->fbc;
	struct intel_fbc *fbc = plane->fbc;
	const struct intel_crtc_state *new_crtc_state =
		intel_atomic_get_new_crtc_state(state, crtc);
	const struct intel_plane_state *old_plane_state =
		intel_atomic_get_old_plane_state(state, plane);
	const struct intel_plane_state *new_plane_state =
		intel_atomic_get_new_plane_state(state, plane);
	const struct drm_framebuffer *old_fb = old_plane_state->hw.fb;
	const struct drm_framebuffer *new_fb = new_plane_state->hw.fb;
	const struct intel_fbc_state_cache *cache = &fbc->state_cache;
	const struct intel_fbc_reg_params *params = &fbc->params;

	if (drm_atomic_crtc_needs_modeset(&crtc_state->uapi))
	if (drm_atomic_crtc_needs_modeset(&new_crtc_state->uapi))
		return false;

	if (!intel_fbc_can_activate(crtc))
		return false;

	if (params->fb.format != cache->fb.format)
	if (!old_fb || !new_fb)
		return false;

	if (old_fb->format->format != new_fb->format->format)
		return false;

	if (params->fb.modifier != cache->fb.modifier)
	if (old_fb->modifier != new_fb->modifier)
		return false;

	if (params->fb.stride != cache->fb.stride)
	if (intel_fbc_plane_stride(old_plane_state) !=
	    intel_fbc_plane_stride(new_plane_state))
		return false;

	if (params->cfb_stride != intel_fbc_cfb_stride(fbc, cache))
	if (params->cfb_stride != cache->cfb_stride)
		return false;

	if (params->cfb_size != intel_fbc_cfb_size(fbc, cache))
	if (params->cfb_size != cache->cfb_size)
		return false;

	if (params->override_cfb_stride != intel_fbc_override_cfb_stride(fbc, cache))
	if (params->override_cfb_stride != cache->override_cfb_stride)
		return false;

	return true;
@@ -1226,8 +1226,6 @@ bool intel_fbc_pre_update(struct intel_atomic_state *state,
			  struct intel_crtc *crtc)
{
	struct intel_plane *plane = to_intel_plane(crtc->base.primary);
	const struct intel_crtc_state *crtc_state =
		intel_atomic_get_new_crtc_state(state, crtc);
	const struct intel_plane_state *plane_state =
		intel_atomic_get_new_plane_state(state, plane);
	struct drm_i915_private *i915 = to_i915(crtc->base.dev);
@@ -1243,10 +1241,10 @@ bool intel_fbc_pre_update(struct intel_atomic_state *state,
	if (fbc->crtc != crtc)
		goto unlock;

	intel_fbc_update_state_cache(crtc, crtc_state, plane_state);
	intel_fbc_update_state_cache(state, crtc, plane);
	fbc->flip_pending = true;

	if (!intel_fbc_can_flip_nuke(crtc_state)) {
	if (!intel_fbc_can_flip_nuke(state, crtc, plane)) {
		intel_fbc_deactivate(fbc, reason);

		/*
@@ -1425,8 +1423,6 @@ static void intel_fbc_enable(struct intel_atomic_state *state,
{
	struct drm_i915_private *i915 = to_i915(crtc->base.dev);
	struct intel_plane *plane = to_intel_plane(crtc->base.primary);
	const struct intel_crtc_state *crtc_state =
		intel_atomic_get_new_crtc_state(state, crtc);
	const struct intel_plane_state *plane_state =
		intel_atomic_get_new_plane_state(state, plane);
	struct intel_fbc *fbc = plane->fbc;
@@ -1455,12 +1451,12 @@ static void intel_fbc_enable(struct intel_atomic_state *state,

	drm_WARN_ON(&i915->drm, fbc->active);

	intel_fbc_update_state_cache(crtc, crtc_state, plane_state);
	intel_fbc_update_state_cache(state, crtc, plane);

	if (cache->no_fbc_reason)
		goto out;

	if (intel_fbc_alloc_cfb(fbc, intel_fbc_cfb_size(fbc, cache), min_limit)) {
	if (intel_fbc_alloc_cfb(fbc, intel_fbc_cfb_size(plane_state), min_limit)) {
		fbc->no_fbc_reason = "not enough stolen memory";
		goto out;
	}
+3 −17
Original line number Diff line number Diff line
@@ -415,18 +415,10 @@ struct intel_fbc {
	struct intel_fbc_state_cache {
		const char *no_fbc_reason;

		struct {
			int src_w;
			int src_h;
		} plane;

		struct {
			const struct drm_format_info *format;
			unsigned int stride;
			u64 modifier;
		} fb;

		unsigned int cfb_stride;
		unsigned int cfb_size;
		unsigned int fence_y_offset;
		u16 override_cfb_stride;
		u16 interval;
		s8 fence_id;
	} state_cache;
@@ -443,12 +435,6 @@ struct intel_fbc {
			enum i9xx_plane_id i9xx_plane;
		} crtc;

		struct {
			const struct drm_format_info *format;
			unsigned int stride;
			u64 modifier;
		} fb;

		unsigned int cfb_stride;
		unsigned int cfb_size;
		unsigned int fence_y_offset;