Commit 4cfd1665 authored by Matt Roper's avatar Matt Roper
Browse files

drm/i915/sseu: Simplify gen11+ SSEU handling



Although gen11 and gen12 architectures supported the concept of multiple
slices, in practice all the platforms that were actually designed only
had a single slice (i.e., note the parameters to 'intel_sseu_set_info'
that we pass for each platform).  We can simplify the code slightly by
dropping the multi-slice logic from gen11+ platforms.

v2:
 - Promote drm_dbg to drm_WARN_ON if the slice fuse register reports
   unexpected fusing.  (Tvrtko)

Cc: Tvrtko Ursulin <tvrtko.ursulin@linux.intel.com>
Signed-off-by: default avatarMatt Roper <matthew.d.roper@intel.com>
Acked-by: default avatarTvrtko Ursulin <tvrtko.ursulin@intel.com>
Reviewed-by: default avatarBalasubramani Vivekanandan <balasubramani.vivekanandan@intel.com>
Link: https://patchwork.freedesktop.org/patch/msgid/20220601150725.521468-4-matthew.d.roper@intel.com
parent aa2bdc48
Loading
Loading
Loading
Loading
+36 −40
Original line number Diff line number Diff line
@@ -119,52 +119,37 @@ static u16 compute_eu_total(const struct sseu_dev_info *sseu)
	return total;
}

static u32 get_ss_stride_mask(struct sseu_dev_info *sseu, u8 s, u32 ss_en)
{
	u32 ss_mask;

	ss_mask = ss_en >> (s * sseu->max_subslices);
	ss_mask &= GENMASK(sseu->max_subslices - 1, 0);

	return ss_mask;
}

static void gen11_compute_sseu_info(struct sseu_dev_info *sseu, u8 s_en,
static void gen11_compute_sseu_info(struct sseu_dev_info *sseu,
				    u32 g_ss_en, u32 c_ss_en, u16 eu_en)
{
	int s, ss;
	u32 valid_ss_mask = GENMASK(sseu->max_subslices - 1, 0);
	int ss;

	/* g_ss_en/c_ss_en represent entire subslice mask across all slices */
	GEM_BUG_ON(sseu->max_slices * sseu->max_subslices >
		   sizeof(g_ss_en) * BITS_PER_BYTE);

	for (s = 0; s < sseu->max_slices; s++) {
		if ((s_en & BIT(s)) == 0)
			continue;

		sseu->slice_mask |= BIT(s);
	sseu->slice_mask |= BIT(0);

	/*
		 * XeHP introduces the concept of compute vs geometry DSS. To
		 * reduce variation between GENs around subslice usage, store a
		 * mask for both the geometry and compute enabled masks since
		 * userspace will need to be able to query these masks
		 * independently.  Also compute a total enabled subslice count
		 * for the purposes of selecting subslices to use in a
		 * particular GEM context.
	 * XeHP introduces the concept of compute vs geometry DSS. To reduce
	 * variation between GENs around subslice usage, store a mask for both
	 * the geometry and compute enabled masks since userspace will need to
	 * be able to query these masks independently.  Also compute a total
	 * enabled subslice count for the purposes of selecting subslices to
	 * use in a particular GEM context.
	 */
		intel_sseu_set_subslices(sseu, s, sseu->compute_subslice_mask,
					 get_ss_stride_mask(sseu, s, c_ss_en));
		intel_sseu_set_subslices(sseu, s, sseu->geometry_subslice_mask,
					 get_ss_stride_mask(sseu, s, g_ss_en));
		intel_sseu_set_subslices(sseu, s, sseu->subslice_mask,
					 get_ss_stride_mask(sseu, s,
							    g_ss_en | c_ss_en));
	intel_sseu_set_subslices(sseu, 0, sseu->compute_subslice_mask,
				 c_ss_en & valid_ss_mask);
	intel_sseu_set_subslices(sseu, 0, sseu->geometry_subslice_mask,
				 g_ss_en & valid_ss_mask);
	intel_sseu_set_subslices(sseu, 0, sseu->subslice_mask,
				 (g_ss_en | c_ss_en) & valid_ss_mask);

	for (ss = 0; ss < sseu->max_subslices; ss++)
			if (intel_sseu_has_subslice(sseu, s, ss))
				sseu_set_eus(sseu, s, ss, eu_en);
	}
		if (intel_sseu_has_subslice(sseu, 0, ss))
			sseu_set_eus(sseu, 0, ss, eu_en);

	sseu->eu_per_subslice = hweight16(eu_en);
	sseu->eu_total = compute_eu_total(sseu);
}
@@ -196,7 +181,7 @@ static void xehp_sseu_info_init(struct intel_gt *gt)
		if (eu_en_fuse & BIT(eu))
			eu_en |= BIT(eu * 2) | BIT(eu * 2 + 1);

	gen11_compute_sseu_info(sseu, 0x1, g_dss_en, c_dss_en, eu_en);
	gen11_compute_sseu_info(sseu, g_dss_en, c_dss_en, eu_en);
}

static void gen12_sseu_info_init(struct intel_gt *gt)
@@ -216,8 +201,13 @@ static void gen12_sseu_info_init(struct intel_gt *gt)
	 */
	intel_sseu_set_info(sseu, 1, 6, 16);

	/*
	 * Although gen12 architecture supported multiple slices, TGL, RKL,
	 * DG1, and ADL only had a single slice.
	 */
	s_en = intel_uncore_read(uncore, GEN11_GT_SLICE_ENABLE) &
		GEN11_GT_S_ENA_MASK;
	drm_WARN_ON(&gt->i915->drm, s_en != 0x1);

	g_dss_en = intel_uncore_read(uncore, GEN12_GT_GEOMETRY_DSS_ENABLE);

@@ -229,7 +219,7 @@ static void gen12_sseu_info_init(struct intel_gt *gt)
		if (eu_en_fuse & BIT(eu))
			eu_en |= BIT(eu * 2) | BIT(eu * 2 + 1);

	gen11_compute_sseu_info(sseu, s_en, g_dss_en, 0, eu_en);
	gen11_compute_sseu_info(sseu, g_dss_en, 0, eu_en);

	/* TGL only supports slice-level power gating */
	sseu->has_slice_pg = 1;
@@ -248,14 +238,20 @@ static void gen11_sseu_info_init(struct intel_gt *gt)
	else
		intel_sseu_set_info(sseu, 1, 8, 8);

	/*
	 * Although gen11 architecture supported multiple slices, ICL and
	 * EHL/JSL only had a single slice in practice.
	 */
	s_en = intel_uncore_read(uncore, GEN11_GT_SLICE_ENABLE) &
		GEN11_GT_S_ENA_MASK;
	drm_WARN_ON(&gt->i915->drm, s_en != 0x1);

	ss_en = ~intel_uncore_read(uncore, GEN11_GT_SUBSLICE_DISABLE);

	eu_en = ~(intel_uncore_read(uncore, GEN11_EU_DISABLE) &
		  GEN11_EU_DIS_MASK);

	gen11_compute_sseu_info(sseu, s_en, ss_en, 0, eu_en);
	gen11_compute_sseu_info(sseu, ss_en, 0, eu_en);

	/* ICL has no power gating restrictions. */
	sseu->has_slice_pg = 1;