Commit fa9899da authored by Matt Roper's avatar Matt Roper

drm/i915/xehp: Loop over all gslices for INSTDONE processing

We no longer have traditional slices on Xe_HP platforms, but the
INSTDONE registers are replicated according to gslice representation
which is similar.  We can mostly re-use the existing instdone code with
just a few modifications:

 * Create an alternate instdone loop macro that will iterate over the
   flat DSS space, but still provide the gslice/dss steering values for
   compatibility with the legacy code.

 * We should allocate INSTDONE storage space according to the maximum
   number of gslices rather than the maximum number of legacy slices to
   ensure we have enough storage space to hold all of the values.  XeHP
   design has 8 gslices, whereas older platforms never had more than 3
   slices.
Signed-off-by: default avatarMatt Roper <matthew.d.roper@intel.com>
Reviewed-by: default avatarLucas De Marchi <lucas.demarchi@intel.com>
Link: https://patchwork.freedesktop.org/patch/msgid/20210805163647.801064-3-matthew.d.roper@intel.com
parent dae2d288
...@@ -1163,16 +1163,16 @@ void intel_engine_get_instdone(const struct intel_engine_cs *engine, ...@@ -1163,16 +1163,16 @@ void intel_engine_get_instdone(const struct intel_engine_cs *engine,
u32 mmio_base = engine->mmio_base; u32 mmio_base = engine->mmio_base;
int slice; int slice;
int subslice; int subslice;
int iter;
memset(instdone, 0, sizeof(*instdone)); memset(instdone, 0, sizeof(*instdone));
switch (GRAPHICS_VER(i915)) { if (GRAPHICS_VER(i915) >= 8) {
default:
instdone->instdone = instdone->instdone =
intel_uncore_read(uncore, RING_INSTDONE(mmio_base)); intel_uncore_read(uncore, RING_INSTDONE(mmio_base));
if (engine->id != RCS0) if (engine->id != RCS0)
break; return;
instdone->slice_common = instdone->slice_common =
intel_uncore_read(uncore, GEN7_SC_INSTDONE); intel_uncore_read(uncore, GEN7_SC_INSTDONE);
...@@ -1182,6 +1182,17 @@ void intel_engine_get_instdone(const struct intel_engine_cs *engine, ...@@ -1182,6 +1182,17 @@ void intel_engine_get_instdone(const struct intel_engine_cs *engine,
instdone->slice_common_extra[1] = instdone->slice_common_extra[1] =
intel_uncore_read(uncore, GEN12_SC_INSTDONE_EXTRA2); intel_uncore_read(uncore, GEN12_SC_INSTDONE_EXTRA2);
} }
if (GRAPHICS_VER_FULL(i915) >= IP_VER(12, 50)) {
for_each_instdone_gslice_dss_xehp(i915, sseu, iter, slice, subslice) {
instdone->sampler[slice][subslice] =
read_subslice_reg(engine, slice, subslice,
GEN7_SAMPLER_INSTDONE);
instdone->row[slice][subslice] =
read_subslice_reg(engine, slice, subslice,
GEN7_ROW_INSTDONE);
}
} else {
for_each_instdone_slice_subslice(i915, sseu, slice, subslice) { for_each_instdone_slice_subslice(i915, sseu, slice, subslice) {
instdone->sampler[slice][subslice] = instdone->sampler[slice][subslice] =
read_subslice_reg(engine, slice, subslice, read_subslice_reg(engine, slice, subslice,
...@@ -1190,13 +1201,13 @@ void intel_engine_get_instdone(const struct intel_engine_cs *engine, ...@@ -1190,13 +1201,13 @@ void intel_engine_get_instdone(const struct intel_engine_cs *engine,
read_subslice_reg(engine, slice, subslice, read_subslice_reg(engine, slice, subslice,
GEN7_ROW_INSTDONE); GEN7_ROW_INSTDONE);
} }
break; }
case 7: } else if (GRAPHICS_VER(i915) >= 7) {
instdone->instdone = instdone->instdone =
intel_uncore_read(uncore, RING_INSTDONE(mmio_base)); intel_uncore_read(uncore, RING_INSTDONE(mmio_base));
if (engine->id != RCS0) if (engine->id != RCS0)
break; return;
instdone->slice_common = instdone->slice_common =
intel_uncore_read(uncore, GEN7_SC_INSTDONE); intel_uncore_read(uncore, GEN7_SC_INSTDONE);
...@@ -1204,22 +1215,15 @@ void intel_engine_get_instdone(const struct intel_engine_cs *engine, ...@@ -1204,22 +1215,15 @@ void intel_engine_get_instdone(const struct intel_engine_cs *engine,
intel_uncore_read(uncore, GEN7_SAMPLER_INSTDONE); intel_uncore_read(uncore, GEN7_SAMPLER_INSTDONE);
instdone->row[0][0] = instdone->row[0][0] =
intel_uncore_read(uncore, GEN7_ROW_INSTDONE); intel_uncore_read(uncore, GEN7_ROW_INSTDONE);
} else if (GRAPHICS_VER(i915) >= 4) {
break;
case 6:
case 5:
case 4:
instdone->instdone = instdone->instdone =
intel_uncore_read(uncore, RING_INSTDONE(mmio_base)); intel_uncore_read(uncore, RING_INSTDONE(mmio_base));
if (engine->id == RCS0) if (engine->id == RCS0)
/* HACK: Using the wrong struct member */ /* HACK: Using the wrong struct member */
instdone->slice_common = instdone->slice_common =
intel_uncore_read(uncore, GEN4_INSTDONE1); intel_uncore_read(uncore, GEN4_INSTDONE1);
break; } else {
case 3:
case 2:
instdone->instdone = intel_uncore_read(uncore, GEN2_INSTDONE); instdone->instdone = intel_uncore_read(uncore, GEN2_INSTDONE);
break;
} }
} }
......
...@@ -67,8 +67,8 @@ struct intel_instdone { ...@@ -67,8 +67,8 @@ struct intel_instdone {
/* The following exist only in the RCS engine */ /* The following exist only in the RCS engine */
u32 slice_common; u32 slice_common;
u32 slice_common_extra[2]; u32 slice_common_extra[2];
u32 sampler[I915_MAX_SLICES][I915_MAX_SUBSLICES]; u32 sampler[GEN_MAX_GSLICES][I915_MAX_SUBSLICES];
u32 row[I915_MAX_SLICES][I915_MAX_SUBSLICES]; u32 row[GEN_MAX_GSLICES][I915_MAX_SUBSLICES];
}; };
/* /*
...@@ -578,4 +578,12 @@ intel_engine_has_relative_mmio(const struct intel_engine_cs * const engine) ...@@ -578,4 +578,12 @@ intel_engine_has_relative_mmio(const struct intel_engine_cs * const engine)
for_each_if((instdone_has_slice(dev_priv_, sseu_, slice_)) && \ for_each_if((instdone_has_slice(dev_priv_, sseu_, slice_)) && \
(instdone_has_subslice(dev_priv_, sseu_, slice_, \ (instdone_has_subslice(dev_priv_, sseu_, slice_, \
subslice_))) subslice_)))
#define for_each_instdone_gslice_dss_xehp(dev_priv_, sseu_, iter_, gslice_, dss_) \
for ((iter_) = 0, (gslice_) = 0, (dss_) = 0; \
(iter_) < GEN_MAX_SUBSLICES; \
(iter_)++, (gslice_) = (iter_) / GEN_DSS_PER_GSLICE, \
(dss_) = (iter_) % GEN_DSS_PER_GSLICE) \
for_each_if(intel_sseu_has_subslice((sseu_), 0, (iter_)))
#endif /* __INTEL_ENGINE_TYPES_H__ */ #endif /* __INTEL_ENGINE_TYPES_H__ */
...@@ -26,6 +26,9 @@ struct drm_printer; ...@@ -26,6 +26,9 @@ struct drm_printer;
#define GEN_DSS_PER_CSLICE 8 #define GEN_DSS_PER_CSLICE 8
#define GEN_DSS_PER_MSLICE 8 #define GEN_DSS_PER_MSLICE 8
#define GEN_MAX_GSLICES (GEN_MAX_SUBSLICES / GEN_DSS_PER_GSLICE)
#define GEN_MAX_CSLICES (GEN_MAX_SUBSLICES / GEN_DSS_PER_CSLICE)
struct sseu_dev_info { struct sseu_dev_info {
u8 slice_mask; u8 slice_mask;
u8 subslice_mask[GEN_MAX_SLICES * GEN_MAX_SUBSLICE_STRIDE]; u8 subslice_mask[GEN_MAX_SLICES * GEN_MAX_SUBSLICE_STRIDE];
...@@ -78,6 +81,10 @@ intel_sseu_has_subslice(const struct sseu_dev_info *sseu, int slice, ...@@ -78,6 +81,10 @@ intel_sseu_has_subslice(const struct sseu_dev_info *sseu, int slice,
u8 mask; u8 mask;
int ss_idx = subslice / BITS_PER_BYTE; int ss_idx = subslice / BITS_PER_BYTE;
if (slice >= sseu->max_slices ||
subslice >= sseu->max_subslices)
return false;
GEM_BUG_ON(ss_idx >= sseu->ss_stride); GEM_BUG_ON(ss_idx >= sseu->ss_stride);
mask = sseu->subslice_mask[slice * sseu->ss_stride + ss_idx]; mask = sseu->subslice_mask[slice * sseu->ss_stride + ss_idx];
......
...@@ -444,6 +444,19 @@ static void error_print_instdone(struct drm_i915_error_state_buf *m, ...@@ -444,6 +444,19 @@ static void error_print_instdone(struct drm_i915_error_state_buf *m,
if (GRAPHICS_VER(m->i915) <= 6) if (GRAPHICS_VER(m->i915) <= 6)
return; return;
if (GRAPHICS_VER_FULL(m->i915) >= IP_VER(12, 50)) {
int iter;
for_each_instdone_gslice_dss_xehp(m->i915, sseu, iter, slice, subslice)
err_printf(m, " SAMPLER_INSTDONE[%d][%d]: 0x%08x\n",
slice, subslice,
ee->instdone.sampler[slice][subslice]);
for_each_instdone_gslice_dss_xehp(m->i915, sseu, iter, slice, subslice)
err_printf(m, " ROW_INSTDONE[%d][%d]: 0x%08x\n",
slice, subslice,
ee->instdone.row[slice][subslice]);
} else {
for_each_instdone_slice_subslice(m->i915, sseu, slice, subslice) for_each_instdone_slice_subslice(m->i915, sseu, slice, subslice)
err_printf(m, " SAMPLER_INSTDONE[%d][%d]: 0x%08x\n", err_printf(m, " SAMPLER_INSTDONE[%d][%d]: 0x%08x\n",
slice, subslice, slice, subslice,
...@@ -453,6 +466,7 @@ static void error_print_instdone(struct drm_i915_error_state_buf *m, ...@@ -453,6 +466,7 @@ static void error_print_instdone(struct drm_i915_error_state_buf *m,
err_printf(m, " ROW_INSTDONE[%d][%d]: 0x%08x\n", err_printf(m, " ROW_INSTDONE[%d][%d]: 0x%08x\n",
slice, subslice, slice, subslice,
ee->instdone.row[slice][subslice]); ee->instdone.row[slice][subslice]);
}
if (GRAPHICS_VER(m->i915) < 12) if (GRAPHICS_VER(m->i915) < 12)
return; return;
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment