RE: [Intel-gfx] [PATCH 2/3] drm/i915/dg2: Add initial gt/ctx/engine workarounds

[Date Prev][Date Next][Thread Prev][Thread Next][Date Index][Thread Index]

 



This issue was not caught by CI because of a series of unfortunate events.

Previously, CI rebooted without a module blocklist, captured the boot-time
dmesg correctly, and marked it as the 'ci@boot' test, with a failure if there was a taint.

I've been making changes to make it possible to blocklist i915 and load it as
the first test of IGT; that would make it possible to remove some workarounds
and integrate the results better into our framework.

The check that decides whether i915 should be modprobed was slightly off, and
on the runs where i915 failed to load at boot, it was modprobed again,
and modprobe hung because of the existing i915. Results were not collected.

I've added the condition to the conditional modprobe, and the results
from a failed boot-time modprobe should soon be available as before,
e.g. CI_DRM_10873, later shards with SNB.

Regards,

Tomi

> From: Latvala, Petri <petri.latvala@xxxxxxxxx>
> On Tue, Nov 02, 2021 at 03:25:10PM -0700, Matt Roper wrote:
> > Bspec: 54077,68173,54833
> > Cc: Anusha Srivatsa <anusha.srivatsa@xxxxxxxxx>
> > Signed-off-by: Matt Roper <matthew.d.roper@xxxxxxxxx>
> > ---
> >  drivers/gpu/drm/i915/gt/intel_workarounds.c | 278
> +++++++++++++++++++-
> >  drivers/gpu/drm/i915/i915_reg.h             |  94 +++++--
> >  drivers/gpu/drm/i915/intel_pm.c             |  21 +-
> >  3 files changed, 372 insertions(+), 21 deletions(-)
> >
> > diff --git a/drivers/gpu/drm/i915/gt/intel_workarounds.c
> b/drivers/gpu/drm/i915/gt/intel_workarounds.c
> > index 4aaa210fc003..37fd541a9719 100644
> > --- a/drivers/gpu/drm/i915/gt/intel_workarounds.c
> > +++ b/drivers/gpu/drm/i915/gt/intel_workarounds.c
> > @@ -644,6 +644,42 @@ static void dg1_ctx_workarounds_init(struct
> intel_engine_cs *engine,
> >
> DG1_HZ_READ_SUPPRESSION_OPTIMIZATION_DISABLE);
> >  }
> >
> > +static void dg2_ctx_workarounds_init(struct intel_engine_cs *engine,
> > +				     struct
> i915_wa_list *wal)
> > +{
> > +	gen12_ctx_gt_tuning_init(engine, wal);
> > +
> > +	/* Wa_16011186671:dg2_g11 */
> > +	if (IS_DG2_GRAPHICS_STEP(engine->i915, G11, STEP_A0,
> STEP_B0)) {
> > +		wa_masked_dis(wal, VFLSKPD,
> DIS_MULT_MISS_RD_SQUASH);
> > +		wa_masked_en(wal, VFLSKPD,
> DIS_OVER_FETCH_CACHE);
> > +	}
> > +
> > +	if (IS_DG2_GRAPHICS_STEP(engine->i915, G10, STEP_A0,
> STEP_B0)) {
> > +		/* Wa_14010469329:dg2_g10 */
> > +		wa_masked_en(wal,
> GEN11_COMMON_SLICE_CHICKEN3,
> > +
> XEHP_DUAL_SIMD8_SEQ_MERGE_DISABLE);
> > +
> > +		/*
> > +		 * Wa_22010465075:dg2_g10
> > +		 * Wa_22010613112:dg2_g10
> > +		 * Wa_14010698770:dg2_g10
> > +		 */
> > +		wa_masked_en(wal,
> GEN11_COMMON_SLICE_CHICKEN3,
> > +
> GEN12_DISABLE_CPS_AWARE_COLOR_PIPE);
> > +	}
> > +
> > +	/* Wa_16013271637:dg2 */
> > +	wa_masked_en(wal, SLICE_COMMON_ECO_CHICKEN1,
> > +
> MSC_MSAA_REODER_BUF_BYPASS_DISABLE);
> > +
> > +	/* Wa_22012532006:dg2 */
> > +	if (IS_DG2_GRAPHICS_STEP(engine->i915, G10, STEP_A0,
> STEP_C0) ||
> > +	    IS_DG2_GRAPHICS_STEP(engine->i915, G11, STEP_A0,
> STEP_B0))
> > +		wa_masked_en(wal,
> GEN9_HALF_SLICE_CHICKEN7,
> > +
> DG2_DISABLE_ROUND_ENABLE_ALLOW_FOR_SSLA);
> > +}
> > +
> >  static void fakewa_disable_nestedbb_mode(struct intel_engine_cs
> *engine,
> >
> struct i915_wa_list *wal)
> >  {
> > @@ -730,7 +766,9 @@ __intel_engine_init_ctx_wa(struct intel_engine_cs
> *engine,
> >  	if (engine->class != RENDER_CLASS)
> >  		goto done;
> >
> > -	if (IS_XEHPSDV(i915))
> > +	if (IS_DG2(i915))
> > +		dg2_ctx_workarounds_init(engine, wal);
> > +	else if (IS_XEHPSDV(i915))
> >  		; /* noop; none at this time */
> >  	else if (IS_DG1(i915))
> >  		dg1_ctx_workarounds_init(engine, wal);
> > @@ -1343,12 +1381,117 @@ xehpsdv_gt_workarounds_init(struct intel_gt
> *gt, struct i915_wa_list *wal)
> >  		    GLOBAL_INVALIDATION_MODE);
> >  }
> >
> > +static void
> > +dg2_gt_workarounds_init(struct intel_gt *gt, struct i915_wa_list *wal)
> > +{
> > +	struct intel_engine_cs *engine;
> > +	int id;
> > +
> > +	xehp_init_mcr(gt, wal);
> > +
> > +	/* Wa_14011060649:dg2 */
> > +	wa_14011060649(gt, wal);
> > +
> > +	/*
> > +	 * Although there are per-engine instances of these registers,
> > +	 * they technically exist outside the engine itself and are not
> > +	 * impacted by engine resets.  Furthermore, they're part of the
> > +	 * GuC blacklist so trying to treat them as engine workarounds
> > +	 * will result in GuC initialization failure and a wedged GPU.
> > +	 */
> > +	for_each_engine(engine, gt, id) {
> > +		if (engine->class != VIDEO_DECODE_CLASS)
> > +			continue;
> > +
> > +		/* Wa_16010515920:dg2_g10 */
> > +		if (IS_DG2_GRAPHICS_STEP(gt->i915, G10,
> STEP_A0, STEP_B0))
> > +			wa_write_or(wal,
> VDBOX_CGCTL3F18(engine->mmio_base),
> > +
> ALNUNIT_CLKGATE_DIS);
> > +	}
> > +
> > +	if (IS_DG2_G10(gt->i915)) {
> > +		/* Wa_22010523718:dg2 */
> > +		wa_write_or(wal,
> UNSLICE_UNIT_LEVEL_CLKGATE,
> > +			    CG3DDISCFEG_CLKGATE_DIS);
> > +
> > +		/* Wa_14011006942:dg2 */
> > +		wa_write_or(wal,
> SUBSLICE_UNIT_LEVEL_CLKGATE,
> > +			    DSS_ROUTER_CLKGATE_DIS);
> > +	}
> > +
> > +	if (IS_DG2_GRAPHICS_STEP(gt->i915, G10, STEP_A0, STEP_B0))
> {
> > +		/* Wa_14010680813:dg2_g10 */
> > +		wa_write_or(wal, GEN12_GAMSTLB_CTRL,
> CONTROL_BLOCK_CLKGATE_DIS |
> > +			    EGRESS_BLOCK_CLKGATE_DIS |
> TAG_BLOCK_CLKGATE_DIS);
> > +
> > +		/* Wa_14010948348:dg2_g10 */
> > +		wa_write_or(wal, UNSLCGCTL9430,
> MSQDUNIT_CLKGATE_DIS);
> > +
> > +		/* Wa_14011037102:dg2_g10 */
> > +		wa_write_or(wal, UNSLCGCTL9444,
> LTCDD_CLKGATE_DIS);
> > +
> > +		/* Wa_14011371254:dg2_g10 */
> > +		wa_write_or(wal, SLICE_UNIT_LEVEL_CLKGATE,
> NODEDSS_CLKGATE_DIS);
> > +
> > +		/* Wa_14011431319:dg2_g10 */
> > +		wa_write_or(wal, UNSLCGCTL9440,
> GAMTLBOACS_CLKGATE_DIS |
> > +			    GAMTLBVDBOX7_CLKGATE_DIS
> |
> > +			    GAMTLBVDBOX6_CLKGATE_DIS
> |
> > +			    GAMTLBVDBOX5_CLKGATE_DIS
> |
> > +			    GAMTLBVDBOX4_CLKGATE_DIS
> |
> > +			    GAMTLBVDBOX3_CLKGATE_DIS
> |
> > +			    GAMTLBVDBOX2_CLKGATE_DIS
> |
> > +			    GAMTLBVDBOX1_CLKGATE_DIS
> |
> > +			    GAMTLBVDBOX0_CLKGATE_DIS
> |
> > +			    GAMTLBKCR_CLKGATE_DIS |
> > +			    GAMTLBGUC_CLKGATE_DIS |
> > +			    GAMTLBBLT_CLKGATE_DIS);
> > +		wa_write_or(wal, UNSLCGCTL9444,
> GAMTLBGFXA0_CLKGATE_DIS |
> > +			    GAMTLBGFXA1_CLKGATE_DIS |
> > +
> GAMTLBCOMPA0_CLKGATE_DIS |
> > +
> GAMTLBCOMPA1_CLKGATE_DIS |
> > +
> GAMTLBCOMPB0_CLKGATE_DIS |
> > +
> GAMTLBCOMPB1_CLKGATE_DIS |
> > +
> GAMTLBCOMPC0_CLKGATE_DIS |
> > +
> GAMTLBCOMPC1_CLKGATE_DIS |
> > +
> GAMTLBCOMPD0_CLKGATE_DIS |
> > +
> GAMTLBCOMPD1_CLKGATE_DIS |
> > +			    GAMTLBMERT_CLKGATE_DIS   |
> > +			    GAMTLBVEBOX3_CLKGATE_DIS
> |
> > +			    GAMTLBVEBOX2_CLKGATE_DIS
> |
> > +			    GAMTLBVEBOX1_CLKGATE_DIS
> |
> > +
> GAMTLBVEBOX0_CLKGATE_DIS);
> > +
> > +		/* Wa_14010569222:dg2_g10 */
> > +		wa_write_or(wal,
> UNSLICE_UNIT_LEVEL_CLKGATE,
> > +			    GAMEDIA_CLKGATE_DIS);
> > +
> > +		/* Wa_14011028019:dg2_g10 */
> > +		wa_write_or(wal, SSMCGCTL9530,
> RTFUNIT_CLKGATE_DIS);
> > +	}
> > +
> > +	if (IS_DG2_GRAPHICS_STEP(gt->i915, G10, STEP_A0, STEP_B0)
> ||
> > +	    IS_DG2_GRAPHICS_STEP(gt->i915, G11, STEP_A0, STEP_B0))
> {
> > +		/* Wa_14012362059:dg2 */
> > +		wa_write_or(wal, GEN12_MERT_MOD_CTRL,
> FORCE_MISS_FTLB);
> > +	}
> > +
> > +	/* Wa_1509235366:dg2 */
> > +	wa_write_or(wal, GEN12_GAMCNTRL_CTRL,
> INVALIDATION_BROADCAST_MODE_DIS |
> > +		    GLOBAL_INVALIDATION_MODE);
> > +
> > +	/* Wa_14014830051:dg2 */
> > +	wa_write_clr(wal, SARB_CHICKEN1, COMP_CKN_IN);
> > +}
> > +
> >  static void
> >  gt_init_workarounds(struct intel_gt *gt, struct i915_wa_list *wal)
> >  {
> >  	struct drm_i915_private *i915 = gt->i915;
> >
> > -	if (IS_XEHPSDV(i915))
> > +	if (IS_DG2(i915))
> > +		dg2_gt_workarounds_init(gt, wal);
> > +	else if (IS_XEHPSDV(i915))
> >  		xehpsdv_gt_workarounds_init(gt, wal);
> >  	else if (IS_DG1(i915))
> >  		dg1_gt_workarounds_init(gt, wal);
> > @@ -1739,6 +1882,34 @@ static void xehpsdv_whitelist_build(struct
> intel_engine_cs *engine)
> >  	allow_read_ctx_timestamp(engine);
> >  }
> >
> > +static void dg2_whitelist_build(struct intel_engine_cs *engine)
> > +{
> > +	struct i915_wa_list *w = &engine->whitelist;
> > +
> > +	allow_read_ctx_timestamp(engine);
> > +
> > +	switch (engine->class) {
> > +	case RENDER_CLASS:
> > +		/*
> > +		 * Wa_1507100340:dg2_g10
> > +		 *
> > +		 * This covers 4 registers which are next to one
> another :
> > +		 *   - PS_INVOCATION_COUNT
> > +		 *   - PS_INVOCATION_COUNT_UDW
> > +		 *   - PS_DEPTH_COUNT
> > +		 *   - PS_DEPTH_COUNT_UDW
> > +		 */
> > +		if (IS_DG2_GRAPHICS_STEP(engine->i915, G10,
> STEP_A0, STEP_B0))
> > +			whitelist_reg_ext(w,
> PS_INVOCATION_COUNT,
> > +
> RING_FORCE_TO_NONPRIV_ACCESS_RD |
> > +
> RING_FORCE_TO_NONPRIV_RANGE_4);
> > +
> > +		break;
> > +	default:
> > +		break;
> > +	}
> > +}
> > +
> >  void intel_engine_init_whitelist(struct intel_engine_cs *engine)
> >  {
> >  	struct drm_i915_private *i915 = engine->i915;
> > @@ -1746,7 +1917,9 @@ void intel_engine_init_whitelist(struct
> intel_engine_cs *engine)
> >
> >  	wa_init_start(w, "whitelist", engine->name);
> >
> > -	if (IS_XEHPSDV(i915))
> > +	if (IS_DG2(i915))
> > +		dg2_whitelist_build(engine);
> > +	else if (IS_XEHPSDV(i915))
> >  		xehpsdv_whitelist_build(engine);
> >  	else if (IS_DG1(i915))
> >  		dg1_whitelist_build(engine);
> > @@ -1826,6 +1999,105 @@ static void
> >  rcs_engine_wa_init(struct intel_engine_cs *engine, struct i915_wa_list
> *wal)
> >  {
> >  	struct drm_i915_private *i915 = engine->i915;
> > +	u64 dss_mask = intel_sseu_get_subslices(&engine->gt-
> >info.sseu, 0);
> 
> fi-snb-2600:
> 
> https://paste.debian.net/1219275
> 
> [    4.348876] intel_sseu_get_subslices:39 GEM_BUG_ON(slice >= sseu-
> >max_slices)
> 
> 
> 
> --
> Petri Latvala
> 
> 
> 
> > +
> > +	if (IS_DG2_GRAPHICS_STEP(engine->i915, G11, STEP_A0,
> STEP_B0)) {
> > +		/* Wa_14013392000:dg2_g11 */
> > +		wa_masked_en(wal, GEN7_ROW_CHICKEN2,
> GEN12_ENABLE_LARGE_GRF_MODE);
> > +
> > +		/* Wa_16011620976:dg2_g11 */
> > +		wa_write_or(wal, LSC_CHICKEN_BIT_0_UDW,
> DIS_CHAIN_2XSIMD8);
> > +	}
> > +
> > +	if (IS_DG2_GRAPHICS_STEP(engine->i915, G10, STEP_A0,
> STEP_B0) ||
> > +	    IS_DG2_GRAPHICS_STEP(engine->i915, G11, STEP_A0,
> STEP_B0)) {
> > +		/* Wa_14012419201:dg2 */
> > +		wa_masked_en(wal, GEN9_ROW_CHICKEN4,
> > +
> GEN12_DISABLE_HDR_PAST_PAYLOAD_HOLD_FIX);
> > +	}
> > +
> > +	if (IS_DG2_GRAPHICS_STEP(engine->i915, G10, STEP_B0,
> STEP_C0) ||
> > +	    IS_DG2_G11(engine->i915)) {
> > +		/*
> > +		 * Wa_22012826095:dg2
> > +		 * Wa_22013059131:dg2
> > +		 */
> > +		wa_write_clr_set(wal,
> LSC_CHICKEN_BIT_0_UDW,
> > +
> MAXREQS_PER_BANK,
> > +
> REG_FIELD_PREP(MAXREQS_PER_BANK, 2));
> > +
> > +		/* Wa_22013059131:dg2 */
> > +		wa_write_or(wal, LSC_CHICKEN_BIT_0,
> > +
> FORCE_1_SUB_MESSAGE_PER_FRAGMENT);
> > +	}
> > +
> > +	/* Wa_1308578152:dg2_g10 when first gslice is fused off */
> > +	if (IS_DG2_GRAPHICS_STEP(engine->i915, G10, STEP_B0,
> STEP_C0) &&
> > +	    (dss_mask & GENMASK(GEN_DSS_PER_GSLICE - 1, 0)) == 0)
> {
> > +		wa_masked_dis(wal,
> GEN12_CS_DEBUG_MODE1_CCCSUNIT_BE_COMMON,
> > +
> GEN12_REPLAY_MODE_GRANULARITY);
> > +	}
> > +
> > +	if (IS_DG2_GRAPHICS_STEP(engine->i915, G10, STEP_B0,
> STEP_FOREVER) ||
> > +	    IS_DG2_G11(engine->i915)) {
> > +		/* Wa_22013037850:dg2 */
> > +		wa_write_or(wal, LSC_CHICKEN_BIT_0_UDW,
> > +
> DISABLE_128B_EVICTION_COMMAND_UDW);
> > +
> > +		/* Wa_22012856258:dg2 */
> > +		wa_masked_en(wal, GEN7_ROW_CHICKEN2,
> > +
> GEN12_DISABLE_READ_SUPPRESSION);
> > +
> > +		/*
> > +		 * Wa_22010960976:dg2
> > +		 * Wa_14013347512:dg2
> > +		 */
> > +		wa_masked_dis(wal, GEN12_HDC_CHICKEN0,
> > +
> LSC_L1_FLUSH_CTL_3D_DATAPORT_FLUSH_EVENTS_MASK);
> > +	}
> > +
> > +	if (IS_DG2_GRAPHICS_STEP(engine->i915, G10, STEP_A0,
> STEP_B0)) {
> > +		/*
> > +		 * Wa_1608949956:dg2_g10
> > +		 * Wa_14010198302:dg2_g10
> > +		 */
> > +		wa_masked_en(wal, GEN8_ROW_CHICKEN,
> > +			     MDQ_ARBITRATION_MODE |
> UGM_BACKUP_MODE);
> > +
> > +		/*
> > +		 * Wa_14010918519:dg2_g10
> > +		 *
> > +		 * LSC_CHICKEN_BIT_0 always reads back as 0 is
> this stepping,
> > +		 * so ignoring verification.
> > +		 */
> > +		wa_add(wal, LSC_CHICKEN_BIT_0_UDW, 0,
> > +		       FORCE_SLM_FENCE_SCOPE_TO_TILE |
> FORCE_UGM_FENCE_SCOPE_TO_TILE,
> > +		       0, false);
> > +	}
> > +
> > +	if (IS_DG2_GRAPHICS_STEP(engine->i915, G10, STEP_A0,
> STEP_B0)) {
> > +		/* Wa_22010430635:dg2 */
> > +		wa_masked_en(wal,
> > +			     GEN9_ROW_CHICKEN4,
> > +			     GEN12_DISABLE_GRF_CLEAR);
> > +
> > +		/* Wa_14010648519:dg2 */
> > +		wa_write_or(wal, XEHP_L3NODEARBCFG,
> XEHP_LNESPARE);
> > +	}
> > +
> > +	if (IS_DG2_GRAPHICS_STEP(engine->i915, G10, STEP_A0,
> STEP_C0) ||
> > +	    IS_DG2_G11(engine->i915)) {
> > +		/* Wa_22012654132:dg2 */
> > +		wa_add(wal, GEN10_CACHE_MODE_SS, 0,
> > +
> _MASKED_BIT_ENABLE(ENABLE_PREFETCH_INTO_IC),
> > +		       0 /* write-only, so skip validation */,
> > +		       true);
> > +	}
> > +
> > +	/* Wa_14013202645:dg2 */
> > +	if (IS_DG2_GRAPHICS_STEP(engine->i915, G10, STEP_B0,
> STEP_C0) ||
> > +	    IS_DG2_GRAPHICS_STEP(engine->i915, G11, STEP_A0,
> STEP_B0))
> > +		wa_write_or(wal, RT_CTRL, DIS_NULL_QUERY);
> >
> >  	if (IS_DG1_GRAPHICS_STEP(i915, STEP_A0, STEP_B0) ||
> >  	    IS_TGL_UY_GRAPHICS_STEP(i915, STEP_A0, STEP_B0)) {
> > diff --git a/drivers/gpu/drm/i915/i915_reg.h
> b/drivers/gpu/drm/i915/i915_reg.h
> > index b806ad4bdeca..ee39d6bd0f3c 100644
> > --- a/drivers/gpu/drm/i915/i915_reg.h
> > +++ b/drivers/gpu/drm/i915/i915_reg.h
> > @@ -502,6 +502,11 @@ static inline bool i915_mmio_reg_valid(i915_reg_t
> reg)
> >  #define   INVALIDATION_BROADCAST_MODE_DIS	REG_BIT(12)
> >  #define   GLOBAL_INVALIDATION_MODE
> 	REG_BIT(2)
> >
> > +#define GEN12_GAMSTLB_CTRL		_MMIO(0xcf4c)
> > +#define   CONTROL_BLOCK_CLKGATE_DIS	REG_BIT(12)
> > +#define   EGRESS_BLOCK_CLKGATE_DIS	REG_BIT(11)
> > +#define   TAG_BLOCK_CLKGATE_DIS		REG_BIT(7)
> > +
> >  #define GEN12_MERT_MOD_CTRL		_MMIO(0xcf28)
> >  #define   FORCE_MISS_FTLB		REG_BIT(3)
> >
> > @@ -777,6 +782,9 @@ static inline bool i915_mmio_reg_valid(i915_reg_t
> reg)
> >  #define EU_PERF_CNTL5	    _MMIO(0xe55c)
> >  #define EU_PERF_CNTL6	    _MMIO(0xe65c)
> >
> > +#define RT_CTRL			_MMIO(0xe530)
> > +#define  DIS_NULL_QUERY		REG_BIT(10)
> > +
> >  /*
> >   * OA Boolean state
> >   */
> > @@ -2781,6 +2789,9 @@ static inline bool i915_mmio_reg_valid(i915_reg_t
> reg)
> >  #define VDBOX_CGCTL3F10(base)		_MMIO((base) +
> 0x3f10)
> >  #define   IECPUNIT_CLKGATE_DIS		REG_BIT(22)
> >
> > +#define VDBOX_CGCTL3F18(base)		_MMIO((base) +
> 0x3f18)
> > +#define   ALNUNIT_CLKGATE_DIS		REG_BIT(13)
> > +
> >  #define ERROR_GEN6	_MMIO(0x40a0)
> >  #define GEN7_ERR_INT	_MMIO(0x44040)
> >  #define   ERR_INT_POISON		(1 << 31)
> > @@ -3124,7 +3135,8 @@ static inline bool i915_mmio_reg_valid(i915_reg_t
> reg)
> >  #define GEN9_RCS_FE_FSM2 _MMIO(0x22a4)
> >
> >  #define GEN10_CACHE_MODE_SS
> 	_MMIO(0xe420)
> > -#define   FLOAT_BLEND_OPTIMIZATION_ENABLE	(1 << 4)
> > +#define   ENABLE_PREFETCH_INTO_IC		REG_BIT(3)
> > +#define   FLOAT_BLEND_OPTIMIZATION_ENABLE	REG_BIT(4)
> >
> >  /* Fuse readout registers for GT */
> >  #define HSW_PAVP_FUSE1
> 	_MMIO(0x911C)
> > @@ -4333,18 +4345,25 @@ enum {
> >  #define  SARBUNIT_CLKGATE_DIS		(1 << 5)
> >  #define  RCCUNIT_CLKGATE_DIS		(1 << 7)
> >  #define  MSCUNIT_CLKGATE_DIS		(1 << 10)
> > +#define  NODEDSS_CLKGATE_DIS		REG_BIT(12)
> >  #define  L3_CLKGATE_DIS			REG_BIT(16)
> >  #define  L3_CR2X_CLKGATE_DIS		REG_BIT(17)
> >
> >  #define SUBSLICE_UNIT_LEVEL_CLKGATE	_MMIO(0x9524)
> > -#define  GWUNIT_CLKGATE_DIS		(1 << 16)
> > +#define   DSS_ROUTER_CLKGATE_DIS	REG_BIT(28)
> > +#define   GWUNIT_CLKGATE_DIS		REG_BIT(16)
> >
> >  #define SUBSLICE_UNIT_LEVEL_CLKGATE2	_MMIO(0x9528)
> >  #define  CPSSUNIT_CLKGATE_DIS		REG_BIT(9)
> >
> > +#define SSMCGCTL9530			_MMIO(0x9530)
> > +#define   RTFUNIT_CLKGATE_DIS		REG_BIT(18)
> > +
> >  #define UNSLICE_UNIT_LEVEL_CLKGATE	_MMIO(0x9434)
> >  #define   VFUNIT_CLKGATE_DIS		REG_BIT(20)
> > -#define   TSGUNIT_CLKGATE_DIS		REG_BIT(17)
> > +#define   TSGUNIT_CLKGATE_DIS		REG_BIT(17) /*
> XEHPSDV */
> > +#define   CG3DDISCFEG_CLKGATE_DIS	REG_BIT(17) /* DG2 */
> > +#define   GAMEDIA_CLKGATE_DIS		REG_BIT(11)
> >  #define   HSUNIT_CLKGATE_DIS		REG_BIT(8)
> >  #define   VSUNIT_CLKGATE_DIS		REG_BIT(3)
> >
> > @@ -8404,6 +8423,9 @@ enum {
> >  #define GEN9_CTX_PREEMPT_REG		_MMIO(0x2248)
> >  #define   GEN12_DISABLE_POSH_BUSY_FF_DOP_CG REG_BIT(11)
> >
> > +#define GEN12_CS_DEBUG_MODE1_CCCSUNIT_BE_COMMON
> 	_MMIO(0x20EC)
> > +#define   GEN12_REPLAY_MODE_GRANULARITY
> 	REG_BIT(0)
> > +
> >  #define GEN8_CS_CHICKEN1		_MMIO(0x2580)
> >  #define GEN9_PREEMPT_3D_OBJECT_LEVEL		(1 <<
> 0)
> >  #define GEN9_PREEMPT_GPGPU_LEVEL(hi, lo)	(((hi) << 2) | ((lo)
> << 1))
> > @@ -8427,9 +8449,10 @@ enum {
> >    #define GEN8_ERRDETBCTRL (1 << 9)
> >
> >  #define GEN11_COMMON_SLICE_CHICKEN3
> 	_MMIO(0x7304)
> > -  #define DG1_FLOAT_POINT_BLEND_OPT_STRICT_MODE_EN
> 	REG_BIT(12)
> > -  #define GEN11_BLEND_EMB_FIX_DISABLE_IN_RCC
> 	REG_BIT(11)
> > -  #define GEN12_DISABLE_CPS_AWARE_COLOR_PIPE
> 	REG_BIT(9)
> > +#define   DG1_FLOAT_POINT_BLEND_OPT_STRICT_MODE_EN
> 	REG_BIT(12)
> > +#define   XEHP_DUAL_SIMD8_SEQ_MERGE_DISABLE
> 	REG_BIT(12)
> > +#define   GEN11_BLEND_EMB_FIX_DISABLE_IN_RCC
> 	REG_BIT(11)
> > +#define   GEN12_DISABLE_CPS_AWARE_COLOR_PIPE
> 	REG_BIT(9)
> >
> >  #define HIZ_CHICKEN
> 	_MMIO(0x7018)
> >  # define CHV_HZ_8X8_MODE_IN_1X
> 	REG_BIT(15)
> > @@ -8493,6 +8516,12 @@ enum {
> >  #define  HDC_FORCE_NON_COHERENT			(1 <<
> 4)
> >  #define  HDC_BARRIER_PERFORMANCE_DISABLE	(1 << 10)
> >
> > +#define GEN12_HDC_CHICKEN0
> 		_MMIO(0xE5F0)
> > +#define   LSC_L1_FLUSH_CTL_3D_DATAPORT_FLUSH_EVENTS_MASK
> 	REG_GENMASK(13, 11)
> > +
> > +#define SARB_CHICKEN1
> 	_MMIO(0xe90c)
> > +#define   COMP_CKN_IN
> 	REG_GENMASK(30, 29)
> > +
> >  #define GEN8_HDC_CHICKEN1
> 	_MMIO(0x7304)
> >
> >  /* GEN9 chicken */
> > @@ -8523,6 +8552,10 @@ enum {
> >  #define   PIXEL_ROUNDING_TRUNC_FB_PASSTHRU 	(1 << 15)
> >  #define   PER_PIXEL_ALPHA_BYPASS_EN		(1 <<
> 7)
> >
> > +#define VFLSKPD
> 	_MMIO(0x62a8)
> > +#define   DIS_OVER_FETCH_CACHE		REG_BIT(1)
> > +#define   DIS_MULT_MISS_RD_SQUASH	REG_BIT(0)
> > +
> >  #define FF_MODE2			_MMIO(0x6604)
> >  #define   FF_MODE2_GS_TIMER_MASK	REG_GENMASK(31, 24)
> >  #define   FF_MODE2_GS_TIMER_224
> 	REG_FIELD_PREP(FF_MODE2_GS_TIMER_MASK, 224)
> > @@ -9346,6 +9379,9 @@ enum {
> >  #define   GEN8_SDEUNIT_CLOCK_GATE_DISABLE	(1 << 14)
> >  #define   GEN8_HDCUNIT_CLOCK_GATE_DISABLE_HDCREQ (1 << 28)
> >
> > +#define UNSLCGCTL9430
> 	_MMIO(0x9430)
> > +#define   MSQDUNIT_CLKGATE_DIS
> 	REG_BIT(3)
> > +
> >  #define GEN6_GFXPAUSE
> 	_MMIO(0xA000)
> >  #define GEN6_RPNSWREQ
> 	_MMIO(0xA008)
> >  #define   GEN6_TURBO_DISABLE			(1 <<
> 31)
> > @@ -9661,24 +9697,39 @@ enum {
> >  #define   GEN9_CCS_TLB_PREFETCH_ENABLE	(1 << 3)
> >
> >  #define GEN8_ROW_CHICKEN		_MMIO(0xe4f0)
> > -#define   FLOW_CONTROL_ENABLE		(1 << 15)
> > -#define   PARTIAL_INSTRUCTION_SHOOTDOWN_DISABLE	(1 <<
> 8)
> > -#define   STALL_DOP_GATING_DISABLE		(1 << 5)
> > -#define   THROTTLE_12_5				(7 <<
> 2)
> > -#define   DISABLE_EARLY_EOT			(1 <<
> 1)
> > +#define   FLOW_CONTROL_ENABLE
> 	REG_BIT(15)
> > +#define   UGM_BACKUP_MODE
> 	REG_BIT(13)
> > +#define   MDQ_ARBITRATION_MODE
> 	REG_BIT(12)
> > +#define   PARTIAL_INSTRUCTION_SHOOTDOWN_DISABLE
> 	REG_BIT(8)
> > +#define   STALL_DOP_GATING_DISABLE
> 	REG_BIT(5)
> > +#define   THROTTLE_12_5
> 	REG_GENMASK(4, 2)
> > +#define   DISABLE_EARLY_EOT
> 	REG_BIT(1)
> >
> >  #define GEN7_ROW_CHICKEN2
> 	_MMIO(0xe4f4)
> > +#define   GEN12_DISABLE_READ_SUPPRESSION	REG_BIT(15)
> >  #define   GEN12_DISABLE_EARLY_READ		REG_BIT(14)
> > +#define   GEN12_ENABLE_LARGE_GRF_MODE
> 	REG_BIT(12)
> >  #define   GEN12_PUSH_CONST_DEREF_HOLD_DIS	REG_BIT(8)
> >
> > +#define LSC_CHICKEN_BIT_0
> 	_MMIO(0xe7c8)
> > +#define   FORCE_1_SUB_MESSAGE_PER_FRAGMENT	REG_BIT(15)
> > +#define LSC_CHICKEN_BIT_0_UDW
> 	_MMIO(0xe7c8 + 4)
> > +#define   DIS_CHAIN_2XSIMD8
> 	REG_BIT(55 - 32)
> > +#define   FORCE_SLM_FENCE_SCOPE_TO_TILE
> 	REG_BIT(42 - 32)
> > +#define   FORCE_UGM_FENCE_SCOPE_TO_TILE
> 	REG_BIT(41 - 32)
> > +#define   MAXREQS_PER_BANK
> 	REG_GENMASK(39 - 32, 37 - 32)
> > +#define   DISABLE_128B_EVICTION_COMMAND_UDW
> 	REG_BIT(36 - 32)
> > +
> >  #define GEN7_ROW_CHICKEN2_GT2		_MMIO(0xf4f4)
> >  #define   DOP_CLOCK_GATING_DISABLE	(1 << 0)
> >  #define   PUSH_CONSTANT_DEREF_DISABLE	(1 << 8)
> >  #define   GEN11_TDL_CLOCK_GATING_FIX_DISABLE	(1 << 1)
> >
> > -#define GEN9_ROW_CHICKEN4		_MMIO(0xe48c)
> > -#define   GEN12_DISABLE_TDL_PUSH	REG_BIT(9)
> > -#define   GEN11_DIS_PICK_2ND_EU		REG_BIT(7)
> > +#define GEN9_ROW_CHICKEN4
> 	_MMIO(0xe48c)
> > +#define   GEN12_DISABLE_GRF_CLEAR
> 	REG_BIT(13)
> > +#define   GEN12_DISABLE_TDL_PUSH
> 	REG_BIT(9)
> > +#define   GEN11_DIS_PICK_2ND_EU
> 	REG_BIT(7)
> > +#define   GEN12_DISABLE_HDR_PAST_PAYLOAD_HOLD_FIX
> 	REG_BIT(4)
> >
> >  #define HSW_ROW_CHICKEN3		_MMIO(0xe49c)
> >  #define  HSW_ROW_CHICKEN3_L3_GLOBAL_ATOMICS_DISABLE    (1 << 6)
> > @@ -9693,9 +9744,10 @@ enum {
> >  #define   GEN8_SAMPLER_POWER_BYPASS_DIS	(1 << 1)
> >
> >  #define GEN9_HALF_SLICE_CHICKEN7	_MMIO(0xe194)
> > -#define   GEN9_SAMPLER_HASH_COMPRESSED_READ_ADDR	(1 <<
> 8)
> > -#define   GEN9_ENABLE_YV12_BUGFIX	(1 << 4)
> > -#define   GEN9_ENABLE_GPGPU_PREEMPTION	(1 << 2)
> > +#define   DG2_DISABLE_ROUND_ENABLE_ALLOW_FOR_SSLA
> 	REG_BIT(15)
> > +#define   GEN9_SAMPLER_HASH_COMPRESSED_READ_ADDR
> 	REG_BIT(8)
> > +#define   GEN9_ENABLE_YV12_BUGFIX
> 	REG_BIT(4)
> > +#define   GEN9_ENABLE_GPGPU_PREEMPTION
> 	REG_BIT(2)
> >
> >  /* Audio */
> >  #define G4X_AUD_VID_DID
> 	_MMIO(DISPLAY_MMIO_BASE(dev_priv) + 0x62020)
> > @@ -12519,12 +12571,17 @@ enum skl_power_gate {
> >  #define   PMFLUSH_GAPL3UNBLOCK		(1 << 21)
> >  #define   PMFLUSHDONE_LNEBLK		(1 << 22)
> >
> > +#define XEHP_L3NODEARBCFG		_MMIO(0xb0b4)
> > +#define   XEHP_LNESPARE
> 	REG_BIT(19)
> > +
> >  #define GEN12_GLOBAL_MOCS(i)	_MMIO(0x4000 + (i) * 4) /* Global
> MOCS regs */
> >
> >  #define GEN12_GSMBASE
> 	_MMIO(0x108100)
> >  #define GEN12_DSMBASE
> 	_MMIO(0x1080C0)
> >
> >  #define XEHP_CLOCK_GATE_DIS		_MMIO(0x101014)
> > +#define   SGSI_SIDECLK_DIS		REG_BIT(17)
> > +#define   SGGI_DIS			REG_BIT(15)
> >  #define   SGR_DIS			REG_BIT(13)
> >
> >  /* gamt regs */
> > @@ -12903,4 +12960,7 @@ enum skl_power_gate {
> >  #define CLKGATE_DIS_MISC
> 	_MMIO(0x46534)
> >  #define  CLKGATE_DIS_MISC_DMASC_GATING_DIS	REG_BIT(21)
> >
> > +#define SLICE_COMMON_ECO_CHICKEN1
> 	_MMIO(0x731C)
> > +#define   MSC_MSAA_REODER_BUF_BYPASS_DISABLE
> 	REG_BIT(14)
> > +
> >  #endif /* _I915_REG_H_ */
> > diff --git a/drivers/gpu/drm/i915/intel_pm.c
> b/drivers/gpu/drm/i915/intel_pm.c
> > index 16fa3306d83d..a1d9a6ac3e49 100644
> > --- a/drivers/gpu/drm/i915/intel_pm.c
> > +++ b/drivers/gpu/drm/i915/intel_pm.c
> > @@ -7486,6 +7486,22 @@ static void xehpsdv_init_clock_gating(struct
> drm_i915_private *dev_priv)
> >  		intel_uncore_rmw(&dev_priv->uncore,
> XEHP_CLOCK_GATE_DIS, 0, SGR_DIS);
> >  }
> >
> > +static void dg2_init_clock_gating(struct drm_i915_private *i915)
> > +{
> > +	/* Wa_22010954014:dg2_g10 */
> > +	if (IS_DG2_G10(i915))
> > +		intel_uncore_rmw(&i915->uncore,
> XEHP_CLOCK_GATE_DIS, 0,
> > +
> SGSI_SIDECLK_DIS);
> > +
> > +	/*
> > +	 * Wa_14010733611:dg2_g10
> > +	 * Wa_22010146351:dg2_g10
> > +	 */
> > +	if (IS_DG2_GRAPHICS_STEP(i915, G10, STEP_A0, STEP_B0))
> > +		intel_uncore_rmw(&i915->uncore,
> XEHP_CLOCK_GATE_DIS, 0,
> > +				 SGR_DIS |
> SGGI_DIS);
> > +}
> > +
> >  static void cnp_init_clock_gating(struct drm_i915_private *dev_priv)
> >  {
> >  	if (!HAS_PCH_CNP(dev_priv))
> > @@ -7896,6 +7912,7 @@ static const struct drm_i915_clock_gating_funcs
> platform##_clock_gating_funcs =
> >  	.init_clock_gating = platform##_init_clock_gating,
> 	\
> >  }
> >
> > +CG_FUNCS(dg2);
> >  CG_FUNCS(xehpsdv);
> >  CG_FUNCS(adlp);
> >  CG_FUNCS(dg1);
> > @@ -7933,7 +7950,9 @@ CG_FUNCS(nop);
> >   */
> >  void intel_init_clock_gating_hooks(struct drm_i915_private *dev_priv)
> >  {
> > -	if (IS_XEHPSDV(dev_priv))
> > +	if (IS_DG2(dev_priv))
> > +		dev_priv->clock_gating_funcs =
> &dg2_clock_gating_funcs;
> > +	else if (IS_XEHPSDV(dev_priv))
> >  		dev_priv->clock_gating_funcs =
> &xehpsdv_clock_gating_funcs;
> >  	else if (IS_ALDERLAKE_P(dev_priv))
> >  		dev_priv->clock_gating_funcs =
> &adlp_clock_gating_funcs;
> > --
> > 2.33.0
> >




[Index of Archives]     [Linux DRI Users]     [Linux Intel Graphics]     [Linux USB Devel]     [Video for Linux]     [Linux Audio Users]     [Yosemite News]     [Linux Kernel]     [Linux SCSI]     [XFree86]     [Linux USB Devel]     [Video for Linux]     [Linux Audio Users]     [Linux Kernel]     [Linux SCSI]     [XFree86]
  Powered by Linux