Thanks, Oak > -----Original Message----- > From: Roper, Matthew D <matthew.d.roper@xxxxxxxxx> > Sent: August 24, 2023 11:52 AM > To: Zeng, Oak <oak.zeng@xxxxxxxxx> > Cc: intel-gfx@xxxxxxxxxxxxxxxxxxxxx; Shyti, Andi <andi.shyti@xxxxxxxxx>; > chris.p.wilson@xxxxxxxxxxxxxxx; Das, Nirmoy <nirmoy.das@xxxxxxxxx> > Subject: Re: [PATCH 1/3] drm/i915: Create a blitter context for GGTT > updates > > On Tue, Aug 22, 2023 at 11:28:57AM -0400, Oak Zeng wrote: > > From: Nirmoy Das <nirmoy.das@xxxxxxxxx> > > > > Create a separate blitter context if a platform requires > > GGTT updates using MI_UPDATE_GTT blitter command. > > > > Subsequent patch will introduce methods to update > > GGTT using this blitter context and MI_UPDATE_GTT blitter > > command. > > > > v2: Fix a typo in comment. (Oak) > > > > Signed-off-by: Nirmoy Das <nirmoy.das@xxxxxxxxx> > > Signed-off-by: Oak Zeng <oak.zeng@xxxxxxxxx> > > --- > > drivers/gpu/drm/i915/gt/intel_engine.h | 4 ++ > > drivers/gpu/drm/i915/gt/intel_engine_cs.c | 44 +++++++++++++++++++- > > drivers/gpu/drm/i915/gt/intel_engine_types.h | 3 ++ > > drivers/gpu/drm/i915/gt/intel_gtt.c | 4 ++ > > drivers/gpu/drm/i915/gt/intel_gtt.h | 2 + > > 5 files changed, 56 insertions(+), 1 deletion(-) > > > > diff --git a/drivers/gpu/drm/i915/gt/intel_engine.h > b/drivers/gpu/drm/i915/gt/intel_engine.h > > index b58c30ac8ef0..ee36db2fdaa7 100644 > > --- a/drivers/gpu/drm/i915/gt/intel_engine.h > > +++ b/drivers/gpu/drm/i915/gt/intel_engine.h > > @@ -170,6 +170,8 @@ intel_write_status_page(struct intel_engine_cs *engine, > int reg, u32 value) > > #define I915_GEM_HWS_SEQNO 0x40 > > #define I915_GEM_HWS_SEQNO_ADDR (I915_GEM_HWS_SEQNO > * sizeof(u32)) > > #define I915_GEM_HWS_MIGRATE (0x42 * sizeof(u32)) > > +#define I915_GEM_HWS_GGTT_BLIT 0x46 > > +#define I915_GEM_HWS_GGTT_BLIT_ADDR > (I915_GEM_HWS_GGTT_BLIT * sizeof(u32)) > > #define I915_GEM_HWS_PXP 0x60 > > #define I915_GEM_HWS_PXP_ADDR (I915_GEM_HWS_PXP * > sizeof(u32)) > > #define I915_GEM_HWS_GSC 0x62 > > @@ -356,4 +358,6 @@ u64 intel_clamp_preempt_timeout_ms(struct > intel_engine_cs *engine, u64 value); > > u64 intel_clamp_stop_timeout_ms(struct intel_engine_cs *engine, u64 value); > > u64 intel_clamp_timeslice_duration_ms(struct intel_engine_cs *engine, u64 > value); > > > > +void intel_engine_blitter_context_set_ready(struct intel_gt *gt, bool ready); > > +bool intel_engine_blitter_context_ready(struct intel_gt *gt); > > #endif /* _INTEL_RINGBUFFER_H_ */ > > diff --git a/drivers/gpu/drm/i915/gt/intel_engine_cs.c > b/drivers/gpu/drm/i915/gt/intel_engine_cs.c > > index dfb69fc977a0..d8c492a507a4 100644 > > --- a/drivers/gpu/drm/i915/gt/intel_engine_cs.c > > +++ b/drivers/gpu/drm/i915/gt/intel_engine_cs.c > > @@ -27,6 +27,7 @@ > > #include "intel_gt_mcr.h" > > #include "intel_gt_pm.h" > > #include "intel_gt_requests.h" > > +#include "intel_gtt.h" > > #include "intel_lrc.h" > > #include "intel_lrc_reg.h" > > #include "intel_reset.h" > > @@ -1419,6 +1420,34 @@ void intel_engine_destroy_pinned_context(struct > intel_context *ce) > > intel_context_put(ce); > > } > > > > +void intel_engine_blitter_context_set_ready(struct intel_gt *gt, bool ready) > > +{ > > + struct intel_engine_cs *engine = gt->engine[BCS0]; > > + > > + if (engine && engine->blitter_context) > > + atomic_set(&engine->blitter_context_ready, ready ? 1 : 0); > > +} > > + > > +bool intel_engine_blitter_context_ready(struct intel_gt *gt) > > +{ > > + struct intel_engine_cs *engine = gt->engine[BCS0]; > > + > > + if (engine) > > + return atomic_read(&engine->blitter_context_ready) == 1; > > + > > + return false; > > +} > > + > > +static struct intel_context * > > +create_ggtt_blitter_context(struct intel_engine_cs *engine) > > +{ > > + static struct lock_class_key kernel; > > + > > + /* MI_UPDATE_GTT can insert up to 512 PTE entries so get a bigger ring > */ > > + return intel_engine_create_pinned_context(engine, engine->gt->vm, > SZ_512K, > > + > I915_GEM_HWS_GGTT_BLIT_ADDR, > > + &kernel, "ggtt_blitter_context"); > > +} > > static struct intel_context * > > create_kernel_context(struct intel_engine_cs *engine) > > { > > @@ -1442,7 +1471,7 @@ create_kernel_context(struct intel_engine_cs > *engine) > > */ > > static int engine_init_common(struct intel_engine_cs *engine) > > { > > - struct intel_context *ce; > > + struct intel_context *ce, *bce = NULL; > > int ret; > > > > engine->set_default_submission(engine); > > @@ -1458,6 +1487,15 @@ static int engine_init_common(struct > intel_engine_cs *engine) > > ce = create_kernel_context(engine); > > if (IS_ERR(ce)) > > return PTR_ERR(ce); > > + /* > > + * Create a separate pinned context for GGTT update using blitter > > + * if a platform require such service. > > + */ > > + if (i915_ggtt_require_blitter(engine->i915) && engine->id == BCS0) { > > + bce = create_ggtt_blitter_context(engine); > > + if (IS_ERR(bce)) > > + return PTR_ERR(bce); > > + } > > > > ret = measure_breadcrumb_dw(ce); > > if (ret < 0) > > @@ -1465,6 +1503,7 @@ static int engine_init_common(struct intel_engine_cs > *engine) > > > > engine->emit_fini_breadcrumb_dw = ret; > > engine->kernel_context = ce; > > + engine->blitter_context = bce; > > > > return 0; > > > > @@ -1537,6 +1576,9 @@ void intel_engine_cleanup_common(struct > intel_engine_cs *engine) > > > > if (engine->kernel_context) > > intel_engine_destroy_pinned_context(engine->kernel_context); > > + if (engine->blitter_context) > > + intel_engine_destroy_pinned_context(engine->blitter_context); > > + > > > > GEM_BUG_ON(!llist_empty(&engine->barrier_tasks)); > > cleanup_status_page(engine); > > diff --git a/drivers/gpu/drm/i915/gt/intel_engine_types.h > b/drivers/gpu/drm/i915/gt/intel_engine_types.h > > index e99a6fa03d45..62095c0d8783 100644 > > --- a/drivers/gpu/drm/i915/gt/intel_engine_types.h > > +++ b/drivers/gpu/drm/i915/gt/intel_engine_types.h > > @@ -415,6 +415,9 @@ struct intel_engine_cs { > > struct llist_head barrier_tasks; > > > > struct intel_context *kernel_context; /* pinned */ > > + struct intel_context *blitter_context; /* pinned, only for BCS0 */ > > + /* mark the blitter engine's availability status */ > > + atomic_t blitter_context_ready; > > > > /** > > * pinned_contexts_list: List of pinned contexts. This list is only > > diff --git a/drivers/gpu/drm/i915/gt/intel_gtt.c > b/drivers/gpu/drm/i915/gt/intel_gtt.c > > index 13944a14ea2d..9c77c97670fe 100644 > > --- a/drivers/gpu/drm/i915/gt/intel_gtt.c > > +++ b/drivers/gpu/drm/i915/gt/intel_gtt.c > > @@ -21,6 +21,10 @@ > > #include "intel_gt_regs.h" > > #include "intel_gtt.h" > > > > +bool i915_ggtt_require_blitter(struct drm_i915_private *i915) > > +{ > > + return IS_METEORLAKE(i915); > > Drive-by comment: this workaround is tied to the Xe_LPM+ media IP, not > to the MTL platform. Other platforms that re-use Xe_LPM+ IP will also > be affected, whereas MTL platforms that lack media, or integrate a > different media chiplet will not be affected. So the condition here > should be: > > /* Wa_13010847436 */ > return MEDIA_VER_FULL(i915) == IP_VER(13, 0); Issue was observed on LNL A0 (fixed in A1), MTL. Not sure whether it is fixed on ARL or not. For LNL A0, there might be a different wa so this software wa is not needed. Double confirming. For now let's only enable MTL. > > But does this even belong in this patch? It sounds like patch #3 of the > series is where you intended to hook up this programming to the specific > workaround. This function is called from patch 2. So will keep it to patch 1. Oak > > > Matt > > > +} > > > > static bool intel_ggtt_update_needs_vtd_wa(struct drm_i915_private *i915) > > { > > diff --git a/drivers/gpu/drm/i915/gt/intel_gtt.h > b/drivers/gpu/drm/i915/gt/intel_gtt.h > > index 4d6296cdbcfd..9710eb031fb2 100644 > > --- a/drivers/gpu/drm/i915/gt/intel_gtt.h > > +++ b/drivers/gpu/drm/i915/gt/intel_gtt.h > > @@ -688,4 +688,6 @@ static inline struct sgt_dma { > > return (struct sgt_dma){ sg, addr, addr + sg_dma_len(sg) }; > > } > > > > +bool i915_ggtt_require_blitter(struct drm_i915_private *i915); > > + > > #endif > > -- > > 2.26.3 > > > > -- > Matt Roper > Graphics Software Engineer > Linux GPU Platform Enablement > Intel Corporation