On 18.11.2022 02:58, John.C.Harrison@xxxxxxxxx wrote: > From: John Harrison <John.C.Harrison@xxxxxxxxx> > > When trying to analyse bug reports from CI, customers, etc. it can be > difficult to work out exactly what is happening on which GT in a > multi-GT system. So add GT oriented debug/error message wrappers. If > used instead of the drm_ equivalents, you get the same output but with > a GT# prefix on it. > > v2: Go back to using lower case names (combined review feedback). > Convert intel_gt.c as a first step. > > Signed-off-by: John Harrison <John.C.Harrison@xxxxxxxxx> > --- > drivers/gpu/drm/i915/gt/intel_gt.c | 96 ++++++++++++++---------------- > drivers/gpu/drm/i915/gt/intel_gt.h | 35 +++++++++++ > 2 files changed, 81 insertions(+), 50 deletions(-) > > diff --git a/drivers/gpu/drm/i915/gt/intel_gt.c b/drivers/gpu/drm/i915/gt/intel_gt.c > index 0325f071046ca..349fcfdd14a6d 100644 > --- a/drivers/gpu/drm/i915/gt/intel_gt.c > +++ b/drivers/gpu/drm/i915/gt/intel_gt.c > @@ -90,9 +90,8 @@ static int intel_gt_probe_lmem(struct intel_gt *gt) > if (err == -ENODEV) > return 0; > > - drm_err(&i915->drm, > - "Failed to setup region(%d) type=%d\n", > - err, INTEL_MEMORY_LOCAL); > + gt_err(gt, "Failed to setup region(%d) type=%d\n", > + err, INTEL_MEMORY_LOCAL); > return err; > } > > @@ -192,14 +191,14 @@ int intel_gt_init_hw(struct intel_gt *gt) > > ret = i915_ppgtt_init_hw(gt); > if (ret) { > - drm_err(&i915->drm, "Enabling PPGTT failed (%d)\n", ret); > + gt_err(gt, "Enabling PPGTT failed (%d)\n", ret); > goto out; > } > > /* We can't enable contexts until all firmware is loaded */ > ret = intel_uc_init_hw(>->uc); > if (ret) { > - i915_probe_error(i915, "Enabling uc failed (%d)\n", ret); > + gt_probe_error(gt, "Enabling uc failed (%d)\n", ret); > goto out; > } > > @@ -264,7 +263,7 @@ intel_gt_clear_error_registers(struct intel_gt *gt, > * some errors might have become stuck, > * mask them. > */ > - drm_dbg(>->i915->drm, "EIR stuck: 0x%08x, masking\n", eir); > + gt_dbg(gt, "EIR stuck: 0x%08x, masking\n", eir); > rmw_set(uncore, EMR, eir); > intel_uncore_write(uncore, GEN2_IIR, > I915_MASTER_ERROR_INTERRUPT); > @@ -298,16 +297,16 @@ static void gen6_check_faults(struct intel_gt *gt) > for_each_engine(engine, gt, id) { > fault = GEN6_RING_FAULT_REG_READ(engine); > if (fault & RING_FAULT_VALID) { > - drm_dbg(&engine->i915->drm, "Unexpected fault\n" > - "\tAddr: 0x%08lx\n" > - "\tAddress space: %s\n" > - "\tSource ID: %d\n" > - "\tType: %d\n", > - fault & PAGE_MASK, > - fault & RING_FAULT_GTTSEL_MASK ? > - "GGTT" : "PPGTT", > - RING_FAULT_SRCID(fault), > - RING_FAULT_FAULT_TYPE(fault)); > + gt_dbg(gt, "Unexpected fault\n" > + "\tAddr: 0x%08lx\n" > + "\tAddress space: %s\n" > + "\tSource ID: %d\n" > + "\tType: %d\n", > + fault & PAGE_MASK, > + fault & RING_FAULT_GTTSEL_MASK ? > + "GGTT" : "PPGTT", > + RING_FAULT_SRCID(fault), > + RING_FAULT_FAULT_TYPE(fault)); > } > } > } > @@ -334,17 +333,17 @@ static void xehp_check_faults(struct intel_gt *gt) > fault_addr = ((u64)(fault_data1 & FAULT_VA_HIGH_BITS) << 44) | > ((u64)fault_data0 << 12); > > - drm_dbg(>->i915->drm, "Unexpected fault\n" > - "\tAddr: 0x%08x_%08x\n" > - "\tAddress space: %s\n" > - "\tEngine ID: %d\n" > - "\tSource ID: %d\n" > - "\tType: %d\n", > - upper_32_bits(fault_addr), lower_32_bits(fault_addr), > - fault_data1 & FAULT_GTT_SEL ? "GGTT" : "PPGTT", > - GEN8_RING_FAULT_ENGINE_ID(fault), > - RING_FAULT_SRCID(fault), > - RING_FAULT_FAULT_TYPE(fault)); > + gt_dbg(gt, "Unexpected fault\n" > + "\tAddr: 0x%08x_%08x\n" > + "\tAddress space: %s\n" > + "\tEngine ID: %d\n" > + "\tSource ID: %d\n" > + "\tType: %d\n", > + upper_32_bits(fault_addr), lower_32_bits(fault_addr), > + fault_data1 & FAULT_GTT_SEL ? "GGTT" : "PPGTT", > + GEN8_RING_FAULT_ENGINE_ID(fault), > + RING_FAULT_SRCID(fault), > + RING_FAULT_FAULT_TYPE(fault)); > } > } > > @@ -375,17 +374,17 @@ static void gen8_check_faults(struct intel_gt *gt) > fault_addr = ((u64)(fault_data1 & FAULT_VA_HIGH_BITS) << 44) | > ((u64)fault_data0 << 12); > > - drm_dbg(&uncore->i915->drm, "Unexpected fault\n" > - "\tAddr: 0x%08x_%08x\n" > - "\tAddress space: %s\n" > - "\tEngine ID: %d\n" > - "\tSource ID: %d\n" > - "\tType: %d\n", > - upper_32_bits(fault_addr), lower_32_bits(fault_addr), > - fault_data1 & FAULT_GTT_SEL ? "GGTT" : "PPGTT", > - GEN8_RING_FAULT_ENGINE_ID(fault), > - RING_FAULT_SRCID(fault), > - RING_FAULT_FAULT_TYPE(fault)); > + gt_dbg(gt, "Unexpected fault\n" > + "\tAddr: 0x%08x_%08x\n" > + "\tAddress space: %s\n" > + "\tEngine ID: %d\n" > + "\tSource ID: %d\n" > + "\tType: %d\n", > + upper_32_bits(fault_addr), lower_32_bits(fault_addr), > + fault_data1 & FAULT_GTT_SEL ? "GGTT" : "PPGTT", > + GEN8_RING_FAULT_ENGINE_ID(fault), > + RING_FAULT_SRCID(fault), > + RING_FAULT_FAULT_TYPE(fault)); > } > } > > @@ -479,7 +478,7 @@ static int intel_gt_init_scratch(struct intel_gt *gt, unsigned int size) > if (IS_ERR(obj)) > obj = i915_gem_object_create_internal(i915, size); > if (IS_ERR(obj)) { > - drm_err(&i915->drm, "Failed to allocate scratch page\n"); > + gt_err(gt, "Failed to allocate scratch page\n"); > return PTR_ERR(obj); > } > > @@ -729,8 +728,7 @@ int intel_gt_init(struct intel_gt *gt) > > err = intel_gt_init_hwconfig(gt); > if (err) > - drm_err(>->i915->drm, "Failed to retrieve hwconfig table: %pe\n", > - ERR_PTR(err)); > + gt_err(gt, "Failed to retrieve hwconfig table: %pe\n", ERR_PTR(err)); > > err = __engines_record_defaults(gt); > if (err) > @@ -891,7 +889,7 @@ int intel_gt_probe_all(struct drm_i915_private *i915) > gt->name = "Primary GT"; > gt->info.engine_mask = RUNTIME_INFO(i915)->platform_engine_mask; > > - drm_dbg(&i915->drm, "Setting up %s\n", gt->name); > + gt_dbg(gt, "Setting up %s\n", gt->name); > ret = intel_gt_tile_setup(gt, phys_addr); > if (ret) > return ret; > @@ -916,7 +914,7 @@ int intel_gt_probe_all(struct drm_i915_private *i915) > gt->info.engine_mask = gtdef->engine_mask; > gt->info.id = i; > > - drm_dbg(&i915->drm, "Setting up %s\n", gt->name); > + gt_dbg(gt, "Setting up %s\n", gt->name); > if (GEM_WARN_ON(range_overflows_t(resource_size_t, > gtdef->mapping_base, > SZ_16M, > @@ -951,7 +949,7 @@ int intel_gt_probe_all(struct drm_i915_private *i915) > return 0; > > err: > - i915_probe_error(i915, "Failed to initialize %s! (%d)\n", gtdef->name, ret); > + gt_probe_error(gt, "Failed to initialize %s! (%d)\n", gtdef->name, ret); on -ENOMEM error, this gt will be NULL so likely we should stay with i915 variant > intel_gt_release_all(i915); > > return ret; > @@ -1004,8 +1002,7 @@ get_reg_and_bit(const struct intel_engine_cs *engine, const bool gen8, > const unsigned int class = engine->class; > struct reg_and_bit rb = { }; > > - if (drm_WARN_ON_ONCE(&engine->i915->drm, > - class >= num || !regs[class].reg)) > + if (gt_WARN_ON_ONCE(engine->gt, class >= num || !regs[class].reg)) > return rb; > > rb.reg = regs[class]; > @@ -1088,8 +1085,7 @@ static void mmio_invalidate_full(struct intel_gt *gt) > return; > } > > - if (drm_WARN_ONCE(&i915->drm, !num, > - "Platform does not implement TLB invalidation!")) > + if (gt_WARN_ONCE(gt, !num, "Platform does not implement TLB invalidation!")) > return; > > intel_uncore_forcewake_get(uncore, FORCEWAKE_ALL); > @@ -1142,8 +1138,8 @@ static void mmio_invalidate_full(struct intel_gt *gt) > > if (wait_for_invalidate(gt, rb)) > drm_err_ratelimited(>->i915->drm, > - "%s TLB invalidation did not complete in %ums!\n", > - engine->name, TLB_INVAL_TIMEOUT_MS); > + "GT%d: %s TLB invalidation did not complete in %ums!\n", > + gt->info.id, engine->name, TLB_INVAL_TIMEOUT_MS); that's inconsistent, we should use gt_err_ratelimited() > } > > /* > diff --git a/drivers/gpu/drm/i915/gt/intel_gt.h b/drivers/gpu/drm/i915/gt/intel_gt.h > index e0365d5562484..5bf2d53f4b4d0 100644 > --- a/drivers/gpu/drm/i915/gt/intel_gt.h > +++ b/drivers/gpu/drm/i915/gt/intel_gt.h > @@ -13,6 +13,41 @@ > struct drm_i915_private; > struct drm_printer; > > +#define gt_err(_gt, _fmt, ...) \ > + drm_err(&(_gt)->i915->drm, "GT%u: " _fmt, (_gt)->info.id, ##__VA_ARGS__) > + > +#define gt_warn(_gt, _fmt, ...) \ > + drm_warn(&(_gt)->i915->drm, "GT%u: " _fmt, (_gt)->info.id, ##__VA_ARGS__) > + > +#define gt_notice(_gt, _fmt, ...) \ > + drm_notice(&(_gt)->i915->drm, "GT%u: " _fmt, (_gt)->info.id, ##__VA_ARGS__) > + > +#define gt_info(_gt, _fmt, ...) \ > + drm_info(&(_gt)->i915->drm, "GT%u: " _fmt, (_gt)->info.id, ##__VA_ARGS__) > + > +#define gt_dbg(_gt, _fmt, ...) \ > + drm_dbg(&(_gt)->i915->drm, "GT%u: " _fmt, (_gt)->info.id, ##__VA_ARGS__) > + > +#define gt_probe_error(_gt, _fmt, ...) \ > + do { \ > + if (i915_error_injected()) \ > + gt_dbg(_gt, _fmt, ##__VA_ARGS__); \ > + else \ > + gt_err(_gt, _fmt, ##__VA_ARGS__); \ > + } while (0) > + > +#define gt_WARN_ON(_gt, _condition) \ > + gt_WARN(_gt, _condition, "%s", "gt_WARN_ON(" __stringify(_condition) ")") > + > +#define gt_WARN_ON_ONCE(_gt, _condition) \ > + gt_WARN_ONCE(_gt, _condition, "%s", "gt_WARN_ONCE(" __stringify(_condition) ")") > + > +#define gt_WARN(_gt, _condition, _fmt, ...) \ > + drm_WARN(&(_gt)->i915->drm, _condition, "GT%u: " _fmt, (_gt)->info.id, ##__VA_ARGS__) > + > +#define gt_WARN_ONCE(_gt, _condition, _fmt, ...) \ > + drm_WARN_ONCE(&(_gt)->i915->drm, _condition, "GT%u: " _fmt, (_gt)->info.id, ##__VA_ARGS__) > + > #define GT_TRACE(gt, fmt, ...) do { \ > const struct intel_gt *gt__ __maybe_unused = (gt); \ > GEM_TRACE("%s " fmt, dev_name(gt__->i915->drm.dev), \ btw, shouldn't we also update GT_TRACE macros to include GT.id ? (naturally not in this series) Michal