On 14.10.2022 16:02, Matt Roper wrote: > On Xe_HP the fault registers are now in a multicast register range. > However as part of the GAM these registers follow special rules and we > need only read from the "primary" GAM's instance to get the information > we need. So a single intel_gt_mcr_read_any() (which will automatically > steer to the primary GAM) is sufficient; we don't need to loop over each > instance of the MCR register. > > v2: > - Update more instances of fault registers. (Bala) > > Signed-off-by: Matt Roper <matthew.d.roper@xxxxxxxxx> > --- > drivers/gpu/drm/i915/gt/intel_gt.c | 52 +++++++++++++++++++++++---- > drivers/gpu/drm/i915/i915_gpu_error.c | 12 +++++-- > 2 files changed, 55 insertions(+), 9 deletions(-) Reviewed-by: Balasubramani Vivekanandan <balasubramani.vivekanandan@xxxxxxxxx> Regards, Bala > > diff --git a/drivers/gpu/drm/i915/gt/intel_gt.c b/drivers/gpu/drm/i915/gt/intel_gt.c > index 445e171940fa..e14f159ad9fc 100644 > --- a/drivers/gpu/drm/i915/gt/intel_gt.c > +++ b/drivers/gpu/drm/i915/gt/intel_gt.c > @@ -270,7 +270,11 @@ intel_gt_clear_error_registers(struct intel_gt *gt, > I915_MASTER_ERROR_INTERRUPT); > } > > - if (GRAPHICS_VER(i915) >= 12) { > + if (GRAPHICS_VER_FULL(i915) >= IP_VER(12, 50)) { > + intel_gt_mcr_multicast_rmw(gt, XEHP_RING_FAULT_REG, > + RING_FAULT_VALID, 0); > + intel_gt_mcr_read_any(gt, XEHP_RING_FAULT_REG); > + } else if (GRAPHICS_VER(i915) >= 12) { > rmw_clear(uncore, GEN12_RING_FAULT_REG, RING_FAULT_VALID); > intel_uncore_posting_read(uncore, GEN12_RING_FAULT_REG); > } else if (GRAPHICS_VER(i915) >= 8) { > @@ -308,17 +312,49 @@ static void gen6_check_faults(struct intel_gt *gt) > } > } > > +static void xehp_check_faults(struct intel_gt *gt) > +{ > + u32 fault; > + > + /* > + * Although the fault register now lives in an MCR register range, > + * the GAM registers are special and we only truly need to read > + * the "primary" GAM instance rather than handling each instance > + * individually. intel_gt_mcr_read_any() will automatically steer > + * toward the primary instance. > + */ > + fault = intel_gt_mcr_read_any(gt, XEHP_RING_FAULT_REG); > + if (fault & RING_FAULT_VALID) { > + u32 fault_data0, fault_data1; > + u64 fault_addr; > + > + fault_data0 = intel_gt_mcr_read_any(gt, XEHP_FAULT_TLB_DATA0); > + fault_data1 = intel_gt_mcr_read_any(gt, XEHP_FAULT_TLB_DATA1); > + > + fault_addr = ((u64)(fault_data1 & FAULT_VA_HIGH_BITS) << 44) | > + ((u64)fault_data0 << 12); > + > + drm_dbg(>->i915->drm, "Unexpected fault\n" > + "\tAddr: 0x%08x_%08x\n" > + "\tAddress space: %s\n" > + "\tEngine ID: %d\n" > + "\tSource ID: %d\n" > + "\tType: %d\n", > + upper_32_bits(fault_addr), lower_32_bits(fault_addr), > + fault_data1 & FAULT_GTT_SEL ? "GGTT" : "PPGTT", > + GEN8_RING_FAULT_ENGINE_ID(fault), > + RING_FAULT_SRCID(fault), > + RING_FAULT_FAULT_TYPE(fault)); > + } > +} > + > static void gen8_check_faults(struct intel_gt *gt) > { > struct intel_uncore *uncore = gt->uncore; > i915_reg_t fault_reg, fault_data0_reg, fault_data1_reg; > u32 fault; > > - if (GRAPHICS_VER_FULL(gt->i915) >= IP_VER(12, 50)) { > - fault_reg = XEHP_RING_FAULT_REG; > - fault_data0_reg = XEHP_FAULT_TLB_DATA0; > - fault_data1_reg = XEHP_FAULT_TLB_DATA1; > - } else if (GRAPHICS_VER(gt->i915) >= 12) { > + if (GRAPHICS_VER(gt->i915) >= 12) { > fault_reg = GEN12_RING_FAULT_REG; > fault_data0_reg = GEN12_FAULT_TLB_DATA0; > fault_data1_reg = GEN12_FAULT_TLB_DATA1; > @@ -358,7 +394,9 @@ void intel_gt_check_and_clear_faults(struct intel_gt *gt) > struct drm_i915_private *i915 = gt->i915; > > /* From GEN8 onwards we only have one 'All Engine Fault Register' */ > - if (GRAPHICS_VER(i915) >= 8) > + if (GRAPHICS_VER_FULL(i915) >= IP_VER(12, 50)) > + xehp_check_faults(gt); > + else if (GRAPHICS_VER(i915) >= 8) > gen8_check_faults(gt); > else if (GRAPHICS_VER(i915) >= 6) > gen6_check_faults(gt); > diff --git a/drivers/gpu/drm/i915/i915_gpu_error.c b/drivers/gpu/drm/i915/i915_gpu_error.c > index 9ea2fe34e7d3..f2d53edcd2ee 100644 > --- a/drivers/gpu/drm/i915/i915_gpu_error.c > +++ b/drivers/gpu/drm/i915/i915_gpu_error.c > @@ -1221,7 +1221,10 @@ static void engine_record_registers(struct intel_engine_coredump *ee) > if (GRAPHICS_VER(i915) >= 6) { > ee->rc_psmi = ENGINE_READ(engine, RING_PSMI_CTL); > > - if (GRAPHICS_VER(i915) >= 12) > + if (GRAPHICS_VER_FULL(i915) >= IP_VER(12, 50)) > + ee->fault_reg = intel_gt_mcr_read_any(engine->gt, > + XEHP_RING_FAULT_REG); > + else if (GRAPHICS_VER(i915) >= 12) > ee->fault_reg = intel_uncore_read(engine->uncore, > GEN12_RING_FAULT_REG); > else if (GRAPHICS_VER(i915) >= 8) > @@ -1820,7 +1823,12 @@ static void gt_record_global_regs(struct intel_gt_coredump *gt) > if (GRAPHICS_VER(i915) == 7) > gt->err_int = intel_uncore_read(uncore, GEN7_ERR_INT); > > - if (GRAPHICS_VER(i915) >= 12) { > + if (GRAPHICS_VER_FULL(i915) >= IP_VER(12, 50)) { > + gt->fault_data0 = intel_gt_mcr_read_any((struct intel_gt *)gt->_gt, > + XEHP_FAULT_TLB_DATA0); > + gt->fault_data1 = intel_gt_mcr_read_any((struct intel_gt *)gt->_gt, > + XEHP_FAULT_TLB_DATA1); > + } else if (GRAPHICS_VER(i915) >= 12) { > gt->fault_data0 = intel_uncore_read(uncore, > GEN12_FAULT_TLB_DATA0); > gt->fault_data1 = intel_uncore_read(uncore, > -- > 2.37.3 >