Re: [PATCH v3 4/6] drm/msm/a7xx: Initialize a750 "software fuse"

[Date Prev][Date Next][Thread Prev][Thread Next][Date Index][Thread Index]

 



On Wed, Jun 26, 2024 at 10:33 AM Neil Armstrong
<neil.armstrong@xxxxxxxxxx> wrote:
>
> Hi,
>
> On 30/04/2024 12:43, Connor Abbott wrote:
> > On all Qualcomm platforms with a7xx GPUs, qcom_scm provides a method to
> > initialize cx_mem. Copy this from downstream (minus BCL which we
> > currently don't support). On a750, this includes a new "fuse" register
> > which can be used by qcom_scm to fuse off certain features like
> > raytracing in software. The fuse is default off, and is initialized by
> > calling the method. Afterwards we have to read it to find out which
> > features were enabled.
> >
> > Reviewed-by: Dmitry Baryshkov <dmitry.baryshkov@xxxxxxxxxx>
> > Signed-off-by: Connor Abbott <cwabbott0@xxxxxxxxx>
> > ---
> >   drivers/gpu/drm/msm/adreno/a6xx_gpu.c   | 91 ++++++++++++++++++++++++++++++++-
> >   drivers/gpu/drm/msm/adreno/adreno_gpu.h |  2 +
> >   2 files changed, 92 insertions(+), 1 deletion(-)
> >
> > diff --git a/drivers/gpu/drm/msm/adreno/a6xx_gpu.c b/drivers/gpu/drm/msm/adreno/a6xx_gpu.c
> > index cf0b1de1c071..52b080206090 100644
> > --- a/drivers/gpu/drm/msm/adreno/a6xx_gpu.c
> > +++ b/drivers/gpu/drm/msm/adreno/a6xx_gpu.c
> > @@ -10,6 +10,7 @@
> >
> >   #include <linux/bitfield.h>
> >   #include <linux/devfreq.h>
> > +#include <linux/firmware/qcom/qcom_scm.h>
> >   #include <linux/pm_domain.h>
> >   #include <linux/soc/qcom/llcc-qcom.h>
> >
> > @@ -1686,7 +1687,8 @@ static int a6xx_zap_shader_init(struct msm_gpu *gpu)
> >                      A6XX_RBBM_INT_0_MASK_RBBM_HANG_DETECT | \
> >                      A6XX_RBBM_INT_0_MASK_UCHE_OOB_ACCESS | \
> >                      A6XX_RBBM_INT_0_MASK_UCHE_TRAP_INTR | \
> > -                    A6XX_RBBM_INT_0_MASK_TSBWRITEERROR)
> > +                    A6XX_RBBM_INT_0_MASK_TSBWRITEERROR | \
> > +                    A6XX_RBBM_INT_0_MASK_SWFUSEVIOLATION)
> >
> >   #define A7XX_APRIV_MASK (A6XX_CP_APRIV_CNTL_ICACHE | \
> >                        A6XX_CP_APRIV_CNTL_RBFETCH | \
> > @@ -2356,6 +2358,27 @@ static void a6xx_fault_detect_irq(struct msm_gpu *gpu)
> >       kthread_queue_work(gpu->worker, &gpu->recover_work);
> >   }
> >
> > +static void a7xx_sw_fuse_violation_irq(struct msm_gpu *gpu)
> > +{
> > +     u32 status;
> > +
> > +     status = gpu_read(gpu, REG_A7XX_RBBM_SW_FUSE_INT_STATUS);
> > +     gpu_write(gpu, REG_A7XX_RBBM_SW_FUSE_INT_MASK, 0);
> > +
> > +     dev_err_ratelimited(&gpu->pdev->dev, "SW fuse violation status=%8.8x\n", status);
> > +
> > +     /*
> > +      * Ignore FASTBLEND violations, because the HW will silently fall back
> > +      * to legacy blending.
> > +      */
> > +     if (status & (A7XX_CX_MISC_SW_FUSE_VALUE_RAYTRACING |
> > +                   A7XX_CX_MISC_SW_FUSE_VALUE_LPAC)) {
> > +             del_timer(&gpu->hangcheck_timer);
> > +
> > +             kthread_queue_work(gpu->worker, &gpu->recover_work);
> > +     }
> > +}
> > +
> >   static irqreturn_t a6xx_irq(struct msm_gpu *gpu)
> >   {
> >       struct msm_drm_private *priv = gpu->dev->dev_private;
> > @@ -2384,6 +2407,9 @@ static irqreturn_t a6xx_irq(struct msm_gpu *gpu)
> >       if (status & A6XX_RBBM_INT_0_MASK_UCHE_OOB_ACCESS)
> >               dev_err_ratelimited(&gpu->pdev->dev, "UCHE | Out of bounds access\n");
> >
> > +     if (status & A6XX_RBBM_INT_0_MASK_SWFUSEVIOLATION)
> > +             a7xx_sw_fuse_violation_irq(gpu);
> > +
> >       if (status & A6XX_RBBM_INT_0_MASK_CP_CACHE_FLUSH_TS)
> >               msm_gpu_retire(gpu);
> >
> > @@ -2525,6 +2551,61 @@ static void a6xx_llc_slices_init(struct platform_device *pdev,
> >               a6xx_gpu->llc_mmio = ERR_PTR(-EINVAL);
> >   }
> >
> > +static int a7xx_cx_mem_init(struct a6xx_gpu *a6xx_gpu)
> > +{
> > +     struct adreno_gpu *adreno_gpu = &a6xx_gpu->base;
> > +     struct msm_gpu *gpu = &adreno_gpu->base;
> > +     u32 fuse_val;
> > +     int ret;
> > +
> > +     if (adreno_is_a750(adreno_gpu)) {
> > +             /*
> > +              * Assume that if qcom scm isn't available, that whatever
> > +              * replacement allows writing the fuse register ourselves.
> > +              * Users of alternative firmware need to make sure this
> > +              * register is writeable or indicate that it's not somehow.
> > +              * Print a warning because if you mess this up you're about to
> > +              * crash horribly.
> > +              */
> > +             if (!qcom_scm_is_available()) {
> > +                     dev_warn_once(gpu->dev->dev,
> > +                             "SCM is not available, poking fuse register\n");
> > +                     a6xx_llc_write(a6xx_gpu, REG_A7XX_CX_MISC_SW_FUSE_VALUE,
> > +                             A7XX_CX_MISC_SW_FUSE_VALUE_RAYTRACING |
> > +                             A7XX_CX_MISC_SW_FUSE_VALUE_FASTBLEND |
> > +                             A7XX_CX_MISC_SW_FUSE_VALUE_LPAC);
> > +                     adreno_gpu->has_ray_tracing = true;
> > +                     return 0;
> > +             }
> > +
> > +             ret = qcom_scm_gpu_init_regs(QCOM_SCM_GPU_ALWAYS_EN_REQ |
> > +                                          QCOM_SCM_GPU_TSENSE_EN_REQ);
> > +             if (ret)
> > +                     return ret;
> > +
> > +             /*
> > +              * On a750 raytracing may be disabled by the firmware, find out
> > +              * whether that's the case. The scm call above sets the fuse
> > +              * register.
> > +              */
> > +             fuse_val = a6xx_llc_read(a6xx_gpu,
> > +                                      REG_A7XX_CX_MISC_SW_FUSE_VALUE);
> > +             adreno_gpu->has_ray_tracing =
> > +                     !!(fuse_val & A7XX_CX_MISC_SW_FUSE_VALUE_RAYTRACING);
> > +     } else {
> > +             if (adreno_is_a740(adreno_gpu)) {
> > +                     /* Raytracing is always enabled on a740 */
> > +                     adreno_gpu->has_ray_tracing = true;
> > +             }
> > +
> > +             if (qcom_scm_is_available())
> > +                     return qcom_scm_gpu_init_regs(QCOM_SCM_GPU_ALWAYS_EN_REQ);
> > +     }
> > +
> > +     return 0;
> > +}
> > +
> > +
> >   #define GBIF_CLIENT_HALT_MASK               BIT(0)
> >   #define GBIF_ARB_HALT_MASK          BIT(1)
> >   #define VBIF_XIN_HALT_CTRL0_MASK    GENMASK(3, 0)
> > @@ -3094,6 +3175,14 @@ struct msm_gpu *a6xx_gpu_init(struct drm_device *dev)
> >               return ERR_PTR(ret);
> >       }
> >
> > +     if (adreno_is_a7xx(adreno_gpu)) {
> > +             ret = a7xx_cx_mem_init(a6xx_gpu);
> > +             if (ret) {
> > +                     a6xx_destroy(&(a6xx_gpu->base.base));
> > +                     return ERR_PTR(ret);
> > +             }
> > +     }
> > +
> >       if (gpu->aspace)
> >               msm_mmu_set_fault_handler(gpu->aspace->mmu, gpu,
> >                               a6xx_fault_handler);
> > diff --git a/drivers/gpu/drm/msm/adreno/adreno_gpu.h b/drivers/gpu/drm/msm/adreno/adreno_gpu.h
> > index 77526892eb8c..4180f3149dd8 100644
> > --- a/drivers/gpu/drm/msm/adreno/adreno_gpu.h
> > +++ b/drivers/gpu/drm/msm/adreno/adreno_gpu.h
> > @@ -182,6 +182,8 @@ struct adreno_gpu {
> >        */
> >       const unsigned int *reg_offsets;
> >       bool gmu_is_wrapper;
> > +
> > +     bool has_ray_tracing;
> >   };
> >   #define to_adreno_gpu(x) container_of(x, struct adreno_gpu, base)
> >
> >
>
> This patch breaks GPU init on SM8450-HDK and SM8550-HDK: the call to
> qcom_scm_gpu_init_regs(QCOM_SCM_GPU_ALWAYS_EN_REQ) returns -5 (-EIO).
>
> On which device did you test this?
>
> Neil

I tested on SM8650-HDK (with your DTS patches on top). kgsl does call
this on SM8450/SM8550 [1], and doesn't swallow -EIO, which is why I
thought it was safe. But looking more into it now, the commit message
introducing it mentions the software fuse which is SM8650-only, so
maybe they broke SM8550 when adding this for SM8650?

Connor

[1] https://git.codelinaro.org/clo/le/platform/vendor/qcom/opensource/graphics-kernel/-/blob/gfx-kernel.le.0.0.r1-rel/adreno_gen7.c?ref_type=heads#L915





[Index of Archives]     [Device Tree Compiler]     [Device Tree Spec]     [Linux Driver Backports]     [Video for Linux]     [Linux USB Devel]     [Linux PCI Devel]     [Linux Audio Users]     [Linux Kernel]     [Linux SCSI]     [XFree86]     [Yosemite Backpacking]


  Powered by Linux