On Tue, Dec 03, 2019 at 03:06:11PM +0000, Sharat Masetty wrote: > This patch adds support for enabling Graphics Bus Interface(GBIF) > used in multiple A6xx series chipets. Also makes changes to the > PDC/RSC sequencing specifically required for A618. This is needed > for proper interfacing with RPMH. > > Change-Id: I0e7a314b0ae0d562f602512ad978f5d1ced5fb26 > Signed-off-by: Sharat Masetty <smasetty@xxxxxxxxxxxxxx> > --- > drivers/gpu/drm/msm/adreno/a6xx.xml.h | 52 +++++++++++++++++++++++- > drivers/gpu/drm/msm/adreno/a6xx_gmu.c | 24 +++++++++-- > drivers/gpu/drm/msm/adreno/a6xx_gpu.c | 70 ++++++++++++++++++++++++++++++--- > drivers/gpu/drm/msm/adreno/a6xx_gpu.h | 9 ++++- > drivers/gpu/drm/msm/adreno/adreno_gpu.h | 12 +++++- > 5 files changed, 154 insertions(+), 13 deletions(-) > > diff --git a/drivers/gpu/drm/msm/adreno/a6xx.xml.h b/drivers/gpu/drm/msm/adreno/a6xx.xml.h > index f44553e..ed78fee 100644 > --- a/drivers/gpu/drm/msm/adreno/a6xx.xml.h > +++ b/drivers/gpu/drm/msm/adreno/a6xx.xml.h > @@ -16,11 +16,11 @@ > - /home/robclark/src/envytools/rnndb/adreno/a3xx.xml ( 83840 bytes, from 2018-07-03 19:37:13) > - /home/robclark/src/envytools/rnndb/adreno/a4xx.xml ( 112086 bytes, from 2018-07-03 19:37:13) > - /home/robclark/src/envytools/rnndb/adreno/a5xx.xml ( 147240 bytes, from 2018-12-02 17:29:54) > -- /home/robclark/src/envytools/rnndb/adreno/a6xx.xml ( 140790 bytes, from 2018-12-02 17:29:54) > +- /home/smasetty/playarea/envytools/rnndb/adreno/a6xx.xml ( 161969 bytes, from 2019-11-29 07:18:16) > - /home/robclark/src/envytools/rnndb/adreno/a6xx_gmu.xml ( 10431 bytes, from 2018-09-14 13:03:07) > - /home/robclark/src/envytools/rnndb/adreno/ocmem.xml ( 1773 bytes, from 2018-07-03 19:37:13) > > -Copyright (C) 2013-2018 by the following authors: > +Copyright (C) 2013-2019 by the following authors: > - Rob Clark <robdclark@xxxxxxxxx> (robclark) > - Ilia Mirkin <imirkin@xxxxxxxxxxxx> (imirkin) > > @@ -2519,6 +2519,54 @@ static inline uint32_t A6XX_VBIF_TEST_BUS2_CTRL1_DATA_SEL(uint32_t val) > > #define REG_A6XX_VBIF_PERF_PWR_CNT_HIGH2 0x0000311a > > +#define REG_A6XX_GBIF_SCACHE_CNTL1 0x00003c02 > + > +#define REG_A6XX_GBIF_QSB_SIDE0 0x00003c03 > + > +#define REG_A6XX_GBIF_QSB_SIDE1 0x00003c04 > + > +#define REG_A6XX_GBIF_QSB_SIDE2 0x00003c05 > + > +#define REG_A6XX_GBIF_QSB_SIDE3 0x00003c06 > + > +#define REG_A6XX_GBIF_HALT 0x00003c45 > + > +#define REG_A6XX_GBIF_HALT_ACK 0x00003c46 > + > +#define REG_A6XX_GBIF_PERF_PWR_CNT_EN 0x00003cc0 > + > +#define REG_A6XX_GBIF_PERF_CNT_SEL 0x00003cc2 > + > +#define REG_A6XX_GBIF_PERF_PWR_CNT_SEL 0x00003cc3 > + > +#define REG_A6XX_GBIF_PERF_CNT_LOW0 0x00003cc4 > + > +#define REG_A6XX_GBIF_PERF_CNT_LOW1 0x00003cc5 > + > +#define REG_A6XX_GBIF_PERF_CNT_LOW2 0x00003cc6 > + > +#define REG_A6XX_GBIF_PERF_CNT_LOW3 0x00003cc7 > + > +#define REG_A6XX_GBIF_PERF_CNT_HIGH0 0x00003cc8 > + > +#define REG_A6XX_GBIF_PERF_CNT_HIGH1 0x00003cc9 > + > +#define REG_A6XX_GBIF_PERF_CNT_HIGH2 0x00003cca > + > +#define REG_A6XX_GBIF_PERF_CNT_HIGH3 0x00003ccb > + > +#define REG_A6XX_GBIF_PWR_CNT_LOW0 0x00003ccc > + > +#define REG_A6XX_GBIF_PWR_CNT_LOW1 0x00003ccd > + > +#define REG_A6XX_GBIF_PWR_CNT_LOW2 0x00003cce > + > +#define REG_A6XX_GBIF_PWR_CNT_HIGH0 0x00003ccf > + > +#define REG_A6XX_GBIF_PWR_CNT_HIGH1 0x00003cd0 > + > +#define REG_A6XX_GBIF_PWR_CNT_HIGH2 0x00003cd1 > + > #define REG_A6XX_RB_WINDOW_OFFSET2 0x000088d4 > #define A6XX_RB_WINDOW_OFFSET2_WINDOW_OFFSET_DISABLE 0x80000000 > #define A6XX_RB_WINDOW_OFFSET2_X__MASK 0x00007fff > diff --git a/drivers/gpu/drm/msm/adreno/a6xx_gmu.c b/drivers/gpu/drm/msm/adreno/a6xx_gmu.c > index 85f14fe..158a74c 100644 > --- a/drivers/gpu/drm/msm/adreno/a6xx_gmu.c > +++ b/drivers/gpu/drm/msm/adreno/a6xx_gmu.c > @@ -1,5 +1,5 @@ > // SPDX-License-Identifier: GPL-2.0 > -/* Copyright (c) 2017-2018 The Linux Foundation. All rights reserved. */ > +/* Copyright (c) 2017-2019 The Linux Foundation. All rights reserved. */ > > #include <linux/clk.h> > #include <linux/interconnect.h> > @@ -433,6 +433,8 @@ static void __iomem *a6xx_gmu_get_mmio(struct platform_device *pdev, > > static void a6xx_gmu_rpmh_init(struct a6xx_gmu *gmu) > { > + struct a6xx_gpu *a6xx_gpu = container_of(gmu, struct a6xx_gpu, gmu); > + struct adreno_gpu *adreno_gpu = &a6xx_gpu->base; > struct platform_device *pdev = to_platform_device(gmu->dev); > void __iomem *pdcptr = a6xx_gmu_get_mmio(pdev, "gmu_pdc"); > void __iomem *seqptr = a6xx_gmu_get_mmio(pdev, "gmu_pdc_seq"); > @@ -480,20 +482,34 @@ static void a6xx_gmu_rpmh_init(struct a6xx_gmu *gmu) > pdc_write(pdcptr, REG_A6XX_PDC_GPU_TCS1_CMD0_MSGID + 4, 0x10108); > pdc_write(pdcptr, REG_A6XX_PDC_GPU_TCS1_CMD0_ADDR + 4, 0x30000); > pdc_write(pdcptr, REG_A6XX_PDC_GPU_TCS1_CMD0_DATA + 4, 0x0); > + Unneeded whitespace change. > pdc_write(pdcptr, REG_A6XX_PDC_GPU_TCS1_CMD0_MSGID + 8, 0x10108); > - pdc_write(pdcptr, REG_A6XX_PDC_GPU_TCS1_CMD0_ADDR + 8, 0x30080); > + if (adreno_is_a618(adreno_gpu)) > + pdc_write(pdcptr, REG_A6XX_PDC_GPU_TCS1_CMD0_ADDR + 8, 0x30090); > + else > + pdc_write(pdcptr, REG_A6XX_PDC_GPU_TCS1_CMD0_ADDR + 8, 0x30080); > pdc_write(pdcptr, REG_A6XX_PDC_GPU_TCS1_CMD0_DATA + 8, 0x0); > + Unneeded whitespace change. > pdc_write(pdcptr, REG_A6XX_PDC_GPU_TCS3_CMD_ENABLE_BANK, 7); > pdc_write(pdcptr, REG_A6XX_PDC_GPU_TCS3_CMD_WAIT_FOR_CMPL_BANK, 0); > pdc_write(pdcptr, REG_A6XX_PDC_GPU_TCS3_CONTROL, 0); > pdc_write(pdcptr, REG_A6XX_PDC_GPU_TCS3_CMD0_MSGID, 0x10108); > pdc_write(pdcptr, REG_A6XX_PDC_GPU_TCS3_CMD0_ADDR, 0x30010); > pdc_write(pdcptr, REG_A6XX_PDC_GPU_TCS3_CMD0_DATA, 2); > + Also an uneeded whitespace change > pdc_write(pdcptr, REG_A6XX_PDC_GPU_TCS3_CMD0_MSGID + 4, 0x10108); > pdc_write(pdcptr, REG_A6XX_PDC_GPU_TCS3_CMD0_ADDR + 4, 0x30000); > - pdc_write(pdcptr, REG_A6XX_PDC_GPU_TCS3_CMD0_DATA + 4, 0x3); > + if (adreno_is_a618(adreno_gpu)) > + pdc_write(pdcptr, REG_A6XX_PDC_GPU_TCS3_CMD0_DATA + 4, 0x2); > + else > + pdc_write(pdcptr, REG_A6XX_PDC_GPU_TCS3_CMD0_DATA + 4, 0x3); > + > + Extra blank line here > pdc_write(pdcptr, REG_A6XX_PDC_GPU_TCS3_CMD0_MSGID + 8, 0x10108); > - pdc_write(pdcptr, REG_A6XX_PDC_GPU_TCS3_CMD0_ADDR + 8, 0x30080); > + if (adreno_is_a618(adreno_gpu)) > + pdc_write(pdcptr, REG_A6XX_PDC_GPU_TCS3_CMD0_ADDR + 8, 0x30090); > + else > + pdc_write(pdcptr, REG_A6XX_PDC_GPU_TCS3_CMD0_ADDR + 8, 0x30080); > pdc_write(pdcptr, REG_A6XX_PDC_GPU_TCS3_CMD0_DATA + 8, 0x3); > > /* Setup GPU PDC */ > diff --git a/drivers/gpu/drm/msm/adreno/a6xx_gpu.c b/drivers/gpu/drm/msm/adreno/a6xx_gpu.c > index dc8ec2c..6fdffae 100644 > --- a/drivers/gpu/drm/msm/adreno/a6xx_gpu.c > +++ b/drivers/gpu/drm/msm/adreno/a6xx_gpu.c > @@ -1,5 +1,5 @@ > // SPDX-License-Identifier: GPL-2.0 > -/* Copyright (c) 2017-2018 The Linux Foundation. All rights reserved. */ > +/* Copyright (c) 2017-2019 The Linux Foundation. All rights reserved. */ > > > #include "msm_gem.h" > @@ -378,6 +378,18 @@ static int a6xx_hw_init(struct msm_gpu *gpu) > struct a6xx_gpu *a6xx_gpu = to_a6xx_gpu(adreno_gpu); > int ret; > > + /* > + * During a previous slumber, GBIF halt is asserted to ensure > + * no further transaction can go through GPU before GPU > + * headswitch is turned off. > + * > + * This halt is deasserted once headswitch goes off but > + * incase headswitch doesn't goes off clear GBIF halt > + * here to ensure GPU wake-up doesn't fail because of > + * halted GPU transactions. > + */ > + gpu_write(gpu, REG_A6XX_GBIF_HALT, 0x0); > + > /* Make sure the GMU keeps the GPU on while we set it up */ > a6xx_gmu_set_oob(&a6xx_gpu->gmu, GMU_OOB_GPU_SET); > > @@ -406,12 +418,17 @@ static int a6xx_hw_init(struct msm_gpu *gpu) > gpu_write(gpu, REG_A6XX_TPL1_ADDR_MODE_CNTL, 0x1); > gpu_write(gpu, REG_A6XX_RBBM_SECVID_TSB_ADDR_MODE_CNTL, 0x1); > > - /* enable hardware clockgating */ > - a6xx_set_hwcg(gpu, true); > + /* > + * enable hardware clockgating > + * For now enable clock gating only for a630 Why? > + */ > + if (adreno_is_a630(adreno_gpu)) If you are going to skip clock gating, do it inside the function to avoid a branch here and to avoid having two distinct locations to change to enable HWCG for a given target. > + a6xx_set_hwcg(gpu, true); > > - /* VBIF start */ > - gpu_write(gpu, REG_A6XX_VBIF_GATE_OFF_WRREQ_EN, 0x00000009); > + /* VBIF/GBIF start*/ > gpu_write(gpu, REG_A6XX_RBBM_VBIF_CLIENT_QOS_CNTL, 0x3); > + if (adreno_is_a630(adreno_gpu)) > + gpu_write(gpu, REG_A6XX_VBIF_GATE_OFF_WRREQ_EN, 0x00000009); > > /* Make all blocks contribute to the GPU BUSY perf counter */ > gpu_write(gpu, REG_A6XX_RBBM_PERFCTR_GPU_BUSY_MASKED, 0xffffffff); > @@ -724,6 +741,39 @@ static irqreturn_t a6xx_irq(struct msm_gpu *gpu) > REG_ADRENO_DEFINE(REG_ADRENO_CP_RB_CNTL, REG_A6XX_CP_RB_CNTL), > }; > > +#define GBIF_CLIENT_HALT_MASK BIT(0) > +#define GBIF_ARB_HALT_MASK BIT(1) > + > +static void a6xx_bus_clear_pending_transactions(struct adreno_gpu *adreno_gpu) > +{ > + struct msm_gpu *gpu = &adreno_gpu->base; > + > + if(!a6xx_has_gbif(adreno_gpu)){ This should be adreno_is_a630. There is a good argument that this code should should live in its own function but I'll leave that up to you. Regardless, put a space before the {. > + gpu_write(gpu, REG_A6XX_VBIF_XIN_HALT_CTRL0, 0xf); > + spin_until((gpu_read(gpu, REG_A6XX_VBIF_XIN_HALT_CTRL1) & > + 0xf) == 0xf); > + gpu_write(gpu, REG_A6XX_VBIF_XIN_HALT_CTRL0, 0); > + > + return; > + } > + > + /* Halt new client requests on GBIF */ > + gpu_write(gpu, REG_A6XX_GBIF_HALT, GBIF_CLIENT_HALT_MASK); > + spin_until((gpu_read(gpu, REG_A6XX_GBIF_HALT_ACK) & > + (GBIF_CLIENT_HALT_MASK)) == GBIF_CLIENT_HALT_MASK); > + > + /* Halt all AXI requests on GBIF */ > + gpu_write(gpu, REG_A6XX_GBIF_HALT, GBIF_ARB_HALT_MASK); > + spin_until((gpu_read(gpu, REG_A6XX_GBIF_HALT_ACK) & > + (GBIF_ARB_HALT_MASK)) == GBIF_ARB_HALT_MASK); > + > + /* > + * GMU needs DDR access in slumber path. Deassert GBIF halt now > + * to allow for GMU to access system memory. > + */ > + gpu_write(gpu, REG_A6XX_GBIF_HALT, 0x0); > +} > + > static int a6xx_pm_resume(struct msm_gpu *gpu) > { > struct adreno_gpu *adreno_gpu = to_adreno_gpu(gpu); > @@ -748,6 +798,16 @@ static int a6xx_pm_suspend(struct msm_gpu *gpu) > > devfreq_suspend_device(gpu->devfreq.devfreq); > > + /* > + * Make sure the GMU is idle before continuing (because some transitions > + * may use VBIF > + */ > + a6xx_gmu_wait_for_idle(&a6xx_gpu->gmu); > + > + /* Clear the VBIF pipe before shutting down */ > + /* FIXME: This accesses the GPU - do we need to make sure it is on? */ You should know that it is active if you make it out of wait for idle, and the function only accesses CX so you don't need to worry about IFPC. > + a6xx_bus_clear_pending_transactions(adreno_gpu); > + > return a6xx_gmu_stop(a6xx_gpu); > } > > diff --git a/drivers/gpu/drm/msm/adreno/a6xx_gpu.h b/drivers/gpu/drm/msm/adreno/a6xx_gpu.h > index 6439955..7239b8b 100644 > --- a/drivers/gpu/drm/msm/adreno/a6xx_gpu.h > +++ b/drivers/gpu/drm/msm/adreno/a6xx_gpu.h > @@ -1,5 +1,5 @@ > /* SPDX-License-Identifier: GPL-2.0 */ > -/* Copyright (c) 2017 The Linux Foundation. All rights reserved. */ > +/* Copyright (c) 2017, 2019 The Linux Foundation. All rights reserved. */ > > #ifndef __A6XX_GPU_H__ > #define __A6XX_GPU_H__ > @@ -42,6 +42,13 @@ struct a6xx_gpu { > #define A6XX_PROTECT_RDONLY(_reg, _len) \ > ((((_len) & 0x3FFF) << 18) | ((_reg) & 0x3FFFF)) > > +static inline bool a6xx_has_gbif(struct adreno_gpu *gpu) > +{ > + if(adreno_is_a630(gpu)) > + return false; > + > + return true; > +} This macro isn't needed - adreno_is_a630 is a sufficient check because we know that VBIF died with a630. > > int a6xx_gmu_resume(struct a6xx_gpu *gpu); > int a6xx_gmu_stop(struct a6xx_gpu *gpu); > diff --git a/drivers/gpu/drm/msm/adreno/adreno_gpu.h b/drivers/gpu/drm/msm/adreno/adreno_gpu.h > index c7441fb..e12d5a9 100644 > --- a/drivers/gpu/drm/msm/adreno/adreno_gpu.h > +++ b/drivers/gpu/drm/msm/adreno/adreno_gpu.h > @@ -3,7 +3,7 @@ > * Copyright (C) 2013 Red Hat > * Author: Rob Clark <robdclark@xxxxxxxxx> > * > - * Copyright (c) 2014,2017 The Linux Foundation. All rights reserved. > + * Copyright (c) 2014,2017, 2019 The Linux Foundation. All rights reserved. > */ > > #ifndef __ADRENO_GPU_H__ > @@ -216,6 +216,16 @@ static inline int adreno_is_a540(struct adreno_gpu *gpu) > return gpu->revn == 540; > } > > +static inline int adreno_is_a618(struct adreno_gpu *gpu) > +{ > + return gpu->revn == 618; > +} > + > +static inline int adreno_is_a630(struct adreno_gpu *gpu) > +{ > + return gpu->revn == 630; > +} > + > int adreno_get_param(struct msm_gpu *gpu, uint32_t param, uint64_t *value); > const struct firmware *adreno_request_fw(struct adreno_gpu *adreno_gpu, > const char *fwname); > -- > 1.9.1 > > _______________________________________________ > dri-devel mailing list > dri-devel@xxxxxxxxxxxxxxxxxxxxx > https://lists.freedesktop.org/mailman/listinfo/dri-devel -- The Qualcomm Innovation Center, Inc. is a member of Code Aurora Forum, a Linux Foundation Collaborative Project