On Tue, Apr 21, 2020 at 07:41:25PM -0400, Jonathan Marek wrote: > Update the gmu_pdc registers for A640 and A650. > > Some of the RSCC registers on A650 are in a separate region. > > Note this also changes the address of these registers: > > RSCC_TCS1_DRV0_STATUS > RSCC_TCS2_DRV0_STATUS > RSCC_TCS3_DRV0_STATUS > > Based on the values in msm-4.14 and msm-4.19 kernels. > > Signed-off-by: Jonathan Marek <jonathan@xxxxxxxx> > --- > drivers/gpu/drm/msm/adreno/a6xx_gmu.c | 90 ++++++++++++++--------- > drivers/gpu/drm/msm/adreno/a6xx_gmu.h | 10 +++ > drivers/gpu/drm/msm/adreno/a6xx_gmu.xml.h | 38 +++++----- > 3 files changed, 85 insertions(+), 53 deletions(-) > > diff --git a/drivers/gpu/drm/msm/adreno/a6xx_gmu.c b/drivers/gpu/drm/msm/adreno/a6xx_gmu.c > index 4aef5fe985d6..60ed5360fd8a 100644 > --- a/drivers/gpu/drm/msm/adreno/a6xx_gmu.c > +++ b/drivers/gpu/drm/msm/adreno/a6xx_gmu.c > @@ -421,7 +421,7 @@ static int a6xx_rpmh_start(struct a6xx_gmu *gmu) > return ret; > } > > - ret = gmu_poll_timeout(gmu, REG_A6XX_RSCC_SEQ_BUSY_DRV0, val, > + ret = gmu_poll_timeout_rscc(gmu, REG_A6XX_RSCC_SEQ_BUSY_DRV0, val, > !val, 100, 10000); > > if (ret) { > @@ -447,7 +447,7 @@ static void a6xx_rpmh_stop(struct a6xx_gmu *gmu) > > gmu_write(gmu, REG_A6XX_GMU_RSCC_CONTROL_REQ, 1); > > - ret = gmu_poll_timeout(gmu, REG_A6XX_GPU_RSCC_RSC_STATUS0_DRV0, > + ret = gmu_poll_timeout_rscc(gmu, REG_A6XX_GPU_RSCC_RSC_STATUS0_DRV0, > val, val & (1 << 16), 100, 10000); > if (ret) > DRM_DEV_ERROR(gmu->dev, "Unable to power off the GPU RSC\n"); > @@ -470,32 +470,48 @@ static void a6xx_gmu_rpmh_init(struct a6xx_gmu *gmu) > struct platform_device *pdev = to_platform_device(gmu->dev); > void __iomem *pdcptr = a6xx_gmu_get_mmio(pdev, "gmu_pdc"); > void __iomem *seqptr = a6xx_gmu_get_mmio(pdev, "gmu_pdc_seq"); > + uint32_t pdc_address_offset; > > if (!pdcptr || !seqptr) > goto err; > > + if (adreno_is_a618(adreno_gpu) || adreno_is_a640(adreno_gpu)) > + pdc_address_offset = 0x30090; > + else if (adreno_is_a650(adreno_gpu)) > + pdc_address_offset = 0x300a0; > + else > + pdc_address_offset = 0x30080; This might be another one of those things that we should consider adding to the gpu list. > + > /* Disable SDE clock gating */ > - gmu_write(gmu, REG_A6XX_GPU_RSCC_RSC_STATUS0_DRV0, BIT(24)); > + gmu_write_rscc(gmu, REG_A6XX_GPU_RSCC_RSC_STATUS0_DRV0, BIT(24)); > > /* Setup RSC PDC handshake for sleep and wakeup */ > - gmu_write(gmu, REG_A6XX_RSCC_PDC_SLAVE_ID_DRV0, 1); > - gmu_write(gmu, REG_A6XX_RSCC_HIDDEN_TCS_CMD0_DATA, 0); > - gmu_write(gmu, REG_A6XX_RSCC_HIDDEN_TCS_CMD0_ADDR, 0); > - gmu_write(gmu, REG_A6XX_RSCC_HIDDEN_TCS_CMD0_DATA + 2, 0); > - gmu_write(gmu, REG_A6XX_RSCC_HIDDEN_TCS_CMD0_ADDR + 2, 0); > - gmu_write(gmu, REG_A6XX_RSCC_HIDDEN_TCS_CMD0_DATA + 4, 0x80000000); > - gmu_write(gmu, REG_A6XX_RSCC_HIDDEN_TCS_CMD0_ADDR + 4, 0); > - gmu_write(gmu, REG_A6XX_RSCC_OVERRIDE_START_ADDR, 0); > - gmu_write(gmu, REG_A6XX_RSCC_PDC_SEQ_START_ADDR, 0x4520); > - gmu_write(gmu, REG_A6XX_RSCC_PDC_MATCH_VALUE_LO, 0x4510); > - gmu_write(gmu, REG_A6XX_RSCC_PDC_MATCH_VALUE_HI, 0x4514); > + gmu_write_rscc(gmu, REG_A6XX_RSCC_PDC_SLAVE_ID_DRV0, 1); > + gmu_write_rscc(gmu, REG_A6XX_RSCC_HIDDEN_TCS_CMD0_DATA, 0); > + gmu_write_rscc(gmu, REG_A6XX_RSCC_HIDDEN_TCS_CMD0_ADDR, 0); > + gmu_write_rscc(gmu, REG_A6XX_RSCC_HIDDEN_TCS_CMD0_DATA + 2, 0); > + gmu_write_rscc(gmu, REG_A6XX_RSCC_HIDDEN_TCS_CMD0_ADDR + 2, 0); > + gmu_write_rscc(gmu, REG_A6XX_RSCC_HIDDEN_TCS_CMD0_DATA + 4, 0x80000000); > + gmu_write_rscc(gmu, REG_A6XX_RSCC_HIDDEN_TCS_CMD0_ADDR + 4, 0); > + gmu_write_rscc(gmu, REG_A6XX_RSCC_OVERRIDE_START_ADDR, 0); > + gmu_write_rscc(gmu, REG_A6XX_RSCC_PDC_SEQ_START_ADDR, 0x4520); > + gmu_write_rscc(gmu, REG_A6XX_RSCC_PDC_MATCH_VALUE_LO, 0x4510); > + gmu_write_rscc(gmu, REG_A6XX_RSCC_PDC_MATCH_VALUE_HI, 0x4514); > > /* Load RSC sequencer uCode for sleep and wakeup */ > - gmu_write(gmu, REG_A6XX_RSCC_SEQ_MEM_0_DRV0, 0xa7a506a0); > - gmu_write(gmu, REG_A6XX_RSCC_SEQ_MEM_0_DRV0 + 1, 0xa1e6a6e7); > - gmu_write(gmu, REG_A6XX_RSCC_SEQ_MEM_0_DRV0 + 2, 0xa2e081e1); > - gmu_write(gmu, REG_A6XX_RSCC_SEQ_MEM_0_DRV0 + 3, 0xe9a982e2); > - gmu_write(gmu, REG_A6XX_RSCC_SEQ_MEM_0_DRV0 + 4, 0x0020e8a8); > + if (adreno_is_a650(adreno_gpu)) { > + gmu_write_rscc(gmu, REG_A6XX_RSCC_SEQ_MEM_0_DRV0, 0xeaaae5a0); > + gmu_write_rscc(gmu, REG_A6XX_RSCC_SEQ_MEM_0_DRV0 + 1, 0xe1a1ebab); > + gmu_write_rscc(gmu, REG_A6XX_RSCC_SEQ_MEM_0_DRV0 + 2, 0xa2e0a581); > + gmu_write_rscc(gmu, REG_A6XX_RSCC_SEQ_MEM_0_DRV0 + 3, 0xecac82e2); > + gmu_write_rscc(gmu, REG_A6XX_RSCC_SEQ_MEM_0_DRV0 + 4, 0x0020edad); > + } else { > + gmu_write_rscc(gmu, REG_A6XX_RSCC_SEQ_MEM_0_DRV0, 0xa7a506a0); > + gmu_write_rscc(gmu, REG_A6XX_RSCC_SEQ_MEM_0_DRV0 + 1, 0xa1e6a6e7); > + gmu_write_rscc(gmu, REG_A6XX_RSCC_SEQ_MEM_0_DRV0 + 2, 0xa2e081e1); > + gmu_write_rscc(gmu, REG_A6XX_RSCC_SEQ_MEM_0_DRV0 + 3, 0xe9a982e2); > + gmu_write_rscc(gmu, REG_A6XX_RSCC_SEQ_MEM_0_DRV0 + 4, 0x0020e8a8); > + } > > /* Load PDC sequencer uCode for power up and power down sequence */ > pdc_write(seqptr, REG_A6XX_PDC_GPU_SEQ_MEM_0, 0xfebea1e1); > @@ -516,10 +532,7 @@ static void a6xx_gmu_rpmh_init(struct a6xx_gmu *gmu) > pdc_write(pdcptr, REG_A6XX_PDC_GPU_TCS1_CMD0_DATA + 4, 0x0); > > pdc_write(pdcptr, REG_A6XX_PDC_GPU_TCS1_CMD0_MSGID + 8, 0x10108); > - if (adreno_is_a618(adreno_gpu)) > - pdc_write(pdcptr, REG_A6XX_PDC_GPU_TCS1_CMD0_ADDR + 8, 0x30090); > - else > - pdc_write(pdcptr, REG_A6XX_PDC_GPU_TCS1_CMD0_ADDR + 8, 0x30080); > + pdc_write(pdcptr, REG_A6XX_PDC_GPU_TCS1_CMD0_ADDR + 8, pdc_address_offset); > pdc_write(pdcptr, REG_A6XX_PDC_GPU_TCS1_CMD0_DATA + 8, 0x0); > > pdc_write(pdcptr, REG_A6XX_PDC_GPU_TCS3_CMD_ENABLE_BANK, 7); > @@ -531,17 +544,12 @@ static void a6xx_gmu_rpmh_init(struct a6xx_gmu *gmu) > > pdc_write(pdcptr, REG_A6XX_PDC_GPU_TCS3_CMD0_MSGID + 4, 0x10108); > pdc_write(pdcptr, REG_A6XX_PDC_GPU_TCS3_CMD0_ADDR + 4, 0x30000); > - if (adreno_is_a618(adreno_gpu)) > + if (adreno_is_a618(adreno_gpu) || adreno_is_a650(adreno_gpu)) > pdc_write(pdcptr, REG_A6XX_PDC_GPU_TCS3_CMD0_DATA + 4, 0x2); > else > pdc_write(pdcptr, REG_A6XX_PDC_GPU_TCS3_CMD0_DATA + 4, 0x3); > - > - > pdc_write(pdcptr, REG_A6XX_PDC_GPU_TCS3_CMD0_MSGID + 8, 0x10108); > - if (adreno_is_a618(adreno_gpu)) > - pdc_write(pdcptr, REG_A6XX_PDC_GPU_TCS3_CMD0_ADDR + 8, 0x30090); > - else > - pdc_write(pdcptr, REG_A6XX_PDC_GPU_TCS3_CMD0_ADDR + 8, 0x30080); > + pdc_write(pdcptr, REG_A6XX_PDC_GPU_TCS3_CMD0_ADDR + 8, pdc_address_offset); > pdc_write(pdcptr, REG_A6XX_PDC_GPU_TCS3_CMD0_DATA + 8, 0x3); > > /* Setup GPU PDC */ > @@ -784,13 +792,13 @@ static void a6xx_gmu_rpmh_off(struct a6xx_gmu *gmu) > u32 val; > > /* Make sure there are no outstanding RPMh votes */ > - gmu_poll_timeout(gmu, REG_A6XX_RSCC_TCS0_DRV0_STATUS, val, > + gmu_poll_timeout_rscc(gmu, REG_A6XX_RSCC_TCS0_DRV0_STATUS, val, > (val & 1), 100, 10000); > - gmu_poll_timeout(gmu, REG_A6XX_RSCC_TCS1_DRV0_STATUS, val, > + gmu_poll_timeout_rscc(gmu, REG_A6XX_RSCC_TCS1_DRV0_STATUS, val, > (val & 1), 100, 10000); > - gmu_poll_timeout(gmu, REG_A6XX_RSCC_TCS2_DRV0_STATUS, val, > + gmu_poll_timeout_rscc(gmu, REG_A6XX_RSCC_TCS2_DRV0_STATUS, val, > (val & 1), 100, 10000); > - gmu_poll_timeout(gmu, REG_A6XX_RSCC_TCS3_DRV0_STATUS, val, > + gmu_poll_timeout_rscc(gmu, REG_A6XX_RSCC_TCS3_DRV0_STATUS, val, > (val & 1), 100, 1000); > } > > @@ -1349,6 +1357,7 @@ static int a6xx_gmu_get_irq(struct a6xx_gmu *gmu, struct platform_device *pdev, > > void a6xx_gmu_remove(struct a6xx_gpu *a6xx_gpu) > { > + struct adreno_gpu *adreno_gpu = &a6xx_gpu->base; > struct a6xx_gmu *gmu = &a6xx_gpu->gmu; > > if (!gmu->initialized) > @@ -1362,7 +1371,10 @@ void a6xx_gmu_remove(struct a6xx_gpu *a6xx_gpu) > } > > iounmap(gmu->mmio); > + if (adreno_is_a650(adreno_gpu)) > + iounmap(gmu->rscc); Another transition point. Every thing after a650 will use the rscc region. It might be better to do a resource check here instead: if (platform_get_resource_byname(pdev, "rscc", IORESOURCE_MEM)) iounmap(gmu->rscc); It would be really nice to use devm_ but I'm skeptical of how well devres works with sub-platform devices. Sean Paul has fought with that before and it takes a combination of platform_device_put() and some good luck. I've mentioned to Rob before that we might need to think of chaining components together and make GMU a top level platform-device, but I think the only way we can do that today is to make GMU a peer of adreno and I'm not sure if that is something we want to do. Other than that, I really like reusing the gmu->rscc pointer for both types. That is clever. > gmu->mmio = NULL; > + gmu->rscc = NULL; > > a6xx_gmu_memory_free(gmu); > > @@ -1445,6 +1457,14 @@ int a6xx_gmu_init(struct a6xx_gpu *a6xx_gpu, struct device_node *node) > goto err_memory; > } > > + if (adreno_is_a650(adreno_gpu)) { > + gmu->rscc = a6xx_gmu_get_mmio(pdev, "rscc"); > + if (IS_ERR(gmu->rscc)) > + goto err_mmio; > + } else { > + gmu->rscc = gmu->mmio + 0x23000; > + } > + > /* Get the HFI and GMU interrupts */ > gmu->hfi_irq = a6xx_gmu_get_irq(gmu, pdev, "hfi", a6xx_hfi_irq); > gmu->gmu_irq = a6xx_gmu_get_irq(gmu, pdev, "gmu", a6xx_gmu_irq); > @@ -1470,6 +1490,8 @@ int a6xx_gmu_init(struct a6xx_gpu *a6xx_gpu, struct device_node *node) > > err_mmio: > iounmap(gmu->mmio); > + if (adreno_is_a650(adreno_gpu)) > + iounmap(gmu->rscc); Same concern as above. > free_irq(gmu->gmu_irq, gmu); > free_irq(gmu->hfi_irq, gmu); > > diff --git a/drivers/gpu/drm/msm/adreno/a6xx_gmu.h b/drivers/gpu/drm/msm/adreno/a6xx_gmu.h > index 526911010cb1..aed02b2b7659 100644 > --- a/drivers/gpu/drm/msm/adreno/a6xx_gmu.h > +++ b/drivers/gpu/drm/msm/adreno/a6xx_gmu.h > @@ -47,6 +47,7 @@ struct a6xx_gmu { > struct msm_gem_address_space *aspace; > > void * __iomem mmio; > + void * __iomem rscc; > > int hfi_irq; > int gmu_irq; > @@ -126,6 +127,15 @@ static inline u64 gmu_read64(struct a6xx_gmu *gmu, u32 lo, u32 hi) > readl_poll_timeout((gmu)->mmio + ((addr) << 2), val, cond, \ > interval, timeout) > > +static inline void gmu_write_rscc(struct a6xx_gmu *gmu, u32 offset, u32 value) > +{ > + return msm_writel(value, gmu->rscc + (offset << 2)); > +} > + > +#define gmu_poll_timeout_rscc(gmu, addr, val, cond, interval, timeout) \ > + readl_poll_timeout((gmu)->rscc + ((addr) << 2), val, cond, \ > + interval, timeout) > + > /* > * These are the available OOB (out of band requests) to the GMU where "out of > * band" means that the CPU talks to the GMU directly and not through HFI. > diff --git a/drivers/gpu/drm/msm/adreno/a6xx_gmu.xml.h b/drivers/gpu/drm/msm/adreno/a6xx_gmu.xml.h > index eb2cd41dae6e..b4357ea550ec 100644 > --- a/drivers/gpu/drm/msm/adreno/a6xx_gmu.xml.h > +++ b/drivers/gpu/drm/msm/adreno/a6xx_gmu.xml.h > @@ -336,8 +336,6 @@ static inline uint32_t A6XX_GMU_GPU_NAP_CTRL_SID(uint32_t val) > > #define REG_A6XX_GMU_AO_SPARE_CNTL 0x00009316 > > -#define REG_A6XX_GPU_RSCC_RSC_STATUS0_DRV0 0x00008c04 > - > #define REG_A6XX_GMU_RSCC_CONTROL_REQ 0x00009307 > > #define REG_A6XX_GMU_RSCC_CONTROL_ACK 0x00009308 > @@ -350,39 +348,41 @@ static inline uint32_t A6XX_GMU_GPU_NAP_CTRL_SID(uint32_t val) > > #define REG_A6XX_GPU_CC_GX_DOMAIN_MISC 0x00009d42 > > -#define REG_A6XX_RSCC_PDC_SEQ_START_ADDR 0x00008c08 > +#define REG_A6XX_GPU_RSCC_RSC_STATUS0_DRV0 0x00000004 > + > +#define REG_A6XX_RSCC_PDC_SEQ_START_ADDR 0x00000008 > > -#define REG_A6XX_RSCC_PDC_MATCH_VALUE_LO 0x00008c09 > +#define REG_A6XX_RSCC_PDC_MATCH_VALUE_LO 0x00000009 > > -#define REG_A6XX_RSCC_PDC_MATCH_VALUE_HI 0x00008c0a > +#define REG_A6XX_RSCC_PDC_MATCH_VALUE_HI 0x0000000a > > -#define REG_A6XX_RSCC_PDC_SLAVE_ID_DRV0 0x00008c0b > +#define REG_A6XX_RSCC_PDC_SLAVE_ID_DRV0 0x0000000b > > -#define REG_A6XX_RSCC_HIDDEN_TCS_CMD0_ADDR 0x00008c0d > +#define REG_A6XX_RSCC_HIDDEN_TCS_CMD0_ADDR 0x0000000d > > -#define REG_A6XX_RSCC_HIDDEN_TCS_CMD0_DATA 0x00008c0e > +#define REG_A6XX_RSCC_HIDDEN_TCS_CMD0_DATA 0x0000000e > > -#define REG_A6XX_RSCC_TIMESTAMP_UNIT0_TIMESTAMP_L_DRV0 0x00008c82 > +#define REG_A6XX_RSCC_TIMESTAMP_UNIT0_TIMESTAMP_L_DRV0 0x00000082 > > -#define REG_A6XX_RSCC_TIMESTAMP_UNIT0_TIMESTAMP_H_DRV0 0x00008c83 > +#define REG_A6XX_RSCC_TIMESTAMP_UNIT0_TIMESTAMP_H_DRV0 0x00000083 > > -#define REG_A6XX_RSCC_TIMESTAMP_UNIT1_EN_DRV0 0x00008c89 > +#define REG_A6XX_RSCC_TIMESTAMP_UNIT1_EN_DRV0 0x00000089 > > -#define REG_A6XX_RSCC_TIMESTAMP_UNIT1_OUTPUT_DRV0 0x00008c8c > +#define REG_A6XX_RSCC_TIMESTAMP_UNIT1_OUTPUT_DRV0 0x0000008c > > -#define REG_A6XX_RSCC_OVERRIDE_START_ADDR 0x00008d00 > +#define REG_A6XX_RSCC_OVERRIDE_START_ADDR 0x00000100 > > -#define REG_A6XX_RSCC_SEQ_BUSY_DRV0 0x00008d01 > +#define REG_A6XX_RSCC_SEQ_BUSY_DRV0 0x00000101 > > -#define REG_A6XX_RSCC_SEQ_MEM_0_DRV0 0x00008d80 > +#define REG_A6XX_RSCC_SEQ_MEM_0_DRV0 0x00000180 > > -#define REG_A6XX_RSCC_TCS0_DRV0_STATUS 0x00008f46 > +#define REG_A6XX_RSCC_TCS0_DRV0_STATUS 0x00000346 > > -#define REG_A6XX_RSCC_TCS1_DRV0_STATUS 0x000090ae > +#define REG_A6XX_RSCC_TCS1_DRV0_STATUS 0x000003ee > > -#define REG_A6XX_RSCC_TCS2_DRV0_STATUS 0x00009216 > +#define REG_A6XX_RSCC_TCS2_DRV0_STATUS 0x00000496 > > -#define REG_A6XX_RSCC_TCS3_DRV0_STATUS 0x0000937e > +#define REG_A6XX_RSCC_TCS3_DRV0_STATUS 0x0000053e > > > #endif /* A6XX_GMU_XML */ > -- > 2.26.1 > -- The Qualcomm Innovation Center, Inc. is a member of Code Aurora Forum, a Linux Foundation Collaborative Project